npm - @lobehub/chat - Versions diffs - 1.34.6 → 1.35.0 - Mend

@lobehub/chat 1.34.6 → 1.35.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/CHANGELOG.md +25 -0
package/README.md +8 -8
package/README.zh-CN.md +8 -8
package/changelog/v1.json +9 -0
package/docs/self-hosting/environment-variables/analytics.mdx +31 -2
package/package.json +2 -2
package/src/config/modelProviders/ollama.ts +14 -13
package/src/libs/agent-runtime/ollama/index.ts +25 -9
package/src/libs/agent-runtime/utils/streams/ollama.test.ts +130 -46
package/src/libs/agent-runtime/utils/streams/ollama.ts +19 -4
package/src/server/modules/AgentRuntime/index.test.ts +2 -1
package/src/server/modules/AgentRuntime/index.ts +7 -1

package/CHANGELOG.md CHANGED Viewed

@@ -2,6 +2,31 @@
 # Changelog
+## [Version 1.35.0](https://github.com/lobehub/lobe-chat/compare/v1.34.6...v1.35.0)
+<sup>Released on **2024-12-01**</sup>
+#### ✨ Features
+- **misc**: Support ollama tools use.
+<br/>
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+#### What's improved
+- **misc**: Support ollama tools use, closes [#3327](https://github.com/lobehub/lobe-chat/issues/3327) ([72d8835](https://github.com/lobehub/lobe-chat/commit/72d8835))
+</details>
+<div align="right">
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+</div>
 ### [Version 1.34.6](https://github.com/lobehub/lobe-chat/compare/v1.34.5...v1.34.6)
 <sup>Released on **2024-12-01**</sup>

package/README.md CHANGED Viewed

@@ -285,14 +285,14 @@ Our marketplace is not just a showcase platform but also a collaborative space.
 <!-- AGENT LIST -->
-| Recent Submits                                                                                                                                                                               | Description                                                                                                                                                                                                 |
-| -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| [Backend Development Assistant](https://chat-preview.lobehub.com/market?agent=backend-assistant)<br/><sup>By **[zeno980](https://github.com/zeno980)** on **2024-11-26**</sup>               | Skilled in backend development tasks<br/>`backend-development` `ai-technology` `web-applications` `spring` `sql`                                                                                            |
-| [Bilingual Dictionary Expert](https://chat-preview.lobehub.com/market?agent=english-chinese-dictionary-expert)<br/><sup>By **[swarfte](https://github.com/swarfte)** on **2024-11-26**</sup> | Expert in bilingual English-Chinese vocabulary translation and analysis<br/>`translation` `language-learning` `vocabulary` `dictionary`                                                                     |
-| [SSC Incremental](https://chat-preview.lobehub.com/market?agent=great-for-analysis-coding-and-rubber-ducking)<br/><sup>By **[Base03](https://github.com/Base03)** on **2024-11-26**</sup>    | Claude minus the Reddit<br/>`technology` `analysis` `software` `ai` `research`                                                                                                                              |
-| [Interviewer's Assistant](https://chat-preview.lobehub.com/market?agent=interviewer-assistant)<br/><sup>By **[xandertang](https://github.com/Dr-T)** on **2024-11-26**</sup>                 | Proficient in designing and evaluating interview questions for product managers, generating interview questions based on resume interpretation results.<br/>`interview` `resume` `recruitment` `efficiency` |
-> 📊 Total agents: [<kbd>**446**</kbd> ](https://github.com/lobehub/lobe-chat-agents)
+| Recent Submits                                                                                                                                                                                                   | Description                                                                                                                                                                                                                                                                                                                                                                                                                              |
+| ---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | ---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| [AI Assistant for Course Content and Teaching Guidelines](https://chat-preview.lobehub.com/market?agent=course-prep-teaching-guide-ai)<br/><sup>By **[HNaga](https://github.com/HNaga)** on **2024-11-29**</sup> | This AI assistant is designed to help educators and instructors prepare comprehensive course content and provide practical teaching guidelines. It leverages advanced NLP capabilities to generate lesson plans, suggest engaging teaching strategies, and offer insights into educational best practices.<br/>`education` `teaching` `course-design` `content-creation` `ai-assistance` `curriculum-development` `instructional-design` |
+| [Backend Development Assistant](https://chat-preview.lobehub.com/market?agent=backend-assistant)<br/><sup>By **[zeno980](https://github.com/zeno980)** on **2024-11-26**</sup>                                   | Skilled in backend development tasks<br/>`backend-development` `ai-technology` `web-applications` `spring` `sql`                                                                                                                                                                                                                                                                                                                         |
+| [Bilingual Dictionary Expert](https://chat-preview.lobehub.com/market?agent=english-chinese-dictionary-expert)<br/><sup>By **[swarfte](https://github.com/swarfte)** on **2024-11-26**</sup>                     | Expert in bilingual English-Chinese vocabulary translation and analysis<br/>`translation` `language-learning` `vocabulary` `dictionary`                                                                                                                                                                                                                                                                                                  |
+| [SSC Incremental](https://chat-preview.lobehub.com/market?agent=great-for-analysis-coding-and-rubber-ducking)<br/><sup>By **[Base03](https://github.com/Base03)** on **2024-11-26**</sup>                        | Claude minus the Reddit<br/>`technology` `analysis` `software` `ai` `research`                                                                                                                                                                                                                                                                                                                                                           |
+> 📊 Total agents: [<kbd>**447**</kbd> ](https://github.com/lobehub/lobe-chat-agents)
  <!-- AGENT LIST -->

package/README.zh-CN.md CHANGED Viewed

@@ -274,14 +274,14 @@ LobeChat 的插件生态系统是其核心功能的重要扩展，它极大地
 <!-- AGENT LIST -->
-| 最近新增                                                                                                                                                                           | 助手说明                                                                                                                                                                                |
-| ---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | --------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
-| [后端开发助手](https://chat-preview.lobehub.com/market?agent=backend-assistant)<br/><sup>By **[zeno980](https://github.com/zeno980)** on **2024-11-26**</sup>                      | 擅长后端开发任务<br/>`后端开发` `ai技术` `web应用` `spring` `sql`                                                                                                                       |
-| [双语词典专家](https://chat-preview.lobehub.com/market?agent=english-chinese-dictionary-expert)<br/><sup>By **[swarfte](https://github.com/swarfte)** on **2024-11-26**</sup>      | 双语英语 - 中文词汇翻译和分析专家<br/>`翻译` `语言学习` `词汇` `词典`                                                                                                                   |
-| [SSC 增量](https://chat-preview.lobehub.com/market?agent=great-for-analysis-coding-and-rubber-ducking)<br/><sup>By **[Base03](https://github.com/Base03)** on **2024-11-26**</sup> | Claude 减去 Reddit<br/>`技术` `分析` `软件` `人工智能` `研究`                                                                                                                           |
-| [面试官助手](https://chat-preview.lobehub.com/market?agent=interviewer-assistant)<br/><sup>By **[xandertang](https://github.com/Dr-T)** on **2024-11-26**</sup>                    | Proficient in designing and evaluating interview questions for product managers, generating interview questions based on resume interpretation results.<br/>`面试` `简历` `招聘` `效率` |
-> 📊 Total agents: [<kbd>**446**</kbd> ](https://github.com/lobehub/lobe-chat-agents)
+| 最近新增                                                                                                                                                                              | 助手说明                                                                                                                                                                                                                                              |
+| ------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- | ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------- |
+| [课程内容和教学指南的 AI 助手](https://chat-preview.lobehub.com/market?agent=course-prep-teaching-guide-ai)<br/><sup>By **[HNaga](https://github.com/HNaga)** on **2024-11-29**</sup> | 这个 AI 助手旨在帮助教育工作者和讲师准备全面的课程内容并提供实用的教学指南。它利用先进的自然语言处理能力生成课程计划，建议引人入胜的教学策略，并提供教育最佳实践的见解。<br/>`教育` `教学` `课程设计` `内容创作` `人工智能助手` `课程开发` `教学设计` |
+| [后端开发助手](https://chat-preview.lobehub.com/market?agent=backend-assistant)<br/><sup>By **[zeno980](https://github.com/zeno980)** on **2024-11-26**</sup>                         | 擅长后端开发任务<br/>`后端开发` `ai技术` `web应用` `spring` `sql`                                                                                                                                                                                     |
+| [双语词典专家](https://chat-preview.lobehub.com/market?agent=english-chinese-dictionary-expert)<br/><sup>By **[swarfte](https://github.com/swarfte)** on **2024-11-26**</sup>         | 双语英语 - 中文词汇翻译和分析专家<br/>`翻译` `语言学习` `词汇` `词典`                                                                                                                                                                                 |
+| [SSC 增量](https://chat-preview.lobehub.com/market?agent=great-for-analysis-coding-and-rubber-ducking)<br/><sup>By **[Base03](https://github.com/Base03)** on **2024-11-26**</sup>    | Claude 减去 Reddit<br/>`技术` `分析` `软件` `人工智能` `研究`                                                                                                                                                                                         |
+> 📊 Total agents: [<kbd>**447**</kbd> ](https://github.com/lobehub/lobe-chat-agents)
  <!-- AGENT LIST -->

package/changelog/v1.json CHANGED Viewed

@@ -1,4 +1,13 @@
 [
+  {
+    "children": {
+      "features": [
+        "Support ollama tools use."
+      ]
+    },
+    "date": "2024-12-01",
+    "version": "1.35.0"
+  },
   {
     "children": {
       "improvements": [

package/docs/self-hosting/environment-variables/analytics.mdx CHANGED Viewed

@@ -80,5 +80,34 @@ We have integrated several free/open-source data analytics services in LobeChat
 - Default: `https://analytics.umami.is/script.js`
 - Example: `https://umami.your-site.com/script.js`
-[posthog-analytics-url]: https://posthog.com
-[umami-analytics-url]: https://umami.is
+## Langfuse Observability
+[Langfuse](https://langfuse.com/) is an [open-source](https://github.com/langfuse/langfuse) LLM Observability platform. By enabling the Langfuse integration, you can trace your chat data with Langfuse to develop, monitor, and evaluate the use of your LobeChat.
+### `ENABLE_LANGFUSE`
+- Type: Required
+- Description: Determines if Langfuse analytics is enabled.
+- Default: `1`
+- Example: `1`
+### `LANGFUSE_SECRET_KEY`
+- Type: Required
+- Description: Langfuse API secret key. Can be created by signing up for [Langfuse Cloud](https://cloud.langfuse.com) or by self-hosting Langfuse.
+- Default: \`\`
+- Example: `sk-lf-...`
+### `LANGFUSE_PUBLIC_KEY`
+- Type: Required
+- Description: Langfuse API public key. Can be created by signing up for [Langfuse Cloud](https://cloud.langfuse.com) or by self-hosting Langfuse.
+- Default: \`\`
+- Example: `pk-lf-...`
+### `LANGFUSE_HOST`
+- Type: Required
+- Description: Langfuse host address. Use `https://us.cloud.langfuse.com` if your Langfuse project is in the US data region.
+- Default: `https://cloud.langfuse.com`
+- Example: `https://cloud.langfuse.com`

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@lobehub/chat",
-  "version": "1.34.6",
+  "version": "1.35.0",
   "description": "Lobe Chat - an open-source, high-performance chatbot framework that supports speech synthesis, multimodal, and extensible Function Call plugin system. Supports one-click free deployment of your private ChatGPT/LLM web application.",
   "keywords": [
     "framework",
@@ -181,7 +181,7 @@
     "numeral": "^2.0.6",
     "nuqs": "^1.20.0",
     "officeparser": "^4.2.0",
-    "ollama": "^0.5.9",
+    "ollama": "^0.5.10",
     "openai": "^4.68.1",
     "openapi-fetch": "^0.9.8",
     "partial-json": "^0.1.7",

package/src/config/modelProviders/ollama.ts CHANGED Viewed

@@ -1,6 +1,5 @@
 import { ModelProviderCard } from '@/types/llm';
-// ref: https://ollama.com/library
 const Ollama: ModelProviderCard = {
   chatModels: [
     {
@@ -8,6 +7,7 @@ const Ollama: ModelProviderCard = {
         'Llama 3.1 是 Meta 推出的领先模型，支持高达 405B 参数，可应用于复杂对话、多语言翻译和数据分析领域。',
       displayName: 'Llama 3.1 8B',
       enabled: true,
+      functionCall: true,
       id: 'llama3.1',
       tokens: 128_000,
     },
@@ -221,28 +221,29 @@ const Ollama: ModelProviderCard = {
       tokens: 128_000,
     },
     {
-      description: 'Qwen2 是阿里巴巴的新一代大规模语言模型，以优异的性能支持多元化的应用需求。',
-      displayName: 'Qwen2 0.5B',
-      id: 'qwen2:0.5b',
+      description: 'Qwen2.5 是阿里巴巴的新一代大规模语言模型，以优异的性能支持多元化的应用需求。',
+      displayName: 'Qwen2.5 0.5B',
+      id: 'qwen2.5:0.5b',
       tokens: 128_000,
     },
     {
-      description: 'Qwen2 是阿里巴巴的新一代大规模语言模型，以优异的性能支持多元化的应用需求。',
-      displayName: 'Qwen2 1.5B',
-      id: 'qwen2:1.5b',
+      description: 'Qwen2.5 是阿里巴巴的新一代大规模语言模型，以优异的性能支持多元化的应用需求。',
+      displayName: 'Qwen2.5 1.5B',
+      id: 'qwen2.5:1.5b',
       tokens: 128_000,
     },
     {
-      description: 'Qwen2 是阿里巴巴的新一代大规模语言模型，以优异的性能支持多元化的应用需求。',
-      displayName: 'Qwen2 7B',
+      description: 'Qwen2.5 是阿里巴巴的新一代大规模语言模型，以优异的性能支持多元化的应用需求。',
+      displayName: 'Qwen2.5 7B',
       enabled: true,
-      id: 'qwen2',
+      functionCall: true,
+      id: 'qwen2.5',
       tokens: 128_000,
     },
     {
-      description: 'Qwen2 是阿里巴巴的新一代大规模语言模型，以优异的性能支持多元化的应用需求。',
-      displayName: 'Qwen2 72B',
-      id: 'qwen2:72b',
+      description: 'Qwen2.5 是阿里巴巴的新一代大规模语言模型，以优异的性能支持多元化的应用需求。',
+      displayName: 'Qwen2.5 72B',
+      id: 'qwen2.5:72b',
       tokens: 128_000,
     },
     {

package/src/libs/agent-runtime/ollama/index.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { Ollama } from 'ollama/browser';
+import { Ollama, Tool } from 'ollama/browser';
 import { ClientOptions } from 'openai';
 import { OpenAIChatMessage } from '@/libs/agent-runtime';
@@ -8,8 +8,9 @@ import { LobeRuntimeAI } from '../BaseAI';
 import { AgentRuntimeErrorType } from '../error';
 import { ChatCompetitionOptions, ChatStreamPayload, ModelProvider } from '../types';
 import { AgentRuntimeError } from '../utils/createError';
+import { debugStream } from '../utils/debugStream';
 import { StreamingResponse } from '../utils/response';
-import { OllamaStream } from '../utils/streams';
+import { OllamaStream, convertIterableToStream } from '../utils/streams';
 import { parseDataUri } from '../utils/uriParser';
 import { OllamaMessage } from './type';
@@ -45,23 +46,38 @@ export class LobeOllamaAI implements LobeRuntimeAI {
         options: {
           frequency_penalty: payload.frequency_penalty,
           presence_penalty: payload.presence_penalty,
-          temperature:
-            payload.temperature !== undefined
-            ? payload.temperature / 2
-            : undefined,
+          temperature: payload.temperature !== undefined ? payload.temperature / 2 : undefined,
           top_p: payload.top_p,
         },
         stream: true,
+        tools: payload.tools as Tool[],
       });
-      return StreamingResponse(OllamaStream(response, options?.callback), {
+      const stream = convertIterableToStream(response);
+      const [prod, debug] = stream.tee();
+      if (process.env.DEBUG_OLLAMA_CHAT_COMPLETION === '1') {
+        debugStream(debug).catch(console.error);
+      }
+      return StreamingResponse(OllamaStream(prod, options?.callback), {
         headers: options?.headers,
       });
     } catch (error) {
-      const e = error as { message: string; name: string; status_code: number };
+      const e = error as {
+        error: any;
+        message: string;
+        name: string;
+        status_code: number;
+      };
       throw AgentRuntimeError.chat({
-        error: { message: e.message, name: e.name, status_code: e.status_code },
+        error: {
+          ...e.error,
+          message: String(e.error?.message || e.message),
+          name: e.name,
+          status_code: e.status_code,
+        },
         errorType: AgentRuntimeErrorType.OllamaBizError,
         provider: ModelProvider.Ollama,
       });

package/src/libs/agent-runtime/utils/streams/ollama.test.ts CHANGED Viewed

@@ -6,61 +6,145 @@ import * as uuidModule from '@/utils/uuid';
 import { OllamaStream } from './ollama';
 describe('OllamaStream', () => {
-  it('should transform Ollama stream to protocol stream', async () => {
-    vi.spyOn(uuidModule, 'nanoid').mockReturnValueOnce('1');
+  describe('should transform Ollama stream to protocol stream', () => {
+    it('text', async () => {
+      vi.spyOn(uuidModule, 'nanoid').mockReturnValueOnce('1');
+      const mockOllamaStream = new ReadableStream<ChatResponse>({
+        start(controller) {
+          controller.enqueue({ message: { content: 'Hello' }, done: false } as ChatResponse);
+          controller.enqueue({ message: { content: ' world!' }, done: false } as ChatResponse);
+          controller.enqueue({ message: { content: '' }, done: true } as ChatResponse);
+          controller.close();
+        },
+      });
+      const onStartMock = vi.fn();
+      const onTextMock = vi.fn();
+      const onTokenMock = vi.fn();
+      const onCompletionMock = vi.fn();
+      const protocolStream = OllamaStream(mockOllamaStream, {
+        onStart: onStartMock,
+        onText: onTextMock,
+        onToken: onTokenMock,
+        onCompletion: onCompletionMock,
+      });
+      const decoder = new TextDecoder();
+      const chunks = [];
-    const mockOllamaStream: AsyncIterable<ChatResponse> = {
       // @ts-ignore
-      async *[Symbol.asyncIterator]() {
-        yield { message: { content: 'Hello' }, done: false };
-        yield { message: { content: ' world!' }, done: false };
-        yield { message: { content: '' }, done: true };
-      },
-    };
-    const onStartMock = vi.fn();
-    const onTextMock = vi.fn();
-    const onTokenMock = vi.fn();
-    const onCompletionMock = vi.fn();
-    const protocolStream = OllamaStream(mockOllamaStream, {
-      onStart: onStartMock,
-      onText: onTextMock,
-      onToken: onTokenMock,
-      onCompletion: onCompletionMock,
+      for await (const chunk of protocolStream) {
+        chunks.push(decoder.decode(chunk, { stream: true }));
+      }
+      expect(chunks).toEqual([
+        'id: chat_1\n',
+        'event: text\n',
+        `data: "Hello"\n\n`,
+        'id: chat_1\n',
+        'event: text\n',
+        `data: " world!"\n\n`,
+        'id: chat_1\n',
+        'event: stop\n',
+        `data: "finished"\n\n`,
+      ]);
+      expect(onStartMock).toHaveBeenCalledTimes(1);
+      expect(onTextMock).toHaveBeenNthCalledWith(1, '"Hello"');
+      expect(onTextMock).toHaveBeenNthCalledWith(2, '" world!"');
+      expect(onTokenMock).toHaveBeenCalledTimes(2);
+      expect(onCompletionMock).toHaveBeenCalledTimes(1);
     });
-    const decoder = new TextDecoder();
-    const chunks = [];
+    it('tools use', async () => {
+      vi.spyOn(uuidModule, 'nanoid').mockReturnValueOnce('1');
-    // @ts-ignore
-    for await (const chunk of protocolStream) {
-      chunks.push(decoder.decode(chunk, { stream: true }));
-    }
+      const mockOllamaStream = new ReadableStream<ChatResponse>({
+        start(controller) {
+          controller.enqueue({
+            model: 'qwen2.5',
+            created_at: new Date('2024-12-01T03:34:55.166692Z'),
+            message: {
+              role: 'assistant',
+              content: '',
+              tool_calls: [
+                {
+                  function: {
+                    name: 'realtime-weather____fetchCurrentWeather',
+                    arguments: { city: '杭州' },
+                  },
+                },
+              ],
+            },
+            done: false,
+          } as unknown as ChatResponse);
+          controller.enqueue({
+            model: 'qwen2.5',
+            created_at: '2024-12-01T03:34:55.2133Z',
+            message: { role: 'assistant', content: '' },
+            done_reason: 'stop',
+            done: true,
+            total_duration: 1122415333,
+            load_duration: 26178333,
+            prompt_eval_count: 221,
+            prompt_eval_duration: 507000000,
+            eval_count: 26,
+            eval_duration: 583000000,
+          } as unknown as ChatResponse);
+          controller.close();
+        },
+      });
+      const onStartMock = vi.fn();
+      const onTextMock = vi.fn();
+      const onTokenMock = vi.fn();
+      const onToolCall = vi.fn();
+      const onCompletionMock = vi.fn();
-    expect(chunks).toEqual([
-      'id: chat_1\n',
-      'event: text\n',
-      `data: "Hello"\n\n`,
-      'id: chat_1\n',
-      'event: text\n',
-      `data: " world!"\n\n`,
-      'id: chat_1\n',
-      'event: stop\n',
-      `data: "finished"\n\n`,
-    ]);
-    expect(onStartMock).toHaveBeenCalledTimes(1);
-    expect(onTextMock).toHaveBeenNthCalledWith(1, '"Hello"');
-    expect(onTextMock).toHaveBeenNthCalledWith(2, '" world!"');
-    expect(onTokenMock).toHaveBeenCalledTimes(2);
-    expect(onCompletionMock).toHaveBeenCalledTimes(1);
+      const protocolStream = OllamaStream(mockOllamaStream, {
+        onStart: onStartMock,
+        onText: onTextMock,
+        onToken: onTokenMock,
+        onCompletion: onCompletionMock,
+        onToolCall,
+      });
+      const decoder = new TextDecoder();
+      const chunks = [];
+      // @ts-ignore
+      for await (const chunk of protocolStream) {
+        chunks.push(decoder.decode(chunk, { stream: true }));
+      }
+      expect(chunks).toEqual(
+        [
+          'id: chat_1',
+          'event: tool_calls',
+          `data: [{"function":{"arguments":"{\\"city\\":\\"杭州\\"}","name":"realtime-weather____fetchCurrentWeather"},"id":"realtime-weather____fetchCurrentWeather_0","index":0,"type":"function"}]\n`,
+          'id: chat_1',
+          'event: stop',
+          `data: "finished"\n`,
+        ].map((i) => `${i}\n`),
+      );
+      expect(onTextMock).toHaveBeenCalledTimes(0);
+      expect(onStartMock).toHaveBeenCalledTimes(1);
+      expect(onToolCall).toHaveBeenCalledTimes(1);
+      expect(onTokenMock).toHaveBeenCalledTimes(0);
+      expect(onCompletionMock).toHaveBeenCalledTimes(1);
+    });
   });
   it('should handle empty stream', async () => {
-    const mockOllamaStream = {
-      async *[Symbol.asyncIterator]() {},
-    };
+    const mockOllamaStream = new ReadableStream<ChatResponse>({
+      start(controller) {
+        controller.close();
+      },
+    });
     const protocolStream = OllamaStream(mockOllamaStream);

package/src/libs/agent-runtime/utils/streams/ollama.ts CHANGED Viewed

@@ -6,27 +6,42 @@ import { nanoid } from '@/utils/uuid';
 import {
   StreamProtocolChunk,
   StreamStack,
-  convertIterableToStream,
   createCallbacksTransformer,
   createSSEProtocolTransformer,
+  generateToolCallId,
 } from './protocol';
 const transformOllamaStream = (chunk: ChatResponse, stack: StreamStack): StreamProtocolChunk => {
   // maybe need another structure to add support for multiple choices
-  if (chunk.done) {
+  if (chunk.done && !chunk.message.content) {
     return { data: 'finished', id: stack.id, type: 'stop' };
   }
+  if (chunk.message.tool_calls && chunk.message.tool_calls.length > 0) {
+    return {
+      data: chunk.message.tool_calls.map((value, index) => ({
+        function: {
+          arguments: JSON.stringify(value.function?.arguments) ?? '{}',
+          name: value.function?.name ?? null,
+        },
+        id: generateToolCallId(index, value.function?.name),
+        index: index,
+        type: 'function',
+      })),
+      id: stack.id,
+      type: 'tool_calls',
+    };
+  }
   return { data: chunk.message.content, id: stack.id, type: 'text' };
 };
 export const OllamaStream = (
-  res: AsyncIterable<ChatResponse>,
+  res: ReadableStream<ChatResponse>,
   cb?: ChatStreamCallbacks,
 ): ReadableStream<string> => {
   const streamStack: StreamStack = { id: 'chat_' + nanoid() };
-  return convertIterableToStream(res)
+  return res
     .pipeThrough(createSSEProtocolTransformer(transformOllamaStream, streamStack))
     .pipeThrough(createCallbacksTransformer(cb));
 };

package/src/server/modules/AgentRuntime/index.test.ts CHANGED Viewed

@@ -134,6 +134,7 @@ describe('initAgentRuntimeWithUserPayload method', () => {
       const runtime = await initAgentRuntimeWithUserPayload(ModelProvider.Ollama, jwtPayload);
       expect(runtime).toBeInstanceOf(AgentRuntime);
       expect(runtime['_runtime']).toBeInstanceOf(LobeOllamaAI);
+      expect(runtime['_runtime']['baseURL']).toEqual(jwtPayload.endpoint);
     });
     it('Perplexity AI provider: with apikey', async () => {
@@ -391,7 +392,7 @@ describe('initAgentRuntimeWithUserPayload method', () => {
       // endpoint 不存在，应返回 DEFAULT_BASE_URL
       expect(runtime['_runtime'].baseURL).toBe('https://dashscope.aliyuncs.com/compatible-mode/v1');
     });
     it('Unknown Provider', async () => {
       const jwtPayload = {};
       const runtime = await initAgentRuntimeWithUserPayload('unknown', jwtPayload);

package/src/server/modules/AgentRuntime/index.ts CHANGED Viewed

@@ -33,7 +33,7 @@ const getLlmOptionsFromPayload = (provider: string, payload: JWTPayload) => {
     default: {
       let upperProvider = provider.toUpperCase();
-      if (!( `${upperProvider}_API_KEY` in llmConfig)) {
+      if (!(`${upperProvider}_API_KEY` in llmConfig)) {
         upperProvider = ModelProvider.OpenAI.toUpperCase(); // Use OpenAI options as default
       }
@@ -43,6 +43,12 @@ const getLlmOptionsFromPayload = (provider: string, payload: JWTPayload) => {
       return baseURL ? { apiKey, baseURL } : { apiKey };
     }
+    case ModelProvider.Ollama: {
+      const baseURL = payload?.endpoint || process.env.OLLAMA_PROXY_URL;
+      return { baseURL };
+    }
     case ModelProvider.Azure: {
       const { AZURE_API_KEY, AZURE_API_VERSION, AZURE_ENDPOINT } = llmConfig;
       const apikey = apiKeyManager.pick(payload?.apiKey || AZURE_API_KEY);