@lobehub/chat 1.133.3 → 1.133.4

This diff shows the changes between two publicly released versions of the package, as published to their public registry. It is provided for informational purposes only.
@@ -76,12 +76,11 @@ jobs:
 
  - Title: English translation (if non-English)
  - Content format:
- > [!NOTE]
- > This issue/comment/review was translated by Claude.
-
  [Translated content]
 
  ---
+ > This issue/comment/review was translated by Claude.
+
  <details>
  <summary>Original Content</summary>
  [Original content]
@@ -28,8 +28,7 @@ jobs:
  👀 @{{ author }}
 
  Thank you for raising an issue. We will investigate into the matter and get back to you as soon as possible.
- Please make sure you have given us as much context as possible.\
- 非常感谢您提交 issue。我们会尽快调查此事,并尽快回复您。 请确保您已经提供了尽可能多的背景信息。
+ Please make sure you have given us as much context as possible.
  - name: Auto Comment on Issues Closed
  uses: wow-actions/auto-comment@v1
  with:
@@ -37,8 +36,7 @@ jobs:
  issuesClosed: |
  ✅ @{{ author }}
 
- This issue is closed, If you have any questions, you can comment and reply.\
- 此问题已经关闭。如果您有任何问题,可以留言并回复。
+ This issue is closed, If you have any questions, you can comment and reply.
  - name: Auto Comment on Pull Request Opened
  uses: wow-actions/auto-comment@v1
  with:
@@ -48,9 +46,7 @@ jobs:
 
  Thank you for raising your pull request and contributing to our Community
  Please make sure you have followed our contributing guidelines. We will review it as soon as possible.
- If you encounter any problems, please feel free to connect with us.\
- 非常感谢您提出拉取请求并为我们的社区做出贡献,请确保您已经遵循了我们的贡献指南,我们会尽快审查它。
- 如果您遇到任何问题,请随时与我们联系。
+ If you encounter any problems, please feel free to connect with us.
  - name: Auto Comment on Pull Request Merged
  uses: actions-cool/pr-welcome@main
  if: github.event.pull_request.merged == true
@@ -59,8 +55,7 @@ jobs:
  comment: |
  ❤️ Great PR @${{ github.event.pull_request.user.login }} ❤️
 
- The growth of project is inseparable from user feedback and contribution, thanks for your contribution! If you are interesting with the lobehub developer community, please join our [discord](https://discord.com/invite/AYFPHvv2jT) and then dm @arvinxx or @canisminor1990. They will invite you to our private developer channel. We are talking about the lobe-chat development or sharing ai newsletter around the world.\
- 项目的成长离不开用户反馈和贡献,感谢您的贡献! 如果您对 LobeHub 开发者社区感兴趣,请加入我们的 [discord](https://discord.com/invite/AYFPHvv2jT),然后私信 @arvinxx 或 @canisminor1990。他们会邀请您加入我们的私密开发者频道。我们将会讨论关于 Lobe Chat 的开发,分享和讨论全球范围内的 AI 消息。
+ The growth of project is inseparable from user feedback and contribution, thanks for your contribution! If you are interesting with the lobehub developer community, please join our [discord](https://discord.com/invite/AYFPHvv2jT) and then dm @arvinxx or @canisminor1990. They will invite you to our private developer channel. We are talking about the lobe-chat development or sharing ai newsletter around the world.
  emoji: 'hooray'
  pr-emoji: '+1, heart'
  - name: Remove inactive
@@ -38,8 +38,7 @@ jobs:
  body: |
  👋 @{{ author }}
  <br/>
- Since the issue was labeled with `✅ Fixed`, but no response in 3 days. This issue will be closed. If you have any questions, you can comment and reply.\
- 由于该 issue 被标记为已修复,同时 3 天未收到回应。现关闭 issue,若有任何问题,可评论回复。
+ Since the issue was labeled with `✅ Fixed`, but no response in 3 days. This issue will be closed. If you have any questions, you can comment and reply.
  - name: need reproduce
  uses: actions-cool/issues-helper@v3
  with:
@@ -50,8 +49,7 @@ jobs:
  body: |
  👋 @{{ author }}
  <br/>
- Since the issue was labeled with `🤔 Need Reproduce`, but no response in 3 days. This issue will be closed. If you have any questions, you can comment and reply.\
- 由于该 issue 被标记为需要更多信息,却 3 天未收到回应。现关闭 issue,若有任何问题,可评论回复。
+ Since the issue was labeled with `🤔 Need Reproduce`, but no response in 3 days. This issue will be closed. If you have any questions, you can comment and reply.
  - name: need reproduce
  uses: actions-cool/issues-helper@v3
  with:
@@ -62,5 +60,4 @@ jobs:
  body: |
  👋 @{{ github.event.issue.user.login }}
  <br/>
- Since the issue was labeled with `🙅🏻‍♀️ WON'T DO`, and no response in 3 days. This issue will be closed. If you have any questions, you can comment and reply.\
- 由于该 issue 被标记为暂不处理,同时 3 天未收到回应。现关闭 issue,若有任何问题,可评论回复。
+ Since the issue was labeled with `🙅🏻‍♀️ WON'T DO`, and no response in 3 days. This issue will be closed. If you have any questions, you can comment and reply.
package/CHANGELOG.md CHANGED
@@ -2,6 +2,39 @@
 
  # Changelog
 
+ ### [Version 1.133.4](https://github.com/lobehub/lobe-chat/compare/v1.133.3...v1.133.4)
+
+ <sup>Released on **2025-10-01**</sup>
+
+ #### 🐛 Bug Fixes
+
+ - **misc**: OllamaCloud error.
+
+ #### 💄 Styles
+
+ - **misc**: Fix chat minimap overflow.
+
+ <br/>
+
+ <details>
+ <summary><kbd>Improvements and Fixes</kbd></summary>
+
+ #### What's fixed
+
+ - **misc**: OllamaCloud error, closes [#9481](https://github.com/lobehub/lobe-chat/issues/9481) ([55c45a5](https://github.com/lobehub/lobe-chat/commit/55c45a5))
+
+ #### Styles
+
+ - **misc**: Fix chat minimap overflow, closes [#9507](https://github.com/lobehub/lobe-chat/issues/9507) ([d835c33](https://github.com/lobehub/lobe-chat/commit/d835c33))
+
+ </details>
+
+ <div align="right">
+
+ [![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+
+ </div>
+
  ### [Version 1.133.3](https://github.com/lobehub/lobe-chat/compare/v1.133.2...v1.133.3)
 
  <sup>Released on **2025-10-01**</sup>
package/changelog/v1.json CHANGED
@@ -1,4 +1,16 @@
  [
+ {
+ "children": {
+ "fixes": [
+ "OllamaCloud error."
+ ],
+ "improvements": [
+ "Fix chat minimap overflow."
+ ]
+ },
+ "date": "2025-10-01",
+ "version": "1.133.4"
+ },
  {
  "children": {
  "improvements": [
package/package.json CHANGED
@@ -1,6 +1,6 @@
  {
  "name": "@lobehub/chat",
- "version": "1.133.3",
+ "version": "1.133.4",
  "description": "Lobe Chat - an open-source, high-performance chatbot framework that supports speech synthesis, multimodal, and extensible Function Call plugin system. Supports one-click free deployment of your private ChatGPT/LLM web application.",
  "keywords": [
  "framework",
@@ -526,6 +526,40 @@ const aihubmixModels: AIChatModelCard[] = [
  },
  type: 'chat',
  },
+ {
+ abilities: {
+ functionCall: true,
+ reasoning: true,
+ search: true,
+ vision: true,
+ },
+ contextWindowTokens: 200_000,
+ description:
+ 'Sonnet 4.5 是世界上最好的代理、编码和计算机使用模型。它也是我们在长时间运行任务中最准确、最详细的模型,具有增强的编码、金融和网络安全领域知识。',
+ displayName: 'Claude Sonnet 4.5',
+ enabled: true,
+ id: 'claude-sonnet-4-5-20250929',
+ maxOutput: 64_000,
+ pricing: {
+ units: [
+ { name: 'textInput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
+ { name: 'textOutput', rate: 15, strategy: 'fixed', unit: 'millionTokens' },
+ { name: 'textInput_cacheRead', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
+ {
+ lookup: { prices: { '1h': 6, '5m': 3.75 }, pricingParams: ['ttl'] },
+ name: 'textInput_cacheWrite',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ ],
+ },
+ releasedAt: '2025-09-29',
+ settings: {
+ extendParams: ['disableContextCaching', 'enableReasoning', 'reasoningBudgetToken'],
+ searchImpl: 'params',
+ },
+ type: 'chat',
+ },
  {
  abilities: {
  functionCall: true,
@@ -537,7 +571,6 @@ const aihubmixModels: AIChatModelCard[] = [
  description:
  'Claude Sonnet 4 可以产生近乎即时的响应或延长的逐步思考,用户可以清晰地看到这些过程。API 用户还可以对模型思考的时间进行细致的控制',
  displayName: 'Claude Sonnet 4',
- enabled: true,
  id: 'claude-sonnet-4-20250514',
  maxOutput: 64_000,
  pricing: {
@@ -22,7 +22,7 @@ const anthropicChatModels: AIChatModelCard[] = [
  { name: 'textInput_cacheWrite', rate: 3.75, strategy: 'fixed', unit: 'millionTokens' },
  ],
  },
- releasedAt: '2025-09-30',
+ releasedAt: '2025-09-29',
  settings: {
  extendParams: ['disableContextCaching', 'enableReasoning', 'reasoningBudgetToken'],
  searchImpl: 'params',
@@ -107,7 +107,6 @@ const anthropicChatModels: AIChatModelCard[] = [
  description:
  'Claude Sonnet 4 可以产生近乎即时的响应或延长的逐步思考,用户可以清晰地看到这些过程。API 用户还可以对模型思考的时间进行细致的控制',
  displayName: 'Claude Sonnet 4',
- enabled: true,
  id: 'claude-sonnet-4-20250514',
  maxOutput: 64_000,
  pricing: {
@@ -172,7 +171,7 @@ const anthropicChatModels: AIChatModelCard[] = [
  contextWindowTokens: 200_000,
  description:
  'Claude 3.5 Sonnet 提供了超越 Opus 的能力和比 Sonnet 更快的速度,同时保持与 Sonnet 相同的价格。Sonnet 特别擅长编程、数据科学、视觉处理、代理任务。',
- displayName: 'Claude 3.5 Sonnet v2',
+ displayName: 'Claude 3.5 Sonnet (New)',
  id: 'claude-3-5-sonnet-20241022',
  maxOutput: 8192,
  pricing: {
@@ -203,7 +202,7 @@ const anthropicChatModels: AIChatModelCard[] = [
  contextWindowTokens: 200_000,
  description:
  'Claude 3.5 Sonnet 提供了超越 Opus 的能力和比 Sonnet 更快的速度,同时保持与 Sonnet 相同的价格。Sonnet 特别擅长编程、数据科学、视觉处理、代理任务。',
- displayName: 'Claude 3.5 Sonnet',
+ displayName: 'Claude 3.5 Sonnet (Old)',
  id: 'claude-3-5-sonnet-20240620',
  maxOutput: 8192,
  pricing: {
@@ -235,7 +234,6 @@ const anthropicChatModels: AIChatModelCard[] = [
  description:
  'Claude 3.5 Haiku 是 Anthropic 最快的下一代模型。与 Claude 3 Haiku 相比,Claude 3.5 Haiku 在各项技能上都有所提升,并在许多智力基准测试中超越了上一代最大的模型 Claude 3 Opus。',
  displayName: 'Claude 3.5 Haiku',
- enabled: true,
  id: 'claude-3-5-haiku-20241022',
  maxOutput: 8192,
  pricing: {
@@ -287,33 +285,6 @@ const anthropicChatModels: AIChatModelCard[] = [
  },
  type: 'chat',
  },
- {
- abilities: {
- functionCall: true,
- vision: true,
- },
- contextWindowTokens: 200_000,
- description:
- 'Claude 3 Sonnet 在智能和速度方面为企业工作负载提供了理想的平衡。它以更低的价格提供最大效用,可靠且适合大规模部署。',
- displayName: 'Claude 3 Sonnet',
- id: 'claude-3-sonnet-20240229', // 弃用日期 2025年7月21日
- maxOutput: 4096,
- pricing: {
- units: [
- { name: 'textInput_cacheRead', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textInput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 15, strategy: 'fixed', unit: 'millionTokens' },
- {
- lookup: { prices: { '1h': 6, '5m': 3.75 }, pricingParams: ['ttl'] },
- name: 'textInput_cacheWrite',
- strategy: 'lookup',
- unit: 'millionTokens',
- },
- ],
- },
- releasedAt: '2024-02-29',
- type: 'chat',
- },
  {
  abilities: {
  functionCall: true,
@@ -344,38 +315,6 @@ const anthropicChatModels: AIChatModelCard[] = [
  },
  type: 'chat',
  },
- {
- contextWindowTokens: 200_000,
- description:
- 'Claude 2 为企业提供了关键能力的进步,包括业界领先的 200K token 上下文、大幅降低模型幻觉的发生率、系统提示以及一个新的测试功能:工具调用。',
- displayName: 'Claude 2.1',
- id: 'claude-2.1', // 弃用日期 2025年7月21日
- maxOutput: 4096,
- pricing: {
- units: [
- { name: 'textInput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 24, strategy: 'fixed', unit: 'millionTokens' },
- ],
- },
- releasedAt: '2023-11-21',
- type: 'chat',
- },
- {
- contextWindowTokens: 100_000,
- description:
- 'Claude 2 为企业提供了关键能力的进步,包括业界领先的 200K token 上下文、大幅降低模型幻觉的发生率、系统提示以及一个新的测试功能:工具调用。',
- displayName: 'Claude 2.0',
- id: 'claude-2.0', // 弃用日期 2025年7月21日
- maxOutput: 4096,
- pricing: {
- units: [
- { name: 'textInput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 24, strategy: 'fixed', unit: 'millionTokens' },
- ],
- },
- releasedAt: '2023-07-11',
- type: 'chat',
- },
  ];
 
  export const allModels = [...anthropicChatModels];
@@ -30,8 +30,8 @@ const novitaChatModels: AIChatModelCard[] = [
  maxOutput: 32_768,
  pricing: {
  units: [
- { name: 'textInput', rate: 0.3, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
+ { name: 'textInput', rate: 0.98, strategy: 'fixed', unit: 'millionTokens' },
+ { name: 'textOutput', rate: 3.95, strategy: 'fixed', unit: 'millionTokens' },
  ],
  },
  type: 'chat',
@@ -55,6 +55,27 @@ const qwenChatModels: AIChatModelCard[] = [
  },
  type: 'chat',
  },
+ {
+ abilities: {
+ reasoning: true,
+ },
+ contextWindowTokens: 131_072,
+ description: 'deepseek-v3.2-exp 引入稀疏注意力机制,旨在提升处理长文本时的训练与推理效率,价格低于 deepseek-v3.1。',
+ displayName: 'DeepSeek V3.2 Exp',
+ id: 'deepseek-v3.2-exp',
+ maxOutput: 65_536,
+ pricing: {
+ currency: 'CNY',
+ units: [
+ { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
+ { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
+ ],
+ },
+ settings: {
+ extendParams: ['enableReasoning', 'reasoningBudgetToken'],
+ },
+ type: 'chat',
+ },
  {
  abilities: {
  reasoning: true,
@@ -1,6 +1,72 @@
  import { AIChatModelCard, AIImageModelCard } from '../types/aiModel';
 
+ // price: https://bigmodel.cn/pricing
+ // ref: https://docs.bigmodel.cn/cn/guide/start/model-overview
+
  const zhipuChatModels: AIChatModelCard[] = [
+ {
+ abilities: {
+ functionCall: true,
+ reasoning: true,
+ search: true,
+ },
+ contextWindowTokens: 200_000,
+ description:
+ '智谱最新旗舰模型 GLM-4.6 (355B) 在高级编码、长文本处理、推理与智能体能力上全面超越前代,尤其在编程能力上对齐 Claude Sonnet 4,成为国内顶尖的 Coding 模型。',
+ displayName: 'GLM-4.6',
+ enabled: true,
+ id: 'glm-4.6',
+ maxOutput: 128_000,
+ pricing: {
+ currency: 'CNY',
+ units: [
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 0.4,
+ '[0, 32_000]_[200, infinity]': 0.6,
+ '[32_000, 200_000]': 0.8,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textInput_cacheRead',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 2,
+ '[0, 32_000]_[200, infinity]': 3,
+ '[32_000, 200_000]': 4,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textInput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 8,
+ '[0, 32_000]_[200, infinity]': 14,
+ '[32_000, 200_000]': 16,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textOutput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ ],
+ },
+ settings: {
+ extendParams: ['enableReasoning'],
+ searchImpl: 'params',
+ },
+ type: 'chat',
+ },
  {
  abilities: {
  functionCall: true,
@@ -18,10 +84,42 @@ const zhipuChatModels: AIChatModelCard[] = [
  pricing: {
  currency: 'CNY',
  units: [
- // 输入长度 [0, 32]
- { name: 'textInput_cacheRead', rate: 0.4, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 6, strategy: 'fixed', unit: 'millionTokens' },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]': 0.4,
+ '[32_000, 65_536]': 0.8,
+ },
+ pricingParams: ['textInput'],
+ },
+ name: 'textInput_cacheRead',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]': 2,
+ '[32_000, 65_536]': 4,
+ },
+ pricingParams: ['textInput'],
+ },
+ name: 'textInput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]': 6,
+ '[32_000, 65_536]': 12,
+ },
+ pricingParams: ['textInput'],
+ },
+ name: 'textOutput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
  ],
  },
  settings: {
@@ -38,17 +136,52 @@ const zhipuChatModels: AIChatModelCard[] = [
  },
  contextWindowTokens: 128_000,
  description:
- '智谱最新旗舰模型,支持思考模式切换,综合能力达到开源模型的 SOTA 水平,上下文长度可达128K。',
+ '智谱旗舰模型,支持思考模式切换,综合能力达到开源模型的 SOTA 水平,上下文长度可达128K。',
  displayName: 'GLM-4.5',
- enabled: true,
  id: 'glm-4.5',
  maxOutput: 32_768,
  pricing: {
  currency: 'CNY',
  units: [
- { name: 'textInput_cacheRead', rate: 0.8, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 16, strategy: 'fixed', unit: 'millionTokens' },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 0.4,
+ '[0, 32_000]_[200, infinity]': 0.6,
+ '[32_000, 128_000]': 0.8,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textInput_cacheRead',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 2,
+ '[0, 32_000]_[200, infinity]': 3,
+ '[32_000, 128_000]': 4,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textInput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 8,
+ '[0, 32_000]_[200, infinity]': 14,
+ '[32_000, 128_000]': 16,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textOutput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
  ],
  },
  settings: {
@@ -71,9 +204,45 @@ const zhipuChatModels: AIChatModelCard[] = [
  pricing: {
  currency: 'CNY',
  units: [
- { name: 'textInput_cacheRead', rate: 3.2, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textInput', rate: 16, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 64, strategy: 'fixed', unit: 'millionTokens' },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]': 1.6,
+ '[0, 32_000]_[200, infinity]': 2.4,
+ '[32_000, 128_000]': 3.2,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textInput_cacheRead',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 8,
+ '[0, 32_000]_[200, infinity]': 12,
+ '[32_000, 128_000]': 16,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textInput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 16,
+ '[0, 32_000]_[200, infinity]': 32,
+ '[32_000, 128_000]': 64,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textOutput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
  ],
  },
  settings: {
@@ -96,9 +265,43 @@ const zhipuChatModels: AIChatModelCard[] = [
  pricing: {
  currency: 'CNY',
  units: [
- { name: 'textInput_cacheRead', rate: 0.24, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textInput', rate: 1.2, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]': 0.16,
+ '[32_000, 128_000]': 0.24,
+ },
+ pricingParams: ['textInput'],
+ },
+ name: 'textInput_cacheRead',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]': 0.8,
+ '[32_000, 128_000]': 1.2,
+ },
+ pricingParams: ['textInput'],
+ },
+ name: 'textInput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 2,
+ '[0, 32_000]_[200, infinity]': 6,
+ '[32_000, 128_000]': 8,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textOutput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
  ],
  },
  settings: {
@@ -121,9 +324,43 @@ const zhipuChatModels: AIChatModelCard[] = [
  pricing: {
  currency: 'CNY',
  units: [
- { name: 'textInput_cacheRead', rate: 1.6, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textInput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 32, strategy: 'fixed', unit: 'millionTokens' },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]': 0.8,
+ '[32_000, 128_000]': 1.6,
+ },
+ pricingParams: ['textInput'],
+ },
+ name: 'textInput_cacheRead',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]': 4,
+ '[32_000, 128_000]': 8,
+ },
+ pricingParams: ['textInput'],
+ },
+ name: 'textInput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
+ {
+ lookup: {
+ prices: {
+ '[0, 32_000]_[0, 200]': 12,
+ '[0, 32_000]_[200, infinity]': 16,
+ '[32_000, 128_000]': 32,
+ },
+ pricingParams: ['textInput', 'textOutput'],
+ },
+ name: 'textOutput',
+ strategy: 'lookup',
+ unit: 'millionTokens',
+ },
  ],
  },
  settings: {
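The zhipu hunks above all make the same move: flat per-million rates become `lookup` tables whose keys encode token-count brackets (for example the `'[0, 32_000]': 4` / `'[32_000, 128_000]': 8` input tier directly above). As a rough sketch of how such bracketed keys could be resolved at billing time (this resolver is hypothetical, not the package's actual pricing code):

```typescript
// Hypothetical resolver for the bracketed lookup keys used in the pricing
// tables above. A key like '[0, 32_000]' is read as a half-open token range;
// 'infinity' marks an unbounded upper edge. Not the package's real API.
type LookupPrices = Record<string, number>;

function resolveRate(prices: LookupPrices, textInput: number): number | undefined {
  for (const [key, rate] of Object.entries(prices)) {
    const match = key.match(/^\[(\d[\d_]*),\s*(\d[\d_]*|infinity)\]/);
    if (!match) continue;
    const lo = Number(match[1].replace(/_/g, ''));
    const hi = match[2] === 'infinity' ? Infinity : Number(match[2].replace(/_/g, ''));
    if (textInput >= lo && textInput < hi) return rate;
  }
  return undefined;
}

// Mirrors the textInput tier in the hunk directly above.
const textInputTier: LookupPrices = { '[0, 32_000]': 4, '[32_000, 128_000]': 8 };

resolveRate(textInputTier, 10_000); // 4 — short prompt, lower tier
resolveRate(textInputTier, 50_000); // 8 — long prompt, higher tier
```

Two-parameter keys such as `'[0, 32_000]_[0, 200]'` additionally bracket the output length, so a full resolver would match one range per entry in `pricingParams`.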
@@ -187,7 +424,6 @@ const zhipuChatModels: AIChatModelCard[] = [
  description:
  'GLM-4.1V-Thinking 系列模型是目前已知10B级别的VLM模型中性能最强的视觉模型,融合了同级别SOTA的各项视觉语言任务,包括视频理解、图片问答、学科解题、OCR文字识别、文档和图表解读、GUI Agent、前端网页Coding、Grounding等,多项任务能力甚至超过8倍参数量的Qwen2.5-VL-72B。通过领先的强化学习技术,模型掌握了通过思维链推理的方式提升回答的准确性和丰富度,从最终效果和可解释性等维度都显著超过传统的非thinking模型。',
  displayName: 'GLM-4.1V-Thinking-Flash',
- enabled: true,
  id: 'glm-4.1v-thinking-flash',
  maxOutput: 16_384,
  pricing: {
@@ -414,28 +650,6 @@ const zhipuChatModels: AIChatModelCard[] = [
  },
  type: 'chat',
  },
- {
- abilities: {
- functionCall: true,
- search: true,
- },
- contextWindowTokens: 128_000,
- description:
- 'GLM-4-AllTools 是一个多功能智能体模型,优化以支持复杂指令规划与工具调用,如网络浏览、代码解释和文本生成,适用于多任务执行。',
- displayName: 'GLM-4-AllTools',
- id: 'glm-4-alltools',
- pricing: {
- currency: 'CNY',
- units: [
- { name: 'textInput', rate: 100, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 100, strategy: 'fixed', unit: 'millionTokens' },
- ],
- },
- settings: {
- searchImpl: 'params',
- },
- type: 'chat',
- },
  {
  abilities: {
  functionCall: true,
@@ -479,27 +693,6 @@ const zhipuChatModels: AIChatModelCard[] = [
  },
  type: 'chat',
  },
- {
- abilities: {
- functionCall: true,
- search: true,
- },
- contextWindowTokens: 128_000,
- description: 'GLM-4 是发布于2024年1月的旧旗舰版本,目前已被更强的 GLM-4-0520 取代。',
- displayName: 'GLM-4',
- id: 'glm-4', // 弃用时间 2025年6月30日
- pricing: {
- currency: 'CNY',
- units: [
- { name: 'textInput', rate: 100, strategy: 'fixed', unit: 'millionTokens' },
- { name: 'textOutput', rate: 100, strategy: 'fixed', unit: 'millionTokens' },
- ],
- },
- settings: {
- searchImpl: 'params',
- },
- type: 'chat',
- },
  {
  abilities: {
  vision: true,
@@ -793,18 +793,6 @@ describe('LobeAnthropicAI', () => {
  expect(result.max_tokens).toBe(4096);
  });
 
- it('should set correct max_tokens based on model for non claude-3 models', async () => {
- const payload: ChatStreamPayload = {
- messages: [{ content: 'Hello', role: 'user' }],
- model: 'claude-2.1',
- temperature: 0.7,
- };
-
- const result = await instance['buildAnthropicPayload'](payload);
-
- expect(result.max_tokens).toBe(4096);
- });
-
  it('should respect max_tokens when explicitly provided', async () => {
  const payload: ChatStreamPayload = {
  max_tokens: 2000,
@@ -29,6 +29,7 @@ export const LobeNovitaAI = createOpenAICompatibleRuntime({
  const formattedModels = modelList.map((m) => {
  const mm = m as any;
  const features: string[] = Array.isArray(mm.features) ? mm.features : [];
+ const inputModalities: string[] = Array.isArray(mm.input_modalities) ? mm.input_modalities : [];
 
  return {
  contextWindowTokens: mm.context_size ?? mm.max_output_tokens ?? undefined,
@@ -44,7 +45,7 @@ export const LobeNovitaAI = createOpenAICompatibleRuntime({
  },
  reasoning: features.includes('reasoning') || false,
  type: mm.model_type ?? undefined,
- vision: features.includes('vision') || false,
+ vision: inputModalities.includes('image') || features.includes('vision') || false,
  } as any;
  });
 
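The runtime hunk above widens Novita's vision detection: a model now also counts as vision-capable when its `input_modalities` include `'image'`, not only when `features` lists `'vision'`. The rule restated in isolation (interface trimmed to the two fields involved):

```typescript
// Restatement of the widened vision check from the hunk above,
// reduced to the two optional fields it actually inspects.
interface NovitaModelLike {
  features?: string[];
  input_modalities?: string[];
}

function supportsVision(m: NovitaModelLike): boolean {
  const features = Array.isArray(m.features) ? m.features : [];
  const inputModalities = Array.isArray(m.input_modalities) ? m.input_modalities : [];
  return inputModalities.includes('image') || features.includes('vision');
}
```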
@@ -2,8 +2,12 @@ export interface NovitaModelCard {
  context_size: number;
  created: number;
  description: string;
+ features?: string[];
  id: string;
+ input_modalities?: string[];
  input_token_price_per_m: number;
+ max_output_tokens?: number;
+ model_type?: string;
  output_token_price_per_m: number;
  status: number;
  tags: string[];
@@ -4,7 +4,7 @@ import { createOpenAICompatibleRuntime } from '../../core/openaiCompatibleFactor
  import { processMultiProviderModelList } from '../../utils/modelParse';
 
  export const LobeOllamaCloudAI = createOpenAICompatibleRuntime({
- baseURL: 'https://api.ollama.com/v1',
+ baseURL: 'https://ollama.com/v1',
  chatCompletion: {
  handlePayload: (payload) => {
  const { model, ...rest } = payload;
@@ -73,11 +73,18 @@ export const LobeOpenRouterAI = createOpenAICompatibleRuntime({
  const { endpoint } = model;
  const endpointModel = endpoint?.model;
 
- const displayName = model.slug?.toLowerCase().includes('deepseek')
+ const inputModalities = endpointModel?.input_modalities || model.input_modalities;
+
+ let displayName = model.slug?.toLowerCase().includes('deepseek') && !model.short_name?.toLowerCase().includes('deepseek')
  ? (model.name ?? model.slug)
  : (model.short_name ?? model.name ?? model.slug);
 
- const inputModalities = endpointModel?.input_modalities || model.input_modalities;
+ const inputPrice = formatPrice(endpoint?.pricing?.prompt);
+ const outputPrice = formatPrice(endpoint?.pricing?.completion);
+ const isFree = (inputPrice === 0 || outputPrice === 0) && !displayName.endsWith('(free)');
+ if (isFree) {
+ displayName += ' (free)';
+ }
 
  return {
  contextWindowTokens: endpoint?.context_length || model.context_length,
@@ -90,8 +97,8 @@ export const LobeOpenRouterAI = createOpenAICompatibleRuntime({
  ? endpoint.max_completion_tokens
  : undefined,
  pricing: {
- input: formatPrice(endpoint?.pricing?.prompt),
- output: formatPrice(endpoint?.pricing?.completion),
+ input: inputPrice,
+ output: outputPrice,
  },
  reasoning: endpoint?.supports_reasoning || false,
  releasedAt: new Date(model.created_at).toISOString().split('T')[0],
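The OpenRouter hunk above computes the two prices once and appends a `' (free)'` suffix when either resolves to zero, unless the upstream name already carries one. The suffix rule restated standalone — note the `formatPrice` body here is a stand-in stub, not the runtime's actual helper:

```typescript
// Standalone restatement of the free-model labeling added above.
// `formatPrice` is a stand-in stub: the real helper lives in the runtime.
function formatPrice(price?: string): number | undefined {
  return price === undefined ? undefined : Number(price);
}

function withFreeSuffix(displayName: string, prompt?: string, completion?: string): string {
  const inputPrice = formatPrice(prompt);
  const outputPrice = formatPrice(completion);
  // Free if either side prices at zero and the name is not already suffixed.
  const isFree = (inputPrice === 0 || outputPrice === 0) && !displayName.endsWith('(free)');
  return isFree ? `${displayName} (free)` : displayName;
}
```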
@@ -18,7 +18,6 @@
  "dompurify": "^3.2.7"
  },
  "devDependencies": {
- "@types/dompurify": "^3.2.0",
  "vitest-canvas-mock": "^0.3.3"
  }
  }
@@ -129,6 +129,26 @@ const useStyles = createStyles(({ css, token }) => ({
  opacity: 1;
  }
  `,
+ railContent: css`
+ scrollbar-width: none;
+
+ overflow-y: auto;
+ display: flex;
+ flex-direction: column;
+ gap: 0;
+ align-items: end;
+ justify-content: space-between;
+
+ max-height: round(down, 50vh, 12px);
+
+ /* Hide scrollbar for IE, Edge and Firefox */
+ -ms-overflow-style: none;
+
+ /* Hide scrollbar for Chrome, Safari and Opera */
+ &::-webkit-scrollbar {
+ display: none;
+ }
+ `,
  }));
 
  const getIndicatorWidth = (content: string | undefined) => {
@@ -245,8 +265,6 @@ const ChatMinimap = () => {
  }
  targetPosition = matched === -1 ? 0 : matched;
  } else {
- console.log('activeIndex', activeIndex);
- console.log('indicators', indicators);
  let matched = indicators.length - 1;
  for (const [pos, indicator] of indicators.entries()) {
  if (indicator.virtuosoIndex > activeIndex) {
@@ -295,28 +313,38 @@ const ChatMinimap = () => {
  <Icon color={theme.colorTextTertiary} icon={ChevronUp} size={16} />
  </button>
  </Tooltip>
- {indicators.map(({ id, width, preview, virtuosoIndex }, position) => {
- const isActive = activeIndicatorPosition === position;
-
- return (
- <Tooltip key={id} mouseEnterDelay={0.1} placement={'left'} title={preview || undefined}>
- <button
- aria-current={isActive ? 'true' : undefined}
- aria-label={t('minimap.jumpToMessage', { index: position + 1 })}
- className={styles.indicator}
- onClick={() => handleJump(virtuosoIndex)}
- style={{
- width,
- }}
- type={'button'}
+ <Flexbox className={styles.railContent}>
+ {indicators.map(({ id, width, preview, virtuosoIndex }, position) => {
+ const isActive = activeIndicatorPosition === position;
+
+ return (
+ <Tooltip
+ key={id}
+ mouseEnterDelay={0.1}
+ placement={'left'}
+ title={preview || undefined}
  >
- <div
- className={cx(styles.indicatorContent, isActive && styles.indicatorContentActive)}
- />
- </button>
- </Tooltip>
- );
- })}
+ <button
+ aria-current={isActive ? 'true' : undefined}
+ aria-label={t('minimap.jumpToMessage', { index: position + 1 })}
+ className={styles.indicator}
+ onClick={() => handleJump(virtuosoIndex)}
+ style={{
+ width,
+ }}
+ type={'button'}
+ >
+ <div
+ className={cx(
+ styles.indicatorContent,
+ isActive && styles.indicatorContentActive,
+ )}
+ />
+ </button>
+ </Tooltip>
+ );
+ })}
+ </Flexbox>
  <Tooltip mouseEnterDelay={0.1} placement={'left'} title={t('minimap.nextMessage')}>
  <button
  aria-label={t('minimap.nextMessage')}
@@ -1,6 +1,5 @@
  import { ModelProviderCard } from '@/types/llm';
 
- // ref: https://docs.anthropic.com/en/docs/about-claude/models#model-names
  const Anthropic: ModelProviderCard = {
  chatModels: [
  {
@@ -83,17 +82,6 @@ const Anthropic: ModelProviderCard = {
  releasedAt: '2024-03-07',
  vision: true,
  },
- {
- contextWindowTokens: 200_000,
- description:
- 'Claude 3 Sonnet 在智能和速度方面为企业工作负载提供了理想的平衡。它以更低的价格提供最大效用,可靠且适合大规模部署。',
- displayName: 'Claude 3 Sonnet',
- functionCall: true,
- id: 'claude-3-sonnet-20240229',
- maxOutput: 4096,
- releasedAt: '2024-02-29',
- vision: true,
- },
  {
  contextWindowTokens: 200_000,
  description:
@@ -106,24 +94,6 @@ const Anthropic: ModelProviderCard = {
  releasedAt: '2024-02-29',
  vision: true,
  },
- {
- contextWindowTokens: 200_000,
- description:
- 'Claude 2 为企业提供了关键能力的进步,包括业界领先的 200K token 上下文、大幅降低模型幻觉的发生率、系统提示以及一个新的测试功能:工具调用。',
- displayName: 'Claude 2.1',
- id: 'claude-2.1',
- maxOutput: 4096,
- releasedAt: '2023-11-21',
- },
- {
- contextWindowTokens: 100_000,
- description:
- 'Claude 2 为企业提供了关键能力的进步,包括业界领先的 200K token 上下文、大幅降低模型幻觉的发生率、系统提示以及一个新的测试功能:工具调用。',
- displayName: 'Claude 2.0',
- id: 'claude-2.0',
- maxOutput: 4096,
- releasedAt: '2023-07-11',
- },
  ],
  checkModel: 'claude-3-haiku-20240307',
  description:
@@ -9,6 +9,7 @@ const OllamaCloud: ModelProviderCard = {
  modelsUrl: 'https://ollama.com/library',
  name: 'Ollama Cloud',
  settings: {
+ disableBrowserRequest: true, // CORS error
  sdkType: 'openai',
  showModelFetcher: true,
  },
@@ -1,16 +1,7 @@
  import { ModelProviderCard } from '@/types/llm';
 
- // ref :https://open.bigmodel.cn/dev/howuse/model
- // api https://open.bigmodel.cn/dev/api#language
- // ref :https://open.bigmodel.cn/modelcenter/square
  const ZhiPu: ModelProviderCard = {
  chatModels: [
- {
- contextWindowTokens: 16_384,
- description: 'GLM-Zero-Preview具备强大的复杂推理能力,在逻辑推理、数学、编程等领域表现优异。',
- displayName: 'GLM-Zero-Preview',
- id: 'glm-zero-preview',
- },
  {
  contextWindowTokens: 128_000,
  description: 'GLM-4-Flash 是处理简单任务的理想选择,速度最快且免费。',
@@ -50,14 +41,6 @@ const ZhiPu: ModelProviderCard = {
  functionCall: true,
  id: 'glm-4-airx',
  },
- {
- contextWindowTokens: 128_000,
- description:
- 'GLM-4-AllTools 是一个多功能智能体模型,优化以支持复杂指令规划与工具调用,如网络浏览、代码解释和文本生成,适用于多任务执行。',
- displayName: 'GLM-4-AllTools',
- functionCall: true,
- id: 'glm-4-alltools',
- },
  {
  contextWindowTokens: 128_000,
  description:
@@ -115,9 +98,9 @@ const ZhiPu: ModelProviderCard = {
  },
  {
  contextWindowTokens: 4096,
- description: 'CharGLM-3 专为角色扮演与情感陪伴设计,支持超长多轮记忆与个性化对话,应用广泛。',
- displayName: 'CharGLM-3',
- id: 'charglm-3',
+ description: 'CharGLM-4 专为角色扮演与情感陪伴设计,支持超长多轮记忆与个性化对话,应用广泛。',
+ displayName: 'CharGLM-4',
+ id: 'charglm-4',
  },
  {
  contextWindowTokens: 8192,
@@ -126,7 +109,7 @@ const ZhiPu: ModelProviderCard = {
  id: 'emohaa',
  },
  ],
- checkModel: 'glm-4-flash-250414',
+ checkModel: 'glm-4.5-flash',
  description:
  '智谱 AI 提供多模态与语言模型的开放平台,支持广泛的AI应用场景,包括文本处理、图像理解与编程辅助等。',
  id: 'zhipu',
@@ -11,6 +11,9 @@ import { systemStatusSelectors } from '@/store/global/selectors';
  const useStyles = createStyles(({ css, token }) => ({
  container: css`
  align-self: center;
+
+ /* Leave some space for the minimap */
+ padding-inline: 12px;
  transition: width 0.25s ${token.motionEaseInOut};
  `,
  }));