@lobehub/chat 1.128.1 → 1.128.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (91)
  1. package/.cursor/rules/i18n.mdc +97 -95
  2. package/CHANGELOG.md +51 -0
  3. package/changelog/v1.json +18 -0
  4. package/locales/ar/models.json +6 -0
  5. package/locales/bg-BG/models.json +6 -0
  6. package/locales/de-DE/models.json +6 -0
  7. package/locales/en-US/models.json +6 -0
  8. package/locales/es-ES/models.json +6 -0
  9. package/locales/fa-IR/models.json +6 -0
  10. package/locales/fr-FR/models.json +6 -0
  11. package/locales/it-IT/models.json +6 -0
  12. package/locales/ja-JP/models.json +6 -0
  13. package/locales/ko-KR/models.json +6 -0
  14. package/locales/nl-NL/models.json +6 -0
  15. package/locales/pl-PL/models.json +6 -0
  16. package/locales/pt-BR/models.json +6 -0
  17. package/locales/ru-RU/models.json +6 -0
  18. package/locales/tr-TR/models.json +6 -0
  19. package/locales/vi-VN/models.json +6 -0
  20. package/locales/zh-CN/models.json +6 -0
  21. package/locales/zh-TW/models.json +6 -0
  22. package/package.json +2 -2
  23. package/packages/const/src/auth.ts +1 -1
  24. package/packages/database/package.json +4 -2
  25. package/packages/database/src/index.ts +1 -0
  26. package/packages/database/src/repositories/dataExporter/index.test.ts +3 -3
  27. package/packages/model-bank/src/aiModels/deepseek.ts +4 -4
  28. package/packages/model-bank/src/aiModels/google.ts +30 -6
  29. package/packages/model-bank/src/aiModels/groq.ts +1 -19
  30. package/packages/model-bank/src/aiModels/modelscope.ts +24 -18
  31. package/packages/model-bank/src/aiModels/novita.ts +71 -5
  32. package/packages/model-bank/src/aiModels/qwen.ts +87 -2
  33. package/packages/model-bank/src/aiModels/siliconcloud.ts +65 -2
  34. package/packages/model-bank/src/aiModels/volcengine.ts +4 -3
  35. package/packages/model-runtime/src/utils/modelParse.ts +4 -4
  36. package/src/app/(backend)/_deprecated/createBizOpenAI/createAzureOpenai.ts +1 -1
  37. package/src/app/(backend)/_deprecated/createBizOpenAI/createOpenai.ts +1 -1
  38. package/src/app/(backend)/api/webhooks/casdoor/route.ts +1 -1
  39. package/src/app/(backend)/api/webhooks/casdoor/validateRequest.ts +1 -1
  40. package/src/app/(backend)/api/webhooks/clerk/route.ts +1 -1
  41. package/src/app/(backend)/api/webhooks/logto/route.ts +1 -1
  42. package/src/app/(backend)/api/webhooks/logto/validateRequest.ts +1 -1
  43. package/src/{config → envs}/__tests__/analytics.test.ts +1 -1
  44. package/src/{config → envs}/__tests__/app.test.ts +1 -1
  45. package/src/{config → envs}/__tests__/client.test.ts +1 -1
  46. package/src/layout/AuthProvider/index.tsx +1 -1
  47. package/src/libs/next-auth/auth.config.ts +1 -1
  48. package/src/libs/next-auth/sso-providers/auth0.ts +1 -1
  49. package/src/libs/next-auth/sso-providers/authelia.ts +1 -1
  50. package/src/libs/next-auth/sso-providers/authentik.ts +1 -1
  51. package/src/libs/next-auth/sso-providers/azure-ad.ts +1 -1
  52. package/src/libs/next-auth/sso-providers/cloudflare-zero-trust.ts +1 -1
  53. package/src/libs/next-auth/sso-providers/generic-oidc.ts +1 -1
  54. package/src/libs/next-auth/sso-providers/github.ts +1 -1
  55. package/src/libs/next-auth/sso-providers/logto.ts +1 -1
  56. package/src/libs/next-auth/sso-providers/microsoft-entra-id-helper.ts +1 -1
  57. package/src/libs/next-auth/sso-providers/zitadel.ts +1 -1
  58. package/src/libs/oidc-provider/adapter.ts +4 -5
  59. package/src/libs/oidc-provider/provider.ts +1 -1
  60. package/src/libs/trpc/async/asyncAuth.ts +1 -1
  61. package/src/libs/trpc/async/context.ts +1 -1
  62. package/src/middleware.ts +1 -1
  63. package/src/server/globalConfig/_deprecated.test.ts +1 -1
  64. package/src/server/globalConfig/_deprecated.ts +1 -1
  65. package/src/server/globalConfig/genServerAiProviderConfig.test.ts +2 -2
  66. package/src/server/globalConfig/genServerAiProviderConfig.ts +1 -1
  67. package/src/server/globalConfig/index.ts +2 -2
  68. package/src/server/modules/ModelRuntime/apiKeyManager.ts +1 -1
  69. package/src/server/modules/ModelRuntime/index.test.ts +1 -1
  70. package/src/server/modules/ModelRuntime/index.ts +1 -1
  71. package/src/server/modules/S3/index.ts +1 -1
  72. package/src/server/routers/async/file.ts +1 -1
  73. package/src/server/services/agent/index.ts +2 -1
  74. package/src/server/services/aiChat/index.test.ts +1 -1
  75. package/src/server/services/aiChat/index.ts +2 -1
  76. package/src/server/services/chunk/index.ts +1 -1
  77. package/src/server/services/document/index.ts +1 -1
  78. package/src/server/services/file/impls/s3.test.ts +13 -13
  79. package/src/server/services/file/impls/s3.ts +1 -1
  80. package/src/server/services/file/index.ts +1 -1
  81. package/src/server/services/generation/index.ts +1 -1
  82. package/src/server/services/nextAuthUser/index.ts +1 -1
  83. package/src/server/services/user/index.test.ts +1 -1
  84. package/src/server/services/user/index.ts +1 -1
  85. package/src/services/__tests__/upload.test.ts +1 -1
  86. package/src/services/file/_deprecated.test.ts +1 -1
  87. package/src/services/upload.ts +1 -1
  88. /package/src/{config → envs}/__tests__/auth.test.ts +0 -0
  89. /package/src/{config → envs}/auth.ts +0 -0
  90. /package/src/{config → envs}/file.ts +0 -0
  91. /package/src/{config → envs}/llm.ts +0 -0
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@lobehub/chat",
3
- "version": "1.128.1",
3
+ "version": "1.128.3",
4
4
  "description": "Lobe Chat - an open-source, high-performance chatbot framework that supports speech synthesis, multimodal, and extensible Function Call plugin system. Supports one-click free deployment of your private ChatGPT/LLM web application.",
5
5
  "keywords": [
6
6
  "framework",
@@ -157,7 +157,7 @@
157
157
  "@lobehub/charts": "^2.1.2",
158
158
  "@lobehub/chat-plugin-sdk": "^1.32.4",
159
159
  "@lobehub/chat-plugins-gateway": "^1.9.0",
160
- "@lobehub/editor": "^1.8.0",
160
+ "@lobehub/editor": "^1.8.5",
161
161
  "@lobehub/icons": "^2.32.2",
162
162
  "@lobehub/market-sdk": "^0.22.7",
163
163
  "@lobehub/tts": "^2.0.1",
@@ -1,4 +1,4 @@
1
- import { authEnv } from '@/config/auth';
1
+ import { authEnv } from '@/envs/auth';
2
2
 
3
3
  export const enableClerk = authEnv.NEXT_PUBLIC_ENABLE_CLERK_AUTH;
4
4
  export const enableNextAuth = authEnv.NEXT_PUBLIC_ENABLE_NEXT_AUTH;
@@ -2,8 +2,10 @@
2
2
  "name": "@lobechat/database",
3
3
  "version": "1.0.0",
4
4
  "private": true,
5
- "main": "src/index.ts",
6
- "types": "src/index.ts",
5
+ "exports": {
6
+ ".": "./src/index.ts",
7
+ "./schemas": "./src/schemas/index.ts"
8
+ },
7
9
  "scripts": {
8
10
  "test": "npm run test:client-db && npm run test:server-db",
9
11
  "test:client-db": "vitest run",
@@ -0,0 +1 @@
1
+ export * from './type';
@@ -1,6 +1,7 @@
1
1
  import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
2
2
 
3
3
  import { clientDB, initializeDB } from '@/database/client/db';
4
+
4
5
  import {
5
6
  agents,
6
7
  agentsKnowledgeBases,
@@ -16,9 +17,8 @@ import {
16
17
  topics,
17
18
  userSettings,
18
19
  users,
19
- } from '@/database/schemas';
20
- import { LobeChatDatabase } from '@/database/type';
21
-
20
+ } from '../../schemas';
21
+ import { LobeChatDatabase } from '../../type';
22
22
  import { DATA_EXPORT_CONFIG, DataExporterRepos } from './index';
23
23
 
24
24
  let db = clientDB as LobeChatDatabase;
@@ -17,8 +17,8 @@ const deepseekChatModels: AIChatModelCard[] = [
17
17
  currency: 'CNY',
18
18
  units: [
19
19
  { name: 'textInput_cacheRead', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
20
- { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
21
- { name: 'textOutput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
20
+ { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
21
+ { name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' },
22
22
  ],
23
23
  },
24
24
  releasedAt: '2025-08-21',
@@ -39,9 +39,9 @@ const deepseekChatModels: AIChatModelCard[] = [
39
39
  pricing: {
40
40
  currency: 'CNY',
41
41
  units: [
42
- { name: 'textInput_cacheRead', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
42
+ { name: 'textInput_cacheRead', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
43
43
  { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
44
- { name: 'textOutput', rate: 16, strategy: 'fixed', unit: 'millionTokens' },
44
+ { name: 'textOutput', rate: 12, strategy: 'fixed', unit: 'millionTokens' },
45
45
  ],
46
46
  },
47
47
  releasedAt: '2025-08-21',
@@ -18,7 +18,15 @@ const googleChatModels: AIChatModelCard[] = [
18
18
  maxOutput: 65_536,
19
19
  pricing: {
20
20
  units: [
21
- { name: 'textInput_cacheRead', rate: 0.31, strategy: 'fixed', unit: 'millionTokens' },
21
+ {
22
+ name: 'textInput_cacheRead',
23
+ strategy: 'tiered',
24
+ tiers: [
25
+ { rate: 0.31, upTo: 200_000 },
26
+ { rate: 0.625, upTo: 'infinity' },
27
+ ],
28
+ unit: 'millionTokens',
29
+ },
22
30
  {
23
31
  name: 'textInput',
24
32
  strategy: 'tiered',
@@ -57,12 +65,20 @@ const googleChatModels: AIChatModelCard[] = [
57
65
  contextWindowTokens: 1_048_576 + 65_536,
58
66
  description:
59
67
  'Gemini 2.5 Pro Preview 是 Google 最先进的思维模型,能够对代码、数学和STEM领域的复杂问题进行推理,以及使用长上下文分析大型数据集、代码库和文档。',
60
- displayName: 'Gemini 2.5 Pro Preview 06-05 (Paid)',
68
+ displayName: 'Gemini 2.5 Pro Preview 06-05',
61
69
  id: 'gemini-2.5-pro-preview-06-05',
62
70
  maxOutput: 65_536,
63
71
  pricing: {
64
72
  units: [
65
- { name: 'textInput_cacheRead', rate: 0.31, strategy: 'fixed', unit: 'millionTokens' },
73
+ {
74
+ name: 'textInput_cacheRead',
75
+ strategy: 'tiered',
76
+ tiers: [
77
+ { rate: 0.31, upTo: 200_000 },
78
+ { rate: 0.625, upTo: 'infinity' },
79
+ ],
80
+ unit: 'millionTokens',
81
+ },
66
82
  {
67
83
  name: 'textInput',
68
84
  strategy: 'tiered',
@@ -101,12 +117,20 @@ const googleChatModels: AIChatModelCard[] = [
101
117
  contextWindowTokens: 1_048_576 + 65_536,
102
118
  description:
103
119
  'Gemini 2.5 Pro Preview 是 Google 最先进的思维模型,能够对代码、数学和STEM领域的复杂问题进行推理,以及使用长上下文分析大型数据集、代码库和文档。',
104
- displayName: 'Gemini 2.5 Pro Preview 05-06 (Paid)',
120
+ displayName: 'Gemini 2.5 Pro Preview 05-06',
105
121
  id: 'gemini-2.5-pro-preview-05-06',
106
122
  maxOutput: 65_536,
107
123
  pricing: {
108
124
  units: [
109
- { name: 'textInput_cacheRead', rate: 0.31, strategy: 'fixed', unit: 'millionTokens' },
125
+ {
126
+ name: 'textInput_cacheRead',
127
+ strategy: 'tiered',
128
+ tiers: [
129
+ { rate: 0.31, upTo: 200_000 },
130
+ { rate: 0.625, upTo: 'infinity' },
131
+ ],
132
+ unit: 'millionTokens',
133
+ },
110
134
  {
111
135
  name: 'textInput',
112
136
  strategy: 'tiered',
@@ -479,7 +503,7 @@ const googleChatModels: AIChatModelCard[] = [
479
503
  contextWindowTokens: 2_008_192,
480
504
  description:
481
505
  'Gemini 1.5 Pro 002 是最新的生产就绪模型,提供更高质量的输出,特别在数学、长上下文和视觉任务方面有显著提升。',
482
- displayName: 'Gemini 1.5 Pro 002 (Paid)',
506
+ displayName: 'Gemini 1.5 Pro 002',
483
507
  id: 'gemini-1.5-pro-002', // Deprecated on 2025-09-24
484
508
  maxOutput: 8192,
485
509
  pricing: {
@@ -73,24 +73,6 @@ const groqChatModels: AIChatModelCard[] = [
73
73
  displayName: 'Kimi K2 0905',
74
74
  enabled: true,
75
75
  id: 'moonshotai/kimi-k2-instruct-0905',
76
- pricing: {
77
- units: [
78
- { name: 'textInput', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
79
- { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
80
- ],
81
- },
82
- releasedAt: '2025-09-05',
83
- type: 'chat',
84
- },
85
- {
86
- abilities: {
87
- functionCall: true,
88
- },
89
- contextWindowTokens: 131_072,
90
- description:
91
- 'kimi-k2 是一款具备超强代码和 Agent 能力的 MoE 架构基础模型,总参数 1T,激活参数 32B。在通用知识推理、编程、数学、Agent 等主要类别的基准性能测试中,K2 模型的性能超过其他主流开源模型。',
92
- displayName: 'Kimi K2 0711',
93
- id: 'moonshotai/kimi-k2-instruct',
94
76
  maxOutput: 16_384,
95
77
  pricing: {
96
78
  units: [
@@ -98,7 +80,7 @@ const groqChatModels: AIChatModelCard[] = [
98
80
  { name: 'textOutput', rate: 3, strategy: 'fixed', unit: 'millionTokens' },
99
81
  ],
100
82
  },
101
- releasedAt: '2025-07-11',
83
+ releasedAt: '2025-09-05',
102
84
  type: 'chat',
103
85
  },
104
86
  {
@@ -4,14 +4,20 @@ const modelscopeChatModels: AIChatModelCard[] = [
4
4
  {
5
5
  abilities: {
6
6
  functionCall: true,
7
+ reasoning: true,
7
8
  },
8
- contextWindowTokens: 262_144,
9
- description:
10
- 'kimi-k2-0905-preview 模型上下文长度为 256k,具备更强的 Agentic Coding 能力、更突出的前端代码的美观度和实用性、以及更好的上下文理解能力。',
11
- displayName: 'Kimi K2 0905',
12
- enabled: true,
13
- id: 'moonshotai/Kimi-K2-Instruct-0905',
14
- releasedAt: '2025-09-05',
9
+ contextWindowTokens: 131_072,
10
+ displayName: 'Qwen3 Next 80B A3B Thinking',
11
+ id: 'Qwen/Qwen3-Next-80B-A3B-Thinking',
12
+ type: 'chat',
13
+ },
14
+ {
15
+ abilities: {
16
+ functionCall: true,
17
+ },
18
+ contextWindowTokens: 131_072,
19
+ displayName: 'Qwen3 Next 80B A3B Instruct',
20
+ id: 'Qwen/Qwen3-Next-80B-A3B-Instruct',
15
21
  type: 'chat',
16
22
  },
17
23
  {
@@ -20,8 +26,8 @@ const modelscopeChatModels: AIChatModelCard[] = [
20
26
  reasoning: true,
21
27
  },
22
28
  contextWindowTokens: 131_072,
23
- description: 'DeepSeek-V3.1 模型为混合推理架构模型,同时支持思考模式与非思考模式。',
24
- displayName: 'DeepSeek-V3.1',
29
+ description: 'DeepSeek V3.1 模型为混合推理架构模型,同时支持思考模式与非思考模式。',
30
+ displayName: 'DeepSeek V3.1',
25
31
  enabled: true,
26
32
  id: 'deepseek-ai/DeepSeek-V3.1',
27
33
  type: 'chat',
@@ -34,7 +40,7 @@ const modelscopeChatModels: AIChatModelCard[] = [
34
40
  contextWindowTokens: 131_072,
35
41
  description:
36
42
  'DeepSeek R1 通过利用增加的计算资源和在后训练过程中引入算法优化机制,显著提高了其推理和推断能力的深度。该模型在各种基准评估中表现出色,包括数学、编程和一般逻辑方面。其整体性能现已接近领先模型,如 O3 和 Gemini 2.5 Pro。',
37
- displayName: 'DeepSeek-R1-0528',
43
+ displayName: 'DeepSeek R1 0528',
38
44
  id: 'deepseek-ai/DeepSeek-R1-0528',
39
45
  type: 'chat',
40
46
  },
@@ -44,8 +50,8 @@ const modelscopeChatModels: AIChatModelCard[] = [
44
50
  reasoning: true,
45
51
  },
46
52
  contextWindowTokens: 131_072,
47
- description: 'DeepSeek-R1是DeepSeek最新的推理模型,专注于复杂推理任务。',
48
- displayName: 'DeepSeek-R1',
53
+ description: 'DeepSeek R1是DeepSeek最新的推理模型,专注于复杂推理任务。',
54
+ displayName: 'DeepSeek R1',
49
55
  id: 'deepseek-ai/DeepSeek-R1',
50
56
  type: 'chat',
51
57
  },
@@ -54,8 +60,8 @@ const modelscopeChatModels: AIChatModelCard[] = [
54
60
  functionCall: true,
55
61
  },
56
62
  contextWindowTokens: 131_072,
57
- description: 'DeepSeek-V3是DeepSeek第三代模型的最新版本,具有强大的推理和对话能力。',
58
- displayName: 'DeepSeek-V3',
63
+ description: 'DeepSeek V3是DeepSeek第三代模型的最新版本,具有强大的推理和对话能力。',
64
+ displayName: 'DeepSeek V3',
59
65
  id: 'deepseek-ai/DeepSeek-V3',
60
66
  type: 'chat',
61
67
  },
@@ -64,8 +70,8 @@ const modelscopeChatModels: AIChatModelCard[] = [
64
70
  functionCall: true,
65
71
  },
66
72
  contextWindowTokens: 131_072,
67
- description: 'Qwen3-235B-A22B是通义千问3代超大规模模型,提供顶级的AI能力。',
68
- displayName: 'Qwen3-235B-A22B',
73
+ description: 'Qwen3 235B A22B是通义千问3代超大规模模型,提供顶级的AI能力。',
74
+ displayName: 'Qwen3 235B A22B',
69
75
  id: 'Qwen/Qwen3-235B-A22B',
70
76
  type: 'chat',
71
77
  },
@@ -74,8 +80,8 @@ const modelscopeChatModels: AIChatModelCard[] = [
74
80
  functionCall: true,
75
81
  },
76
82
  contextWindowTokens: 131_072,
77
- description: 'Qwen3-32B是通义千问3代模型,具有强大的推理和对话能力。',
78
- displayName: 'Qwen3-32B',
83
+ description: 'Qwen3 32B是通义千问3代模型,具有强大的推理和对话能力。',
84
+ displayName: 'Qwen3 32B',
79
85
  id: 'Qwen/Qwen3-32B',
80
86
  type: 'chat',
81
87
  },
@@ -2,6 +2,52 @@ import { AIChatModelCard } from '../types/aiModel';
2
2
 
3
3
  // https://novita.ai/pricing
4
4
  const novitaChatModels: AIChatModelCard[] = [
5
+ {
6
+ abilities: {
7
+ functionCall: true,
8
+ reasoning: true,
9
+ },
10
+ contextWindowTokens: 65_536,
11
+ displayName: 'Qwen3 Next 80B A3B Thinking',
12
+ id: 'qwen/qwen3-next-80b-a3b-thinking',
13
+ maxOutput: 65_536,
14
+ pricing: {
15
+ units: [
16
+ { name: 'textInput', rate: 0.15, strategy: 'fixed', unit: 'millionTokens' },
17
+ { name: 'textOutput', rate: 1.5, strategy: 'fixed', unit: 'millionTokens' },
18
+ ],
19
+ },
20
+ type: 'chat',
21
+ },
22
+ {
23
+ abilities: {
24
+ functionCall: true,
25
+ },
26
+ contextWindowTokens: 65_536,
27
+ displayName: 'Qwen3 Next 80B A3B Instruct',
28
+ id: 'qwen/qwen3-next-80b-a3b-instruct',
29
+ maxOutput: 65_536,
30
+ pricing: {
31
+ units: [
32
+ { name: 'textInput', rate: 0.15, strategy: 'fixed', unit: 'millionTokens' },
33
+ { name: 'textOutput', rate: 1.5, strategy: 'fixed', unit: 'millionTokens' },
34
+ ],
35
+ },
36
+ type: 'chat',
37
+ },
38
+ {
39
+ contextWindowTokens: 4096,
40
+ displayName: 'Qwen MT Plus',
41
+ id: 'qwen/qwen-mt-plus',
42
+ maxOutput: 2048,
43
+ pricing: {
44
+ units: [
45
+ { name: 'textInput', rate: 0.25, strategy: 'fixed', unit: 'millionTokens' },
46
+ { name: 'textOutput', rate: 0.75, strategy: 'fixed', unit: 'millionTokens' },
47
+ ],
48
+ },
49
+ type: 'chat',
50
+ },
5
51
  {
6
52
  abilities: {
7
53
  functionCall: true,
@@ -41,13 +87,13 @@ const novitaChatModels: AIChatModelCard[] = [
41
87
  abilities: {
42
88
  functionCall: true,
43
89
  },
44
- contextWindowTokens: 262_144,
90
+ contextWindowTokens: 65_536,
45
91
  displayName: 'Qwen3 Coder 480B A35B Instruct',
46
92
  id: 'qwen/qwen3-coder-480b-a35b-instruct',
47
93
  pricing: {
48
94
  units: [
49
- { name: 'textInput', rate: 0.35, strategy: 'fixed', unit: 'millionTokens' },
50
- { name: 'textOutput', rate: 1.5, strategy: 'fixed', unit: 'millionTokens' },
95
+ { name: 'textInput', rate: 0.29, strategy: 'fixed', unit: 'millionTokens' },
96
+ { name: 'textOutput', rate: 1.2, strategy: 'fixed', unit: 'millionTokens' },
51
97
  ],
52
98
  },
53
99
  type: 'chat',
@@ -83,6 +129,24 @@ const novitaChatModels: AIChatModelCard[] = [
83
129
  },
84
130
  type: 'chat',
85
131
  },
132
+ {
133
+ abilities: {
134
+ functionCall: true,
135
+ reasoning: true,
136
+ vision: true,
137
+ },
138
+ contextWindowTokens: 65_536,
139
+ displayName: 'GLM-4.5V',
140
+ id: 'zai-org/glm-4.5v',
141
+ maxOutput: 16_384,
142
+ pricing: {
143
+ units: [
144
+ { name: 'textInput', rate: 0.6, strategy: 'fixed', unit: 'millionTokens' },
145
+ { name: 'textOutput', rate: 1.8, strategy: 'fixed', unit: 'millionTokens' },
146
+ ],
147
+ },
148
+ type: 'chat',
149
+ },
86
150
  {
87
151
  abilities: {
88
152
  functionCall: true,
@@ -91,6 +155,7 @@ const novitaChatModels: AIChatModelCard[] = [
91
155
  contextWindowTokens: 131_072,
92
156
  displayName: 'GLM-4.5',
93
157
  id: 'zai-org/glm-4.5',
158
+ maxOutput: 98_304,
94
159
  pricing: {
95
160
  units: [
96
161
  { name: 'textInput', rate: 0.6, strategy: 'fixed', unit: 'millionTokens' },
@@ -103,9 +168,10 @@ const novitaChatModels: AIChatModelCard[] = [
103
168
  abilities: {
104
169
  functionCall: true,
105
170
  },
106
- contextWindowTokens: 262_144,
171
+ contextWindowTokens: 131_072,
107
172
  displayName: 'Qwen3 235B A22B Instruct 2507',
108
173
  id: 'qwen/qwen3-235b-a22b-instruct-2507',
174
+ maxOutput: 16_384,
109
175
  pricing: {
110
176
  units: [
111
177
  { name: 'textInput', rate: 0.15, strategy: 'fixed', unit: 'millionTokens' },
@@ -717,6 +783,7 @@ const novitaChatModels: AIChatModelCard[] = [
717
783
  contextWindowTokens: 32_000,
718
784
  displayName: 'Qwen2.5 72B Instruct',
719
785
  id: 'qwen/qwen-2.5-72b-instruct',
786
+ maxOutput: 8192,
720
787
  pricing: {
721
788
  units: [
722
789
  { name: 'textInput', rate: 0.38, strategy: 'fixed', unit: 'millionTokens' },
@@ -770,7 +837,6 @@ const novitaChatModels: AIChatModelCard[] = [
770
837
  },
771
838
  contextWindowTokens: 32_768,
772
839
  displayName: 'Qwen2.5 VL 72B Instruct',
773
- enabled: true,
774
840
  id: 'qwen/qwen2.5-vl-72b-instruct',
775
841
  pricing: {
776
842
  units: [
@@ -48,6 +48,92 @@ const qwenChatModels: AIChatModelCard[] = [
48
48
  },
49
49
  type: 'chat',
50
50
  },
51
+ {
52
+ abilities: {
53
+ reasoning: true,
54
+ },
55
+ contextWindowTokens: 131_072,
56
+ description: 'GLM-4.5系列模型是智谱AI专为智能体设计的混合推理模型,提供思考与非思考两种模式。',
57
+ displayName: 'GLM-4.5',
58
+ id: 'glm-4.5',
59
+ maxOutput: 16_384,
60
+ pricing: {
61
+ currency: 'CNY',
62
+ units: [
63
+ {
64
+ lookup: {
65
+ prices: {
66
+ '[0, 32_000]': 3,
67
+ '[32_000, infinity]': 4,
68
+ },
69
+ pricingParams: ['textInputRange'],
70
+ },
71
+ name: 'textInput',
72
+ strategy: 'lookup',
73
+ unit: 'millionTokens',
74
+ },
75
+ {
76
+ lookup: {
77
+ prices: {
78
+ '[0, 32_000]': 14,
79
+ '[32_000, infinity]': 16,
80
+ },
81
+ pricingParams: ['textInputRange'],
82
+ },
83
+ name: 'textOutput',
84
+ strategy: 'lookup',
85
+ unit: 'millionTokens',
86
+ },
87
+ ],
88
+ },
89
+ settings: {
90
+ extendParams: ['enableReasoning', 'reasoningBudgetToken'],
91
+ },
92
+ type: 'chat',
93
+ },
94
+ {
95
+ abilities: {
96
+ reasoning: true,
97
+ },
98
+ contextWindowTokens: 131_072,
99
+ description: 'GLM-4.5系列模型是智谱AI专为智能体设计的混合推理模型,提供思考与非思考两种模式。',
100
+ displayName: 'GLM-4.5-Air',
101
+ id: 'glm-4.5-air',
102
+ maxOutput: 16_384,
103
+ pricing: {
104
+ currency: 'CNY',
105
+ units: [
106
+ {
107
+ lookup: {
108
+ prices: {
109
+ '[0, 32_000]': 0.8,
110
+ '[32_000, infinity]': 1.2,
111
+ },
112
+ pricingParams: ['textInputRange'],
113
+ },
114
+ name: 'textInput',
115
+ strategy: 'lookup',
116
+ unit: 'millionTokens',
117
+ },
118
+ {
119
+ lookup: {
120
+ prices: {
121
+ '[0, 32_000]': 6,
122
+ '[32_000, infinity]': 8,
123
+ },
124
+ pricingParams: ['textInputRange'],
125
+ },
126
+ name: 'textOutput',
127
+ strategy: 'lookup',
128
+ unit: 'millionTokens',
129
+ },
130
+ ],
131
+ },
132
+ settings: {
133
+ extendParams: ['enableReasoning', 'reasoningBudgetToken'],
134
+ },
135
+ type: 'chat',
136
+ },
51
137
  {
52
138
  abilities: {
53
139
  functionCall: true,
@@ -583,7 +669,7 @@ const qwenChatModels: AIChatModelCard[] = [
583
669
  search: true,
584
670
  },
585
671
  config: {
586
- deploymentName: 'qwen-plus-2025-07-28',
672
+ deploymentName: 'qwen-plus-2025-09-11',
587
673
  },
588
674
  contextWindowTokens: 1_000_000,
589
675
  description: '通义千问超大规模语言模型增强版,支持中文、英文等不同语言输入。',
@@ -627,7 +713,6 @@ const qwenChatModels: AIChatModelCard[] = [
627
713
  '[0, 128_000]_[false]': 2,
628
714
  '[0, 128_000]_[true]': 8,
629
715
  '[128_000, 256_000]_[false]': 20,
630
-
631
716
  '[128_000, 256_000]_[true]': 24,
632
717
  '[256_000, infinity]_[false]': 48,
633
718
  '[256_000, infinity]_[true]': 64,
@@ -47,6 +47,25 @@ const siliconcloudChatModels: AIChatModelCard[] = [
47
47
  },
48
48
  type: 'chat',
49
49
  },
50
+ {
51
+ abilities: {
52
+ functionCall: true,
53
+ },
54
+ contextWindowTokens: 131_072,
55
+ description:
56
+ 'Ling-mini-2.0 是一款基于 MoE 架构的小尺寸高性能大语言模型。它拥有 16B 总参数,但每个 token 仅激活 1.4B(non-embedding 789M),从而实现了极高的生成速度。得益于高效的 MoE 设计与大规模高质量训练数据,尽管激活参数仅为 1.4B,Ling-mini-2.0 依然在下游任务中展现出可媲美 10B 以下 dense LLM 及更大规模 MoE 模型的顶尖性能',
57
+ displayName: 'Ling Mini 2.0',
58
+ id: 'inclusionAI/Ling-mini-2.0',
59
+ pricing: {
60
+ currency: 'CNY',
61
+ units: [
62
+ { name: 'textInput', rate: 0.5, strategy: 'fixed', unit: 'millionTokens' },
63
+ { name: 'textOutput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
64
+ ],
65
+ },
66
+ releasedAt: '2025-09-09',
67
+ type: 'chat',
68
+ },
50
69
  {
51
70
  abilities: {
52
71
  functionCall: true,
@@ -223,10 +242,51 @@ const siliconcloudChatModels: AIChatModelCard[] = [
223
242
  type: 'chat',
224
243
  },
225
244
  {
245
+ abilities: {
246
+ functionCall: true,
247
+ },
248
+ contextWindowTokens: 262_144,
249
+ description:
250
+ 'Kimi K2-Instruct-0905 是 Kimi K2 最新、最强大的版本。它是一款顶尖的混合专家(MoE)语言模型,拥有 1 万亿的总参数和 320 亿的激活参数。该模型的主要特性包括:增强的智能体编码智能,在公开基准测试和真实世界的编码智能体任务中表现出显著的性能提升;改进的前端编码体验,在前端编程的美观性和实用性方面均有进步。',
251
+ displayName: 'Kimi K2 0905',
252
+ id: 'moonshotai/Kimi-K2-Instruct-0905',
253
+ pricing: {
254
+ currency: 'CNY',
255
+ units: [
256
+ { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
257
+ { name: 'textOutput', rate: 16, strategy: 'fixed', unit: 'millionTokens' },
258
+ ],
259
+ },
260
+ releasedAt: '2025-09-05',
261
+ type: 'chat',
262
+ },
263
+ {
264
+ abilities: {
265
+ functionCall: true,
266
+ },
267
+ contextWindowTokens: 262_144,
268
+ description:
269
+ 'Kimi K2-Instruct-0905 是 Kimi K2 最新、最强大的版本。它是一款顶尖的混合专家(MoE)语言模型,拥有 1 万亿的总参数和 320 亿的激活参数。该模型的主要特性包括:增强的智能体编码智能,在公开基准测试和真实世界的编码智能体任务中表现出显著的性能提升;改进的前端编码体验,在前端编程的美观性和实用性方面均有进步。',
270
+ displayName: 'Kimi K2 0905 (Pro)',
271
+ id: 'Pro/moonshotai/Kimi-K2-Instruct-0905',
272
+ pricing: {
273
+ currency: 'CNY',
274
+ units: [
275
+ { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
276
+ { name: 'textOutput', rate: 16, strategy: 'fixed', unit: 'millionTokens' },
277
+ ],
278
+ },
279
+ releasedAt: '2025-09-05',
280
+ type: 'chat',
281
+ },
282
+ {
283
+ abilities: {
284
+ functionCall: true,
285
+ },
226
286
  contextWindowTokens: 131_072,
227
287
  description:
228
288
  'Kimi K2 是一款具备超强代码和 Agent 能力的 MoE 架构基础模型,总参数 1T,激活参数 32B。在通用知识推理、编程、数学、Agent 等主要类别的基准性能测试中,K2 模型的性能超过其他主流开源模型。',
229
- displayName: 'Kimi K2 Instruct',
289
+ displayName: 'Kimi K2 0711',
230
290
  id: 'moonshotai/Kimi-K2-Instruct',
231
291
  pricing: {
232
292
  currency: 'CNY',
@@ -239,10 +299,13 @@ const siliconcloudChatModels: AIChatModelCard[] = [
239
299
  type: 'chat',
240
300
  },
241
301
  {
302
+ abilities: {
303
+ functionCall: true,
304
+ },
242
305
  contextWindowTokens: 131_072,
243
306
  description:
244
307
  'Kimi K2 是一款具备超强代码和 Agent 能力的 MoE 架构基础模型,总参数 1T,激活参数 32B。在通用知识推理、编程、数学、Agent 等主要类别的基准性能测试中,K2 模型的性能超过其他主流开源模型。',
245
- displayName: 'Kimi K2 Instruct (Pro)',
308
+ displayName: 'Kimi K2 0711 (Pro)',
246
309
  id: 'Pro/moonshotai/Kimi-K2-Instruct',
247
310
  pricing: {
248
311
  currency: 'CNY',
@@ -35,17 +35,18 @@ const doubaoChatModels: AIChatModelCard[] = [
35
35
  functionCall: true,
36
36
  },
37
37
  config: {
38
- deploymentName: 'kimi-k2-250711',
38
+ deploymentName: 'kimi-k2-250905',
39
39
  },
40
- contextWindowTokens: 256_000,
40
+ contextWindowTokens: 131_072,
41
41
  description:
42
42
  'Kimi-K2 是一款Moonshot AI推出的具备超强代码和 Agent 能力的 MoE 架构基础模型,总参数 1T,激活参数 32B。在通用知识推理、编程、数学、Agent 等主要类别的基准性能测试中,K2 模型的性能超过其他主流开源模型。',
43
43
  displayName: 'Kimi K2',
44
44
  id: 'kimi-k2',
45
- maxOutput: 16_384,
45
+ maxOutput: 32_768,
46
46
  pricing: {
47
47
  currency: 'CNY',
48
48
  units: [
49
+ { name: 'textInput_cacheRead', rate: 0.8, strategy: 'fixed', unit: 'millionTokens' },
49
50
  { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
50
51
  { name: 'textOutput', rate: 16, strategy: 'fixed', unit: 'millionTokens' },
51
52
  ],
@@ -53,7 +53,7 @@ export const MODEL_LIST_CONFIGS = {
53
53
  'qwen2.5',
54
54
  'qwen3',
55
55
  ],
56
- reasoningKeywords: ['qvq', 'qwq', 'qwen3', '!-instruct-', '!-coder-'],
56
+ reasoningKeywords: ['qvq', 'qwq', 'qwen3', '!-instruct-', '!-coder-', '!-max-'],
57
57
  visionKeywords: ['qvq', 'vl'],
58
58
  },
59
59
  v0: {
@@ -303,9 +303,9 @@ const processModelCard = (
303
303
  )
304
304
  ? 'image'
305
305
  : isKeywordListMatch(
306
- model.id.toLowerCase(),
307
- EMBEDDING_MODEL_KEYWORDS.map((k) => k.toLowerCase()),
308
- )
306
+ model.id.toLowerCase(),
307
+ EMBEDDING_MODEL_KEYWORDS.map((k) => k.toLowerCase()),
308
+ )
309
309
  ? 'embedding'
310
310
  : 'chat');
311
311
 
@@ -2,7 +2,7 @@ import { ChatErrorType } from '@lobechat/types';
2
2
  import OpenAI, { ClientOptions } from 'openai';
3
3
  import urlJoin from 'url-join';
4
4
 
5
- import { getLLMConfig } from '@/config/llm';
5
+ import { getLLMConfig } from '@/envs/llm';
6
6
 
7
7
  // create Azure OpenAI Instance
8
8
  export const createAzureOpenai = (params: {