npm - @lobehub/chat - Versions diffs - 1.80.0 → 1.80.2 - Mend

@lobehub/chat 1.80.0 → 1.80.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37)

package/CHANGELOG.md +58 -0
package/changelog/v1.json +21 -0
package/docs/development/basic/feature-development.mdx +370 -619
package/docs/development/basic/feature-development.zh-CN.mdx +368 -611
package/package.json +1 -1
package/src/app/[variants]/oauth/consent/[uid]/Client.tsx +36 -23
package/src/app/[variants]/oauth/consent/[uid]/page.tsx +2 -0
package/src/config/aiModels/azure.ts +79 -1
package/src/config/aiModels/azureai.ts +181 -0
package/src/config/aiModels/google.ts +36 -2
package/src/config/aiModels/groq.ts +31 -3
package/src/config/aiModels/hunyuan.ts +54 -18
package/src/config/aiModels/moonshot.ts +17 -17
package/src/config/aiModels/novita.ts +25 -30
package/src/config/aiModels/siliconcloud.ts +80 -2
package/src/config/aiModels/stepfun.ts +40 -31
package/src/config/aiModels/tencentcloud.ts +7 -6
package/src/config/aiModels/volcengine.ts +1 -0
package/src/config/aiModels/zhipu.ts +91 -27
package/src/const/settings/knowledge.ts +2 -2
package/src/features/ChatInput/ActionBar/Upload/ClientMode.tsx +7 -6
package/src/hooks/useModelSupportFiles.ts +15 -0
package/src/libs/agent-runtime/stepfun/index.ts +7 -1
package/src/libs/agent-runtime/zhipu/index.ts +17 -10
package/src/libs/oidc-provider/config.ts +0 -3
package/src/libs/trpc/edge/index.ts +0 -4
package/src/libs/trpc/lambda/context.ts +90 -6
package/src/libs/trpc/lambda/index.ts +2 -1
package/src/libs/trpc/lambda/middleware/oidcAuth.ts +14 -0
package/src/libs/trpc/middleware/userAuth.ts +2 -4
package/src/server/services/oidc/index.ts +71 -0
package/src/store/aiInfra/slices/aiModel/selectors.ts +7 -0
package/src/utils/parseModels.test.ts +19 -3
package/src/utils/server/__tests__/auth.test.ts +45 -1
package/src/utils/server/auth.ts +26 -2
package/docs/development/basic/feature-development-new.mdx +0 -465
package/docs/development/basic/feature-development-new.zh-CN.mdx +0 -465

package/src/config/aiModels/moonshot.ts CHANGED Viewed

@@ -1,5 +1,5 @@
 import { AIChatModelCard } from '@/types/aiModel';
+// https://platform.moonshot.cn/docs/pricing/chat
 const moonshotChatModels: AIChatModelCard[] = [
   {
     abilities: {
@@ -16,8 +16,8 @@ const moonshotChatModels: AIChatModelCard[] = [
     pricing: {
       cachedInput: 1,
       currency: 'CNY',
-      input: 60,
-      output: 60,
+      input: 10,
+      output: 30,
     },
     releasedAt: '2025-02-17',
     settings: {
@@ -37,8 +37,8 @@ const moonshotChatModels: AIChatModelCard[] = [
     id: 'moonshot-v1-auto',
     pricing: {
       currency: 'CNY',
-      input: 60,
-      output: 60,
+      input: 10,
+      output: 30,
     },
     settings: {
       searchImpl: 'params',
@@ -57,8 +57,8 @@ const moonshotChatModels: AIChatModelCard[] = [
     id: 'moonshot-v1-8k',
     pricing: {
       currency: 'CNY',
-      input: 12,
-      output: 12,
+      input: 2,
+      output: 10,
     },
     settings: {
       searchImpl: 'params',
@@ -77,8 +77,8 @@ const moonshotChatModels: AIChatModelCard[] = [
     id: 'moonshot-v1-32k',
     pricing: {
       currency: 'CNY',
-      input: 24,
-      output: 24,
+      input: 5,
+      output: 20,
     },
     settings: {
       searchImpl: 'params',
@@ -97,8 +97,8 @@ const moonshotChatModels: AIChatModelCard[] = [
     id: 'moonshot-v1-128k',
     pricing: {
       currency: 'CNY',
-      input: 60,
-      output: 60,
+      input: 10,
+      output: 30,
     },
     settings: {
       searchImpl: 'params',
@@ -118,8 +118,8 @@ const moonshotChatModels: AIChatModelCard[] = [
     id: 'moonshot-v1-8k-vision-preview',
     pricing: {
       currency: 'CNY',
-      input: 12,
-      output: 12,
+      input: 2,
+      output: 10,
     },
     releasedAt: '2025-01-14',
     settings: {
@@ -140,8 +140,8 @@ const moonshotChatModels: AIChatModelCard[] = [
     id: 'moonshot-v1-32k-vision-preview',
     pricing: {
       currency: 'CNY',
-      input: 24,
-      output: 24,
+      input: 5,
+      output: 20,
     },
     releasedAt: '2025-01-14',
     settings: {
@@ -162,8 +162,8 @@ const moonshotChatModels: AIChatModelCard[] = [
     id: 'moonshot-v1-128k-vision-preview',
     pricing: {
       currency: 'CNY',
-      input: 60,
-      output: 60,
+      input: 10,
+      output: 30,
     },
     releasedAt: '2025-01-14',
     settings: {

package/src/config/aiModels/novita.ts CHANGED Viewed

@@ -1,26 +1,36 @@
 import { AIChatModelCard } from '@/types/aiModel';
 // https://novita.ai/pricing
 const novitaChatModels: AIChatModelCard[] = [
   {
     contextWindowTokens: 131_072,
-    displayName: 'Llama 3.3 70B Instruct',
+    displayName: 'Llama 4 Scout 17B Instruct',
     enabled: true,
-    id: 'meta-llama/llama-3.3-70b-instruct',
+    id: 'meta-llama/llama-4-scout-17b-16e-instruct',
     pricing: {
-      input: 0.13,
-      output: 0.39,
+      input: 0.1,
+      output: 0.5,
+    },
+    type: 'chat',
+  },
+  {
+    contextWindowTokens: 1_048_576,
+    displayName: 'Llama 4 Maverick 17B Instruct',
+    enabled: true,
+    id: 'meta-llama/llama-4-maverick-17b-128e-instruct-fp8',
+    pricing: {
+      input: 0.2,
+      output: 0.85,
     },
     type: 'chat',
   },
   {
     contextWindowTokens: 16_384,
-    description: 'Llama 3.1 8B Instruct 是 Meta 推出的最新版本，优化了高质量对话场景，表现优于许多领先的闭源模型。',
+    description: 'Llama 3.1 8B Instruct  优化了高质量对话场景，表现优于许多领先的闭源模型。',
     displayName: 'Llama 3.1 8B Instruct',
     id: 'meta-llama/llama-3.1-8b-instruct',
     pricing: {
-      input: 0.05,
+      input: 0.02,
       output: 0.05,
     },
     type: 'chat',
@@ -73,7 +83,6 @@ const novitaChatModels: AIChatModelCard[] = [
     contextWindowTokens: 32_000,
     description: 'Gemma 3 27B 是谷歌的一款开源语言模型，以其在效率和性能方面设立了新的标准。',
     displayName: 'Gemma 3 27B',
-    enabled: true,
     id: 'google/gemma-3-27b-it',
     pricing: {
       input: 0.2,
@@ -190,7 +199,7 @@ const novitaChatModels: AIChatModelCard[] = [
     enabled: true,
     id: 'deepseek/deepseek-v3-0324',
     pricing: {
-      input: 0.4,
+      input: 0.37,
       output: 1.3,
     },
     type: 'chat',
@@ -318,18 +327,12 @@ const novitaChatModels: AIChatModelCard[] = [
     type: 'chat',
   },
   {
-    contextWindowTokens: 32_768,
-    displayName: 'Qwen 2 VL 72B Instruct',
-    id: 'qwen/qwen-2-vl-72b-instruct',
-    pricing: {
-      input: 0.45,
-      output: 0.45,
+    abilities: {
+      vision: true,
     },
-    type: 'chat',
-  },
-  {
     contextWindowTokens: 96_000,
     displayName: 'Qwen 2.5 VL 72B Instruct',
+    enabled: true,
     id: 'qwen/qwen2.5-vl-72b-instruct',
     pricing: {
       input: 0.8,
@@ -378,7 +381,7 @@ const novitaChatModels: AIChatModelCard[] = [
     type: 'chat',
   },
   {
-    contextWindowTokens: 16_000,
+    contextWindowTokens: 8192,
     displayName: 'L31 70B Euryale v2.2',
     id: 'sao10k/l31-70b-euryale-v2.2',
     pricing: {
@@ -387,22 +390,13 @@ const novitaChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
-  {
-    contextWindowTokens: 32_768,
-    displayName: 'Qwen 2 7B Instruct',
-    id: 'qwen/qwen-2-7b-instruct',
-    pricing: {
-      input: 0.054,
-      output: 0.054,
-    },
-    type: 'chat',
-  },
-  {
+    {
     abilities: {
       reasoning: true,
     },
     contextWindowTokens: 32_768,
     displayName: 'QwQ 32B',
+    enabled: true,
     id: 'qwen/qwq-32b',
     pricing: {
       input: 0.18,
@@ -410,6 +404,7 @@ const novitaChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
 ];
 export const allModels = [...novitaChatModels];

package/src/config/aiModels/siliconcloud.ts CHANGED Viewed

@@ -3,6 +3,85 @@ import { AIChatModelCard } from '@/types/aiModel';
 // https://siliconflow.cn/zh-cn/models
 const siliconcloudChatModels: AIChatModelCard[] = [
+  {
+    abilities: {
+      reasoning: true,
+    },
+    contextWindowTokens: 32_768,
+    description:
+      'GLM-Z1-Rumination-32B-0414 是一个具有沉思能力的深度推理模型（与 OpenAI 的 Deep Research 对标）。与典型的深度思考模型不同，沉思模型采用更长时间的深度思考来解决更开放和复杂的问题。',
+    displayName: 'GLM-Z1-Rumination 32B 0414',
+    enabled: true,
+    id: 'THUDM/GLM-Z1-Rumination-32B-0414',
+    pricing: {
+      currency: 'CNY',
+      input: 0.5,
+      output: 0.5,
+    },
+    type: 'chat',
+  },
+  {
+    abilities: {
+      reasoning: true,
+    },
+    contextWindowTokens: 32_768,
+    description:
+      'GLM-Z1-32B-0414 是一个具有深度思考能力的推理模型。该模型基于 GLM-4-32B-0414 通过冷启动和扩展强化学习开发，并在数学、代码和逻辑任务上进行了进一步训练。与基础模型相比，GLM-Z1-32B-0414 显著提升了数学能力和解决复杂任务的能力。',
+    displayName: 'GLM-Z1 32B 0414',
+    enabled: true,
+    id: 'THUDM/GLM-Z1-32B-0414',
+    pricing: {
+      currency: 'CNY',
+      input: 0.5,
+      output: 0.5,
+    },
+    type: 'chat',
+  },
+  {
+    abilities: {
+      reasoning: true,
+    },
+    contextWindowTokens: 32_768,
+    description:
+      'GLM-Z1-9B-0414 是 GLM 系列的小型模型，仅有 90 亿参数，但保持了开源传统的同时展现出惊人的能力。尽管规模较小，该模型在数学推理和通用任务上仍表现出色，其总体性能在同等规模的开源模型中已处于领先水平。',
+    displayName: 'GLM-Z1 9B 0414',
+    enabled: true,
+    id: 'THUDM/GLM-Z1-9B-0414',
+    pricing: {
+      currency: 'CNY',
+      input: 0,
+      output: 0,
+    },
+    type: 'chat',
+  },
+  {
+    contextWindowTokens: 32_768,
+    description:
+      'GLM-4-32B-0414 是 GLM 系列的新一代开源模型，拥有 320 亿参数。该模型性能可与 OpenAI 的 GPT 系列和 DeepSeek 的 V3/R1 系列相媲美。',
+    displayName: 'GLM-4 32B 0414',
+    enabled: true,
+    id: 'THUDM/GLM-4-32B-0414',
+    pricing: {
+      currency: 'CNY',
+      input: 0.5,
+      output: 0.5,
+    },
+    type: 'chat',
+  },
+  {
+    contextWindowTokens: 32_768,
+    description:
+      'GLM-4-9B-0414 是 GLM 系列的小型模型，拥有 90 亿参数。该模型继承了 GLM-4-32B 系列的技术特点，但提供了更轻量级的部署选择。尽管规模较小，GLM-4-9B-0414 仍在代码生成、网页设计、SVG 图形生成和基于搜索的写作等任务上展现出色能力。',
+    displayName: 'GLM-4 9B 0414',
+    enabled: true,
+    id: 'THUDM/GLM-4-9B-0414',
+    pricing: {
+      currency: 'CNY',
+      input: 0,
+      output: 0,
+    },
+    type: 'chat',
+  },
   {
     abilities: {
       functionCall: true,
@@ -29,6 +108,7 @@ const siliconcloudChatModels: AIChatModelCard[] = [
     description:
       'DeepSeek-V3 是一款拥有 6710 亿参数的混合专家（MoE）语言模型，采用多头潜在注意力（MLA）和 DeepSeekMoE 架构，结合无辅助损失的负载平衡策略，优化推理和训练效率。通过在 14.8 万亿高质量tokens上预训练，并进行监督微调和强化学习，DeepSeek-V3 在性能上超越其他开源模型，接近领先闭源模型。',
     displayName: 'DeepSeek V3',
+    enabled: true,
     id: 'deepseek-ai/DeepSeek-V3',
     pricing: {
       currency: 'CNY',
@@ -369,7 +449,6 @@ const siliconcloudChatModels: AIChatModelCard[] = [
     description:
       'Qwen2.5-72B-Instruct 是阿里云发布的最新大语言模型系列之一。该 72B 模型在编码和数学等领域具有显著改进的能力。它支持长达 128K tokens 的输入，可以生成超过 8K tokens 的长文本。该模型还提供了多语言支持，覆盖超过 29 种语言，包括中文、英文等。模型在指令跟随、理解结构化数据以及生成结构化输出（尤其是 JSON）方面都有显著提升',
     displayName: 'Qwen2.5 72B Instruct 128K',
-    enabled: true,
     id: 'Qwen/Qwen2.5-72B-Instruct-128K',
     pricing: {
       currency: 'CNY',
@@ -541,7 +620,6 @@ const siliconcloudChatModels: AIChatModelCard[] = [
     description:
       'Qwen2.5-VL 是 Qwen2.5 系列中的视觉语言模型。该模型在多方面有显著提升：具备更强的视觉理解能力，能够识别常见物体、分析文本、图表和布局；作为视觉代理能够推理并动态指导工具使用；支持理解超过 1 小时的长视频并捕捉关键事件；能够通过生成边界框或点准确定位图像中的物体；支持生成结构化输出，尤其适用于发票、表格等扫描数据。',
     displayName: 'Qwen2.5 VL 72B Instruct',
-    enabled: true,
     id: 'Qwen/Qwen2.5-VL-72B-Instruct',
     pricing: {
       currency: 'CNY',

package/src/config/aiModels/stepfun.ts CHANGED Viewed

@@ -3,6 +3,27 @@ import { AIChatModelCard } from '@/types/aiModel';
 // https://platform.stepfun.com/docs/pricing/details
 const stepfunChatModels: AIChatModelCard[] = [
+  {
+    abilities: {
+      // functionCall: true,
+      reasoning: true,
+      // search: true,
+      vision: true,
+    },
+    contextWindowTokens: 100_000,
+    description: '该模型是拥有强大的图像理解能力的推理大模型，能够处理图像和文字信息，经过深度思考后输出文本生成文本内容。该模型在视觉推理领域表现突出，同时拥有第一梯队的数学、代码、文本推理能力。上下文长度为100k。',
+    displayName: 'Step R1 V Mini',
+    id: 'step-r1-v-mini',
+    pricing: {
+      currency: 'CNY',
+      input: 2.5,
+      output: 8,
+    },
+    // settings: {
+    //   searchImpl: 'params',
+    // },
+    type: 'chat',
+  },
   {
     abilities: {
       functionCall: true,
@@ -11,8 +32,7 @@ const stepfunChatModels: AIChatModelCard[] = [
     contextWindowTokens: 8000,
     description: '高速模型，适合实时对话。',
     displayName: 'Step 1 Flash',
-    enabled: true,
-    id: 'step-1-flash',
+    id: 'step-1-flash', // 将在2025年4月30日下线
     pricing: {
       currency: 'CNY',
       input: 1,
@@ -31,7 +51,6 @@ const stepfunChatModels: AIChatModelCard[] = [
     contextWindowTokens: 8000,
     description: '小型模型，适合轻量级任务。',
     displayName: 'Step 1 8K',
-    enabled: true,
     id: 'step-1-8k',
     pricing: {
       currency: 'CNY',
@@ -51,7 +70,6 @@ const stepfunChatModels: AIChatModelCard[] = [
     contextWindowTokens: 32_000,
     description: '支持中等长度的对话，适用于多种应用场景。',
     displayName: 'Step 1 32K',
-    enabled: true,
     id: 'step-1-32k',
     pricing: {
       currency: 'CNY',
@@ -71,8 +89,7 @@ const stepfunChatModels: AIChatModelCard[] = [
     contextWindowTokens: 128_000,
     description: '平衡性能与成本，适合一般场景。',
     displayName: 'Step 1 128K',
-    enabled: true,
-    id: 'step-1-128k',
+    id: 'step-1-128k', // 将在2025年4月30日下线
     pricing: {
       currency: 'CNY',
       input: 40,
@@ -107,16 +124,18 @@ const stepfunChatModels: AIChatModelCard[] = [
       functionCall: true,
       search: true,
     },
-    contextWindowTokens: 16_000,
-    description: '支持大规模上下文交互，适合复杂对话场景。',
-    displayName: 'Step 2 16K',
+    contextWindowTokens: 8000,
+    description:
+      '基于新一代自研Attention架构MFA的极速大模型，用极低成本达到和step1类似的效果，同时保持了更高的吞吐和更快响应时延。能够处理通用任务，在代码能力上具备特长。',
+    displayName: 'Step 2 Mini',
     enabled: true,
-    id: 'step-2-16k',
-    pricing: {
+    id: 'step-2-mini',
+      pricing: {
       currency: 'CNY',
-      input: 38,
-      output: 120,
+      input: 1,
+      output: 2,
     },
+    releasedAt: '2025-01-14',
     settings: {
       searchImpl: 'params',
     },
@@ -127,18 +146,15 @@ const stepfunChatModels: AIChatModelCard[] = [
       functionCall: true,
       search: true,
     },
-    contextWindowTokens: 8000,
-    description:
-      '基于新一代自研Attention架构MFA的极速大模型，用极低成本达到和step1类似的效果，同时保持了更高的吞吐和更快响应时延。能够处理通用任务，在代码能力上具备特长。',
-    displayName: 'Step 2 Mini',
-    enabled: true,
-    id: 'step-2-mini',
-      pricing: {
+    contextWindowTokens: 16_000,
+    description: '支持大规模上下文交互，适合复杂对话场景。',
+    displayName: 'Step 2 16K',
+    id: 'step-2-16k',
+    pricing: {
       currency: 'CNY',
-      input: 1,
-      output: 2,
+      input: 38,
+      output: 120,
     },
-    releasedAt: '2025-01-14',
     settings: {
       searchImpl: 'params',
     },
@@ -153,7 +169,7 @@ const stepfunChatModels: AIChatModelCard[] = [
     description: 'step-2模型的实验版本，包含最新的特性，滚动更新中。不推荐在正式生产环境使用。',
     displayName: 'Step 2 16K Exp',
     enabled: true,
-    id: 'step-2-16k',
+    id: 'step-2-16k-exp',
     pricing: {
       currency: 'CNY',
       input: 38,
@@ -174,7 +190,6 @@ const stepfunChatModels: AIChatModelCard[] = [
     contextWindowTokens: 8000,
     description: '小型视觉模型，适合基本的图文任务。',
     displayName: 'Step 1V 8K',
-    enabled: true,
     id: 'step-1v-8k',
     pricing: {
       currency: 'CNY',
@@ -208,8 +223,6 @@ const stepfunChatModels: AIChatModelCard[] = [
   },
   {
     abilities: {
-      functionCall: true,
-      search: true,
       vision: true,
     },
     contextWindowTokens: 32_000,
@@ -223,9 +236,6 @@ const stepfunChatModels: AIChatModelCard[] = [
       output: 70,
     },
     releasedAt: '2025-01-22',
-    settings: {
-      searchImpl: 'params',
-    },
     type: 'chat',
   },
   {
@@ -235,7 +245,6 @@ const stepfunChatModels: AIChatModelCard[] = [
     contextWindowTokens: 32_000,
     description: '该模型拥有强大的视频理解能力。',
     displayName: 'Step 1.5V Mini',
-    enabled: true,
     id: 'step-1.5v-mini',
     pricing: {
       currency: 'CNY',

package/src/config/aiModels/tencentcloud.ts CHANGED Viewed

@@ -1,5 +1,5 @@
 import { AIChatModelCard } from '@/types/aiModel';
+// https://cloud.tencent.com/document/product/1772/115969
 const tencentCloudChatModels: AIChatModelCard[] = [
   {
     abilities: {
@@ -7,11 +7,11 @@ const tencentCloudChatModels: AIChatModelCard[] = [
     },
     contextWindowTokens: 65_536,
     description:
-      'DeepSeek-R1 是一款强化学习（RL）驱动的推理模型，解决了模型中的重复性和可读性问题。在 RL 之前，DeepSeek-R1 引入了冷启动数据，进一步优化了推理性能。它在数学、代码和推理任务中与 OpenAI-o1 表现相当，并且通过精心设计的训练方法，提升了整体效果。',
+      'DeepSeek-R1 为671B 模型，使用强化学习训练，推理过程包含大量反思和验证，思维链长度可达数万字。 该系列模型在数学、代码以及各种复杂逻辑推理任务上推理效果优异，并为用户展现了完整的思考过程。',
     displayName: 'DeepSeek R1',
     enabled: true,
     id: 'deepseek-r1',
-    maxOutput: 8192,
+    maxOutput: 16_000,
     pricing: {
       currency: 'CNY',
       input: 4,
@@ -23,9 +23,10 @@ const tencentCloudChatModels: AIChatModelCard[] = [
     contextWindowTokens: 65_536,
     description:
       'DeepSeek-V3-0324 为671B 参数 MoE 模型，在编程与技术能力、上下文理解与长文本处理等方面优势突出。',
-    displayName: 'DeepSeek-V3-0324',
+    displayName: 'DeepSeek V3 0324',
     enabled: true,
     id: 'deepseek-v3-0324',
+    maxOutput: 16_000,
     pricing: {
       currency: 'CNY',
       input: 2,
@@ -36,10 +37,10 @@ const tencentCloudChatModels: AIChatModelCard[] = [
   {
     contextWindowTokens: 65_536,
     description:
-      'DeepSeek-V3 是一款拥有 6710 亿参数的混合专家（MoE）语言模型，采用多头潜在注意力（MLA）和 DeepSeekMoE 架构，结合无辅助损失的负载平衡策略，优化推理和训练效率。通过在 14.8 万亿高质量tokens上预训练，并进行监督微调和强化学习，DeepSeek-V3 在性能上超越其他开源模型，接近领先闭源模型。',
+      'DeepSeek-V3 为671B 参数 MoE 模型，在百科知识、数学推理等多项任务上优势突出。',
     displayName: 'DeepSeek V3',
-    enabled: true,
     id: 'deepseek-v3',
+    maxOutput: 16_000,
     pricing: {
       currency: 'CNY',
       input: 2,

package/src/config/aiModels/volcengine.ts CHANGED Viewed

@@ -149,6 +149,7 @@ const doubaoChatModels: AIChatModelCard[] = [
   },
   {
     abilities: {
+      functionCall: true,
       vision: true,
     },
     config: {