npm - @lobehub/chat - Versions diffs - 1.45.1 → 1.45.2 - Mend

@lobehub/chat 1.45.1 → 1.45.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/CHANGELOG.md +25 -0
package/changelog/v1.json +9 -0
package/package.json +1 -1
package/src/config/aiModels/siliconcloud.ts +6 -72
package/src/config/modelProviders/siliconcloud.ts +4 -65

package/CHANGELOG.md CHANGED Viewed

@@ -2,6 +2,31 @@
 # Changelog
+### [Version 1.45.2](https://github.com/lobehub/lobe-chat/compare/v1.45.1...v1.45.2)
+<sup>Released on **2025-01-09**</sup>
+#### 💄 Styles
+- **misc**: Update siliconcloud model list.
+<br/>
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+#### Styles
+- **misc**: Update siliconcloud model list, closes [#5360](https://github.com/lobehub/lobe-chat/issues/5360) ([69085ac](https://github.com/lobehub/lobe-chat/commit/69085ac))
+</details>
+<div align="right">
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+</div>
 ### [Version 1.45.1](https://github.com/lobehub/lobe-chat/compare/v1.45.0...v1.45.1)
 <sup>Released on **2025-01-09**</sup>

package/changelog/v1.json CHANGED Viewed

@@ -1,4 +1,13 @@
 [
+  {
+    "children": {
+      "improvements": [
+        "Update siliconcloud model list."
+      ]
+    },
+    "date": "2025-01-09",
+    "version": "1.45.2"
+  },
   {
     "children": {
       "fixes": [

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@lobehub/chat",
-  "version": "1.45.1",
+  "version": "1.45.2",
   "description": "Lobe Chat - an open-source, high-performance chatbot framework that supports speech synthesis, multimodal, and extensible Function Call plugin system. Supports one-click free deployment of your private ChatGPT/LLM web application.",
   "keywords": [
     "framework",

package/src/config/aiModels/siliconcloud.ts CHANGED Viewed

@@ -1,20 +1,6 @@
 import { AIChatModelCard } from '@/types/aiModel';
 const siliconcloudChatModels: AIChatModelCard[] = [
-  {
-    contextWindowTokens: 32_768,
-    description:
-      'Hunyuan-Large 是业界最大的开源 Transformer 架构 MoE 模型，拥有 3890 亿总参数量和 520 亿激活参数量。',
-    displayName: 'Hunyuan A52B Instruct',
-    enabled: true,
-    id: 'Tencent/Hunyuan-A52B-Instruct',
-    pricing: {
-      currency: 'CNY',
-      input: 21,
-      output: 21,
-    },
-    type: 'chat',
-  },
   {
     abilities: {
       functionCall: true,
@@ -32,19 +18,6 @@ const siliconcloudChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
-  {
-    contextWindowTokens: 32_768,
-    description:
-      'DeepSeek-V2 是一个强大、经济高效的混合专家（MoE）语言模型。它在 8.1 万亿个 token 的高质量语料库上进行了预训练，并通过监督微调（SFT）和强化学习（RL）进一步提升了模型能力。与 DeepSeek 67B 相比， DeepSeek-V2 在性能更强的同时，节省了 42.5% 的训练成本，减少了 93.3% 的 KV 缓存，并将最大生成吞吐量提高到了 5.76 倍。该模型支持 128k 的上下文长度，在标准基准测试和开放式生成评估中都表现出色',
-    displayName: 'DeepSeek V2 Chat',
-    id: 'deepseek-ai/DeepSeek-V2-Chat',
-    pricing: {
-      currency: 'CNY',
-      input: 1.33,
-      output: 1.33,
-    },
-    type: 'chat',
-  },
   {
     contextWindowTokens: 32_768,
     description:
@@ -238,19 +211,6 @@ const siliconcloudChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
-  {
-    contextWindowTokens: 4096,
-    description:
-      'Qwen2.5-Math-72B 是阿里云发布的 Qwen2.5-Math 系列数学大语言模型之一。该模型支持使用思维链（CoT）和工具集成推理（TIR）方法解决中文和英文数学问题。相比前代 Qwen2-Math 系列，Qwen2.5-Math 系列在中英文数学基准测试中取得了显著的性能提升。该模型在处理精确计算、符号操作和算法操作方面表现出色，尤其适合解决复杂的数学和算法推理任务',
-    displayName: 'Qwen2.5 Math 72B Instruct',
-    id: 'Qwen/Qwen2.5-Math-72B-Instruct',
-    pricing: {
-      currency: 'CNY',
-      input: 4.13,
-      output: 4.13,
-    },
-    type: 'chat',
-  },
   {
     contextWindowTokens: 32_768,
     description:
@@ -303,19 +263,6 @@ const siliconcloudChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
-  {
-    contextWindowTokens: 32_768,
-    description:
-      'Qwen2-72B-Instruct 是 Qwen2 系列中的指令微调大语言模型，参数规模为 72B。该模型基于 Transformer 架构，采用了 SwiGLU 激活函数、注意力 QKV 偏置和组查询注意力等技术。它能够处理大规模输入。该模型在语言理解、生成、多语言能力、编码、数学和推理等多个基准测试中表现出色，超越了大多数开源模型，并在某些任务上展现出与专有模型相当的竞争力',
-    displayName: 'Qwen2 72B Instruct (Vendor-A)',
-    id: 'Vendor-A/Qwen/Qwen2-7B-Instruct',
-    pricing: {
-      currency: 'CNY',
-      input: 1,
-      output: 1,
-    },
-    type: 'chat',
-  },
   {
     abilities: {
       vision: true,
@@ -414,22 +361,6 @@ const siliconcloudChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
-  {
-    abilities: {
-      vision: true,
-    },
-    contextWindowTokens: 8192,
-    description:
-      'InternVL2-Llama3-76B 是 InternVL 2.0 系列中的大规模多模态模型。它由 InternViT-6B-448px-V1-5 视觉模型、MLP 投影层和 Hermes-2-Theta-Llama-3-70B 语言模型组成。该模型在各种视觉语言任务上表现出色，包括文档和图表理解、信息图表问答、场景文本理解和 OCR 任务等。InternVL2-Llama3-76B 使用 8K 上下文窗口训练，能够处理长文本、多图像和视频输入，显著提升了模型在这些任务上的处理能力，在多项基准测试中达到或接近最先进的商业模型水平',
-    displayName: 'InternVL2 Llama3 76B',
-    id: 'OpenGVLab/InternVL2-Llama3-76B',
-    pricing: {
-      currency: 'CNY',
-      input: 4.13,
-      output: 4.13,
-    },
-    type: 'chat',
-  },
   {
     abilities: {
       functionCall: true,
@@ -617,12 +548,15 @@ const siliconcloudChatModels: AIChatModelCard[] = [
     type: 'chat',
   },
   {
+    abilities: {
+      functionCall: true,
+    },
     contextWindowTokens: 32_768,
     description:
-      'Llama-3.1-Nemotron-70B-Instruct 是由 NVIDIA 定制的大型语言模型，旨在提高 LLM 生成的响应对用户查询的帮助程度。该模型在 Arena Hard、AlpacaEval 2 LC 和 GPT-4-Turbo MT-Bench 等基准测试中表现出色，截至 2024 年 10 月 1 日，在所有三个自动对齐基准测试中排名第一。该模型使用 RLHF（特别是 REINFORCE）、Llama-3.1-Nemotron-70B-Reward 和 HelpSteer2-Preference 提示在 Llama-3.1-70B-Instruct 模型基础上进行训练',
-    displayName: 'Llama 3.1 Nemotron 70B Instruct',
+      'Llama 3.3 是 Llama 系列最先进的多语言开源大型语言模型，以极低成本体验媲美 405B 模型的性能。基于 Transformer 结构，并通过监督微调（SFT）和人类反馈强化学习（RLHF）提升有用性和安全性。其指令调优版本专为多语言对话优化，在多项行业基准上表现优于众多开源和封闭聊天模型。知识截止日期为 2023 年 12 月',
+    displayName: 'Llama 3.3 70B Instruct',
     enabled: true,
-    id: 'nvidia/Llama-3.1-Nemotron-70B-Instruct',
+    id: 'meta-llama/Llama-3.3-70B-Instruct',
     pricing: {
       currency: 'CNY',
       input: 4.13,

package/src/config/modelProviders/siliconcloud.ts CHANGED Viewed

@@ -3,19 +3,6 @@ import { ModelProviderCard } from '@/types/llm';
 // ref :https://siliconflow.cn/zh-cn/pricing
 const SiliconCloud: ModelProviderCard = {
   chatModels: [
-    {
-      contextWindowTokens: 32_768,
-      description:
-        'Hunyuan-Large 是业界最大的开源 Transformer 架构 MoE 模型，拥有 3890 亿总参数量和 520 亿激活参数量。',
-      displayName: 'Hunyuan A52B Instruct',
-      enabled: true,
-      id: 'Tencent/Hunyuan-A52B-Instruct',
-      pricing: {
-        currency: 'CNY',
-        input: 21,
-        output: 21,
-      },
-    },
     {
       contextWindowTokens: 32_768,
       description:
@@ -30,18 +17,6 @@ const SiliconCloud: ModelProviderCard = {
         output: 1.33,
       },
     },
-    {
-      contextWindowTokens: 32_768,
-      description:
-        'DeepSeek-V2 是一个强大、经济高效的混合专家（MoE）语言模型。它在 8.1 万亿个 token 的高质量语料库上进行了预训练，并通过监督微调（SFT）和强化学习（RL）进一步提升了模型能力。与 DeepSeek 67B 相比， DeepSeek-V2 在性能更强的同时，节省了 42.5% 的训练成本，减少了 93.3% 的 KV 缓存，并将最大生成吞吐量提高到了 5.76 倍。该模型支持 128k 的上下文长度，在标准基准测试和开放式生成评估中都表现出色',
-      displayName: 'DeepSeek V2 Chat',
-      id: 'deepseek-ai/DeepSeek-V2-Chat',
-      pricing: {
-        currency: 'CNY',
-        input: 1.33,
-        output: 1.33,
-      },
-    },
     {
       contextWindowTokens: 32_768,
       description:
@@ -208,18 +183,6 @@ const SiliconCloud: ModelProviderCard = {
         output: 1.26,
       },
     },
-    {
-      contextWindowTokens: 4096,
-      description:
-        'Qwen2.5-Math-72B 是阿里云发布的 Qwen2.5-Math 系列数学大语言模型之一。该模型支持使用思维链（CoT）和工具集成推理（TIR）方法解决中文和英文数学问题。相比前代 Qwen2-Math 系列，Qwen2.5-Math 系列在中英文数学基准测试中取得了显著的性能提升。该模型在处理精确计算、符号操作和算法操作方面表现出色，尤其适合解决复杂的数学和算法推理任务',
-      displayName: 'Qwen2.5 Math 72B Instruct',
-      id: 'Qwen/Qwen2.5-Math-72B-Instruct',
-      pricing: {
-        currency: 'CNY',
-        input: 4.13,
-        output: 4.13,
-      },
-    },
     {
       contextWindowTokens: 32_768,
       description:
@@ -280,18 +243,6 @@ const SiliconCloud: ModelProviderCard = {
         output: 4.13,
       },
     },
-    {
-      contextWindowTokens: 32_768,
-      description:
-        'Qwen2-72B-Instruct 是 Qwen2 系列中的指令微调大语言模型，参数规模为 72B。该模型基于 Transformer 架构，采用了 SwiGLU 激活函数、注意力 QKV 偏置和组查询注意力等技术。它能够处理大规模输入。该模型在语言理解、生成、多语言能力、编码、数学和推理等多个基准测试中表现出色，超越了大多数开源模型，并在某些任务上展现出与专有模型相当的竞争力',
-      displayName: 'Qwen2 72B Instruct (Vendor-A)',
-      id: 'Vendor-A/Qwen/Qwen2-7B-Instruct',
-      pricing: {
-        currency: 'CNY',
-        input: 1,
-        output: 1,
-      },
-    },
     {
       contextWindowTokens: 32_768,
       description:
@@ -372,19 +323,6 @@ const SiliconCloud: ModelProviderCard = {
       },
       vision: true,
     },
-    {
-      contextWindowTokens: 8192,
-      description:
-        'InternVL2-Llama3-76B 是 InternVL 2.0 系列中的大规模多模态模型。它由 InternViT-6B-448px-V1-5 视觉模型、MLP 投影层和 Hermes-2-Theta-Llama-3-70B 语言模型组成。该模型在各种视觉语言任务上表现出色，包括文档和图表理解、信息图表问答、场景文本理解和 OCR 任务等。InternVL2-Llama3-76B 使用 8K 上下文窗口训练，能够处理长文本、多图像和视频输入，显著提升了模型在这些任务上的处理能力，在多项基准测试中达到或接近最先进的商业模型水平',
-      displayName: 'InternVL2 Llama3 76B',
-      id: 'OpenGVLab/InternVL2-Llama3-76B',
-      pricing: {
-        currency: 'CNY',
-        input: 4.13,
-        output: 4.13,
-      },
-      vision: true,
-    },
     {
       contextWindowTokens: 131_072,
       description:
@@ -553,10 +491,11 @@ const SiliconCloud: ModelProviderCard = {
     {
       contextWindowTokens: 32_768,
       description:
-        'Llama-3.1-Nemotron-70B-Instruct 是由 NVIDIA 定制的大型语言模型，旨在提高 LLM 生成的响应对用户查询的帮助程度。该模型在 Arena Hard、AlpacaEval 2 LC 和 GPT-4-Turbo MT-Bench 等基准测试中表现出色，截至 2024 年 10 月 1 日，在所有三个自动对齐基准测试中排名第一。该模型使用 RLHF（特别是 REINFORCE）、Llama-3.1-Nemotron-70B-Reward 和 HelpSteer2-Preference 提示在 Llama-3.1-70B-Instruct 模型基础上进行训练',
-      displayName: 'Llama 3.1 Nemotron 70B Instruct',
+        'Llama 3.3 是 Llama 系列最先进的多语言开源大型语言模型，以极低成本体验媲美 405B 模型的性能。基于 Transformer 结构，并通过监督微调（SFT）和人类反馈强化学习（RLHF）提升有用性和安全性。其指令调优版本专为多语言对话优化，在多项行业基准上表现优于众多开源和封闭聊天模型。知识截止日期为 2023 年 12 月',
+      displayName: 'Llama 3.3 70B Instruct',
       enabled: true,
-      id: 'nvidia/Llama-3.1-Nemotron-70B-Instruct',
+      functionCall: true,
+      id: 'meta-llama/Llama-3.3-70B-Instruct',
       pricing: {
         currency: 'CNY',
         input: 4.13,