npm - @lobehub/chat - Versions diffs - 1.51.6 → 1.51.7 - Mend

@lobehub/chat 1.51.6 → 1.51.7

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (4)

package/CHANGELOG.md +25 -0
package/changelog/v1.json +9 -0
package/package.json +1 -1
package/src/config/aiModels/qwen.ts +101 -2

package/CHANGELOG.md CHANGED Viewed

@@ -2,6 +2,31 @@
 # Changelog
+### [Version 1.51.7](https://github.com/lobehub/lobe-chat/compare/v1.51.6...v1.51.7)
+<sup>Released on **2025-02-06**</sup>
+#### 💄 Styles
+- **misc**: Add Aliyun deepseek-r1 distill models.
+<br/>
+<details>
+<summary><kbd>Improvements and Fixes</kbd></summary>
+#### Styles
+- **misc**: Add Aliyun deepseek-r1 distill models, closes [#5769](https://github.com/lobehub/lobe-chat/issues/5769) ([8b68190](https://github.com/lobehub/lobe-chat/commit/8b68190))
+</details>
+<div align="right">
+[![](https://img.shields.io/badge/-BACK_TO_TOP-151515?style=flat-square)](#readme-top)
+</div>
 ### [Version 1.51.6](https://github.com/lobehub/lobe-chat/compare/v1.51.5...v1.51.6)
 <sup>Released on **2025-02-06**</sup>

package/changelog/v1.json CHANGED Viewed

@@ -1,4 +1,13 @@
 [
+  {
+    "children": {
+      "improvements": [
+        "Add Aliyun deepseek-r1 distill models."
+      ]
+    },
+    "date": "2025-02-06",
+    "version": "1.51.7"
+  },
   {
     "children": {
       "fixes": [

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@lobehub/chat",
-  "version": "1.51.6",
+  "version": "1.51.7",
   "description": "Lobe Chat - an open-source, high-performance chatbot framework that supports speech synthesis, multimodal, and extensible Function Call plugin system. Supports one-click free deployment of your private ChatGPT/LLM web application.",
   "keywords": [
     "framework",

package/src/config/aiModels/qwen.ts CHANGED Viewed

@@ -411,10 +411,11 @@ const qwenChatModels: AIChatModelCard[] = [
     abilities: {
       reasoning: true,
     },
-    contextWindowTokens: 65_536,
+    contextWindowTokens: 131_072,
     description:
       'DeepSeek-R1 在后训练阶段大规模使用了强化学习技术，在仅有极少标注数据的情况下，极大提升了模型推理能力，尤其在数学、代码、自然语言推理等任务上。',
     displayName: 'DeepSeek R1',
+    enabled: true,
     id: 'deepseek-r1',
     maxOutput: 8192,
     pricing: {
@@ -429,10 +430,11 @@ const qwenChatModels: AIChatModelCard[] = [
     abilities: {
       functionCall: true,
     },
-    contextWindowTokens: 65_536,
+    contextWindowTokens: 131_072,
     description:
       'DeepSeek-V3 为自研 MoE 模型，671B 参数，激活 37B，在 14.8T token 上进行了预训练，在长文本、代码、数学、百科、中文能力上表现优秀。',
     displayName: 'DeepSeek V3',
+    enabled: true,
     id: 'deepseek-v3',
     maxOutput: 8192,
     pricing: {
@@ -443,6 +445,103 @@ const qwenChatModels: AIChatModelCard[] = [
     releasedAt: '2025-01-27',
     type: 'chat',
   },
+  {
+    abilities: {
+      reasoning: true,
+    },
+    contextWindowTokens: 131_072,
+    description:
+      'DeepSeek-R1-Distill 系列模型通过知识蒸馏技术，将 DeepSeek-R1 生成的样本对 Qwen、Llama 等开源模型进行微调后得到。',
+    displayName: 'DeepSeek R1 Distill Qwen 1.5B',
+    id: 'deepseek-r1-distill-qwen-1.5b',
+    maxOutput: 8192,
+    pricing: {
+      currency: 'CNY',
+      input: 0,
+      output: 0,
+    },
+    type: 'chat',
+  },
+  {
+    abilities: {
+      reasoning: true
+    },
+    contextWindowTokens: 131_072,
+    description: "DeepSeek-R1-Distill 系列模型通过知识蒸馏技术，将 DeepSeek-R1 生成的样本对 Qwen、Llama 等开源模型进行微调后得到。",
+    displayName: "DeepSeek R1 Distill Qwen 7B",
+    id: "deepseek-r1-distill-qwen-7b",
+    maxOutput: 8192,
+    pricing: {
+      currency: "CNY",
+      input: 0,
+      output: 0
+    },
+    type: "chat"
+  },
+  {
+    abilities: {
+      reasoning: true
+    },
+    contextWindowTokens: 131_072,
+    description: "DeepSeek-R1-Distill 系列模型通过知识蒸馏技术，将 DeepSeek-R1 生成的样本对 Qwen、Llama 等开源模型进行微调后得到。",
+    displayName: "DeepSeek R1 Distill Llama 8B",
+    id: "deepseek-r1-distill-llama-8b",
+    maxOutput: 8192,
+    pricing: {
+      currency: "CNY",
+      input: 0,
+      output: 0
+    },
+    type: "chat"
+  },
+  {
+    abilities: {
+      reasoning: true
+    },
+    contextWindowTokens: 131_072,
+    description: "DeepSeek-R1-Distill 系列模型通过知识蒸馏技术，将 DeepSeek-R1 生成的样本对 Qwen、Llama 等开源模型进行微调后得到。",
+    displayName: "DeepSeek R1 Distill Qwen 14B",
+    id: "deepseek-r1-distill-qwen-14b",
+    maxOutput: 8192,
+    pricing: {
+      currency: "CNY",
+      input: 0,
+      output: 0
+    },
+    type: "chat"
+  },
+  {
+    abilities: {
+      reasoning: true
+    },
+    contextWindowTokens: 131_072,
+    description: "DeepSeek-R1-Distill 系列模型通过知识蒸馏技术，将 DeepSeek-R1 生成的样本对 Qwen、Llama 等开源模型进行微调后得到。",
+    displayName: "DeepSeek R1 Distill Qwen 32B",
+    id: "deepseek-r1-distill-qwen-32b",
+    maxOutput: 8192,
+    pricing: {
+      currency: "CNY",
+      input: 0,
+      output: 0
+    },
+    type: "chat"
+  },
+  {
+    abilities: {
+      reasoning: true
+    },
+    contextWindowTokens: 131_072,
+    description: "DeepSeek-R1-Distill 系列模型通过知识蒸馏技术，将 DeepSeek-R1 生成的样本对 Qwen、Llama 等开源模型进行微调后得到。",
+    displayName: "DeepSeek R1 Distill Llama 70B",
+    id: "deepseek-r1-distill-llama-70b",
+    maxOutput: 8192,
+    pricing: {
+      currency: "CNY",
+      input: 0,
+      output: 0
+    },
+    type: "chat"
+  }
 ];
 export const allModels = [...qwenChatModels];