npm - @lobehub/chat - Versions diffs - 1.40.1 → 1.40.3 - Mend

@lobehub/chat 1.40.1 → 1.40.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (118) hide show

package/src/config/modelProviders/openrouter.ts CHANGED Viewed

@@ -4,16 +4,17 @@ import { ModelProviderCard } from '@/types/llm';
 const OpenRouter: ModelProviderCard = {
   chatModels: [
     {
+      contextWindowTokens: 128_000,
       description:
         '根据上下文长度、主题和复杂性，你的请求将发送到 Llama 3 70B Instruct、Claude 3.5 Sonnet（自我调节）或 GPT-4o。',
       displayName: 'Auto (best for prompt)',
       enabled: true,
       functionCall: false,
       id: 'openrouter/auto',
-      tokens: 128_000,
       vision: false,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'o1-mini是一款针对编程、数学和科学应用场景而设计的快速、经济高效的推理模型。该模型具有128K上下文和2023年10月的知识截止日期。',
       displayName: 'OpenAI o1-mini',
@@ -25,9 +26,9 @@ const OpenRouter: ModelProviderCard = {
         output: 12,
       },
       releasedAt: '2024-09-12',
-      tokens: 128_000,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'o1是OpenAI新的推理模型，适用于需要广泛通用知识的复杂任务。该模型具有128K上下文和2023年10月的知识截止日期。',
       displayName: 'OpenAI o1-preview',
@@ -39,9 +40,9 @@ const OpenRouter: ModelProviderCard = {
         output: 60,
       },
       releasedAt: '2024-09-12',
-      tokens: 128_000,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'GPT-4o mini是OpenAI在GPT-4 Omni之后推出的最新模型，支持图文输入并输出文本。作为他们最先进的小型模型，它比其他近期的前沿模型便宜很多，并且比GPT-3.5 Turbo便宜超过60%。它保持了最先进的智能，同时具有显著的性价比。GPT-4o mini在MMLU测试中获得了 82% 的得分，目前在聊天偏好上排名高于 GPT-4。',
       displayName: 'GPT-4o mini',
@@ -53,10 +54,10 @@ const OpenRouter: ModelProviderCard = {
         input: 0.15,
         output: 0.6,
       },
-      tokens: 128_000,
       vision: true,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'ChatGPT-4o 是一款动态模型，实时更新以保持当前最新版本。它结合了强大的语言理解与生成能力，适合于大规模应用场景，包括客户服务、教育和技术支持。',
       displayName: 'GPT-4o',
@@ -67,10 +68,10 @@ const OpenRouter: ModelProviderCard = {
         input: 2.5,
         output: 10,
       },
-      tokens: 128_000,
       vision: true,
     },
     {
+      contextWindowTokens: 200_000,
       description:
         'Claude 3 Haiku 是 Anthropic 的最快且最紧凑的模型，旨在实现近乎即时的响应。它具有快速且准确的定向性能。',
       displayName: 'Claude 3 Haiku',
@@ -85,10 +86,10 @@ const OpenRouter: ModelProviderCard = {
         writeCacheInput: 0.3125,
       },
       releasedAt: '2024-03-07',
-      tokens: 200_000,
       vision: true,
     },
     {
+      contextWindowTokens: 200_000,
       description:
         'Claude 3.5 Sonnet 提供了超越 Opus 的能力和比 Sonnet 更快的速度，同时保持与 Sonnet 相同的价格。Sonnet 特别擅长编程、数据科学、视觉处理、代理任务。',
       displayName: 'Claude 3.5 Sonnet',
@@ -103,10 +104,10 @@ const OpenRouter: ModelProviderCard = {
         writeCacheInput: 3.75,
       },
       releasedAt: '2024-06-20',
-      tokens: 200_000,
       vision: true,
     },
     {
+      contextWindowTokens: 200_000,
       description:
         'Claude 3 Opus 是 Anthropic 用于处理高度复杂任务的最强大模型。它在性能、智能、流畅性和理解力方面表现卓越。',
       displayName: 'Claude 3 Opus',
@@ -121,10 +122,10 @@ const OpenRouter: ModelProviderCard = {
         writeCacheInput: 18.75,
       },
       releasedAt: '2024-02-29',
-      tokens: 200_000,
       vision: true,
     },
     {
+      contextWindowTokens: 1_000_000 + 8192,
       description: 'Gemini 1.5 Flash 提供了优化后的多模态处理能力，适用多种复杂任务场景。',
       displayName: 'Gemini 1.5 Flash',
       enabled: true,
@@ -135,10 +136,10 @@ const OpenRouter: ModelProviderCard = {
         input: 0.075,
         output: 0.3,
       },
-      tokens: 1_000_000 + 8192,
       vision: true,
     },
     {
+      contextWindowTokens: 2_000_000 + 8192,
       description: 'Gemini 1.5 Pro 结合最新优化技术，带来更高效的多模态数据处理能力。',
       displayName: 'Gemini 1.5 Pro',
       enabled: true,
@@ -149,10 +150,10 @@ const OpenRouter: ModelProviderCard = {
         input: 3.5,
         output: 10.5,
       },
-      tokens: 2_000_000 + 8192,
       vision: true,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         '融合通用与代码能力的全新开源模型, 不仅保留了原有 Chat 模型的通用对话能力和 Coder 模型的强大代码处理能力，还更好地对齐了人类偏好。此外，DeepSeek-V2.5 在写作任务、指令跟随等多个方面也实现了大幅提升。',
       displayName: 'DeepSeek V2.5',
@@ -164,10 +165,11 @@ const OpenRouter: ModelProviderCard = {
         output: 0.28,
       },
       releasedAt: '2024-09-05',
-      tokens: 128_000,
     },
     {
-      description: 'LLaMA 3.2 旨在处理结合视觉和文本数据的任务。它在图像描述和视觉问答等任务中表现出色，跨越了语言生成和视觉推理之间的鸿沟。',
+      contextWindowTokens: 131_072,
+      description:
+        'LLaMA 3.2 旨在处理结合视觉和文本数据的任务。它在图像描述和视觉问答等任务中表现出色，跨越了语言生成和视觉推理之间的鸿沟。',
       displayName: 'Llama 3.2 11B Vision',
       enabled: true,
       id: 'meta-llama/llama-3.2-11b-vision-instruct',
@@ -175,11 +177,12 @@ const OpenRouter: ModelProviderCard = {
         input: 0.162,
         output: 0.162,
       },
-      tokens: 131_072,
       vision: true,
     },
     {
-      description: 'LLaMA 3.2 旨在处理结合视觉和文本数据的任务。它在图像描述和视觉问答等任务中表现出色，跨越了语言生成和视觉推理之间的鸿沟。',
+      contextWindowTokens: 131_072,
+      description:
+        'LLaMA 3.2 旨在处理结合视觉和文本数据的任务。它在图像描述和视觉问答等任务中表现出色，跨越了语言生成和视觉推理之间的鸿沟。',
       displayName: 'Llama 3.2 90B Vision',
       enabled: true,
       id: 'meta-llama/llama-3.2-90b-vision-instruct',
@@ -187,29 +190,28 @@ const OpenRouter: ModelProviderCard = {
         input: 0.4,
         output: 0.4,
       },
-      tokens: 131_072,
       vision: true,
     },
     {
+      contextWindowTokens: 32_768,
       description: 'Qwen2 是全新的大型语言模型系列，具有更强的理解和生成能力。',
       displayName: 'Qwen2 7B (Free)',
       enabled: true,
       id: 'qwen/qwen-2-7b-instruct:free',
-      tokens: 32_768,
     },
     {
+      contextWindowTokens: 32_768,
       description: 'LLaMA 3.1 提供多语言支持，是业界领先的生成模型之一。',
       displayName: 'Llama 3.1 8B (Free)',
       enabled: true,
       id: 'meta-llama/llama-3.1-8b-instruct:free',
-      tokens: 32_768,
     },
     {
+      contextWindowTokens: 8192,
       description: 'Gemma 2 是Google轻量化的开源文本模型系列。',
       displayName: 'Gemma 2 9B (Free)',
       enabled: true,
       id: 'google/gemma-2-9b-it:free',
-      tokens: 8192,
     },
   ],
   checkModel: 'google/gemma-2-9b-it:free',

package/src/config/modelProviders/perplexity.ts CHANGED Viewed

@@ -4,56 +4,56 @@ import { ModelProviderCard } from '@/types/llm';
 const Perplexity: ModelProviderCard = {
   chatModels: [
     {
+      contextWindowTokens: 128_000,
       description:
         'Llama 3.1 Sonar Small Online 模型，具备8B参数，支持约127,000个标记的上下文长度，专为在线聊天设计，能高效处理各种文本交互。',
       displayName: 'Llama 3.1 Sonar Small Online',
       enabled: true,
       id: 'llama-3.1-sonar-small-128k-online',
-      tokens: 128_000,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'Llama 3.1 Sonar Large Online 模型，具备70B参数，支持约127,000个标记的上下文长度，适用于高容量和多样化聊天任务。',
       displayName: 'Llama 3.1 Sonar Large Online',
       enabled: true,
       id: 'llama-3.1-sonar-large-128k-online',
-      tokens: 128_000,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'Llama 3.1 Sonar Huge Online 模型，具备405B参数，支持约127,000个标记的上下文长度，设计用于复杂的在线聊天应用。',
       displayName: 'Llama 3.1 Sonar Huge Online',
       enabled: true,
       id: 'llama-3.1-sonar-huge-128k-online',
-      tokens: 128_000,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'Llama 3.1 Sonar Small Chat 模型，具备8B参数，专为离线聊天设计，支持约127,000个标记的上下文长度。',
       displayName: 'Llama 3.1 Sonar Small Chat',
       enabled: true,
       id: 'llama-3.1-sonar-small-128k-chat',
-      tokens: 128_000,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'Llama 3.1 Sonar Large Chat 模型，具备70B参数，支持约127,000个标记的上下文长度，适合于复杂的离线聊天任务。',
       displayName: 'Llama 3.1 Sonar Large Chat',
       enabled: true,
       id: 'llama-3.1-sonar-large-128k-chat',
-      tokens: 128_000,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'Llama 3.1 8B Instruct 模型，具备8B参数，支持画面指示任务的高效执行，提供优质的文本生成能力。',
       id: 'llama-3.1-8b-instruct',
-      tokens: 128_000,
     },
     {
+      contextWindowTokens: 128_000,
       description:
         'Llama 3.1 70B Instruct 模型，具备70B参数，能在大型文本生成和指示任务中提供卓越性能。',
       id: 'llama-3.1-70b-instruct',
-      tokens: 128_000,
     },
   ],
   checkModel: 'llama-3.1-8b-instruct',

package/src/config/modelProviders/qwen.ts CHANGED Viewed

@@ -4,6 +4,7 @@ import { ModelProviderCard } from '@/types/llm';
 const Qwen: ModelProviderCard = {
   chatModels: [
     {
+      contextWindowTokens: 131_072,
       description: '通义千问超大规模语言模型，支持中文、英文等不同语言输入。',
       displayName: 'Qwen Turbo',
       enabled: true,
@@ -14,9 +15,9 @@ const Qwen: ModelProviderCard = {
         input: 0.3,
         output: 0.6,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 131_072,
       description: '通义千问超大规模语言模型增强版，支持中文、英文等不同语言输入。',
       displayName: 'Qwen Plus',
       enabled: true,
@@ -27,9 +28,9 @@ const Qwen: ModelProviderCard = {
         input: 0.8,
         output: 2,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 32_768,
       description:
         '通义千问千亿级别超大规模语言模型，支持中文、英文等不同语言输入，当前通义千问2.5产品版本背后的API模型。',
       displayName: 'Qwen Max',
@@ -41,9 +42,9 @@ const Qwen: ModelProviderCard = {
         input: 20,
         output: 60,
       },
-      tokens: 32_768,
     },
     {
+      contextWindowTokens: 1_000_000,
       description:
         '通义千问超大规模语言模型，支持长文本上下文，以及基于长文档、多文档等多个场景的对话功能。',
       displayName: 'Qwen Long',
@@ -53,9 +54,9 @@ const Qwen: ModelProviderCard = {
         input: 0.5,
         output: 2,
       },
-      tokens: 1_000_000,
     },
     {
+      contextWindowTokens: 32_000,
       description:
         '通义千问大规模视觉语言模型增强版。大幅提升细节识别能力和文字识别能力，支持超百万像素分辨率和任意长宽比规格的图像。',
       displayName: 'Qwen VL Plus',
@@ -66,10 +67,10 @@ const Qwen: ModelProviderCard = {
         input: 8,
         output: 8,
       },
-      tokens: 32_000,
       vision: true,
     },
     {
+      contextWindowTokens: 32_000,
       description:
         '通义千问超大规模视觉语言模型。相比增强版，再次提升视觉推理能力和指令遵循能力，提供更高的视觉感知和认知水平。',
       displayName: 'Qwen VL Max',
@@ -80,12 +81,11 @@ const Qwen: ModelProviderCard = {
         input: 20,
         output: 20,
       },
-      tokens: 32_000,
       vision: true,
     },
     {
-      description:
-        '通义千问数学模型是专门用于数学解题的语言模型。',
+      contextWindowTokens: 4096,
+      description: '通义千问数学模型是专门用于数学解题的语言模型。',
       displayName: 'Qwen Math Turbo',
       id: 'qwen-math-turbo-latest',
       pricing: {
@@ -93,11 +93,10 @@ const Qwen: ModelProviderCard = {
         input: 2,
         output: 6,
       },
-      tokens: 4096,
     },
     {
-      description:
-        '通义千问数学模型是专门用于数学解题的语言模型。',
+      contextWindowTokens: 4096,
+      description: '通义千问数学模型是专门用于数学解题的语言模型。',
       displayName: 'Qwen Math Plus',
       id: 'qwen-math-plus-latest',
       pricing: {
@@ -105,9 +104,9 @@ const Qwen: ModelProviderCard = {
         input: 4,
         output: 12,
       },
-      tokens: 4096,
     },
     {
+      contextWindowTokens: 131_072,
       description: '通义千问代码模型。',
       displayName: 'Qwen Coder Turbo',
       id: 'qwen-coder-turbo-latest',
@@ -116,9 +115,9 @@ const Qwen: ModelProviderCard = {
         input: 2,
         output: 6,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 131_072,
       description: '通义千问代码模型。',
       displayName: 'Qwen Coder Plus',
       id: 'qwen-coder-plus-latest',
@@ -127,9 +126,9 @@ const Qwen: ModelProviderCard = {
         input: 3.5,
         output: 7,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 32_768,
       description: 'QwQ模型是由 Qwen 团队开发的实验性研究模型，专注于增强 AI 推理能力。',
       displayName: 'QwQ 32B Preview',
       id: 'qwq-32b-preview',
@@ -138,9 +137,9 @@ const Qwen: ModelProviderCard = {
         input: 0,
         output: 0,
       },
-      tokens: 32_768,
     },
     {
+      contextWindowTokens: 131_072,
       description: '通义千问2.5对外开源的7B规模的模型。',
       displayName: 'Qwen2.5 7B',
       functionCall: true,
@@ -150,9 +149,9 @@ const Qwen: ModelProviderCard = {
         input: 1,
         output: 2,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 131_072,
       description: '通义千问2.5对外开源的14B规模的模型。',
       displayName: 'Qwen2.5 14B',
       functionCall: true,
@@ -162,9 +161,9 @@ const Qwen: ModelProviderCard = {
         input: 2,
         output: 6,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 131_072,
       description: '通义千问2.5对外开源的32B规模的模型。',
       displayName: 'Qwen2.5 32B',
       functionCall: true,
@@ -174,9 +173,9 @@ const Qwen: ModelProviderCard = {
         input: 3.5,
         output: 7,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 131_072,
       description: '通义千问2.5对外开源的72B规模的模型。',
       displayName: 'Qwen2.5 72B',
       functionCall: true,
@@ -186,9 +185,9 @@ const Qwen: ModelProviderCard = {
         input: 4,
         output: 12,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 4096,
       description: 'Qwen-Math 模型具有强大的数学解题能力。',
       displayName: 'Qwen2.5 Math 7B',
       id: 'qwen2.5-math-7b-instruct',
@@ -197,9 +196,9 @@ const Qwen: ModelProviderCard = {
         input: 1,
         output: 2,
       },
-      tokens: 4096,
     },
     {
+      contextWindowTokens: 4096,
       description: 'Qwen-Math 模型具有强大的数学解题能力。',
       displayName: 'Qwen2.5 Math 72B',
       id: 'qwen2.5-math-72b-instruct',
@@ -208,9 +207,9 @@ const Qwen: ModelProviderCard = {
         input: 4,
         output: 12,
       },
-      tokens: 4096,
     },
     {
+      contextWindowTokens: 131_072,
       description: '通义千问代码模型开源版。',
       displayName: 'Qwen2.5 Coder 7B',
       id: 'qwen2.5-coder-7b-instruct',
@@ -219,9 +218,9 @@ const Qwen: ModelProviderCard = {
         input: 1,
         output: 2,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 131_072,
       description: '通义千问代码模型开源版。',
       displayName: 'Qwen2.5 Coder 32B',
       id: 'qwen2.5-coder-32b-instruct',
@@ -230,9 +229,9 @@ const Qwen: ModelProviderCard = {
         input: 3.5,
         output: 7,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 8000,
       description: '以 Qwen-7B 语言模型初始化，添加图像模型，图像输入分辨率为448的预训练模型。',
       displayName: 'Qwen VL',
       id: 'qwen-vl-v1',
@@ -241,10 +240,10 @@ const Qwen: ModelProviderCard = {
         input: 0,
         output: 0,
       },
-      tokens: 8000,
       vision: true,
     },
     {
+      contextWindowTokens: 8000,
       description: '通义千问VL支持灵活的交互方式，包括多图、多轮问答、创作等能力的模型。',
       displayName: 'Qwen VL Chat',
       id: 'qwen-vl-chat-v1',
@@ -253,7 +252,6 @@ const Qwen: ModelProviderCard = {
         input: 0,
         output: 0,
       },
-      tokens: 8000,
       vision: true,
     },
   ],

package/src/config/modelProviders/sensenova.ts CHANGED Viewed

@@ -5,6 +5,7 @@ import { ModelProviderCard } from '@/types/llm';
 const SenseNova: ModelProviderCard = {
   chatModels: [
     {
+      contextWindowTokens: 131_072,
       description:
         '最新版本模型 (V5.5)，128K上下文长度，在数学推理、英文对话、指令跟随以及长文本理解等领域能力显著提升，比肩GPT-4o',
       displayName: 'SenseChat 5.5',
@@ -16,7 +17,6 @@ const SenseNova: ModelProviderCard = {
         input: 40,
         output: 100,
       },
-      tokens: 131_072,
     },
     /*
     // Not compatible with local mode (Not support Base64 Image)
@@ -35,6 +35,7 @@ const SenseNova: ModelProviderCard = {
     },
 */
     {
+      contextWindowTokens: 32_768,
       description: '适用于快速问答、模型微调场景',
       displayName: 'SenseChat 5.0 Turbo',
       enabled: true,
@@ -44,9 +45,9 @@ const SenseNova: ModelProviderCard = {
         input: 2,
         output: 5,
       },
-      tokens: 32_768,
     },
     {
+      contextWindowTokens: 32_768,
       description:
         '32K上下文长度，在粤语的对话理解上超越了GPT-4，在知识、推理、数学及代码编写等多个领域均能与GPT-4 Turbo相媲美',
       displayName: 'SenseChat 5.0 Cantonese',
@@ -56,9 +57,9 @@ const SenseNova: ModelProviderCard = {
         input: 27,
         output: 27,
       },
-      tokens: 32_768,
     },
     {
+      contextWindowTokens: 131_072,
       description: '基础版本模型 (V4)，128K上下文长度，在长文本理解及生成等任务中表现出色',
       displayName: 'SenseChat 4.0 128K',
       enabled: true,
@@ -68,9 +69,9 @@ const SenseNova: ModelProviderCard = {
         input: 60,
         output: 60,
       },
-      tokens: 131_072,
     },
     {
+      contextWindowTokens: 32_768,
       description: '基础版本模型 (V4)，32K上下文长度，灵活应用于各类场景',
       displayName: 'SenseChat 4.0 32K',
       enabled: true,
@@ -80,9 +81,9 @@ const SenseNova: ModelProviderCard = {
         input: 36,
         output: 36,
       },
-      tokens: 32_768,
     },
     {
+      contextWindowTokens: 4096,
       description: '基础版本模型 (V4)，4K上下文长度，通用能力强大',
       displayName: 'SenseChat 4.0 4K',
       enabled: true,
@@ -92,9 +93,9 @@ const SenseNova: ModelProviderCard = {
         input: 12,
         output: 12,
       },
-      tokens: 4096,
     },
     {
+      contextWindowTokens: 8192,
       description: '标准版模型，8K上下文长度，高响应速度',
       displayName: 'SenseChat Character',
       id: 'SenseChat-Character',
@@ -103,9 +104,9 @@ const SenseNova: ModelProviderCard = {
         input: 12,
         output: 12,
       },
-      tokens: 8192,
     },
     {
+      contextWindowTokens: 32_768,
       description: '高级版模型，32K上下文长度，能力全面提升，支持中/英文对话',
       displayName: 'SenseChat Character Pro',
       id: 'SenseChat-Character-Pro',
@@ -114,7 +115,6 @@ const SenseNova: ModelProviderCard = {
         input: 15,
         output: 15,
       },
-      tokens: 32_768,
     },
   ],
   checkModel: 'SenseChat-Turbo',