npm - @lobehub/lobehub - Versions diffs - 2.1.3 → 2.1.4 - Mend

@lobehub/lobehub 2.1.3 → 2.1.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (129)

package/.env.example +0 -3
package/.env.example.development +0 -3
package/CHANGELOG.md +34 -0
package/changelog/v2.json +9 -0
package/docker-compose/deploy/.env.example +3 -1
package/docker-compose/deploy/.env.zh-CN.example +4 -1
package/docker-compose/local/.env.example +0 -1
package/docker-compose/local/.env.zh-CN.example +0 -1
package/docker-compose/local/grafana/.env.example +0 -1
package/docker-compose/local/grafana/.env.zh-CN.example +0 -1
package/docker-compose/local/logto/docker-compose.yml +0 -1
package/docker-compose/local/zitadel/.env.example +1 -2
package/docker-compose/local/zitadel/.env.zh-CN.example +1 -2
package/docker-compose/production/grafana/.env.example +0 -1
package/docker-compose/production/grafana/.env.zh-CN.example +0 -1
package/docker-compose/production/logto/.env.example +0 -2
package/docker-compose/production/logto/.env.zh-CN.example +0 -2
package/docker-compose/production/zitadel/.env.example +0 -2
package/docker-compose/production/zitadel/.env.zh-CN.example +0 -2
package/docker-compose/setup.sh +16 -2
package/docs/development/basic/folder-structure.mdx +23 -14
package/docs/development/basic/folder-structure.zh-CN.mdx +23 -14
package/docs/development/basic/work-with-server-side-database.mdx +0 -1
package/docs/development/basic/work-with-server-side-database.zh-CN.mdx +0 -1
package/docs/development/start.mdx +19 -12
package/docs/development/start.zh-CN.mdx +19 -12
package/docs/self-hosting/advanced/s3/cloudflare-r2.mdx +0 -5
package/docs/self-hosting/advanced/s3/cloudflare-r2.zh-CN.mdx +0 -5
package/docs/self-hosting/advanced/s3/rustfs.mdx +0 -2
package/docs/self-hosting/advanced/s3/rustfs.zh-CN.mdx +0 -2
package/docs/self-hosting/advanced/s3/tencent-cloud.mdx +0 -1
package/docs/self-hosting/advanced/s3/tencent-cloud.zh-CN.mdx +0 -2
package/docs/self-hosting/advanced/s3.mdx +0 -9
package/docs/self-hosting/advanced/s3.zh-CN.mdx +0 -8
package/docs/self-hosting/environment-variables/s3.mdx +0 -7
package/docs/self-hosting/environment-variables/s3.zh-CN.mdx +0 -7
package/docs/self-hosting/platform/docker-compose.mdx +0 -1
package/docs/self-hosting/platform/docker-compose.zh-CN.mdx +0 -1
package/docs/self-hosting/platform/docker.mdx +5 -3
package/docs/self-hosting/platform/docker.zh-CN.mdx +5 -4
package/docs/self-hosting/platform/dokploy.mdx +0 -2
package/docs/self-hosting/platform/dokploy.zh-CN.mdx +0 -2
package/docs/self-hosting/platform/vercel.mdx +0 -7
package/docs/self-hosting/platform/vercel.zh-CN.mdx +0 -7
package/e2e/src/steps/home/sidebarAgent.steps.ts +56 -24
package/locales/ar/authError.json +1 -0
package/locales/ar/models.json +25 -22
package/locales/ar/providers.json +0 -1
package/locales/ar/setting.json +16 -0
package/locales/bg-BG/authError.json +1 -0
package/locales/bg-BG/models.json +18 -21
package/locales/bg-BG/providers.json +0 -1
package/locales/bg-BG/setting.json +16 -0
package/locales/de-DE/authError.json +1 -0
package/locales/de-DE/models.json +20 -20
package/locales/de-DE/providers.json +0 -1
package/locales/de-DE/setting.json +16 -0
package/locales/en-US/models.json +22 -22
package/locales/en-US/providers.json +0 -1
package/locales/es-ES/authError.json +1 -0
package/locales/es-ES/models.json +84 -20
package/locales/es-ES/providers.json +0 -1
package/locales/es-ES/setting.json +16 -0
package/locales/fa-IR/authError.json +1 -0
package/locales/fa-IR/models.json +43 -20
package/locales/fa-IR/providers.json +0 -1
package/locales/fa-IR/setting.json +16 -0
package/locales/fr-FR/authError.json +1 -0
package/locales/fr-FR/models.json +19 -21
package/locales/fr-FR/providers.json +0 -1
package/locales/fr-FR/setting.json +16 -0
package/locales/it-IT/authError.json +1 -0
package/locales/it-IT/models.json +17 -19
package/locales/it-IT/providers.json +0 -1
package/locales/it-IT/setting.json +16 -0
package/locales/ja-JP/authError.json +1 -0
package/locales/ja-JP/models.json +43 -22
package/locales/ja-JP/providers.json +0 -1
package/locales/ja-JP/setting.json +16 -0
package/locales/ko-KR/authError.json +1 -0
package/locales/ko-KR/models.json +41 -20
package/locales/ko-KR/providers.json +0 -1
package/locales/ko-KR/setting.json +16 -0
package/locales/nl-NL/authError.json +1 -0
package/locales/nl-NL/models.json +48 -20
package/locales/nl-NL/providers.json +0 -1
package/locales/nl-NL/setting.json +16 -0
package/locales/pl-PL/authError.json +1 -0
package/locales/pl-PL/models.json +19 -22
package/locales/pl-PL/providers.json +0 -1
package/locales/pl-PL/setting.json +16 -0
package/locales/pt-BR/authError.json +1 -0
package/locales/pt-BR/models.json +21 -21
package/locales/pt-BR/providers.json +0 -1
package/locales/pt-BR/setting.json +16 -0
package/locales/ru-RU/authError.json +1 -0
package/locales/ru-RU/models.json +23 -20
package/locales/ru-RU/providers.json +0 -1
package/locales/ru-RU/setting.json +16 -0
package/locales/tr-TR/authError.json +1 -0
package/locales/tr-TR/models.json +37 -20
package/locales/tr-TR/providers.json +0 -1
package/locales/tr-TR/setting.json +16 -0
package/locales/vi-VN/authError.json +1 -0
package/locales/vi-VN/models.json +15 -19
package/locales/vi-VN/providers.json +0 -1
package/locales/vi-VN/setting.json +16 -0
package/locales/zh-CN/models.json +20 -20
package/locales/zh-CN/providers.json +0 -1
package/locales/zh-TW/authError.json +1 -0
package/locales/zh-TW/models.json +20 -20
package/locales/zh-TW/providers.json +0 -1
package/locales/zh-TW/setting.json +16 -0
package/package.json +1 -1
package/packages/model-bank/src/aiModels/google.ts +0 -19
package/packages/model-bank/src/aiModels/moonshot.ts +56 -5
package/packages/model-bank/src/aiModels/ollamacloud.ts +14 -0
package/packages/model-bank/src/aiModels/openrouter.ts +0 -14
package/packages/model-bank/src/aiModels/qwen.ts +105 -4
package/packages/model-bank/src/aiModels/siliconcloud.ts +39 -0
package/packages/model-bank/src/aiModels/wenxin.ts +0 -99
package/packages/model-runtime/src/core/contextBuilders/openai.test.ts +24 -0
package/packages/model-runtime/src/core/contextBuilders/openai.ts +22 -5
package/packages/model-runtime/src/core/openaiCompatibleFactory/index.ts +10 -3
package/packages/model-runtime/src/core/streams/google/google-ai.test.ts +54 -13
package/packages/model-runtime/src/core/streams/google/index.ts +1 -4
package/packages/model-runtime/src/providers/moonshot/index.ts +24 -2
package/packages/model-runtime/src/providers/qwen/index.ts +16 -15
package/src/server/routers/lambda/__tests__/integration/aiAgent/execAgent.integration.test.ts +3 -2

package/locales/zh-TW/providers.json CHANGED Viewed

@@ -29,7 +29,6 @@
   "internlm.description": "一個專注於大型模型研究與工具的開源組織，提供高效、易用的平台，讓尖端模型與演算法更易於取得。",
   "jina.description": "Jina AI 成立於 2020 年，是領先的搜尋 AI 公司。其搜尋技術堆疊包含向量模型、重排序器與小型語言模型，打造可靠且高品質的生成式與多模態搜尋應用。",
   "lmstudio.description": "LM Studio 是一款桌面應用程式，可在本機開發與實驗大型語言模型。",
-  "lobehub.description": "LobeHub Cloud 使用官方 API 存取 AI 模型，並以與模型代幣相關的點數（Credits）來計算使用量。",
   "minimax.description": "MiniMax 成立於 2021 年，致力於打造通用 AI，擁有多模態基礎模型，包括兆級參數的 MoE 文本模型、語音模型與視覺模型，並推出如海螺 AI 等應用。",
   "mistral.description": "Mistral 提供先進的通用、專業與研究模型，支援複雜推理、多語言任務與程式碼生成，並支援函式呼叫以實現自訂整合。",
   "modelscope.description": "ModelScope 是阿里雲的模型即服務平台，提供多樣化的 AI 模型與推理服務。",

package/locales/zh-TW/setting.json CHANGED Viewed

@@ -34,11 +34,20 @@
   "agentCronJobs.empty.description": "建立您的第一個排程任務以自動化代理程式",
   "agentCronJobs.empty.title": "尚無排程任務",
   "agentCronJobs.enable": "啟用",
+  "agentCronJobs.form.at": "在",
   "agentCronJobs.form.content.placeholder": "輸入給代理程式的提示或指令",
+  "agentCronJobs.form.every": "每",
+  "agentCronJobs.form.frequency": "頻率",
+  "agentCronJobs.form.hours": "小時",
+  "agentCronJobs.form.maxExecutions": "執行次數上限",
   "agentCronJobs.form.maxExecutions.placeholder": "留空表示無限制",
   "agentCronJobs.form.name.placeholder": "輸入任務名稱",
+  "agentCronJobs.form.time": "時間",
   "agentCronJobs.form.timeRange.end": "結束時間",
   "agentCronJobs.form.timeRange.start": "開始時間",
+  "agentCronJobs.form.times": "次",
+  "agentCronJobs.form.timezone": "時區",
+  "agentCronJobs.form.unlimited": "持續執行",
   "agentCronJobs.form.validation.contentRequired": "任務內容為必填",
   "agentCronJobs.form.validation.invalidTimeRange": "開始時間必須早於結束時間",
   "agentCronJobs.form.validation.nameRequired": "任務名稱為必填",
@@ -83,6 +92,13 @@
   "agentCronJobs.weekday.tuesday": "星期二",
   "agentCronJobs.weekday.wednesday": "星期三",
   "agentCronJobs.weekdays": "平日",
+  "agentCronJobs.weekdays.fri": "週五",
+  "agentCronJobs.weekdays.mon": "週一",
+  "agentCronJobs.weekdays.sat": "週六",
+  "agentCronJobs.weekdays.sun": "週日",
+  "agentCronJobs.weekdays.thu": "週四",
+  "agentCronJobs.weekdays.tue": "週二",
+  "agentCronJobs.weekdays.wed": "週三",
   "agentInfoDescription.basic.avatar": "頭像",
   "agentInfoDescription.basic.description": "描述",
   "agentInfoDescription.basic.name": "名稱",

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@lobehub/lobehub",
-  "version": "2.1.3",
+  "version": "2.1.4",
   "description": "LobeHub - an open-source,comprehensive AI Agent framework that supports speech synthesis, multimodal, and extensible Function Call plugin system. Supports one-click free deployment of your private ChatGPT/LLM web application.",
   "keywords": [
     "framework",

package/packages/model-bank/src/aiModels/google.ts CHANGED Viewed

@@ -651,25 +651,6 @@ const googleChatModels: AIChatModelCard[] = [
     releasedAt: '2025-02-05',
     type: 'chat',
   },
-  {
-    abilities: {
-      imageOutput: true,
-      vision: true,
-    },
-    contextWindowTokens: 1_048_576 + 8192,
-    description: 'A Gemini 2.0 Flash variant optimized for cost efficiency and low latency.',
-    displayName: 'Gemini 2.0 Flash Exp',
-    id: 'gemini-2.0-flash-exp',
-    maxOutput: 8192,
-    pricing: {
-      units: [
-        { name: 'textInput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-        { name: 'textOutput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-      ],
-    },
-    releasedAt: '2025-02-05',
-    type: 'chat',
-  },
   {
     abilities: {
       vision: true,

package/packages/model-bank/src/aiModels/moonshot.ts CHANGED Viewed

@@ -2,6 +2,34 @@ import { AIChatModelCard } from '../types/aiModel';
 // https://platform.moonshot.cn/docs/pricing/chat
 const moonshotChatModels: AIChatModelCard[] = [
+  {
+    abilities: {
+      functionCall: true,
+      reasoning: true,
+      structuredOutput: true,
+      vision: true,
+    },
+    contextWindowTokens: 262_144,
+    description:
+      'Kimi K2.5 is Kimi\'s most versatile model to date, featuring a native multimodal architecture that supports both vision and text inputs, "thinking" and "non-thinking" modes, and both conversational and agent tasks.',
+    displayName: 'Kimi K2.5',
+    enabled: true,
+    id: 'kimi-k2.5',
+    maxOutput: 32_768,
+    pricing: {
+      currency: 'CNY',
+      units: [
+        { name: 'textInput_cacheRead', rate: 0.7, strategy: 'fixed', unit: 'millionTokens' },
+        { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
+        { name: 'textOutput', rate: 21, strategy: 'fixed', unit: 'millionTokens' },
+      ],
+    },
+    releasedAt: '2026-01-27',
+    settings: {
+      extendParams: ['enableReasoning'],
+    },
+    type: 'chat',
+  },
   {
     abilities: {
       functionCall: true,
@@ -12,7 +40,6 @@ const moonshotChatModels: AIChatModelCard[] = [
     description:
       'K2 long-thinking model with 256k context, supporting multi-step tool use and reasoning for complex problems.',
     displayName: 'Kimi K2 Thinking',
-    enabled: true,
     id: 'kimi-k2-thinking',
     maxOutput: 65_536,
     pricing: {
@@ -58,7 +85,6 @@ const moonshotChatModels: AIChatModelCard[] = [
     description:
       'kimi-k2-0905-preview offers a 256k context window, stronger agentic coding, better front-end code quality, and improved context understanding.',
     displayName: 'Kimi K2 0905',
-    enabled: true,
     id: 'kimi-k2-0905-preview',
     pricing: {
       currency: 'CNY',
@@ -126,8 +152,32 @@ const moonshotChatModels: AIChatModelCard[] = [
       currency: 'CNY',
       units: [
         { name: 'textInput_cacheRead', rate: 1, strategy: 'fixed', unit: 'millionTokens' },
-        { name: 'textInput', rate: 10, strategy: 'fixed', unit: 'millionTokens' },
-        { name: 'textOutput', rate: 30, strategy: 'fixed', unit: 'millionTokens' },
+        {
+          lookup: {
+            prices: {
+              '[0, 0.008_192]': 2,
+              '[0.008_193, 0.032_768]': 5,
+              '[0.032_769, 0.131_072]': 10,
+            },
+            pricingParams: ['textInput'],
+          },
+          name: 'textInput',
+          strategy: 'lookup',
+          unit: 'millionTokens',
+        },
+        {
+          lookup: {
+            prices: {
+              '[0, 0.008_192]': 10,
+              '[0.008_193, 0.032_768]': 20,
+              '[0.032_769, 0.131_072]': 30,
+            },
+            pricingParams: ['textInput'],
+          },
+          name: 'textOutput',
+          strategy: 'lookup',
+          unit: 'millionTokens',
+        },
       ],
     },
     releasedAt: '2025-02-17',
@@ -138,7 +188,8 @@ const moonshotChatModels: AIChatModelCard[] = [
       functionCall: true,
     },
     contextWindowTokens: 131_072,
-    description: 'Moonshot V1 Auto selects the appropriate model based on current context token usage.',
+    description:
+      'Moonshot V1 Auto selects the appropriate model based on current context token usage.',
     displayName: 'Moonshot V1 Auto',
     id: 'moonshot-v1-auto',
     pricing: {

package/packages/model-bank/src/aiModels/ollamacloud.ts CHANGED Viewed

@@ -1,6 +1,20 @@
 import { AIChatModelCard } from '../types/aiModel';
 const ollamaCloudModels: AIChatModelCard[] = [
+  {
+    abilities: {
+      functionCall: true,
+      reasoning: true,
+      vision: true,
+    },
+    contextWindowTokens: 262_144,
+    description:
+      'Kimi K2.5 is an open-source, native multimodal agentic model that seamlessly integrates vision and language understanding with advanced agentic capabilities, instant and thinking modes, as well as conversational and agentic paradigms.',
+    displayName: 'Kimi K2.5',
+    enabled: true,
+    id: 'kimi-k2.5',
+    type: 'chat',
+  },
   {
     abilities: {
       functionCall: true,

package/packages/model-bank/src/aiModels/openrouter.ts CHANGED Viewed

@@ -1079,20 +1079,6 @@ const openrouterChatModels: AIChatModelCard[] = [
     id: 'google/gemma-2-9b-it:free',
     type: 'chat',
   },
-  {
-    abilities: {
-      functionCall: true,
-      vision: true,
-    },
-    contextWindowTokens: 1_048_576 + 8192,
-    description:
-      'Gemini 2.0 Flash Experimental is Google’s latest experimental multimodal AI model with quality improvements over prior versions, especially in world knowledge, code, and long context.',
-    displayName: 'Gemini 2.0 Flash Experimental (Free)',
-    id: 'google/gemini-2.0-flash-exp:free',
-    maxOutput: 8192,
-    releasedAt: '2024-12-11',
-    type: 'chat',
-  },
 ];
 export const allModels = [...openrouterChatModels];

package/packages/model-bank/src/aiModels/qwen.ts CHANGED Viewed

@@ -3,6 +3,55 @@ import { AIChatModelCard, AIImageModelCard } from '../types/aiModel';
 // https://help.aliyun.com/zh/model-studio/models?spm=a2c4g.11186623
 const qwenChatModels: AIChatModelCard[] = [
+  {
+    abilities: {
+      functionCall: true,
+      reasoning: true,
+      vision: true,
+    },
+    contextWindowTokens: 262_144,
+    description:
+      'Kimi K2.5 is the most capable Kimi model, delivering open-source SOTA in agent tasks, coding, and vision understanding. It supports multimodal inputs and both thinking and non-thinking modes.',
+    displayName: 'Kimi K2.5',
+    id: 'kimi-k2.5',
+    maxOutput: 32_768,
+    organization: 'Qwen',
+    pricing: {
+      currency: 'CNY',
+      units: [
+        { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
+        { name: 'textOutput', rate: 21, strategy: 'fixed', unit: 'millionTokens' },
+      ],
+    },
+    settings: {
+      extendParams: ['enableReasoning', 'reasoningBudgetToken'],
+    },
+    type: 'chat',
+  },
+  {
+    abilities: {
+      functionCall: true,
+      reasoning: true,
+      search: true,
+    },
+    contextWindowTokens: 204_800,
+    description:
+      'MiniMax-M2.1 is a flagship open-source large model from MiniMax, focusing on solving complex real-world tasks. Its core strengths are multi-language programming capabilities and the ability to solve complex tasks as an Agent.',
+    displayName: 'MiniMax-M2.1',
+    id: 'MiniMax-M2.1',
+    maxOutput: 32_768,
+    pricing: {
+      currency: 'CNY',
+      units: [
+        { name: 'textInput', rate: 2.1, strategy: 'fixed', unit: 'millionTokens' },
+        { name: 'textOutput', rate: 8.4, strategy: 'fixed', unit: 'millionTokens' },
+      ],
+    },
+    settings: {
+      searchImpl: 'params',
+    },
+    type: 'chat',
+  },
   {
     abilities: {
       reasoning: true,
@@ -61,7 +110,7 @@ const qwenChatModels: AIChatModelCard[] = [
       vision: true,
     },
     config: {
-      deploymentName: 'qwen3-vl-flash-2025-10-15',
+      deploymentName: 'qwen3-vl-flash-2026-01-22',
     },
     contextWindowTokens: 262_144,
     description:
@@ -101,7 +150,6 @@ const qwenChatModels: AIChatModelCard[] = [
         },
       ],
     },
-    releasedAt: '2025-10-15',
     settings: {
       extendParams: ['enableReasoning', 'reasoningBudgetToken'],
     },
@@ -1019,7 +1067,8 @@ const qwenChatModels: AIChatModelCard[] = [
       deploymentName: 'qwen-plus-2025-12-01',
     },
     contextWindowTokens: 1_000_000,
-    description: 'Enhanced ultra-large Qwen model supporting Chinese, English, and other languages.',
+    description:
+      'Enhanced ultra-large Qwen model supporting Chinese, English, and other languages.',
     displayName: 'Qwen Plus',
     enabled: true,
     id: 'qwen-plus',
@@ -1078,6 +1127,57 @@ const qwenChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
+  {
+    abilities: {
+      functionCall: true,
+      search: true,
+      reasoning: true,
+    },
+    contextWindowTokens: 262_144,
+    description:
+      'Qwen3 Max models deliver large gains over the 2.5 series in general ability, Chinese/English understanding, complex instruction following, subjective open tasks, multilingual ability, and tool use, with fewer hallucinations. The latest qwen3-max improves agentic programming and tool use over qwen3-max-preview. This release reaches field SOTA and targets more complex agent needs.',
+    displayName: 'Qwen3 Max Thinking',
+    id: 'qwen3-max-2026-01-23',
+    maxOutput: 65_536,
+    organization: 'Qwen',
+    pricing: {
+      currency: 'CNY',
+      units: [
+        {
+          lookup: {
+            prices: {
+              '[0, 0.032]': 2.5,
+              '[0.032, 0.128]': 4,
+              '[0.128, 0.252]': 7,
+            },
+            pricingParams: ['textInputRange'],
+          },
+          name: 'textInput',
+          strategy: 'lookup',
+          unit: 'millionTokens',
+        },
+        {
+          lookup: {
+            prices: {
+              '[0, 0.032]': 10,
+              '[0.032, 0.128]': 16,
+              '[0.128, 0.252]': 28,
+            },
+            pricingParams: ['textInputRange'],
+          },
+          name: 'textOutput',
+          strategy: 'lookup',
+          unit: 'millionTokens',
+        },
+      ],
+    },
+    releasedAt: '2026-01-23',
+    settings: {
+      extendParams: ['enableReasoning', 'reasoningBudgetToken'],
+      searchImpl: 'params',
+    },
+    type: 'chat',
+  },
   {
     abilities: {
       functionCall: true,
@@ -1477,7 +1577,8 @@ const qwenChatModels: AIChatModelCard[] = [
       vision: true,
     },
     contextWindowTokens: 131_072,
-    description: 'Qwen3 VL 8B non-thinking mode (Instruct) for standard multimodal generation and recognition.',
+    description:
+      'Qwen3 VL 8B non-thinking mode (Instruct) for standard multimodal generation and recognition.',
     displayName: 'Qwen3 VL 8B Instruct',
     id: 'qwen3-vl-8b-instruct',
     maxOutput: 32_768,

package/packages/model-bank/src/aiModels/siliconcloud.ts CHANGED Viewed

@@ -2,6 +2,45 @@ import { AIChatModelCard, AIImageModelCard } from '../types/aiModel';
 // https://siliconflow.cn/zh-cn/models
 const siliconcloudChatModels: AIChatModelCard[] = [
+  {
+    abilities: {
+      functionCall: true,
+      reasoning: true,
+      vision: true,
+    },
+    contextWindowTokens: 262_144,
+    description:
+      'Kimi K2.5 is an open-source native multimodal agent model, built on Kimi-K2-Base, trained on approximately 1.5 trillion mixed vision and text tokens. The model adopts an MoE architecture with 1T total parameters and 32B active parameters, supporting a 256K context window, seamlessly integrating vision and language understanding capabilities.',
+    displayName: 'Kimi-K2.5 (Pro)',
+    id: 'Pro/moonshotai/Kimi-K2.5',
+    pricing: {
+      currency: 'CNY',
+      units: [
+        { name: 'textInput', rate: 4, strategy: 'fixed', unit: 'millionTokens' },
+        { name: 'textOutput', rate: 21, strategy: 'fixed', unit: 'millionTokens' },
+      ],
+    },
+    releasedAt: '2026-01-27',
+    type: 'chat',
+  },
+  {
+    abilities: {
+      vision: true,
+    },
+    description:
+      'PaddleOCR-VL-1.5 is an upgraded version of the PaddleOCR-VL series, achieving 94.5% accuracy on the OmniDocBench v1.5 document parsing benchmark, surpassing leading general large models and specialized document parsing models. It innovatively supports irregular bounding box localization for document elements, handling scanned, tilted, and screen-captured images effectively.',
+    displayName: 'PaddleOCR-VL 1.5',
+    id: 'PaddlePaddle/PaddleOCR-VL-1.5',
+    pricing: {
+      currency: 'CNY',
+      units: [
+        { name: 'textInput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
+        { name: 'textOutput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
+      ],
+    },
+    releasedAt: '2026-01-29',
+    type: 'chat',
+  },
   {
     abilities: {
       functionCall: true,

package/packages/model-bank/src/aiModels/wenxin.ts CHANGED Viewed

@@ -191,37 +191,6 @@ const wenxinChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
-  {
-    contextWindowTokens: 131_072,
-    description:
-      'ERNIE Speed 128K is a no-I/O-fee model for long-text understanding and large-scale trials.',
-    displayName: 'ERNIE Speed 128K',
-    id: 'ernie-speed-128k',
-    maxOutput: 4096,
-    pricing: {
-      currency: 'CNY',
-      units: [
-        { name: 'textInput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-        { name: 'textOutput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-      ],
-    },
-    type: 'chat',
-  },
-  {
-    contextWindowTokens: 8192,
-    description: 'ERNIE Speed 8K is a free, fast model for daily chat and light text tasks.',
-    displayName: 'ERNIE Speed 8K',
-    id: 'ernie-speed-8k',
-    maxOutput: 2048,
-    pricing: {
-      currency: 'CNY',
-      units: [
-        { name: 'textInput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-        { name: 'textOutput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-      ],
-    },
-    type: 'chat',
-  },
   {
     contextWindowTokens: 131_072,
     description:
@@ -238,22 +207,6 @@ const wenxinChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
-  {
-    contextWindowTokens: 8192,
-    description:
-      'ERNIE Lite 8K is a lightweight general model for cost-sensitive daily QA and content generation.',
-    displayName: 'ERNIE Lite 8K',
-    id: 'ernie-lite-8k',
-    maxOutput: 2048,
-    pricing: {
-      currency: 'CNY',
-      units: [
-        { name: 'textInput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-        { name: 'textOutput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-      ],
-    },
-    type: 'chat',
-  },
   {
     abilities: {
       functionCall: true,
@@ -273,22 +226,6 @@ const wenxinChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
-  {
-    contextWindowTokens: 8192,
-    description:
-      'ERNIE Tiny 8K is ultra-lightweight for simple QA, classification, and low-cost inference.',
-    displayName: 'ERNIE Tiny 8K',
-    id: 'ernie-tiny-8k',
-    maxOutput: 2048,
-    pricing: {
-      currency: 'CNY',
-      units: [
-        { name: 'textInput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-        { name: 'textOutput', rate: 0, strategy: 'fixed', unit: 'millionTokens' },
-      ],
-    },
-    type: 'chat',
-  },
   {
     contextWindowTokens: 8192,
     description:
@@ -486,24 +423,6 @@ const wenxinChatModels: AIChatModelCard[] = [
     maxOutput: 2048,
     type: 'chat',
   },
-  {
-    contextWindowTokens: 32_768,
-    description:
-      'Qianfan Agent Speed 32K is a high-throughput agent model for large-scale, multi-task agent apps.',
-    displayName: 'Qianfan Agent Speed 32K',
-    id: 'qianfan-agent-speed-32k',
-    maxOutput: 4096,
-    type: 'chat',
-  },
-  {
-    contextWindowTokens: 8192,
-    description:
-      'Qianfan Agent Speed 8K is a high-concurrency agent model for short-to-mid conversations and fast response.',
-    displayName: 'Qianfan Agent Speed 8K',
-    id: 'qianfan-agent-speed-8k',
-    maxOutput: 2048,
-    type: 'chat',
-  },
   {
     abilities: {
       vision: true,
@@ -1616,24 +1535,6 @@ const wenxinChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
-  {
-    contextWindowTokens: 32_768,
-    description: 'Qwen3 235B A22B is a general large model for complex tasks.',
-    displayName: 'Qwen3 235B A22B',
-    id: 'qwen3-235b-a22b',
-    maxOutput: 8192,
-    pricing: {
-      currency: 'CNY',
-      units: [
-        { name: 'textInput', rate: 2, strategy: 'fixed', unit: 'millionTokens' },
-        { name: 'textOutput', rate: 8, strategy: 'fixed', unit: 'millionTokens' },
-      ],
-    },
-    settings: {
-      extendParams: ['enableReasoning', 'reasoningBudgetToken'],
-    },
-    type: 'chat',
-  },
   {
     contextWindowTokens: 32_768,
     description: 'Qwen3 30B A3B is a mid-large general model balancing cost and quality.',

package/packages/model-runtime/src/core/contextBuilders/openai.test.ts CHANGED Viewed

@@ -73,6 +73,30 @@ describe('convertMessageContent', () => {
     expect(result).toEqual(content);
     expect(imageUrlToBase64).not.toHaveBeenCalled();
   });
+  it('should convert image URL when forceImageBase64 is true', async () => {
+    process.env.LLM_VISION_IMAGE_USE_BASE64 = undefined;
+    const content = {
+      type: 'image_url',
+      image_url: { url: 'https://example.com/image.jpg' },
+    } as OpenAI.ChatCompletionContentPart;
+    vi.mocked(parseDataUri).mockReturnValue({ type: 'url', base64: null, mimeType: null });
+    vi.mocked(imageUrlToBase64).mockResolvedValue({
+      base64: 'forcedBase64',
+      mimeType: 'image/jpeg',
+    });
+    const result = await convertMessageContent(content, { forceImageBase64: true });
+    expect(result).toEqual({
+      type: 'image_url',
+      image_url: { url: 'data:image/jpeg;base64,forcedBase64' },
+    });
+    expect(imageUrlToBase64).toHaveBeenCalledWith('https://example.com/image.jpg');
+  });
 });
 describe('convertOpenAIMessages', () => {

package/packages/model-runtime/src/core/contextBuilders/openai.ts CHANGED Viewed

@@ -5,13 +5,21 @@ import { disableStreamModels, systemToUserModels } from '../../const/models';
 import { ChatStreamPayload, OpenAIChatMessage } from '../../types';
 import { parseDataUri } from '../../utils/uriParser';
+type ConvertMessageContentOptions = {
+  forceImageBase64?: boolean;
+};
 export const convertMessageContent = async (
   content: OpenAI.ChatCompletionContentPart,
+  options?: ConvertMessageContentOptions,
 ): Promise<OpenAI.ChatCompletionContentPart> => {
   if (content.type === 'image_url') {
     const { type } = parseDataUri(content.image_url.url);
-    if (type === 'url' && process.env.LLM_VISION_IMAGE_USE_BASE64 === '1') {
+    const shouldUseBase64 =
+      options?.forceImageBase64 || process.env.LLM_VISION_IMAGE_USE_BASE64 === '1';
+    if (type === 'url' && shouldUseBase64) {
       const { base64, mimeType } = await imageUrlToBase64(content.image_url.url);
       return {
@@ -24,7 +32,10 @@ export const convertMessageContent = async (
   return content;
 };
-export const convertOpenAIMessages = async (messages: OpenAI.ChatCompletionMessageParam[]) => {
+export const convertOpenAIMessages = async (
+  messages: OpenAI.ChatCompletionMessageParam[],
+  options?: ConvertMessageContentOptions,
+) => {
   return (await Promise.all(
     messages.map(async (message) => {
       const msg = message as any;
@@ -37,7 +48,7 @@ export const convertOpenAIMessages = async (messages: OpenAI.ChatCompletionMessa
             ? message.content
             : await Promise.all(
                 (message.content || []).map((c) =>
-                  convertMessageContent(c as OpenAI.ChatCompletionContentPart),
+                  convertMessageContent(c as OpenAI.ChatCompletionContentPart, options),
                 ),
               ),
         role: msg.role,
@@ -59,7 +70,10 @@ export const convertOpenAIMessages = async (messages: OpenAI.ChatCompletionMessa
   )) as OpenAI.ChatCompletionMessageParam[];
 };
-export const convertOpenAIResponseInputs = async (messages: OpenAIChatMessage[]) => {
+export const convertOpenAIResponseInputs = async (
+  messages: OpenAIChatMessage[],
+  options?: ConvertMessageContentOptions,
+) => {
   let input: OpenAI.Responses.ResponseInputItem[] = [];
   await Promise.all(
     messages.map(async (message) => {
@@ -113,7 +127,10 @@ export const convertOpenAIResponseInputs = async (messages: OpenAIChatMessage[])
                     return { ...c, type: 'input_text' };
                   }
-                  const image = await convertMessageContent(c as OpenAI.ChatCompletionContentPart);
+                  const image = await convertMessageContent(
+                    c as OpenAI.ChatCompletionContentPart,
+                    options,
+                  );
                   return {
                     image_url: (image as OpenAI.ChatCompletionContentPartImage).image_url?.url,
                     type: 'input_image',