@lobehub/chat 1.74.11 → 1.75.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (46)
  1. package/CHANGELOG.md +35 -0
  2. package/Dockerfile +2 -0
  3. package/Dockerfile.database +2 -0
  4. package/Dockerfile.pglite +2 -0
  5. package/changelog/v1.json +12 -0
  6. package/locales/ar/models.json +9 -0
  7. package/locales/bg-BG/models.json +9 -0
  8. package/locales/de-DE/models.json +9 -0
  9. package/locales/en-US/models.json +9 -0
  10. package/locales/es-ES/models.json +9 -0
  11. package/locales/fa-IR/models.json +9 -0
  12. package/locales/fr-FR/models.json +9 -0
  13. package/locales/it-IT/models.json +9 -0
  14. package/locales/ja-JP/models.json +9 -0
  15. package/locales/ko-KR/models.json +9 -0
  16. package/locales/nl-NL/models.json +9 -0
  17. package/locales/pl-PL/models.json +9 -0
  18. package/locales/pt-BR/models.json +9 -0
  19. package/locales/ru-RU/models.json +9 -0
  20. package/locales/tr-TR/models.json +9 -0
  21. package/locales/vi-VN/models.json +9 -0
  22. package/locales/zh-CN/models.json +9 -0
  23. package/locales/zh-TW/models.json +9 -0
  24. package/package.json +1 -1
  25. package/packages/web-crawler/src/crawImpl/__tests__/browserless.test.ts +41 -0
  26. package/packages/web-crawler/src/crawImpl/search1api.ts +2 -2
  27. package/src/app/[variants]/(main)/chat/(workspace)/@conversation/features/ChatList/ChatItem/index.tsx +1 -1
  28. package/src/app/[variants]/(main)/settings/llm/ProviderList/providers.tsx +2 -0
  29. package/src/config/aiModels/google.ts +26 -0
  30. package/src/config/aiModels/index.ts +3 -0
  31. package/src/config/aiModels/xinference.ts +171 -0
  32. package/src/config/llm.ts +6 -0
  33. package/src/config/modelProviders/index.ts +4 -0
  34. package/src/config/modelProviders/xinference.ts +18 -0
  35. package/src/features/Conversation/components/AutoScroll.tsx +2 -1
  36. package/src/features/Conversation/components/ChatItem/ActionsBar.tsx +7 -2
  37. package/src/features/Conversation/components/ChatItem/index.tsx +6 -1
  38. package/src/features/Conversation/components/VirtualizedList/VirtuosoContext.ts +4 -0
  39. package/src/features/Conversation/components/VirtualizedList/index.tsx +34 -31
  40. package/src/features/Portal/Thread/Chat/ChatItem.tsx +1 -1
  41. package/src/libs/agent-runtime/runtimeMap.ts +2 -0
  42. package/src/libs/agent-runtime/types/type.ts +1 -0
  43. package/src/libs/agent-runtime/xinference/index.ts +53 -0
  44. package/src/store/chat/slices/message/selectors.test.ts +42 -0
  45. package/src/store/chat/slices/message/selectors.ts +4 -0
  46. package/src/types/user/settings/keyVaults.ts +1 -0
package/src/app/[variants]/(main)/chat/(workspace)/@conversation/features/ChatList/ChatItem/index.tsx CHANGED
@@ -64,7 +64,7 @@ const MainChatItem = memo<ThreadChatItemProps>(({ id, index }) => {
 
   const placement = displayMode === 'chat' && userRole === 'user' ? 'end' : 'start';
 
- const actionBar = useMemo(() => <ActionsBar id={id} />, [id]);
+ const actionBar = useMemo(() => <ActionsBar id={id} index={index} />, [id]);
 
   return (
     <ChatItem
package/src/app/[variants]/(main)/settings/llm/ProviderList/providers.tsx CHANGED
@@ -37,6 +37,7 @@ import {
   VLLMProviderCard,
   WenxinProviderCard,
   XAIProviderCard,
+ XinferenceProviderCard,
   ZeroOneProviderCard,
   ZhiPuProviderCard,
 } from '@/config/modelProviders';
@@ -65,6 +66,7 @@ export const useProviderList = (): ProviderItem[] => {
   AzureProvider,
   OllamaProvider,
   VLLMProviderCard,
+ XinferenceProviderCard,
   AnthropicProviderCard,
   BedrockProvider,
   GoogleProviderCard,
package/src/config/aiModels/google.ts CHANGED
@@ -26,6 +26,32 @@ const googleChatModels: AIChatModelCard[] = [
     },
     type: 'chat',
   },
+ {
+   abilities: {
+     functionCall: true,
+     reasoning: true,
+     search: true,
+     vision: true,
+   },
+   contextWindowTokens: 1_048_576 + 8192,
+   description:
+     'Gemini 2.5 Pro Experimental is the most advanced thinking model from Google, able to reason over complex problems in code, math, and STEM, and to analyze large datasets, codebases, and documents using long context.',
+   displayName: 'Gemini 2.5 Pro Experimental 03-25',
+   enabled: true,
+   id: 'gemini-2.5-pro-exp-03-25',
+   maxOutput: 8192,
+   pricing: {
+     cachedInput: 0,
+     input: 0,
+     output: 0,
+   },
+   releasedAt: '2025-03-25',
+   settings: {
+     searchImpl: 'params',
+     searchProvider: 'google',
+   },
+   type: 'chat',
+ },
   {
     abilities: {
       functionCall: true,
package/src/config/aiModels/index.ts CHANGED
@@ -49,6 +49,7 @@ import { default as vllm } from './vllm';
 import { default as volcengine } from './volcengine';
 import { default as wenxin } from './wenxin';
 import { default as xai } from './xai';
+ import { default as xinference } from './xinference';
 import { default as zeroone } from './zeroone';
 import { default as zhipu } from './zhipu';
 
@@ -121,6 +122,7 @@ export const LOBE_DEFAULT_MODEL_LIST = buildDefaultModelList({
   volcengine,
   wenxin,
   xai,
+  xinference,
   zeroone,
   zhipu,
 });
@@ -174,5 +176,6 @@ export { default as vllm } from './vllm';
 export { default as volcengine } from './volcengine';
 export { default as wenxin } from './wenxin';
 export { default as xai } from './xai';
+ export { default as xinference } from './xinference';
 export { default as zeroone } from './zeroone';
 export { default as zhipu } from './zhipu';
package/src/config/aiModels/xinference.ts ADDED
@@ -0,0 +1,171 @@
+ import { AIChatModelCard } from '@/types/aiModel';
+
+ const xinferenceChatModels: AIChatModelCard[] = [
+   {
+     abilities: {
+       functionCall: true,
+     },
+     contextWindowTokens: 163_840,
+     description:
+       'DeepSeek-V3 is a powerful Mixture-of-Experts (MoE) language model with 671B total parameters, of which 37B are activated per token.',
+     displayName: 'DeepSeek V3',
+     enabled: true,
+     id: 'deepseek-v3',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       reasoning: true,
+     },
+     contextWindowTokens: 163_840,
+     description:
+       'DeepSeek-R1 incorporates cold-start data before reinforcement learning (RL) and performs on par with OpenAI-o1 on math, code, and reasoning tasks.',
+     displayName: 'DeepSeek R1',
+     enabled: true,
+     id: 'deepseek-r1',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       reasoning: true,
+     },
+     contextWindowTokens: 131_072,
+     description:
+       'deepseek-r1-distill-llama is a model distilled from DeepSeek-R1, based on Llama.',
+     displayName: 'DeepSeek R1 Distill Llama',
+     enabled: true,
+     id: 'deepseek-r1-distill-llama',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       reasoning: true,
+     },
+     contextWindowTokens: 131_072,
+     description:
+       'deepseek-r1-distill-qwen is a model distilled from DeepSeek-R1, based on Qwen.',
+     displayName: 'DeepSeek R1 Distill Qwen',
+     enabled: true,
+     id: 'deepseek-r1-distill-qwen',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       reasoning: true,
+     },
+     contextWindowTokens: 32_768,
+     description:
+       'QwQ is the reasoning model of the Qwen series. Unlike conventional instruction-tuned models, QwQ can think and reason, achieving significantly better performance on downstream tasks, especially hard problems. QwQ-32B is a medium-sized reasoning model whose performance is competitive with state-of-the-art reasoning models such as DeepSeek-R1 and o1-mini.',
+     displayName: 'QwQ 32B',
+     enabled: true,
+     id: 'qwq-32b',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       reasoning: true,
+       vision: true,
+     },
+     contextWindowTokens: 32_768,
+     description:
+       'QVQ-72B-Preview is an experimental research model developed by the Qwen team, focused on improving visual reasoning.',
+     displayName: 'QVQ 72B Preview',
+     enabled: true,
+     id: 'qvq-72b-preview',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       functionCall: true,
+     },
+     contextWindowTokens: 32_768,
+     description:
+       'Qwen2.5 is the latest series of Qwen large language models, released as a collection of base and instruction-tuned models ranging from 0.5B to 72B parameters.',
+     displayName: 'Qwen2.5 Instruct',
+     enabled: true,
+     id: 'qwen2.5-instruct',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       functionCall: true,
+     },
+     contextWindowTokens: 32_768,
+     description:
+       'Qwen2.5-Coder is the latest code-specific large language model in the Qwen series (formerly known as CodeQwen).',
+     displayName: 'Qwen2.5 Coder Instruct',
+     enabled: true,
+     id: 'qwen2.5-coder-instruct',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       vision: true,
+     },
+     contextWindowTokens: 128_000,
+     description:
+       'Qwen2.5-VL is the latest generation of vision-language models in the Qwen family.',
+     displayName: 'Qwen2.5 VL Instruct',
+     enabled: true,
+     id: 'qwen2.5-vl-instruct',
+     type: 'chat'
+   },
+   {
+     contextWindowTokens: 1_024_000,
+     description:
+       'The Mistral-Nemo-Instruct-2407 large language model (LLM) is an instruction-tuned version of Mistral-Nemo-Base-2407.',
+     displayName: 'Mistral Nemo Instruct',
+     enabled: true,
+     id: 'mistral-nemo-instruct',
+     type: 'chat'
+   },
+   {
+     contextWindowTokens: 131_072,
+     description:
+       'Mistral-Large-Instruct-2407 is an advanced dense large language model (LLM) with 123B parameters and state-of-the-art reasoning, knowledge, and coding capabilities.',
+     displayName: 'Mistral Large Instruct',
+     enabled: true,
+     id: 'mistral-large-instruct',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       functionCall: true,
+     },
+     contextWindowTokens: 131_072,
+     description:
+       'The Llama 3.3 instruction-tuned models are optimized for dialogue use cases and outperform many available open-source chat models on common industry benchmarks.',
+     displayName: 'Llama 3.3 Instruct',
+     enabled: true,
+     id: 'llama-3.3-instruct',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       vision: true,
+     },
+     contextWindowTokens: 163_840,
+     description:
+       'The Llama 3.2-Vision instruction-tuned models are optimized for visual recognition, image reasoning, captioning, and answering general questions about an image.',
+     displayName: 'Llama 3.2 Vision Instruct',
+     enabled: true,
+     id: 'llama-3.2-vision-instruct',
+     type: 'chat'
+   },
+   {
+     abilities: {
+       functionCall: true,
+     },
+     contextWindowTokens: 131_072,
+     description:
+       'The Llama 3.1 instruction-tuned models are optimized for dialogue use cases and outperform many available open-source chat models on common industry benchmarks.',
+     displayName: 'Llama 3.1 Instruct',
+     enabled: true,
+     id: 'llama-3.1-instruct',
+     type: 'chat'
+   },
+ ]
+
+ export const allModels = [...xinferenceChatModels];
+
+ export default allModels;
package/src/config/llm.ts CHANGED
@@ -75,6 +75,9 @@ export const getLLMConfig = () => {
   ENABLED_VLLM: z.boolean(),
   VLLM_API_KEY: z.string().optional(),
 
+ ENABLED_XINFERENCE: z.boolean(),
+ XINFERENCE_API_KEY: z.string().optional(),
+
   ENABLED_QWEN: z.boolean(),
   QWEN_API_KEY: z.string().optional(),
 
@@ -234,6 +237,9 @@ export const getLLMConfig = () => {
   ENABLED_VLLM: !!process.env.VLLM_API_KEY,
   VLLM_API_KEY: process.env.VLLM_API_KEY,
 
+ ENABLED_XINFERENCE: !!process.env.XINFERENCE_API_KEY,
+ XINFERENCE_API_KEY: process.env.XINFERENCE_API_KEY,
+
   ENABLED_QWEN: !!process.env.QWEN_API_KEY,
   QWEN_API_KEY: process.env.QWEN_API_KEY,
 
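Note: per the schema above, the provider's server-side toggle is derived from the key variable alone, so a deployment needs only one line of configuration. A minimal sketch (the variable name comes from this diff; the value is a placeholder):

  # .env — ENABLED_XINFERENCE is computed as !!XINFERENCE_API_KEY
  XINFERENCE_API_KEY=any-non-empty-value
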
package/src/config/modelProviders/index.ts CHANGED
@@ -49,6 +49,7 @@ import VLLMProvider from './vllm';
 import VolcengineProvider from './volcengine';
 import WenxinProvider from './wenxin';
 import XAIProvider from './xai';
+ import XinferenceProvider from './xinference';
 import ZeroOneProvider from './zeroone';
 import ZhiPuProvider from './zhipu';
 
@@ -69,6 +70,7 @@ export const LOBE_DEFAULT_MODEL_LIST: ChatModelCard[] = [
   MoonshotProvider.chatModels,
   OllamaProvider.chatModels,
   VLLMProvider.chatModels,
+  XinferenceProvider.chatModels,
   OpenRouterProvider.chatModels,
   TogetherAIProvider.chatModels,
   FireworksAIProvider.chatModels,
@@ -108,6 +110,7 @@ export const DEFAULT_MODEL_PROVIDER_LIST = [
   AzureAIProvider,
   OllamaProvider,
   VLLMProvider,
+  XinferenceProvider,
   AnthropicProvider,
   BedrockProvider,
   GoogleProvider,
@@ -215,5 +218,6 @@ export { default as VLLMProviderCard } from './vllm';
 export { default as VolcengineProviderCard } from './volcengine';
 export { default as WenxinProviderCard } from './wenxin';
 export { default as XAIProviderCard } from './xai';
+ export { default as XinferenceProviderCard } from './xinference';
 export { default as ZeroOneProviderCard } from './zeroone';
 export { default as ZhiPuProviderCard } from './zhipu';
package/src/config/modelProviders/xinference.ts ADDED
@@ -0,0 +1,18 @@
+ import { ModelProviderCard } from '@/types/llm';
+
+ const Xinference: ModelProviderCard = {
+   chatModels: [],
+   description: 'Xorbits Inference (Xinference) is an open-source platform that simplifies running and integrating a wide range of AI models. With Xinference, you can run inference with any open-source LLM, embedding model, or multimodal model, in the cloud or on-premises, and build powerful AI applications.',
+   id: 'xinference',
+   modelsUrl: 'https://inference.readthedocs.io/zh-cn/latest/models/builtin/index.html',
+   name: 'Xinference',
+   settings: {
+     proxyUrl: {
+       placeholder: 'http://localhost:9997/v1',
+     },
+     sdkType: 'openai',
+   },
+   url: 'https://inference.readthedocs.io/zh-cn/v0.12.3/index.html',
+ };
+
+ export default Xinference;
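Since settings.sdkType is 'openai', the endpoint behind the placeholder speaks the OpenAI wire protocol. A minimal sketch using the official openai npm client (the 'EMPTY' key is an assumption for a local deployment that does not enforce auth):

  import OpenAI from 'openai';

  const client = new OpenAI({
    apiKey: 'EMPTY', // assumption: a local Xinference server typically ignores the key
    baseURL: 'http://localhost:9997/v1', // the placeholder above
  });

  // Lists the models currently launched in Xinference
  const models = await client.models.list();
  console.log(models.data.map((m) => m.id));
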
package/src/features/Conversation/components/AutoScroll.tsx CHANGED
@@ -13,12 +13,13 @@ interface AutoScrollProps {
 const AutoScroll = memo<AutoScrollProps>(({ atBottom, isScrolling, onScrollToBottom }) => {
   const trackVisibility = useChatStore(chatSelectors.isAIGenerating);
   const str = useChatStore(chatSelectors.mainAIChatsMessageString);
+ const reasoningStr = useChatStore(chatSelectors.mainAILatestMessageReasoningContent);
 
   useEffect(() => {
     if (atBottom && trackVisibility && !isScrolling) {
       onScrollToBottom?.('auto');
     }
- }, [atBottom, trackVisibility, str]);
+ }, [atBottom, trackVisibility, str, reasoningStr]);
 
   return <BackBottom onScrollToBottom={() => onScrollToBottom('click')} visible={!atBottom} />;
 });
package/src/features/Conversation/components/ChatItem/ActionsBar.tsx CHANGED
@@ -1,9 +1,10 @@
 import { ActionEvent, ActionIconGroup, type ActionIconGroupProps } from '@lobehub/ui';
 import { App } from 'antd';
 import isEqual from 'fast-deep-equal';
- import { memo, useCallback } from 'react';
+ import { memo, use, useCallback } from 'react';
 import { useTranslation } from 'react-i18next';
 
+ import { VirtuosoContext } from '@/features/Conversation/components/VirtualizedList/VirtuosoContext';
 import { useChatStore } from '@/store/chat';
 import { chatSelectors } from '@/store/chat/selectors';
 import { MessageRoleType } from '@/types/message';
@@ -29,9 +30,10 @@ const ActionsBar = memo<ActionsBarProps>((props) => {
 interface ActionsProps {
   id: string;
   inPortalThread?: boolean;
+   index: number;
 }
 
- const Actions = memo<ActionsProps>(({ id, inPortalThread }) => {
+ const Actions = memo<ActionsProps>(({ id, inPortalThread, index }) => {
   const item = useChatStore(chatSelectors.getMessageById(id), isEqual);
   const { t } = useTranslation('common');
   const [
@@ -58,12 +60,15 @@ const Actions = memo<ActionsProps>(({ id, inPortalThread }) => {
     s.toggleMessageEditing,
   ]);
   const { message } = App.useApp();
+   const virtuosoRef = use(VirtuosoContext);
 
   const handleActionClick = useCallback(
     async (action: ActionEvent) => {
       switch (action.key) {
         case 'edit': {
           toggleMessageEditing(id, true);
+
+           virtuosoRef?.current?.scrollIntoView({ align: 'start', behavior: 'auto', index });
         }
       }
       if (!item) return;
package/src/features/Conversation/components/ChatItem/index.tsx CHANGED
@@ -3,10 +3,11 @@
 import { ChatItem } from '@lobehub/ui';
 import { createStyles } from 'antd-style';
 import isEqual from 'fast-deep-equal';
- import { MouseEventHandler, ReactNode, memo, useCallback, useMemo } from 'react';
+ import { MouseEventHandler, ReactNode, memo, use, useCallback, useMemo } from 'react';
 import { useTranslation } from 'react-i18next';
 import { Flexbox } from 'react-layout-kit';
 
+ import { VirtuosoContext } from '@/features/Conversation/components/VirtualizedList/VirtuosoContext';
 import { useAgentStore } from '@/store/agent';
 import { agentChatConfigSelectors } from '@/store/agent/selectors';
 import { useChatStore } from '@/store/chat';
@@ -64,6 +65,7 @@ const Item = memo<ChatListItemProps>(
     endRender,
     disableEditing,
     inPortalThread = false,
+     index,
   }) => {
     const { t } = useTranslation('common');
     const { styles, cx } = useStyles();
@@ -188,6 +190,7 @@ const Item = memo<ChatListItemProps>(
     );
 
     const onChange = useCallback((value: string) => updateMessageContent(id, value), [id]);
+     const virtuosoRef = use(VirtuosoContext);
 
     const onDoubleClick = useCallback<MouseEventHandler<HTMLDivElement>>(
       (e) => {
@@ -195,6 +198,8 @@
         if (item.id === 'default' || item.error) return;
         if (item.role && ['assistant', 'user'].includes(item.role) && e.altKey) {
           toggleMessageEditing(id, true);
+
+           virtuosoRef?.current?.scrollIntoView({ align: 'start', behavior: 'auto', index });
         }
       },
       [item, disableEditing],
package/src/features/Conversation/components/VirtualizedList/VirtuosoContext.ts ADDED
@@ -0,0 +1,4 @@
+ import { RefObject, createContext } from 'react';
+ import { VirtuosoHandle } from 'react-virtuoso';
+
+ export const VirtuosoContext = createContext<RefObject<VirtuosoHandle | null> | null>(null);
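The context carries a ref to the react-virtuoso list handle so deeply nested children can scroll the list imperatively. A sketch of a hypothetical consumer (ScrollToTop is illustrative, not part of this diff):

  import { use } from 'react';
  import { VirtuosoContext } from '@/features/Conversation/components/VirtualizedList/VirtuosoContext';

  const ScrollToTop = () => {
    // null when rendered outside a <VirtuosoContext value={virtuosoRef}> provider
    const virtuosoRef = use(VirtuosoContext);
    return (
      <button onClick={() => virtuosoRef?.current?.scrollToIndex({ align: 'start', index: 0 })}>
        Back to top
      </button>
    );
  };
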
package/src/features/Conversation/components/VirtualizedList/index.tsx CHANGED
@@ -13,6 +13,7 @@ import { chatSelectors } from '@/store/chat/selectors';
 
 import AutoScroll from '../AutoScroll';
 import SkeletonList from '../SkeletonList';
+ import { VirtuosoContext } from './VirtuosoContext';
 
 interface VirtualizedListProps {
   dataSource: string[];
@@ -69,38 +70,40 @@ const VirtualizedList = memo<VirtualizedListProps>(({ mobile, dataSource, itemCo
   );
 
   return (
-    <Flexbox height={'100%'}>
-      <Virtuoso
-        atBottomStateChange={setAtBottom}
-        atBottomThreshold={50 * (mobile ? 2 : 1)}
-        computeItemKey={(_, item) => item}
-        data={dataSource}
-        followOutput={getFollowOutput}
-        increaseViewportBy={overscan}
-        initialTopMostItemIndex={dataSource?.length - 1}
-        isScrolling={setIsScrolling}
-        itemContent={itemContent}
-        overscan={overscan}
-        ref={virtuosoRef}
-      />
-      <AutoScroll
-        atBottom={atBottom}
-        isScrolling={isScrolling}
-        onScrollToBottom={(type) => {
-          const virtuoso = virtuosoRef.current;
-          switch (type) {
-            case 'auto': {
-              virtuoso?.scrollToIndex({ align: 'end', behavior: 'auto', index: 'LAST' });
-              break;
-            }
-            case 'click': {
-              virtuoso?.scrollToIndex({ align: 'end', behavior: 'smooth', index: 'LAST' });
-              break;
+    <VirtuosoContext value={virtuosoRef}>
+      <Flexbox height={'100%'}>
+        <Virtuoso
+          atBottomStateChange={setAtBottom}
+          atBottomThreshold={50 * (mobile ? 2 : 1)}
+          computeItemKey={(_, item) => item}
+          data={dataSource}
+          followOutput={getFollowOutput}
+          increaseViewportBy={overscan}
+          initialTopMostItemIndex={dataSource?.length - 1}
+          isScrolling={setIsScrolling}
+          itemContent={itemContent}
+          overscan={overscan}
+          ref={virtuosoRef}
+        />
+        <AutoScroll
+          atBottom={atBottom}
+          isScrolling={isScrolling}
+          onScrollToBottom={(type) => {
+            const virtuoso = virtuosoRef.current;
+            switch (type) {
+              case 'auto': {
+                virtuoso?.scrollToIndex({ align: 'end', behavior: 'auto', index: 'LAST' });
+                break;
+              }
+              case 'click': {
+                virtuoso?.scrollToIndex({ align: 'end', behavior: 'smooth', index: 'LAST' });
+                break;
+              }
             }
-          }
-        }}
-      />
-    </Flexbox>
+          }}
+        />
+      </Flexbox>
+    </VirtuosoContext>
   );
 });
 
package/src/features/Portal/Thread/Chat/ChatItem.tsx CHANGED
@@ -31,7 +31,7 @@ const ThreadChatItem = memo<ThreadChatItemProps>(({ id, index }) => {
   const isParentMessage = index <= threadStartMessageIndex;
 
   const actionBar = useMemo(
-    () => !isParentMessage && <ActionsBar id={id} inPortalThread />,
+    () => !isParentMessage && <ActionsBar id={id} inPortalThread index={index} />,
     [id, isParentMessage],
   );
 
package/src/libs/agent-runtime/runtimeMap.ts CHANGED
@@ -45,6 +45,7 @@ import { LobeVLLMAI } from './vllm';
 import { LobeVolcengineAI } from './volcengine';
 import { LobeWenxinAI } from './wenxin';
 import { LobeXAI } from './xai';
+ import { LobeXinferenceAI } from './xinference';
 import { LobeZeroOneAI } from './zeroone';
 import { LobeZhipuAI } from './zhipu';
 
@@ -97,6 +98,7 @@ export const providerRuntimeMap = {
   volcengine: LobeVolcengineAI,
   wenxin: LobeWenxinAI,
   xai: LobeXAI,
+  xinference: LobeXinferenceAI,
   zeroone: LobeZeroOneAI,
   zhipu: LobeZhipuAI,
 };
package/src/libs/agent-runtime/types/type.ts CHANGED
@@ -74,6 +74,7 @@ export enum ModelProvider {
   Volcengine = 'volcengine',
   Wenxin = 'wenxin',
   XAI = 'xai',
+  Xinference = 'xinference',
   ZeroOne = 'zeroone',
   ZhiPu = 'zhipu',
 }
package/src/libs/agent-runtime/xinference/index.ts ADDED
@@ -0,0 +1,53 @@
+ import { ModelProvider } from '../types';
+ import { LobeOpenAICompatibleFactory } from '../utils/openaiCompatibleFactory';
+
+ import type { ChatModelCard } from '@/types/llm';
+
+ export interface XinferenceModelCard {
+   context_length: number;
+   id: string;
+   model_ability: string[];
+   model_description: string;
+   model_type: string;
+   name: string;
+ }
+
+ export const LobeXinferenceAI = LobeOpenAICompatibleFactory({
+   baseURL: 'http://localhost:9997/v1',
+   debug: {
+     chatCompletion: () => process.env.DEBUG_XINFERENCE_CHAT_COMPLETION === '1',
+   },
+   models: async ({ client }) => {
+     const { LOBE_DEFAULT_MODEL_LIST } = await import('@/config/aiModels');
+
+     const modelsPage = (await client.models.list()) as any;
+     const modelList: XinferenceModelCard[] = modelsPage.data;
+
+     return modelList
+       .map((model) => {
+         const knownModel = LOBE_DEFAULT_MODEL_LIST.find((m) => model.id.toLowerCase() === m.id.toLowerCase());
+
+         return {
+           contextWindowTokens: model.context_length,
+           description: model.model_description,
+           displayName: model.name,
+           enabled: knownModel?.enabled || false,
+           functionCall:
+             (model.model_ability && model.model_ability.includes('tools'))
+             || knownModel?.abilities?.functionCall
+             || false,
+           id: model.id,
+           reasoning:
+             (model.model_ability && model.model_ability.includes('reasoning'))
+             || knownModel?.abilities?.reasoning
+             || false,
+           vision:
+             (model.model_ability && model.model_ability.includes('vision'))
+             || knownModel?.abilities?.vision
+             || false,
+         };
+       })
+       .filter(Boolean) as ChatModelCard[];
+   },
+   provider: ModelProvider.Xinference,
+ });
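A usage sketch for the generated runtime (the constructor options and method names are assumed to follow lobe-chat's other OpenAI-compatible runtimes):

  // Hypothetical: point the runtime at a local Xinference server
  const runtime = new LobeXinferenceAI({ apiKey: 'EMPTY', baseURL: 'http://localhost:9997/v1' });

  // models() applies the mapping above: entries in model_ability
  // ('tools' | 'reasoning' | 'vision') become functionCall/reasoning/vision flags,
  // with fallbacks to LOBE_DEFAULT_MODEL_LIST for known model ids.
  const cards = await runtime.models();
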
package/src/store/chat/slices/message/selectors.test.ts CHANGED
@@ -48,6 +48,27 @@ const mockMessages = [
   },
 ] as ChatMessage[];
 
+ const mockReasoningMessages = [
+   {
+     id: 'msg1',
+     content: 'Hello World',
+     role: 'user',
+   },
+   {
+     id: 'msg2',
+     content: 'Goodbye World',
+     role: 'user',
+   },
+   {
+     id: 'msg3',
+     content: 'Content Message',
+     role: 'assistant',
+     reasoning: {
+       content: 'Reasoning Content',
+     },
+   },
+ ] as ChatMessage[];
+
 const mockedChats = [
   {
     id: 'msg1',
@@ -270,6 +291,27 @@ describe('chatSelectors', () => {
     });
   });
 
+   describe('latestMessageReasoningContent', () => {
+     it('should return the reasoning content of the latest message', () => {
+       // Prepare a state with a few messages
+       const state = merge(initialStore, {
+         messagesMap: {
+           [messageMapKey('active-session')]: mockReasoningMessages,
+         },
+         activeId: 'active-session',
+       });
+
+       const expectedString = mockReasoningMessages.at(-1)?.reasoning?.content;
+
+       // Call the selector and verify the result
+       const reasoningContent = chatSelectors.mainAILatestMessageReasoningContent(state);
+       expect(reasoningContent).toBe(expectedString);
+
+       // Restore the mocks after the test
+       vi.restoreAllMocks();
+     });
+   });
+
   describe('showInboxWelcome', () => {
     it('should return false if the active session is not the inbox session', () => {
       const state = merge(initialStore, { activeId: 'someActiveId' });
package/src/store/chat/slices/message/selectors.ts CHANGED
@@ -98,6 +98,9 @@ const mainAIChatsMessageString = (s: ChatStoreState): string => {
   return chats.map((m) => m.content).join('');
 };
 
+ const mainAILatestMessageReasoningContent = (s: ChatStoreState) =>
+   mainAIChats(s).at(-1)?.reasoning?.content;
+
 const currentToolMessages = (s: ChatStoreState) => {
   const messages = activeBaseChats(s);
 
@@ -214,6 +217,7 @@ export const chatSelectors = {
   mainAIChats,
   mainAIChatsMessageString,
   mainAIChatsWithHistoryConfig,
+  mainAILatestMessageReasoningContent,
   mainDisplayChatIDs,
   mainDisplayChats,
   showInboxWelcome,
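This selector is what AutoScroll subscribes to earlier in the diff: while a model streams reasoning (reasoning.content) before any answer text, mainAIChatsMessageString does not change, so the extra subscription is what keeps the list pinned to the bottom. A behavior sketch against the test fixture above:

  // With mockReasoningMessages as the active session:
  chatSelectors.mainAILatestMessageReasoningContent(state); // → 'Reasoning Content'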