@lobehub/chat 1.36.31 → 1.36.33

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (47)
  1. package/CHANGELOG.md +50 -0
  2. package/changelog/v1.json +18 -0
  3. package/docs/self-hosting/environment-variables/model-provider.mdx +7 -0
  4. package/docs/self-hosting/environment-variables/model-provider.zh-CN.mdx +7 -0
  5. package/docs/self-hosting/server-database/dokploy.zh-CN.mdx +12 -12
  6. package/package.json +1 -1
  7. package/src/config/modelProviders/github.ts +19 -10
  8. package/src/database/repositories/dataImporter/__tests__/index.test.ts +11 -18
  9. package/src/database/repositories/dataImporter/index.ts +31 -46
  10. package/src/database/server/models/__tests__/_test_template.ts +1 -1
  11. package/src/database/server/models/__tests__/agent.test.ts +1 -1
  12. package/src/database/server/models/__tests__/asyncTask.test.ts +1 -1
  13. package/src/database/server/models/__tests__/chunk.test.ts +1 -1
  14. package/src/database/server/models/__tests__/file.test.ts +1 -1
  15. package/src/database/server/models/__tests__/knowledgeBase.test.ts +1 -2
  16. package/src/database/server/models/__tests__/message.test.ts +35 -72
  17. package/src/database/server/models/__tests__/nextauth.test.ts +1 -1
  18. package/src/database/server/models/__tests__/session.test.ts +1 -1
  19. package/src/database/server/models/__tests__/sessionGroup.test.ts +1 -2
  20. package/src/database/server/models/__tests__/topic.test.ts +1 -1
  21. package/src/database/server/models/__tests__/user.test.ts +1 -1
  22. package/src/database/server/models/_template.ts +2 -2
  23. package/src/database/server/models/agent.ts +17 -25
  24. package/src/database/server/models/asyncTask.ts +2 -2
  25. package/src/database/server/models/chunk.ts +14 -14
  26. package/src/database/server/models/embedding.ts +1 -1
  27. package/src/database/server/models/file.ts +8 -10
  28. package/src/database/server/models/knowledgeBase.ts +4 -6
  29. package/src/database/server/models/message.ts +54 -65
  30. package/src/database/server/models/plugin.ts +2 -2
  31. package/src/database/server/models/ragEval/dataset.ts +2 -2
  32. package/src/database/server/models/ragEval/datasetRecord.ts +3 -8
  33. package/src/database/server/models/ragEval/evaluation.ts +3 -2
  34. package/src/database/server/models/ragEval/evaluationRecord.ts +2 -2
  35. package/src/database/server/models/session.ts +38 -35
  36. package/src/database/server/models/sessionGroup.ts +4 -4
  37. package/src/database/server/models/thread.ts +2 -2
  38. package/src/database/server/models/topic.ts +48 -53
  39. package/src/database/server/models/user.ts +12 -12
  40. package/src/libs/agent-runtime/github/index.test.ts +68 -41
  41. package/src/libs/agent-runtime/github/index.ts +51 -1
  42. package/src/libs/agent-runtime/togetherai/index.ts +2 -1
  43. package/src/libs/agent-runtime/utils/openaiCompatibleFactory/index.ts +10 -9
  44. package/src/libs/agent-runtime/utils/streams/azureOpenai.test.ts +0 -1
  45. package/src/libs/next-auth/adapter/index.ts +1 -1
  46. package/src/server/routers/lambda/chunk.ts +2 -2
  47. package/vercel.json +1 -1
package/src/database/server/models/topic.ts CHANGED
@@ -29,46 +29,42 @@ export class TopicModel {
   }
 
   // **************** Query *************** //
 
-  async query({ current = 0, pageSize = 9999, sessionId }: QueryTopicParams = {}) {
+  query = async ({ current = 0, pageSize = 9999, sessionId }: QueryTopicParams = {}) => {
     const offset = current * pageSize;
-
-    return (
-      this.db
-        .select({
-          createdAt: topics.createdAt,
-          favorite: topics.favorite,
-          historySummary: topics.historySummary,
-          id: topics.id,
-          metadata: topics.metadata,
-          title: topics.title,
-          updatedAt: topics.updatedAt,
-        })
-        .from(topics)
-        .where(and(eq(topics.userId, this.userId), this.matchSession(sessionId)))
-        // In boolean sorting, false is considered "smaller" than true.
-        // So here we use desc to ensure that topics with favorite as true are in front.
-        .orderBy(desc(topics.favorite), desc(topics.updatedAt))
-        .limit(pageSize)
-        .offset(offset)
-    );
-  }
-
-  async findById(id: string) {
+    return this.db
+      .select({
+        createdAt: topics.createdAt,
+        favorite: topics.favorite,
+        historySummary: topics.historySummary,
+        id: topics.id,
+        metadata: topics.metadata,
+        title: topics.title,
+        updatedAt: topics.updatedAt,
+      })
+      .from(topics)
+      .where(and(eq(topics.userId, this.userId), this.matchSession(sessionId)))
+      // In boolean sorting, false is considered "smaller" than true.
+      // So here we use desc to ensure that topics with favorite as true are in front.
+      .orderBy(desc(topics.favorite), desc(topics.updatedAt))
+      .limit(pageSize)
+      .offset(offset);
+  };
+
+  findById = async (id: string) => {
     return this.db.query.topics.findFirst({
       where: and(eq(topics.id, id), eq(topics.userId, this.userId)),
     });
-  }
+  };
 
-  async queryAll(): Promise<TopicItem[]> {
+  queryAll = async (): Promise<TopicItem[]> => {
     return this.db
       .select()
       .from(topics)
       .orderBy(topics.updatedAt)
-      .where(eq(topics.userId, this.userId))
-      .execute();
-  }
+      .where(eq(topics.userId, this.userId));
+  };
 
-  async queryByKeyword(keyword: string, sessionId?: string | null): Promise<TopicItem[]> {
+  queryByKeyword = async (keyword: string, sessionId?: string | null): Promise<TopicItem[]> => {
     if (!keyword) return [];
 
     const keywordLowerCase = keyword.toLowerCase();
@@ -92,26 +88,25 @@ export class TopicModel {
         ),
       ),
     });
-  }
+  };
 
-  async count() {
+  count = async (): Promise<number> => {
     const result = await this.db
       .select({
-        count: count(),
+        count: count(topics.id),
       })
       .from(topics)
-      .where(eq(topics.userId, this.userId))
-      .execute();
+      .where(eq(topics.userId, this.userId));
 
     return result[0].count;
-  }
+  };
 
   // **************** Create *************** //
 
-  async create(
+  create = async (
     { messages: messageIds, ...params }: CreateTopicParams,
     id: string = this.genId(),
-  ): Promise<TopicItem> {
+  ): Promise<TopicItem> => {
     return this.db.transaction(async (tx) => {
       // Insert the new topic into the topics table
       const [topic] = await tx
@@ -133,9 +128,9 @@ export class TopicModel {
 
       return topic;
     });
-  }
+  };
 
-  async batchCreate(topicParams: (CreateTopicParams & { id?: string })[]) {
+  batchCreate = async (topicParams: (CreateTopicParams & { id?: string })[]) => {
     // Start a transaction
     return this.db.transaction(async (tx) => {
       // Batch insert the new topics into the topics table
@@ -167,9 +162,9 @@ export class TopicModel {
 
       return createdTopics;
     });
-  }
+  };
 
-  async duplicate(topicId: string, newTitle?: string) {
+  duplicate = async (topicId: string, newTitle?: string) => {
     return this.db.transaction(async (tx) => {
       // find original topic
       const originalTopic = await tx.query.topics.findFirst({
@@ -217,48 +212,48 @@ export class TopicModel {
        topic: duplicatedTopic,
      };
    });
-  }
+  };
 
   // **************** Delete *************** //
 
   /**
    * Delete a session, also delete all messages and topics associated with it.
    */
-  async delete(id: string) {
+  delete = async (id: string) => {
    return this.db.delete(topics).where(and(eq(topics.id, id), eq(topics.userId, this.userId)));
-  }
+  };
 
   /**
    * Deletes multiple topics based on the sessionId.
    */
-  async batchDeleteBySessionId(sessionId?: string | null) {
+  batchDeleteBySessionId = async (sessionId?: string | null) => {
    return this.db
      .delete(topics)
      .where(and(this.matchSession(sessionId), eq(topics.userId, this.userId)));
-  }
+  };
 
   /**
    * Deletes multiple topics and all messages associated with them in a transaction.
    */
-  async batchDelete(ids: string[]) {
+  batchDelete = async (ids: string[]) => {
    return this.db
      .delete(topics)
      .where(and(inArray(topics.id, ids), eq(topics.userId, this.userId)));
-  }
+  };
 
-  async deleteAll() {
+  deleteAll = async () => {
    return this.db.delete(topics).where(eq(topics.userId, this.userId));
-  }
+  };
 
   // **************** Update *************** //
 
-  async update(id: string, data: Partial<TopicItem>) {
+  update = async (id: string, data: Partial<TopicItem>) => {
    return this.db
      .update(topics)
      .set({ ...data, updatedAt: new Date() })
      .where(and(eq(topics.id, id), eq(topics.userId, this.userId)))
      .returning();
-  }
+  };
 
   // **************** Helper *************** //
 
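Note: the TopicModel hunks above, like the UserModel hunks that follow, convert `async` class methods into arrow-function class properties. One practical effect of that pattern (a general TypeScript/JavaScript behavior, not something stated in this diff) is that `this` stays bound when a method is passed around as a bare reference; a minimal illustrative sketch, not package code:

```ts
// Arrow properties capture `this` at construction time; prototype methods do not.
class Example {
  private userId = 'u1';

  // prototype method: `this` is whatever the call site provides
  asMethod() {
    return this.userId;
  }

  // arrow-function property: `this` is always the instance
  asArrow = () => this.userId;
}

const { asMethod, asArrow } = new Example();
asArrow(); // 'u1'
// asMethod(); // would throw: `this` is undefined when called standalone
```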
package/src/database/server/models/user.ts CHANGED
@@ -26,7 +26,7 @@ export class UserModel {
     this.db = db;
   }
 
-  async getUserState() {
+  getUserState = async () => {
     const result = await this.db
       .select({
         isOnboarded: users.isOnboarded,
@@ -81,20 +81,20 @@ export class UserModel {
       settings,
       userId: this.userId,
     };
-  }
+  };
 
-  async updateUser(value: Partial<UserItem>) {
+  updateUser = async (value: Partial<UserItem>) => {
     return this.db
       .update(users)
       .set({ ...value, updatedAt: new Date() })
       .where(eq(users.id, this.userId));
-  }
+  };
 
-  async deleteSetting() {
+  deleteSetting = async () => {
     return this.db.delete(userSettings).where(eq(userSettings.id, this.userId));
-  }
+  };
 
-  async updateSetting(value: Partial<UserSettings>) {
+  updateSetting = async (value: Partial<UserSettings>) => {
     const { keyVaults, ...res } = value;
 
     // Encrypt keyVaults
@@ -120,9 +120,9 @@ export class UserModel {
     }
 
     return this.db.update(userSettings).set(newValue).where(eq(userSettings.id, this.userId));
-  }
+  };
 
-  async updatePreference(value: Partial<UserPreference>) {
+  updatePreference = async (value: Partial<UserPreference>) => {
     const user = await this.db.query.users.findFirst({ where: eq(users.id, this.userId) });
     if (!user) return;
 
@@ -130,9 +130,9 @@ export class UserModel {
       .update(users)
       .set({ preference: merge(user.preference, value) })
       .where(eq(users.id, this.userId));
-  }
+  };
 
-  async updateGuide(value: Partial<UserGuide>) {
+  updateGuide = async (value: Partial<UserGuide>) => {
     const user = await this.db.query.users.findFirst({ where: eq(users.id, this.userId) });
     if (!user) return;
 
@@ -141,7 +141,7 @@ export class UserModel {
       .update(users)
       .set({ preference: { ...prevPreference, guide: merge(prevPreference.guide || {}, value) } })
       .where(eq(users.id, this.userId));
-  }
+  };
 
   // Static method
 
package/src/libs/agent-runtime/github/index.test.ts CHANGED
@@ -21,15 +21,10 @@ let instance: LobeOpenAICompatibleRuntime;
 
 beforeEach(() => {
   instance = new LobeGithubAI({ apiKey: 'test' });
-
-  // Use vi.spyOn to mock the chat.completions.create method
-  vi.spyOn(instance['client'].chat.completions, 'create').mockResolvedValue(
-    new ReadableStream() as any,
-  );
 });
 
 afterEach(() => {
-  vi.clearAllMocks();
+  vi.restoreAllMocks();
 });
 
 describe('LobeGithubAI', () => {
@@ -42,6 +37,13 @@ describe('LobeGithubAI', () => {
   });
 
   describe('chat', () => {
+    beforeEach(() => {
+      // Use vi.spyOn to mock the chat.completions.create method
+      vi.spyOn(instance['client'].chat.completions, 'create').mockResolvedValue(
+        new ReadableStream() as any,
+      );
+    });
+
     describe('Error', () => {
       it('should return GithubBizError with an openai error response when OpenAI.APIError is thrown', async () => {
         // Arrange
@@ -119,41 +121,6 @@ describe('LobeGithubAI', () => {
         }
       });
 
-      it('should return GithubBizError with an cause response with desensitize Url', async () => {
-        // Arrange
-        const errorInfo = {
-          stack: 'abc',
-          cause: { message: 'api is undefined' },
-        };
-        const apiError = new OpenAI.APIError(400, errorInfo, 'module error', {});
-
-        instance = new LobeGithubAI({
-          apiKey: 'test',
-          baseURL: 'https://api.abc.com/v1',
-        });
-
-        vi.spyOn(instance['client'].chat.completions, 'create').mockRejectedValue(apiError);
-
-        // Act
-        try {
-          await instance.chat({
-            messages: [{ content: 'Hello', role: 'user' }],
-            model: 'meta-llama-3-70b-instruct',
-            temperature: 0.7,
-          });
-        } catch (e) {
-          expect(e).toEqual({
-            endpoint: 'https://api.***.com/v1',
-            error: {
-              cause: { message: 'api is undefined' },
-              stack: 'abc',
-            },
-            errorType: bizErrorType,
-            provider,
-          });
-        }
-      });
-
       it('should throw an InvalidGithubToken error type on 401 status code', async () => {
         // Mock the API call to simulate a 401 error
         const error = new Error('InvalidApiKey') as any;
@@ -243,4 +210,64 @@ describe('LobeGithubAI', () => {
       });
     });
   });
+
+  describe('models', () => {
+    beforeEach(() => {});
+
+    it('should return a list of models', async () => {
+      // Arrange
+      const arr = [
+        {
+          id: 'azureml://registries/azureml-ai21/models/AI21-Jamba-Instruct/versions/2',
+          name: 'AI21-Jamba-Instruct',
+          friendly_name: 'AI21-Jamba-Instruct',
+          model_version: 2,
+          publisher: 'AI21 Labs',
+          model_family: 'AI21 Labs',
+          model_registry: 'azureml-ai21',
+          license: 'custom',
+          task: 'chat-completion',
+          description:
+            "Jamba-Instruct is the world's first production-grade Mamba-based LLM model and leverages its hybrid Mamba-Transformer architecture to achieve best-in-class performance, quality, and cost efficiency.\n\n**Model Developer Name**: _AI21 Labs_\n\n## Model Architecture\n\nJamba-Instruct leverages a hybrid Mamba-Transformer architecture to achieve best-in-class performance, quality, and cost efficiency.\nAI21's Jamba architecture features a blocks-and-layers approach that allows Jamba to successfully integrate the two architectures. Each Jamba block contains either an attention or a Mamba layer, followed by a multi-layer perceptron (MLP), producing an overall ratio of one Transformer layer out of every eight total layers.\n",
+          summary:
+            "Jamba-Instruct is the world's first production-grade Mamba-based LLM model and leverages its hybrid Mamba-Transformer architecture to achieve best-in-class performance, quality, and cost efficiency.",
+          tags: ['chat', 'rag'],
+        },
+        {
+          id: 'azureml://registries/azureml-cohere/models/Cohere-command-r/versions/3',
+          name: 'Cohere-command-r',
+          friendly_name: 'Cohere Command R',
+          model_version: 3,
+          publisher: 'cohere',
+          model_family: 'cohere',
+          model_registry: 'azureml-cohere',
+          license: 'custom',
+          task: 'chat-completion',
+          description:
+            "Command R is a highly performant generative large language model, optimized for a variety of use cases including reasoning, summarization, and question answering. \n\nThe model is optimized to perform well in the following languages: English, French, Spanish, Italian, German, Brazilian Portuguese, Japanese, Korean, Simplified Chinese, and Arabic.\n\nPre-training data additionally included the following 13 languages: Russian, Polish, Turkish, Vietnamese, Dutch, Czech, Indonesian, Ukrainian, Romanian, Greek, Hindi, Hebrew, Persian.\n\n## Resources\n\nFor full details of this model, [release blog post](https://aka.ms/cohere-blog).\n\n## Model Architecture\n\nThis is an auto-regressive language model that uses an optimized transformer architecture. After pretraining, this model uses supervised fine-tuning (SFT) and preference training to align model behavior to human preferences for helpfulness and safety.\n\n### Tool use capabilities\n\nCommand R has been specifically trained with conversational tool use capabilities. These have been trained into the model via a mixture of supervised fine-tuning and preference fine-tuning, using a specific prompt template. Deviating from this prompt template will likely reduce performance, but we encourage experimentation.\n\nCommand R's tool use functionality takes a conversation as input (with an optional user-system preamble), along with a list of available tools. The model will then generate a json-formatted list of actions to execute on a subset of those tools. Command R may use one of its supplied tools more than once.\n\nThe model has been trained to recognise a special directly_answer tool, which it uses to indicate that it doesn't want to use any of its other tools. The ability to abstain from calling a specific tool can be useful in a range of situations, such as greeting a user, or asking clarifying questions. We recommend including the directly_answer tool, but it can be removed or renamed if required.\n\n### Grounded Generation and RAG Capabilities\n\nCommand R has been specifically trained with grounded generation capabilities. This means that it can generate responses based on a list of supplied document snippets, and it will include grounding spans (citations) in its response indicating the source of the information. This can be used to enable behaviors such as grounded summarization and the final step of Retrieval Augmented Generation (RAG).This behavior has been trained into the model via a mixture of supervised fine-tuning and preference fine-tuning, using a specific prompt template. Deviating from this prompt template may reduce performance, but we encourage experimentation.\n\nCommand R's grounded generation behavior takes a conversation as input (with an optional user-supplied system preamble, indicating task, context and desired output style), along with a list of retrieved document snippets. The document snippets should be chunks, rather than long documents, typically around 100-400 words per chunk. Document snippets consist of key-value pairs. The keys should be short descriptive strings, the values can be text or semi-structured.\n\nBy default, Command R will generate grounded responses by first predicting which documents are relevant, then predicting which ones it will cite, then generating an answer. Finally, it will then insert grounding spans into the answer. See below for an example. This is referred to as accurate grounded generation.\n\nThe model is trained with a number of other answering modes, which can be selected by prompt changes . A fast citation mode is supported in the tokenizer, which will directly generate an answer with grounding spans in it, without first writing the answer out in full. This sacrifices some grounding accuracy in favor of generating fewer tokens.\n\n### Code Capabilities\n\nCommand R has been optimized to interact with your code, by requesting code snippets, code explanations, or code rewrites. It might not perform well out-of-the-box for pure code completion. For better performance, we also recommend using a low temperature (and even greedy decoding) for code-generation related instructions.\n",
+          summary:
+            'Command R is a scalable generative model targeting RAG and Tool Use to enable production-scale AI for enterprise.',
+          tags: ['rag', 'multilingual'],
+        },
+      ];
+      vi.spyOn(instance['client'].models, 'list').mockResolvedValue({
+        body: arr,
+      } as any);
+
+      // Act & Assert
+      const models = await instance.models();
+
+      const modelsCount = models.length;
+      expect(modelsCount).toBe(arr.length);
+
+      for (let i = 0; i < arr.length; i++) {
+        const model = models[i];
+        expect(model).toEqual({
+          description: arr[i].description,
+          displayName: arr[i].friendly_name,
+          id: arr[i].name,
+        });
+      }
+    });
+  });
 });
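Note on the test changes above: the `chat.completions.create` spy moves from the file-level `beforeEach` into the `chat` block so the new `models` tests can install their own spy on `client.models.list`, and `vi.clearAllMocks()` becomes `vi.restoreAllMocks()`, which also puts the original implementations behind `vi.spyOn` back in place. A small standalone Vitest sketch of that difference; the names are illustrative, not from the package:

```ts
import { afterEach, expect, it, vi } from 'vitest';

const api = { load: () => 'real' };

afterEach(() => {
  // restoreAllMocks reinstates the original `load`;
  // clearAllMocks would only reset call history and leave the stub installed.
  vi.restoreAllMocks();
});

it('stubs load for a single test only', () => {
  vi.spyOn(api, 'load').mockReturnValue('stubbed');
  expect(api.load()).toBe('stubbed');
});

it('sees the original implementation again', () => {
  expect(api.load()).toBe('real');
});
```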
package/src/libs/agent-runtime/github/index.ts CHANGED
@@ -1,7 +1,35 @@
+import { LOBE_DEFAULT_MODEL_LIST } from '@/config/modelProviders';
+import type { ChatModelCard } from '@/types/llm';
+
 import { AgentRuntimeErrorType } from '../error';
 import { o1Models, pruneO1Payload } from '../openai';
 import { ModelProvider } from '../types';
-import { LobeOpenAICompatibleFactory } from '../utils/openaiCompatibleFactory';
+import {
+  CHAT_MODELS_BLOCK_LIST,
+  LobeOpenAICompatibleFactory,
+} from '../utils/openaiCompatibleFactory';
+
+enum Task {
+  'chat-completion',
+  'embeddings',
+}
+
+/* eslint-disable typescript-sort-keys/interface */
+type Model = {
+  id: string;
+  name: string;
+  friendly_name: string;
+  model_version: number;
+  publisher: string;
+  model_family: string;
+  model_registry: string;
+  license: string;
+  task: Task;
+  description: string;
+  summary: string;
+  tags: string[];
+};
+/* eslint-enable typescript-sort-keys/interface */
 
 export const LobeGithubAI = LobeOpenAICompatibleFactory({
   baseURL: 'https://models.inference.ai.azure.com',
@@ -23,5 +51,27 @@ export const LobeGithubAI = LobeOpenAICompatibleFactory({
     bizError: AgentRuntimeErrorType.ProviderBizError,
     invalidAPIKey: AgentRuntimeErrorType.InvalidGithubToken,
   },
+  models: async ({ client }) => {
+    const modelsPage = (await client.models.list()) as any;
+    const modelList: Model[] = modelsPage.body;
+    return modelList
+      .filter((model) => {
+        return CHAT_MODELS_BLOCK_LIST.every(
+          (keyword) => !model.name.toLowerCase().includes(keyword),
+        );
+      })
+      .map((model) => {
+        const knownModel = LOBE_DEFAULT_MODEL_LIST.find((m) => m.id === model.name);
+
+        if (knownModel) return knownModel;
+
+        return {
+          description: model.description,
+          displayName: model.friendly_name,
+          id: model.name,
+        };
+      })
+      .filter(Boolean) as ChatModelCard[];
+  },
   provider: ModelProvider.Github,
 });
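Note: the new `models` fetcher above pulls the GitHub Models catalog through `client.models.list()` (the raw page is read from `body`), drops entries whose names hit `CHAT_MODELS_BLOCK_LIST`, and maps the rest onto known entries from `LOBE_DEFAULT_MODEL_LIST` or a minimal `ChatModelCard`. A rough standalone sketch of the same mapping, with hypothetical stand-ins for the block list and the known-model table:

```ts
type CatalogEntry = { description: string; friendly_name: string; name: string };
type Card = { description?: string; displayName?: string; id: string };

// hypothetical stand-ins for CHAT_MODELS_BLOCK_LIST and LOBE_DEFAULT_MODEL_LIST
const blockList = ['embedding', 'davinci'];
const knownModels: Card[] = [{ displayName: 'GPT-4o', id: 'gpt-4o' }];

const toChatModelCards = (entries: CatalogEntry[]): Card[] =>
  entries
    // keep only chat-capable entries
    .filter((entry) => blockList.every((keyword) => !entry.name.toLowerCase().includes(keyword)))
    // prefer a known card, otherwise build a minimal one from the catalog entry
    .map(
      (entry) =>
        knownModels.find((m) => m.id === entry.name) ?? {
          description: entry.description,
          displayName: entry.friendly_name,
          id: entry.name,
        },
    );
```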
package/src/libs/agent-runtime/togetherai/index.ts CHANGED
@@ -16,7 +16,8 @@ export const LobeTogetherAI = LobeOpenAICompatibleFactory({
   debug: {
     chatCompletion: () => process.env.DEBUG_TOGETHERAI_CHAT_COMPLETION === '1',
   },
-  models: async ({ apiKey }) => {
+  models: async ({ client }) => {
+    const apiKey = client.apiKey;
     const data = await fetch(`${baseURL}/api/models`, {
       headers: {
         Authorization: `Bearer ${apiKey}`,
package/src/libs/agent-runtime/utils/openaiCompatibleFactory/index.ts CHANGED
@@ -2,17 +2,18 @@ import OpenAI, { ClientOptions } from 'openai';
 import { Stream } from 'openai/streaming';
 
 import { LOBE_DEFAULT_MODEL_LIST } from '@/config/modelProviders';
-import { ChatModelCard } from '@/types/llm';
+import type { ChatModelCard } from '@/types/llm';
 
 import { LobeRuntimeAI } from '../../BaseAI';
 import { AgentRuntimeErrorType, ILobeAgentRuntimeErrorType } from '../../error';
-import {
+import type {
   ChatCompetitionOptions,
   ChatCompletionErrorPayload,
   ChatStreamPayload,
   Embeddings,
   EmbeddingsOptions,
   EmbeddingsPayload,
+  ModelProvider,
   TextToImagePayload,
   TextToSpeechOptions,
   TextToSpeechPayload,
@@ -26,7 +27,7 @@ import { StreamingResponse } from '../response';
 import { OpenAIStream, OpenAIStreamOptions } from '../streams';
 
 // the model contains the following keywords is not a chat model, so we should filter them out
-const CHAT_MODELS_BLOCK_LIST = [
+export const CHAT_MODELS_BLOCK_LIST = [
   'embedding',
   'davinci',
   'curie',
@@ -77,7 +78,7 @@ interface OpenAICompatibleFactoryOptions<T extends Record<string, any> = any> {
     invalidAPIKey: ILobeAgentRuntimeErrorType;
   };
   models?:
-    | ((params: { apiKey: string }) => Promise<ChatModelCard[]>)
+    | ((params: { client: OpenAI }) => Promise<ChatModelCard[]>)
     | {
         transformModel?: (model: OpenAI.Model) => ChatModelCard;
       };
@@ -157,7 +158,7 @@ export const LobeOpenAICompatibleFactory = <T extends Record<string, any> = any>
    client!: OpenAI;
    baseURL!: string;
 
-    private _options: ConstructorOptions<T>;
+    protected _options: ConstructorOptions<T>;
 
    constructor(options: ClientOptions & Record<string, any> = {}) {
      const _options = {
@@ -249,7 +250,7 @@ export const LobeOpenAICompatibleFactory = <T extends Record<string, any> = any>
    }
 
    async models() {
-      if (typeof models === 'function') return models({ apiKey: this.client.apiKey });
+      if (typeof models === 'function') return models({ client: this.client });
 
      const list = await this.client.models.list();
 
@@ -312,7 +313,7 @@ export const LobeOpenAICompatibleFactory = <T extends Record<string, any> = any>
      }
    }
 
-    private handleError(error: any): ChatCompletionErrorPayload {
+    protected handleError(error: any): ChatCompletionErrorPayload {
      let desensitizedEndpoint = this.baseURL;
 
      // refs: https://github.com/lobehub/lobe-chat/issues/842
@@ -337,7 +338,7 @@ export const LobeOpenAICompatibleFactory = <T extends Record<string, any> = any>
          endpoint: desensitizedEndpoint,
          error: error as any,
          errorType: ErrorType.invalidAPIKey,
-          provider: provider as any,
+          provider: provider as ModelProvider,
        });
      }
 
@@ -353,7 +354,7 @@ export const LobeOpenAICompatibleFactory = <T extends Record<string, any> = any>
        endpoint: desensitizedEndpoint,
        error: errorResult,
        errorType: RuntimeError || ErrorType.bizError,
-        provider: provider as any,
+        provider: provider as ModelProvider,
      });
    }
  };
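Note: the factory hunks above change the provider-supplied `models` option from `({ apiKey }) => ...` to `({ client }) => ...`, so a provider now receives the full OpenAI client and can either call `client.models.list()` itself (as the GitHub provider does) or still read `client.apiKey` (as TogetherAI does). A hedged sketch of a provider option written against the new signature; the provider itself is made up:

```ts
import type OpenAI from 'openai';

const exampleProviderOptions = {
  models: async ({ client }: { client: OpenAI }) => {
    // standard OpenAI-compatible listing; providers with custom catalogs
    // can fetch their own endpoint instead
    const page = await client.models.list();
    return page.data.map((model) => ({ displayName: model.id, id: model.id }));
  },
};
```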
package/src/libs/agent-runtime/utils/streams/azureOpenai.test.ts CHANGED
@@ -1,4 +1,3 @@
-import { desc } from 'drizzle-orm/expressions';
 import { describe, expect, it, vi } from 'vitest';
 import { AzureOpenAIStream } from './azureOpenai';
 
package/src/libs/next-auth/adapter/index.ts CHANGED
@@ -4,7 +4,7 @@ import type {
   AdapterUser,
   VerificationToken,
 } from '@auth/core/adapters';
-import { and, eq } from 'drizzle-orm';
+import { and, eq } from 'drizzle-orm/expressions';
 import type { NeonDatabase } from 'drizzle-orm/neon-serverless';
 import { Adapter, AdapterAccount } from 'next-auth/adapters';
 
package/src/server/routers/lambda/chunk.ts CHANGED
@@ -1,14 +1,14 @@
-import { inArray } from 'drizzle-orm';
+import { inArray } from 'drizzle-orm/expressions';
 import { z } from 'zod';
 
 import { DEFAULT_EMBEDDING_MODEL } from '@/const/settings';
+import { knowledgeBaseFiles } from '@/database/schemas';
 import { serverDB } from '@/database/server';
 import { AsyncTaskModel } from '@/database/server/models/asyncTask';
 import { ChunkModel } from '@/database/server/models/chunk';
 import { EmbeddingModel } from '@/database/server/models/embedding';
 import { FileModel } from '@/database/server/models/file';
 import { MessageModel } from '@/database/server/models/message';
-import { knowledgeBaseFiles } from '@/database/schemas';
 import { ModelProvider } from '@/libs/agent-runtime';
 import { authedProcedure, router } from '@/libs/trpc';
 import { keyVaults } from '@/libs/trpc/middleware/keyVaults';
package/vercel.json CHANGED
@@ -1,3 +1,3 @@
 {
-  "installCommand": "bun install"
+  "installCommand": "npx bun@1.1.38 install"
 }