@librechat/agents 3.1.52 → 3.1.54

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (36)
  1. package/dist/cjs/llm/bedrock/utils/message_outputs.cjs +16 -5
  2. package/dist/cjs/llm/bedrock/utils/message_outputs.cjs.map +1 -1
  3. package/dist/cjs/llm/google/index.cjs.map +1 -1
  4. package/dist/cjs/llm/openrouter/index.cjs +59 -5
  5. package/dist/cjs/llm/openrouter/index.cjs.map +1 -1
  6. package/dist/cjs/llm/vertexai/index.cjs +16 -2
  7. package/dist/cjs/llm/vertexai/index.cjs.map +1 -1
  8. package/dist/cjs/main.cjs +2 -0
  9. package/dist/cjs/main.cjs.map +1 -1
  10. package/dist/esm/llm/bedrock/utils/message_outputs.mjs +16 -5
  11. package/dist/esm/llm/bedrock/utils/message_outputs.mjs.map +1 -1
  12. package/dist/esm/llm/google/index.mjs.map +1 -1
  13. package/dist/esm/llm/openrouter/index.mjs +59 -5
  14. package/dist/esm/llm/openrouter/index.mjs.map +1 -1
  15. package/dist/esm/llm/vertexai/index.mjs +16 -2
  16. package/dist/esm/llm/vertexai/index.mjs.map +1 -1
  17. package/dist/esm/main.mjs +1 -0
  18. package/dist/esm/main.mjs.map +1 -1
  19. package/dist/types/index.d.ts +2 -0
  20. package/dist/types/llm/bedrock/utils/message_outputs.d.ts +1 -1
  21. package/dist/types/llm/google/index.d.ts +2 -3
  22. package/dist/types/llm/openrouter/index.d.ts +21 -1
  23. package/dist/types/llm/vertexai/index.d.ts +2 -1
  24. package/dist/types/types/llm.d.ts +7 -2
  25. package/package.json +1 -1
  26. package/src/index.ts +6 -0
  27. package/src/llm/bedrock/llm.spec.ts +233 -4
  28. package/src/llm/bedrock/utils/message_outputs.ts +51 -11
  29. package/src/llm/google/index.ts +2 -3
  30. package/src/llm/openrouter/index.ts +117 -6
  31. package/src/llm/openrouter/reasoning.test.ts +207 -0
  32. package/src/llm/vertexai/index.ts +20 -3
  33. package/src/scripts/bedrock-cache-debug.ts +250 -0
  34. package/src/specs/openrouter.simple.test.ts +163 -2
  35. package/src/types/llm.ts +7 -2
  36. package/src/utils/llmConfig.ts +3 -4
@@ -7,6 +7,7 @@ import {
7
7
  UsageMetadata,
8
8
  } from '@langchain/core/messages';
9
9
  import type * as t from '@/types';
10
+ import type { ChatOpenRouterCallOptions } from '@/llm/openrouter';
10
11
  import { ToolEndHandler, ModelEndHandler } from '@/events';
11
12
  import { ContentTypes, GraphEvents, Providers, TitleMethod } from '@/common';
12
13
  import { capitalizeFirstLetter } from './spec.utils';
@@ -33,6 +34,8 @@ describeIf(`${capitalizeFirstLetter(provider)} Streaming Tests`, () => {
33
34
  version: 'v2' as const,
34
35
  };
35
36
 
37
+ const baseLLMConfig = getLLMConfig(provider);
38
+
36
39
  beforeEach(async () => {
37
40
  conversationHistory = [];
38
41
  collectedUsage = [];
@@ -56,16 +59,81 @@ describeIf(`${capitalizeFirstLetter(provider)} Streaming Tests`, () => {
56
59
  [GraphEvents.CHAT_MODEL_END]: new ModelEndHandler(collectedUsage),
57
60
  });
58
61
 
62
+ /**
63
+ * Helper: run a reasoning test against a specific model with the given reasoning config.
64
+ * Asserts that reasoning tokens are reported and content is produced.
65
+ */
66
+ // eslint-disable-next-line @typescript-eslint/explicit-function-return-type
67
+ async function runReasoningTest(opts: {
68
+ model: string;
69
+ reasoning?: ChatOpenRouterCallOptions['reasoning'];
70
+ threadId: string;
71
+ runId: string;
72
+ }) {
73
+ const { reasoning: _baseReasoning, ...baseWithoutReasoning } =
74
+ baseLLMConfig as unknown as Record<string, unknown>;
75
+ const llmConfig = {
76
+ ...baseWithoutReasoning,
77
+ model: opts.model,
78
+ ...(opts.reasoning != null ? { reasoning: opts.reasoning } : {}),
79
+ } as t.LLMConfig;
80
+ const customHandlers = setupCustomHandlers();
81
+
82
+ run = await Run.create<t.IState>({
83
+ runId: opts.runId,
84
+ graphConfig: {
85
+ type: 'standard',
86
+ llmConfig,
87
+ instructions: 'You are a helpful AI assistant. Think step by step.',
88
+ },
89
+ returnContent: true,
90
+ skipCleanup: true,
91
+ customHandlers,
92
+ });
93
+
94
+ const userMessage = 'What is 15 * 37 + 128 / 4? Show your work.';
95
+ conversationHistory.push(new HumanMessage(userMessage));
96
+
97
+ const finalContentParts = await run.processStream(
98
+ { messages: conversationHistory },
99
+ { ...configV2, configurable: { thread_id: opts.threadId } }
100
+ );
101
+
102
+ expect(finalContentParts).toBeDefined();
103
+ expect(finalContentParts?.length).toBeGreaterThan(0);
104
+
105
+ // Verify usage metadata was collected
106
+ expect(collectedUsage.length).toBeGreaterThan(0);
107
+ const usage = collectedUsage[0];
108
+ expect(usage.input_tokens).toBeGreaterThan(0);
109
+ expect(usage.output_tokens).toBeGreaterThan(0);
110
+
111
+ // Verify reasoning tokens are reported in output_token_details
112
+ const reasoningTokens =
113
+ (usage.output_token_details as Record<string, number> | undefined)
114
+ ?.reasoning ?? 0;
115
+ expect(reasoningTokens).toBeGreaterThan(0);
116
+
117
+ // Verify the final message has content
118
+ const finalMessages = run.getRunMessages();
119
+ expect(finalMessages).toBeDefined();
120
+ expect(finalMessages?.length).toBeGreaterThan(0);
121
+ const assistantMsg = finalMessages?.[0];
122
+ expect(typeof assistantMsg?.content).toBe('string');
123
+ expect((assistantMsg?.content as string).length).toBeGreaterThan(0);
124
+
125
+ return { usage, reasoningTokens, finalMessages };
126
+ }
127
+
59
128
  test(`${capitalizeFirstLetter(provider)}: simple stream + title`, async () => {
60
129
  const { userName, location } = await getArgs();
61
- const llmConfig = getLLMConfig(provider);
62
130
  const customHandlers = setupCustomHandlers();
63
131
 
64
132
  run = await Run.create<t.IState>({
65
133
  runId: 'or-run-1',
66
134
  graphConfig: {
67
135
  type: 'standard',
68
- llmConfig,
136
+ llmConfig: baseLLMConfig,
69
137
  tools: [new Calculator()],
70
138
  instructions: 'You are a friendly AI assistant.',
71
139
  additional_instructions: `The user's name is ${userName} and they are located in ${location}.`,
@@ -104,4 +172,97 @@ describeIf(`${capitalizeFirstLetter(provider)} Streaming Tests`, () => {
104
172
  });
105
173
  expect(titleRes.title).toBeDefined();
106
174
  });
175
+
176
+ test(`${capitalizeFirstLetter(provider)}: Anthropic does NOT reason by default (no config)`, async () => {
177
+ const { reasoning: _baseReasoning, ...baseWithoutReasoning } =
178
+ baseLLMConfig as unknown as Record<string, unknown>;
179
+ const llmConfig = {
180
+ ...baseWithoutReasoning,
181
+ model: 'anthropic/claude-sonnet-4',
182
+ } as t.LLMConfig;
183
+ const customHandlers = setupCustomHandlers();
184
+
185
+ run = await Run.create<t.IState>({
186
+ runId: 'or-anthropic-default-1',
187
+ graphConfig: {
188
+ type: 'standard',
189
+ llmConfig,
190
+ instructions: 'You are a helpful AI assistant.',
191
+ },
192
+ returnContent: true,
193
+ skipCleanup: true,
194
+ customHandlers,
195
+ });
196
+
197
+ conversationHistory.push(
198
+ new HumanMessage('What is 15 * 37 + 128 / 4? Show your work.')
199
+ );
200
+
201
+ await run.processStream(
202
+ { messages: conversationHistory },
203
+ { ...configV2, configurable: { thread_id: 'or-anthropic-default-1' } }
204
+ );
205
+
206
+ expect(collectedUsage.length).toBeGreaterThan(0);
207
+ const usage = collectedUsage[0];
208
+ // Anthropic requires explicit reasoning config — no reasoning tokens by default
209
+ const reasoningTokens =
210
+ (usage.output_token_details as Record<string, number> | undefined)
211
+ ?.reasoning ?? 0;
212
+ expect(reasoningTokens).toBe(0);
213
+ });
214
+
215
+ test(`${capitalizeFirstLetter(provider)}: Gemini 3 reasons by default (no config)`, async () => {
216
+ await runReasoningTest({
217
+ model: 'google/gemini-3-pro-preview',
218
+ reasoning: undefined,
219
+ threadId: 'or-gemini-default-1',
220
+ runId: 'or-gemini-default-1',
221
+ });
222
+ });
223
+
224
+ test(`${capitalizeFirstLetter(provider)}: Gemini reasoning with max_tokens`, async () => {
225
+ await runReasoningTest({
226
+ model: 'google/gemini-3-pro-preview',
227
+ reasoning: { max_tokens: 4000 },
228
+ threadId: 'or-gemini-reasoning-1',
229
+ runId: 'or-gemini-reasoning-1',
230
+ });
231
+ });
232
+
233
+ test(`${capitalizeFirstLetter(provider)}: Gemini reasoning with effort`, async () => {
234
+ await runReasoningTest({
235
+ model: 'google/gemini-3-flash-preview',
236
+ reasoning: { effort: 'low' },
237
+ threadId: 'or-gemini-effort-1',
238
+ runId: 'or-gemini-effort-1',
239
+ });
240
+ });
241
+
242
+ test(`${capitalizeFirstLetter(provider)}: Anthropic reasoning with max_tokens`, async () => {
243
+ await runReasoningTest({
244
+ model: 'anthropic/claude-sonnet-4',
245
+ reasoning: { max_tokens: 4000 },
246
+ threadId: 'or-anthropic-reasoning-1',
247
+ runId: 'or-anthropic-reasoning-1',
248
+ });
249
+ });
250
+
251
+ test(`${capitalizeFirstLetter(provider)}: Anthropic sonnet-4 reasoning with effort`, async () => {
252
+ await runReasoningTest({
253
+ model: 'anthropic/claude-sonnet-4',
254
+ reasoning: { effort: 'medium' },
255
+ threadId: 'or-anthropic-effort-s4-1',
256
+ runId: 'or-anthropic-effort-s4-1',
257
+ });
258
+ });
259
+
260
+ test(`${capitalizeFirstLetter(provider)}: Anthropic sonnet-4-6 reasoning with effort`, async () => {
261
+ await runReasoningTest({
262
+ model: 'anthropic/claude-sonnet-4-6',
263
+ reasoning: { effort: 'medium' },
264
+ threadId: 'or-anthropic-effort-s46-1',
265
+ runId: 'or-anthropic-effort-s46-1',
266
+ });
267
+ });
107
268
  });
package/src/types/llm.ts CHANGED
@@ -11,7 +11,6 @@ import type {
11
11
  ClientOptions as OAIClientOptions,
12
12
  } from '@langchain/openai';
13
13
  import type { GoogleGenerativeAIChatInput } from '@langchain/google-genai';
14
- import type { GeminiGenerationConfig } from '@langchain/google-common';
15
14
  import type { ChatVertexAIInput } from '@langchain/google-vertexai';
16
15
  import type { ChatDeepSeekCallOptions } from '@langchain/deepseek';
17
16
  import type { ChatOpenRouterCallOptions } from '@/llm/openrouter';
@@ -55,6 +54,11 @@ export type AnthropicReasoning = {
55
54
  thinking?: ThinkingConfig | boolean;
56
55
  thinkingBudget?: number;
57
56
  };
57
+ export type GoogleThinkingConfig = {
58
+ thinkingBudget?: number;
59
+ includeThoughts?: boolean;
60
+ thinkingLevel?: string;
61
+ };
58
62
  export type OpenAIClientOptions = ChatOpenAIFields;
59
63
  export type AnthropicClientOptions = AnthropicInput & {
60
64
  promptCache?: boolean;
@@ -62,6 +66,7 @@ export type AnthropicClientOptions = AnthropicInput & {
62
66
  export type MistralAIClientOptions = ChatMistralAIInput;
63
67
  export type VertexAIClientOptions = ChatVertexAIInput & {
64
68
  includeThoughts?: boolean;
69
+ thinkingConfig?: GoogleThinkingConfig;
65
70
  };
66
71
  export type BedrockAnthropicInput = ChatBedrockConverseInput & {
67
72
  additionalModelRequestFields?: ChatBedrockConverseInput['additionalModelRequestFields'] &
@@ -72,7 +77,7 @@ export type BedrockConverseClientOptions = ChatBedrockConverseInput;
72
77
  export type BedrockAnthropicClientOptions = BedrockAnthropicInput;
73
78
  export type GoogleClientOptions = GoogleGenerativeAIChatInput & {
74
79
  customHeaders?: RequestOptions['customHeaders'];
75
- thinkingConfig?: GeminiGenerationConfig['thinkingConfig'];
80
+ thinkingConfig?: GoogleThinkingConfig;
76
81
  };
77
82
  export type DeepSeekClientOptions = ChatDeepSeekCallOptions;
78
83
  export type XAIClientOptions = ChatXAIInput;
@@ -67,11 +67,10 @@ export const llmConfigs: Record<string, t.LLMConfig | undefined> = {
67
67
  'X-Title': 'LibreChat',
68
68
  },
69
69
  },
70
- include_reasoning: true,
70
+ reasoning: {
71
+ max_tokens: 8000,
72
+ },
71
73
  modelKwargs: {
72
- reasoning: {
73
- max_tokens: 8000,
74
- },
75
74
  max_tokens: 10000,
76
75
  },
77
76
  } as or.ChatOpenRouterCallOptions & t.LLMConfig,