npm - @librechat/agents - Versions diffs - 3.1.71-dev.0 → 3.1.71 - Mend

@librechat/agents 3.1.71-dev.0 → 3.1.71

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (38)

package/dist/cjs/graphs/Graph.cjs +7 -0
package/dist/cjs/graphs/Graph.cjs.map +1 -1
package/dist/cjs/llm/invoke.cjs +13 -2
package/dist/cjs/llm/invoke.cjs.map +1 -1
package/dist/cjs/tools/BashExecutor.cjs +3 -1
package/dist/cjs/tools/BashExecutor.cjs.map +1 -1
package/dist/cjs/tools/ToolNode.cjs +84 -55
package/dist/cjs/tools/ToolNode.cjs.map +1 -1
package/dist/cjs/tools/toolOutputReferences.cjs +195 -0
package/dist/cjs/tools/toolOutputReferences.cjs.map +1 -1
package/dist/esm/graphs/Graph.mjs +7 -0
package/dist/esm/graphs/Graph.mjs.map +1 -1
package/dist/esm/llm/invoke.mjs +13 -2
package/dist/esm/llm/invoke.mjs.map +1 -1
package/dist/esm/tools/BashExecutor.mjs +3 -1
package/dist/esm/tools/BashExecutor.mjs.map +1 -1
package/dist/esm/tools/ToolNode.mjs +85 -56
package/dist/esm/tools/ToolNode.mjs.map +1 -1
package/dist/esm/tools/toolOutputReferences.mjs +195 -1
package/dist/esm/tools/toolOutputReferences.mjs.map +1 -1
package/dist/types/graphs/Graph.d.ts +9 -2
package/dist/types/llm/invoke.d.ts +29 -3
package/dist/types/tools/ToolNode.d.ts +11 -13
package/dist/types/tools/toolOutputReferences.d.ts +31 -0
package/dist/types/types/index.d.ts +1 -0
package/dist/types/types/messages.d.ts +26 -0
package/package.json +1 -1
package/src/graphs/Graph.ts +8 -1
package/src/llm/invoke.test.ts +446 -0
package/src/llm/invoke.ts +45 -5
package/src/tools/BashExecutor.ts +3 -1
package/src/tools/ToolNode.ts +94 -81
package/src/tools/__tests__/BashExecutor.test.ts +13 -0
package/src/tools/__tests__/ToolNode.outputReferences.test.ts +98 -55
package/src/tools/__tests__/annotateMessagesForLLM.test.ts +479 -0
package/src/tools/toolOutputReferences.ts +235 -0
package/src/types/index.ts +1 -0
package/src/types/messages.ts +27 -0

package/src/llm/invoke.test.ts ADDED Viewed

@@ -0,0 +1,446 @@
+import { z } from 'zod';
+import { tool } from '@langchain/core/tools';
+import {
+  AIMessage,
+  AIMessageChunk,
+  HumanMessage,
+  ToolMessage,
+} from '@langchain/core/messages';
+import { describe, it, expect, jest } from '@jest/globals';
+import type { BaseMessage } from '@langchain/core/messages';
+import type { StructuredToolInterface } from '@langchain/core/tools';
+import type * as t from '@/types';
+import { attemptInvoke, tryFallbackProviders } from '@/llm/invoke';
+import { ToolOutputReferenceRegistry } from '@/tools/toolOutputReferences';
+import { ToolNode } from '@/tools/ToolNode';
+import { Providers } from '@/common';
+/**
+ * Minimal stub model shape `attemptInvoke` reads. Either `invoke` or
+ * `stream` is populated depending on which path the test exercises;
+ * extending the real `BaseChatModel` would pull in too much surface.
+ */
+type StubModel = {
+  invoke?: (messages: BaseMessage[], config?: unknown) => Promise<AIMessage>;
+  stream?: (
+    messages: BaseMessage[],
+    config?: unknown
+  ) => AsyncGenerator<AIMessageChunk>;
+};
+type CapturingModel = {
+  invokeMessages: BaseMessage[][];
+  model: StubModel;
+};
+type StreamingCapturingModel = {
+  streamMessages: BaseMessage[][];
+  model: StubModel;
+};
+function buildCapturingModel(): CapturingModel {
+  const invokeMessages: BaseMessage[][] = [];
+  const responseMsg = new AIMessage({ content: 'ok' });
+  const model: StubModel = {
+    invoke: jest.fn(async (messages: BaseMessage[]): Promise<AIMessage> => {
+      invokeMessages.push(messages);
+      return responseMsg;
+    }),
+  };
+  return { invokeMessages, model };
+}
+function buildStreamingCapturingModel(): StreamingCapturingModel {
+  const streamMessages: BaseMessage[][] = [];
+  const model: StubModel = {
+    stream: jest.fn(async function* (
+      messages: BaseMessage[]
+    ): AsyncGenerator<AIMessageChunk> {
+      streamMessages.push(messages);
+      yield new AIMessageChunk({ content: 'ok' });
+    }),
+  };
+  return { streamMessages, model };
+}
+describe('attemptInvoke applies lazy ref annotation', () => {
+  it('annotates ToolMessages with live _refKey before sending to provider (non-streaming)', async () => {
+    const registry = new ToolOutputReferenceRegistry();
+    registry.set('run-1', 'tool0turn0', 'stored');
+    const context = {
+      getOrCreateToolOutputRegistry: () => registry,
+    } as unknown as Parameters<typeof attemptInvoke>[0]['context'];
+    const messages: BaseMessage[] = [
+      new HumanMessage('hi'),
+      new ToolMessage({
+        name: 'echo',
+        tool_call_id: 'tc1',
+        status: 'success',
+        content: 'output',
+        additional_kwargs: { _refKey: 'tool0turn0' },
+      }),
+    ];
+    const { invokeMessages, model } = buildCapturingModel();
+    await attemptInvoke(
+      {
+        model: model as t.ChatModel,
+        messages,
+        provider: Providers.ANTHROPIC,
+        context,
+      },
+      { configurable: { run_id: 'run-1' } }
+    );
+    expect(invokeMessages).toHaveLength(1);
+    const sent = invokeMessages[0];
+    expect(sent[1].content).toBe('[ref: tool0turn0]\noutput');
+    const original = messages[1] as ToolMessage;
+    expect(original.content).toBe('output');
+    expect(original.additional_kwargs._refKey).toBe('tool0turn0');
+    expect(messages[1]).not.toBe(sent[1]);
+  });
+  it('annotates messages passed to model.stream (streaming path)', async () => {
+    const registry = new ToolOutputReferenceRegistry();
+    registry.set('run-2', 'tool0turn0', 'stored');
+    const context = {
+      getOrCreateToolOutputRegistry: () => registry,
+    } as unknown as Parameters<typeof attemptInvoke>[0]['context'];
+    const messages: BaseMessage[] = [
+      new ToolMessage({
+        name: 'echo',
+        tool_call_id: 'tc1',
+        status: 'success',
+        content: 'output',
+        additional_kwargs: { _refKey: 'tool0turn0' },
+      }),
+    ];
+    const { streamMessages, model } = buildStreamingCapturingModel();
+    await attemptInvoke(
+      {
+        model: model as t.ChatModel,
+        messages,
+        provider: Providers.ANTHROPIC,
+        context,
+        onChunk: () => {
+          /* swallow */
+        },
+      },
+      { configurable: { run_id: 'run-2' } }
+    );
+    expect(streamMessages).toHaveLength(1);
+    expect(streamMessages[0][0].content).toBe('[ref: tool0turn0]\noutput');
+    expect(messages[0].content).toBe('output');
+  });
+  it('passes messages unchanged when no registry is exposed on context (e.g. summarization)', async () => {
+    const messages: BaseMessage[] = [
+      new ToolMessage({
+        name: 'echo',
+        tool_call_id: 'tc1',
+        status: 'success',
+        content: 'output',
+        additional_kwargs: { _refKey: 'tool0turn0' },
+      }),
+    ];
+    const { invokeMessages, model } = buildCapturingModel();
+    await attemptInvoke({
+      model: model as t.ChatModel,
+      messages,
+      provider: Providers.ANTHROPIC,
+    });
+    expect(invokeMessages).toHaveLength(1);
+    expect(invokeMessages[0][0].content).toBe('output');
+  });
+  it('skips annotation for stale _refKey not present in current run registry (cross-run scenario)', async () => {
+    const registry = new ToolOutputReferenceRegistry();
+    // run-3 registry holds tool0turn0 - the current run's live ref
+    registry.set('run-3', 'tool0turn0', 'live-stored');
+    const context = {
+      getOrCreateToolOutputRegistry: () => registry,
+    } as unknown as Parameters<typeof attemptInvoke>[0]['context'];
+    const messages: BaseMessage[] = [
+      // Stale ToolMessage standing in for one hydrated from a prior run.
+      // A real stale _refKey may collide with a live key while meaning
+      // something else; this test uses a key ('tool5turn5') absent from
+      // the current registry to demonstrate the no-op behavior.
+      new ToolMessage({
+        name: 'echo',
+        tool_call_id: 'old',
+        status: 'success',
+        content: 'old-output',
+        additional_kwargs: { _refKey: 'tool5turn5' },
+      }),
+      new ToolMessage({
+        name: 'echo',
+        tool_call_id: 'new',
+        status: 'success',
+        content: 'new-output',
+        additional_kwargs: { _refKey: 'tool0turn0' },
+      }),
+    ];
+    const { invokeMessages, model } = buildCapturingModel();
+    await attemptInvoke(
+      {
+        model: model as t.ChatModel,
+        messages,
+        provider: Providers.ANTHROPIC,
+        context,
+      },
+      { configurable: { run_id: 'run-3' } }
+    );
+    const sent = invokeMessages[0];
+    expect(sent[0].content).toBe('old-output');
+    expect(sent[1].content).toBe('[ref: tool0turn0]\nnew-output');
+  });
+  it('applies unresolved-refs annotation regardless of registry presence', async () => {
+    const registry = new ToolOutputReferenceRegistry();
+    const context = {
+      getOrCreateToolOutputRegistry: () => registry,
+    } as unknown as Parameters<typeof attemptInvoke>[0]['context'];
+    const messages: BaseMessage[] = [
+      new ToolMessage({
+        name: 'echo',
+        tool_call_id: 'tc1',
+        status: 'error',
+        content: 'Error: bad ref',
+        additional_kwargs: { _unresolvedRefs: ['tool9turn9'] },
+      }),
+    ];
+    const { invokeMessages, model } = buildCapturingModel();
+    await attemptInvoke(
+      {
+        model: model as t.ChatModel,
+        messages,
+        provider: Providers.ANTHROPIC,
+        context,
+      },
+      { configurable: { run_id: 'run-err' } }
+    );
+    expect(invokeMessages[0][0].content).toBe(
+      'Error: bad ref\n[unresolved refs: tool9turn9]'
+    );
+  });
+  it('annotates refs registered under an anonymous-batch scope (no run_id)', async () => {
+    /**
+     * Regression: anonymous ToolNode invocations register refs under
+     * a synthetic per-batch scope (`\0anon-<n>`) that
+     * `config.configurable.run_id` cannot recover. The transform must
+     * read the message-stamped `_refScope` rather than relying on the
+     * config-derived runId, otherwise the registry lookup misses and
+     * the LLM never sees the `[ref: …]` marker.
+     */
+    const registry = new ToolOutputReferenceRegistry();
+    const anonScope = '\0anon-0';
+    registry.set(anonScope, 'tool0turn0', 'stored');
+    const context = {
+      getOrCreateToolOutputRegistry: () => registry,
+    } as unknown as Parameters<typeof attemptInvoke>[0]['context'];
+    const messages: BaseMessage[] = [
+      new ToolMessage({
+        name: 'echo',
+        tool_call_id: 'tc1',
+        status: 'success',
+        content: 'output',
+        additional_kwargs: {
+          _refKey: 'tool0turn0',
+          _refScope: anonScope,
+        },
+      }),
+    ];
+    const { invokeMessages, model } = buildCapturingModel();
+    await attemptInvoke({
+      model: model as t.ChatModel,
+      messages,
+      provider: Providers.ANTHROPIC,
+      context,
+    });
+    expect(invokeMessages[0][0].content).toBe('[ref: tool0turn0]\noutput');
+  });
+});
+describe('tryFallbackProviders applies the same lazy annotation transform', () => {
+  it('threads context through to attemptInvoke so fallback messages are annotated', async () => {
+    const registry = new ToolOutputReferenceRegistry();
+    registry.set('run-fb', 'tool0turn0', 'stored');
+    const context = {
+      getOrCreateToolOutputRegistry: () => registry,
+    } as unknown as Parameters<typeof attemptInvoke>[0]['context'];
+    const messages: BaseMessage[] = [
+      new ToolMessage({
+        name: 'echo',
+        tool_call_id: 'tc1',
+        status: 'success',
+        content: 'output',
+        additional_kwargs: { _refKey: 'tool0turn0' },
+      }),
+    ];
+    const { invokeMessages, model } = buildCapturingModel();
+    /**
+     * Stub `initializeModel` by replacing the `@/llm/init` module with
+     * `jest.doMock` so the fallback path returns our capturing model.
+     * Without the stub, the fallback would pull in the real provider
+     * init chain (Anthropic, etc.), which the rest of this test layer
+     * does not bring in.
+     */
+    jest.doMock('@/llm/init', () => ({
+      initializeModel: (): unknown => model,
+    }));
+    // Reset the module so the doMock takes effect.
+    jest.resetModules();
+    const { tryFallbackProviders: freshTry } = (await import(
+      '@/llm/invoke'
+    )) as { tryFallbackProviders: typeof tryFallbackProviders };
+    await freshTry({
+      fallbacks: [{ provider: Providers.ANTHROPIC }],
+      messages,
+      primaryError: new Error('primary failed'),
+      context,
+      config: { configurable: { run_id: 'run-fb' } },
+    });
+    expect(invokeMessages.length).toBeGreaterThanOrEqual(1);
+    expect(invokeMessages[invokeMessages.length - 1][0].content).toBe(
+      '[ref: tool0turn0]\noutput'
+    );
+    jest.dontMock('@/llm/init');
+    jest.resetModules();
+  });
+});
+describe('cross-run hydration through ToolNode + attemptInvoke', () => {
+  it('annotates run 2 refs but leaves hydrated run 1 ToolMessages untouched', async () => {
+    /**
+     * Smoke test for the headline scenario: ToolMessages produced in
+     * run 1 are persisted with clean content + `_refKey`/`_refScope`
+     * metadata. When those messages are hydrated into run 2's state
+     * and run 2 produces its own tool output, the annotation transform
+     * must (a) annotate run 2's fresh tool message because its
+     * `_refScope` is live in run 2's registry, and (b) leave run 1's
+     * tool message clean because run 1's scope is not in run 2's
+     * registry. Same `tool0turn0` key collides across runs without any
+     * confusion.
+     */
+    const echo = tool(async (input) => (input as { command: string }).command, {
+      name: 'echo',
+      description: 'echoes its command back',
+      schema: z.object({ command: z.string() }),
+    }) as unknown as StructuredToolInterface;
+    /* Run 1 */
+    const run1Node = new ToolNode({
+      tools: [echo],
+      toolOutputReferences: { enabled: true },
+    });
+    const run1Result = (await run1Node.invoke(
+      {
+        messages: [
+          new AIMessage({
+            content: '',
+            tool_calls: [
+              { id: 'r1c1', name: 'echo', args: { command: 'run-1-output' } },
+            ],
+          }),
+        ],
+      },
+      { configurable: { run_id: 'run-1' } }
+    )) as { messages: ToolMessage[] };
+    const run1ToolMsg = run1Result.messages[0];
+    expect(run1ToolMsg.content).toBe('run-1-output');
+    expect(run1ToolMsg.additional_kwargs._refKey).toBe('tool0turn0');
+    expect(run1ToolMsg.additional_kwargs._refScope).toBe('run-1');
+    /* Run 2 - fresh ToolNode and registry, simulating a new session */
+    const run2Node = new ToolNode({
+      tools: [echo],
+      toolOutputReferences: { enabled: true },
+    });
+    const run2Result = (await run2Node.invoke(
+      {
+        messages: [
+          new AIMessage({
+            content: '',
+            tool_calls: [
+              { id: 'r2c1', name: 'echo', args: { command: 'run-2-output' } },
+            ],
+          }),
+        ],
+      },
+      { configurable: { run_id: 'run-2' } }
+    )) as { messages: ToolMessage[] };
+    const run2ToolMsg = run2Result.messages[0];
+    expect(run2ToolMsg.content).toBe('run-2-output');
+    expect(run2ToolMsg.additional_kwargs._refKey).toBe('tool0turn0');
+    expect(run2ToolMsg.additional_kwargs._refScope).toBe('run-2');
+    /* Hydrate run 1's message + run 2's message into a single state */
+    const hydrated: BaseMessage[] = [
+      new HumanMessage('first request'),
+      run1ToolMsg,
+      new HumanMessage('second request'),
+      run2ToolMsg,
+    ];
+    /* attemptInvoke with run 2's registry */
+    const context = {
+      getOrCreateToolOutputRegistry: () =>
+        run2Node._unsafeGetToolOutputRegistry(),
+    } as unknown as Parameters<typeof attemptInvoke>[0]['context'];
+    const { invokeMessages, model } = buildCapturingModel();
+    await attemptInvoke(
+      {
+        model: model as t.ChatModel,
+        messages: hydrated,
+        provider: Providers.ANTHROPIC,
+        context,
+      },
+      { configurable: { run_id: 'run-2' } }
+    );
+    const sent = invokeMessages[0];
+    /* Run 1's hydrated tool message stays clean — its scope is stale */
+    expect(sent[1].content).toBe('run-1-output');
+    /* Run 2's tool message gets annotated — its scope is live */
+    expect(sent[3].content).toBe('[ref: tool0turn0]\nrun-2-output');
+    /* Persisted state is unchanged */
+    expect(hydrated[1].content).toBe('run-1-output');
+    expect(hydrated[3].content).toBe('run-2-output');
+  });
+});

package/src/llm/invoke.ts CHANGED Viewed

@@ -3,18 +3,47 @@ import { AIMessageChunk } from '@langchain/core/messages';
 import type { RunnableConfig } from '@langchain/core/runnables';
 import type { ToolCall } from '@langchain/core/messages/tool';
 import type { BaseMessage } from '@langchain/core/messages';
+import type { ToolOutputReferenceRegistry } from '@/tools/toolOutputReferences';
 import type * as t from '@/types';
 import { manualToolStreamProviders } from '@/llm/providers';
+import { annotateMessagesForLLM } from '@/tools/toolOutputReferences';
 import { modifyDeltaProperties } from '@/messages';
 import { ChatModelStreamHandler } from '@/stream';
 import { GraphEvents, Providers } from '@/common';
 import { initializeModel } from '@/llm/init';
 /**
- * Context passed to `attemptInvoke` for the default stream handler.
- * Matches the subset of Graph that `ChatModelStreamHandler.handle` needs.
+ * Context passed to `attemptInvoke`. Matches the subset of Graph that
+ * `ChatModelStreamHandler.handle` needs *plus* the explicit
+ * `getOrCreateToolOutputRegistry()` accessor that `attemptInvoke`
+ * itself calls to pull the run-scoped tool-output registry off the
+ * graph and project each relevant ToolMessage into a transient
+ * annotated copy before the provider call.
+ *
+ * The intersection is intentional: `Parameters<...>[3]` resolves
+ * indirectly through the stream handler's signature (to
+ * `StandardGraph`, which has exposed the accessor since #117), but
+ * stating it explicitly here surfaces the contract at the call site —
+ * a developer reading `attemptInvoke` doesn't have to chase the
+ * upstream handler's parameter list to discover that
+ * `context?.getOrCreateToolOutputRegistry()` is a real thing. Single
+ * optional chain only — the method itself is required on the
+ * `StandardGraph` branch of the intersection, so the second `?.` is
+ * unnecessary at the call site.
+ *
+ * `NonNullable<...>` strips `undefined` from the upstream parameter
+ * type so the intersection doesn't collapse to `never` on the
+ * undefined branch; callers express optionality via `context?:
+ * InvokeContext` on the function signature instead.
+ *
+ * Callers without a registry (e.g. summarization) simply pass no
+ * `context` and the transform safely no-ops.
  */
-export type InvokeContext = Parameters<ChatModelStreamHandler['handle']>[3];
+export type InvokeContext = NonNullable<
+  Parameters<ChatModelStreamHandler['handle']>[3]
+> & {
+  getOrCreateToolOutputRegistry?(): ToolOutputReferenceRegistry | undefined;
+};
 /**
  * Per-chunk callback for custom stream processing.
@@ -47,8 +76,19 @@ export async function attemptInvoke(
   },
   config?: RunnableConfig
 ): Promise<Partial<t.BaseGraphState>> {
+  /**
+   * Pull the run-scoped tool output registry off the graph (when one
+   * exists) and project ToolMessages carrying ref metadata into a
+   * transient annotated copy. The original `messages` array stays
+   * untouched so the graph state never sees `[ref: …]` / `_ref`
+   * payload.
+   */
+  const registry = context?.getOrCreateToolOutputRegistry();
+  const runId = config?.configurable?.run_id as string | undefined;
+  const messagesForProvider = annotateMessagesForLLM(messages, registry, runId);
   if (model.stream) {
-    const stream = await model.stream(messages, config);
+    const stream = await model.stream(messagesForProvider, config);
     let finalChunk: AIMessageChunk | undefined;
     if (onChunk) {
@@ -83,7 +123,7 @@ export async function attemptInvoke(
     return { messages: [finalChunk as AIMessageChunk] };
   }
-  const finalMessage = await model.invoke(messages, config);
+  const finalMessage = await model.invoke(messagesForProvider, config);
   if ((finalMessage.tool_calls?.length ?? 0) > 0) {
     finalMessage.tool_calls = finalMessage.tool_calls?.filter(
       (tool_call: ToolCall) => !!tool_call.name

package/src/tools/BashExecutor.ts CHANGED Viewed

@@ -66,7 +66,9 @@ Referencing previous tool outputs:
 - Every successful tool result is tagged with a reference key of the form \`tool<idx>turn<turn>\` (e.g., \`tool0turn0\`). The key appears either as a \`[ref: tool0turn0]\` prefix line or, when the output is a JSON object, as a \`_ref\` field on the object.
 - To pipe a previous tool output into this tool, embed the placeholder \`{{tool<idx>turn<turn>}}\` literally anywhere in the \`command\` string (or any string arg). It will be substituted with the stored output verbatim before the command runs.
 - The substituted value is the original output string (no \`[ref: …]\` prefix, no \`_ref\` key), so it is safe to pipe directly into \`jq\`, \`grep\`, \`awk\`, etc.
-- Example: \`echo '{{tool0turn0}}' | jq '.foo'\` takes the full output of the first tool from the first turn and pipes it into jq.
+- Example (simple ASCII output): \`echo '{{tool0turn0}}' | jq '.foo'\` takes the full output of the first tool from the first turn and pipes it into jq.
+- For payloads that may contain quotes, parentheses, backticks, or arbitrary bytes (random/binary data, JSON with embedded quotes, multi-line strings), prefer a quoted-delimiter heredoc over \`echo '…'\`. The heredoc body is not interpreted by the shell, so substituted payloads pass through unchanged.
+- Heredoc example: \`wc -c << 'EOF'\\n{{tool0turn0}}\\nEOF\` (the quotes around \`'EOF'\` disable interpolation inside the body).
 - Unknown reference keys are left in place and surfaced as \`[unresolved refs: …]\` after the output.
 `.trim();