npm - @librechat/agents - Versions diffs - 3.1.73 → 3.1.75 - Mend

@librechat/agents 3.1.73 → 3.1.75

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (53)

package/README.md +66 -0
package/dist/cjs/agents/AgentContext.cjs +146 -57
package/dist/cjs/agents/AgentContext.cjs.map +1 -1
package/dist/cjs/llm/anthropic/utils/message_inputs.cjs +4 -1
package/dist/cjs/llm/anthropic/utils/message_inputs.cjs.map +1 -1
package/dist/cjs/main.cjs +1 -0
package/dist/cjs/main.cjs.map +1 -1
package/dist/cjs/messages/cache.cjs +37 -3
package/dist/cjs/messages/cache.cjs.map +1 -1
package/dist/cjs/tools/BashExecutor.cjs +21 -11
package/dist/cjs/tools/BashExecutor.cjs.map +1 -1
package/dist/cjs/tools/CodeExecutor.cjs +37 -10
package/dist/cjs/tools/CodeExecutor.cjs.map +1 -1
package/dist/cjs/tools/ProgrammaticToolCalling.cjs +16 -11
package/dist/cjs/tools/ProgrammaticToolCalling.cjs.map +1 -1
package/dist/esm/agents/AgentContext.mjs +147 -58
package/dist/esm/agents/AgentContext.mjs.map +1 -1
package/dist/esm/llm/anthropic/utils/message_inputs.mjs +4 -1
package/dist/esm/llm/anthropic/utils/message_inputs.mjs.map +1 -1
package/dist/esm/main.mjs +1 -1
package/dist/esm/messages/cache.mjs +37 -3
package/dist/esm/messages/cache.mjs.map +1 -1
package/dist/esm/tools/BashExecutor.mjs +22 -12
package/dist/esm/tools/BashExecutor.mjs.map +1 -1
package/dist/esm/tools/CodeExecutor.mjs +37 -11
package/dist/esm/tools/CodeExecutor.mjs.map +1 -1
package/dist/esm/tools/ProgrammaticToolCalling.mjs +17 -12
package/dist/esm/tools/ProgrammaticToolCalling.mjs.map +1 -1
package/dist/types/agents/AgentContext.d.ts +29 -4
package/dist/types/agents/__tests__/promptCacheLiveHelpers.d.ts +46 -0
package/dist/types/tools/CodeExecutor.d.ts +6 -0
package/dist/types/types/graph.d.ts +3 -1
package/dist/types/types/run.d.ts +2 -0
package/dist/types/types/tools.d.ts +9 -0
package/package.json +1 -1
package/src/agents/AgentContext.ts +189 -71
package/src/agents/__tests__/AgentContext.anthropic.live.test.ts +116 -0
package/src/agents/__tests__/AgentContext.bedrock.live.test.ts +149 -0
package/src/agents/__tests__/AgentContext.test.ts +333 -2
package/src/agents/__tests__/promptCacheLiveHelpers.ts +165 -0
package/src/llm/anthropic/utils/message_inputs.ts +6 -1
package/src/llm/anthropic/utils/server-tool-inputs.test.ts +77 -0
package/src/messages/cache.test.ts +104 -3
package/src/messages/cache.ts +54 -3
package/src/specs/anthropic.simple.test.ts +61 -0
package/src/specs/summarization.test.ts +7 -3
package/src/tools/BashExecutor.ts +37 -13
package/src/tools/CodeExecutor.ts +55 -11
package/src/tools/ProgrammaticToolCalling.ts +29 -14
package/src/tools/__tests__/ProgrammaticToolCalling.test.ts +60 -0
package/src/types/graph.ts +3 -1
package/src/types/run.ts +2 -0
package/src/types/tools.ts +9 -0

package/README.md ADDED

@@ -0,0 +1,66 @@
+# @librechat/agents
+TypeScript utilities for building LibreChat agent workflows. The package provides graph orchestration, streaming event handling, tool execution, provider adapters, and message formatting for single-agent and multi-agent runs.
+## Features
+- LangGraph-based single-agent and multi-agent workflows
+- Streaming content aggregation and run-step event handlers
+- Tool calling, tool search, subagent handoffs, and programmatic tool execution
+- Provider adapters for Anthropic, Bedrock, Vertex AI, OpenAI-compatible providers, Google, Mistral, DeepSeek, and xAI
+- Message formatting, context pruning, summarization, and cache-control helpers
+## Installation
+```bash
+npm install @librechat/agents
+```
+## Basic Usage
+```typescript
+import { HumanMessage } from '@langchain/core/messages';
+import { Providers, Run } from '@librechat/agents';
+const run = await Run.create({
+  runId: crypto.randomUUID(),
+  graphConfig: {
+    type: 'standard',
+    instructions: 'You are a helpful assistant.',
+    llmConfig: {
+      provider: Providers.OPENAI,
+      model: 'gpt-4o-mini',
+      apiKey: process.env.OPENAI_API_KEY,
+    },
+  },
+  returnContent: true,
+});
+const content = await run.processStream(
+  { messages: [new HumanMessage('Hello')] },
+  {
+    runId: crypto.randomUUID(),
+    streamMode: 'values',
+    version: 'v2',
+  }
+);
+```
+## Development
+```bash
+npm ci
+npm run build
+npm test
+npx tsc --noEmit
+npx eslint src/
+```
+## Documentation
+- [Multi-agent patterns](./docs/multi-agent-patterns.md)
+- [Summarization behavior](./docs/summarization-behavior.md)
+## License
+MIT

package/dist/cjs/agents/AgentContext.cjs CHANGED

@@ -192,7 +192,7 @@ class AgentContext {
     summaryTokenCount = 0;
     /**
      * Where the summary should be injected:
-     * - `'system_prompt'`: cross-run summary, included in `buildInstructionsString`
+     * - `'system_prompt'`: cross-run summary, included in the dynamic system tail
      * - `'user_message'`: mid-run compaction, injected as HumanMessage on clean slate
      * - `'none'`: no summary present
      */
@@ -298,15 +298,18 @@ class AgentContext {
     }
     /**
      * Gets the system runnable, creating it lazily if needed.
-     * Includes instructions, additional instructions, and programmatic-only tools documentation.
+     * Includes stable instructions, dynamic additional instructions, and
+     * programmatic-only tools documentation.
      * Only rebuilds when marked stale (via markToolsAsDiscovered).
      */
     get systemRunnable() {
         if (!this.systemRunnableStale && this.cachedSystemRunnable !== undefined) {
             return this.cachedSystemRunnable;
         }
-        const instructionsString = this.buildInstructionsString();
-        this.cachedSystemRunnable = this.buildSystemRunnable(instructionsString);
+        this.cachedSystemRunnable = this.buildSystemRunnable({
+            stableInstructions: this.buildStableInstructionsString(),
+            dynamicInstructions: this.buildDynamicInstructionsString(),
+        });
         this.systemRunnableStale = false;
         return this.cachedSystemRunnable;
     }
@@ -316,16 +319,18 @@ class AgentContext {
      */
     initializeSystemRunnable() {
         if (this.systemRunnableStale || this.cachedSystemRunnable === undefined) {
-            const instructionsString = this.buildInstructionsString();
-            this.cachedSystemRunnable = this.buildSystemRunnable(instructionsString);
+            this.cachedSystemRunnable = this.buildSystemRunnable({
+                stableInstructions: this.buildStableInstructionsString(),
+                dynamicInstructions: this.buildDynamicInstructionsString(),
+            });
             this.systemRunnableStale = false;
         }
     }
     /**
-     * Builds the raw instructions string (without creating SystemMessage).
+     * Builds the cacheable instructions string (without creating SystemMessage).
      * Includes agent identity preamble and handoff context when available.
      */
-    buildInstructionsString() {
+    buildStableInstructionsString() {
         const parts = [];
         const identityPreamble = this.buildIdentityPreamble();
         if (identityPreamble) {
@@ -334,17 +339,27 @@ class AgentContext {
         if (this.instructions != null && this.instructions !== '') {
             parts.push(this.instructions);
         }
-        if (this.additionalInstructions != null &&
-            this.additionalInstructions !== '') {
-            parts.push(this.additionalInstructions);
-        }
         const programmaticToolsDoc = this.buildProgrammaticOnlyToolsInstructions();
         if (programmaticToolsDoc) {
             parts.push(programmaticToolsDoc);
         }
-        // Cross-run summary: include in system prompt so the model has context
-        // from the prior run.  Mid-run summaries are injected as a HumanMessage
-        // on the post-compaction clean slate instead (see buildSystemRunnable).
+        return parts.join('\n\n');
+    }
+    /**
+     * Builds the dynamic system-tail string (without creating SystemMessage).
+     * Keep this out of prompt-cache-marked content so volatile context does not
+     * invalidate the stable prefix.
+     */
+    buildDynamicInstructionsString() {
+        const parts = [];
+        if (this.additionalInstructions != null &&
+            this.additionalInstructions !== '') {
+            parts.push(this.additionalInstructions);
+        }
+        // Cross-run summary: include in the system tail so the model has context
+        // from the prior run without invalidating the cacheable prefix. Mid-run
+        // summaries are injected as a HumanMessage on the post-compaction clean
+        // slate instead (see buildSystemRunnable).
         if (this._summaryLocation === 'system_prompt' &&
             this.summaryText != null &&
             this.summaryText !== '') {
@@ -375,34 +390,20 @@ class AgentContext {
      * Build system runnable from pre-built instructions string.
      * Only called when content has actually changed.
      */
-    buildSystemRunnable(instructionsString) {
+    buildSystemRunnable({ stableInstructions, dynamicInstructions, }) {
         const hasMidRunSummary = this._summaryLocation === 'user_message' &&
             this.summaryText != null &&
             this.summaryText !== '';
-        if (!instructionsString && !hasMidRunSummary) {
+        if (!stableInstructions && !dynamicInstructions && !hasMidRunSummary) {
             this.systemMessageTokens = 0;
             return undefined;
         }
-        let finalInstructions = instructionsString;
-        let usePromptCache = false;
-        if (this.provider === _enum.Providers.ANTHROPIC) {
-            const anthropicOptions = this.clientOptions;
-            if (anthropicOptions?.promptCache === true) {
-                usePromptCache = true;
-                finalInstructions = {
-                    content: [
-                        {
-                            type: 'text',
-                            text: instructionsString,
-                            cache_control: { type: 'ephemeral' },
-                        },
-                    ],
-                };
-            }
-        }
-        const systemMessage = instructionsString
-            ? new messages.SystemMessage(finalInstructions)
-            : undefined;
+        const usePromptCache = this.hasAnthropicPromptCache();
+        const systemMessage = this.buildSystemMessage({
+            stableInstructions,
+            dynamicInstructions,
+            usePromptCache,
+        });
         if (this.tokenCounter) {
             this.systemMessageTokens = systemMessage
                 ? this.tokenCounter(systemMessage)
@@ -444,6 +445,52 @@ class AgentContext {
             return [...prefix, ...body];
         }).withConfig({ runName: 'prompt' });
     }
+    hasAnthropicPromptCache() {
+        if (this.provider !== _enum.Providers.ANTHROPIC) {
+            return false;
+        }
+        const anthropicOptions = this.clientOptions;
+        return anthropicOptions?.promptCache === true;
+    }
+    hasBedrockPromptCache() {
+        if (this.provider !== _enum.Providers.BEDROCK) {
+            return false;
+        }
+        const bedrockOptions = this.clientOptions;
+        return bedrockOptions?.promptCache === true;
+    }
+    buildSystemMessage({ stableInstructions, dynamicInstructions, usePromptCache, }) {
+        if (!stableInstructions && !dynamicInstructions) {
+            return undefined;
+        }
+        if (usePromptCache) {
+            const content = [];
+            if (stableInstructions) {
+                content.push({
+                    type: 'text',
+                    text: stableInstructions,
+                    cache_control: { type: 'ephemeral' },
+                });
+            }
+            if (dynamicInstructions) {
+                content.push({ type: 'text', text: dynamicInstructions });
+            }
+            return new messages.SystemMessage({ content });
+        }
+        if (this.hasBedrockPromptCache() && stableInstructions) {
+            const content = [
+                { type: 'text', text: stableInstructions },
+                { cachePoint: { type: 'default' } },
+            ];
+            if (dynamicInstructions) {
+                content.push({ type: 'text', text: dynamicInstructions });
+            }
+            return new messages.SystemMessage({ content });
+        }
+        return new messages.SystemMessage([stableInstructions, dynamicInstructions]
+            .filter((part) => part !== '')
+            .join('\n\n'));
+    }
     /**
      * Reset context for a new run
      */
@@ -505,7 +552,44 @@ class AgentContext {
         if (!this.toolDefinitions) {
             return [];
         }
-        return this.toolDefinitions.filter((def) => def.defer_loading !== true || this.discoveredToolNames.has(def.name));
+        /**
+         * Mirror `getEventDrivenToolsForBinding`'s gate: a definition is only
+         * bound to the model when its `allowed_callers` include `'direct'` and
+         * (if deferred) it has been discovered. Filtering by `defer_loading`
+         * alone left programmatic-only definitions counted in
+         * `toolSchemaTokens` even though they were never bound.
+         */
+        return this.toolDefinitions.filter((def) => {
+            const allowedCallers = def.allowed_callers ?? ['direct'];
+            if (!allowedCallers.includes('direct')) {
+                return false;
+            }
+            return (def.defer_loading !== true || this.discoveredToolNames.has(def.name));
+        });
+    }
+    /**
+     * Single source of truth for "which entries of `this.tools` should be
+     * treated as actually bound". Callers:
+     *   - `getToolsForBinding` (non-event-driven branch)
+     *   - `getEventDrivenToolsForBinding` (appends instance tools alongside
+     *     schema-only definitions)
+     *   - `calculateInstructionTokens` (counts schema bytes for accounting)
+     *
+     * In event-driven mode (`toolDefinitions` present) instance tools are
+     * appended unfiltered; outside event-driven mode they pass through
+     * `filterToolsForBinding`. Centralizing the decision here prevents the
+     * accounting/binding paths from drifting apart, which was the root
+     * cause of the original miscount.
+     */
+    getEffectiveInstanceTools() {
+        if (!this.tools) {
+            return undefined;
+        }
+        const isEventDriven = (this.toolDefinitions?.length ?? 0) > 0;
+        if (isEventDriven || !this.toolRegistry) {
+            return this.tools;
+        }
+        return this.filterToolsForBinding(this.tools);
     }
     /**
      * Calculate tool tokens and add to instruction tokens
@@ -520,9 +604,17 @@ class AgentContext {
          * populated after `fromConfig()` kicks off the initial calculation, so
          * callers that mutate `graphTools` must re-trigger this method to
          * refresh `toolSchemaTokens`.
+         *
+         * Use `getEffectiveInstanceTools()` so accounting reflects exactly the
+         * subset that `getToolsForBinding` would emit — preventing the
+         * worst-case-ceiling miscount that triggered spurious `empty_messages`
+         * preflight rejections at low `maxContextTokens`. Deferred and
+         * non-`'direct'` `toolDefinitions` are excluded by
+         * `getActiveToolDefinitions()` below.
          */
         const instanceTools = [
-            ...(this.tools ?? []),
+            ...(this.getEffectiveInstanceTools() ??
+                []),
             ...(this.graphTools ?? []),
         ];
         if (instanceTools.length > 0) {
@@ -682,7 +774,16 @@ class AgentContext {
      */
     getTokenBudgetBreakdown(messages) {
         const maxContextTokens = this.maxContextTokens ?? 0;
-        const toolCount = (this.tools?.length ?? 0) + this.getActiveToolDefinitions().length;
+        /**
+         * Derive `toolCount` from `getToolsForBinding()` so the diagnostic stays
+         * aligned with what is actually bound to the model — and with what
+         * `calculateInstructionTokens` counts into `toolSchemaTokens`. Using raw
+         * `this.tools.length` would inflate the count whenever the registry
+         * marks instance tools as deferred-undiscovered or non-`'direct'`,
+         * producing the same misleading "N tools" diagnostic this fix is meant
+         * to eliminate.
+         */
+        const toolCount = this.getToolsForBinding()?.length ?? 0;
         const messageCount = messages?.length ?? 0;
         let messageTokens = 0;
         if (messages != null) {
@@ -780,9 +881,7 @@ class AgentContext {
         if (this.toolDefinitions && this.toolDefinitions.length > 0) {
             return this.getEventDrivenToolsForBinding();
         }
-        const filtered = !this.tools || !this.toolRegistry
-            ? this.tools
-            : this.filterToolsForBinding(this.tools);
+        const filtered = this.getEffectiveInstanceTools();
         if (this.graphTools && this.graphTools.length > 0) {
             return [...(filtered ?? []), ...this.graphTools];
         }
@@ -793,24 +892,14 @@ class AgentContext {
         if (!this.toolDefinitions) {
             return this.graphTools ?? [];
         }
-        const defsToInclude = this.toolDefinitions.filter((def) => {
-            const allowedCallers = def.allowed_callers ?? ['direct'];
-            if (!allowedCallers.includes('direct')) {
-                return false;
-            }
-            if (def.defer_loading === true &&
-                !this.discoveredToolNames.has(def.name)) {
-                return false;
-            }
-            return true;
-        });
-        const schemaTools = schema$1.createSchemaOnlyTools(defsToInclude);
+        const schemaTools = schema$1.createSchemaOnlyTools(this.getActiveToolDefinitions());
         const allTools = [...schemaTools];
         if (this.graphTools && this.graphTools.length > 0) {
             allTools.push(...this.graphTools);
         }
-        if (this.tools && this.tools.length > 0) {
-            allTools.push(...this.tools);
+        const instanceTools = this.getEffectiveInstanceTools();
+        if (instanceTools && instanceTools.length > 0) {
+            allTools.push(...instanceTools);
         }
         return allTools;
     }