npm - @illuma-ai/agents - Versions diffs - 1.1.20 → 1.1.22 - Mend

@illuma-ai/agents 1.1.20 → 1.1.22

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (246) hide show

package/dist/cjs/graphs/Graph.cjs +12 -1
package/dist/cjs/graphs/Graph.cjs.map +1 -1
package/dist/cjs/graphs/MultiAgentGraph.cjs +85 -1
package/dist/cjs/graphs/MultiAgentGraph.cjs.map +1 -1
package/dist/cjs/llm/bedrock/index.cjs +14 -0
package/dist/cjs/llm/bedrock/index.cjs.map +1 -1
package/dist/cjs/run.cjs +20 -9
package/dist/cjs/run.cjs.map +1 -1
package/dist/esm/graphs/Graph.mjs +12 -1
package/dist/esm/graphs/Graph.mjs.map +1 -1
package/dist/esm/graphs/MultiAgentGraph.mjs +85 -1
package/dist/esm/graphs/MultiAgentGraph.mjs.map +1 -1
package/dist/esm/llm/bedrock/index.mjs +14 -0
package/dist/esm/llm/bedrock/index.mjs.map +1 -1
package/dist/esm/run.mjs +20 -9
package/dist/esm/run.mjs.map +1 -1
package/dist/types/graphs/MultiAgentGraph.d.ts +17 -0
package/package.json +1 -1
package/src/graphs/Graph.ts +12 -1
package/src/graphs/MultiAgentGraph.ts +105 -1
package/src/graphs/__tests__/multi-agent-delegate.test.ts +191 -0
package/src/llm/bedrock/index.ts +17 -0
package/src/run.ts +20 -11
package/src/scripts/test-bedrock-handoff-autonomous.ts +231 -0
package/src/agents/AgentContext.js +0 -782
package/src/agents/AgentContext.test.js +0 -421
package/src/agents/__tests__/AgentContext.test.js +0 -678
package/src/agents/__tests__/resolveStructuredOutputMode.test.js +0 -117
package/src/common/enum.js +0 -192
package/src/common/index.js +0 -3
package/src/events.js +0 -166
package/src/graphs/Graph.js +0 -1857
package/src/graphs/MultiAgentGraph.js +0 -1092
package/src/graphs/__tests__/structured-output.integration.test.js +0 -624
package/src/graphs/__tests__/structured-output.test.js +0 -144
package/src/graphs/contextManagement.e2e.test.js +0 -718
package/src/graphs/contextManagement.test.js +0 -485
package/src/graphs/handoffValidation.test.js +0 -276
package/src/graphs/index.js +0 -3
package/src/index.js +0 -28
package/src/instrumentation.js +0 -21
package/src/llm/anthropic/index.js +0 -319
package/src/llm/anthropic/types.js +0 -46
package/src/llm/anthropic/utils/message_inputs.js +0 -627
package/src/llm/anthropic/utils/message_outputs.js +0 -290
package/src/llm/anthropic/utils/output_parsers.js +0 -89
package/src/llm/anthropic/utils/tools.js +0 -25
package/src/llm/bedrock/__tests__/bedrock-caching.test.js +0 -392
package/src/llm/bedrock/index.js +0 -303
package/src/llm/bedrock/types.js +0 -2
package/src/llm/bedrock/utils/index.js +0 -6
package/src/llm/bedrock/utils/message_inputs.js +0 -463
package/src/llm/bedrock/utils/message_outputs.js +0 -269
package/src/llm/fake.js +0 -92
package/src/llm/google/index.js +0 -215
package/src/llm/google/types.js +0 -12
package/src/llm/google/utils/common.js +0 -670
package/src/llm/google/utils/tools.js +0 -111
package/src/llm/google/utils/zod_to_genai_parameters.js +0 -47
package/src/llm/openai/index.js +0 -1033
package/src/llm/openai/types.js +0 -2
package/src/llm/openai/utils/index.js +0 -756
package/src/llm/openai/utils/isReasoningModel.test.js +0 -79
package/src/llm/openrouter/index.js +0 -261
package/src/llm/openrouter/reasoning.test.js +0 -181
package/src/llm/providers.js +0 -36
package/src/llm/text.js +0 -65
package/src/llm/vertexai/index.js +0 -402
package/src/messages/__tests__/tools.test.js +0 -392
package/src/messages/cache.js +0 -404
package/src/messages/cache.test.js +0 -1167
package/src/messages/content.js +0 -48
package/src/messages/content.test.js +0 -314
package/src/messages/core.js +0 -359
package/src/messages/ensureThinkingBlock.test.js +0 -997
package/src/messages/format.js +0 -973
package/src/messages/formatAgentMessages.test.js +0 -2278
package/src/messages/formatAgentMessages.tools.test.js +0 -362
package/src/messages/formatMessage.test.js +0 -608
package/src/messages/ids.js +0 -18
package/src/messages/index.js +0 -9
package/src/messages/labelContentByAgent.test.js +0 -725
package/src/messages/prune.js +0 -438
package/src/messages/reducer.js +0 -60
package/src/messages/shiftIndexTokenCountMap.test.js +0 -63
package/src/messages/summarize.js +0 -146
package/src/messages/summarize.test.js +0 -332
package/src/messages/tools.js +0 -90
package/src/mockStream.js +0 -81
package/src/prompts/collab.js +0 -7
package/src/prompts/index.js +0 -3
package/src/prompts/taskmanager.js +0 -58
package/src/run.js +0 -427
package/src/schemas/index.js +0 -3
package/src/schemas/schema-preparation.test.js +0 -370
package/src/schemas/validate.js +0 -314
package/src/schemas/validate.test.js +0 -264
package/src/scripts/abort.js +0 -127
package/src/scripts/ant_web_search.js +0 -130
package/src/scripts/ant_web_search_edge_case.js +0 -133
package/src/scripts/ant_web_search_error_edge_case.js +0 -119
package/src/scripts/args.js +0 -41
package/src/scripts/bedrock-cache-debug.js +0 -186
package/src/scripts/bedrock-content-aggregation-test.js +0 -195
package/src/scripts/bedrock-merge-test.js +0 -80
package/src/scripts/bedrock-parallel-tools-test.js +0 -150
package/src/scripts/caching.js +0 -106
package/src/scripts/cli.js +0 -152
package/src/scripts/cli2.js +0 -119
package/src/scripts/cli3.js +0 -163
package/src/scripts/cli4.js +0 -165
package/src/scripts/cli5.js +0 -165
package/src/scripts/code_exec.js +0 -171
package/src/scripts/code_exec_files.js +0 -180
package/src/scripts/code_exec_multi_session.js +0 -185
package/src/scripts/code_exec_ptc.js +0 -265
package/src/scripts/code_exec_session.js +0 -217
package/src/scripts/code_exec_simple.js +0 -120
package/src/scripts/content.js +0 -111
package/src/scripts/empty_input.js +0 -125
package/src/scripts/handoff-test.js +0 -96
package/src/scripts/image.js +0 -138
package/src/scripts/memory.js +0 -83
package/src/scripts/multi-agent-chain.js +0 -271
package/src/scripts/multi-agent-conditional.js +0 -185
package/src/scripts/multi-agent-document-review-chain.js +0 -171
package/src/scripts/multi-agent-hybrid-flow.js +0 -264
package/src/scripts/multi-agent-parallel-start.js +0 -214
package/src/scripts/multi-agent-parallel.js +0 -346
package/src/scripts/multi-agent-sequence.js +0 -184
package/src/scripts/multi-agent-supervisor.js +0 -324
package/src/scripts/multi-agent-test.js +0 -147
package/src/scripts/parallel-asymmetric-tools-test.js +0 -202
package/src/scripts/parallel-full-metadata-test.js +0 -176
package/src/scripts/parallel-tools-test.js +0 -256
package/src/scripts/programmatic_exec.js +0 -277
package/src/scripts/programmatic_exec_agent.js +0 -168
package/src/scripts/search.js +0 -118
package/src/scripts/sequential-full-metadata-test.js +0 -143
package/src/scripts/simple.js +0 -174
package/src/scripts/single-agent-metadata-test.js +0 -152
package/src/scripts/stream.js +0 -113
package/src/scripts/test-custom-prompt-key.js +0 -132
package/src/scripts/test-handoff-input.js +0 -143
package/src/scripts/test-handoff-preamble.js +0 -227
package/src/scripts/test-handoff-steering.js +0 -353
package/src/scripts/test-multi-agent-list-handoff.js +0 -318
package/src/scripts/test-parallel-agent-labeling.js +0 -253
package/src/scripts/test-parallel-handoffs.js +0 -229
package/src/scripts/test-thinking-handoff-bedrock.js +0 -132
package/src/scripts/test-thinking-handoff.js +0 -132
package/src/scripts/test-thinking-to-thinking-handoff-bedrock.js +0 -140
package/src/scripts/test-tool-before-handoff-role-order.js +0 -223
package/src/scripts/test-tools-before-handoff.js +0 -187
package/src/scripts/test_code_api.js +0 -263
package/src/scripts/thinking-bedrock.js +0 -128
package/src/scripts/thinking-vertexai.js +0 -130
package/src/scripts/thinking.js +0 -134
package/src/scripts/tool_search.js +0 -114
package/src/scripts/tools.js +0 -125
package/src/specs/agent-handoffs-bedrock.integration.test.js +0 -280
package/src/specs/agent-handoffs.test.js +0 -924
package/src/specs/anthropic.simple.test.js +0 -287
package/src/specs/azure.simple.test.js +0 -381
package/src/specs/cache.simple.test.js +0 -282
package/src/specs/custom-event-await.test.js +0 -148
package/src/specs/deepseek.simple.test.js +0 -189
package/src/specs/emergency-prune.test.js +0 -308
package/src/specs/moonshot.simple.test.js +0 -237
package/src/specs/observability.integration.test.js +0 -1337
package/src/specs/openai.simple.test.js +0 -233
package/src/specs/openrouter.simple.test.js +0 -202
package/src/specs/prune.test.js +0 -733
package/src/specs/reasoning.test.js +0 -144
package/src/specs/spec.utils.js +0 -4
package/src/specs/thinking-handoff.test.js +0 -486
package/src/specs/thinking-prune.test.js +0 -600
package/src/specs/token-distribution-edge-case.test.js +0 -246
package/src/specs/token-memoization.test.js +0 -32
package/src/specs/tokens.test.js +0 -49
package/src/specs/tool-error.test.js +0 -139
package/src/splitStream.js +0 -204
package/src/splitStream.test.js +0 -504
package/src/stream.js +0 -650
package/src/stream.test.js +0 -225
package/src/test/mockTools.js +0 -340
package/src/tools/BrowserTools.js +0 -245
package/src/tools/Calculator.js +0 -38
package/src/tools/Calculator.test.js +0 -225
package/src/tools/CodeExecutor.js +0 -233
package/src/tools/ProgrammaticToolCalling.js +0 -602
package/src/tools/StreamingToolCallBuffer.js +0 -179
package/src/tools/ToolNode.js +0 -930
package/src/tools/ToolSearch.js +0 -904
package/src/tools/__tests__/BrowserTools.test.js +0 -306
package/src/tools/__tests__/ProgrammaticToolCalling.integration.test.js +0 -276
package/src/tools/__tests__/ProgrammaticToolCalling.test.js +0 -807
package/src/tools/__tests__/StreamingToolCallBuffer.test.js +0 -175
package/src/tools/__tests__/ToolApproval.test.js +0 -675
package/src/tools/__tests__/ToolNode.recovery.test.js +0 -200
package/src/tools/__tests__/ToolNode.session.test.js +0 -319
package/src/tools/__tests__/ToolSearch.integration.test.js +0 -125
package/src/tools/__tests__/ToolSearch.test.js +0 -812
package/src/tools/__tests__/handlers.test.js +0 -799
package/src/tools/__tests__/truncation-recovery.integration.test.js +0 -362
package/src/tools/handlers.js +0 -306
package/src/tools/schema.js +0 -25
package/src/tools/search/anthropic.js +0 -34
package/src/tools/search/content.js +0 -116
package/src/tools/search/content.test.js +0 -133
package/src/tools/search/firecrawl.js +0 -173
package/src/tools/search/format.js +0 -198
package/src/tools/search/highlights.js +0 -241
package/src/tools/search/index.js +0 -3
package/src/tools/search/jina-reranker.test.js +0 -106
package/src/tools/search/rerankers.js +0 -165
package/src/tools/search/schema.js +0 -102
package/src/tools/search/search.js +0 -561
package/src/tools/search/serper-scraper.js +0 -126
package/src/tools/search/test.js +0 -129
package/src/tools/search/tool.js +0 -453
package/src/tools/search/types.js +0 -2
package/src/tools/search/utils.js +0 -59
package/src/types/graph.js +0 -24
package/src/types/graph.test.js +0 -192
package/src/types/index.js +0 -7
package/src/types/llm.js +0 -2
package/src/types/messages.js +0 -2
package/src/types/run.js +0 -2
package/src/types/stream.js +0 -2
package/src/types/tools.js +0 -2
package/src/utils/contextAnalytics.js +0 -79
package/src/utils/contextAnalytics.test.js +0 -166
package/src/utils/events.js +0 -26
package/src/utils/graph.js +0 -11
package/src/utils/handlers.js +0 -65
package/src/utils/index.js +0 -10
package/src/utils/llm.js +0 -21
package/src/utils/llmConfig.js +0 -205
package/src/utils/logging.js +0 -37
package/src/utils/misc.js +0 -51
package/src/utils/run.js +0 -69
package/src/utils/schema.js +0 -21
package/src/utils/title.js +0 -119
package/src/utils/tokens.js +0 -92
package/src/utils/toonFormat.js +0 -379

package/src/tools/__tests__/truncation-recovery.integration.test.js DELETED Viewed

@@ -1,362 +0,0 @@
-/**
- * Integration test: Full Truncation Recovery Pipeline
- *
- * Tests the end-to-end flow that would catch the Bedrock buffer bug:
- *   Streaming chunks → handleToolCallChunks → StreamingToolCallBuffer → handleToolCalls → ToolNode.recoverTruncatedArgs → tool receives recovered args
- *
- * Uses real StreamingToolCallBuffer (not mocked) and real ToolNode with real tool definitions.
- * Only the graph dispatch layer is mocked (since we're not testing SSE dispatch).
- *
- * Verified against live Bedrock API output (see bedrock-live-poc.ts):
- *   START chunk: { id, name, index, args: "" }
- *   DELTA chunks: { args, index } — NO id, NO name
- */
-import { z } from 'zod';
-import { tool } from '@langchain/core/tools';
-import { AIMessage } from '@langchain/core/messages';
-import { describe, it, expect, beforeEach, jest } from '@jest/globals';
-import { StepTypes } from '@/common';
-import { StreamingToolCallBuffer } from '../StreamingToolCallBuffer';
-import { handleToolCallChunks } from '../handlers';
-import { ToolNode } from '../ToolNode';
-// ---------------------------------------------------------------------------
-// Helpers
-// ---------------------------------------------------------------------------
-/** Creates a mock graph that delegates buffer operations to a REAL StreamingToolCallBuffer */
-function createIntegrationGraph(buffer) {
-    let stepCounter = 0;
-    return {
-        getStepKey: jest.fn().mockReturnValue('step-key'),
-        getStepIdByKey: jest.fn().mockReturnValue('prev-step-id'),
-        getRunStep: jest.fn().mockReturnValue({
-            type: StepTypes.MESSAGE_CREATION,
-            id: 'prev-step-id',
-            index: 0,
-            stepDetails: { type: StepTypes.MESSAGE_CREATION, message_creation: { message_id: 'msg-1' } },
-            usage: null,
-        }),
-        dispatchRunStep: jest.fn()
-            .mockImplementation(async () => `step-${++stepCounter}`),
-        dispatchRunStepDelta: jest.fn().mockResolvedValue(undefined),
-        toolCallStepIds: new Map(),
-        messageStepHasToolCalls: new Map(),
-        messageIdsByStepKey: new Map(),
-        prelimMessageIdsByStepKey: new Map(),
-        streamingToolCallBuffer: buffer, // REAL buffer, not mocked
-    };
-}
-/** Creates a tool that captures received args for assertion */
-function createCaptureTool(name, schema, capturedArgs) {
-    return tool(async (input) => {
-        capturedArgs.push({ ...input });
-        return `OK`;
-    }, { name, description: `Test tool: ${name}`, schema });
-}
-/** Simulates Bedrock streaming: START chunk with {id, name, index, args:""}, then DELTA chunks with {args, index} */
-function simulateBedrockChunks(toolCallId, toolName, index, argsJson, chunkSize = 30) {
-    const chunks = [];
-    // START chunk: id + name + index, args="" (verified from live Bedrock API)
-    chunks.push({
-        id: toolCallId,
-        name: toolName,
-        index,
-        args: '',
-        type: 'tool_call_chunk',
-    });
-    // DELTA chunks: args + index, NO id, NO name (verified from live Bedrock API)
-    for (let i = 0; i < argsJson.length; i += chunkSize) {
-        chunks.push({
-            id: undefined,
-            name: undefined,
-            index,
-            args: argsJson.substring(i, i + chunkSize),
-            type: 'tool_call_chunk',
-        });
-    }
-    return chunks;
-}
-/** Simulates OpenAI/Anthropic streaming: every chunk has {id, args} */
-function simulateOpenAIChunks(toolCallId, toolName, index, argsJson, chunkSize = 30) {
-    const chunks = [];
-    // First chunk: id + name + first args fragment
-    const firstArgs = argsJson.substring(0, chunkSize);
-    chunks.push({
-        id: toolCallId,
-        name: toolName,
-        index,
-        args: firstArgs,
-        type: 'tool_call_chunk',
-    });
-    // Subsequent chunks: id + args (OpenAI sends id on every chunk)
-    for (let i = chunkSize; i < argsJson.length; i += chunkSize) {
-        chunks.push({
-            id: toolCallId,
-            name: undefined,
-            index,
-            args: argsJson.substring(i, i + chunkSize),
-            type: 'tool_call_chunk',
-        });
-    }
-    return chunks;
-}
-const contentToolSchema = z.object({
-    action: z.string(),
-    filename: z.string().optional(),
-    content: z.string().optional(),
-});
-const codeExecutorSchema = z.object({
-    code: z.string(),
-    language: z.string().optional(),
-});
-// ---------------------------------------------------------------------------
-// Tests
-// ---------------------------------------------------------------------------
-describe('Truncation Recovery Pipeline (Integration)', () => {
-    let buffer;
-    beforeEach(() => {
-        buffer = new StreamingToolCallBuffer();
-    });
-    it('Bedrock truncated write — full pipeline recovery', async () => {
-        const capturedArgs = [];
-        const graph = createIntegrationGraph(buffer);
-        // Full args JSON that Bedrock would stream (including content)
-        const fullArgsJson = '{"action":"write","filename":"app.tsx","content":"import React from \\"react\\";\\nexport default function App() {\\n  return <div>Hello World</div>;\\n}"}';
-        // Simulate Bedrock streaming: START + DELTA chunks
-        const chunks = simulateBedrockChunks('tooluse_abc', 'content_tool', 0, fullArgsJson, 20);
-        // Feed all chunks through handleToolCallChunks (real buffer accumulation)
-        for (const chunk of chunks) {
-            await handleToolCallChunks({
-                graph: graph,
-                stepKey: 'step-key',
-                toolCallChunks: [chunk],
-                metadata: { run_id: 'test' },
-            });
-        }
-        // Verify buffer was populated
-        expect(buffer.has('tooluse_abc')).toBe(true);
-        expect(buffer.getRawArgs('tooluse_abc')).toBe(fullArgsJson);
-        // Simulate truncation: parsePartialJson lost the content field
-        const truncatedArgs = { action: 'write', filename: 'app.tsx' }; // content MISSING
-        // Create ToolNode with real buffer
-        const contentTool = createCaptureTool('content_tool', contentToolSchema, capturedArgs);
-        const toolNode = new ToolNode({
-            tools: [contentTool],
-            streamingToolCallBuffer: buffer,
-        });
-        // Invoke ToolNode with truncated args
-        const aiMsg = new AIMessage({
-            content: '',
-            tool_calls: [{ id: 'tooluse_abc', name: 'content_tool', args: truncatedArgs }],
-        });
-        await toolNode.invoke({ messages: [aiMsg] });
-        // Assert: tool received RECOVERED content, not truncated
-        expect(capturedArgs).toHaveLength(1);
-        expect(capturedArgs[0].action).toBe('write');
-        expect(capturedArgs[0].filename).toBe('app.tsx');
-        expect(capturedArgs[0].content).toBe('import React from "react";\nexport default function App() {\n  return <div>Hello World</div>;\n}');
-    });
-    it('OpenAI/Anthropic chunked write — full pipeline recovery', async () => {
-        const capturedArgs = [];
-        const graph = createIntegrationGraph(buffer);
-        const fullArgsJson = '{"action":"write","filename":"test.tsx","content":"const x = 42;\\nconst y = 100;"}';
-        const chunks = simulateOpenAIChunks('tc_openai', 'content_tool', 0, fullArgsJson, 15);
-        for (const chunk of chunks) {
-            await handleToolCallChunks({
-                graph: graph,
-                stepKey: 'step-key',
-                toolCallChunks: [chunk],
-                metadata: { run_id: 'test' },
-            });
-        }
-        expect(buffer.has('tc_openai')).toBe(true);
-        expect(buffer.getRawArgs('tc_openai')).toBe(fullArgsJson);
-        // Simulate truncation: content missing
-        const contentTool = createCaptureTool('content_tool', contentToolSchema, capturedArgs);
-        const toolNode = new ToolNode({
-            tools: [contentTool],
-            streamingToolCallBuffer: buffer,
-        });
-        const aiMsg = new AIMessage({
-            content: '',
-            tool_calls: [{ id: 'tc_openai', name: 'content_tool', args: { action: 'write', filename: 'test.tsx' } }],
-        });
-        await toolNode.invoke({ messages: [aiMsg] });
-        expect(capturedArgs[0].content).toBe('const x = 42;\nconst y = 100;');
-    });
-    it('multiple parallel tool calls — no cross-contamination', async () => {
-        const capturedArgs = [];
-        const graph = createIntegrationGraph(buffer);
-        // Two parallel tool calls with different indexes
-        const args1 = '{"action":"write","filename":"a.tsx","content":"file A content"}';
-        const args2 = '{"action":"write","filename":"b.tsx","content":"file B content"}';
-        const chunks1 = simulateBedrockChunks('tc_1', 'content_tool', 0, args1, 15);
-        const chunks2 = simulateBedrockChunks('tc_2', 'content_tool', 1, args2, 15);
-        // Interleave chunks (realistic concurrent streaming)
-        const interleaved = [];
-        const maxLen = Math.max(chunks1.length, chunks2.length);
-        for (let i = 0; i < maxLen; i++) {
-            if (i < chunks1.length)
-                interleaved.push(chunks1[i]);
-            if (i < chunks2.length)
-                interleaved.push(chunks2[i]);
-        }
-        for (const chunk of interleaved) {
-            await handleToolCallChunks({
-                graph: graph,
-                stepKey: 'step-key',
-                toolCallChunks: [chunk],
-                metadata: { run_id: 'test' },
-            });
-        }
-        expect(buffer.getRawArgs('tc_1')).toBe(args1);
-        expect(buffer.getRawArgs('tc_2')).toBe(args2);
-        const contentTool = createCaptureTool('content_tool', contentToolSchema, capturedArgs);
-        const toolNode = new ToolNode({
-            tools: [contentTool],
-            streamingToolCallBuffer: buffer,
-        });
-        // Only tc_1 is truncated (missing content), tc_2 has all fields
-        const aiMsg = new AIMessage({
-            content: '',
-            tool_calls: [
-                { id: 'tc_1', name: 'content_tool', args: { action: 'write', filename: 'a.tsx' } }, // truncated
-                { id: 'tc_2', name: 'content_tool', args: { action: 'write', filename: 'b.tsx', content: 'file B content' } }, // complete
-            ],
-        });
-        await toolNode.invoke({ messages: [aiMsg] });
-        expect(capturedArgs).toHaveLength(2);
-        // tc_1: content recovered from buffer
-        expect(capturedArgs[0].content).toBe('file A content');
-        // tc_2: content unchanged (already present in parsed args)
-        expect(capturedArgs[1].content).toBe('file B content');
-    });
-    it('buffer cleanup after recovery — no stale data', async () => {
-        const capturedArgs = [];
-        const graph = createIntegrationGraph(buffer);
-        const fullArgs = '{"action":"write","filename":"x.tsx","content":"test"}';
-        const chunks = simulateBedrockChunks('tc_cleanup', 'content_tool', 0, fullArgs);
-        for (const chunk of chunks) {
-            await handleToolCallChunks({
-                graph: graph,
-                stepKey: 'step-key',
-                toolCallChunks: [chunk],
-                metadata: { run_id: 'test' },
-            });
-        }
-        expect(buffer.has('tc_cleanup')).toBe(true);
-        const contentTool = createCaptureTool('content_tool', contentToolSchema, capturedArgs);
-        const toolNode = new ToolNode({
-            tools: [contentTool],
-            streamingToolCallBuffer: buffer,
-        });
-        const aiMsg = new AIMessage({
-            content: '',
-            tool_calls: [{ id: 'tc_cleanup', name: 'content_tool', args: { action: 'write' } }],
-        });
-        await toolNode.invoke({ messages: [aiMsg] });
-        // Buffer should be cleared after processing
-        expect(buffer.has('tc_cleanup')).toBe(false);
-        expect(buffer.getRawArgs('tc_cleanup')).toBeUndefined();
-    });
-    it('no truncation — buffer populated but not used for overwrite', async () => {
-        const capturedArgs = [];
-        const graph = createIntegrationGraph(buffer);
-        const fullArgs = '{"action":"read","filename":"existing.tsx"}';
-        const chunks = simulateBedrockChunks('tc_complete', 'content_tool', 0, fullArgs);
-        for (const chunk of chunks) {
-            await handleToolCallChunks({
-                graph: graph,
-                stepKey: 'step-key',
-                toolCallChunks: [chunk],
-                metadata: { run_id: 'test' },
-            });
-        }
-        const contentTool = createCaptureTool('content_tool', contentToolSchema, capturedArgs);
-        const toolNode = new ToolNode({
-            tools: [contentTool],
-            streamingToolCallBuffer: buffer,
-        });
-        // Complete args — nothing missing
-        const aiMsg = new AIMessage({
-            content: '',
-            tool_calls: [{ id: 'tc_complete', name: 'content_tool', args: { action: 'read', filename: 'existing.tsx' } }],
-        });
-        await toolNode.invoke({ messages: [aiMsg] });
-        expect(capturedArgs[0].action).toBe('read');
-        expect(capturedArgs[0].filename).toBe('existing.tsx');
-        // No content field in args or buffer — should stay absent
-        expect(capturedArgs[0]).not.toHaveProperty('content');
-    });
-    it('generic tool recovery — non-content_tool (code_executor)', async () => {
-        const capturedArgs = [];
-        const graph = createIntegrationGraph(buffer);
-        const largeCode = 'function fibonacci(n) {\\n  if (n <= 1) return n;\\n  return fibonacci(n-1) + fibonacci(n-2);\\n}\\nconsole.log(fibonacci(10));';
-        const fullArgs = `{"code":"${largeCode}","language":"javascript"}`;
-        const chunks = simulateBedrockChunks('tc_code', 'execute_code', 0, fullArgs, 20);
-        for (const chunk of chunks) {
-            await handleToolCallChunks({
-                graph: graph,
-                stepKey: 'step-key',
-                toolCallChunks: [chunk],
-                metadata: { run_id: 'test' },
-            });
-        }
-        const codeTool = createCaptureTool('execute_code', codeExecutorSchema, capturedArgs);
-        const toolNode = new ToolNode({
-            tools: [codeTool],
-            streamingToolCallBuffer: buffer,
-        });
-        // Truncated: only has language, code is missing
-        const aiMsg = new AIMessage({
-            content: '',
-            tool_calls: [{ id: 'tc_code', name: 'execute_code', args: { language: 'javascript' } }],
-        });
-        await toolNode.invoke({ messages: [aiMsg] });
-        expect(capturedArgs[0].code).toContain('fibonacci');
-        expect(capturedArgs[0].language).toBe('javascript');
-    });
-    it('Bedrock large content (5000+ chars) — recovery preserves full content', async () => {
-        const capturedArgs = [];
-        const graph = createIntegrationGraph(buffer);
-        // Generate large content (simulating a real dashboard component)
-        const lines = [];
-        lines.push('import React from \\"react\\";');
-        lines.push('import { useState, useEffect } from \\"react\\";');
-        for (let i = 0; i < 100; i++) {
-            lines.push(`// Component section ${i}`);
-            lines.push(`const Section${i} = () => <div>Section ${i}</div>;`);
-        }
-        lines.push('export default function Dashboard() {');
-        lines.push('  return <div>Dashboard</div>;');
-        lines.push('}');
-        const content = lines.join('\\n');
-        const fullArgs = `{"action":"write","filename":"dashboard.tsx","content":"${content}"}`;
-        const chunks = simulateBedrockChunks('tc_large', 'content_tool', 0, fullArgs, 50);
-        for (const chunk of chunks) {
-            await handleToolCallChunks({
-                graph: graph,
-                stepKey: 'step-key',
-                toolCallChunks: [chunk],
-                metadata: { run_id: 'test' },
-            });
-        }
-        const contentTool = createCaptureTool('content_tool', contentToolSchema, capturedArgs);
-        const toolNode = new ToolNode({
-            tools: [contentTool],
-            streamingToolCallBuffer: buffer,
-        });
-        // Completely empty args (truncation wiped everything)
-        const aiMsg = new AIMessage({
-            content: '',
-            tool_calls: [{ id: 'tc_large', name: 'content_tool', args: {} }],
-        });
-        await toolNode.invoke({ messages: [aiMsg] });
-        expect(capturedArgs[0].action).toBe('write');
-        expect(capturedArgs[0].filename).toBe('dashboard.tsx');
-        const recoveredContent = capturedArgs[0].content;
-        expect(recoveredContent).toContain('import React from "react"');
-        expect(recoveredContent).toContain('Section 99');
-        expect(recoveredContent).toContain('export default function Dashboard()');
-    });
-});
-//# sourceMappingURL=truncation-recovery.integration.test.js.map

package/src/tools/handlers.js DELETED Viewed

@@ -1,306 +0,0 @@
-/* eslint-disable no-console */
-// src/tools/handlers.ts
-import { nanoid } from 'nanoid';
-import { ToolMessage } from '@langchain/core/messages';
-import { ToolCallTypes, GraphEvents, StepTypes, Providers, Constants, } from '@/common';
-import { coerceAnthropicSearchResults, isAnthropicWebSearchResult, } from '@/tools/search/anthropic';
-import { formatResultsForLLM } from '@/tools/search/format';
-import { getMessageId } from '@/messages';
-export async function handleToolCallChunks({ graph, stepKey, toolCallChunks, metadata, }) {
-    let prevStepId;
-    let prevRunStep;
-    try {
-        prevStepId = graph.getStepIdByKey(stepKey);
-        prevRunStep = graph.getRunStep(prevStepId);
-    }
-    catch {
-        /** Edge Case: If no previous step exists, create a new message creation step */
-        const message_id = getMessageId(stepKey, graph, true) ?? '';
-        prevStepId = await graph.dispatchRunStep(stepKey, {
-            type: StepTypes.MESSAGE_CREATION,
-            message_creation: {
-                message_id,
-            },
-        }, metadata);
-        prevRunStep = graph.getRunStep(prevStepId);
-    }
-    const _stepId = graph.getStepIdByKey(stepKey);
-    /** Edge Case: Tool Call Run Step or `tool_call_ids` never dispatched */
-    const tool_calls = prevStepId && prevRunStep && prevRunStep.type === StepTypes.MESSAGE_CREATION
-        ? []
-        : undefined;
-    /**
-     * Feed streaming tool call buffer — accumulate raw arg strings for truncation recovery.
-     *
-     * Provider chunk patterns:
-     * - OpenAI/Anthropic: every chunk has {id, args} → direct append
-     * - Bedrock: START chunk has {id, name, index}, DELTA chunks have {args, index} (no id)
-     *   → use index-to-id mapping to resolve the target buffer entry
-     */
-    for (const toolCallChunk of toolCallChunks) {
-        const chunkIndex = toolCallChunk.index;
-        // START chunk: has id (and usually name). Store index→id mapping for future DELTA chunks.
-        if (toolCallChunk.id) {
-            if (typeof chunkIndex === 'number') {
-                graph.streamingToolCallBuffer.setIndexMapping(chunkIndex, toolCallChunk.id);
-            }
-            if (toolCallChunk.name) {
-                graph.streamingToolCallBuffer.setToolName(toolCallChunk.id, toolCallChunk.name);
-            }
-            // Append args if present on the same chunk (OpenAI/Anthropic pattern)
-            if (toolCallChunk.args) {
-                graph.streamingToolCallBuffer.append(toolCallChunk.id, toolCallChunk.args);
-            }
-        }
-        else if (toolCallChunk.args && typeof chunkIndex === 'number') {
-            // DELTA chunk: no id, but has args + index. Resolve id via index mapping (Bedrock pattern).
-            const resolvedId = graph.streamingToolCallBuffer.getIdByIndex(chunkIndex);
-            if (resolvedId) {
-                graph.streamingToolCallBuffer.append(resolvedId, toolCallChunk.args);
-            }
-        }
-    }
-    /** Edge Case: `id` and `name` fields cannot be empty strings */
-    for (const toolCallChunk of toolCallChunks) {
-        if (toolCallChunk.name === '') {
-            toolCallChunk.name = undefined;
-        }
-        if (toolCallChunk.id === '') {
-            toolCallChunk.id = undefined;
-        }
-        else if (tool_calls != null &&
-            toolCallChunk.id != null &&
-            toolCallChunk.name != null) {
-            tool_calls.push({
-                args: {},
-                id: toolCallChunk.id,
-                name: toolCallChunk.name,
-                type: ToolCallTypes.TOOL_CALL,
-            });
-        }
-    }
-    let stepId = _stepId;
-    const alreadyDispatched = prevRunStep?.type === StepTypes.MESSAGE_CREATION &&
-        graph.messageStepHasToolCalls.has(prevStepId);
-    if (prevRunStep?.type === StepTypes.TOOL_CALLS) {
-        /**
-         * If previous step is already a tool_calls step, use that step ID
-         * This ensures tool call deltas are dispatched to the correct step
-         */
-        stepId = prevStepId;
-    }
-    else if (!alreadyDispatched &&
-        prevRunStep?.type === StepTypes.MESSAGE_CREATION) {
-        /**
-         * Create tool_calls step as soon as we receive the first tool call chunk
-         * This ensures deltas are always associated with the correct step
-         *
-         * NOTE: We do NOT dispatch an empty text block here because:
-         * - Empty text blocks cause providers (Anthropic, Bedrock) to reject messages
-         * - The tool_calls themselves are sufficient for the step
-         * - Empty content with tool_call_ids gets stored in conversation history
-         *   and causes "messages must have non-empty content" errors on replay
-         */
-        graph.messageStepHasToolCalls.set(prevStepId, true);
-        stepId = await graph.dispatchRunStep(stepKey, {
-            type: StepTypes.TOOL_CALLS,
-            tool_calls: tool_calls ?? [],
-        }, metadata);
-    }
-    await graph.dispatchRunStepDelta(stepId, {
-        type: StepTypes.TOOL_CALLS,
-        tool_calls: toolCallChunks,
-    });
-}
-export const handleToolCalls = async (toolCalls, metadata, graph) => {
-    if (!graph || !metadata) {
-        console.warn('Graph or metadata not found in `handleToolCalls`');
-        return;
-    }
-    if (!toolCalls) {
-        return;
-    }
-    if (toolCalls.length === 0) {
-        return;
-    }
-    const stepKey = graph.getStepKey(metadata);
-    /**
-     * Track whether we've already reused an empty TOOL_CALLS step created by
-     * handleToolCallChunks during streaming. Only reuse it once (for the first
-     * tool call); subsequent parallel tool calls must create their own steps.
-     */
-    let reusedChunkStepId;
-    for (const tool_call of toolCalls) {
-        const toolCallId = tool_call.id ?? `toolu_${nanoid()}`;
-        tool_call.id = toolCallId;
-        // If this tool call ID was already tracked via handleToolCallChunks,
-        // the step exists but may lack the name (Bedrock sends name only at model end).
-        // Dispatch a delta with the complete data so the client can fill in the name.
-        if (toolCallId && graph.toolCallStepIds.has(toolCallId)) {
-            const existingStepId = graph.toolCallStepIds.get(toolCallId);
-            if (existingStepId != null && existingStepId !== '') {
-                const argsStr = typeof tool_call.args === 'string'
-                    ? tool_call.args
-                    : JSON.stringify(tool_call.args);
-                await graph.dispatchRunStepDelta(existingStepId, {
-                    type: StepTypes.TOOL_CALLS,
-                    tool_calls: [{ name: tool_call.name, args: argsStr, id: toolCallId }],
-                });
-            }
-            continue;
-        }
-        let prevStepId = '';
-        let prevRunStep;
-        try {
-            prevStepId = graph.getStepIdByKey(stepKey);
-            prevRunStep = graph.getRunStep(prevStepId);
-        }
-        catch {
-            // no previous step
-        }
-        // If the previous step is TOOL_CALLS (created by handleToolCallChunks),
-        // either reuse it (if empty) or dispatch a new TOOL_CALLS step directly —
-        // skip the intermediate MESSAGE_CREATION to avoid orphaned gaps.
-        if (prevRunStep?.type === StepTypes.TOOL_CALLS) {
-            const details = prevRunStep.stepDetails;
-            const isEmpty = !details.tool_calls || details.tool_calls.length === 0;
-            if (isEmpty && prevStepId !== reusedChunkStepId) {
-                graph.toolCallStepIds.set(toolCallId, prevStepId);
-                reusedChunkStepId = prevStepId;
-                continue;
-            }
-            await graph.dispatchRunStep(stepKey, { type: StepTypes.TOOL_CALLS, tool_calls: [tool_call] }, metadata);
-            continue;
-        }
-        /**
-         * NOTE: We do NOT dispatch empty text blocks with tool_call_ids because:
-         * - Empty text blocks cause providers (Anthropic, Bedrock) to reject messages
-         * - They get stored in conversation history and cause errors on replay:
-         *   "messages must have non-empty content" (Anthropic)
-         *   "The content field in the Message object is empty" (Bedrock)
-         * - The tool_calls themselves are sufficient
-         */
-        /* If the previous step exists and is a message creation */
-        if (prevStepId && prevRunStep) {
-            graph.messageStepHasToolCalls.set(prevStepId, true);
-            /* If the previous step doesn't exist */
-        }
-        else if (!prevRunStep) {
-            const messageId = getMessageId(stepKey, graph, true) ?? '';
-            const stepId = await graph.dispatchRunStep(stepKey, {
-                type: StepTypes.MESSAGE_CREATION,
-                message_creation: {
-                    message_id: messageId,
-                },
-            }, metadata);
-            graph.messageStepHasToolCalls.set(stepId, true);
-        }
-        await graph.dispatchRunStep(stepKey, {
-            type: StepTypes.TOOL_CALLS,
-            tool_calls: [tool_call],
-        }, metadata);
-    }
-};
-export const toolResultTypes = new Set([ // `type` strings classed as tool results; presumably content-part types, confirm against callers
-    // 'tool_use',          (commented out: not a member of the set)
-    // 'server_tool_use',   (commented out: not a member of the set)
-    // 'input_json_delta',  (commented out: not a member of the set)
-    'tool_result',
-    'web_search_result',
-    'web_search_tool_result',
-]);
-/**
- * Handles the result of a server tool call; in other words, a provider's built-in tool.
- * As of 2025-07-06, only Anthropic handles server tool calls with this pattern.
- */
-export async function handleServerToolResult({ graph, content, metadata, agentContext, }) {
-    let skipHandling = false;
-    if (agentContext?.provider !== Providers.ANTHROPIC) {
-        return skipHandling;
-    }
-    if (typeof content === 'string' ||
-        content == null ||
-        content.length === 0 ||
-        (content.length === 1 &&
-            content[0].tool_use_id == null)) {
-        return skipHandling;
-    }
-    for (const contentPart of content) {
-        const toolUseId = contentPart.tool_use_id;
-        if (toolUseId == null || toolUseId === '') {
-            continue;
-        }
-        const stepId = graph.toolCallStepIds.get(toolUseId);
-        if (stepId == null || stepId === '') {
-            console.warn(`Tool use ID ${toolUseId} not found in graph, cannot dispatch tool result.`);
-            continue;
-        }
-        const runStep = graph.getRunStep(stepId);
-        if (!runStep) {
-            console.warn(`Run step for ${stepId} does not exist, cannot dispatch tool result.`);
-            continue;
-        }
-        else if (runStep.type !== StepTypes.TOOL_CALLS) {
-            console.warn(`Run step for ${stepId} is not a tool call step, cannot dispatch tool result.`);
-            continue;
-        }
-        const toolCall = runStep.stepDetails.type === StepTypes.TOOL_CALLS
-            ? runStep.stepDetails.tool_calls?.find((toolCall) => toolCall.id === toolUseId)
-            : undefined;
-        if (!toolCall) {
-            continue;
-        }
-        if (contentPart.type === 'web_search_result' ||
-            contentPart.type === 'web_search_tool_result') {
-            await handleAnthropicSearchResults({
-                contentPart: contentPart,
-                toolCall,
-                metadata,
-                graph,
-            });
-        }
-        if (!skipHandling) {
-            skipHandling = true;
-        }
-    }
-    return skipHandling;
-}
-async function handleAnthropicSearchResults({ contentPart, toolCall, metadata, graph, }) {
-    if (!Array.isArray(contentPart.content)) {
-        console.warn(`Expected content to be an array, got ${typeof contentPart.content}`);
-        return;
-    }
-    if (!isAnthropicWebSearchResult(contentPart.content[0])) {
-        console.warn(`Expected content to be an Anthropic web search result, got ${JSON.stringify(contentPart.content)}`);
-        return;
-    }
-    const turn = graph.invokedToolIds?.size ?? 0;
-    const searchResultData = coerceAnthropicSearchResults({
-        turn,
-        results: contentPart.content,
-    });
-    const name = toolCall.name;
-    const input = toolCall.args ?? {};
-    const artifact = {
-        [Constants.WEB_SEARCH]: searchResultData,
-    };
-    const { output: formattedOutput } = formatResultsForLLM(turn, searchResultData);
-    const output = new ToolMessage({
-        name,
-        artifact,
-        content: formattedOutput,
-        tool_call_id: toolCall.id,
-    });
-    const toolEndData = {
-        input,
-        output,
-    };
-    await graph.handlerRegistry
-        ?.getHandler(GraphEvents.TOOL_END)
-        ?.handle(GraphEvents.TOOL_END, toolEndData, metadata, graph);
-    if (graph.invokedToolIds == null) {
-        graph.invokedToolIds = new Set();
-    }
-    graph.invokedToolIds.add(toolCall.id);
-}
-//# sourceMappingURL=handlers.js.map