npm - @illuma-ai/agents - Versions diffs - 1.1.21 → 1.1.22 - Mend

@illuma-ai/agents 1.1.21 → 1.1.22

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (241)

package/dist/cjs/graphs/Graph.cjs +12 -1
package/dist/cjs/graphs/Graph.cjs.map +1 -1
package/dist/cjs/graphs/MultiAgentGraph.cjs +85 -1
package/dist/cjs/graphs/MultiAgentGraph.cjs.map +1 -1
package/dist/cjs/run.cjs +20 -9
package/dist/cjs/run.cjs.map +1 -1
package/dist/esm/graphs/Graph.mjs +12 -1
package/dist/esm/graphs/Graph.mjs.map +1 -1
package/dist/esm/graphs/MultiAgentGraph.mjs +85 -1
package/dist/esm/graphs/MultiAgentGraph.mjs.map +1 -1
package/dist/esm/run.mjs +20 -9
package/dist/esm/run.mjs.map +1 -1
package/dist/types/graphs/MultiAgentGraph.d.ts +17 -0
package/package.json +1 -1
package/src/graphs/Graph.ts +12 -1
package/src/graphs/MultiAgentGraph.ts +105 -1
package/src/graphs/__tests__/multi-agent-delegate.test.ts +191 -0
package/src/run.ts +20 -11
package/src/scripts/test-bedrock-handoff-autonomous.ts +231 -0
package/src/agents/AgentContext.js +0 -782
package/src/agents/AgentContext.test.js +0 -421
package/src/agents/__tests__/AgentContext.test.js +0 -678
package/src/agents/__tests__/resolveStructuredOutputMode.test.js +0 -117
package/src/common/enum.js +0 -192
package/src/common/index.js +0 -3
package/src/events.js +0 -166
package/src/graphs/Graph.js +0 -1857
package/src/graphs/MultiAgentGraph.js +0 -1092
package/src/graphs/__tests__/structured-output.integration.test.js +0 -624
package/src/graphs/__tests__/structured-output.test.js +0 -144
package/src/graphs/contextManagement.e2e.test.js +0 -718
package/src/graphs/contextManagement.test.js +0 -485
package/src/graphs/handoffValidation.test.js +0 -276
package/src/graphs/index.js +0 -3
package/src/index.js +0 -28
package/src/instrumentation.js +0 -21
package/src/llm/anthropic/index.js +0 -319
package/src/llm/anthropic/types.js +0 -46
package/src/llm/anthropic/utils/message_inputs.js +0 -627
package/src/llm/anthropic/utils/message_outputs.js +0 -290
package/src/llm/anthropic/utils/output_parsers.js +0 -89
package/src/llm/anthropic/utils/tools.js +0 -25
package/src/llm/bedrock/__tests__/bedrock-caching.test.js +0 -392
package/src/llm/bedrock/index.js +0 -303
package/src/llm/bedrock/types.js +0 -2
package/src/llm/bedrock/utils/index.js +0 -6
package/src/llm/bedrock/utils/message_inputs.js +0 -463
package/src/llm/bedrock/utils/message_outputs.js +0 -269
package/src/llm/fake.js +0 -92
package/src/llm/google/index.js +0 -215
package/src/llm/google/types.js +0 -12
package/src/llm/google/utils/common.js +0 -670
package/src/llm/google/utils/tools.js +0 -111
package/src/llm/google/utils/zod_to_genai_parameters.js +0 -47
package/src/llm/openai/index.js +0 -1033
package/src/llm/openai/types.js +0 -2
package/src/llm/openai/utils/index.js +0 -756
package/src/llm/openai/utils/isReasoningModel.test.js +0 -79
package/src/llm/openrouter/index.js +0 -261
package/src/llm/openrouter/reasoning.test.js +0 -181
package/src/llm/providers.js +0 -36
package/src/llm/text.js +0 -65
package/src/llm/vertexai/index.js +0 -402
package/src/messages/__tests__/tools.test.js +0 -392
package/src/messages/cache.js +0 -404
package/src/messages/cache.test.js +0 -1167
package/src/messages/content.js +0 -48
package/src/messages/content.test.js +0 -314
package/src/messages/core.js +0 -359
package/src/messages/ensureThinkingBlock.test.js +0 -997
package/src/messages/format.js +0 -973
package/src/messages/formatAgentMessages.test.js +0 -2278
package/src/messages/formatAgentMessages.tools.test.js +0 -362
package/src/messages/formatMessage.test.js +0 -608
package/src/messages/ids.js +0 -18
package/src/messages/index.js +0 -9
package/src/messages/labelContentByAgent.test.js +0 -725
package/src/messages/prune.js +0 -438
package/src/messages/reducer.js +0 -60
package/src/messages/shiftIndexTokenCountMap.test.js +0 -63
package/src/messages/summarize.js +0 -146
package/src/messages/summarize.test.js +0 -332
package/src/messages/tools.js +0 -90
package/src/mockStream.js +0 -81
package/src/prompts/collab.js +0 -7
package/src/prompts/index.js +0 -3
package/src/prompts/taskmanager.js +0 -58
package/src/run.js +0 -427
package/src/schemas/index.js +0 -3
package/src/schemas/schema-preparation.test.js +0 -370
package/src/schemas/validate.js +0 -314
package/src/schemas/validate.test.js +0 -264
package/src/scripts/abort.js +0 -127
package/src/scripts/ant_web_search.js +0 -130
package/src/scripts/ant_web_search_edge_case.js +0 -133
package/src/scripts/ant_web_search_error_edge_case.js +0 -119
package/src/scripts/args.js +0 -41
package/src/scripts/bedrock-cache-debug.js +0 -186
package/src/scripts/bedrock-content-aggregation-test.js +0 -195
package/src/scripts/bedrock-merge-test.js +0 -80
package/src/scripts/bedrock-parallel-tools-test.js +0 -150
package/src/scripts/caching.js +0 -106
package/src/scripts/cli.js +0 -152
package/src/scripts/cli2.js +0 -119
package/src/scripts/cli3.js +0 -163
package/src/scripts/cli4.js +0 -165
package/src/scripts/cli5.js +0 -165
package/src/scripts/code_exec.js +0 -171
package/src/scripts/code_exec_files.js +0 -180
package/src/scripts/code_exec_multi_session.js +0 -185
package/src/scripts/code_exec_ptc.js +0 -265
package/src/scripts/code_exec_session.js +0 -217
package/src/scripts/code_exec_simple.js +0 -120
package/src/scripts/content.js +0 -111
package/src/scripts/empty_input.js +0 -125
package/src/scripts/handoff-test.js +0 -96
package/src/scripts/image.js +0 -138
package/src/scripts/memory.js +0 -83
package/src/scripts/multi-agent-chain.js +0 -271
package/src/scripts/multi-agent-conditional.js +0 -185
package/src/scripts/multi-agent-document-review-chain.js +0 -171
package/src/scripts/multi-agent-hybrid-flow.js +0 -264
package/src/scripts/multi-agent-parallel-start.js +0 -214
package/src/scripts/multi-agent-parallel.js +0 -346
package/src/scripts/multi-agent-sequence.js +0 -184
package/src/scripts/multi-agent-supervisor.js +0 -324
package/src/scripts/multi-agent-test.js +0 -147
package/src/scripts/parallel-asymmetric-tools-test.js +0 -202
package/src/scripts/parallel-full-metadata-test.js +0 -176
package/src/scripts/parallel-tools-test.js +0 -256
package/src/scripts/programmatic_exec.js +0 -277
package/src/scripts/programmatic_exec_agent.js +0 -168
package/src/scripts/search.js +0 -118
package/src/scripts/sequential-full-metadata-test.js +0 -143
package/src/scripts/simple.js +0 -174
package/src/scripts/single-agent-metadata-test.js +0 -152
package/src/scripts/stream.js +0 -113
package/src/scripts/test-custom-prompt-key.js +0 -132
package/src/scripts/test-handoff-input.js +0 -143
package/src/scripts/test-handoff-preamble.js +0 -227
package/src/scripts/test-handoff-steering.js +0 -353
package/src/scripts/test-multi-agent-list-handoff.js +0 -318
package/src/scripts/test-parallel-agent-labeling.js +0 -253
package/src/scripts/test-parallel-handoffs.js +0 -229
package/src/scripts/test-thinking-handoff-bedrock.js +0 -132
package/src/scripts/test-thinking-handoff.js +0 -132
package/src/scripts/test-thinking-to-thinking-handoff-bedrock.js +0 -140
package/src/scripts/test-tool-before-handoff-role-order.js +0 -223
package/src/scripts/test-tools-before-handoff.js +0 -187
package/src/scripts/test_code_api.js +0 -263
package/src/scripts/thinking-bedrock.js +0 -128
package/src/scripts/thinking-vertexai.js +0 -130
package/src/scripts/thinking.js +0 -134
package/src/scripts/tool_search.js +0 -114
package/src/scripts/tools.js +0 -125
package/src/specs/agent-handoffs-bedrock.integration.test.js +0 -280
package/src/specs/agent-handoffs.test.js +0 -924
package/src/specs/anthropic.simple.test.js +0 -287
package/src/specs/azure.simple.test.js +0 -381
package/src/specs/cache.simple.test.js +0 -282
package/src/specs/custom-event-await.test.js +0 -148
package/src/specs/deepseek.simple.test.js +0 -189
package/src/specs/emergency-prune.test.js +0 -308
package/src/specs/moonshot.simple.test.js +0 -237
package/src/specs/observability.integration.test.js +0 -1337
package/src/specs/openai.simple.test.js +0 -233
package/src/specs/openrouter.simple.test.js +0 -202
package/src/specs/prune.test.js +0 -733
package/src/specs/reasoning.test.js +0 -144
package/src/specs/spec.utils.js +0 -4
package/src/specs/thinking-handoff.test.js +0 -486
package/src/specs/thinking-prune.test.js +0 -600
package/src/specs/token-distribution-edge-case.test.js +0 -246
package/src/specs/token-memoization.test.js +0 -32
package/src/specs/tokens.test.js +0 -49
package/src/specs/tool-error.test.js +0 -139
package/src/splitStream.js +0 -204
package/src/splitStream.test.js +0 -504
package/src/stream.js +0 -650
package/src/stream.test.js +0 -225
package/src/test/mockTools.js +0 -340
package/src/tools/BrowserTools.js +0 -245
package/src/tools/Calculator.js +0 -38
package/src/tools/Calculator.test.js +0 -225
package/src/tools/CodeExecutor.js +0 -233
package/src/tools/ProgrammaticToolCalling.js +0 -602
package/src/tools/StreamingToolCallBuffer.js +0 -179
package/src/tools/ToolNode.js +0 -930
package/src/tools/ToolSearch.js +0 -904
package/src/tools/__tests__/BrowserTools.test.js +0 -306
package/src/tools/__tests__/ProgrammaticToolCalling.integration.test.js +0 -276
package/src/tools/__tests__/ProgrammaticToolCalling.test.js +0 -807
package/src/tools/__tests__/StreamingToolCallBuffer.test.js +0 -175
package/src/tools/__tests__/ToolApproval.test.js +0 -675
package/src/tools/__tests__/ToolNode.recovery.test.js +0 -200
package/src/tools/__tests__/ToolNode.session.test.js +0 -319
package/src/tools/__tests__/ToolSearch.integration.test.js +0 -125
package/src/tools/__tests__/ToolSearch.test.js +0 -812
package/src/tools/__tests__/handlers.test.js +0 -799
package/src/tools/__tests__/truncation-recovery.integration.test.js +0 -362
package/src/tools/handlers.js +0 -306
package/src/tools/schema.js +0 -25
package/src/tools/search/anthropic.js +0 -34
package/src/tools/search/content.js +0 -116
package/src/tools/search/content.test.js +0 -133
package/src/tools/search/firecrawl.js +0 -173
package/src/tools/search/format.js +0 -198
package/src/tools/search/highlights.js +0 -241
package/src/tools/search/index.js +0 -3
package/src/tools/search/jina-reranker.test.js +0 -106
package/src/tools/search/rerankers.js +0 -165
package/src/tools/search/schema.js +0 -102
package/src/tools/search/search.js +0 -561
package/src/tools/search/serper-scraper.js +0 -126
package/src/tools/search/test.js +0 -129
package/src/tools/search/tool.js +0 -453
package/src/tools/search/types.js +0 -2
package/src/tools/search/utils.js +0 -59
package/src/types/graph.js +0 -24
package/src/types/graph.test.js +0 -192
package/src/types/index.js +0 -7
package/src/types/llm.js +0 -2
package/src/types/messages.js +0 -2
package/src/types/run.js +0 -2
package/src/types/stream.js +0 -2
package/src/types/tools.js +0 -2
package/src/utils/contextAnalytics.js +0 -79
package/src/utils/contextAnalytics.test.js +0 -166
package/src/utils/events.js +0 -26
package/src/utils/graph.js +0 -11
package/src/utils/handlers.js +0 -65
package/src/utils/index.js +0 -10
package/src/utils/llm.js +0 -21
package/src/utils/llmConfig.js +0 -205
package/src/utils/logging.js +0 -37
package/src/utils/misc.js +0 -51
package/src/utils/run.js +0 -69
package/src/utils/schema.js +0 -21
package/src/utils/title.js +0 -119
package/src/utils/tokens.js +0 -92
package/src/utils/toonFormat.js +0 -379

package/src/scripts/test-handoff-steering.js DELETED Viewed

@@ -1,353 +0,0 @@
-import { config } from 'dotenv';
-config();
-import { HumanMessage } from '@langchain/core/messages';
-import { ChatModelStreamHandler, createContentAggregator } from '@/stream';
-import { ToolEndHandler, ModelEndHandler } from '@/events';
-import { GraphEvents, Providers } from '@/common';
-import { Run } from '@/run';
-/**
- * Test LLM steering quality after handoff with system prompt instructions.
- *
- * Validates that the receiving agent clearly understands:
- * 1. WHO it is (its role/identity)
- * 2. WHAT the task is (instructions from the handoff)
- * 3. WHO transferred control (source agent context)
- *
- * Uses specific, verifiable instructions so we can check the output.
- */
-async function testHandoffSteering() {
-    console.log('='.repeat(60));
-    console.log('Test: Handoff Steering Quality (System Prompt Instructions)');
-    console.log('='.repeat(60));
-    const { contentParts, aggregateContent } = createContentAggregator();
-    let currentAgent = '';
-    const agentResponses = {};
-    const customHandlers = {
-        [GraphEvents.TOOL_END]: new ToolEndHandler(),
-        [GraphEvents.CHAT_MODEL_END]: new ModelEndHandler(),
-        [GraphEvents.CHAT_MODEL_STREAM]: new ChatModelStreamHandler(),
-        [GraphEvents.ON_RUN_STEP]: {
-            handle: (event, data) => {
-                const runStep = data;
-                if (runStep.agentId) {
-                    currentAgent = runStep.agentId;
-                    console.log(`\n[Agent: ${currentAgent}] Processing...`);
-                }
-                aggregateContent({ event, data: runStep });
-            },
-        },
-        [GraphEvents.ON_RUN_STEP_COMPLETED]: {
-            handle: (event, data) => {
-                aggregateContent({
-                    event,
-                    data: data,
-                });
-            },
-        },
-        [GraphEvents.ON_MESSAGE_DELTA]: {
-            handle: (event, data) => {
-                aggregateContent({ event, data: data });
-            },
-        },
-        [GraphEvents.TOOL_START]: {
-            handle: (_event, data, _metadata) => {
-                const toolData = data;
-                if (toolData?.name?.includes('transfer_to_')) {
-                    const specialist = toolData.name.replace('lc_transfer_to_', '');
-                    console.log(`\n  >> Handoff to: ${specialist}`);
-                }
-            },
-        },
-    };
-    /**
-     * Test 1: Basic handoff with specific task instructions
-     * The specialist should clearly follow the coordinator's instructions.
-     */
-    async function test1_basicInstructions() {
-        console.log('\n' + '-'.repeat(60));
-        console.log('TEST 1: Basic handoff with specific task instructions');
-        console.log('-'.repeat(60));
-        const agents = [
-            {
-                agentId: 'coordinator',
-                provider: Providers.OPENAI,
-                clientOptions: {
-                    modelName: 'gpt-4.1-mini',
-                    apiKey: process.env.OPENAI_API_KEY,
-                },
-                instructions: `You are a Task Coordinator. When a user makes a request:
-1. Analyze what they need
-2. Transfer to the specialist with SPECIFIC instructions about what to do
-IMPORTANT: Always use the transfer tool. Do not try to do the work yourself.`,
-                maxContextTokens: 8000,
-            },
-            {
-                agentId: 'specialist',
-                provider: Providers.OPENAI,
-                clientOptions: {
-                    modelName: 'gpt-4.1-mini',
-                    apiKey: process.env.OPENAI_API_KEY,
-                },
-                instructions: `You are a Technical Specialist. You provide detailed technical responses.
-When you receive a task, execute it thoroughly. Always identify yourself as the Technical Specialist in your response.`,
-                maxContextTokens: 8000,
-            },
-        ];
-        const edges = [
-            {
-                from: 'coordinator',
-                to: 'specialist',
-                edgeType: 'transfer',
-                description: 'Transfer to specialist for detailed work',
-                prompt: 'Provide specific instructions for the specialist about what to analyze or create',
-                promptKey: 'instructions',
-            },
-        ];
-        const run = await Run.create({
-            runId: `steering-test1-${Date.now()}`,
-            graphConfig: { type: 'multi-agent', agents, edges },
-            customHandlers,
-            returnContent: true,
-            skipCleanup: true,
-        });
-        const streamConfig = {
-            configurable: { thread_id: 'steering-test1' },
-            streamMode: 'values',
-            version: 'v2',
-        };
-        const query = 'Explain the difference between TCP and UDP. I need exactly 3 bullet points for each protocol.';
-        console.log(`\nQuery: "${query}"\n`);
-        const messages = [new HumanMessage(query)];
-        await run.processStream({ messages }, streamConfig);
-        const finalMessages = run.getRunMessages();
-        console.log('\n--- Specialist Response ---');
-        if (finalMessages) {
-            for (const msg of finalMessages) {
-                if (msg.getType() === 'ai' && typeof msg.content === 'string') {
-                    console.log(msg.content);
-                    agentResponses['test1'] = msg.content;
-                }
-            }
-        }
-        // Check steering quality
-        const response = agentResponses['test1'] || '';
-        const mentionsSpecialist = response.toLowerCase().includes('specialist') ||
-            response.toLowerCase().includes('technical');
-        const hasBulletPoints = (response.match(/[-•*]\s/g) || []).length >= 4 ||
-            (response.match(/\d\./g) || []).length >= 4;
-        const mentionsTCP = response.toLowerCase().includes('tcp');
-        const mentionsUDP = response.toLowerCase().includes('udp');
-        console.log('\n--- Steering Checks ---');
-        console.log(`  Identifies as specialist: ${mentionsSpecialist ? 'YES' : 'NO'}`);
-        console.log(`  Has bullet points: ${hasBulletPoints ? 'YES' : 'NO'}`);
-        console.log(`  Covers TCP: ${mentionsTCP ? 'YES' : 'NO'}`);
-        console.log(`  Covers UDP: ${mentionsUDP ? 'YES' : 'NO'}`);
-    }
-    /**
-     * Test 2: Handoff with very specific formatting instructions
-     * Tests whether the receiving agent follows precise instructions from the handoff.
-     */
-    async function test2_preciseFormatting() {
-        console.log('\n' + '-'.repeat(60));
-        console.log('TEST 2: Handoff with precise formatting instructions');
-        console.log('-'.repeat(60));
-        const agents = [
-            {
-                agentId: 'manager',
-                provider: Providers.OPENAI,
-                clientOptions: {
-                    modelName: 'gpt-4.1-mini',
-                    apiKey: process.env.OPENAI_API_KEY,
-                },
-                instructions: `You are a Project Manager. When a user asks about a topic:
-1. Transfer to the writer with VERY SPECIFIC formatting instructions
-2. Tell the writer to start their response with "REPORT:" and end with "END REPORT"
-3. Tell the writer to use exactly 2 paragraphs
-CRITICAL: Always transfer to the writer. Do NOT write the report yourself.`,
-                maxContextTokens: 8000,
-            },
-            {
-                agentId: 'writer',
-                provider: Providers.OPENAI,
-                clientOptions: {
-                    modelName: 'gpt-4.1-mini',
-                    apiKey: process.env.OPENAI_API_KEY,
-                },
-                instructions: `You are a Report Writer. Follow any formatting instructions you receive precisely.
-You must follow the exact format requested.`,
-                maxContextTokens: 8000,
-            },
-        ];
-        const edges = [
-            {
-                from: 'manager',
-                to: 'writer',
-                edgeType: 'transfer',
-                description: 'Transfer to writer for report creation',
-                prompt: 'Provide specific formatting and content instructions for the writer',
-                promptKey: 'instructions',
-            },
-        ];
-        const run = await Run.create({
-            runId: `steering-test2-${Date.now()}`,
-            graphConfig: { type: 'multi-agent', agents, edges },
-            customHandlers,
-            returnContent: true,
-            skipCleanup: true,
-        });
-        const streamConfig = {
-            configurable: { thread_id: 'steering-test2' },
-            streamMode: 'values',
-            version: 'v2',
-        };
-        const query = 'Write a brief report about cloud computing benefits.';
-        console.log(`\nQuery: "${query}"\n`);
-        const messages = [new HumanMessage(query)];
-        await run.processStream({ messages }, streamConfig);
-        const finalMessages = run.getRunMessages();
-        console.log('\n--- Writer Response ---');
-        if (finalMessages) {
-            for (const msg of finalMessages) {
-                if (msg.getType() === 'ai' && typeof msg.content === 'string') {
-                    console.log(msg.content);
-                    agentResponses['test2'] = msg.content;
-                }
-            }
-        }
-        // Check if the writer followed the manager's formatting instructions
-        const response = agentResponses['test2'] || '';
-        const startsWithReport = response.trimStart().startsWith('REPORT:');
-        const endsWithEndReport = response.trimEnd().endsWith('END REPORT');
-        const mentionsCloud = response.toLowerCase().includes('cloud');
-        console.log('\n--- Steering Checks ---');
-        console.log(`  Starts with "REPORT:": ${startsWithReport ? 'YES' : 'NO'}`);
-        console.log(`  Ends with "END REPORT": ${endsWithEndReport ? 'YES' : 'NO'}`);
-        console.log(`  Covers cloud computing: ${mentionsCloud ? 'YES' : 'NO'}`);
-    }
-    /**
-     * Test 3: Multi-turn after handoff
-     * Tests that identity and context persist across turns.
-     */
-    async function test3_multiTurn() {
-        console.log('\n' + '-'.repeat(60));
-        console.log('TEST 3: Multi-turn conversation after handoff');
-        console.log('-'.repeat(60));
-        const agents = [
-            {
-                agentId: 'router',
-                provider: Providers.OPENAI,
-                clientOptions: {
-                    modelName: 'gpt-4.1-mini',
-                    apiKey: process.env.OPENAI_API_KEY,
-                },
-                instructions: `You are a Router. Transfer all requests to the chef.
-When transferring, tell the chef to respond ONLY about Italian cuisine.
-CRITICAL: Always transfer. Never answer directly.`,
-                maxContextTokens: 8000,
-            },
-            {
-                agentId: 'chef',
-                provider: Providers.OPENAI,
-                clientOptions: {
-                    modelName: 'gpt-4.1-mini',
-                    apiKey: process.env.OPENAI_API_KEY,
-                },
-                instructions: `You are Chef Marco, an Italian cuisine expert.
-Always introduce yourself as Chef Marco. Only discuss Italian food.
-If asked about non-Italian food, politely redirect to Italian alternatives.`,
-                maxContextTokens: 8000,
-            },
-        ];
-        const edges = [
-            {
-                from: 'router',
-                to: 'chef',
-                edgeType: 'transfer',
-                description: 'Transfer to chef',
-                prompt: 'Instructions for the chef about how to respond',
-                promptKey: 'instructions',
-            },
-        ];
-        const run = await Run.create({
-            runId: `steering-test3-${Date.now()}`,
-            graphConfig: { type: 'multi-agent', agents, edges },
-            customHandlers,
-            returnContent: true,
-            skipCleanup: true,
-        });
-        const streamConfig = {
-            configurable: { thread_id: 'steering-test3' },
-            streamMode: 'values',
-            version: 'v2',
-        };
-        const conversationHistory = [];
-        // Turn 1
-        const query1 = 'What is a good pasta recipe?';
-        console.log(`\nTurn 1: "${query1}"\n`);
-        conversationHistory.push(new HumanMessage(query1));
-        await run.processStream({ messages: conversationHistory }, streamConfig);
-        const turn1Messages = run.getRunMessages();
-        if (turn1Messages) {
-            conversationHistory.push(...turn1Messages);
-            for (const msg of turn1Messages) {
-                if (msg.getType() === 'ai' && typeof msg.content === 'string') {
-                    console.log(msg.content.substring(0, 300) + '...');
-                    agentResponses['test3_turn1'] = msg.content;
-                }
-            }
-        }
-        // Turn 2 - follow up
-        const query2 = 'What about sushi instead?';
-        console.log(`\nTurn 2: "${query2}"\n`);
-        conversationHistory.push(new HumanMessage(query2));
-        await run.processStream({ messages: conversationHistory }, streamConfig);
-        const turn2Messages = run.getRunMessages();
-        if (turn2Messages) {
-            conversationHistory.push(...turn2Messages);
-            for (const msg of turn2Messages) {
-                if (msg.getType() === 'ai' && typeof msg.content === 'string') {
-                    console.log(msg.content.substring(0, 300) + '...');
-                    agentResponses['test3_turn2'] = msg.content;
-                }
-            }
-        }
-        const response1 = agentResponses['test3_turn1'] || '';
-        const response2 = agentResponses['test3_turn2'] || '';
-        const t1Identity = response1.toLowerCase().includes('marco') ||
-            response1.toLowerCase().includes('chef');
-        const t1Italian = response1.toLowerCase().includes('italian') ||
-            response1.toLowerCase().includes('pasta');
-        const t2Redirects = response2.toLowerCase().includes('italian') ||
-            response2.toLowerCase().includes('instead');
-        console.log('\n--- Steering Checks ---');
-        console.log(`  Turn 1 - Chef identity: ${t1Identity ? 'YES' : 'NO'}`);
-        console.log(`  Turn 1 - Italian focus: ${t1Italian ? 'YES' : 'NO'}`);
-        console.log(`  Turn 2 - Redirects to Italian: ${t2Redirects ? 'YES' : 'NO'}`);
-    }
-    try {
-        await test1_basicInstructions();
-        await test2_preciseFormatting();
-        await test3_multiTurn();
-        console.log('\n\n' + '='.repeat(60));
-        console.log('ALL TESTS COMPLETE');
-        console.log('='.repeat(60));
-        console.log('\nReview the steering checks above.');
-        console.log('If the receiving agents consistently follow instructions and maintain identity,');
-        console.log('the system prompt injection approach is working correctly.');
-    }
-    catch (error) {
-        console.error('\nTest failed:', error);
-        process.exit(1);
-    }
-}
-process.on('unhandledRejection', (reason) => {
-    console.error('Unhandled Rejection:', reason);
-    process.exit(1);
-});
-testHandoffSteering().catch((err) => {
-    console.error('Test failed:', err);
-    process.exit(1);
-});
-//# sourceMappingURL=test-handoff-steering.js.map

package/src/scripts/test-multi-agent-list-handoff.js DELETED Viewed

@@ -1,318 +0,0 @@
-#!/usr/bin/env bun
-import { config } from 'dotenv';
-config();
-import { HumanMessage } from '@langchain/core/messages';
-import { labelContentByAgent, formatAgentMessages } from '@/messages/format';
-import { ChatModelStreamHandler, createContentAggregator } from '@/stream';
-import { Providers, GraphEvents, Constants, StepTypes } from '@/common';
-import { ToolEndHandler, ModelEndHandler } from '@/events';
-import { Run } from '@/run';
-const conversationHistory = [];
-/**
- * Test supervisor-based multi-agent system using a single edge with multiple destinations
- *
- * Instead of creating 5 separate edges, we use one edge with an array of destinations
- * This should create handoff tools for all 5 specialists from a single edge definition
- */
-async function testSupervisorListHandoff() {
-    console.log('Testing Supervisor with List-Based Handoff Edge...\n');
-    // Set up content aggregator
-    const { contentParts, aggregateContent } = createContentAggregator();
-    // Track which specialist role was selected
-    let selectedRole = '';
-    // Create custom handlers
-    const customHandlers = {
-        [GraphEvents.TOOL_END]: new ToolEndHandler(),
-        [GraphEvents.CHAT_MODEL_END]: new ModelEndHandler(),
-        [GraphEvents.CHAT_MODEL_STREAM]: new ChatModelStreamHandler(),
-        [GraphEvents.ON_RUN_STEP]: {
-            handle: (event, data) => {
-                const runStepData = data;
-                if (runStepData?.name) {
-                    console.log(`\n[${runStepData.name}] Processing...`);
-                }
-                aggregateContent({ event, data: data });
-            },
-        },
-        [GraphEvents.ON_RUN_STEP_COMPLETED]: {
-            handle: (event, data) => {
-                aggregateContent({
-                    event,
-                    data: data,
-                });
-            },
-        },
-        [GraphEvents.ON_MESSAGE_DELTA]: {
-            handle: (event, data) => {
-                aggregateContent({ event, data: data });
-            },
-        },
-        [GraphEvents.TOOL_START]: {
-            handle: (_event, data, metadata) => {
-                const toolData = data;
-                if (toolData?.name?.startsWith(Constants.LC_TRANSFER_TO_)) {
-                    const specialist = toolData.name.replace(Constants.LC_TRANSFER_TO_, '');
-                    console.log(`\n🔀 Transferring to ${specialist}...`);
-                    selectedRole = specialist;
-                }
-            },
-        },
-    };
-    // Function to create the graph with a single edge to multiple specialists
-    function createSupervisorGraphWithListEdge() {
-        console.log(`\nCreating graph with supervisor and 5 specialist agents.`);
-        console.log('Using a SINGLE edge with multiple destinations (list-based handoff).\n');
-        // Define the adaptive specialist configuration that will be reused
-        const specialistConfig = {
-            provider: Providers.ANTHROPIC,
-            clientOptions: {
-                modelName: 'claude-haiku-4-5',
-                apiKey: process.env.ANTHROPIC_API_KEY,
-            },
-            instructions: `You are an Adaptive Specialist. Your agent ID indicates your role:
-      - data_analyst: Focus on statistical analysis, metrics, ML evaluation, A/B testing
-      - security_expert: Focus on cybersecurity, vulnerability assessment, compliance
-      - product_designer: Focus on UX/UI design, user research, accessibility
-      - devops_engineer: Focus on CI/CD, infrastructure, cloud platforms, monitoring
-      - legal_advisor: Focus on licensing, privacy laws, contracts, regulatory compliance
-      The supervisor will provide specific instructions. Follow them while maintaining your expert perspective.`,
-            maxContextTokens: 8000,
-        };
-        // Create the graph with supervisor and all 5 specialists
-        const agents = [
-            {
-                agentId: 'supervisor',
-                provider: Providers.ANTHROPIC,
-                clientOptions: {
-                    modelName: 'claude-haiku-4-5',
-                    apiKey: process.env.ANTHROPIC_API_KEY,
-                },
-                instructions: `You are a Task Supervisor with access to 5 specialist agents:
-        1. transfer_to_data_analyst - For statistical analysis and metrics
-        2. transfer_to_security_expert - For cybersecurity and vulnerability assessment
-        3. transfer_to_product_designer - For UX/UI design
-        4. transfer_to_devops_engineer - For infrastructure and deployment
-        5. transfer_to_legal_advisor - For compliance and licensing
-        Your role is to:
-        1. Analyze the incoming request
-        2. Decide which specialist is best suited
-        3. Use the appropriate transfer tool (e.g., transfer_to_data_analyst)
-        4. Provide specific instructions to guide their work
-        Be specific about what you need from the specialist.`,
-                maxContextTokens: 8000,
-            },
-            // Include all 5 specialists with the same adaptive configuration
-            {
-                agentId: 'data_analyst',
-                ...specialistConfig,
-            },
-            {
-                agentId: 'security_expert',
-                ...specialistConfig,
-            },
-            {
-                agentId: 'product_designer',
-                ...specialistConfig,
-            },
-            {
-                agentId: 'devops_engineer',
-                ...specialistConfig,
-            },
-            {
-                agentId: 'legal_advisor',
-                ...specialistConfig,
-            },
-        ];
-        // Create a SINGLE edge from supervisor to ALL 5 specialists using a list
-        const edges = [
-            {
-                from: 'supervisor',
-                to: [
-                    'data_analyst',
-                    'security_expert',
-                    'product_designer',
-                    'devops_engineer',
-                    'legal_advisor',
-                ],
-                description: 'Transfer to appropriate specialist based on task requirements',
-                edgeType: 'transfer',
-            },
-        ];
-        return {
-            runId: `supervisor-list-handoff-${Date.now()}`,
-            graphConfig: {
-                type: 'multi-agent',
-                agents,
-                edges,
-            },
-            customHandlers,
-            returnContent: true,
-            skipCleanup: true,
-        };
-    }
-    try {
-        // Test with different queries
-        const testQueries = [
-            'What are the legal implications of using GPL-licensed code in our product?',
-        ];
-        const config = {
-            configurable: {
-                thread_id: 'supervisor-list-handoff-1',
-            },
-            streamMode: 'values',
-            version: 'v2',
-        };
-        for (const query of testQueries) {
-            console.log(`\n${'='.repeat(80)}`);
-            console.log(`FIRST RUN - USER QUERY: "${query}"`);
-            console.log('='.repeat(80));
-            // Reset conversation
-            conversationHistory.length = 0;
-            conversationHistory.push(new HumanMessage(query));
-            // Create graph with supervisor having a single edge to multiple specialists
-            const runConfig = createSupervisorGraphWithListEdge();
-            const run = await Run.create(runConfig);
-            console.log('Processing first request...');
-            // Process with streaming
-            const inputs = {
-                messages: conversationHistory,
-            };
-            const finalContentParts = await run.processStream(inputs, config);
-            const finalMessages = run.getRunMessages();
-            if (finalMessages) {
-                conversationHistory.push(...finalMessages);
-            }
-            // Demo: Map contentParts to agentIds
-            console.log(`\n${'─'.repeat(60)}`);
-            console.log('CONTENT PARTS TO AGENT MAPPING:');
-            console.log('─'.repeat(60));
-            if (run.Graph) {
-                // Get the mapping of contentPart index to agentId
-                const contentPartAgentMap = run.Graph.getContentPartAgentMap();
-                console.log(`\nTotal content parts: ${contentParts.length}`);
-                console.log(`\nContent Part → Agent Mapping:`);
-                contentPartAgentMap.forEach((agentId, index) => {
-                    const contentPart = contentParts[index];
-                    const contentType = contentPart?.type || 'unknown';
-                    const preview = contentType === 'text'
-                        ? contentPart.text?.slice(0, 50) || ''
-                        : contentType === 'tool_call'
-                            ? `Tool: ${contentPart.tool_call?.name || 'unknown'}`
-                            : contentType;
-                    console.log(`  [${index}] ${agentId} → ${contentType}: ${preview}${preview.length >= 50 ? '...' : ''}`);
-                });
-                // Show agent participation summary
-                console.log(`\n${'─'.repeat(60)}`);
-                console.log('AGENT PARTICIPATION SUMMARY:');
-                console.log('─'.repeat(60));
-                const activeAgents = run.Graph.getActiveAgentIds();
-                console.log(`\nActive agents (${activeAgents.length}):`, activeAgents);
-                const stepsByAgent = run.Graph.getRunStepsByAgent();
-                stepsByAgent.forEach((steps, agentId) => {
-                    const toolCallSteps = steps.filter((s) => s.type === StepTypes.TOOL_CALLS).length;
-                    const messageSteps = steps.filter((s) => s.type === StepTypes.MESSAGE_CREATION).length;
-                    console.log(`\n  ${agentId}:`);
-                    console.log(`    - Total steps: ${steps.length}`);
-                    console.log(`    - Message steps: ${messageSteps}`);
-                    console.log(`    - Tool call steps: ${toolCallSteps}`);
-                });
-            }
-            // Show graph structure summary
-            console.log(`\n${'─'.repeat(60)}`);
-            console.log(`GRAPH STRUCTURE:`);
-            console.log(`- Agents: 6 total (supervisor + 5 specialists)`);
-            console.log(`- Edges: 1 edge with multiple destinations`);
-            console.log(`- Edge type: handoff (creates individual tools for each destination)`);
-            console.log(`- Result: Supervisor has 5 handoff tools from a single edge`);
-            console.log('─'.repeat(60));
-            // =============================================================
-            // SECOND RUN: Demonstrate agent-labeled history
-            // =============================================================
-            console.log(`\n${'='.repeat(80)}`);
-            console.log(`SECOND RUN - Simulating DB Load with Agent-Labeled History`);
-            console.log('='.repeat(80));
-            // Simulate what happens in the main app:
-            // 1. Store contentParts + agentIdMap to "DB" (in-memory here)
-            const dbStoredContentParts = [...contentParts];
-            const dbStoredAgentIdMap = Object.fromEntries(run.Graph.getContentPartAgentMap());
-            console.log('\n📦 Simulating DB storage:');
-            console.log(`  - Stored ${dbStoredContentParts.length} content parts`);
-            console.log(`  - Stored agent mappings for ${Object.keys(dbStoredAgentIdMap).length} parts`);
-            // 2. On next run, load from "DB" and label by agent
-            console.log('\n📥 Loading from DB and labeling by agent...');
-            const agentNames = {
-                supervisor: 'Supervisor',
-                legal_advisor: 'Legal Advisor',
-                data_analyst: 'Data Analyst',
-                security_expert: 'Security Expert',
-                product_designer: 'Product Designer',
-                devops_engineer: 'DevOps Engineer',
-            };
-            const labeledContentParts = labelContentByAgent(dbStoredContentParts.filter((p) => p != null), dbStoredAgentIdMap, agentNames);
-            console.log(`  - Labeled ${labeledContentParts.length} content parts by agent`);
-            // 3. Convert labeled content parts to payload format
-            const payload = [
-                {
-                    role: 'user',
-                    content: query,
-                },
-                {
-                    role: 'assistant',
-                    content: labeledContentParts,
-                },
-            ];
-            // 4. Format using formatAgentMessages (simulates what main app does)
-            console.log('\n🔧 Calling formatAgentMessages...');
-            const { messages: formattedMessages } = formatAgentMessages(payload);
-            console.log(`  - Formatted into ${formattedMessages.length} BaseMessages`);
-            // Show a preview of what the supervisor will see
-            console.log('\n👁️  Preview of formatted history for supervisor:');
-            console.log('─'.repeat(80));
-            for (let i = 0; i < formattedMessages.length; i++) {
-                const msg = formattedMessages[i];
-                const role = msg._getType();
-                const preview = typeof msg.content === 'string'
-                    ? msg.content.slice(0, 200)
-                    : JSON.stringify(msg.content).slice(0, 200);
-                console.log(`[${i}] ${role}: ${preview}${preview.length >= 200 ? '...' : ''}`);
-            }
-            console.log('─'.repeat(80));
-            // 5. Create a new run with the formatted history + a followup question
-            console.log('\n🚀 Starting second run with agent-labeled history + followup question...');
-            const followupQuery = 'Can you summarize the key legal points from your previous response?';
-            console.log(`   Followup: "${followupQuery}"`);
-            // Reset for second run
-            const secondRunHistory = [
-                ...formattedMessages,
-                new HumanMessage(followupQuery),
-            ];
-            const runConfig2 = createSupervisorGraphWithListEdge();
-            const run2 = await Run.create(runConfig2);
-            const inputs2 = {
-                messages: secondRunHistory,
-            };
-            await run2.processStream(inputs2, config);
-            console.log('\n✅ Second run completed successfully!');
-            console.log('   The supervisor correctly understood that the legal_advisor handled');
-            console.log('   the previous query, avoiding identity confusion.');
-        }
-        // Final summary
-        console.log(`\n${'='.repeat(60)}`);
-        console.log('TEST COMPLETE');
-        console.log('='.repeat(60));
-        console.log('\nThis test demonstrates that a single edge with multiple');
-        console.log('destinations in the "to" field creates individual handoff');
-        console.log('tools for each destination agent, achieving the same result');
-        console.log('as creating separate edges for each specialist.');
-    }
-    catch (error) {
-        console.error('Error in supervisor list handoff test:', error);
-    }
-}
-// Run the test
-testSupervisorListHandoff();
-//# sourceMappingURL=test-multi-agent-list-handoff.js.map