npm - @flink-app/flink - Versions diffs - 0.14.3 → 2.0.0-alpha.100 - Mend

@flink-app/flink 0.14.3 → 2.0.0-alpha.100

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (280) hide show

package/CHANGELOG.md +1051 -0
package/SCHEMA_EXTRACTION_ANALYSIS.md +494 -0
package/SIMPLE_AST_FEASIBILITY.md +570 -0
package/bin/flink.ts +13 -2
package/cli/build.ts +24 -44
package/cli/clean.ts +13 -25
package/cli/cli-utils.ts +190 -17
package/cli/dev.ts +252 -0
package/cli/loadEnvFiles.ts +116 -0
package/cli/run.ts +45 -62
package/dist/bin/flink.js +61 -2
package/dist/cli/build.js +20 -25
package/dist/cli/clean.js +12 -10
package/dist/cli/cli-utils.d.ts +34 -3
package/dist/cli/cli-utils.js +193 -12
package/dist/cli/dev.d.ts +2 -0
package/dist/cli/dev.js +279 -0
package/dist/cli/loadEnvFiles.d.ts +30 -0
package/dist/cli/loadEnvFiles.js +113 -0
package/dist/cli/run.js +47 -46
package/dist/src/DependencyTracker.d.ts +44 -0
package/dist/src/DependencyTracker.js +239 -0
package/dist/src/FlinkApp.d.ts +163 -10
package/dist/src/FlinkApp.js +847 -184
package/dist/src/FlinkContext.d.ts +41 -0
package/dist/src/FlinkErrors.d.ts +19 -6
package/dist/src/FlinkErrors.js +36 -42
package/dist/src/FlinkHttpHandler.d.ts +219 -26
package/dist/src/FlinkHttpHandler.js +37 -1
package/dist/src/FlinkJob.d.ts +10 -0
package/dist/src/FlinkLog.d.ts +82 -18
package/dist/src/FlinkLog.js +165 -13
package/dist/src/FlinkLogFactory.d.ts +288 -0
package/dist/src/FlinkLogFactory.js +619 -0
package/dist/src/FlinkRepo.d.ts +10 -2
package/dist/src/FlinkRepo.js +11 -1
package/dist/src/FlinkRequestContext.d.ts +63 -0
package/dist/src/FlinkRequestContext.js +74 -0
package/dist/src/FlinkResponse.d.ts +6 -0
package/dist/src/FlinkService.d.ts +38 -0
package/dist/src/FlinkService.js +46 -0
package/dist/src/LeaderElection.d.ts +45 -0
package/dist/src/LeaderElection.js +269 -0
package/dist/src/SchemaCache.d.ts +84 -0
package/dist/src/SchemaCache.js +289 -0
package/dist/src/TypeScriptCompiler.d.ts +161 -51
package/dist/src/TypeScriptCompiler.js +1253 -617
package/dist/src/TypeScriptUtils.js +4 -0
package/dist/src/ai/AgentRunner.d.ts +39 -0
package/dist/src/ai/AgentRunner.js +760 -0
package/dist/src/ai/ConversationAgent.d.ts +279 -0
package/dist/src/ai/ConversationAgent.js +404 -0
package/dist/src/ai/ConversationFlinkAgent.d.ts +278 -0
package/dist/src/ai/ConversationFlinkAgent.js +404 -0
package/dist/src/ai/FlinkAgent.d.ts +690 -0
package/dist/src/ai/FlinkAgent.js +729 -0
package/dist/src/ai/FlinkTool.d.ts +135 -0
package/dist/src/ai/FlinkTool.js +2 -0
package/dist/src/ai/InMemoryConversationAgent.d.ts +121 -0
package/dist/src/ai/InMemoryConversationAgent.js +209 -0
package/dist/src/ai/LLMAdapter.d.ts +148 -0
package/dist/src/ai/LLMAdapter.js +2 -0
package/dist/src/ai/PersistentFlinkAgent.d.ts +278 -0
package/dist/src/ai/PersistentFlinkAgent.js +403 -0
package/dist/src/ai/SubAgentExecutor.d.ts +38 -0
package/dist/src/ai/SubAgentExecutor.js +223 -0
package/dist/src/ai/ToolExecutor.d.ts +64 -0
package/dist/src/ai/ToolExecutor.js +497 -0
package/dist/src/ai/agentInstructions.d.ts +68 -0
package/dist/src/ai/agentInstructions.js +286 -0
package/dist/src/ai/index.d.ts +8 -0
package/dist/src/ai/index.js +26 -0
package/dist/src/ai/instructionFileLoader.d.ts +44 -0
package/dist/src/ai/instructionFileLoader.js +179 -0
package/dist/src/auth/FlinkAuthPlugin.d.ts +1 -1
package/dist/src/handlers/StreamWriterFactory.d.ts +20 -0
package/dist/src/handlers/StreamWriterFactory.js +83 -0
package/dist/src/index.d.ts +14 -0
package/dist/src/index.js +17 -0
package/dist/src/loadPluginSchemas.d.ts +45 -0
package/dist/src/loadPluginSchemas.js +143 -0
package/dist/src/schema-extraction/ComplexTypeDetection.d.ts +40 -0
package/dist/src/schema-extraction/ComplexTypeDetection.js +75 -0
package/dist/src/schema-extraction/TypeScriptSourceParser.d.ts +321 -0
package/dist/src/schema-extraction/TypeScriptSourceParser.js +925 -0
package/dist/src/schema-extraction/TypeScriptSourceParser.spec.d.ts +1 -0
package/dist/src/schema-extraction/TypeScriptSourceParser.spec.js +233 -0
package/dist/src/schema-extraction/TypeScriptTokenizer.d.ts +57 -0
package/dist/src/schema-extraction/TypeScriptTokenizer.js +177 -0
package/dist/src/schema-extraction/index.d.ts +2 -0
package/dist/src/schema-extraction/index.js +20 -0
package/dist/src/schema-extraction/types.d.ts +31 -0
package/dist/src/schema-extraction/types.js +2 -0
package/dist/src/utils/loadFlinkConfig.d.ts +53 -0
package/dist/src/utils/loadFlinkConfig.js +77 -0
package/dist/src/utils.d.ts +30 -0
package/dist/src/utils.js +52 -0
package/dist/src/workers/SchemaGeneratorWorker.d.ts +1 -0
package/dist/src/workers/SchemaGeneratorWorker.js +49 -0
package/dist/src/workers/WorkerPool.d.ts +60 -0
package/dist/src/workers/WorkerPool.js +306 -0
package/examples/logging-hierarchical-example.ts +125 -0
package/package.json +29 -4
package/readme.md +499 -0
package/spec/AgentDescendantDetection.spec.ts +335 -0
package/spec/AgentDuplicateDetection.spec.ts +112 -0
package/spec/AgentObserver.spec.ts +266 -0
package/spec/AgentRunner.spec.ts +1062 -0
package/spec/AsyncLocalStorageContext.spec.ts +223 -0
package/spec/ConversationHooks.spec.ts +257 -0
package/spec/FlinkAgent.spec.ts +681 -0
package/spec/FlinkApp.htmlResponse.spec.ts +260 -0
package/spec/FlinkApp.onError.invocation.spec.ts +151 -0
package/spec/FlinkApp.onError.spec.ts +1 -2
package/spec/FlinkApp.query.spec.ts +107 -0
package/spec/FlinkApp.routeOrdering.spec.ts +61 -0
package/spec/FlinkApp.undefinedResponse.spec.ts +123 -0
package/spec/FlinkApp.validationMode.spec.ts +155 -0
package/spec/FlinkJob.spec.ts +171 -0
package/spec/FlinkLogFactory.spec.ts +337 -0
package/spec/FlinkRepo.spec.ts +1 -1
package/spec/LeaderElection.spec.ts +174 -0
package/spec/StreamingIntegration.spec.ts +139 -0
package/spec/ToolExecutor.spec.ts +465 -0
package/spec/TypeScriptCompiler.spec.ts +1 -1
package/spec/TypeScriptSourceParser.spec.ts +1215 -0
package/spec/TypeScriptTokenizer.spec.ts +366 -0
package/spec/ai/ContextCompaction.spec.ts +405 -0
package/spec/ai/ConversationAgent.spec.ts +520 -0
package/spec/ai/InMemoryConversationAgent.spec.ts +144 -0
package/spec/ai/agentInstructions.spec.ts +358 -0
package/spec/fixtures/agent-instructions/TestAgent.ts +24 -0
package/spec/fixtures/agent-instructions/simple.md +3 -0
package/spec/fixtures/agent-instructions/template.md +18 -0
package/spec/fixtures/agent-instructions/yaml-format.yaml +9 -0
package/spec/mock-project/dist/.tsbuildinfo +1 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/GetCar.js +56 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/GetCar2.js +58 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/GetCarWithArraySchema.js +52 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/GetCarWithArraySchema2.js +52 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/GetCarWithArraySchema3.js +52 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/GetCarWithLiteralSchema.js +54 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/GetCarWithLiteralSchema2.js +54 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/GetCarWithSchemaInFile.js +57 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/GetCarWithSchemaInFile2.js +57 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/ManuallyAddedHandler.js +53 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/ManuallyAddedHandler2.js +55 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/PatchCar.js +57 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/PatchOnboardingSession.js +75 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/PatchOrderWithComplexTypes.js +57 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/PatchProductWithIntersection.js +58 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/PatchUserWithUnion.js +58 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/PostCar.js +54 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/PostLogin.js +55 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/PostLogout.js +54 -0
package/spec/mock-project/dist/spec/mock-project/src/handlers/PutCar.js +54 -0
package/spec/mock-project/dist/spec/mock-project/src/index.js +83 -0
package/spec/mock-project/dist/spec/mock-project/src/repos/CarRepo.js +26 -0
package/spec/mock-project/dist/spec/mock-project/src/schemas/Car.js +2 -0
package/spec/mock-project/dist/spec/mock-project/src/schemas/DefaultExportSchema.js +2 -0
package/spec/mock-project/dist/spec/mock-project/src/schemas/FileWithTwoSchemas.js +2 -0
package/spec/mock-project/dist/src/FlinkApp.js +1000 -0
package/spec/mock-project/dist/src/FlinkContext.js +2 -0
package/spec/mock-project/dist/src/FlinkErrors.js +143 -0
package/spec/mock-project/dist/src/FlinkHttpHandler.js +47 -0
package/spec/mock-project/dist/src/FlinkJob.js +2 -0
package/spec/mock-project/dist/src/FlinkLog.js +119 -0
package/spec/mock-project/dist/src/FlinkLogFactory.js +617 -0
package/spec/mock-project/dist/src/FlinkPlugin.js +2 -0
package/spec/mock-project/dist/src/FlinkRepo.js +224 -0
package/spec/mock-project/dist/src/FlinkRequestContext.js +74 -0
package/spec/mock-project/dist/src/FlinkResponse.js +2 -0
package/spec/mock-project/dist/src/ai/AgentExecutor.js +279 -0
package/spec/mock-project/dist/src/ai/AgentRunner.js +632 -0
package/spec/mock-project/dist/src/ai/ConversationAgent.js +402 -0
package/spec/mock-project/dist/src/ai/ConversationFlinkAgent.js +422 -0
package/spec/mock-project/dist/src/ai/FlinkAgent.js +699 -0
package/spec/mock-project/dist/src/ai/FlinkTool.js +2 -0
package/spec/mock-project/dist/src/ai/InMemoryConversationAgent.js +209 -0
package/spec/mock-project/dist/src/ai/LLMAdapter.js +2 -0
package/spec/mock-project/dist/src/ai/SubAgentExecutor.js +223 -0
package/spec/mock-project/dist/src/ai/ToolExecutor.js +412 -0
package/spec/mock-project/dist/src/ai/agentInstructions.js +246 -0
package/spec/mock-project/dist/src/auth/FlinkAuthPlugin.js +2 -0
package/spec/mock-project/dist/src/auth/FlinkAuthUser.js +2 -0
package/spec/mock-project/dist/src/handlers/GetCar.js +26 -52
package/spec/mock-project/dist/src/handlers/GetCar.js.map +1 -0
package/spec/mock-project/dist/src/handlers/GetCar2.js +32 -54
package/spec/mock-project/dist/src/handlers/GetCar2.js.map +1 -0
package/spec/mock-project/dist/src/handlers/GetCarWithArraySchema.js +26 -48
package/spec/mock-project/dist/src/handlers/GetCarWithArraySchema.js.map +1 -0
package/spec/mock-project/dist/src/handlers/GetCarWithArraySchema2.js +28 -48
package/spec/mock-project/dist/src/handlers/GetCarWithArraySchema2.js.map +1 -0
package/spec/mock-project/dist/src/handlers/GetCarWithArraySchema3.js +29 -48
package/spec/mock-project/dist/src/handlers/GetCarWithArraySchema3.js.map +1 -0
package/spec/mock-project/dist/src/handlers/GetCarWithLiteralSchema.js +26 -50
package/spec/mock-project/dist/src/handlers/GetCarWithLiteralSchema.js.map +1 -0
package/spec/mock-project/dist/src/handlers/GetCarWithLiteralSchema2.js +28 -50
package/spec/mock-project/dist/src/handlers/GetCarWithLiteralSchema2.js.map +1 -0
package/spec/mock-project/dist/src/handlers/GetCarWithSchemaInFile.js +27 -53
package/spec/mock-project/dist/src/handlers/GetCarWithSchemaInFile.js.map +1 -0
package/spec/mock-project/dist/src/handlers/GetCarWithSchemaInFile2.js +29 -53
package/spec/mock-project/dist/src/handlers/GetCarWithSchemaInFile2.js.map +1 -0
package/spec/mock-project/dist/src/handlers/ManuallyAddedHandler.js +16 -49
package/spec/mock-project/dist/src/handlers/ManuallyAddedHandler.js.map +1 -0
package/spec/mock-project/dist/src/handlers/ManuallyAddedHandler2.js +25 -50
package/spec/mock-project/dist/src/handlers/ManuallyAddedHandler2.js.map +1 -0
package/spec/mock-project/dist/src/handlers/PatchCar.js +27 -53
package/spec/mock-project/dist/src/handlers/PatchCar.js.map +1 -0
package/spec/mock-project/dist/src/handlers/PatchOnboardingSession.js +44 -70
package/spec/mock-project/dist/src/handlers/PatchOnboardingSession.js.map +1 -0
package/spec/mock-project/dist/src/handlers/PatchOrderWithComplexTypes.js +27 -53
package/spec/mock-project/dist/src/handlers/PatchOrderWithComplexTypes.js.map +1 -0
package/spec/mock-project/dist/src/handlers/PatchProductWithIntersection.js +28 -54
package/spec/mock-project/dist/src/handlers/PatchProductWithIntersection.js.map +1 -0
package/spec/mock-project/dist/src/handlers/PatchUserWithUnion.js +28 -54
package/spec/mock-project/dist/src/handlers/PatchUserWithUnion.js.map +1 -0
package/spec/mock-project/dist/src/handlers/PostCar.js +24 -50
package/spec/mock-project/dist/src/handlers/PostCar.js.map +1 -0
package/spec/mock-project/dist/src/handlers/PostLogin.js +25 -51
package/spec/mock-project/dist/src/handlers/PostLogin.js.map +1 -0
package/spec/mock-project/dist/src/handlers/PostLogout.js +24 -50
package/spec/mock-project/dist/src/handlers/PostLogout.js.map +1 -0
package/spec/mock-project/dist/src/handlers/PutCar.js +24 -50
package/spec/mock-project/dist/src/handlers/PutCar.js.map +1 -0
package/spec/mock-project/dist/src/handlers/StreamWriterFactory.js +83 -0
package/spec/mock-project/dist/src/index.js +52 -76
package/spec/mock-project/dist/src/index.js.map +1 -0
package/spec/mock-project/dist/src/mock-data-generator.js +9 -0
package/spec/mock-project/dist/src/repos/CarRepo.js +12 -24
package/spec/mock-project/dist/src/repos/CarRepo.js.map +1 -0
package/spec/mock-project/dist/src/schemas/Car.js +3 -1
package/spec/mock-project/dist/src/schemas/Car.js.map +1 -0
package/spec/mock-project/dist/src/schemas/DefaultExportSchema.js +3 -1
package/spec/mock-project/dist/src/schemas/DefaultExportSchema.js.map +1 -0
package/spec/mock-project/dist/src/schemas/FileWithTwoSchemas.js +3 -1
package/spec/mock-project/dist/src/schemas/FileWithTwoSchemas.js.map +1 -0
package/spec/mock-project/dist/src/utils.js +290 -0
package/spec/mock-project/tsconfig.json +6 -1
package/spec/schema-generation-nested-objects.spec.ts +97 -0
package/spec/testHelpers.ts +49 -0
package/spec/utils.caseConversion.spec.ts +78 -0
package/spec/utils.spec.ts +13 -13
package/src/DependencyTracker.ts +166 -0
package/src/FlinkApp.ts +919 -155
package/src/FlinkContext.ts +43 -0
package/src/FlinkErrors.ts +32 -12
package/src/FlinkHttpHandler.ts +246 -28
package/src/FlinkJob.ts +11 -0
package/src/FlinkLog.ts +119 -12
package/src/FlinkLogFactory.ts +699 -0
package/src/FlinkRepo.ts +10 -3
package/src/FlinkRequestContext.ts +95 -0
package/src/FlinkResponse.ts +6 -0
package/src/FlinkService.ts +49 -0
package/src/LeaderElection.ts +203 -0
package/src/SchemaCache.ts +232 -0
package/src/TypeScriptCompiler.ts +1347 -610
package/src/TypeScriptUtils.ts +5 -0
package/src/ai/AgentRunner.ts +646 -0
package/src/ai/ConversationAgent.ts +413 -0
package/src/ai/FlinkAgent.ts +1069 -0
package/src/ai/FlinkTool.ts +165 -0
package/src/ai/InMemoryConversationAgent.ts +149 -0
package/src/ai/LLMAdapter.ts +126 -0
package/src/ai/ToolExecutor.ts +485 -0
package/src/ai/agentInstructions.ts +245 -0
package/src/ai/index.ts +8 -0
package/src/ai/instructionFileLoader.ts +156 -0
package/src/auth/FlinkAuthPlugin.ts +2 -1
package/src/handlers/StreamWriterFactory.ts +84 -0
package/src/index.ts +14 -0
package/src/loadPluginSchemas.ts +141 -0
package/src/schema-extraction/TypeScriptSourceParser.ts +1058 -0
package/src/schema-extraction/TypeScriptTokenizer.ts +205 -0
package/src/schema-extraction/index.ts +2 -0
package/src/schema-extraction/types.ts +34 -0
package/src/utils/loadFlinkConfig.ts +89 -0
package/src/utils.ts +52 -0
package/tsconfig.json +6 -1

package/spec/AgentRunner.spec.ts ADDED Viewed

@@ -0,0 +1,1062 @@
+import { z } from "zod";
+import { AgentRunner } from "../src/ai/AgentRunner";
+import { FlinkAgentProps } from "../src/ai/FlinkAgent";
+import { ToolExecutor } from "../src/ai/ToolExecutor";
+import { FlinkContext } from "../src/FlinkContext";
+import { FlinkToolProps } from "../src/ai/FlinkTool";
+import { LLMAdapter } from "../src/ai/LLMAdapter";
+import { createStreamingMock } from "./testHelpers";
+describe("AgentRunner", () => {
+    let mockCtx: FlinkContext;
+    let mockLLMAdapter: LLMAdapter;
+    // Reset the shared context and the default LLM adapter before each spec.
+    beforeEach(() => {
+        // Default adapter script: a single plain-text turn with no tool calls.
+        const defaultTurn = {
+            textContent: "Test response",
+            toolCalls: [],
+            usage: { inputTokens: 10, outputTokens: 20 },
+            stopReason: "end_turn" as const,
+        };
+        mockLLMAdapter = createStreamingMock([defaultTurn]);
+        // Bare context: no repos and no plugins registered.
+        mockCtx = { repos: {}, plugins: {} };
+    });
+    describe("Basic execution", () => {
+        // Smoke test: a tool-less agent streams the adapter's text through to a "complete" event.
+        it("should execute simple agent without tools", async () => {
+            const llmAdapters = new Map();
+            llmAdapters.set("default", mockLLMAdapter);
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are a helpful assistant",
+                tools: [],
+            };
+            const runner = new AgentRunner(props, new Map(), llmAdapters);
+            // Drain the stream, keeping every emitted event for inspection.
+            const events: any[] = [];
+            for await (const event of runner.streamGenerator({ message: "Hello" })) {
+                events.push(event);
+            }
+            // Should have complete event
+            expect(events.length).toBeGreaterThan(0);
+            const done = events.find((e) => e.type === "complete");
+            expect(done).toBeDefined();
+            const { result } = done;
+            expect(result.message).toBe("Test response");
+            expect(result.stepsUsed).toBeGreaterThan(0);
+            expect(result.toolCalls).toEqual([]);
+        });
+        // Verifies that the final result reports non-zero input and output token counts.
+        it("should track token usage", async () => {
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are a helpful assistant",
+                tools: [],
+            };
+            const toolsMap = new Map();
+            const llmAdapters = new Map();
+            llmAdapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters);
+            const generator = runner.streamGenerator({ message: "Hello" });
+            // Collect every event first: asserting inside the loop would let this spec
+            // pass vacuously if the runner never emitted a "complete" event.
+            const chunks: any[] = [];
+            for await (const chunk of generator) {
+                chunks.push(chunk);
+            }
+            const completeChunk = chunks.find((c) => c.type === "complete");
+            expect(completeChunk).toBeDefined();
+            expect(completeChunk.result.usage).toBeDefined();
+            expect(completeChunk.result.usage?.inputTokens).toBeGreaterThan(0);
+            expect(completeChunk.result.usage?.outputTokens).toBeGreaterThan(0);
+        });
+    });
+    describe("Tool calling", () => {
+        // Happy path: the adapter requests `get_weather`, the tool runs, and the follow-up
+        // turn produces the final answer. Expects two steps and one recorded tool call.
+        it("should execute tool calls", async () => {
+            // Create mock tool
+            const toolProps: FlinkToolProps = {
+                id: "get_weather",
+                description: "Get weather",
+                inputSchema: z.object({ city: z.string() }),
+            };
+            const toolFn = jasmine.createSpy("toolFn").and.returnValue(
+                Promise.resolve({
+                    success: true,
+                    data: { temperature: 22, conditions: "sunny" },
+                })
+            );
+            const toolExecutor = new ToolExecutor(toolProps, toolFn as any, mockCtx);
+            const toolsMap = new Map([["get_weather", toolExecutor]]);
+            // Mock LLM adapter response with tool call
+            const weatherMockAdapter = createStreamingMock([
+                // First call: agent requests tool
+                {
+                    textContent: "Let me check the weather",
+                    toolCalls: [
+                        {
+                            id: "tool_1",
+                            name: "get_weather",
+                            input: { city: "Stockholm" },
+                        },
+                    ],
+                    usage: { inputTokens: 10, outputTokens: 20 },
+                    stopReason: "tool_use" as const,
+                },
+                // Second call: agent responds with result
+                {
+                    textContent: "It's sunny and 22°C",
+                    toolCalls: [],
+                    usage: { inputTokens: 15, outputTokens: 10 },
+                    stopReason: "end_turn" as const,
+                },
+            ]);
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "weather_agent",
+                description: "Weather assistant",
+                instructions: "You help with weather",
+                tools: ["get_weather"],
+            };
+            const llmAdapters = new Map();
+            llmAdapters.set("default", weatherMockAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters);
+            const generator = runner.streamGenerator({ message: "What's the weather in Stockholm?" });
+            // Collect every event first: asserting inside the loop would let this spec
+            // pass vacuously if the runner never emitted a "complete" event.
+            const chunks: any[] = [];
+            for await (const chunk of generator) {
+                chunks.push(chunk);
+            }
+            const completeChunk = chunks.find((c) => c.type === "complete");
+            expect(completeChunk).toBeDefined();
+            const result = completeChunk.result;
+            expect(result.message).toBe("It's sunny and 22°C");
+            expect(result.toolCalls.length).toBe(1);
+            expect(result.toolCalls[0].name).toBe("get_weather");
+            expect(result.toolCalls[0].input).toEqual({ city: "Stockholm" });
+            expect(result.toolCalls[0].output).toEqual({
+                temperature: 22,
+                conditions: "sunny",
+            });
+            expect(result.stepsUsed).toBe(2);
+            // Verify tool was called
+            expect(toolFn).toHaveBeenCalledWith({
+                input: { city: "Stockholm" },
+                ctx: mockCtx,
+                user: undefined,
+                permissions: undefined,
+                conversationCtx: undefined,
+            });
+        });
+        // A tool that reports `success: false` must not abort the run: the failure is
+        // recorded on the tool call (error set, output null) and the agent still completes.
+        it("should handle tool errors gracefully", async () => {
+            // Create mock tool that returns error
+            const toolProps: FlinkToolProps = {
+                id: "get_weather",
+                description: "Get weather",
+                inputSchema: z.object({ city: z.string() }),
+            };
+            const toolFn = jasmine.createSpy("toolFn").and.returnValue(
+                Promise.resolve({
+                    success: false,
+                    error: "API unavailable",
+                    code: "SERVICE_ERROR",
+                })
+            );
+            const toolExecutor = new ToolExecutor(toolProps, toolFn as any, mockCtx);
+            const toolsMap = new Map([["get_weather", toolExecutor]]);
+            // Mock LLM adapter response with tool call
+            const errorMockAdapter = createStreamingMock([
+                // First call: agent requests tool
+                {
+                    textContent: undefined,
+                    toolCalls: [
+                        {
+                            id: "tool_1",
+                            name: "get_weather",
+                            input: { city: "Stockholm" },
+                        },
+                    ],
+                    usage: { inputTokens: 10, outputTokens: 20 },
+                    stopReason: "tool_use" as const,
+                },
+                // Second call: agent handles error
+                {
+                    textContent: "Sorry, weather service is unavailable",
+                    toolCalls: [],
+                    usage: { inputTokens: 15, outputTokens: 10 },
+                    stopReason: "end_turn" as const,
+                },
+            ]);
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "weather_agent",
+                description: "Weather assistant",
+                instructions: "You help with weather",
+                tools: ["get_weather"],
+            };
+            const llmAdapters = new Map();
+            llmAdapters.set("default", errorMockAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters);
+            const generator = runner.streamGenerator({ message: "What's the weather?" });
+            // Collect every event first: asserting inside the loop would let this spec
+            // pass vacuously if the runner never emitted a "complete" event.
+            const chunks: any[] = [];
+            for await (const chunk of generator) {
+                chunks.push(chunk);
+            }
+            const completeChunk = chunks.find((c) => c.type === "complete");
+            expect(completeChunk).toBeDefined();
+            const toolCalls = completeChunk.result.toolCalls;
+            expect(toolCalls.length).toBe(1);
+            expect(toolCalls[0].error).toBe("API unavailable");
+            expect(toolCalls[0].output).toBeNull();
+        });
+        // When the adapter asks for a tool that is not registered, the run should still
+        // complete and the recorded tool call should carry a "not found" error.
+        it("should handle missing tools", async () => {
+            const toolsMap = new Map(); // No tools registered
+            // Mock LLM adapter response requesting non-existent tool
+            const missingToolMockAdapter = createStreamingMock([
+                {
+                    textContent: undefined,
+                    toolCalls: [
+                        {
+                            id: "tool_1",
+                            name: "missing_tool",
+                            input: {},
+                        },
+                    ],
+                    usage: { inputTokens: 10, outputTokens: 20 },
+                    stopReason: "tool_use" as const,
+                },
+                {
+                    textContent: "Tool not available",
+                    toolCalls: [],
+                    usage: { inputTokens: 15, outputTokens: 10 },
+                    stopReason: "end_turn" as const,
+                },
+            ]);
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const llmAdapters = new Map();
+            llmAdapters.set("default", missingToolMockAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters);
+            const generator = runner.streamGenerator({ message: "Test" });
+            // Collect every event first: asserting inside the loop would let this spec
+            // pass vacuously if the runner never emitted a "complete" event.
+            const chunks: any[] = [];
+            for await (const chunk of generator) {
+                chunks.push(chunk);
+            }
+            const completeChunk = chunks.find((c) => c.type === "complete");
+            expect(completeChunk).toBeDefined();
+            expect(completeChunk.result.toolCalls.length).toBe(1);
+            expect(completeChunk.result.toolCalls[0].error).toContain("not found");
+        });
+    });
+    describe("Step limits", () => {
+        // With `limits.maxSteps` set to 3 and an adapter that keeps requesting a tool,
+        // the run must stop after exactly 3 steps and flag `stoppedEarly`.
+        it("should respect maxSteps limit", async () => {
+            // Mock infinite tool calling loop
+            // NOTE(review): only one turn is scripted; presumably createStreamingMock keeps
+            // replaying it on later calls - confirm in testHelpers.
+            const infiniteLoopMockAdapter = createStreamingMock([
+                {
+                    textContent: undefined,
+                    toolCalls: [
+                        {
+                            id: "tool_1",
+                            name: "test_tool",
+                            input: {},
+                        },
+                    ],
+                    usage: { inputTokens: 10, outputTokens: 20 },
+                    stopReason: "tool_use" as const,
+                },
+            ]);
+            const toolProps: FlinkToolProps = {
+                id: "test_tool",
+                description: "Test tool",
+                inputSchema: z.object({}),
+            };
+            const toolFn = async () => ({ success: true as const, data: {} });
+            const toolExecutor = new ToolExecutor(toolProps, toolFn, mockCtx);
+            const toolsMap = new Map([["test_tool", toolExecutor]]);
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: ["test_tool"],
+                limits: { maxSteps: 3 },
+            };
+            const llmAdapters = new Map();
+            llmAdapters.set("default", infiniteLoopMockAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters);
+            const generator = runner.streamGenerator({ message: "Test" });
+            // Collect every event first: asserting inside the loop would let this spec
+            // pass vacuously if the runner never emitted a "complete" event.
+            const chunks: any[] = [];
+            for await (const chunk of generator) {
+                chunks.push(chunk);
+            }
+            const completeChunk = chunks.find((c) => c.type === "complete");
+            expect(completeChunk).toBeDefined();
+            expect(completeChunk.result.stepsUsed).toBe(3);
+            expect(completeChunk.result.stoppedEarly).toBe(true);
+        });
+        // A per-call `options.maxSteps` (2) must take precedence over the agent's
+        // configured `limits.maxSteps` (10): the run stops after 2 steps.
+        it("should allow runtime maxSteps override", async () => {
+            // Adapter that requests the tool on its scripted turn.
+            // NOTE(review): only one turn is scripted; presumably createStreamingMock keeps
+            // replaying it on later calls - confirm in testHelpers.
+            const runtimeOverrideMockAdapter = createStreamingMock([
+                {
+                    textContent: undefined,
+                    toolCalls: [
+                        {
+                            id: "tool_1",
+                            name: "test_tool",
+                            input: {},
+                        },
+                    ],
+                    usage: { inputTokens: 10, outputTokens: 20 },
+                    stopReason: "tool_use" as const,
+                },
+            ]);
+            const toolProps: FlinkToolProps = {
+                id: "test_tool",
+                description: "Test tool",
+                inputSchema: z.object({}),
+            };
+            const toolFn = async () => ({ success: true as const, data: {} });
+            const toolExecutor = new ToolExecutor(toolProps, toolFn, mockCtx);
+            const toolsMap = new Map([["test_tool", toolExecutor]]);
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: ["test_tool"],
+                limits: { maxSteps: 10 },
+            };
+            const llmAdapters = new Map();
+            llmAdapters.set("default", runtimeOverrideMockAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters);
+            const generator = runner.streamGenerator({
+                message: "Test",
+                options: { maxSteps: 2 },
+            });
+            // Collect every event first: asserting inside the loop would let this spec
+            // pass vacuously if the runner never emitted a "complete" event.
+            const chunks: any[] = [];
+            for await (const chunk of generator) {
+                chunks.push(chunk);
+            }
+            const completeChunk = chunks.find((c) => c.type === "complete");
+            expect(completeChunk).toBeDefined();
+            expect(completeChunk.result.stepsUsed).toBe(2);
+            expect(completeChunk.result.stoppedEarly).toBe(true);
+        });
+    });
+    describe("Message format conversion", () => {
+        // A plain string input must reach the adapter as a single user message.
+        it("should convert string to message array", async () => {
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const toolsMap = new Map();
+            const llmAdapters = new Map();
+            llmAdapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters);
+            const generator = runner.streamGenerator({ message: "Hello" });
+            // Drain the stream and require a "complete" event unconditionally; an
+            // assertion placed inside the loop would be skipped if none was emitted.
+            const chunks: any[] = [];
+            for await (const chunk of generator) {
+                chunks.push(chunk);
+            }
+            const completeChunk = chunks.find((c) => c.type === "complete");
+            expect(completeChunk).toBeDefined();
+            expect(completeChunk.result).toBeDefined();
+            // Verify LLM adapter was called with user message
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            // Inspect the first argument of the first recorded `stream` call.
+            const callArgs = (mockLLMAdapter.stream as jasmine.Spy).calls.first().args[0];
+            expect(callArgs.messages.length).toBeGreaterThanOrEqual(1);
+            expect(callArgs.messages[0]).toEqual({ role: "user", content: "Hello" });
+        });
+        // Spec: a Message[] input is accepted and leads to an LLM adapter call.
+        // NOTE(review): only the adapter invocation is asserted here; the converted
+        // message payload itself is not inspected by this spec.
+        it("should convert Message[] to Anthropic format", async () => {
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const toolsMap = new Map();
+            const llmAdapters = new Map();
+            llmAdapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters);
+            const generator = runner.streamGenerator({
+                message: [
+                    { role: "user", content: "Hello" },
+                    { role: "user", content: "How are you?" },
+                ],
+            });
+            // Capture the final result and assert after the loop, so a stream that
+            // never yields a "complete" chunk fails the spec instead of passing vacuously.
+            let finalResult: unknown;
+            for await (const chunk of generator) {
+                if (chunk.type === "complete") {
+                    finalResult = chunk.result;
+                }
+            }
+            expect(finalResult).toBeDefined();
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+        });
+    });
+    describe("Model configuration", () => {
+        // Spec: the agent's static instructions are forwarded on the adapter's stream() request.
+        it("should pass configuration to LLM adapter", async () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const stream = new AgentRunner(props, tools, adapters).streamGenerator({ message: "Hello" });
+            // Consume chunks until the first "complete" one, then stop iterating.
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            // The adapter must have been reached through its streaming entry point.
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const latestCall = (mockLLMAdapter.stream as jasmine.Spy).calls.mostRecent();
+            const request = latestCall.args[0];
+            expect(request.instructions).toBe("You are helpful");
+        });
+        // Spec: `model.temperature` and `model.maxTokens` from the agent props show up
+        // on the request handed to the adapter's stream().
+        it("should pass custom temperature and maxTokens", async () => {
+            const modelSettings = {
+                temperature: 0.3,
+                maxTokens: 2000,
+            };
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+                model: modelSettings,
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const stream = new AgentRunner(props, tools, adapters).streamGenerator({ message: "Hello" });
+            // Consume chunks until the first "complete" one, then stop iterating.
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            const latestCall = (mockLLMAdapter.stream as jasmine.Spy).calls.mostRecent();
+            const request = latestCall.args[0];
+            expect(request.temperature).toBe(0.3);
+            expect(request.maxTokens).toBe(2000);
+        });
+    });
+    describe("Error handling", () => {
+        // Spec: constructing a runner against an empty adapter registry throws.
+        it("should throw error when LLM adapter not configured", () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const tools = new Map();
+            // Deliberately left empty: no adapter is registered at all.
+            const adapters = new Map();
+            const construct = () => {
+                new AgentRunner(props, tools, adapters);
+            };
+            expect(construct).toThrowError(/not configured/);
+        });
+        // Spec: asking for adapter "openai" when only "default" is registered throws,
+        // and the error message names the missing adapter.
+        it("should throw error for unregistered adapter", () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+                model: { adapterId: "openai" },
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const construct = () => {
+                new AgentRunner(props, tools, adapters);
+            };
+            expect(construct).toThrowError(/LLM adapter "openai" not configured/);
+        });
+    });
+    describe("Message Conversion with Conversation History", () => {
+        // Spec: a text-only assistant turn supplied via `history` reaches the adapter
+        // unchanged, followed by the new user message.
+        it("should preserve assistant messages without tool calls", async () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters);
+            const priorTurns = [
+                { role: "user" as const, content: "Who are you?" },
+                { role: "assistant" as const, content: "I'm a weather assistant." },
+            ];
+            const stream = runner.streamGenerator({ message: "What's the weather?", history: priorTurns });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            // The adapter must have received the history.
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const firstCall = (mockLLMAdapter.stream as jasmine.Spy).calls.first();
+            const sent = firstCall.args[0].messages;
+            // The array keeps growing after the LLM call (an assistant message is appended),
+            // so only the leading three entries (history + new user message) are checked.
+            expect(sent.length).toBeGreaterThanOrEqual(3);
+            const openingUser = sent[0];
+            const assistantTurn = sent[1];
+            const newUser = sent[2];
+            expect(openingUser).toEqual({ role: "user", content: "Who are you?" });
+            expect(assistantTurn).toEqual({ role: "assistant", content: "I'm a weather assistant." });
+            expect(newUser).toEqual({ role: "user", content: "What's the weather?" });
+            // The assistant turn from history must still be present, not filtered out.
+            expect(assistantTurn.role).toBe("assistant");
+            expect(assistantTurn.content).toBe("I'm a weather assistant.");
+        });
+        // Spec: an assistant turn carrying toolCalls (plus its tool result) survives
+        // conversion, with the tool call exposed as a `tool_use` content block.
+        it("should preserve assistant messages with tool calls", async () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters);
+            const weatherCall = { id: "1", name: "get-weather", input: { city: "Stockholm" } };
+            const priorTurns = [
+                { role: "user" as const, content: "What's the weather in Stockholm?" },
+                { role: "assistant" as const, content: "", toolCalls: [weatherCall] },
+                { role: "tool" as const, toolCallId: "1", toolName: "get-weather", result: "22°C, Sunny" },
+            ];
+            const stream = runner.streamGenerator({ message: "And tomorrow?", history: priorTurns });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const firstCall = (mockLLMAdapter.stream as jasmine.Spy).calls.first();
+            const sent = firstCall.args[0].messages;
+            // The array is mutated after the LLM call, so only the first four entries
+            // are inspected: three from history plus the new user message.
+            expect(sent.length).toBeGreaterThanOrEqual(4);
+            // Leading roles in order: user, assistant, user (tool result), user (new message).
+            ["user", "assistant", "user", "user"].forEach((role, position) => {
+                expect(sent[position].role).toBe(role);
+            });
+            // The assistant turn carries exactly one tool_use block taken from history.
+            const assistantContent = sent[1].content;
+            expect(Array.isArray(assistantContent)).toBe(true);
+            const blocks = assistantContent as any[];
+            expect(blocks.length).toBe(1);
+            const toolUse = blocks[0];
+            expect(toolUse.type).toBe("tool_use");
+            expect(toolUse.name).toBe("get-weather");
+            expect(toolUse.input).toEqual({ city: "Stockholm" });
+        });
+        // Spec: with a well-formed alternating history, the messages sent to the adapter
+        // never contain two consecutive entries with the same role.
+        it("should maintain alternating user/assistant pattern", async () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters);
+            const priorTurns = [
+                { role: "user" as const, content: "Hello" },
+                { role: "assistant" as const, content: "Hi there!" },
+                { role: "user" as const, content: "How are you?" },
+                { role: "assistant" as const, content: "I'm doing well!" },
+            ];
+            const stream = runner.streamGenerator({ message: "What's your name?", history: priorTurns });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const firstCall = (mockLLMAdapter.stream as jasmine.Spy).calls.first();
+            const sent = firstCall.args[0].messages;
+            // The array is mutated after the LLM call, so only the five input messages
+            // (four from history plus the new user message) are considered.
+            expect(sent.length).toBeGreaterThanOrEqual(5);
+            // Compare each of the first five entries with its predecessor.
+            const inspected = Math.min(5, sent.length);
+            for (let idx = 1; idx < inspected; idx += 1) {
+                const previous = sent[idx - 1];
+                const current = sent[idx];
+                expect(current.role).not.toBe(previous.role);
+            }
+        });
+        // Spec: an assistant message with both text and toolCalls is converted into a
+        // `text` block followed by a `tool_use` block.
+        it("should handle assistant messages with both text and tool calls", async () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters);
+            const weatherCall = { id: "1", name: "get-weather", input: { city: "Stockholm" } };
+            const conversation = [
+                { role: "user" as const, content: "Check the weather" },
+                { role: "assistant" as const, content: "Let me check that for you", toolCalls: [weatherCall] },
+            ];
+            // The whole conversation is passed as `message` (no separate history).
+            const stream = runner.streamGenerator({ message: conversation });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const firstCall = (mockLLMAdapter.stream as jasmine.Spy).calls.first();
+            const sent = firstCall.args[0].messages;
+            // Expect two blocks on the assistant turn: text first, then tool_use.
+            const assistantContent = sent[1].content;
+            expect(Array.isArray(assistantContent)).toBe(true);
+            const blocks = assistantContent as any[];
+            expect(blocks.length).toBe(2);
+            const textBlock = blocks[0];
+            expect(textBlock.type).toBe("text");
+            expect(textBlock.text).toBe("Let me check that for you");
+            const toolUse = blocks[1];
+            expect(toolUse.type).toBe("tool_use");
+            expect(toolUse.name).toBe("get-weather");
+        });
+        // Spec: a `tool` role message is sent to the adapter as a user message holding a
+        // single `tool_result` block that references the originating tool call id.
+        it("should convert tool messages to user messages with results", async () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters);
+            const weatherCall = { id: "1", name: "get-weather", input: { city: "Stockholm" } };
+            const conversation = [
+                { role: "user" as const, content: "Check weather" },
+                { role: "assistant" as const, content: "", toolCalls: [weatherCall] },
+                { role: "tool" as const, toolCallId: "1", toolName: "get-weather", result: "22°C" },
+            ];
+            // The whole conversation is passed as `message` (no separate history).
+            const stream = runner.streamGenerator({ message: conversation });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const firstCall = (mockLLMAdapter.stream as jasmine.Spy).calls.first();
+            const sent = firstCall.args[0].messages;
+            // The third entry is the converted tool message.
+            const convertedTool = sent[2];
+            expect(convertedTool.role).toBe("user");
+            expect(Array.isArray(convertedTool.content)).toBe(true);
+            const blocks = convertedTool.content as any[];
+            expect(blocks.length).toBe(1);
+            const toolResult = blocks[0];
+            expect(toolResult.type).toBe("tool_result");
+            expect(toolResult.tool_use_id).toBe("1");
+            expect(toolResult.content).toBe("22°C");
+        });
+        // Spec: an assistant message whose text is "" but which has toolCalls yields only
+        // a `tool_use` block (no text block is produced for the empty content).
+        it("should handle empty content with tool calls", async () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "You are helpful",
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters);
+            const conversation = [
+                { role: "user" as const, content: "Check weather" },
+                {
+                    role: "assistant" as const,
+                    // Intentionally empty text alongside the tool call.
+                    content: "",
+                    toolCalls: [{ id: "1", name: "get-weather", input: {} }],
+                },
+            ];
+            const stream = runner.streamGenerator({ message: conversation });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const firstCall = (mockLLMAdapter.stream as jasmine.Spy).calls.first();
+            const sent = firstCall.args[0].messages;
+            const assistantContent = sent[1].content;
+            expect(Array.isArray(assistantContent)).toBe(true);
+            const blocks = assistantContent as any[];
+            expect(blocks.length).toBe(1);
+            expect(blocks[0].type).toBe("tool_use");
+        });
+    });
+    describe("Dynamic Instructions", () => {
+        // Spec: plain string instructions are still passed through verbatim to the adapter.
+        it("should use static string instructions (backwards compatibility)", async () => {
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: "Static instructions",
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters, "test_agent", mockCtx);
+            const stream = runner.streamGenerator({ message: "Hello" });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            // The first adapter call must carry the static instructions unchanged.
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const firstCall = (mockLLMAdapter.stream as jasmine.Spy).calls.first();
+            const request = firstCall.args[0];
+            expect(request.instructions).toBe("Static instructions");
+        });
+        // Spec: a synchronous instructions callback is invoked once with (ctx, agentContext)
+        // and its return value is what the adapter receives as instructions.
+        it("should resolve synchronous callback instructions", async () => {
+            const instructionsSpy = jasmine.createSpy("instructionsCallback").and.returnValue("Dynamic: test-user");
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: instructionsSpy,
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters, "test_agent", mockCtx);
+            const caller = { id: "123", name: "test-user" };
+            const stream = runner.streamGenerator({ message: "Hello", user: caller });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            // The callback ran exactly once and saw the app context plus the caller.
+            expect(instructionsSpy).toHaveBeenCalledTimes(1);
+            const callbackArgs = instructionsSpy.calls.first().args;
+            const receivedCtx = callbackArgs[0];
+            const receivedAgentContext = callbackArgs[1];
+            expect(receivedCtx).toBe(mockCtx);
+            expect(receivedAgentContext.user).toEqual({ id: "123", name: "test-user" });
+            // The adapter received the string the callback produced.
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const request = (mockLLMAdapter.stream as jasmine.Spy).calls.first().args[0];
+            expect(request.instructions).toBe("Dynamic: test-user");
+        });
+        // Spec: an async instructions callback may await repo lookups on the supplied ctx;
+        // the resolved string is what the adapter receives.
+        it("should resolve async callback instructions", async () => {
+            const storedUser = { id: "123", name: "test-user", tier: "premium" };
+            const getByIdSpy = jasmine.createSpy("getById").and.returnValue(Promise.resolve(storedUser));
+            // Minimal stand-in context exposing only the repo used by the callback.
+            const repoCtx = {
+                repos: {
+                    userRepo: {
+                        getById: getByIdSpy,
+                    },
+                },
+                plugins: {},
+            };
+            const buildInstructions = async (ctx: any, agentContext: any) => {
+                const userId = agentContext.user.id;
+                const { name, tier } = await ctx.repos.userRepo.getById(userId);
+                return `You are a support agent. Customer: ${name}, Tier: ${tier}`;
+            };
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: buildInstructions,
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters, "test_agent", repoCtx);
+            const stream = runner.streamGenerator({ message: "Hello", user: { id: "123" } });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            // The repo lookup used the id of the calling user.
+            expect(repoCtx.repos.userRepo.getById).toHaveBeenCalledWith("123");
+            // The adapter received the fully resolved instructions.
+            expect(mockLLMAdapter.stream).toHaveBeenCalled();
+            const request = (mockLLMAdapter.stream as jasmine.Spy).calls.first().args[0];
+            expect(request.instructions).toBe("You are a support agent. Customer: test-user, Tier: premium");
+        });
+        // Spec: the instructions callback receives the app ctx plus an execution context
+        // carrying agentId, conversationId, user and metadata from the request.
+        it("should pass correct context to callback", async () => {
+            const instructionsSpy = jasmine.createSpy("instructionsCallback").and.returnValue("Instructions");
+            const props: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: instructionsSpy,
+                tools: [],
+            };
+            const tools = new Map();
+            const adapters = new Map();
+            adapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(props, tools, adapters, "test_agent", mockCtx);
+            const stream = runner.streamGenerator({
+                message: "Hello",
+                user: { id: "123" },
+                conversationId: "conv-456",
+                metadata: { source: "handler" },
+            });
+            for await (const part of stream) {
+                if (part.type !== "complete") {
+                    continue;
+                }
+                break;
+            }
+            expect(instructionsSpy).toHaveBeenCalledTimes(1);
+            const callbackArgs = instructionsSpy.calls.first().args;
+            // First argument: the application context handed to the runner.
+            expect(callbackArgs[0]).toBe(mockCtx);
+            // Second argument: the per-execution context assembled from the request.
+            const executionInfo = callbackArgs[1];
+            expect(executionInfo.agentId).toBe("test_agent");
+            expect(executionInfo.conversationId).toBe("conv-456");
+            expect(executionInfo.user).toEqual({ id: "123" });
+            expect(executionInfo.metadata).toEqual({ source: "handler" });
+        });
+        // Spec: when the instructions callback throws, iterating the stream rejects with an
+        // error that names the agent and includes the underlying failure message.
+        it("should handle callback errors gracefully", async () => {
+            const instructionsCallback = () => {
+                throw new Error("Database connection failed");
+            };
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: instructionsCallback,
+                tools: [],
+            };
+            const toolsMap = new Map();
+            const llmAdapters = new Map();
+            llmAdapters.set("default", mockLLMAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters, "test_agent", mockCtx);
+            const generator = runner.streamGenerator({ message: "Hello" });
+            // Only capture the error inside try/catch; all assertions run afterwards.
+            // Calling fail() inside the try would be swallowed by the catch whenever Jasmine
+            // is configured to throw on failure, and then surface as a misleading
+            // "message does not contain ..." mismatch.
+            let threw = false;
+            let caught: unknown;
+            try {
+                for await (const _chunk of generator) {
+                    // No chunk is expected before the failure; just keep draining.
+                }
+            } catch (err: unknown) {
+                threw = true;
+                caught = err;
+            }
+            if (!threw) {
+                fail("Expected error to be thrown");
+                return;
+            }
+            const message = caught instanceof Error ? caught.message : String(caught);
+            expect(message).toContain("Failed to resolve instructions for agent test_agent");
+            expect(message).toContain("Database connection failed");
+        });
+        // Spec: the instructions callback is evaluated once per run, even when the run
+        // takes several LLM steps.
+        it("should resolve instructions once per execution", async () => {
+            let callCount = 0;
+            const instructionsCallback = () => {
+                callCount++;
+                return "Instructions";
+            };
+            // Mock adapter that calls LLM 3 times (3 steps with tool calls):
+            // two tool-call responses followed by a final text response.
+            // createStreamingMock is defined elsewhere in this file; presumably it replays
+            // these responses in order. TODO confirm against the helper.
+            const multiStepMockAdapter = createStreamingMock([
+                {
+                    textContent: undefined,
+                    toolCalls: [{ id: "tool_1", name: "test_tool", input: {} }],
+                    usage: { inputTokens: 10, outputTokens: 20 },
+                    stopReason: "tool_use" as const,
+                },
+                {
+                    textContent: undefined,
+                    toolCalls: [{ id: "tool_2", name: "test_tool", input: {} }],
+                    usage: { inputTokens: 10, outputTokens: 20 },
+                    stopReason: "tool_use" as const,
+                },
+                {
+                    textContent: "Final response",
+                    toolCalls: [],
+                    usage: { inputTokens: 10, outputTokens: 20 },
+                    stopReason: "end_turn" as const,
+                },
+            ]);
+            const toolProps: FlinkToolProps = {
+                id: "test_tool",
+                description: "Test tool",
+                inputSchema: z.object({}),
+            };
+            // Trivial tool implementation that always succeeds with an empty payload.
+            const toolFn = async () => ({ success: true as const, data: {} });
+            const toolExecutor = new ToolExecutor(toolProps, toolFn, mockCtx);
+            const toolsMap = new Map([["test_tool", toolExecutor]]);
+            const agentProps: FlinkAgentProps<typeof mockCtx> = {
+                id: "test_agent",
+                description: "Test agent",
+                instructions: instructionsCallback,
+                tools: ["test_tool"],
+            };
+            const llmAdapters = new Map();
+            llmAdapters.set("default", multiStepMockAdapter);
+            const runner = new AgentRunner(agentProps, toolsMap, llmAdapters, "test_agent", mockCtx);
+            const generator = runner.streamGenerator({ message: "Hello" });
+            // Record stepsUsed from the "complete" chunk and assert after the loop, so a run
+            // that never completes fails the spec instead of skipping the step-count check.
+            let stepsUsed: number | undefined;
+            for await (const chunk of generator) {
+                if (chunk.type === "complete") {
+                    stepsUsed = chunk.result.stepsUsed;
+                }
+            }
+            expect(stepsUsed).toBe(3);
+            // Callback should be called ONCE, not 3 times
+            expect(callCount).toBe(1);
+        });
+    });
+});