npm - @flink-app/flink - Versions diffs - 2.0.0-alpha.91 → 2.0.0-alpha.93 - Mend

@flink-app/flink 2.0.0-alpha.91 → 2.0.0-alpha.93

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/CHANGELOG.md +47 -0
package/dist/src/FlinkApp.d.ts +17 -0
package/dist/src/FlinkApp.js +4 -2
package/dist/src/ai/AgentRunner.d.ts +9 -2
package/dist/src/ai/AgentRunner.js +507 -363
package/dist/src/ai/FlinkAgent.d.ts +100 -1
package/dist/src/ai/FlinkAgent.js +16 -3
package/package.json +1 -1
package/spec/AgentObserver.spec.ts +266 -0
package/src/FlinkApp.ts +22 -1
package/src/ai/AgentRunner.ts +141 -15
package/src/ai/FlinkAgent.ts +112 -2

package/dist/src/ai/AgentRunner.js CHANGED

@@ -77,16 +77,20 @@ var __spreadArray = (this && this.__spreadArray) || function (to, from, pack) {
 };
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.AgentRunner = void 0;
+var uuid_1 = require("uuid");
+var FlinkLogFactory_1 = require("../FlinkLogFactory");
 var FlinkLog_1 = require("../FlinkLog");
+var observerLog = FlinkLogFactory_1.FlinkLogFactory.createLogger("flink.ai.observer");
 var AgentRunner = /** @class */ (function () {
     function AgentRunner(agentProps, tools, llmAdapters, agentName, // Optional agent name for logging
-    ctx // FlinkContext for instruction callbacks (any for flexibility)
-    ) {
+    ctx, // FlinkContext for instruction callbacks (any for flexibility)
+    observer) {
         var _a, _b, _c, _d, _e;
         this.agentProps = agentProps;
         this.tools = tools;
         this.agentName = agentName;
         this.ctx = ctx;
+        this.observer = observer;
         // Get appropriate LLM adapter based on adapterId
         var adapterId = ((_a = agentProps.model) === null || _a === void 0 ? void 0 : _a.adapterId) || "default";
         var adapter = llmAdapters.get(adapterId);
@@ -101,37 +105,47 @@ var AgentRunner = /** @class */ (function () {
     }
     AgentRunner.prototype.streamGenerator = function (input) {
         return __asyncGenerator(this, arguments, function streamGenerator_1() {
-            var maxSteps, toolCalls, execContext, resolvedInstructions, _a, err_1, messages, step, finalMessage, stoppedEarly, totalInputTokens, totalOutputTokens, totalCachedInputTokens, totalCacheCreationInputTokens, finalProviderMetadata, availableTools, needsCompaction, beforeCount, originalMessages, compactedMessages, error_1, llmStream, textContent, toolCallsFromStream, usage, stopReason, providerMetadata, _b, llmStream_1, llmStream_1_1, chunk, _c, e_1_1, llmResponse, assistantContent, _i, _d, toolCall, stepContext, toolResults, _e, _f, toolCall, toolExecutor, toolOutput, toolError, toolResult, formattedResult, err_2, stepContext, result, finishContext;
-            var _g, e_1, _h, _j;
-            var _k, _l, _m;
-            return __generator(this, function (_o) {
-                switch (_o.label) {
+            var maxSteps, toolCalls, runId, runStartedAt, agentId, modelInfo, declaredToolNames, execContext, resolvedInstructions, _a, err_1, messages, step, finalMessage, stoppedEarly, totalInputTokens, totalOutputTokens, totalCachedInputTokens, totalCacheCreationInputTokens, finalProviderMetadata, buildResult, _loop_1, this_1, state_1, result_1, finishContext, err_2;
+            var _this = this;
+            var _b, e_1, _c, _d;
+            var _e, _f, _g, _h;
+            return __generator(this, function (_j) {
+                switch (_j.label) {
                     case 0:
-                        maxSteps = ((_k = input.options) === null || _k === void 0 ? void 0 : _k.maxSteps) || this.maxSteps;
+                        maxSteps = ((_e = input.options) === null || _e === void 0 ? void 0 : _e.maxSteps) || this.maxSteps;
                         toolCalls = [];
+                        runId = (0, uuid_1.v4)();
+                        runStartedAt = Date.now();
+                        agentId = this.agentName || "unknown";
+                        modelInfo = {
+                            adapterId: (_f = this.agentProps.model) === null || _f === void 0 ? void 0 : _f.adapterId,
+                            maxTokens: this.maxTokens,
+                            temperature: this.temperature,
+                        };
+                        declaredToolNames = Array.from(this.tools.keys());
                         execContext = {
-                            agentId: this.agentName || "unknown",
+                            agentId: agentId,
                             conversationId: input.conversationId,
                             user: input.user,
                             metadata: input.metadata,
                             conversationContext: input.conversationContext,
                         };
-                        _o.label = 1;
+                        _j.label = 1;
                     case 1:
-                        _o.trys.push([1, 5, , 6]);
+                        _j.trys.push([1, 5, , 6]);
                         if (!(typeof this.agentProps.instructions === "function")) return [3 /*break*/, 3];
                         return [4 /*yield*/, __await(this.agentProps.instructions(this.ctx, execContext))];
                     case 2:
-                        _a = _o.sent();
+                        _a = _j.sent();
                         return [3 /*break*/, 4];
                     case 3:
                         _a = this.agentProps.instructions;
-                        _o.label = 4;
+                        _j.label = 4;
                     case 4:
                         resolvedInstructions = _a;
                         return [3 /*break*/, 6];
                     case 5:
-                        err_1 = _o.sent();
+                        err_1 = _j.sent();
                         throw new Error("Failed to resolve instructions for agent ".concat(this.agentName, ": ").concat(err_1.message));
                     case 6:
                         if (input.history && input.history.length > 0) {
@@ -152,6 +166,20 @@ var AgentRunner = /** @class */ (function () {
                         else {
                             messages.push.apply(messages, this.convertMessages(input.message));
                         }
+                        // Dispatch observer onRun (pre-loop, before compaction / tool filtering)
+                        this.safeDispatch("onRun", function () {
+                            var _a, _b;
+                            return (_b = (_a = _this.observer) === null || _a === void 0 ? void 0 : _a.onRun) === null || _b === void 0 ? void 0 : _b.call(_a, {
+                                runId: runId,
+                                agentId: agentId,
+                                instructions: resolvedInstructions,
+                                input: input,
+                                messages: __spreadArray([], messages, true),
+                                tools: declaredToolNames,
+                                model: modelInfo,
+                                context: execContext,
+                            });
+                        });
                         step = 0;
                         finalMessage = "";
                         stoppedEarly = false;
@@ -160,371 +188,487 @@ var AgentRunner = /** @class */ (function () {
                         totalCachedInputTokens = 0;
                         totalCacheCreationInputTokens = 0;
                         finalProviderMetadata = {};
-                        _o.label = 7;
+                        buildResult = function () { return ({
+                            runId: runId,
+                            message: finalMessage,
+                            toolCalls: toolCalls,
+                            stepsUsed: step,
+                            stoppedEarly: stoppedEarly,
+                            usage: __assign(__assign({ inputTokens: totalInputTokens, outputTokens: totalOutputTokens }, (totalCachedInputTokens > 0 && { cachedInputTokens: totalCachedInputTokens })), (totalCacheCreationInputTokens > 0 && { cacheCreationInputTokens: totalCacheCreationInputTokens })),
+                            providerMetadata: Object.keys(finalProviderMetadata).length > 0 ? finalProviderMetadata : undefined,
+                        }); };
+                        _j.label = 7;
                     case 7:
-                        if (!(step < maxSteps)) return [3 /*break*/, 53];
-                        step++;
-                        return [4 /*yield*/, __await(this.filterToolsByPermissions(input.user, input.userPermissions, input.conversationContext))];
+                        _j.trys.push([7, 16, , 17]);
+                        _loop_1 = function () {
+                            var availableTools, needsCompaction, beforeCount, originalMessages, compactedMessages, error_1, toolCallsBeforeStep, llmStream, textContent, toolCallsFromStream, usage, stopReason, providerMetadata, _k, llmStream_1, llmStream_1_1, chunk, _l, e_1_1, llmResponse, assistantContent, _i, _m, toolCall, stepContext, toolResults, _o, _p, toolCall, toolExecutor, toolOutput, toolError, toolResult, formattedResult, err_3, stepContext;
+                            return __generator(this, function (_q) {
+                                switch (_q.label) {
+                                    case 0:
+                                        step++;
+                                        return [4 /*yield*/, __await(this_1.filterToolsByPermissions(input.user, input.userPermissions, input.conversationContext))];
+                                    case 1:
+                                        availableTools = _q.sent();
+                                        if (!this_1.agentProps.shouldCompact) return [3 /*break*/, 9];
+                                        _q.label = 2;
+                                    case 2:
+                                        _q.trys.push([2, 8, , 9]);
+                                        return [4 /*yield*/, __await(this_1.agentProps.shouldCompact(messages, step))];
+                                    case 3:
+                                        needsCompaction = _q.sent();
+                                        if (!needsCompaction) return [3 /*break*/, 7];
+                                        beforeCount = messages.length;
+                                        originalMessages = messages;
+                                        compactedMessages = void 0;
+                                        if (!this_1.agentProps.compactHistory) return [3 /*break*/, 5];
+                                        return [4 /*yield*/, __await(this_1.agentProps.compactHistory(messages, step))];
+                                    case 4:
+                                        compactedMessages = _q.sent();
+                                        return [3 /*break*/, 6];
+                                    case 5:
+                                        // Default strategy: sliding window keeping last 10 messages
+                                        compactedMessages = messages.slice(-10);
+                                        _q.label = 6;
+                                    case 6:
+                                        // Validation: ensure compacted array is not empty
+                                        if (!compactedMessages || compactedMessages.length === 0) {
+                                            throw new Error("compactHistory must return at least one message");
+                                        }
+                                        // Apply compaction
+                                        messages = compactedMessages;
+                                        // Log compaction for debugging
+                                        FlinkLog_1.log.debug("[Agent:".concat(this_1.agentName, "] Step ").concat(step, ": Compacted ").concat(beforeCount, " messages \u2192 ").concat(messages.length));
+                                        FlinkLog_1.log.debug("[Agent:".concat(this_1.agentName, "] Compacted messages:"), {
+                                            messageCount: messages.length,
+                                            messages: messages.map(function (m) { return ({
+                                                role: m.role,
+                                                contentPreview: typeof m.content === "string"
+                                                    ? m.content.substring(0, 100) + (m.content.length > 100 ? "..." : "")
+                                                    : "".concat(m.content.length, " blocks"),
+                                            }); }),
+                                        });
+                                        _q.label = 7;
+                                    case 7: return [3 /*break*/, 9];
+                                    case 8:
+                                        error_1 = _q.sent();
+                                        // Log error but don't fail execution - compaction is optional optimization
+                                        FlinkLog_1.log.error("[Agent:".concat(this_1.agentName, "] Context compaction failed:"), error_1.message);
+                                        return [3 /*break*/, 9];
+                                    case 9:
+                                        FlinkLog_1.log.debug("[Agent:".concat(this_1.agentName, "] Step ").concat(step, "/").concat(maxSteps, " - Calling LLM with:"), {
+                                            instructionsType: typeof this_1.agentProps.instructions === "function" ? "dynamic-callback" : "static",
+                                            messageCount: messages.length,
+                                            messages: messages.map(function (m) { return ({
+                                                role: m.role,
+                                                contentPreview: typeof m.content === "string"
+                                                    ? m.content.substring(0, 100) + (m.content.length > 100 ? "..." : "")
+                                                    : "".concat(m.content.length, " blocks"),
+                                            }); }),
+                                            toolCount: availableTools.length,
+                                            tools: availableTools.map(function (t) { return t.name; }),
+                                            maxTokens: this_1.maxTokens,
+                                            temperature: this_1.temperature,
+                                        });
+                                        // Dispatch observer onLlmCall — messages reflect post-compaction state;
+                                        // tools reflect per-step permission filtering
+                                        this_1.safeDispatch("onLlmCall", function () {
+                                            var _a, _b;
+                                            return (_b = (_a = _this.observer) === null || _a === void 0 ? void 0 : _a.onLlmCall) === null || _b === void 0 ? void 0 : _b.call(_a, {
+                                                runId: runId,
+                                                agentId: agentId,
+                                                step: step,
+                                                maxSteps: maxSteps,
+                                                instructions: resolvedInstructions,
+                                                messages: __spreadArray([], messages, true),
+                                                tools: availableTools.map(function (t) { return t.name; }),
+                                                model: modelInfo,
+                                                context: execContext,
+                                            });
+                                        });
+                                        toolCallsBeforeStep = toolCalls.length;
+                                        llmStream = this_1.llmAdapter.stream({
+                                            instructions: resolvedInstructions,
+                                            messages: messages,
+                                            tools: availableTools,
+                                            maxTokens: this_1.maxTokens,
+                                            temperature: this_1.temperature,
+                                            providerMetadata: input.providerMetadata,
+                                        });
+                                        textContent = "";
+                                        toolCallsFromStream = [];
+                                        usage = { inputTokens: 0, outputTokens: 0 };
+                                        stopReason = "end_turn";
+                                        providerMetadata = {};
+                                        _q.label = 10;
+                                    case 10:
+                                        _q.trys.push([10, 22, 23, 28]);
+                                        _k = true, llmStream_1 = (e_1 = void 0, __asyncValues(llmStream));
+                                        _q.label = 11;
+                                    case 11: return [4 /*yield*/, __await(llmStream_1.next())];
+                                    case 12:
+                                        if (!(llmStream_1_1 = _q.sent(), _b = llmStream_1_1.done, !_b)) return [3 /*break*/, 21];
+                                        _d = llmStream_1_1.value;
+                                        _k = false;
+                                        chunk = _d;
+                                        _l = chunk.type;
+                                        switch (_l) {
+                                            case "text": return [3 /*break*/, 13];
+                                            case "tool_call": return [3 /*break*/, 16];
+                                            case "usage": return [3 /*break*/, 17];
+                                            case "metadata": return [3 /*break*/, 18];
+                                            case "done": return [3 /*break*/, 19];
+                                        }
+                                        return [3 /*break*/, 20];
+                                    case 13:
+                                        textContent += chunk.delta;
+                                        return [4 /*yield*/, __await({ type: "text_delta", delta: chunk.delta })];
+                                    case 14:
+                                    // Yield text_delta event in real-time
+                                    return [4 /*yield*/, _q.sent()];
+                                    case 15:
+                                        // Yield text_delta event in real-time
+                                        _q.sent();
+                                        return [3 /*break*/, 20];
+                                    case 16:
+                                        toolCallsFromStream.push(chunk.toolCall);
+                                        return [3 /*break*/, 20];
+                                    case 17:
+                                        usage = chunk.usage;
+                                        totalInputTokens += chunk.usage.inputTokens;
+                                        totalOutputTokens += chunk.usage.outputTokens;
+                                        totalCachedInputTokens += chunk.usage.cachedInputTokens || 0;
+                                        totalCacheCreationInputTokens += chunk.usage.cacheCreationInputTokens || 0;
+                                        return [3 /*break*/, 20];
+                                    case 18:
+                                        // Merge provider metadata (e.g., responseId for continuation)
+                                        providerMetadata = __assign(__assign({}, providerMetadata), chunk.metadata);
+                                        finalProviderMetadata = __assign(__assign({}, finalProviderMetadata), chunk.metadata);
+                                        return [3 /*break*/, 20];
+                                    case 19:
+                                        stopReason = chunk.stopReason;
+                                        return [3 /*break*/, 20];
+                                    case 20:
+                                        _k = true;
+                                        return [3 /*break*/, 11];
+                                    case 21: return [3 /*break*/, 28];
+                                    case 22:
+                                        e_1_1 = _q.sent();
+                                        e_1 = { error: e_1_1 };
+                                        return [3 /*break*/, 28];
+                                    case 23:
+                                        _q.trys.push([23, , 26, 27]);
+                                        if (!(!_k && !_b && (_c = llmStream_1.return))) return [3 /*break*/, 25];
+                                        return [4 /*yield*/, __await(_c.call(llmStream_1))];
+                                    case 24:
+                                        _q.sent();
+                                        _q.label = 25;
+                                    case 25: return [3 /*break*/, 27];
+                                    case 26:
+                                        if (e_1) throw e_1.error;
+                                        return [7 /*endfinally*/];
+                                    case 27: return [7 /*endfinally*/];
+                                    case 28:
+                                        llmResponse = {
+                                            textContent: textContent || undefined,
+                                            toolCalls: toolCallsFromStream,
+                                            usage: usage,
+                                            stopReason: stopReason,
+                                        };
+                                        FlinkLog_1.log.debug("[Agent:".concat(this_1.agentName, "] Step ").concat(step, " - LLM Response:"), {
+                                            textLength: ((_g = llmResponse.textContent) === null || _g === void 0 ? void 0 : _g.length) || 0,
+                                            textPreview: ((_h = llmResponse.textContent) === null || _h === void 0 ? void 0 : _h.substring(0, 200)) + (llmResponse.textContent && llmResponse.textContent.length > 200 ? "..." : ""),
+                                            toolCallsCount: llmResponse.toolCalls.length,
+                                            toolCalls: llmResponse.toolCalls.map(function (tc) { return ({
+                                                name: tc.name,
+                                                inputKeys: Object.keys(tc.input),
+                                                input: tc.input,
+                                            }); }),
+                                            stopReason: llmResponse.stopReason,
+                                            usage: llmResponse.usage,
+                                        });
+                                        // Extract text response
+                                        if (llmResponse.textContent) {
+                                            finalMessage = llmResponse.textContent;
+                                        }
+                                        assistantContent = [];
+                                        if (llmResponse.textContent) {
+                                            assistantContent.push({
+                                                type: "text",
+                                                text: llmResponse.textContent,
+                                            });
+                                        }
+                                        for (_i = 0, _m = llmResponse.toolCalls; _i < _m.length; _i++) {
+                                            toolCall = _m[_i];
+                                            assistantContent.push({
+                                                type: "tool_use",
+                                                id: toolCall.id,
+                                                name: toolCall.name,
+                                                input: toolCall.input,
+                                            });
+                                        }
+                                        messages.push({
+                                            role: "assistant",
+                                            content: assistantContent,
+                                        });
+                                        if (!(llmResponse.toolCalls.length === 0)) return [3 /*break*/, 31];
+                                        if (!this_1.agentProps.onStep) return [3 /*break*/, 30];
+                                        stepContext = __assign(__assign({}, execContext), { step: step, maxSteps: maxSteps, messages: __spreadArray([], messages, true) });
+                                        return [4 /*yield*/, __await(this_1.agentProps.onStep(stepContext))];
+                                    case 29:
+                                        _q.sent();
+                                        _q.label = 30;
+                                    case 30:
+                                        // Dispatch observer onStep (no tool calls executed this step)
+                                        this_1.safeDispatch("onStep", function () {
+                                            var _a, _b;
+                                            return (_b = (_a = _this.observer) === null || _a === void 0 ? void 0 : _a.onStep) === null || _b === void 0 ? void 0 : _b.call(_a, {
+                                                runId: runId,
+                                                agentId: agentId,
+                                                step: step,
+                                                maxSteps: maxSteps,
+                                                messages: __spreadArray([], messages, true),
+                                                assistantText: llmResponse.textContent,
+                                                toolCalls: toolCalls.slice(toolCallsBeforeStep),
+                                                usage: usage,
+                                                context: execContext,
+                                            });
+                                        });
+                                        return [2 /*return*/, "break"];
+                                    case 31:
+                                        toolResults = [];
+                                        _o = 0, _p = llmResponse.toolCalls;
+                                        _q.label = 32;
+                                    case 32:
+                                        if (!(_o < _p.length)) return [3 /*break*/, 43];
+                                        toolCall = _p[_o];
+                                        toolExecutor = this_1.tools.get(toolCall.name);
+                                        toolOutput = void 0;
+                                        toolError = void 0;
+                                        FlinkLog_1.log.debug("[Agent:".concat(this_1.agentName, "] Executing tool '").concat(toolCall.name, "':"), {
+                                            input: toolCall.input,
+                                            inputSize: JSON.stringify(toolCall.input).length,
+                                        });
+                                        _q.label = 33;
+                                    case 33:
+                                        _q.trys.push([33, 39, , 42]);
+                                        if (!toolExecutor) {
+                                            throw new Error("Tool ".concat(toolCall.name, " not found"));
+                                        }
+                                        return [4 /*yield*/, __await({
+                                                type: "tool_call_start",
+                                                toolCall: {
+                                                    id: toolCall.id,
+                                                    name: toolCall.name,
+                                                    input: toolCall.input,
+                                                },
+                                            })];
+                                    case 34:
+                                    // Yield tool_call_start event
+                                    return [4 /*yield*/, _q.sent()];
+                                    case 35:
+                                        // Yield tool_call_start event
+                                        _q.sent();
+                                        return [4 /*yield*/, __await(toolExecutor.execute(toolCall.input, {
+                                                user: input.user,
+                                                permissions: input.userPermissions,
+                                                conversationContext: input.conversationContext,
+                                            }))];
+                                    case 36:
+                                        toolResult = _q.sent();
+                                        formattedResult = toolExecutor.formatResultForAI(toolResult);
+                                        toolResults.push({
+                                            type: "tool_result",
+                                            tool_use_id: toolCall.id,
+                                            content: formattedResult,
+                                            is_error: !toolResult.success,
+                                        });
+                                        return [4 /*yield*/, __await({
+                                                type: "tool_call_result",
+                                                toolCall: {
+                                                    id: toolCall.id,
+                                                    name: toolCall.name,
+                                                    input: toolCall.input,
+                                                },
+                                                output: toolResult.success ? toolResult.data : null,
+                                                error: toolResult.success ? undefined : toolResult.error,
+                                            })];
+                                    case 37:
+                                    // Yield tool_call_result event
+                                    return [4 /*yield*/, _q.sent()];
+                                    case 38:
+                                        // Yield tool_call_result event
+                                        _q.sent();
+                                        toolCalls.push({
+                                            name: toolCall.name,
+                                            input: toolCall.input,
+                                            output: toolResult.success ? toolResult.data : null,
+                                            error: toolResult.success ? undefined : toolResult.error,
+                                        });
+                                        FlinkLog_1.log.debug("[Agent:".concat(this_1.agentName, "] Tool '").concat(toolCall.name, "' ").concat(toolResult.success ? "succeeded" : "failed", ":"), {
+                                            success: toolResult.success,
+                                            outputSize: toolResult.success ? JSON.stringify(toolResult.data).length : 0,
+                                            outputPreview: toolResult.success
+                                                ? JSON.stringify(toolResult.data).substring(0, 200) + (JSON.stringify(toolResult.data).length > 200 ? "..." : "")
+                                                : toolResult.error,
+                                            code: toolResult.code,
+                                        });
+                                        if (!toolResult.success) {
+                                            FlinkLog_1.log.warn("Tool ".concat(toolCall.name, " returned error:"), toolResult.error);
+                                        }
+                                        return [3 /*break*/, 42];
+                                    case 39:
+                                        err_3 = _q.sent();
+                                        // Unexpected errors (not from tool itself)
+                                        toolError = err_3.message;
+                                        return [4 /*yield*/, __await({
+                                                type: "tool_call_result",
+                                                toolCall: {
+                                                    id: toolCall.id,
+                                                    name: toolCall.name,
+                                                    input: toolCall.input,
+                                                },
+                                                output: null,
+                                                error: toolError,
+                                            })];
+                                    case 40:
+                                    // Yield tool_call_result with error
+                                    return [4 /*yield*/, _q.sent()];
+                                    case 41:
+                                        // Yield tool_call_result with error
+                                        _q.sent();
+                                        toolResults.push({
+                                            type: "tool_result",
+                                            tool_use_id: toolCall.id,
+                                            content: "Error: ".concat(err_3.message),
+                                            is_error: true,
+                                        });
+                                        toolCalls.push({
+                                            name: toolCall.name,
+                                            input: toolCall.input,
+                                            output: null,
+                                            error: toolError,
+                                        });
+                                        FlinkLog_1.log.error("Tool ".concat(toolCall.name, " execution failed:"), err_3.message);
+                                        return [3 /*break*/, 42];
+                                    case 42:
+                                        _o++;
+                                        return [3 /*break*/, 32];
+                                    case 43:
+                                        // Add tool results to conversation
+                                        messages.push({
+                                            role: "user",
+                                            content: toolResults,
+                                        });
+                                        if (!this_1.agentProps.onStep) return [3 /*break*/, 45];
+                                        stepContext = __assign(__assign({}, execContext), { step: step, maxSteps: maxSteps, messages: __spreadArray([], messages, true) });
+                                        return [4 /*yield*/, __await(this_1.agentProps.onStep(stepContext))];
+                                    case 44:
+                                        _q.sent();
+                                        _q.label = 45;
+                                    case 45:
+                                        // Dispatch observer onStep with per-step tool calls slice
+                                        this_1.safeDispatch("onStep", function () {
+                                            var _a, _b;
+                                            return (_b = (_a = _this.observer) === null || _a === void 0 ? void 0 : _a.onStep) === null || _b === void 0 ? void 0 : _b.call(_a, {
+                                                runId: runId,
+                                                agentId: agentId,
+                                                step: step,
+                                                maxSteps: maxSteps,
+                                                messages: __spreadArray([], messages, true),
+                                                assistantText: llmResponse.textContent,
+                                                toolCalls: toolCalls.slice(toolCallsBeforeStep),
+                                                usage: usage,
+                                                context: execContext,
+                                            });
+                                        });
+                                        return [2 /*return*/];
+                                }
+                            });
+                        };
+                        this_1 = this;
+                        _j.label = 8;
                     case 8:
-                        availableTools = _o.sent();
-                        if (!this.agentProps.shouldCompact) return [3 /*break*/, 16];
-                        _o.label = 9;
+                        if (!(step < maxSteps)) return [3 /*break*/, 10];
+                        return [5 /*yield**/, _loop_1()];
                     case 9:
-                        _o.trys.push([9, 15, , 16]);
-                        return [4 /*yield*/, __await(this.agentProps.shouldCompact(messages, step))];
+                        state_1 = _j.sent();
+                        if (state_1 === "break")
+                            return [3 /*break*/, 10];
+                        return [3 /*break*/, 8];
                     case 10:
-                        needsCompaction = _o.sent();
-                        if (!needsCompaction) return [3 /*break*/, 14];
-                        beforeCount = messages.length;
-                        originalMessages = messages;
-                        compactedMessages = void 0;
-                        if (!this.agentProps.compactHistory) return [3 /*break*/, 12];
-                        return [4 /*yield*/, __await(this.agentProps.compactHistory(messages, step))];
-                    case 11:
-                        compactedMessages = _o.sent();
-                        return [3 /*break*/, 13];
-                    case 12:
-                        // Default strategy: sliding window keeping last 10 messages
-                        compactedMessages = messages.slice(-10);
-                        _o.label = 13;
-                    case 13:
-                        // Validation: ensure compacted array is not empty
-                        if (!compactedMessages || compactedMessages.length === 0) {
-                            throw new Error("compactHistory must return at least one message");
-                        }
-                        // Apply compaction
-                        messages = compactedMessages;
-                        // Log compaction for debugging
-                        FlinkLog_1.log.debug("[Agent:".concat(this.agentName, "] Step ").concat(step, ": Compacted ").concat(beforeCount, " messages \u2192 ").concat(messages.length));
-                        FlinkLog_1.log.debug("[Agent:".concat(this.agentName, "] Compacted messages:"), {
-                            messageCount: messages.length,
-                            messages: messages.map(function (m) { return ({
-                                role: m.role,
-                                contentPreview: typeof m.content === "string"
-                                    ? m.content.substring(0, 100) + (m.content.length > 100 ? "..." : "")
-                                    : "".concat(m.content.length, " blocks"),
-                            }); }),
-                        });
-                        _o.label = 14;
-                    case 14: return [3 /*break*/, 16];
-                    case 15:
-                        error_1 = _o.sent();
-                        // Log error but don't fail execution - compaction is optional optimization
-                        FlinkLog_1.log.error("[Agent:".concat(this.agentName, "] Context compaction failed:"), error_1.message);
-                        return [3 /*break*/, 16];
-                    case 16:
-                        FlinkLog_1.log.debug("[Agent:".concat(this.agentName, "] Step ").concat(step, "/").concat(maxSteps, " - Calling LLM with:"), {
-                            instructionsType: typeof this.agentProps.instructions === "function" ? "dynamic-callback" : "static",
-                            messageCount: messages.length,
-                            messages: messages.map(function (m) { return ({
-                                role: m.role,
-                                contentPreview: typeof m.content === "string"
-                                    ? m.content.substring(0, 100) + (m.content.length > 100 ? "..." : "")
-                                    : "".concat(m.content.length, " blocks"),
-                            }); }),
-                            toolCount: availableTools.length,
-                            tools: availableTools.map(function (t) { return t.name; }),
-                            maxTokens: this.maxTokens,
-                            temperature: this.temperature,
-                        });
-                        llmStream = this.llmAdapter.stream({
-                            instructions: resolvedInstructions,
-                            messages: messages,
-                            tools: availableTools,
-                            maxTokens: this.maxTokens,
-                            temperature: this.temperature,
-                            providerMetadata: input.providerMetadata,
-                        });
-                        textContent = "";
-                        toolCallsFromStream = [];
-                        usage = { inputTokens: 0, outputTokens: 0 };
-                        stopReason = "end_turn";
-                        providerMetadata = {};
-                        _o.label = 17;
-                    case 17:
-                        _o.trys.push([17, 29, 30, 35]);
-                        _b = true, llmStream_1 = (e_1 = void 0, __asyncValues(llmStream));
-                        _o.label = 18;
-                    case 18: return [4 /*yield*/, __await(llmStream_1.next())];
-                    case 19:
-                        if (!(llmStream_1_1 = _o.sent(), _g = llmStream_1_1.done, !_g)) return [3 /*break*/, 28];
-                        _j = llmStream_1_1.value;
-                        _b = false;
-                        chunk = _j;
-                        _c = chunk.type;
-                        switch (_c) {
-                            case "text": return [3 /*break*/, 20];
-                            case "tool_call": return [3 /*break*/, 23];
-                            case "usage": return [3 /*break*/, 24];
-                            case "metadata": return [3 /*break*/, 25];
-                            case "done": return [3 /*break*/, 26];
-                        }
-                        return [3 /*break*/, 27];
-                    case 20:
-                        textContent += chunk.delta;
-                        return [4 /*yield*/, __await({ type: "text_delta", delta: chunk.delta })];
-                    case 21:
-                    // Yield text_delta event in real-time
-                    return [4 /*yield*/, _o.sent()];
-                    case 22:
-                        // Yield text_delta event in real-time
-                        _o.sent();
-                        return [3 /*break*/, 27];
-                    case 23:
-                        toolCallsFromStream.push(chunk.toolCall);
-                        return [3 /*break*/, 27];
-                    case 24:
-                        usage = chunk.usage;
-                        totalInputTokens += chunk.usage.inputTokens;
-                        totalOutputTokens += chunk.usage.outputTokens;
-                        totalCachedInputTokens += chunk.usage.cachedInputTokens || 0;
-                        totalCacheCreationInputTokens += chunk.usage.cacheCreationInputTokens || 0;
-                        return [3 /*break*/, 27];
-                    case 25:
-                        // Merge provider metadata (e.g., responseId for continuation)
-                        providerMetadata = __assign(__assign({}, providerMetadata), chunk.metadata);
-                        finalProviderMetadata = __assign(__assign({}, finalProviderMetadata), chunk.metadata);
-                        return [3 /*break*/, 27];
-                    case 26:
-                        stopReason = chunk.stopReason;
-                        return [3 /*break*/, 27];
-                    case 27:
-                        _b = true;
-                        return [3 /*break*/, 18];
-                    case 28: return [3 /*break*/, 35];
-                    case 29:
-                        e_1_1 = _o.sent();
-                        e_1 = { error: e_1_1 };
-                        return [3 /*break*/, 35];
-                    case 30:
-                        _o.trys.push([30, , 33, 34]);
-                        if (!(!_b && !_g && (_h = llmStream_1.return))) return [3 /*break*/, 32];
-                        return [4 /*yield*/, __await(_h.call(llmStream_1))];
-                    case 31:
-                        _o.sent();
-                        _o.label = 32;
-                    case 32: return [3 /*break*/, 34];
-                    case 33:
-                        if (e_1) throw e_1.error;
-                        return [7 /*endfinally*/];
-                    case 34: return [7 /*endfinally*/];
-                    case 35:
-                        llmResponse = {
-                            textContent: textContent || undefined,
-                            toolCalls: toolCallsFromStream,
-                            usage: usage,
-                            stopReason: stopReason,
-                        };
-                        FlinkLog_1.log.debug("[Agent:".concat(this.agentName, "] Step ").concat(step, " - LLM Response:"), {
-                            textLength: ((_l = llmResponse.textContent) === null || _l === void 0 ? void 0 : _l.length) || 0,
-                            textPreview: ((_m = llmResponse.textContent) === null || _m === void 0 ? void 0 : _m.substring(0, 200)) + (llmResponse.textContent && llmResponse.textContent.length > 200 ? "..." : ""),
-                            toolCallsCount: llmResponse.toolCalls.length,
-                            toolCalls: llmResponse.toolCalls.map(function (tc) { return ({
-                                name: tc.name,
-                                inputKeys: Object.keys(tc.input),
-                                input: tc.input,
-                            }); }),
-                            stopReason: llmResponse.stopReason,
-                            usage: llmResponse.usage,
-                        });
-                        // Extract text response
-                        if (llmResponse.textContent) {
-                            finalMessage = llmResponse.textContent;
-                        }
-                        assistantContent = [];
-                        if (llmResponse.textContent) {
-                            assistantContent.push({
-                                type: "text",
-                                text: llmResponse.textContent,
-                            });
-                        }
-                        for (_i = 0, _d = llmResponse.toolCalls; _i < _d.length; _i++) {
-                            toolCall = _d[_i];
-                            assistantContent.push({
-                                type: "tool_use",
-                                id: toolCall.id,
-                                name: toolCall.name,
-                                input: toolCall.input,
-                            });
-                        }
-                        messages.push({
-                            role: "assistant",
-                            content: assistantContent,
-                        });
-                        if (!(llmResponse.toolCalls.length === 0)) return [3 /*break*/, 38];
-                        if (!this.agentProps.onStep) return [3 /*break*/, 37];
-                        stepContext = __assign(__assign({}, execContext), { step: step, maxSteps: maxSteps, messages: __spreadArray([], messages, true) });
-                        return [4 /*yield*/, __await(this.agentProps.onStep(stepContext))];
-                    case 36:
-                        _o.sent();
-                        _o.label = 37;
-                    case 37: return [3 /*break*/, 53]; // No more tool calls - done
-                    case 38:
-                        toolResults = [];
-                        _e = 0, _f = llmResponse.toolCalls;
-                        _o.label = 39;
-                    case 39:
-                        if (!(_e < _f.length)) return [3 /*break*/, 50];
-                        toolCall = _f[_e];
-                        toolExecutor = this.tools.get(toolCall.name);
-                        toolOutput = void 0;
-                        toolError = void 0;
-                        FlinkLog_1.log.debug("[Agent:".concat(this.agentName, "] Executing tool '").concat(toolCall.name, "':"), {
-                            input: toolCall.input,
-                            inputSize: JSON.stringify(toolCall.input).length,
-                        });
-                        _o.label = 40;
-                    case 40:
-                        _o.trys.push([40, 46, , 49]);
-                        if (!toolExecutor) {
-                            throw new Error("Tool ".concat(toolCall.name, " not found"));
-                        }
-                        return [4 /*yield*/, __await({
-                                type: "tool_call_start",
-                                toolCall: {
-                                    id: toolCall.id,
-                                    name: toolCall.name,
-                                    input: toolCall.input,
-                                },
-                            })];
-                    case 41:
-                    // Yield tool_call_start event
-                    return [4 /*yield*/, _o.sent()];
-                    case 42:
-                        // Yield tool_call_start event
-                        _o.sent();
-                        return [4 /*yield*/, __await(toolExecutor.execute(toolCall.input, {
-                                user: input.user,
-                                permissions: input.userPermissions,
-                                conversationContext: input.conversationContext,
-                            }))];
-                    case 43:
-                        toolResult = _o.sent();
-                        formattedResult = toolExecutor.formatResultForAI(toolResult);
-                        toolResults.push({
-                            type: "tool_result",
-                            tool_use_id: toolCall.id,
-                            content: formattedResult,
-                            is_error: !toolResult.success,
-                        });
-                        return [4 /*yield*/, __await({
-                                type: "tool_call_result",
-                                toolCall: {
-                                    id: toolCall.id,
-                                    name: toolCall.name,
-                                    input: toolCall.input,
-                                },
-                                output: toolResult.success ? toolResult.data : null,
-                                error: toolResult.success ? undefined : toolResult.error,
-                            })];
-                    case 44:
-                    // Yield tool_call_result event
-                    return [4 /*yield*/, _o.sent()];
-                    case 45:
-                        // Yield tool_call_result event
-                        _o.sent();
-                        toolCalls.push({
-                            name: toolCall.name,
-                            input: toolCall.input,
-                            output: toolResult.success ? toolResult.data : null,
-                            error: toolResult.success ? undefined : toolResult.error,
-                        });
-                        FlinkLog_1.log.debug("[Agent:".concat(this.agentName, "] Tool '").concat(toolCall.name, "' ").concat(toolResult.success ? "succeeded" : "failed", ":"), {
-                            success: toolResult.success,
-                            outputSize: toolResult.success ? JSON.stringify(toolResult.data).length : 0,
-                            outputPreview: toolResult.success
-                                ? JSON.stringify(toolResult.data).substring(0, 200) + (JSON.stringify(toolResult.data).length > 200 ? "..." : "")
-                                : toolResult.error,
-                            code: toolResult.code,
-                        });
-                        if (!toolResult.success) {
-                            FlinkLog_1.log.warn("Tool ".concat(toolCall.name, " returned error:"), toolResult.error);
-                        }
-                        return [3 /*break*/, 49];
-                    case 46:
-                        err_2 = _o.sent();
-                        // Unexpected errors (not from tool itself)
-                        toolError = err_2.message;
-                        return [4 /*yield*/, __await({
-                                type: "tool_call_result",
-                                toolCall: {
-                                    id: toolCall.id,
-                                    name: toolCall.name,
-                                    input: toolCall.input,
-                                },
-                                output: null,
-                                error: toolError,
-                            })];
-                    case 47:
-                    // Yield tool_call_result with error
-                    return [4 /*yield*/, _o.sent()];
-                    case 48:
-                        // Yield tool_call_result with error
-                        _o.sent();
-                        toolResults.push({
-                            type: "tool_result",
-                            tool_use_id: toolCall.id,
-                            content: "Error: ".concat(err_2.message),
-                            is_error: true,
-                        });
-                        toolCalls.push({
-                            name: toolCall.name,
-                            input: toolCall.input,
-                            output: null,
-                            error: toolError,
-                        });
-                        FlinkLog_1.log.error("Tool ".concat(toolCall.name, " execution failed:"), err_2.message);
-                        return [3 /*break*/, 49];
-                    case 49:
-                        _e++;
-                        return [3 /*break*/, 39];
-                    case 50:
-                        // Add tool results to conversation
-                        messages.push({
-                            role: "user",
-                            content: toolResults,
-                        });
-                        if (!this.agentProps.onStep) return [3 /*break*/, 52];
-                        stepContext = __assign(__assign({}, execContext), { step: step, maxSteps: maxSteps, messages: __spreadArray([], messages, true) });
-                        return [4 /*yield*/, __await(this.agentProps.onStep(stepContext))];
-                    case 51:
-                        _o.sent();
-                        _o.label = 52;
-                    case 52: return [3 /*break*/, 7];
-                    case 53:
                         if (step >= maxSteps && toolCalls.length > 0) {
                             stoppedEarly = true;
                             FlinkLog_1.log.warn("Agent ".concat(this.agentName || "unknown", " stopped early after ").concat(maxSteps, " steps"));
                         }
-                        result = {
-                            message: finalMessage,
-                            toolCalls: toolCalls,
-                            stepsUsed: step,
-                            stoppedEarly: stoppedEarly,
-                            usage: __assign(__assign({ inputTokens: totalInputTokens, outputTokens: totalOutputTokens }, (totalCachedInputTokens > 0 && { cachedInputTokens: totalCachedInputTokens })), (totalCacheCreationInputTokens > 0 && { cacheCreationInputTokens: totalCacheCreationInputTokens })),
-                            providerMetadata: Object.keys(finalProviderMetadata).length > 0 ? finalProviderMetadata : undefined,
-                        };
-                        if (!this.agentProps.afterRun) return [3 /*break*/, 55];
-                        finishContext = __assign(__assign({}, execContext), { messages: __spreadArray([], messages, true), result: result });
-                        return [4 /*yield*/, __await(this.agentProps.afterRun(result, finishContext))];
-                    case 54:
-                        _o.sent();
-                        _o.label = 55;
-                    case 55: return [4 /*yield*/, __await({ type: "complete", result: result })];
-                    case 56:
+                        result_1 = buildResult();
+                        if (!this.agentProps.afterRun) return [3 /*break*/, 12];
+                        finishContext = __assign(__assign({}, execContext), { messages: __spreadArray([], messages, true), result: result_1 });
+                        return [4 /*yield*/, __await(this.agentProps.afterRun(result_1, finishContext))];
+                    case 11:
+                        _j.sent();
+                        _j.label = 12;
+                    case 12:
+                        // Dispatch observer onFinish (success path)
+                        this.safeDispatch("onFinish", function () {
+                            var _a, _b;
+                            return (_b = (_a = _this.observer) === null || _a === void 0 ? void 0 : _a.onFinish) === null || _b === void 0 ? void 0 : _b.call(_a, {
+                                runId: runId,
+                                agentId: agentId,
+                                result: result_1,
+                                messages: __spreadArray([], messages, true),
+                                durationMs: Date.now() - runStartedAt,
+                                context: execContext,
+                            });
+                        });
+                        return [4 /*yield*/, __await({ type: "complete", result: result_1 })];
+                    case 13:
                     // Phase 1: Yield only complete event
                     // Phase 2: Will yield text_delta and tool events during loop
-                    return [4 /*yield*/, _o.sent()];
-                    case 57:
+                    return [4 /*yield*/, _j.sent()];
+                    case 14:
                         // Phase 1: Yield only complete event
                         // Phase 2: Will yield text_delta and tool events during loop
-                        _o.sent();
-                        return [4 /*yield*/, __await(result)];
-                    case 58: return [2 /*return*/, _o.sent()];
+                        _j.sent();
+                        return [4 /*yield*/, __await(result_1)];
+                    case 15: return [2 /*return*/, _j.sent()];
+                    case 16:
+                        err_2 = _j.sent();
+                        // Dispatch observer onFinish with error before rethrowing
+                        this.safeDispatch("onFinish", function () {
+                            var _a, _b;
+                            return (_b = (_a = _this.observer) === null || _a === void 0 ? void 0 : _a.onFinish) === null || _b === void 0 ? void 0 : _b.call(_a, {
+                                runId: runId,
+                                agentId: agentId,
+                                result: buildResult(),
+                                messages: __spreadArray([], messages, true),
+                                durationMs: Date.now() - runStartedAt,
+                                error: (err_2 === null || err_2 === void 0 ? void 0 : err_2.message) || String(err_2),
+                                context: execContext,
+                            });
+                        });
+                        throw err_2;
+                    case 17: return [2 /*return*/];
                 }
             });
         });
     };
+    /**
+     * Fire-and-forget observer dispatch: catches synchronous throws and
+     * rejected promises so observer failures never break agent execution.
+     */
+    AgentRunner.prototype.safeDispatch = function (eventName, invoke) {
+        try {
+            var maybePromise = invoke();
+            if (maybePromise && typeof maybePromise.then === "function") {
+                maybePromise.catch(function (err) {
+                    observerLog.warn("AgentObserver.".concat(eventName, " threw (async):"), (err === null || err === void 0 ? void 0 : err.message) || err);
+                });
+            }
+        }
+        catch (err) {
+            observerLog.warn("AgentObserver.".concat(eventName, " threw (sync):"), (err === null || err === void 0 ? void 0 : err.message) || err);
+        }
+    };
     /**
      * Convert Message[] to LLM message format
      * Supports multi-turn conversations with history