npm - @botbotgo/agent-harness - Versions diffs - 0.0.298 → 0.0.299 - Mend

@botbotgo/agent-harness 0.0.298 → 0.0.299

This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.

Files changed (166)

package/README.md +77 -37
package/README.zh.md +79 -30
package/dist/acp.d.ts +3 -0
package/dist/acp.js +10 -2
package/dist/api.d.ts +14 -2
package/dist/api.js +19 -3
package/dist/cli.d.ts +18 -1
package/dist/cli.js +1408 -319
package/dist/client/acp.d.ts +9 -3
package/dist/client/acp.js +55 -1
package/dist/client/in-process.d.ts +5 -2
package/dist/client/in-process.js +4 -6
package/dist/client/index.d.ts +1 -1
package/dist/client/types.d.ts +6 -5
package/dist/config/agents/direct.yaml +7 -17
package/dist/config/agents/orchestra.yaml +9 -65
package/dist/config/catalogs/embedding-models.yaml +1 -1
package/dist/config/catalogs/stores.yaml +1 -1
package/dist/config/knowledge/knowledge-runtime.yaml +36 -2
package/dist/config/knowledge/procedural-memory-runtime.yaml +78 -0
package/dist/config/{catalogs/models.yaml → models.yaml} +2 -2
package/dist/config/prompts/direct-system.md +16 -0
package/dist/config/prompts/orchestra-system.md +62 -0
package/dist/config/prompts/routing-system.md +14 -0
package/dist/config/runtime/runtime-memory.yaml +39 -5
package/dist/config/runtime/workspace.yaml +7 -16
package/dist/contracts/runtime.d.ts +242 -1
package/dist/contracts/workspace.d.ts +2 -0
package/dist/index.d.ts +5 -3
package/dist/index.js +2 -1
package/dist/init-project.js +178 -33
package/dist/knowledge/contracts.d.ts +5 -0
package/dist/knowledge/module.d.ts +5 -0
package/dist/knowledge/module.js +340 -18
package/dist/package-version.d.ts +1 -1
package/dist/package-version.js +1 -1
package/dist/persistence/file-store.d.ts +5 -1
package/dist/persistence/file-store.js +16 -0
package/dist/persistence/sqlite-store.d.ts +4 -1
package/dist/persistence/sqlite-store.js +88 -14
package/dist/persistence/types.d.ts +4 -1
package/dist/procedural/config.d.ts +63 -0
package/dist/procedural/config.js +125 -0
package/dist/procedural/index.d.ts +2 -0
package/dist/procedural/index.js +1 -0
package/dist/protocol/ag-ui/http.d.ts +3 -0
package/dist/protocol/ag-ui/http.js +10 -0
package/dist/request-events.d.ts +63 -0
package/dist/request-events.js +400 -0
package/dist/resource/isolation.js +11 -0
package/dist/resource/resource-impl.d.ts +1 -0
package/dist/resource/resource-impl.js +103 -12
package/dist/resources/init-templates/agent-context/deep-research.md +5 -0
package/dist/resources/init-templates/prompts/research-analyst-basic.md +1 -0
package/dist/resources/init-templates/prompts/research-analyst-web-search.md +1 -0
package/dist/resources/init-templates/prompts/research-host-deep-research-basic.md +1 -0
package/dist/resources/init-templates/prompts/research-host-deep-research-web-search.md +1 -0
package/dist/resources/init-templates/prompts/research-host-single-agent-basic.md +1 -0
package/dist/resources/init-templates/prompts/research-host-single-agent-web-search.md +1 -0
package/dist/resources/prompts/runtime/browser-capability-disclaimer-recovery.md +1 -0
package/dist/resources/prompts/runtime/default-subagent.md +2 -0
package/dist/resources/prompts/runtime/durable-memory-context.md +7 -0
package/dist/resources/prompts/runtime/execution-with-tool-evidence-retry.md +1 -0
package/dist/resources/prompts/runtime/execution-with-tool-evidence.md +1 -0
package/dist/resources/prompts/runtime/invalid-tool-selection-recovery.md +1 -0
package/dist/resources/prompts/runtime/memory-manager.md +31 -0
package/dist/resources/prompts/runtime/memory-mutation-reconciliation.md +22 -0
package/dist/resources/prompts/runtime/slash-command-skill.md +6 -0
package/dist/resources/prompts/runtime/strict-tool-json.md +1 -0
package/dist/resources/prompts/runtime/workspace-boundary-guidance.md +3 -0
package/dist/resources/prompts/runtime/workspace-relative-path.md +1 -0
package/dist/resources/prompts/runtime/write-todos-descriptive-content.md +1 -0
package/dist/resources/prompts/runtime/write-todos-full-entry.md +1 -0
package/dist/resources/prompts/runtime/write-todos-non-empty-initial-list.md +1 -0
package/dist/resources/tools/_runtime_tool_helpers.mjs +152 -0
package/dist/resources/tools/cancel_request.mjs +21 -0
package/dist/resources/tools/fetch_url.mjs +23 -0
package/dist/resources/tools/http_request.mjs +30 -0
package/dist/resources/tools/inspect_approvals.mjs +27 -0
package/dist/resources/tools/inspect_artifacts.mjs +21 -0
package/dist/resources/tools/inspect_events.mjs +21 -0
package/dist/resources/tools/inspect_requests.mjs +27 -0
package/dist/resources/tools/inspect_sessions.mjs +21 -0
package/dist/resources/tools/list_files.mjs +27 -0
package/dist/resources/tools/read_artifact.mjs +22 -0
package/dist/resources/tools/request_approval.mjs +27 -0
package/dist/resources/tools/run_command.mjs +21 -0
package/dist/resources/tools/schedule_task.mjs +76 -0
package/dist/resources/tools/search_files.mjs +47 -0
package/dist/resources/tools/send_message.mjs +23 -0
package/dist/runtime/adapter/direct-builtin-utility.d.ts +1 -0
package/dist/runtime/adapter/direct-builtin-utility.js +90 -0
package/dist/runtime/adapter/flow/execution-context.d.ts +1 -1
package/dist/runtime/adapter/flow/execution-context.js +1 -1
package/dist/runtime/adapter/flow/invocation-flow.d.ts +1 -0
package/dist/runtime/adapter/flow/invocation-flow.js +9 -1
package/dist/runtime/adapter/flow/invoke-runtime.d.ts +1 -1
package/dist/runtime/adapter/flow/stream-runtime.d.ts +5 -1
package/dist/runtime/adapter/flow/stream-runtime.js +556 -35
package/dist/runtime/adapter/invocation-result.js +3 -2
package/dist/runtime/adapter/local-tool-invocation.d.ts +1 -1
package/dist/runtime/adapter/local-tool-invocation.js +28 -4
package/dist/runtime/adapter/middleware-assembly.js +3 -1
package/dist/runtime/adapter/model/invocation-request.d.ts +4 -1
package/dist/runtime/adapter/model/invocation-request.js +138 -16
package/dist/runtime/adapter/model/message-assembly.js +2 -6
package/dist/runtime/adapter/model/model-providers.js +103 -5
package/dist/runtime/adapter/resilience.js +17 -2
package/dist/runtime/adapter/runtime-adapter-support.d.ts +11 -7
package/dist/runtime/adapter/runtime-adapter-support.js +39 -5
package/dist/runtime/adapter/tool/builtin-middleware-tools.d.ts +63 -1
package/dist/runtime/adapter/tool/builtin-middleware-tools.js +193 -21
package/dist/runtime/adapter/tool/tool-arguments.d.ts +3 -1
package/dist/runtime/adapter/tool/tool-arguments.js +52 -17
package/dist/runtime/adapter/tool-resolution.d.ts +1 -0
package/dist/runtime/adapter/tool-resolution.js +4 -2
package/dist/runtime/agent-runtime-adapter.d.ts +27 -0
package/dist/runtime/agent-runtime-adapter.js +163 -11
package/dist/runtime/harness/events/event-bus.d.ts +1 -0
package/dist/runtime/harness/events/event-bus.js +3 -0
package/dist/runtime/harness/events/event-sink.d.ts +3 -0
package/dist/runtime/harness/events/event-sink.js +16 -7
package/dist/runtime/harness/events/streaming.d.ts +18 -1
package/dist/runtime/harness/events/streaming.js +23 -10
package/dist/runtime/harness/run/inspection.js +26 -5
package/dist/runtime/harness/run/stream-run.d.ts +13 -4
package/dist/runtime/harness/run/stream-run.js +448 -4
package/dist/runtime/harness/run/surface-semantics.js +7 -34
package/dist/runtime/harness/system/runtime-memory-manager.d.ts +3 -0
package/dist/runtime/harness/system/runtime-memory-manager.js +384 -69
package/dist/runtime/harness/system/runtime-memory-policy.d.ts +20 -1
package/dist/runtime/harness/system/runtime-memory-policy.js +65 -17
package/dist/runtime/harness/system/runtime-memory-records.js +100 -0
package/dist/runtime/harness/system/runtime-memory-sync.js +2 -2
package/dist/runtime/harness/system/store.d.ts +4 -0
package/dist/runtime/harness/system/store.js +153 -0
package/dist/runtime/harness.d.ts +9 -1
package/dist/runtime/harness.js +141 -7
package/dist/runtime/maintenance/sqlite-checkpoint-saver.d.ts +8 -3
package/dist/runtime/maintenance/sqlite-checkpoint-saver.js +152 -53
package/dist/runtime/parsing/output-parsing.d.ts +10 -2
package/dist/runtime/parsing/output-parsing.js +223 -16
package/dist/runtime/parsing/stream-event-parsing.d.ts +7 -0
package/dist/runtime/parsing/stream-event-parsing.js +51 -1
package/dist/runtime/scheduling/system-schedule-manager.d.ts +41 -0
package/dist/runtime/scheduling/system-schedule-manager.js +532 -0
package/dist/runtime/support/embedding-models.d.ts +1 -1
package/dist/runtime/support/embedding-models.js +5 -2
package/dist/runtime/support/runtime-factories.js +1 -1
package/dist/runtime/support/runtime-layout.d.ts +3 -0
package/dist/runtime/support/runtime-layout.js +10 -1
package/dist/runtime/support/runtime-prompts.d.ts +30 -0
package/dist/runtime/support/runtime-prompts.js +55 -0
package/dist/runtime/support/vector-stores.d.ts +1 -1
package/dist/runtime/support/vector-stores.js +5 -2
package/dist/upstream-events.js +8 -7
package/dist/utils/bundled-text.d.ts +3 -0
package/dist/utils/bundled-text.js +25 -0
package/dist/utils/id.js +3 -2
package/dist/workspace/agent-binding-compiler.js +53 -13
package/dist/workspace/object-loader.js +64 -2
package/dist/workspace/support/workspace-ref-utils.d.ts +2 -1
package/dist/workspace/support/workspace-ref-utils.js +24 -5
package/dist/workspace/yaml-object-reader.d.ts +1 -0
package/dist/workspace/yaml-object-reader.js +95 -17
package/package.json +11 -5

package/dist/runtime/harness/run/stream-run.js CHANGED Viewed

@@ -1,9 +1,162 @@
 import { AGENT_INTERRUPT_SENTINEL_PREFIX, RuntimeOperationTimeoutError } from "../../agent-runtime-adapter.js";
+import { buildRequestPlanState, summarizeBuiltinWriteTodosArgs } from "../../adapter/runtime-adapter-support.js";
 import { renderRuntimeFailure, renderToolFailure } from "../../support/harness-support.js";
 import { getBindingPrimaryModel } from "../../support/compiled-binding.js";
 import { createContentBlocksItem, createToolResultKey, } from "../events/streaming.js";
 import { projectRuntimeSurfaceFromSingleUpstreamEvent } from "./inspection.js";
 import { formatAgentName } from "../../../utils/agent-display.js";
+function createInitialPlanState(sessionId, requestId, updatedAt) {
+    return {
+        sessionId,
+        requestId,
+        version: 0,
+        updatedAt,
+        items: [],
+        summary: {
+            total: 0,
+            pending: 0,
+            inProgress: 0,
+            completed: 0,
+            failed: 0,
+            cancelled: 0,
+            blocked: 0,
+        },
+    };
+}
+function getPlanStateFromToolResult(input) {
+    if (typeof input.output !== "object" || input.output === null) {
+        return null;
+    }
+    const summary = input.output.summary;
+    if (summary && typeof summary === "object" && Array.isArray(summary.items)) {
+        const typedSummary = summary;
+        if (typedSummary.summary && typeof typedSummary.summary === "object") {
+            return {
+                sessionId: input.sessionId,
+                requestId: input.requestId,
+                version: input.version,
+                updatedAt: input.updatedAt,
+                items: typedSummary.items,
+                summary: typedSummary.summary,
+            };
+        }
+    }
+    const snapshot = summarizeBuiltinWriteTodosArgs(input.output);
+    return buildRequestPlanState({
+        sessionId: input.sessionId,
+        requestId: input.requestId,
+        updatedAt: input.updatedAt,
+        version: input.version,
+        snapshot,
+    });
+}
+function getStructuredPlanStateFromToolResult(input) {
+    if (typeof input.output !== "object" || input.output === null) {
+        return null;
+    }
+    const summary = input.output.summary;
+    if (!summary || typeof summary !== "object" || !Array.isArray(summary.items)) {
+        return null;
+    }
+    const typedSummary = summary;
+    if (!typedSummary.summary || typeof typedSummary.summary !== "object") {
+        return null;
+    }
+    return {
+        sessionId: input.sessionId,
+        requestId: input.requestId,
+        version: input.version,
+        updatedAt: input.updatedAt,
+        items: typedSummary.items,
+        summary: typedSummary.summary,
+    };
+}
+function buildPlanStateSignature(planState) {
+    return JSON.stringify({
+        items: planState.items,
+        summary: planState.summary,
+    });
+}
+function countStructuredTodoIds(items) {
+    return items.filter((item) => typeof item.id === "string" && item.id.length > 0).length;
+}
+function shouldEmitPlanState(currentPlanState, nextPlanState) {
+    if (!currentPlanState || currentPlanState.items.length === 0) {
+        return true;
+    }
+    if (nextPlanState.items.length === 0) {
+        return false;
+    }
+    const currentStructuredIds = countStructuredTodoIds(currentPlanState.items);
+    const nextStructuredIds = countStructuredTodoIds(nextPlanState.items);
+    if (currentStructuredIds > 0
+        && nextStructuredIds === 0
+        && nextPlanState.items.length < currentPlanState.items.length) {
+        return false;
+    }
+    return true;
+}
+function extractTodosArray(value) {
+    if (typeof value !== "object" || value === null) {
+        return null;
+    }
+    const record = value;
+    if (Array.isArray(record.todos)) {
+        return record.todos;
+    }
+    if (typeof record.output === "object" && record.output !== null) {
+        const nested = record.output.todos;
+        if (Array.isArray(nested)) {
+            return nested;
+        }
+    }
+    return null;
+}
+function getPlanStateFromUpstreamEvent(input) {
+    if (typeof input.event !== "object" || input.event === null) {
+        return null;
+    }
+    const typed = input.event;
+    const todos = extractTodosArray(typed.data?.output)
+        ?? extractTodosArray(typed.data?.chunk);
+    if (!todos) {
+        return null;
+    }
+    return buildRequestPlanState({
+        sessionId: input.sessionId,
+        requestId: input.requestId,
+        updatedAt: input.updatedAt,
+        version: input.version,
+        snapshot: summarizeBuiltinWriteTodosArgs({ todos }),
+    });
+}
+function getLatestPlanStateFromExecutedToolResults(input) {
+    const executedToolResults = Array.isArray(input.metadata?.executedToolResults)
+        ? input.metadata.executedToolResults
+        : [];
+    for (const latest of [...executedToolResults].reverse()) {
+        const structured = getStructuredPlanStateFromToolResult({
+            sessionId: input.sessionId,
+            requestId: input.requestId,
+            output: latest.output,
+            version: input.version,
+            updatedAt: input.updatedAt,
+        });
+        if (structured) {
+            return structured;
+        }
+        if (latest.toolName === "write_todos") {
+            return getPlanStateFromToolResult({
+                sessionId: input.sessionId,
+                requestId: input.requestId,
+                output: latest.output,
+                version: input.version,
+                updatedAt: input.updatedAt,
+            });
+        }
+    }
+    return null;
+}
 function normalizeStreamChunk(chunk) {
     if (typeof chunk === "string") {
         if (chunk.startsWith(AGENT_INTERRUPT_SENTINEL_PREFIX)) {
@@ -11,6 +164,9 @@ function normalizeStreamChunk(chunk) {
         }
         return { kind: "content", content: chunk };
     }
+    if (chunk.kind === "commentary") {
+        return { kind: "commentary", content: chunk.content ?? "" };
+    }
     if (chunk.kind === "upstream-event") {
         return { kind: "upstream-event", event: (chunk.event ?? {}) };
     }
@@ -28,8 +184,117 @@ function normalizeStreamChunk(chunk) {
             isError: chunk.isError,
         };
     }
+    if (chunk.kind === "profile") {
+        return {
+            kind: "profile",
+            step: chunk.step,
+        };
+    }
     return { kind: "content", content: chunk.content ?? "" };
 }
+function normalizeCommentaryText(value) {
+    return value.replace(/\s+/g, " ").trim();
+}
+function ensureCommentarySentence(value) {
+    const normalized = normalizeCommentaryText(value);
+    if (!normalized) {
+        return normalized;
+    }
+    return /[.!?]$/.test(normalized) ? normalized : `${normalized}.`;
+}
+function summarizePlanState(planState) {
+    if (planState.summary.total <= 0) {
+        return null;
+    }
+    const counts = [
+        planState.summary.inProgress > 0 ? `${planState.summary.inProgress} in progress` : "",
+        planState.summary.pending > 0 ? `${planState.summary.pending} pending` : "",
+        planState.summary.completed > 0 ? `${planState.summary.completed} completed` : "",
+        planState.summary.blocked > 0 ? `${planState.summary.blocked} blocked` : "",
+        planState.summary.failed > 0 ? `${planState.summary.failed} failed` : "",
+    ].filter((value) => value.length > 0);
+    if (counts.length === 0) {
+        counts.push(`${planState.summary.total} total`);
+    }
+    return `Plan updated: ${counts.join(", ")}.`;
+}
+function createSurfaceCommentary(surfaceItem) {
+    const name = normalizeCommentaryText(surfaceItem.name);
+    if (!name) {
+        return null;
+    }
+    if (surfaceItem.kind === "tool") {
+        if (surfaceItem.status === "started") {
+            return `Running tool ${name}.`;
+        }
+        if (surfaceItem.status === "completed") {
+            return `Tool ${name} completed.`;
+        }
+        if (surfaceItem.status === "failed") {
+            return `Tool ${name} failed.`;
+        }
+        return null;
+    }
+    if (surfaceItem.kind === "skill") {
+        if (surfaceItem.status === "started") {
+            return `Applying skill ${name}.`;
+        }
+        if (surfaceItem.status === "completed") {
+            return `Skill ${name} applied.`;
+        }
+        if (surfaceItem.status === "failed") {
+            return `Skill ${name} failed.`;
+        }
+        return null;
+    }
+    if (surfaceItem.kind === "agent") {
+        if (surfaceItem.status === "started") {
+            return `Delegating work to ${name}.`;
+        }
+        if (surfaceItem.status === "completed") {
+            return `Delegation to ${name} completed.`;
+        }
+        if (surfaceItem.status === "failed") {
+            return `Delegation to ${name} failed.`;
+        }
+        return null;
+    }
+    if (surfaceItem.kind === "llm") {
+        if (surfaceItem.status === "started") {
+            return `Running model ${name}.`;
+        }
+        if (surfaceItem.status === "completed") {
+            return `Model ${name} completed.`;
+        }
+        if (surfaceItem.status === "failed") {
+            return `Model ${name} failed.`;
+        }
+        return null;
+    }
+    if (surfaceItem.kind === "memory") {
+        if (surfaceItem.status === "started") {
+            return `Checking memory ${name}.`;
+        }
+        if (surfaceItem.status === "completed") {
+            return ensureCommentarySentence(`Finished checking memory ${name}`);
+        }
+        if (surfaceItem.status === "failed") {
+            return `Memory ${name} failed.`;
+        }
+        return null;
+    }
+    return null;
+}
+function createProfileStepCommentary(step) {
+    const name = normalizeCommentaryText(step.name);
+    if (!name || step.status !== "started") {
+        return null;
+    }
+    if (step.kind === "memory") {
+        return `Checking memory ${name}.`;
+    }
+    return null;
+}
 function isOpenAICompatibleStreamingCompatibilityError(binding, error) {
     const primaryModel = getBindingPrimaryModel(binding);
     if (primaryModel?.provider !== "openai-compatible") {
@@ -38,33 +303,107 @@ function isOpenAICompatibleStreamingCompatibilityError(binding, error) {
     const message = error instanceof Error ? error.message : String(error);
     return message.toLowerCase().includes("received empty response from chat model call");
 }
+function createRuntimeMemoryRecallSteps(sessionId, requestId, items) {
+    if (items.length === 0) {
+        return [];
+    }
+    const timestamp = new Date().toISOString();
+    const scopes = Array.from(new Set(items.map((item) => item.scope)));
+    const primaryScope = scopes.length === 1 ? scopes[0] : "mixed";
+    const primarySummary = items[0]?.summary;
+    const name = scopes.length === 1 ? `durable ${primaryScope} memory` : "durable memory";
+    const detail = {
+        source: "runtime-durable-memory",
+        scope: primaryScope,
+        scopes,
+        count: items.length,
+        summaries: items.map((item) => item.summary).slice(0, 5),
+        ...(primarySummary ? { summary: primarySummary } : {}),
+    };
+    const startedStep = {
+        id: `runtime-memory-recall:${requestId}:started`,
+        kind: "memory",
+        name,
+        action: "recall",
+        status: "started",
+        occurredAt: timestamp,
+        detail,
+    };
+    const completedStep = {
+        ...startedStep,
+        id: `runtime-memory-recall:${requestId}:completed`,
+        status: "completed",
+    };
+    return [
+        {
+            type: "profile-step",
+            sessionId,
+            requestId,
+            step: startedStep,
+        },
+        {
+            type: "profile-step",
+            sessionId,
+            requestId,
+            step: completedStep,
+        },
+    ];
+}
 export async function* streamHarnessRun(options) {
     const priorHistoryPromise = Promise.resolve(options.isNewSession ? [] : undefined).then((historyHint) => historyHint ?? options.loadPriorHistory(options.sessionId, options.requestId));
     yield { type: "event", event: await options.requestCreatedEventPromise };
+    let planStateVersion = 0;
+    let lastPlanStateSignature;
+    let currentPlanState = null;
     let releaseRunSlot = async () => undefined;
     let emitted = false;
     let streamActivityObserved = false;
     let nonUpstreamStreamActivityObserved = false;
+    let assistantOutput = "";
     let currentAgentId = options.selectedAgentId;
     let currentAgentName = formatAgentName(options.selectedAgentId);
     let delegationChain = [options.selectedAgentId];
     let upstreamEventOrdinal = 0;
     let syntheticFallback;
+    const emittedCommentary = new Set();
+    const emitCommentary = function* (content) {
+        const normalized = normalizeCommentaryText(content);
+        if (!normalized || emittedCommentary.has(normalized)) {
+            return;
+        }
+        emittedCommentary.add(normalized);
+        yield {
+            type: "commentary",
+            sessionId: options.sessionId,
+            requestId: options.requestId,
+            agentId: currentAgentId,
+            content: normalized,
+        };
+    };
     try {
         const [priorHistory, acquiredReleaseRunSlot] = await Promise.all([
             priorHistoryPromise,
             options.releaseRequestSlotPromise,
         ]).then(([loadedPriorHistory, resolvedReleaseRunSlot]) => [loadedPriorHistory, resolvedReleaseRunSlot]);
         releaseRunSlot = acquiredReleaseRunSlot;
-        let assistantOutput = "";
         const toolErrors = [];
         let lastToolResultKey = null;
+        const recalledMemories = options.invocation.memoryRecall?.items ?? [];
+        for (const item of createRuntimeMemoryRecallSteps(options.sessionId, options.requestId, recalledMemories)) {
+            yield item;
+            if (item.type === "profile-step") {
+                const commentary = createProfileStepCommentary(item.step);
+                if (commentary) {
+                    yield* emitCommentary(commentary);
+                }
+            }
+        }
         for await (const rawChunk of options.stream(options.binding, options.input, options.sessionId, priorHistory, {
             context: options.invocation.context,
             state: options.invocation.state,
             files: options.invocation.files,
             requestId: options.requestId,
-            memoryContext: options.invocation.memoryContext,
+            memoryContext: options.invocation.memoryRecall?.prompt,
         })) {
             if (!rawChunk) {
                 continue;
@@ -72,6 +411,32 @@ export async function* streamHarnessRun(options) {
             streamActivityObserved = true;
             const normalizedChunk = normalizeStreamChunk(rawChunk);
             if (normalizedChunk.kind === "upstream-event") {
+                const upstreamPlanState = getPlanStateFromUpstreamEvent({
+                    sessionId: options.sessionId,
+                    requestId: options.requestId,
+                    event: normalizedChunk.event,
+                    version: planStateVersion + 1,
+                    updatedAt: new Date().toISOString(),
+                });
+                if (upstreamPlanState) {
+                    const signature = buildPlanStateSignature(upstreamPlanState);
+                    if (signature !== lastPlanStateSignature && shouldEmitPlanState(currentPlanState, upstreamPlanState)) {
+                        planStateVersion = upstreamPlanState.version;
+                        lastPlanStateSignature = signature;
+                        currentPlanState = upstreamPlanState;
+                        yield {
+                            type: "plan-state",
+                            sessionId: options.sessionId,
+                            requestId: options.requestId,
+                            agentId: currentAgentId,
+                            planState: upstreamPlanState,
+                        };
+                        const commentary = summarizePlanState(upstreamPlanState);
+                        if (commentary) {
+                            yield* emitCommentary(commentary);
+                        }
+                    }
+                }
                 upstreamEventOrdinal += 1;
                 const projectionBinding = options.getBinding(currentAgentId) ?? options.binding;
                 const surfaceProjection = projectRuntimeSurfaceFromSingleUpstreamEvent({
@@ -121,6 +486,10 @@ export async function* streamHarnessRun(options) {
                         surfaceItem,
                         event: normalizedChunk.event,
                     };
+                    const commentary = createSurfaceCommentary(surfaceItem);
+                    if (commentary) {
+                        yield* emitCommentary(commentary);
+                    }
                 }
                 continue;
             }
@@ -150,9 +519,26 @@ export async function* streamHarnessRun(options) {
                 };
                 return;
             }
+            if (normalizedChunk.kind === "commentary") {
+                yield* emitCommentary(normalizedChunk.content);
+                continue;
+            }
             if (normalizedChunk.kind === "reasoning") {
                 continue;
             }
+            if (normalizedChunk.kind === "profile") {
+                yield {
+                    type: "profile-step",
+                    sessionId: options.sessionId,
+                    requestId: options.requestId,
+                    step: normalizedChunk.step,
+                };
+                const commentary = createProfileStepCommentary(normalizedChunk.step);
+                if (commentary) {
+                    yield* emitCommentary(commentary);
+                }
+                continue;
+            }
             if (normalizedChunk.kind === "tool-result") {
                 const toolResultKey = createToolResultKey(normalizedChunk.toolName, normalizedChunk.output, normalizedChunk.isError);
                 if (toolResultKey === lastToolResultKey) {
@@ -171,6 +557,39 @@ export async function* streamHarnessRun(options) {
                     output: normalizedChunk.output,
                     isError: normalizedChunk.isError,
                 };
+                const planState = normalizedChunk.toolName === "write_todos"
+                    ? getPlanStateFromToolResult({
+                        sessionId: options.sessionId,
+                        requestId: options.requestId,
+                        output: normalizedChunk.output,
+                        version: ++planStateVersion,
+                        updatedAt: new Date().toISOString(),
+                    })
+                    : getStructuredPlanStateFromToolResult({
+                        sessionId: options.sessionId,
+                        requestId: options.requestId,
+                        output: normalizedChunk.output,
+                        version: ++planStateVersion,
+                        updatedAt: new Date().toISOString(),
+                    });
+                if (planState) {
+                    const signature = buildPlanStateSignature(planState);
+                    if (signature !== lastPlanStateSignature && shouldEmitPlanState(currentPlanState, planState)) {
+                        lastPlanStateSignature = signature;
+                        currentPlanState = planState;
+                        yield {
+                            type: "plan-state",
+                            sessionId: options.sessionId,
+                            requestId: options.requestId,
+                            agentId: currentAgentId,
+                            planState,
+                        };
+                        const commentary = summarizePlanState(planState);
+                        if (commentary) {
+                            yield* emitCommentary(commentary);
+                        }
+                    }
+                }
                 continue;
             }
             emitted = true;
@@ -200,6 +619,32 @@ export async function* streamHarnessRun(options) {
                 assistantOutput = actual.output;
                 emitted = true;
             }
+            const finalPlanState = getLatestPlanStateFromExecutedToolResults({
+                sessionId: options.sessionId,
+                requestId: options.requestId,
+                metadata: actual.metadata,
+                version: planStateVersion + 1,
+                updatedAt: new Date().toISOString(),
+            });
+            if (finalPlanState) {
+                const signature = buildPlanStateSignature(finalPlanState);
+                if (signature !== lastPlanStateSignature && shouldEmitPlanState(currentPlanState, finalPlanState)) {
+                    planStateVersion = finalPlanState.version;
+                    lastPlanStateSignature = signature;
+                    currentPlanState = finalPlanState;
+                    yield {
+                        type: "plan-state",
+                        sessionId: options.sessionId,
+                        requestId: options.requestId,
+                        agentId: currentAgentId,
+                        planState: finalPlanState,
+                    };
+                    const commentary = summarizePlanState(finalPlanState);
+                    if (commentary) {
+                        yield* emitCommentary(commentary);
+                    }
+                }
+            }
         }
         await options.appendAssistantMessage(options.sessionId, options.requestId, assistantOutput);
         const completedEvent = await options.setRequestStateAndEmit(options.sessionId, options.requestId, 6, "completed", {
@@ -222,8 +667,7 @@ export async function* streamHarnessRun(options) {
         };
     }
     catch (error) {
-        const shouldRetryAfterStreamingCompatibilityError = streamActivityObserved &&
-            !nonUpstreamStreamActivityObserved &&
+        const shouldRetryAfterStreamingCompatibilityError = !assistantOutput &&
             isOpenAICompatibleStreamingCompatibilityError(options.binding, error);
         if ((emitted || streamActivityObserved) && !shouldRetryAfterStreamingCompatibilityError) {
             const runtimeFailure = renderRuntimeFailure(error);

package/dist/runtime/harness/run/surface-semantics.js CHANGED Viewed

@@ -34,24 +34,18 @@ export function stripStepPrefix(label) {
         .replace(/^Accessing memory\s+/i, "")
         .replace(/^Completed memory\s+/i, "");
 }
-function isGenericMemoryMiddlewareName(value) {
-    return /^(memorymiddleware\.before[_\s]?agent|memory middleware before agent)$/i.test(normalizeLabel(value));
-}
 function canonicalMemoryName(memorySource) {
     const normalized = normalizeLabel(memorySource.replace(/^memory\//i, ""));
     const segments = normalized.split(/[\\/]/).filter(Boolean);
     return (segments.at(-1) ?? normalized).toLowerCase() || "memory";
 }
-function isGenericSkillMiddlewareName(value) {
-    return /^(skillsmiddleware\.before[_\s]?agent|skills middleware before agent)$/i.test(normalizeLabel(value));
-}
 export function resolveSurfaceDisplayName(input) {
     const baseName = stripStepPrefix(input.step) || formatAgentName(input.kind);
-    if (input.kind === "memory" && input.binding && isGenericMemoryMiddlewareName(baseName)) {
+    if (input.kind === "memory" && input.binding && baseName.length === 0) {
         const memorySources = getBindingMemorySources(input.binding).filter((name) => name.trim().length > 0);
         return memorySources.length === 1 ? canonicalMemoryName(memorySources[0]) : baseName;
     }
-    if (input.kind !== "skill" || !input.binding || !isGenericSkillMiddlewareName(baseName)) {
+    if (input.kind !== "skill" || !input.binding || baseName.length > 0) {
         return baseName;
     }
     const skillNames = getBindingSkills(input.binding)
@@ -59,32 +53,11 @@ export function resolveSurfaceDisplayName(input) {
         .filter((name) => typeof name === "string" && name.trim().length > 0);
     return skillNames.length === 1 ? skillNames[0] : baseName;
 }
-function normalizeActionHint(value) {
-    return value
-        .replace(/([a-z0-9])([A-Z])/g, "$1 $2")
-        .replace(/[.:/]+/g, " ")
-        .replace(/[_-]+/g, " ")
-        .replace(/\s+/g, " ")
-        .trim()
-        .toLowerCase();
-}
-function resolveMemoryAction(event, step) {
+function resolveMemoryAction(event) {
     const typed = asObject(event);
-    const hints = [
-        typeof typed?.event === "string" ? typed.event : "",
-        typeof typed?.name === "string" ? typed.name : "",
-        typeof typed?.run_type === "string" ? typed.run_type : "",
-        ...readStringArray(typed?.tags),
-        ...readStringArray(typed?.ns),
-        step,
-    ].map(normalizeActionHint);
-    if (hints.some((value) => /\b(store|memorize|sync|formation|ingestion|archive|write)\b/.test(value))) {
-        return "memorize";
-    }
-    if (hints.some((value) => /\b(recall|retrieve|memorymiddleware|before agent|checkpoint|context)\b/.test(value)
-        || value.includes("accessing memory")
-        || value.includes("access memory"))) {
-        return "recall";
+    const runType = typeof typed?.run_type === "string" ? typed.run_type.trim().toLowerCase() : "";
+    if (runType === "memory") {
+        return "access";
     }
     return "access";
 }
@@ -99,7 +72,7 @@ export function resolveSurfaceAction(input) {
         case "skill":
             return "apply";
         case "memory":
-            return resolveMemoryAction(input.event, input.step ?? "");
+            return resolveMemoryAction(input.event);
         default:
             return "run";
     }

package/dist/runtime/harness/system/runtime-memory-manager.d.ts CHANGED Viewed

@@ -10,6 +10,7 @@ export type ResolvedRuntimeMemoryFormationConfig = {
         enabled: boolean;
         strategy: "rules" | "model";
         modelRef?: string;
+        prompt?: string;
         maxContextRecords: number;
     };
     background: {
@@ -64,6 +65,8 @@ export declare function runModelMemoryManager(input: {
     requestId: string;
     recordedAt: string;
     existingRecords: MemoryRecord[];
+    maxContextRecords?: number;
+    promptTemplate?: string;
     modelResolver?: (modelId: string) => unknown;
 }): Promise<MemoryCandidate[]>;
 export declare function createRuntimeMemoryManager(input: {