npm - @flowdesk/opencode-plugin - Versions diffs - 0.1.13 → 0.1.15 - Mend

@flowdesk/opencode-plugin 0.1.13 → 0.1.15

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (80) hide show

package/README.md +1 -1
package/dist/agent-task-output.d.ts +29 -0
package/dist/agent-task-output.d.ts.map +1 -0
package/dist/agent-task-output.js +225 -0
package/dist/agent-task-output.js.map +1 -0
package/dist/agent-task-runner.d.ts +34 -0
package/dist/agent-task-runner.d.ts.map +1 -1
package/dist/agent-task-runner.js +634 -84
package/dist/agent-task-runner.js.map +1 -1
package/dist/auto-continue-preview-tool.d.ts +36 -0
package/dist/auto-continue-preview-tool.d.ts.map +1 -0
package/dist/auto-continue-preview-tool.js +119 -0
package/dist/auto-continue-preview-tool.js.map +1 -0
package/dist/completion-ui-cache.d.ts +6 -0
package/dist/completion-ui-cache.d.ts.map +1 -0
package/dist/completion-ui-cache.js +390 -0
package/dist/completion-ui-cache.js.map +1 -0
package/dist/event-hook-observer.d.ts +14 -0
package/dist/event-hook-observer.d.ts.map +1 -0
package/dist/event-hook-observer.js +257 -0
package/dist/event-hook-observer.js.map +1 -0
package/dist/managed-dispatch-adapter.d.ts +62 -0
package/dist/managed-dispatch-adapter.d.ts.map +1 -1
package/dist/managed-dispatch-adapter.js +472 -4
package/dist/managed-dispatch-adapter.js.map +1 -1
package/dist/model-selection-engine.d.ts +60 -0
package/dist/model-selection-engine.d.ts.map +1 -0
package/dist/model-selection-engine.js +242 -0
package/dist/model-selection-engine.js.map +1 -0
package/dist/provider-usage-live-tool.d.ts +10 -0
package/dist/provider-usage-live-tool.d.ts.map +1 -1
package/dist/provider-usage-live-tool.js +262 -33
package/dist/provider-usage-live-tool.js.map +1 -1
package/dist/server.d.ts +36 -1
package/dist/server.d.ts.map +1 -1
package/dist/server.js +497 -20
package/dist/server.js.map +1 -1
package/dist/stall-recovery.d.ts +34 -0
package/dist/stall-recovery.d.ts.map +1 -1
package/dist/stall-recovery.js +680 -3
package/dist/stall-recovery.js.map +1 -1
package/dist/status-live-tool.d.ts +54 -0
package/dist/status-live-tool.d.ts.map +1 -1
package/dist/status-live-tool.js +449 -44
package/dist/status-live-tool.js.map +1 -1
package/dist/tui-subtask-activity.d.ts +73 -0
package/dist/tui-subtask-activity.d.ts.map +1 -0
package/dist/tui-subtask-activity.js +271 -0
package/dist/tui-subtask-activity.js.map +1 -0
package/dist/tui-usage-snapshot.d.ts +14 -0
package/dist/tui-usage-snapshot.d.ts.map +1 -1
package/dist/tui-usage-snapshot.js +275 -8
package/dist/tui-usage-snapshot.js.map +1 -1
package/dist/tui.d.ts.map +1 -1
package/dist/tui.js +102 -44
package/dist/tui.js.map +1 -1
package/dist/workflow-assign-tool.d.ts +23 -0
package/dist/workflow-assign-tool.d.ts.map +1 -0
package/dist/workflow-assign-tool.js +135 -0
package/dist/workflow-assign-tool.js.map +1 -0
package/dist/workflow-author-tool.d.ts +29 -0
package/dist/workflow-author-tool.d.ts.map +1 -0
package/dist/workflow-author-tool.js +227 -0
package/dist/workflow-author-tool.js.map +1 -0
package/dist/workflow-dispatch-tool.d.ts +12 -0
package/dist/workflow-dispatch-tool.d.ts.map +1 -1
package/dist/workflow-dispatch-tool.js +31 -3
package/dist/workflow-dispatch-tool.js.map +1 -1
package/dist/workflow-orchestrator.d.ts +31 -0
package/dist/workflow-orchestrator.d.ts.map +1 -0
package/dist/workflow-orchestrator.js +160 -0
package/dist/workflow-orchestrator.js.map +1 -0
package/dist/workflow-scheduler.d.ts.map +1 -1
package/dist/workflow-scheduler.js +3 -1
package/dist/workflow-scheduler.js.map +1 -1
package/dist/workflow-synthesis-tool.d.ts +31 -0
package/dist/workflow-synthesis-tool.d.ts.map +1 -0
package/dist/workflow-synthesis-tool.js +194 -0
package/dist/workflow-synthesis-tool.js.map +1 -0
package/package.json +2 -2

package/dist/agent-task-runner.js CHANGED Viewed

@@ -1,9 +1,25 @@
 import { createHash } from "node:crypto";
-import { applyFlowDeskSessionEvidenceWriteIntentsV1, prepareFlowDeskSessionEvidenceWriteIntentV1, } from "@flowdesk/core";
+import { applyFlowDeskSessionEvidenceWriteIntentsV1, prepareFlowDeskSessionEvidenceWriteIntentV1, reloadFlowDeskSessionEvidenceV1, validateTopTierReviewVerdictV1, } from "@flowdesk/core";
 import { launchFlowDeskInjectedSdkRuntimeLaneFromPlanV1, materializeFlowDeskRuntimeLaneLaunchLifecycleEvidenceV1, } from "./managed-dispatch-adapter.js";
+import { observeFlowDeskAgentTaskOutputV1 } from "./agent-task-output.js";
+import { refreshFlowDeskCompletionUiCachesV1 } from "./completion-ui-cache.js";
 import { recordFlowDeskLaneHeartbeatV1 } from "./lane-heartbeat-writer.js";
 const TASK_RESULT_MAX_TEXT = 32_768;
 const AGENT_TASK_CONTEXT_MAX_PROMPT_TEXT = 32_768;
+const INVALID_PARENT_SESSION_REF = "ses-invalid-parent-session-binding";
+/** Schema version for async child session tracking evidence */
+export const AGENT_TASK_CHILD_SESSION_SCHEMA_VERSION = "flowdesk.agent_task_child_session.v1";
+/** Stable-idle finalization thresholds for non-terminal captured text. */
+const STABLE_IDLE_MIN_CYCLES = 3;
+const STABLE_IDLE_MIN_MS = 12_000;
+const STABLE_IDLE_MIN_LEN = 16;
+/**
+ * Caps task result text at TASK_RESULT_MAX_TEXT UTF-16 code units.
+ *
+ * @param {string} text - Raw task result text.
+ * @returns {{ text: string, changed: boolean, truncated: boolean }} The
+ *   (possibly shortened) text. `truncated` is true when the input exceeded the
+ *   cap. `changed` is always false in this implementation.
+ */
+export function sanitizeFlowDeskTaskResultTextV1(text) {
+    if (text.length <= TASK_RESULT_MAX_TEXT)
+        return { text, changed: false, truncated: false };
+    // Never end the kept text on a high surrogate: cutting at a fixed code-unit
+    // offset would leave it without its low-surrogate partner, producing
+    // ill-formed UTF-16 in the stored result.
+    const lastKeptUnit = text.charCodeAt(TASK_RESULT_MAX_TEXT - 1);
+    const endsOnHighSurrogate = lastKeptUnit >= 0xd800 && lastKeptUnit <= 0xdbff;
+    const end = endsOnHighSurrogate ? TASK_RESULT_MAX_TEXT - 1 : TASK_RESULT_MAX_TEXT;
+    return { text: text.slice(0, end), changed: false, truncated: true };
+}
 function agentTaskLaunchPlan(input) {
     return {
         schema_version: "flowdesk.runtime_lane_launch_plan.v1",
@@ -32,66 +48,194 @@ function agentTaskLaunchPlan(input) {
         runtimeExecution: false,
     };
 }
-function extractAssistantTextFromResponse(client, childSessionId) {
-    // We extract response text via messages API
+/**
+ * Validates the raw parent session id for an agent task and derives the
+ * FlowDesk session ref from it.
+ *
+ * @param {unknown} parentSessionId - Raw session id supplied by the caller.
+ * @returns {{ ok: true, parentSessionRef: string } | { ok: false, redactedReason: string, parentSessionRef: string }}
+ *   On success the ref is `ses-<trimmed id>`. On failure the ref is the fixed
+ *   INVALID_PARENT_SESSION_REF placeholder and `redactedReason` names the cause.
+ */
+function validateAgentTaskParentSessionId(parentSessionId) {
+    const reject = (redactedReason) => ({ ok: false, redactedReason, parentSessionRef: INVALID_PARENT_SESSION_REF });
+    // A missing or non-string id is reported as a binding failure instead of
+    // throwing a TypeError from `.trim()`.
+    if (typeof parentSessionId !== "string")
+        return reject("missing_parent_session_binding");
+    const value = parentSessionId.trim();
+    if (value.length === 0)
+        return reject("missing_parent_session_binding");
+    if (value.length > 128)
+        return reject("invalid_parent_session_binding");
+    // `ses-...` is FlowDesk's opaque session-ref wrapper, not the raw OpenCode
+    // session id expected by SDK `session.create({ parentID })`. Accepting it here
+    // causes evidence such as `ses-ses-flowdesk-coordinator` and can make the SDK
+    // wait on a non-existent synthetic parent session until launch timeout.
+    if (value.startsWith("ses-"))
+        return reject("invalid_parent_session_binding");
+    // The allow-list contains no whitespace characters, so it also rejects ids
+    // with embedded whitespace.
+    if (!/^[A-Za-z0-9_.:-]+$/.test(value))
+        return reject("invalid_parent_session_binding");
+    return { ok: true, parentSessionRef: `ses-${value}` };
+}
+/** Bounded nudge text — versioned constant, never echoes user input */
+const AGENT_TASK_NUDGE_TEXT = "Please provide your final answer now. If you have completed your analysis, output your complete response.";
+/**
+ * Polls `session.messages` with a per-call 3-second cap so it works whether the SDK
+ * uses snapshot (returns immediately) or long-poll (blocks until output) semantics.
+ *
+ * Heartbeat: fires every `quietPeriodMs` of silence — only when inactive.
+ * Nudge:     after `quietPeriodMs` of silence, sends a bounded prompt to the child
+ *            session asking for the final answer. Max `maxNudges` nudges total.
+ *            After exhausting nudges with no response, returns undefined.
+ */
+async function extractAssistantTextFromResponse(client, childSessionId, opts) {
     const messages = client.session.messages;
     if (messages === undefined)
         return undefined;
-    return (async () => {
-        try {
-            const method = messages;
+    const quietPeriodMs = opts?.quietPeriodMs ?? 10_000;
+    const maxNudges = opts?.maxNudges ?? 2;
+    const MESSAGES_TIMEOUT_MS = opts?.messagesTimeoutMs ?? 3_000; // per-call cap — handles both snapshot and long-poll
+    const method = messages;
+    /**
+     * Call session.messages with a ceiling timeout so we can check inactivity periodically.
+     * This handles both snapshot APIs (return immediately) and long-poll APIs
+     * (block until LLM produces output). With the timeout, a long-poll call that
+     * hasn't returned after MESSAGES_TIMEOUT_MS resolves as null so we can
+     * check the inactivity clock and possibly send a nudge.
+     */
+    const callMessages = () => {
+        const messagePromise = (async () => {
             const current = await method.call(client.session, { sessionID: childSessionId });
-            const response = isSdkErrorResponse(current)
-                ? await method.call(client.session, { path: { id: childSessionId } })
-                : current;
-            const data = asResponseData(response);
-            const record = asRecord(data);
-            const items = Array.isArray(data)
-                ? data
-                : Array.isArray(record?.items)
-                    ? record.items
-                    : Array.isArray(record?.messages)
-                        ? record.messages
-                        : [];
-            for (let index = items.length - 1; index >= 0; index -= 1) {
-                const message = items[index];
-                const record = asRecord(message);
-                const info = asRecord(record?.info) ?? record;
-                if (info?.role !== "assistant")
-                    continue;
-                const parts = Array.isArray(record?.parts)
-                    ? record.parts
-                    : Array.isArray(info?.parts)
-                        ? info.parts
-                        : [];
-                for (const part of parts) {
-                    const partRecord = asRecord(part);
-                    const text = typeof partRecord?.text === "string"
-                        ? partRecord.text
-                        : typeof partRecord?.content === "string"
-                            ? partRecord.content
-                            : undefined;
-                    if (typeof text === "string" && text.trim().length > 0)
-                        return text;
-                }
-            }
-            return undefined;
+            if (isSdkErrorResponse(current))
+                return method.call(client.session, { path: { id: childSessionId } });
+            return current;
+        })();
+        // Only race against timeout when the API might block (MESSAGES_TIMEOUT_MS > 0)
+        if (MESSAGES_TIMEOUT_MS <= 0)
+            return messagePromise;
+        return Promise.race([
+            messagePromise,
+            new Promise(resolve => setTimeout(() => resolve(null), MESSAGES_TIMEOUT_MS)),
+        ]);
+    };
+    /** Send a nudge to the child session with a hard timeout to prevent blocking.
+     * Uses noReply: true so the child does not generate a spurious second assistant turn.
+     */
+    const sendNudge = async () => {
+        const promptFn = client.session.prompt ?? client.session.promptAsync;
+        if (promptFn === undefined)
+            return "skipped";
+        const NUDGE_TIMEOUT_MS = 5_000;
+        try {
+            await Promise.race([
+                promptFn.call(client.session, {
+                    sessionID: childSessionId,
+                    noReply: true,
+                    ...(opts?.runtimeModel !== undefined ? { model: opts.runtimeModel } : {}),
+                    ...(opts?.agentName !== undefined ? { agent: opts.agentName } : {}),
+                    parts: [{ type: "text", text: AGENT_TASK_NUDGE_TEXT }],
+                }),
+                new Promise((_, reject) => setTimeout(() => reject(new Error("nudge timeout")), NUDGE_TIMEOUT_MS)),
+            ]);
+            return "sent";
         }
         catch {
-            return undefined;
+            return "timeout";
         }
-    })();
-}
-function isProcessOnlyAssistantOutput(text) {
-    const normalized = text.trim().toLowerCase();
-    return normalized.length === 0 || [
-        "working",
-        "thinking",
-        "i'll take a look",
-        "i will take a look",
-        "let me inspect",
-        "i'm going to inspect",
-    ].some((fragment) => normalized.includes(fragment));
+    };
+    const observe = (response) => {
+        if (response === null)
+            return undefined; // timed-out poll cycle
+        return observeFlowDeskAgentTaskOutputV1(response);
+    };
+    const startMs = Date.now();
+    let lastActivityMs = startMs;
+    let lastSignature = "";
+    let lastHeartbeatMs = startMs;
+    let nudgeCount = 0;
+    let latestCandidate;
+    // Stable-idle tracking: capture non-terminal text once it has settled, so a
+    // good answer is not lost just because the SDK shape never surfaced an
+    // explicit terminal/finish marker.
+    let stableText;
+    let stableCount = 0;
+    let firstStableMs = 0;
+    try {
+        while (true) {
+            const response = await callMessages();
+            const nowMs = Date.now();
+            // Build signature (null response = timeout, no change)
+            const sig = response === null ? lastSignature : (() => {
+                const data = asResponseData(response);
+                const record = asRecord(data);
+                const items = Array.isArray(data) ? data
+                    : Array.isArray(record?.items) ? record.items
+                        : Array.isArray(record?.messages) ? record.messages : [];
+                const observed = observe(response);
+                return `${items.length}:${observed?.latestText?.length ?? 0}:${observed?.terminalObserved === true ? "terminal" : "open"}`;
+            })();
+            if (sig !== lastSignature) {
+                // New activity — reset all inactivity clocks
+                lastSignature = sig;
+                lastActivityMs = nowMs;
+                lastHeartbeatMs = nowMs;
+            }
+            const observed = observe(response);
+            if (observed?.latestText !== undefined && observed.latestText.trim().length > 0) {
+                latestCandidate = observed;
+                // Track text stability for idle finalization. Active tool runs reset
+                // stability so we never finalize mid tool-call.
+                if (observed.hasRunningTool) {
+                    stableText = undefined;
+                    stableCount = 0;
+                }
+                else if (observed.latestText === stableText) {
+                    stableCount++;
+                }
+                else {
+                    stableText = observed.latestText;
+                    stableCount = 1;
+                    firstStableMs = nowMs;
+                }
+            }
+            if (observed?.terminalObserved === true && observed.latestText !== undefined && observed.latestText.trim().length > 0) {
+                return { text: observed.latestText, completionStatus: "final", outputKind: observed.outputKind, usableForSynthesis: observed.usableForSynthesis, finalizationReason: "terminal_marker", looksLikeRefusalOrError: observed.looksLikeRefusalOrError };
+            }
+            // Stable-idle: non-terminal text that has been unchanged across several
+            // poll cycles and a minimum interval is treated as captured (not a
+            // semantic success claim — completion_status stays "final" but the
+            // finalization_reason records that this was idle-based capture).
+            if (latestCandidate?.latestText !== undefined &&
+                stableText !== undefined &&
+                stableText.trim().length >= STABLE_IDLE_MIN_LEN &&
+                stableCount >= STABLE_IDLE_MIN_CYCLES &&
+                nowMs - firstStableMs >= STABLE_IDLE_MIN_MS) {
+                return { text: latestCandidate.latestText, completionStatus: "final", outputKind: latestCandidate.outputKind, usableForSynthesis: latestCandidate.usableForSynthesis, finalizationReason: "stable_idle", looksLikeRefusalOrError: latestCandidate.looksLikeRefusalOrError };
+            }
+            const silenceMs = nowMs - lastActivityMs;
+            if (silenceMs >= quietPeriodMs) {
+                // Emit heartbeat on first quiet-period expiry of each silence window
+                if (nowMs - lastHeartbeatMs >= quietPeriodMs) {
+                    lastHeartbeatMs = nowMs;
+                    opts?.heartbeatFn?.(nowMs - startMs);
+                }
+                // Send nudge after quiet period
+                if (nudgeCount < maxNudges) {
+                    nudgeCount++;
+                    await sendNudge();
+                    // Reset activity clock after nudge — give a fresh quiet window
+                    lastActivityMs = Date.now();
+                    lastHeartbeatMs = lastActivityMs;
+                }
+                else {
+                    // Exhausted all nudges. Preserve usable candidate text as partial output.
+                    if (latestCandidate?.latestText !== undefined && latestCandidate.latestText.trim().length > 0) {
+                        return { text: latestCandidate.latestText, completionStatus: "partial", outputKind: latestCandidate.outputKind, usableForSynthesis: latestCandidate.usableForSynthesis, finalizationReason: "nudge_exhausted_partial", looksLikeRefusalOrError: latestCandidate.looksLikeRefusalOrError };
+                    }
+                    return undefined;
+                }
+            }
+            else {
+                // No activity and not yet at quiet period — yield to event loop before next poll.
+                // Sleep for up to 1s or quietPeriodMs/10, whichever is smaller, to avoid tight loops
+                // while still being responsive when messages arrive quickly (snapshot mode).
+                const yieldMs = Math.max(10, Math.min(1_000, Math.floor(quietPeriodMs / 10)));
+                await new Promise(resolve => setTimeout(resolve, yieldMs));
+            }
+        }
+    }
+    catch {
+        return undefined;
+    }
 }
 function asRecord(value) {
     return typeof value === "object" && value !== null && !Array.isArray(value)
@@ -117,11 +261,42 @@ function writeSessionEvidence(input) {
         record: input.record,
     });
     if (prepared.ok && prepared.writeIntent !== undefined) {
-        applyFlowDeskSessionEvidenceWriteIntentsV1(input.rootDir, [prepared.writeIntent]);
+        const applied = applyFlowDeskSessionEvidenceWriteIntentsV1(input.rootDir, [prepared.writeIntent]);
+        return applied.ok && applied.writtenPaths.length > 0;
     }
+    return false;
+}
+/**
+ * Normalises a progress label: whitespace runs become single spaces, the ends
+ * are trimmed, and anything longer than 120 characters is cut to 119
+ * characters followed by an ellipsis.
+ */
+function progressLabel(value) {
+    const words = value.split(/\s+/).filter((word) => word.length > 0);
+    const singleSpaced = words.join(" ");
+    if (singleSpaced.length <= 120)
+        return singleSpaced;
+    return singleSpaced.slice(0, 119) + "…";
+}
+/**
+ * Builds one `flowdesk.agent_task_progress.v1` record and hands it to
+ * writeSessionEvidence. Both the evidence id and `progress_ref` are derived
+ * from the lane id and the progress sequence number. When no `observedAt` is
+ * supplied the current time is used.
+ */
+function writeAgentTaskProgress(input) {
+    const { rootDir, workflowId, laneId, progressSeq } = input;
+    const timestamp = input.observedAt ?? new Date().toISOString();
+    const progressRecord = {
+        schema_version: "flowdesk.agent_task_progress.v1",
+        workflow_id: workflowId,
+        lane_id: laneId,
+        task_id: input.taskId,
+        agent_ref: input.agentRef,
+        provider_qualified_model_id: input.providerQualifiedModelId,
+        progress_seq: progressSeq,
+        observed_at: timestamp,
+        phase: input.phase,
+        progress_label: progressLabel(input.progressLabel),
+        progress_ref: `progress-${laneId}-${progressSeq}`,
+        redaction_version: "v1",
+        dispatch_authority_enabled: false,
+    };
+    // The write result is intentionally not returned; callers get undefined.
+    writeSessionEvidence({
+        rootDir,
+        workflowId,
+        evidenceId: `agent-task-progress-${laneId}-${progressSeq}`,
+        record: progressRecord,
+    });
+}
 function writeAgentTaskTerminalLifecycle(input) {
     const childSessionRef = input.childSessionRef === input.parentSessionRef ? undefined : input.childSessionRef;
+    const messageRef = input.messageRef ?? (input.state === "complete" ? `msg-${input.laneId}` : undefined);
     const record = {
         schema_version: "flowdesk.lane_lifecycle_record.v1",
         lane_id: input.laneId,
@@ -129,11 +304,13 @@ function writeAgentTaskTerminalLifecycle(input) {
         attempt_id: input.attemptId,
         parent_session_ref: input.parentSessionRef,
         ...(childSessionRef === undefined ? {} : { child_session_ref: childSessionRef }),
-        ...(input.messageRef === undefined ? {} : { message_ref: input.messageRef }),
+        ...(messageRef === undefined ? {} : { message_ref: messageRef }),
         agent_ref: input.agentRef,
         provider_qualified_model_id: input.providerQualifiedModelId,
         state: input.state,
+        ...(input.verdictRef === undefined ? {} : { verdict_ref: input.verdictRef }),
         ...(input.outputRef === undefined ? {} : { output_ref: input.outputRef }),
+        ...(input.state === "complete" ? { runtime_echo_ref: `runtime-echo-${input.laneId}`, telemetry_ref: `telemetry-${input.laneId}` } : {}),
         timeout_ms: input.timeoutMs ?? 0,
         orphan_max_age_ms: 0,
         retry_count: 0,
@@ -151,9 +328,113 @@ function writeAgentTaskTerminalLifecycle(input) {
         record: record,
     });
 }
+/**
+ * Pulls candidate JSON object strings out of free-form text.
+ *
+ * Strategy, first match wins:
+ *  1. The whole trimmed text, when it starts with "{" and ends with "}".
+ *  2. Every "{...}" body found inside triple-backtick fences (optionally
+ *     tagged `json`).
+ *  3. The last balanced top-level "{...}" span found by brace counting.
+ *
+ * Candidates are not parsed here; callers must JSON.parse and validate them.
+ * Brace counting is not string-aware, so braces inside JSON string values are
+ * counted like structural ones.
+ *
+ * @param {string} raw - Text to scan.
+ * @returns {string[]} Candidate JSON strings, possibly empty.
+ */
+function extractJsonBlocksFromText(raw) {
+    const trimmed = raw.trim();
+    const results = [];
+    if (trimmed.startsWith("{") && trimmed.endsWith("}"))
+        return [trimmed];
+    const fencePattern = /```(?:json)?\s*\n?(\{[\s\S]*?\})\s*\n?```/g;
+    for (const match of trimmed.matchAll(fencePattern)) {
+        if (match[1])
+            results.push(match[1].trim());
+    }
+    if (results.length > 0)
+        return results;
+    let depth = 0;
+    let start = -1;
+    let lastBlock;
+    for (let i = 0; i < trimmed.length; i++) {
+        const ch = trimmed[i];
+        if (ch === "{") {
+            if (depth === 0)
+                start = i;
+            depth++;
+        }
+        else if (ch === "}") {
+            // Ignore a stray "}" outside any object. Letting depth go negative
+            // would prevent every later "{...}" span from being recognised.
+            if (depth === 0)
+                continue;
+            depth--;
+            if (depth === 0 && start !== -1) {
+                lastBlock = trimmed.slice(start, i + 1).trim();
+                start = -1;
+            }
+        }
+    }
+    return lastBlock === undefined ? [] : [lastBlock];
+}
+/**
+ * Scans the JSON candidates extracted from `input.text` and returns the first
+ * one that parses, passes validateTopTierReviewVerdictV1, and carries the same
+ * `workflow_id` as `input.workflowId`. Returns undefined when none qualifies.
+ */
+function observedTopTierReviewerVerdictFromText(input) {
+    const toMatchingVerdict = (block) => {
+        try {
+            const parsed = JSON.parse(block);
+            if (!validateTopTierReviewVerdictV1(parsed).ok)
+                return undefined;
+            return parsed.workflow_id === input.workflowId ? parsed : undefined;
+        }
+        catch {
+            // Unparseable or otherwise unusable candidate: let the caller try the next one.
+            return undefined;
+        }
+    };
+    for (const block of extractJsonBlocksFromText(input.text)) {
+        const verdict = toMatchingVerdict(block);
+        if (verdict !== undefined)
+            return verdict;
+    }
+    return undefined;
+}
+/**
+ * Writes the verdict as session evidence keyed by its `verdict_id`, then
+ * reloads the workflow's evidence to confirm the write is visible.
+ *
+ * Returns true only when the write succeeded, the reload is ok with no blocked
+ * entries, and a `reviewer_verdict` entry with the same evidence id and
+ * `verdict_id` is present.
+ */
+function persistObservedReviewerVerdict(input) {
+    const { rootDir, workflowId, verdict } = input;
+    const verdictId = verdict.verdict_id;
+    const written = writeSessionEvidence({
+        rootDir,
+        workflowId,
+        evidenceId: verdictId,
+        record: verdict,
+    });
+    if (!written)
+        return false;
+    const reloaded = reloadFlowDeskSessionEvidenceV1({ rootDir, workflowId });
+    const isPersistedVerdict = (entry) => entry.evidenceClass === "reviewer_verdict" &&
+        entry.evidenceId === verdictId &&
+        entry.record.verdict_id === verdict.verdict_id;
+    return reloaded.ok && reloaded.blocked.length === 0 && reloaded.entries.some(isPersistedVerdict);
+}
 export async function executeFlowDeskAgentTaskV1(input) {
     const observedAt = new Date().toISOString();
     const token = `${Date.now().toString(36)}-${Math.random().toString(36).slice(2, 8)}`;
+    const parentBinding = validateAgentTaskParentSessionId(input.parentSessionId);
+    const parentSessionRef = parentBinding.parentSessionRef;
+    const attemptId = `attempt-task-${token}`;
+    if (!parentBinding.ok) {
+        const taskFailedEvidenceId = `task-failed-${input.taskId}-${token}-invalid-parent`;
+        const redactedReason = parentBinding.redactedReason;
+        writeSessionEvidence({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            evidenceId: taskFailedEvidenceId,
+            record: {
+                schema_version: "flowdesk.task_failed.v1",
+                workflow_id: input.workflowId,
+                lane_id: input.laneId,
+                task_id: input.taskId,
+                agent_ref: input.agentRef,
+                provider_qualified_model_id: input.providerQualifiedModelId,
+                failure_category: "sdk_create_failed",
+                redacted_reason: redactedReason,
+                created_at: observedAt,
+                dispatch_authority_enabled: false,
+            },
+        });
+        writeAgentTaskTerminalLifecycle({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            laneId: input.laneId,
+            attemptId,
+            parentSessionRef,
+            agentRef: input.agentRef,
+            providerQualifiedModelId: input.providerQualifiedModelId,
+            state: "invocation_failed",
+            evidenceId: `lifecycle-task-terminal-${input.laneId}-${token}-invalid-parent`,
+            createdAt: observedAt,
+            updatedAt: observedAt,
+        });
+        return { status: "task_failed", failureCategory: "sdk_create_failed", redactedReason, laneId: input.laneId };
+    }
     const launchPlan = agentTaskLaunchPlan({
         workflowId: input.workflowId,
         laneId: input.laneId,
@@ -163,8 +444,6 @@ export async function executeFlowDeskAgentTaskV1(input) {
         token,
     });
     const runningLifecycleEvidenceId = `lifecycle-task-running-${input.laneId}-${token}`;
-    const attemptId = launchPlan.attempt_id ?? `attempt-task-${token}`;
-    const parentSessionRef = `ses-${input.parentSessionId}`;
     const promptTextTruncated = input.promptText.length > AGENT_TASK_CONTEXT_MAX_PROMPT_TEXT;
     const agentTaskContextRecord = {
         schema_version: "flowdesk.agent_task_context.v1",
@@ -189,17 +468,72 @@ export async function executeFlowDeskAgentTaskV1(input) {
         evidenceId: `agent-task-context-${input.taskId}-${token}`,
         record: agentTaskContextRecord,
     });
-    // Launch the lane
-    const launchResult = await launchFlowDeskInjectedSdkRuntimeLaneFromPlanV1({
-        client: input.client,
-        launchPlan,
-        request: {
-            allowActualLaneLaunch: true,
-            parentSessionId: input.parentSessionId,
-            promptText: input.promptText,
-            dispatchMethod: "prompt",
-        },
+    writeAgentTaskProgress({
+        rootDir: input.rootDir,
+        workflowId: input.workflowId,
+        laneId: input.laneId,
+        taskId: input.taskId,
+        agentRef: input.agentRef,
+        providerQualifiedModelId: input.providerQualifiedModelId,
+        phase: "started",
+        progressSeq: 1,
+        progressLabel: "agent task lane launch started",
+        observedAt,
     });
+    // Launch the lane — wrap in absolute timeout so session.prompt blocking doesn't hang forever.
+    // 30s default — if session.prompt blocks for more than 30s with no activity, give up.
+    const LAUNCH_TIMEOUT_MS = input._launchTimeoutMs ?? 30_000;
+    const launchTimeoutHandle = setTimeout(() => { }, LAUNCH_TIMEOUT_MS);
+    const dispatchMethod = input.client.session.promptAsync !== undefined ? "promptAsync" : "prompt";
+    const launchResult = await Promise.race([
+        launchFlowDeskInjectedSdkRuntimeLaneFromPlanV1({
+            client: input.client,
+            launchPlan,
+            request: {
+                allowActualLaneLaunch: true,
+                parentSessionId: input.parentSessionId,
+                promptText: input.promptText,
+                dispatchMethod,
+            },
+        }),
+        new Promise(resolve => setTimeout(() => resolve({ status: "launch_timeout" }), LAUNCH_TIMEOUT_MS)),
+    ]);
+    clearTimeout(launchTimeoutHandle);
+    if ("status" in launchResult && launchResult.status === "launch_timeout") {
+        // session.prompt blocked for too long — treat as invocation failure
+        const failedEvidenceId = `task-failed-${input.taskId}-${token}-launch-timeout`;
+        writeSessionEvidence({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            evidenceId: failedEvidenceId,
+            record: {
+                schema_version: "flowdesk.task_failed.v1",
+                workflow_id: input.workflowId,
+                lane_id: input.laneId,
+                task_id: input.taskId,
+                agent_ref: input.agentRef,
+                provider_qualified_model_id: input.providerQualifiedModelId,
+                failure_category: "sdk_create_failed",
+                redacted_reason: "lane launch timed out: session.prompt did not respond",
+                created_at: observedAt,
+                dispatch_authority_enabled: false,
+            },
+        });
+        writeAgentTaskTerminalLifecycle({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            laneId: input.laneId,
+            attemptId,
+            parentSessionRef,
+            agentRef: input.agentRef,
+            providerQualifiedModelId: input.providerQualifiedModelId,
+            state: "invocation_failed",
+            evidenceId: `lifecycle-task-terminal-${input.laneId}-${token}-launch-timeout`,
+            createdAt: observedAt,
+            updatedAt: new Date().toISOString(),
+        });
+        return { status: "task_failed", failureCategory: "sdk_create_failed", redactedReason: "launch timeout: session.prompt did not respond within the allowed window", laneId: input.laneId };
+    }
     // Write running lifecycle evidence
     materializeFlowDeskRuntimeLaneLaunchLifecycleEvidenceV1({
         rootDir: input.rootDir,
@@ -258,6 +592,11 @@ export async function executeFlowDeskAgentTaskV1(input) {
             updatedAt: new Date().toISOString(),
             timeoutMs: input.timeoutMs,
         });
+        refreshFlowDeskCompletionUiCachesV1({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            observedAt,
+        });
         return {
             status: "task_failed",
             failureCategory,
@@ -278,22 +617,91 @@ export async function executeFlowDeskAgentTaskV1(input) {
         observedAt,
         progressSummaryLabel: `agent task lane launch heartbeat`,
     });
-    // Extract child session ID and get response text
+    refreshFlowDeskCompletionUiCachesV1({
+        rootDir: input.rootDir,
+        workflowId: input.workflowId,
+        observedAt,
+    });
+    // Extract child session ID
     const childSessionId = launchResult.childSessionRef?.startsWith("ses-")
         ? launchResult.childSessionRef.slice("ses-".length)
         : undefined;
-    let resultText;
+    // ── Async mode: return immediately, watchdog handles polling/nudging/abort ──
+    if (input.asyncMode === true) {
+        const resolvedChildId = childSessionId ?? "";
+        // Write child session evidence so watchdog can find it
+        writeSessionEvidence({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            evidenceId: `agent-task-child-session-${input.laneId}-${token}`,
+            record: {
+                schema_version: AGENT_TASK_CHILD_SESSION_SCHEMA_VERSION,
+                workflow_id: input.workflowId,
+                lane_id: input.laneId,
+                task_id: input.taskId,
+                child_session_id: resolvedChildId,
+                parent_session_ref: parentSessionRef,
+                provider_qualified_model_id: input.providerQualifiedModelId,
+                agent_ref: input.agentRef,
+                nudge_count: 0,
+                last_nudge_at: null,
+                created_at: observedAt,
+                dispatch_authority_enabled: false,
+            },
+        });
+        writeAgentTaskProgress({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            laneId: input.laneId,
+            taskId: input.taskId,
+            agentRef: input.agentRef,
+            providerQualifiedModelId: input.providerQualifiedModelId,
+            phase: "waiting",
+            progressSeq: 2,
+            progressLabel: "agent task waiting for async child result",
+        });
+        refreshFlowDeskCompletionUiCachesV1({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            observedAt: new Date().toISOString(),
+        });
+        return { status: "task_launched", laneId: input.laneId, childSessionId: resolvedChildId };
+    }
+    let resultObservation;
     if (childSessionId !== undefined) {
-        resultText = await extractAssistantTextFromResponse(input.client, childSessionId);
+        const runtimeModel = launchResult.status === "lane_launch_started" && typeof launchResult.model === "string"
+            ? launchResult.model : undefined;
+        const agentName = launchResult.status === "lane_launch_started" && typeof launchResult.agent === "string"
+            ? launchResult.agent : undefined;
+        resultObservation = await extractAssistantTextFromResponse(input.client, childSessionId, {
+            quietPeriodMs: input._nudgeQuietPeriodMs ?? 10_000, // default 10s per policy
+            maxNudges: 2,
+            runtimeModel,
+            agentName,
+            messagesTimeoutMs: input._messagesTimeoutMs,
+            heartbeatFn: (elapsedMs) => {
+                recordFlowDeskLaneHeartbeatV1({
+                    rootDir: input.rootDir,
+                    workflowId: input.workflowId,
+                    attemptId,
+                    laneId: input.laneId,
+                    parentSessionRef,
+                    agentRef: input.agentRef,
+                    providerQualifiedModelId: input.providerQualifiedModelId,
+                    state: "running",
+                    observedAt: new Date().toISOString(),
+                    progressSummaryLabel: `agent task waiting for response elapsed=${Math.floor(elapsedMs / 1000)}s`,
+                });
+            },
+        });
     }
-    if (resultText === undefined || (input.outputContract === "final_assistant_text" && isProcessOnlyAssistantOutput(resultText))) {
+    const resultText = resultObservation?.text;
+    if (resultText === undefined) {
         // No response text - write task_failed
         const taskFailedEvidenceId = `task-failed-${input.taskId}-${token}`;
-        const failureCategory = resultText === undefined ? "no_response" : "contract_not_satisfied";
-        const evidenceFailureCategory = resultText === undefined ? "no_response" : "unknown";
-        const redactedReason = resultText === undefined
-            ? "lane launched but no assistant response text found"
-            : "lane launched but final assistant response did not satisfy requested output contract";
+        const failureCategory = "no_response";
+        const evidenceFailureCategory = "no_response";
+        const redactedReason = "lane launched but no assistant response text found";
         const taskFailedRecord = {
             schema_version: "flowdesk.task_failed.v1",
             workflow_id: input.workflowId,
@@ -312,6 +720,17 @@ export async function executeFlowDeskAgentTaskV1(input) {
             evidenceId: taskFailedEvidenceId,
             record: taskFailedRecord,
         });
+        writeAgentTaskProgress({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            laneId: input.laneId,
+            taskId: input.taskId,
+            agentRef: input.agentRef,
+            providerQualifiedModelId: input.providerQualifiedModelId,
+            phase: "failed",
+            progressSeq: 3,
+            progressLabel: failureCategory === "no_response" ? "agent task finished without response" : "agent task output contract not satisfied",
+        });
         writeAgentTaskTerminalLifecycle({
             rootDir: input.rootDir,
             workflowId: input.workflowId,
@@ -322,12 +741,43 @@ export async function executeFlowDeskAgentTaskV1(input) {
             messageRef: launchResult.messageRef?.startsWith("msg-") ? launchResult.messageRef : undefined,
             agentRef: input.agentRef,
             providerQualifiedModelId: input.providerQualifiedModelId,
-            state: resultText === undefined ? "no_output" : "incomplete",
+            state: "no_output",
             evidenceId: `lifecycle-task-terminal-${input.laneId}-${token}`,
             createdAt: observedAt,
             updatedAt: new Date().toISOString(),
             timeoutMs: input.timeoutMs,
         });
+        refreshFlowDeskCompletionUiCachesV1({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            observedAt: new Date().toISOString(),
+        });
+        // Auto-retry with fallback binding if configured and this is not already a retry
+        if (input.fallbackBinding !== undefined && !input._isFallbackRetry) {
+            const retryToken = `${Date.now().toString(36)}-${Math.random().toString(36).slice(2, 8)}`;
+            const retryTaskId = `${input.taskId}-retry-${retryToken.slice(0, 6)}`;
+            const retryLaneId = `${input.laneId}-retry`;
+            writeAgentTaskProgress({
+                rootDir: input.rootDir,
+                workflowId: input.workflowId,
+                laneId: retryLaneId,
+                taskId: retryTaskId,
+                agentRef: input.fallbackBinding.agentRef,
+                providerQualifiedModelId: input.fallbackBinding.providerQualifiedModelId,
+                phase: "retrying",
+                progressSeq: 0,
+                progressLabel: `auto-retry with ${input.fallbackBinding.providerQualifiedModelId} after ${failureCategory}`,
+            });
+            return executeFlowDeskAgentTaskV1({
+                ...input,
+                taskId: retryTaskId,
+                laneId: retryLaneId,
+                agentRef: input.fallbackBinding.agentRef,
+                providerQualifiedModelId: input.fallbackBinding.providerQualifiedModelId,
+                fallbackBinding: undefined,
+                _isFallbackRetry: true,
+            });
+        }
         return {
             status: "task_failed",
             failureCategory,
@@ -335,10 +785,9 @@ export async function executeFlowDeskAgentTaskV1(input) {
             laneId: input.laneId,
         };
     }
-    // Truncate if needed
     const fullResultText = resultText;
-    const truncated = fullResultText.length > TASK_RESULT_MAX_TEXT;
-    const storedResultText = truncated ? fullResultText.slice(0, TASK_RESULT_MAX_TEXT) : fullResultText;
+    const sanitizedResult = sanitizeFlowDeskTaskResultTextV1(fullResultText);
+    const storedResultText = sanitizedResult.text;
     const promptSha256 = sha256Hex(input.promptText);
     const resultSha256 = sha256Hex(fullResultText);
     // Write task_result evidence
@@ -352,17 +801,112 @@ export async function executeFlowDeskAgentTaskV1(input) {
         provider_qualified_model_id: input.providerQualifiedModelId,
         task_prompt_sha256: promptSha256,
         result_text: storedResultText,
-        result_text_truncated: truncated,
+        result_text_truncated: sanitizedResult.truncated,
         result_text_sha256: resultSha256,
+        completion_status: resultObservation?.completionStatus ?? "final",
+        output_kind: resultObservation?.outputKind ?? "final_answer",
+        usable_for_synthesis: resultObservation?.usableForSynthesis ?? true,
+        // Capture/judgement separation: text was captured, so this is NOT a
+        // contract failure. output_kind/completion_status/looks_like_refusal_or_error
+        // are advisory inputs for the coordinator's substance judgement, never a
+        // capture-side drop. missing_contract is only ever true when an explicit
+        // contract was requested AND no text was captured (that path returns
+        // task_failed above, so here it is always false).
+        missing_contract: false,
+        ...(resultObservation?.finalizationReason === undefined
+            ? {}
+            : { finalization_reason: resultObservation.finalizationReason }),
+        looks_like_refusal_or_error: resultObservation?.looksLikeRefusalOrError ?? false,
         created_at: observedAt,
         dispatch_authority_enabled: false,
     };
-    writeSessionEvidence({
+    const taskResultWritten = writeSessionEvidence({
         rootDir: input.rootDir,
         workflowId: input.workflowId,
         evidenceId: taskResultEvidenceId,
         record: taskResultRecord,
     });
+    if (!taskResultWritten) {
+        const taskFailedEvidenceId = `task-failed-${input.taskId}-${token}-result-write`;
+        const redactedReason = "task_result evidence persistence failed";
+        writeSessionEvidence({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            evidenceId: taskFailedEvidenceId,
+            record: {
+                schema_version: "flowdesk.task_failed.v1",
+                workflow_id: input.workflowId,
+                lane_id: input.laneId,
+                task_id: input.taskId,
+                agent_ref: input.agentRef,
+                provider_qualified_model_id: input.providerQualifiedModelId,
+                failure_category: "unknown",
+                redacted_reason: redactedReason,
+                created_at: observedAt,
+                dispatch_authority_enabled: false,
+            },
+        });
+        writeAgentTaskProgress({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            laneId: input.laneId,
+            taskId: input.taskId,
+            agentRef: input.agentRef,
+            providerQualifiedModelId: input.providerQualifiedModelId,
+            phase: "failed",
+            progressSeq: 4,
+            progressLabel: "agent task result persistence failed",
+        });
+        writeAgentTaskTerminalLifecycle({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            laneId: input.laneId,
+            attemptId,
+            parentSessionRef,
+            agentRef: input.agentRef,
+            providerQualifiedModelId: input.providerQualifiedModelId,
+            state: "invocation_failed",
+            evidenceId: `lifecycle-task-terminal-${input.laneId}-${token}-result-write`,
+            createdAt: observedAt,
+            updatedAt: new Date().toISOString(),
+            timeoutMs: input.timeoutMs,
+        });
+        refreshFlowDeskCompletionUiCachesV1({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            observedAt,
+        });
+        return {
+            status: "task_failed",
+            failureCategory: "unknown",
+            redactedReason,
+            laneId: input.laneId,
+        };
+    }
+    const observedReviewerVerdict = observedTopTierReviewerVerdictFromText({
+        text: fullResultText,
+        workflowId: input.workflowId,
+    });
+    const reviewerVerdictPersisted = observedReviewerVerdict === undefined
+        ? false
+        : persistObservedReviewerVerdict({
+            rootDir: input.rootDir,
+            workflowId: input.workflowId,
+            verdict: observedReviewerVerdict,
+        });
+    writeAgentTaskProgress({
+        rootDir: input.rootDir,
+        workflowId: input.workflowId,
+        laneId: input.laneId,
+        taskId: input.taskId,
+        agentRef: input.agentRef,
+        providerQualifiedModelId: input.providerQualifiedModelId,
+        phase: "finalizing",
+        progressSeq: 3,
+        progressLabel: reviewerVerdictPersisted
+            ? "agent task result captured with reviewer verdict evidence"
+            : "agent task result captured",
+    });
     writeAgentTaskTerminalLifecycle({
         rootDir: input.rootDir,
         workflowId: input.workflowId,
@@ -373,13 +917,19 @@ export async function executeFlowDeskAgentTaskV1(input) {
         messageRef: launchResult.messageRef?.startsWith("msg-") ? launchResult.messageRef : undefined,
         agentRef: input.agentRef,
         providerQualifiedModelId: input.providerQualifiedModelId,
-        state: "incomplete",
+        state: reviewerVerdictPersisted ? "complete" : "incomplete",
+        verdictRef: reviewerVerdictPersisted ? observedReviewerVerdict?.verdict_id : undefined,
         outputRef: `output-${taskResultEvidenceId}`,
         evidenceId: `lifecycle-task-terminal-${input.laneId}-${token}`,
         createdAt: observedAt,
         updatedAt: new Date().toISOString(),
         timeoutMs: input.timeoutMs,
     });
+    refreshFlowDeskCompletionUiCachesV1({
+        rootDir: input.rootDir,
+        workflowId: input.workflowId,
+        observedAt,
+    });
     return {
         status: "task_completed",
         resultText: fullResultText,