npm - @exaudeus/workrail - Versions diffs - 3.31.1 → 3.33.0 - Mend

@exaudeus/workrail 3.31.1 → 3.33.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (82)

package/dist/cli/commands/index.d.ts +1 -0
package/dist/cli/commands/index.js +3 -1
package/dist/cli/commands/worktrain-await.js +11 -9
package/dist/cli/commands/worktrain-daemon-install.d.ts +35 -0
package/dist/cli/commands/worktrain-daemon-install.js +291 -0
package/dist/cli/commands/worktrain-daemon.d.ts +31 -0
package/dist/cli/commands/worktrain-daemon.js +272 -0
package/dist/cli/commands/worktrain-spawn.js +11 -9
package/dist/cli-worktrain.js +329 -0
package/dist/cli.js +4 -22
package/dist/console/standalone-console.d.ts +28 -0
package/dist/console/standalone-console.js +142 -0
package/dist/{console/assets/index-6H9DeFxj.js → console-ui/assets/index-BuJFLLfY.js} +1 -1
package/dist/{console → console-ui}/index.html +1 -1
package/dist/daemon/agent-loop.d.ts +26 -0
package/dist/daemon/agent-loop.js +53 -2
package/dist/daemon/daemon-events.d.ts +103 -0
package/dist/daemon/daemon-events.js +56 -0
package/dist/daemon/workflow-runner.d.ts +6 -3
package/dist/daemon/workflow-runner.js +229 -33
package/dist/infrastructure/session/HttpServer.js +133 -34
package/dist/manifest.json +134 -70
package/dist/mcp/output-schemas.d.ts +30 -30
package/dist/mcp/transports/bridge-events.d.ts +4 -0
package/dist/mcp/transports/fatal-exit.js +4 -0
package/dist/mcp/transports/http-entry.js +2 -0
package/dist/mcp/transports/stdio-entry.js +26 -6
package/dist/mcp/v2/tools.d.ts +4 -4
package/dist/trigger/adapters/github-poller.d.ts +44 -0
package/dist/trigger/adapters/github-poller.js +190 -0
package/dist/trigger/adapters/gitlab-poller.d.ts +27 -0
package/dist/trigger/adapters/gitlab-poller.js +81 -0
package/dist/trigger/delivery-client.d.ts +2 -1
package/dist/trigger/delivery-client.js +4 -1
package/dist/trigger/index.d.ts +4 -1
package/dist/trigger/index.js +5 -1
package/dist/trigger/polled-event-store.d.ts +22 -0
package/dist/trigger/polled-event-store.js +173 -0
package/dist/trigger/polling-scheduler.d.ts +20 -0
package/dist/trigger/polling-scheduler.js +249 -0
package/dist/trigger/trigger-listener.d.ts +5 -0
package/dist/trigger/trigger-listener.js +53 -4
package/dist/trigger/trigger-router.d.ts +4 -2
package/dist/trigger/trigger-router.js +7 -4
package/dist/trigger/trigger-store.js +114 -33
package/dist/trigger/types.d.ts +17 -1
package/dist/v2/durable-core/schemas/export-bundle/index.d.ts +224 -224
package/dist/v2/durable-core/schemas/session/events.d.ts +42 -42
package/dist/v2/durable-core/schemas/session/manifest.d.ts +6 -6
package/dist/v2/durable-core/schemas/session/validation-event.d.ts +2 -2
package/dist/v2/durable-core/tokens/payloads.d.ts +52 -52
package/dist/v2/usecases/console-routes.js +3 -3
package/dist/v2/usecases/console-service.js +133 -9
package/dist/v2/usecases/console-types.d.ts +7 -0
package/docs/design/daemon-conversation-logging-plan.md +98 -0
package/docs/design/daemon-conversation-logging-review.md +55 -0
package/docs/design/daemon-conversation-logging.md +129 -0
package/docs/design/github-polling-adapter-design-candidates.md +226 -0
package/docs/design/github-polling-adapter-design-review-findings.md +131 -0
package/docs/design/github-polling-adapter-implementation-plan.md +284 -0
package/docs/design/implementation_plan.md +192 -0
package/docs/design/workflow-id-validation-at-startup.md +146 -0
package/docs/design/workflow-id-validation-design-review.md +87 -0
package/docs/design/workflow-id-validation-implementation-plan.md +185 -0
package/docs/design/worktrain-system-prompt-report-issue-candidates.md +135 -0
package/docs/design/worktrain-system-prompt-report-issue-design-review.md +73 -0
package/docs/ideas/backlog.md +465 -0
package/package.json +1 -1
package/workflows/architecture-scalability-audit.json +1 -1
package/workflows/bug-investigation.agentic.v2.json +3 -3
package/workflows/coding-task-workflow-agentic.json +32 -32
package/workflows/coding-task-workflow-agentic.lean.v2.json +1 -1
package/workflows/coding-task-workflow-agentic.v2.json +7 -7
package/workflows/mr-review-workflow.agentic.v2.json +21 -12
package/workflows/personal-learning-materials-creation-branched.json +2 -2
package/workflows/production-readiness-audit.json +1 -1
package/workflows/relocation-workflow-us.json +2 -2
package/workflows/ui-ux-design-workflow.json +14 -14
package/workflows/workflow-for-workflows.json +3 -3
package/workflows/workflow-for-workflows.v2.json +2 -2
package/workflows/wr.discovery.json +1 -1
/package/dist/{console → console-ui}/assets/index-8dh0Psu-.css +0 -0

package/dist/daemon/workflow-runner.js CHANGED

@@ -42,6 +42,7 @@ exports.readAllDaemonSessions = readAllDaemonSessions;
 exports.runStartupRecovery = runStartupRecovery;
 exports.makeContinueWorkflowTool = makeContinueWorkflowTool;
 exports.makeBashTool = makeBashTool;
+exports.makeReportIssueTool = makeReportIssueTool;
 exports.buildSessionRecap = buildSessionRecap;
 exports.buildSystemPrompt = buildSystemPrompt;
 exports.runWorkflow = runWorkflow;
@@ -338,7 +339,7 @@ function getSchemas() {
     };
     return _schemas;
 }
-function makeContinueWorkflowTool(sessionId, ctx, onAdvance, onComplete, schemas, _executeContinueWorkflowFn = index_js_1.executeContinueWorkflow) {
+function makeContinueWorkflowTool(sessionId, ctx, onAdvance, onComplete, schemas, _executeContinueWorkflowFn = index_js_1.executeContinueWorkflow, emitter, workrailSessionId) {
     return {
         name: 'continue_workflow',
         description: 'Advance the WorkRail workflow to the next step. Call this after completing all work ' +
@@ -347,6 +348,7 @@ function makeContinueWorkflowTool(sessionId, ctx, onAdvance, onComplete, schemas
         label: 'Continue Workflow',
         execute: async (_toolCallId, params) => {
             console.log(`[WorkflowRunner] Tool: continue_workflow sessionId=${sessionId}`);
+            emitter?.emit({ kind: 'tool_called', sessionId, toolName: 'continue_workflow', summary: params.intent ?? 'advance', ...(workrailSessionId != null ? { workrailSessionId } : {}) });
             const result = await _executeContinueWorkflowFn({
                 continueToken: params.continueToken,
                 intent: (params.intent ?? 'advance'),
@@ -425,7 +427,7 @@ function makeContinueWorkflowTool(sessionId, ctx, onAdvance, onComplete, schemas
         },
     };
 }
-function makeBashTool(workspacePath, schemas) {
+function makeBashTool(workspacePath, schemas, sessionId, emitter, workrailSessionId) {
     return {
         name: 'Bash',
         description: 'Execute a shell command. Throws on failure (non-zero exit with stderr, or exit code 2+). ' +
@@ -436,11 +438,14 @@ function makeBashTool(workspacePath, schemas) {
         label: 'Bash',
         execute: async (_toolCallId, params) => {
             console.log(`[WorkflowRunner] Tool: bash "${String(params.command).slice(0, 80)}"`);
+            if (sessionId)
+                emitter?.emit({ kind: 'tool_called', sessionId, toolName: 'Bash', summary: String(params.command).slice(0, 80), ...(workrailSessionId != null ? { workrailSessionId } : {}) });
             const cwd = params.cwd ?? workspacePath;
             try {
                 const { stdout, stderr } = await execAsync(params.command, {
                     cwd,
                     timeout: BASH_TIMEOUT_MS,
+                    shell: '/bin/bash',
                 });
                 const output = [stdout, stderr].filter(Boolean).join('\n');
                 return {
@@ -470,13 +475,15 @@ function makeBashTool(workspacePath, schemas) {
         },
     };
 }
-function makeReadTool(schemas) {
+function makeReadTool(schemas, sessionId, emitter, workrailSessionId) {
     return {
         name: 'Read',
         description: 'Read the contents of a file at the given absolute path.',
         inputSchema: schemas['ReadParams'],
         label: 'Read',
         execute: async (_toolCallId, params) => {
+            if (sessionId)
+                emitter?.emit({ kind: 'tool_called', sessionId, toolName: 'Read', summary: String(params.filePath).slice(0, 80), ...(workrailSessionId != null ? { workrailSessionId } : {}) });
             const content = await fs.readFile(params.filePath, 'utf8');
             return {
                 content: [{ type: 'text', text: content }],
@@ -485,13 +492,15 @@ function makeReadTool(schemas) {
         },
     };
 }
-function makeWriteTool(schemas) {
+function makeWriteTool(schemas, sessionId, emitter, workrailSessionId) {
     return {
         name: 'Write',
         description: 'Write content to a file at the given absolute path. Creates parent directories if needed.',
         inputSchema: schemas['WriteParams'],
         label: 'Write',
         execute: async (_toolCallId, params) => {
+            if (sessionId)
+                emitter?.emit({ kind: 'tool_called', sessionId, toolName: 'Write', summary: String(params.filePath).slice(0, 80), ...(workrailSessionId != null ? { workrailSessionId } : {}) });
             await fs.mkdir(path.dirname(params.filePath), { recursive: true });
             await fs.writeFile(params.filePath, params.content, 'utf8');
             return {
@@ -501,6 +510,140 @@ function makeWriteTool(schemas) {
         },
     };
 }
+async function appendIssueAsync(issuesDir, sessionId, record) { // Appends one issue record as a single JSON line to <issuesDir>/<sessionId>.jsonl.
+    await fs.mkdir(issuesDir, { recursive: true }); // make sure the target directory exists before writing
+    const filePath = path.join(issuesDir, `${sessionId}.jsonl`); // one JSONL file per session id
+    const line = JSON.stringify({ ...record, ts: Date.now() }) + '\n'; // ts is set after the spread, so it replaces any ts already present on record
+    await fs.appendFile(filePath, line, 'utf8'); // append rather than overwrite; rejections propagate to the caller
+}
+function makeReportIssueTool(sessionId, emitter, issuesDirOverride) { // Builds the report_issue tool object (name, description, inputSchema, label, execute) bound to one sessionId.
+    const issuesDir = issuesDirOverride ?? path.join(os.homedir(), '.workrail', 'issues'); // falls back to <home>/.workrail/issues when no override is passed
+    return {
+        name: 'report_issue',
+        description: "Record a structured issue, error, or unexpected behavior. Call this AND continue_workflow (unless fatal). " +
+            "Does not stop the session -- it creates a record for the auto-fix coordinator.",
+        inputSchema: {
+            type: 'object',
+            properties: {
+                kind: {
+                    type: 'string',
+                    enum: ['tool_failure', 'blocked', 'unexpected_behavior', 'needs_human', 'self_correction'],
+                    description: 'Category of issue being reported.',
+                },
+                severity: {
+                    type: 'string',
+                    enum: ['info', 'warn', 'error', 'fatal'],
+                    description: 'Severity level. Fatal means the session cannot continue productively.',
+                },
+                summary: {
+                    type: 'string',
+                    description: 'One-line summary of the issue. Max 200 chars.',
+                    maxLength: 200,
+                },
+                context: {
+                    type: 'string',
+                    description: 'What you were trying to do when this issue occurred.',
+                },
+                toolName: {
+                    type: 'string',
+                    description: 'Name of the tool that failed or behaved unexpectedly, if applicable.',
+                },
+                command: {
+                    type: 'string',
+                    description: 'The shell command or expression that caused the issue, if applicable.',
+                },
+                suggestedFix: {
+                    type: 'string',
+                    description: 'A suggested fix or recovery action for the auto-fix coordinator.',
+                },
+                continueToken: {
+                    type: 'string',
+                    description: 'The current continueToken, so the coordinator can resume this session.',
+                },
+            },
+            required: ['kind', 'severity', 'summary'], // all other properties are optional
+            additionalProperties: false,
+        },
+        label: 'report_issue',
+        execute: async (_toolCallId, params) => { // records the issue, emits an event if an emitter was given, and returns a text result
+            const record = {
+                sessionId,
+                kind: params.kind, // kind and severity are copied as given; this function does not check them against the schema enums
+                severity: params.severity,
+                summary: String(params.summary ?? '').slice(0, 200), // coerce to string and cap at 200 characters, matching the schema maxLength
+                ...(params.context !== undefined && { context: String(params.context) }), // optional fields are included only when supplied, coerced to string
+                ...(params.toolName !== undefined && { toolName: String(params.toolName) }),
+                ...(params.command !== undefined && { command: String(params.command) }),
+                ...(params.suggestedFix !== undefined && { suggestedFix: String(params.suggestedFix) }),
+                ...(params.continueToken !== undefined && { continueToken: String(params.continueToken) }),
+            };
+            void appendIssueAsync(issuesDir, sessionId, record).catch(() => { // fire-and-forget: the write is not awaited, so the tool result does not wait on disk I/O
+            }); // NOTE(review): write failures are swallowed here with no log -- presumably deliberate best-effort; confirm
+            emitter?.emit({ // emitter is optional; nothing is emitted when it is absent
+                kind: 'issue_reported',
+                sessionId,
+                issueKind: record.kind,
+                severity: record.severity,
+                summary: record.summary,
+                ...(record.continueToken !== undefined && { continueToken: record.continueToken }),
+            });
+            const isFatal = record.severity === 'fatal'; // in this function, fatal only selects which message text is returned
+            const message = isFatal
+                ? `FATAL issue recorded. Call continue_workflow with notes explaining the blocker, then the session will end.`
+                : `Issue recorded (severity=${record.severity}). Continue with your work unless this is fatal.`;
+            return {
+                content: [{ type: 'text', text: message }],
+                details: { sessionId, kind: record.kind, severity: record.severity },
+            };
+        },
+    };
+}
+const BASE_SYSTEM_PROMPT = `\
+You are WorkRail Auto, an autonomous agent that executes workflows step by step. You are running unattended -- there is no user watching. Your entire job is to faithfully complete the current workflow.
+## What you are
+You are highly capable. You handle ambitious, multi-step tasks that require real codebase understanding. You don't hedge, ask for permission, or stop to check in. You work.
+## Your oracle (consult in this order when uncertain)
+1. The daemon soul rules (## Agent Rules and Philosophy below)
+2. AGENTS.md / CLAUDE.md in the workspace (injected below under Workspace Context)
+3. The current workflow step's prompt and guidance
+4. Local code patterns in the relevant module (grep the directory, not the whole repo)
+5. Industry best practices -- only when nothing above applies
+## Self-directed reasoning
+Ask yourself questions to clarify your approach, then answer them yourself using tools before acting. Never wait for a human to answer -- you are the oracle.
+Bad pattern: "I'll analyze both layers." (no justification)
+Good pattern: "Question: Should I check the middleware? Answer: The workflow step says 'trace the full call chain', and the AGENTS.md says the entry point is in the middleware layer. Yes, start there."
+## Your tools
+- \`continue_workflow\`: Advance to the next step. Call this after completing each step's work. Always include your notes in notesMarkdown and round-trip the continueToken exactly.
+- \`Bash\`: Run shell commands. Use for building, testing, running scripts.
+- \`Read\`: Read files.
+- \`Write\`: Write files.
+- \`report_issue\`: Record a structured issue, error, or unexpected behavior. Call this AND continue_workflow (unless fatal). Does not stop the session -- it creates a record for the auto-fix coordinator.
+## Execution contract
+1. Read the step carefully. Do ALL the work the step asks for.
+2. Call \`continue_workflow\` with your notes. Include the continueToken exactly.
+3. Repeat until the workflow reports it is complete.
+4. Do NOT skip steps. Do NOT call \`continue_workflow\` without completing the step's work.
+## The workflow is the contract
+Every step must be fully completed before you call continue_workflow. The workflow step prompt is the specification of what 'done' means -- not a suggestion. Don't advance until the work is actually done.
+Your cognitive mode changes per step: some steps make you a researcher, others a reviewer, others an implementer. Adopt the mode the step describes. Don't bring your own agenda.
+## Silent failure is the worst outcome
+If something goes wrong: call report_issue, then continue unless severity is 'fatal'. Do NOT silently retry forever, work around failures without noting them, or pretend things worked. The issue record is how the system learns and self-heals.
+## Tools are your hands, not your voice
+Don't narrate what you're about to do. Use the tool and report what you found. Token efficiency matters -- you have a wall-clock timeout.
+## You don't have a user. You have a workflow and a soul.
+If you're unsure, consult the oracle above. If nothing answers the question, make a reasoned decision, call report_issue with kind='self_correction' to document it, and continue.\
+`; // Static preamble of the agent system prompt; buildSystemPrompt uses it as the first entry of its lines array.
 function buildSessionRecap(notes) {
     if (notes.length === 0)
         return '';
@@ -511,20 +654,7 @@ function buildSessionRecap(notes) {
 }
 function buildSystemPrompt(trigger, sessionState, soulContent, workspaceContext) {
     const lines = [
-        'You are WorkRail Auto, an autonomous agent that executes workflows step by step.',
-        '',
-        '## Your tools',
-        '- `continue_workflow`: Advance to the next step. Call this after completing each step\'s work.',
-        '  Always include your notes in notesMarkdown and round-trip the continueToken exactly.',
-        '- `Bash`: Run shell commands. Use for building, testing, running scripts.',
-        '- `Read`: Read files.',
-        '- `Write`: Write files.',
-        '',
-        '## Execution contract',
-        '1. Read the step carefully. Do ALL the work the step asks for.',
-        '2. Call `continue_workflow` with your notes. Include the continueToken exactly.',
-        '3. Repeat until the workflow reports it is complete.',
-        '4. Do NOT skip steps. Do NOT call `continue_workflow` without completing the step\'s work.',
+        BASE_SYSTEM_PROMPT,
         '',
         `<workrail_session_state>${sessionState}</workrail_session_state>`,
         '',
@@ -554,16 +684,21 @@ function buildUserMessage(text) {
         timestamp: Date.now(),
     };
 }
-async function runWorkflow(trigger, ctx, apiKey, daemonRegistry) {
+async function runWorkflow(trigger, ctx, apiKey, daemonRegistry, emitter) {
     const sessionId = (0, node_crypto_1.randomUUID)();
     console.log(`[WorkflowRunner] Session started: sessionId=${sessionId} workflowId=${trigger.workflowId}`);
-    daemonRegistry?.register(sessionId, trigger.workflowId);
+    emitter?.emit({
+        kind: 'session_started',
+        sessionId,
+        workflowId: trigger.workflowId,
+        workspacePath: trigger.workspacePath,
+    });
+    let workrailSessionId = null;
     let agentClient;
     let modelId;
     if (trigger.agentConfig?.model) {
         const slashIdx = trigger.agentConfig.model.indexOf('/');
         if (slashIdx === -1) {
-            daemonRegistry?.unregister(sessionId, 'failed');
             return {
                 _tag: 'error',
                 workflowId: trigger.workflowId,
@@ -591,7 +726,9 @@ async function runWorkflow(trigger, ctx, apiKey, daemonRegistry) {
     let lastStepNotes;
     const onAdvance = (stepText, _continueToken) => {
         pendingSteerText = stepText;
-        daemonRegistry?.heartbeat(sessionId);
+        if (workrailSessionId !== null)
+            daemonRegistry?.heartbeat(workrailSessionId);
+        emitter?.emit({ kind: 'step_advanced', sessionId, ...(workrailSessionId != null ? { workrailSessionId } : {}) });
     };
     const onComplete = (notes) => {
         isComplete = true;
@@ -602,9 +739,8 @@ async function runWorkflow(trigger, ctx, apiKey, daemonRegistry) {
         firstStep = trigger._preAllocatedStartResponse;
     }
     else {
-        const startResult = await (0, start_js_1.executeStartWorkflow)({ workflowId: trigger.workflowId, workspacePath: trigger.workspacePath, goal: trigger.goal }, ctx, { is_autonomous: 'true' });
+        const startResult = await (0, start_js_1.executeStartWorkflow)({ workflowId: trigger.workflowId, workspacePath: trigger.workspacePath, goal: trigger.goal }, ctx, { is_autonomous: 'true', workspacePath: trigger.workspacePath });
         if (startResult.isErr()) {
-            daemonRegistry?.unregister(sessionId, 'failed');
             return {
                 _tag: 'error',
                 workflowId: trigger.workflowId,
@@ -616,20 +752,35 @@ async function runWorkflow(trigger, ctx, apiKey, daemonRegistry) {
     }
     const startContinueToken = firstStep.continueToken ?? '';
     const startCheckpointToken = firstStep.checkpointToken ?? null;
+    if (startContinueToken) {
+        const decoded = await (0, v2_token_ops_js_1.parseContinueTokenOrFail)(startContinueToken, ctx.v2.tokenCodecPorts, ctx.v2.tokenAliasStore);
+        if (decoded.isOk()) {
+            workrailSessionId = decoded.value.sessionId;
+        }
+        else {
+            console.error(`[WorkflowRunner] Error: could not decode WorkRail session ID from continueToken -- isLive and liveActivity will not work for this session. Reason: ${decoded.error.message}`);
+        }
+    }
+    if (workrailSessionId !== null) {
+        daemonRegistry?.register(workrailSessionId, trigger.workflowId);
+    }
     if (startContinueToken) {
         await persistTokens(sessionId, startContinueToken, startCheckpointToken);
     }
     if (firstStep.isComplete) {
         await fs.unlink(path.join(exports.DAEMON_SESSIONS_DIR, `${sessionId}.json`)).catch(() => { });
-        daemonRegistry?.unregister(sessionId, 'completed');
+        emitter?.emit({ kind: 'session_completed', sessionId, workflowId: trigger.workflowId, outcome: 'success', detail: 'stop', ...(workrailSessionId != null ? { workrailSessionId } : {}) });
+        if (workrailSessionId !== null)
+            daemonRegistry?.unregister(workrailSessionId, 'completed');
         return { _tag: 'success', workflowId: trigger.workflowId, stopReason: 'stop' };
     }
     const schemas = getSchemas();
     const tools = [
-        makeContinueWorkflowTool(sessionId, ctx, onAdvance, onComplete, schemas),
-        makeBashTool(trigger.workspacePath, schemas),
-        makeReadTool(schemas),
-        makeWriteTool(schemas),
+        makeContinueWorkflowTool(sessionId, ctx, onAdvance, onComplete, schemas, index_js_1.executeContinueWorkflow, emitter, workrailSessionId),
+        makeBashTool(trigger.workspacePath, schemas, sessionId, emitter, workrailSessionId),
+        makeReadTool(schemas, sessionId, emitter, workrailSessionId),
+        makeWriteTool(schemas, sessionId, emitter, workrailSessionId),
+        makeReportIssueTool(sessionId, emitter),
     ];
     const [soulContent, workspaceContext, sessionNotes] = await Promise.all([
         loadDaemonSoul(trigger.soulFile),
@@ -644,12 +795,37 @@ async function runWorkflow(trigger, ctx, apiKey, daemonRegistry) {
         `\n\ncontinueToken: ${startContinueToken}` +
         contextJson +
         '\n\nComplete all step work, then call continue_workflow with your notes to begin.';
+    const agentCallbacks = {
+        onLlmTurnStarted: ({ messageCount }) => {
+            emitter?.emit({ kind: 'llm_turn_started', sessionId, messageCount });
+        },
+        onLlmTurnCompleted: ({ stopReason, outputTokens, inputTokens, toolNamesRequested }) => {
+            emitter?.emit({
+                kind: 'llm_turn_completed',
+                sessionId,
+                stopReason,
+                outputTokens,
+                inputTokens,
+                toolNamesRequested,
+            });
+        },
+        onToolCallStarted: ({ toolName, argsSummary }) => {
+            emitter?.emit({ kind: 'tool_call_started', sessionId, toolName, argsSummary });
+        },
+        onToolCallCompleted: ({ toolName, durationMs, resultSummary }) => {
+            emitter?.emit({ kind: 'tool_call_completed', sessionId, toolName, durationMs, resultSummary });
+        },
+        onToolCallFailed: ({ toolName, durationMs, errorMessage }) => {
+            emitter?.emit({ kind: 'tool_call_failed', sessionId, toolName, durationMs, errorMessage });
+        },
+    };
     const agent = new agent_loop_js_1.AgentLoop({
         systemPrompt: buildSystemPrompt(trigger, sessionState, soulContent, workspaceContext),
         modelId,
         tools,
         client: agentClient,
         toolExecution: 'sequential',
+        callbacks: agentCallbacks,
     });
     const sessionTimeoutMs = (trigger.agentConfig?.maxSessionMinutes ?? DEFAULT_SESSION_TIMEOUT_MINUTES) * 60 * 1000;
     const maxTurns = trigger.agentConfig?.maxTurns ?? 0;
@@ -658,6 +834,12 @@ async function runWorkflow(trigger, ctx, apiKey, daemonRegistry) {
     const unsubscribe = agent.subscribe(async (event) => {
         if (event.type !== 'turn_end')
             return;
+        for (const toolResult of event.toolResults) {
+            if (toolResult.isError) {
+                const errorText = toolResult.result?.content[0]?.text ?? 'tool error';
+                emitter?.emit({ kind: 'tool_error', sessionId, toolName: toolResult.toolName, error: errorText.slice(0, 200), ...(workrailSessionId != null ? { workrailSessionId } : {}) });
+            }
+        }
         turnCount++;
         if (maxTurns > 0 && turnCount >= maxTurns && timeoutReason === null) {
             timeoutReason = 'max_turns';
@@ -711,7 +893,9 @@ async function runWorkflow(trigger, ctx, apiKey, daemonRegistry) {
         console.log(`[WorkflowRunner] Agent loop ended: sessionId=${sessionId} stopReason=${stopReason}${errorMessage ? ` error=${errorMessage.slice(0, 120)}` : ''}`);
     }
     if (timeoutReason !== null) {
-        daemonRegistry?.unregister(sessionId, 'failed');
+        emitter?.emit({ kind: 'session_completed', sessionId, workflowId: trigger.workflowId, outcome: 'timeout', detail: timeoutReason, ...(workrailSessionId != null ? { workrailSessionId } : {}) });
+        if (workrailSessionId !== null)
+            daemonRegistry?.unregister(workrailSessionId, 'failed');
         const limitDescription = timeoutReason === 'wall_clock'
             ? `${trigger.agentConfig?.maxSessionMinutes ?? DEFAULT_SESSION_TIMEOUT_MINUTES} minutes`
             : `${trigger.agentConfig?.maxTurns} turns`;
@@ -724,17 +908,29 @@ async function runWorkflow(trigger, ctx, apiKey, daemonRegistry) {
         };
     }
     if (stopReason === 'error' || errorMessage) {
-        daemonRegistry?.unregister(sessionId, 'failed');
+        const errMsg = errorMessage ?? 'Agent stopped with error reason';
+        emitter?.emit({ kind: 'session_completed', sessionId, workflowId: trigger.workflowId, outcome: 'error', detail: errMsg.slice(0, 200), ...(workrailSessionId != null ? { workrailSessionId } : {}) });
+        if (workrailSessionId !== null)
+            daemonRegistry?.unregister(workrailSessionId, 'failed');
+        const stuckMarker = `\n\nWORKTRAIN_STUCK: ${JSON.stringify({
+            reason: 'session_error',
+            error: errMsg.slice(0, 500),
+            workflowId: trigger.workflowId,
+            sessionId,
+        })}`;
         return {
             _tag: 'error',
             workflowId: trigger.workflowId,
-            message: errorMessage ?? 'Agent stopped with error reason',
+            message: errMsg,
             stopReason,
+            lastStepNotes: stuckMarker,
         };
     }
     await fs.unlink(path.join(exports.DAEMON_SESSIONS_DIR, `${sessionId}.json`)).catch(() => {
     });
-    daemonRegistry?.unregister(sessionId, 'completed');
+    emitter?.emit({ kind: 'session_completed', sessionId, workflowId: trigger.workflowId, outcome: 'success', detail: stopReason, ...(workrailSessionId != null ? { workrailSessionId } : {}) });
+    if (workrailSessionId !== null)
+        daemonRegistry?.unregister(workrailSessionId, 'completed');
     return {
         _tag: 'success',
         workflowId: trigger.workflowId,