npm - @exaudeus/workrail - Versions diffs - 3.25.0 → 3.26.1 - Mend

@exaudeus/workrail 3.25.0 → 3.26.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59) hide show

package/dist/cli/commands/index.d.ts +5 -0
package/dist/cli/commands/index.js +12 -1
package/dist/cli/commands/worktrain-await.d.ts +35 -0
package/dist/cli/commands/worktrain-await.js +207 -0
package/dist/cli/commands/worktrain-inbox.d.ts +23 -0
package/dist/cli/commands/worktrain-inbox.js +82 -0
package/dist/cli/commands/worktrain-init.d.ts +23 -0
package/dist/cli/commands/worktrain-init.js +338 -0
package/dist/cli/commands/worktrain-spawn.d.ts +28 -0
package/dist/cli/commands/worktrain-spawn.js +106 -0
package/dist/cli/commands/worktrain-tell.d.ts +25 -0
package/dist/cli/commands/worktrain-tell.js +32 -0
package/dist/cli-worktrain.d.ts +2 -0
package/dist/cli-worktrain.js +169 -0
package/dist/cli.js +13 -3
package/dist/config/config-file.d.ts +2 -0
package/dist/config/config-file.js +55 -0
package/dist/daemon/agent-loop.d.ts +90 -0
package/dist/daemon/agent-loop.js +214 -0
package/dist/daemon/pi-mono-loader.d.ts +0 -5
package/dist/daemon/pi-mono-loader.js +0 -64
package/dist/daemon/soul-template.d.ts +2 -0
package/dist/daemon/soul-template.js +22 -0
package/dist/daemon/workflow-runner.d.ts +24 -2
package/dist/daemon/workflow-runner.js +244 -120
package/dist/manifest.json +147 -51
package/dist/mcp/output-schemas.d.ts +154 -154
package/dist/mcp/transports/bridge-entry.js +20 -2
package/dist/mcp/transports/bridge-events.d.ts +34 -0
package/dist/mcp/transports/bridge-events.js +24 -0
package/dist/mcp/transports/fatal-exit.d.ts +5 -0
package/dist/mcp/transports/fatal-exit.js +82 -0
package/dist/mcp/transports/http-entry.js +3 -0
package/dist/mcp/transports/stdio-entry.js +3 -7
package/dist/mcp/v2/tools.d.ts +7 -7
package/dist/trigger/delivery-action.d.ts +37 -0
package/dist/trigger/delivery-action.js +204 -0
package/dist/trigger/delivery-client.d.ts +11 -0
package/dist/trigger/delivery-client.js +27 -0
package/dist/trigger/trigger-listener.d.ts +2 -0
package/dist/trigger/trigger-listener.js +12 -2
package/dist/trigger/trigger-router.d.ts +8 -2
package/dist/trigger/trigger-router.js +164 -6
package/dist/trigger/trigger-store.d.ts +11 -3
package/dist/trigger/trigger-store.js +254 -13
package/dist/trigger/types.d.ts +24 -0
package/dist/trigger/types.js +4 -0
package/dist/v2/durable-core/schemas/execution-snapshot/blocked-snapshot.d.ts +22 -22
package/dist/v2/durable-core/schemas/execution-snapshot/execution-snapshot.v1.d.ts +114 -114
package/dist/v2/durable-core/schemas/export-bundle/index.d.ts +454 -454
package/dist/v2/durable-core/schemas/session/blockers.d.ts +14 -14
package/dist/v2/durable-core/schemas/session/events.d.ts +93 -93
package/dist/v2/durable-core/schemas/session/gaps.d.ts +2 -2
package/dist/v2/durable-core/schemas/session/validation-event.d.ts +4 -4
package/dist/v2/usecases/console-routes.js +33 -3
package/package.json +6 -4
package/spec/workflow-tags.json +1 -0
package/workflows/classify-task-workflow.json +68 -0
package/workflows/coding-task-workflow-agentic.lean.v2.json +43 -13

package/dist/v2/durable-core/schemas/session/gaps.d.ts CHANGED Viewed

@@ -170,7 +170,7 @@ export declare const GapRecordedDataV1Schema: z.ZodObject<{
         resolvesGapId: string;
     };
     gapId: string;
-    severity: "warning" | "info" | "critical";
+    severity: "info" | "warning" | "critical";
     evidenceRefs?: ({
         kind: "event";
         eventId: string;
@@ -200,7 +200,7 @@ export declare const GapRecordedDataV1Schema: z.ZodObject<{
         resolvesGapId: string;
     };
     gapId: string;
-    severity: "warning" | "info" | "critical";
+    severity: "info" | "warning" | "critical";
     evidenceRefs?: ({
         kind: "event";
         eventId: string;

package/dist/v2/durable-core/schemas/session/validation-event.d.ts CHANGED Viewed

@@ -47,22 +47,22 @@ export declare const ValidationPerformedDataV1Schema: z.ZodObject<{
     }>;
 }, "strict", z.ZodTypeAny, {
     contractRef: string;
-    attemptId: string;
-    validationId: string;
     result: {
         issues: readonly string[];
         valid: boolean;
         suggestions: readonly string[];
     };
-}, {
-    contractRef: string;
     attemptId: string;
     validationId: string;
+}, {
+    contractRef: string;
     result: {
         issues: readonly string[];
         valid: boolean;
         suggestions: readonly string[];
     };
+    attemptId: string;
+    validationId: string;
 }>;
 export type ValidationPerformedDataV1 = z.infer<typeof ValidationPerformedDataV1Schema>;
 export type ValidationPerformedResultV1 = z.infer<typeof ValidationPerformedResultV1Schema>;

package/dist/v2/usecases/console-routes.js CHANGED Viewed

@@ -44,6 +44,8 @@ const worktree_service_js_1 = require("./worktree-service.js");
 const workflow_js_1 = require("../../types/workflow.js");
 const dev_mode_js_1 = require("../../mcp/dev-mode.js");
 const workflow_runner_js_1 = require("../../daemon/workflow-runner.js");
+const start_js_1 = require("../../mcp/handlers/v2-execution/start.js");
+const v2_token_ops_js_1 = require("../../mcp/handlers/v2-token-ops.js");
 function watchSessionsDir(sessionsDir, onChanged) {
     try {
         fs_1.default.mkdirSync(sessionsDir, { recursive: true });
@@ -384,20 +386,48 @@ function mountConsoleRoutes(app, consoleService, workflowService, timingRingBuff
             res.status(503).json({ success: false, error: 'No LLM credentials available. Set ANTHROPIC_API_KEY or AWS_PROFILE.' });
             return;
         }
+        const startResult = await (0, start_js_1.executeStartWorkflow)({ workflowId, workspacePath, goal }, v2ToolContext, { is_autonomous: 'true' });
+        if (startResult.isErr()) {
+            const errDetail = `${startResult.error.kind}${'message' in startResult.error ? `: ${startResult.error.message}` : ''}`;
+            res.status(400).json({ success: false, error: `Session creation failed: ${errDetail}` });
+            return;
+        }
+        const startResponse = startResult.value.response;
+        const startContinueToken = startResponse.continueToken;
+        let sessionHandle;
+        if (startContinueToken) {
+            const tokenResult = await (0, v2_token_ops_js_1.parseContinueTokenOrFail)(startContinueToken, v2ToolContext.v2.tokenCodecPorts, v2ToolContext.v2.tokenAliasStore);
+            if (tokenResult.isErr()) {
+                console.error(`[ConsoleRoutes] Failed to decode session handle from continueToken: ${tokenResult.error.message}`);
+                res.status(500).json({ success: false, error: 'Internal error: could not extract session handle.' });
+                return;
+            }
+            sessionHandle = tokenResult.value.sessionId;
+        }
+        else {
+            sessionHandle = workflowId;
+        }
+        const trigger = { workflowId, goal, workspacePath, context, _preAllocatedStartResponse: startResponse };
         if (triggerRouter) {
-            triggerRouter.dispatch({ workflowId, goal, workspacePath, context });
+            triggerRouter.dispatch(trigger);
         }
         else {
-            void (0, workflow_runner_js_1.runWorkflow)({ workflowId, goal, workspacePath, context }, v2ToolContext, apiKey ?? '').then((result) => {
+            void (0, workflow_runner_js_1.runWorkflow)(trigger, v2ToolContext, apiKey ?? '').then((result) => {
                 if (result._tag === 'success') {
                     console.log(`[ConsoleRoutes] Auto dispatch completed: workflowId=${workflowId} stopReason=${result.stopReason}`);
                 }
+                else if (result._tag === 'timeout') {
+                    console.log(`[ConsoleRoutes] Auto dispatch timed out: workflowId=${workflowId}`);
+                }
+                else if (result._tag === 'delivery_failed') {
+                    console.log(`[ConsoleRoutes] Auto dispatch delivery failed: workflowId=${workflowId}`);
+                }
                 else {
                     console.log(`[ConsoleRoutes] Auto dispatch failed: workflowId=${workflowId} error=${result.message}`);
                 }
             });
         }
-        res.json({ success: true, data: { status: 'dispatched', workflowId } });
+        res.json({ success: true, data: { status: 'dispatched', workflowId, sessionHandle } });
     });
     app.get('/api/v2/triggers', (_req, res) => {
         if (!triggerRouter) {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@exaudeus/workrail",
-  "version": "3.25.0",
+  "version": "3.26.1",
   "description": "Step-by-step workflow enforcement for AI agents via MCP",
   "license": "MIT",
   "repository": {
@@ -12,7 +12,8 @@
   },
   "homepage": "https://github.com/EtienneBBeaulac/workrail#readme",
   "bin": {
-    "workrail": "dist/mcp-server.js"
+    "workrail": "dist/mcp-server.js",
+    "worktrain": "dist/cli-worktrain.js"
   },
   "exports": {
     ".": "./dist/mcp-server.js",
@@ -84,8 +85,8 @@
     "prepare": "bash scripts/setup-hooks.sh"
   },
   "dependencies": {
-    "@mariozechner/pi-agent-core": "0.67.2",
-    "@mariozechner/pi-ai": "0.67.2",
+    "@anthropic-ai/bedrock-sdk": "^0.28.1",
+    "@anthropic-ai/sdk": "^0.73.0",
     "@modelcontextprotocol/sdk": "^1.24.0",
     "@scure/base": "1.1.9",
     "ajv": "^8.17.1",
@@ -112,6 +113,7 @@
     "task-management"
   ],
   "devDependencies": {
+    "@duckdb/node-api": "^1.5.2-r.1",
     "@playwright/test": "^1.55.1",
     "@semantic-release/changelog": "^6.0.3",
     "@semantic-release/exec": "^7.1.0",

package/spec/workflow-tags.json CHANGED Viewed

@@ -125,6 +125,7 @@
     "workflow-diagnose-environment": { "tags": ["investigation"] },
     "workflow-for-workflows": { "tags": ["authoring"] },
     "wr.discovery": { "tags": ["design", "investigation"] },
+    "classify-task-workflow": { "tags": ["routines", "coding"] },
     "test-artifact-loop-control": { "tags": ["coding"], "hidden": true },
     "test-session-persistence": { "tags": ["coding"], "hidden": true },
     "test-missing-context": { "tags": ["coding"], "hidden": true }

package/workflows/classify-task-workflow.json ADDED Viewed

@@ -0,0 +1,68 @@
+{
+  "id": "classify-task-workflow",
+  "name": "Classify Task",
+  "version": "0.1.0",
+  "description": "Classifies a software task from the session goal into structured output variables used by coordinator scripts to decide which pipeline phases to run.",
+  "about": "## Classify Task Workflow\n\nThis is a fast, single-step classification utility. It reads the session goal and outputs structured variables that coordinator scripts use to decide which pipeline phases to run.\n\n### What it does\n\nGiven a task description, the agent classifies the work along seven dimensions and recommends an ordered pipeline of workflow IDs to execute.\n\n### When to use it\n\nUse this workflow at the start of a coordinator pipeline when you need to decide which downstream workflows to run. It is intentionally fast and cheap -- one LLM step, no subagents, no codebase reads.\n\n### What it produces\n\nA structured classification block in the step notes containing all seven output variables:\n- `taskComplexity` -- Small / Medium / Large\n- `riskLevel` -- Low / Medium / High\n- `hasUI` -- true / false\n- `touchesArchitecture` -- true / false\n- `taskType` -- feature / bug-fix / refactor / investigation / docs / chore\n- `affectedDomains` -- array of likely codebase areas\n- `recommendedPipeline` -- ordered array of workflow IDs\n\n### How to get good results\n\nProvide a specific, concrete task description as the session goal. The more specific the goal, the more accurate the classification. When the goal is ambiguous, the workflow defaults to conservative (higher complexity, more pipeline phases).",
+  "examples": [
+    "Classify: add real-time presence indicators to the messaging inbox UI",
+    "Classify: fix the race condition in the cache invalidation path",
+    "Classify: refactor the payment module to use Result types instead of exceptions",
+    "Classify: investigate why the build server fails on the integration test suite",
+    "Classify: update the onboarding docs to reflect the new CLI commands"
+  ],
+  "validatedAgainstSpecVersion": 3,
+  "recommendedPreferences": {
+    "recommendedAutonomy": "full_auto_never_stop",
+    "recommendedRiskPolicy": "aggressive"
+  },
+  "metaGuidance": [
+    "CONSERVATIVE DEFAULT: when in doubt, classify up -- higher complexity, more pipeline phases. It is safer to recommend an extra phase than to skip a critical one.",
+    "STRUCTURED OUTPUT REQUIRED: output must be a labeled structured block. Free-form prose does not satisfy this workflow's contract.",
+    "NO TOOLS NEEDED: classify from the goal text alone. Do not read files, run commands, or gather context. This workflow is intentionally cheap.",
+    "NO SUBAGENTS: do not delegate. The classification is a single reasoning pass by the main agent.",
+    "PIPELINE SELECTION LOGIC: use the provided decision rules in the step procedure. Do not invent new pipeline logic."
+  ],
+  "steps": [
+    {
+      "id": "classify-task",
+      "title": "Classify Task",
+      "promptBlocks": {
+        "goal": "Read the session goal and classify the software task into all seven required output variables. Produce a structured classification block that a coordinator script can parse reliably.",
+        "constraints": [
+          "Classify from goal text only. Do not read files, search the codebase, or gather context.",
+          "When any dimension is ambiguous, default to the more conservative value (higher complexity, higher risk, more pipeline phases).",
+          "All seven output variables are required. An empty or missing variable is a failure.",
+          "Output the classification block in the exact format shown in the procedure. Use the exact key names.",
+          "Output `affectedDomains` and `recommendedPipeline` as single-line JSON arrays -- no line breaks within the array value."
+        ],
+        "procedure": [
+          "1. Read the session goal carefully.",
+          "2. Classify each dimension using these rules:\n\n   **taskComplexity** (Small / Medium / Large)\n   - Small: isolated change, one component, clear path, low ambiguity (e.g. fix a typo, rename a symbol, update a config value)\n   - Medium: touches 2-4 components, moderate scope, some design decisions needed\n   - Large: cross-cutting change, architectural impact, high ambiguity, or significant new behavior\n   - Default: Medium when unsure\n\n   **riskLevel** (Low / Medium / High)\n   - Low: no user-visible behavior change, reversible, isolated\n   - Medium: user-visible change, moderate blast radius, or touches shared infrastructure\n   - High: data migration, payment/auth paths, production-critical infrastructure, irreversible changes\n   - Default: Medium when unsure\n\n   **hasUI** (true / false)\n   - true: task mentions UI, frontend, visual, screen, component, design, UX, CSS, layout, accessibility, animation, or any user-facing interface\n   - false: otherwise\n   - Default: false when unsure\n\n   **touchesArchitecture** (true / false)\n   - true: task introduces new abstractions, changes system boundaries, affects how components interact, changes APIs, or modifies data models in a non-trivial way\n   - false: otherwise (e.g. bug fix in existing logic, docs update, minor refactor within a component)\n   - Default: false when unsure\n   - Rule: Large tasks always set `touchesArchitecture: true` -- large scope changes affect system structure by definition\n\n   **taskType** (feature / bug-fix / refactor / investigation / docs / chore)\n   - feature: new user-visible functionality\n   - bug-fix: fixing incorrect behavior\n   - refactor: restructuring existing code without changing observable behavior\n   - investigation: diagnosing or understanding a problem without implementing a fix\n   - docs: documentation changes only\n   - chore: tooling, CI, deps, build, internal cleanup with no user impact\n   - Default: feature when unsure\n\n   **affectedDomains** (array)\n   - Scan the goal text for known domain keywords and infer likely areas. Use these domain labels: daemon, trigger, console, mcp, schema, engine, workflows, docs, infra, api, auth, payments, mobile, web\n   - Include a domain if the goal text strongly implies it, even if not named explicitly\n   - Use an empty array only if no domains can be reasonably inferred\n\n   **recommendedPipeline** (array of workflow IDs, in execution order)\n   Apply these selection rules in order:\n   - If taskType = 'bug-fix': prepend 'bug-investigation.agentic.v2'\n   - If taskComplexity is Medium or Large: include 'wr.discovery'\n   - If hasUI = true: include 'ui-ux-design-workflow'\n   - If touchesArchitecture = true OR riskLevel = High: include 'architecture-scalability-audit'\n   - If taskType is NOT 'investigation' AND taskType is NOT 'docs': include 'coding-task-workflow-agentic' -- note: chore is included here because chores can require code changes and benefit from review\n   - If 'coding-task-workflow-agentic' is included: include 'mr-review-workflow.agentic.v2' after it\n   - If riskLevel = High: append 'production-readiness-audit' at the end\n   - Order: [bug-investigation?, wr.discovery?, ui-ux-design-workflow?, architecture-scalability-audit?, coding-task-workflow-agentic?, mr-review-workflow.agentic.v2?, production-readiness-audit?]",
+          "3. Output the classification block using this exact format:\n\n```\n## Task Classification\n\ntaskComplexity: <Small|Medium|Large>\nriskLevel: <Low|Medium|High>\nhasUI: <true|false>\ntouchesArchitecture: <true|false>\ntaskType: <feature|bug-fix|refactor|investigation|docs|chore>\naffectedDomains: [\"<domain1>\", \"<domain2>\"]\nrecommendedPipeline: [\"<workflow-id-1>\", \"<workflow-id-2>\"]\n```\n\nAfter the block, add 2-4 sentences of reasoning: why you chose the key values, and what made anything uncertain."
+        ],
+        "outputRequired": {
+          "taskComplexity": "One of: Small / Medium / Large",
+          "riskLevel": "One of: Low / Medium / High",
+          "hasUI": "true or false -- does this task touch any UI, frontend, or visual layer?",
+          "touchesArchitecture": "true or false -- does this introduce new abstractions, change system boundaries, or affect how components interact?",
+          "taskType": "One of: feature / bug-fix / refactor / investigation / docs / chore",
+          "affectedDomains": "Array of likely codebase areas (e.g. [\"daemon\", \"console\"]). Use [] only if none can be inferred.",
+          "recommendedPipeline": "Ordered array of workflow IDs selected using the pipeline selection rules in the procedure."
+        },
+        "verify": [
+          "All seven output variables are present in the classification block.",
+          "Each variable uses the exact key name specified (taskComplexity, riskLevel, hasUI, touchesArchitecture, taskType, affectedDomains, recommendedPipeline).",
+          "recommendedPipeline contains only valid workflow IDs from the available library.",
+          "If taskType is feature, bug-fix, or refactor, recommendedPipeline includes coding-task-workflow-agentic.",
+          "If riskLevel is High, production-readiness-audit is the last item in recommendedPipeline.",
+          "If `hasUI` is true, `recommendedPipeline` includes `ui-ux-design-workflow`.",
+          "If `touchesArchitecture` is true OR `riskLevel` is High, `recommendedPipeline` includes `architecture-scalability-audit`.",
+          "If `taskType` is `bug-fix`, `bug-investigation.agentic.v2` is the first item in `recommendedPipeline`.",
+          "If `coding-task-workflow-agentic` is present in `recommendedPipeline`, `mr-review-workflow.agentic.v2` immediately follows it.",
+          "If `taskComplexity` is `Large`, `touchesArchitecture` must be `true`."
+        ]
+      }
+    }
+  ]
+}

package/workflows/coding-task-workflow-agentic.lean.v2.json CHANGED Viewed

@@ -22,7 +22,10 @@
         {
           "id": "design_soundness",
           "purpose": "Design decision is made, tradeoffs are recorded, and there is no remaining ambiguity about the chosen approach.",
-          "levels": ["low", "high"]
+          "levels": [
+            "low",
+            "high"
+          ]
         }
       ]
     },
@@ -33,7 +36,10 @@
         {
           "id": "design_gaps",
           "purpose": "Active scan completed: either no material gaps were found, or any found were addressed or explicitly filed.",
-          "levels": ["low", "high"]
+          "levels": [
+            "low",
+            "high"
+          ]
         }
       ]
     },
@@ -44,7 +50,10 @@
         {
           "id": "plan_completeness",
           "purpose": "Slices have clear boundaries and acceptance criteria. The agent knows what done looks like for each.",
-          "levels": ["low", "high"]
+          "levels": [
+            "low",
+            "high"
+          ]
         }
       ]
     },
@@ -55,7 +64,10 @@
         {
           "id": "invariant_clarity",
           "purpose": "Named invariants are checkable in the implementation. Non-goals are stated and will prevent scope creep.",
-          "levels": ["low", "high"]
+          "levels": [
+            "low",
+            "high"
+          ]
         }
       ]
     },
@@ -66,7 +78,10 @@
         {
           "id": "plan_gaps",
           "purpose": "Active scan completed: either no material gaps were found, or any found were addressed or explicitly filed.",
-          "levels": ["low", "high"]
+          "levels": [
+            "low",
+            "high"
+          ]
         }
       ]
     },
@@ -77,7 +92,10 @@
         {
           "id": "build_correctness",
           "purpose": "Build succeeds and tests pass. No compilation errors or failing assertions.",
-          "levels": ["low", "high"]
+          "levels": [
+            "low",
+            "high"
+          ]
         }
       ]
     },
@@ -88,7 +106,10 @@
         {
           "id": "invariant_preservation",
           "purpose": "Each named invariant from the plan has been verified in the implementation.",
-          "levels": ["low", "high"]
+          "levels": [
+            "low",
+            "high"
+          ]
         }
       ]
     },
@@ -99,7 +120,10 @@
         {
           "id": "implementation_gaps",
           "purpose": "Active scan completed: gaps found are either fixed inline, filed as follow-up tickets, or explicitly deferred with rationale.",
-          "levels": ["low", "high"]
+          "levels": [
+            "low",
+            "high"
+          ]
         }
       ]
     }
@@ -260,7 +284,9 @@
       ],
       "assessmentConsequences": [
         {
-          "when": { "anyEqualsLevel": "low" },
+          "when": {
+            "anyEqualsLevel": "low"
+          },
           "effect": {
             "kind": "require_followup",
             "guidance": "Address whichever gate scored low: design_soundness low -- the design decision is still ambiguous; commit to an approach and record the rationale before proceeding. design_gaps low -- the gap scan was not completed or found unaddressed gaps; either resolve them or explicitly file them before proceeding."
@@ -361,7 +387,9 @@
       ],
       "assessmentConsequences": [
         {
-          "when": { "anyEqualsLevel": "low" },
+          "when": {
+            "anyEqualsLevel": "low"
+          },
           "effect": {
             "kind": "require_followup",
             "guidance": "Address whichever gate scored low: plan_completeness low -- one or more slices lack clear boundaries or verifiable acceptance criteria; sharpen them before implementation begins. invariant_clarity low -- invariants or non-goals are too vague to verify against; make them concrete. plan_gaps low -- the gap scan was not completed or found unaddressed gaps; resolve or file them before proceeding."
@@ -472,7 +500,7 @@
         "var": "taskComplexity",
         "equals": "Small"
       },
-      "prompt": "For Small tasks, fast does not mean shallow. Every item below is required.\n\n**1. Confirm all wiring points with tools.**\nDon't assume a file you create is reachable. Check every public entry point:\n- Does the new symbol need to be exported from an index file?\n- Does it need to be imported and registered somewhere (CLI command map, router, DI container, plugin registry)?\n- Is there a test file that needs to reference it?\nTrace the full call path from the public interface down to your new code before writing anything.\n\n**2. Implement the smallest correct change.**\nChange exactly what needs changing. No drive-by refactors, no extra abstractions.\n\n**3. Verify end-to-end.**\n- Run build and tests. Both must pass.\n- Manually trace the new behavior through the public entry point (e.g. run the CLI command, check the export resolves, hit the endpoint). If you can't do this deterministically with tools, say why.\n- Apply the user's coding philosophy as the review lens. Flag any violation by principle name.\n\n**4. Produce a handoff note.**\nOutput a notes artifact containing:\n- `commitType`: feat / fix / chore / refactor / docs / test / perf (pick one)\n- `commitScope`: product area only (console / mcp / workflows / engine / schema / docs)\n- `commitSubject`: imperative mood, max 72 chars total with type(scope): prefix, no period\n- `prTitle`: same as full commit first line\n- `prBody`: markdown with ## Summary (bullets) and ## Test plan (checklist)\n- `followUpTickets`: list of deferred items, or empty\n- `filesChanged`: list of every file you created or modified\n\nThe daemon will use this artifact to run git commit and open the PR. Do not commit or push yourself.\n\nDo not create heavyweight planning artifacts unless risk unexpectedly grows.",
+      "prompt": "For Small tasks, fast does not mean shallow. Every item below is required.\n\n**1. Confirm all wiring points with tools.**\nDon't assume a file you create is reachable. Check every public entry point:\n- Does the new symbol need to be exported from an index file?\n- Does it need to be imported and registered somewhere (CLI command map, router, DI container, plugin registry)?\n- Is there a test file that needs to reference it?\nTrace the full call path from the public interface down to your new code before writing anything.\n\n**2. Implement the smallest correct change.**\nChange exactly what needs changing. No drive-by refactors, no extra abstractions.\n\n**3. Verify end-to-end.**\n- Run build and tests. Both must pass.\n- Manually trace the new behavior through the public entry point (e.g. run the CLI command, check the export resolves, hit the endpoint). If you can't do this deterministically with tools, say why.\n- Apply the user's coding philosophy as the review lens. Flag any violation by principle name.\n\n**4. Produce a handoff note.**\nOutput a notes artifact containing a JSON fenced block with the following fields.\nThe daemon reads this block to run `git commit` and `gh pr create` -- write it exactly as shown:\n\n```json\n{\n  \"commitType\": \"feat\",\n  \"commitScope\": \"mcp\",\n  \"commitSubject\": \"imperative mood, max 72 chars total with type(scope): prefix, no period\",\n  \"prTitle\": \"same as full commit first line\",\n  \"prBody\": \"markdown with ## Summary (bullets) and ## Test plan (checklist)\",\n  \"followUpTickets\": [],\n  \"filesChanged\": [\"src/path/to/file.ts\", \"tests/unit/file.test.ts\"]\n}\n```\n\nFields:\n- `commitType`: feat / fix / chore / refactor / docs / test / perf (pick one)\n- `commitScope`: product area only (console / mcp / workflows / engine / schema / docs)\n- `commitSubject`: imperative mood, max 72 chars total with type(scope): prefix, no period\n- `prTitle`: same as full commit first line\n- `prBody`: markdown with ## Summary (bullets) and ## Test plan (checklist)\n- `followUpTickets`: list of deferred items, or empty array\n- `filesChanged`: list of every file you created or modified (required -- do not omit)\n\nThe daemon will use this artifact to run git commit and open the PR. Do not commit or push yourself.\n\nDo not create heavyweight planning artifacts unless risk unexpectedly grows.",
       "requireConfirmation": false
     },
     {
@@ -594,7 +622,9 @@
           ],
           "assessmentConsequences": [
             {
-              "when": { "anyEqualsLevel": "low" },
+              "when": {
+                "anyEqualsLevel": "low"
+              },
               "effect": {
                 "kind": "require_followup",
                 "guidance": "Address whichever gate scored low: build_correctness low -- the build or tests are still failing; fix them before this step can complete. invariant_preservation low -- one or more invariants from the plan are violated; fix the implementation. implementation_gaps low -- the gap scan was not completed or found unaddressed gaps; fix them inline, file as follow-up tickets, or explicitly defer with rationale."
@@ -606,7 +636,7 @@
         {
           "id": "phase-7c-loop-decision",
           "title": "Final Verification Loop Decision",
-          "prompt": "Decide whether final verification needs another pass or whether we're done.\n\nThis loop gets up to two verify/fix passes.\n- If verification found real issues and you fixed them, keep going so the fixes get re-verified.\n- If the issues are clean or resolved, stop.\n- If you've hit the limit, stop and record what remains.\n\nWhen you stop, include:\n- acceptance criteria status\n- invariant status\n- test/build summary\n- a concise PR/MR draft (why, test plan, rollout notes)\n- follow-up tickets\n- any philosophy tensions you accepted on purpose\n\nThen emit the required loop-control artifact in this shape (`decision` must be `continue` or `stop`):\n```json\n{\n  \"artifacts\": [{\n    \"kind\": \"wr.loop_control\",\n    \"decision\": \"continue\"\n  }]\n}\n```",
+          "prompt": "Decide whether final verification needs another pass or whether we're done.\n\nThis loop gets up to two verify/fix passes.\n- If verification found real issues and you fixed them, keep going so the fixes get re-verified.\n- If the issues are clean or resolved, stop.\n- If you've hit the limit, stop and record what remains.\n\nWhen you stop, include:\n- acceptance criteria status\n- invariant status\n- test/build summary\n- follow-up tickets\n- any philosophy tensions you accepted on purpose\n\n**Handoff block (required for daemon auto-commit):**\nInclude a JSON fenced block in your notes. The daemon reads this to run `git commit` and `gh pr create`:\n\n```json\n{\n  \"commitType\": \"feat\",\n  \"commitScope\": \"mcp\",\n  \"commitSubject\": \"imperative mood, max 72 chars total with type(scope): prefix, no period\",\n  \"prTitle\": \"same as full commit first line\",\n  \"prBody\": \"markdown with ## Summary (bullets) and ## Test plan (checklist)\",\n  \"followUpTickets\": [],\n  \"filesChanged\": [\"src/path/to/file.ts\", \"tests/unit/file.test.ts\"]\n}\n```\n\nFields: `commitType` (feat/fix/chore/refactor/docs/test/perf), `commitScope` (product area only: console/mcp/workflows/engine/schema/docs), `commitSubject` (imperative, <=72 chars including prefix, no period), `prTitle` (same as commit first line), `prBody` (markdown), `followUpTickets` (array), `filesChanged` (required -- every file created or modified).\n\nThen emit the required loop-control artifact in this shape (`decision` must be `continue` or `stop`):\n```json\n{\n  \"artifacts\": [{\n    \"kind\": \"wr.loop_control\",\n    \"decision\": \"continue\"\n  }]\n}\n```",
           "requireConfirmation": true,
           "outputContract": {
             "contractRef": "wr.contracts.loop_control"