npm - @exaudeus/workrail - Versions diffs - 3.18.1 → 3.19.0 - Mend

@exaudeus/workrail 3.18.1 → 3.19.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

package/dist/console/assets/index-QhCFuxQV.js +28 -0
package/dist/console/index.html +1 -1
package/dist/manifest.json +22 -22
package/dist/mcp/server.js +25 -4
package/dist/mcp/tool-call-timing.d.ts +4 -0
package/dist/mcp/tool-call-timing.js +52 -0
package/dist/v2/durable-core/domain/observation-builder.js +2 -0
package/dist/v2/infra/local/data-dir/index.d.ts +1 -0
package/dist/v2/infra/local/data-dir/index.js +3 -0
package/dist/v2/ports/data-dir.port.d.ts +1 -0
package/dist/v2/usecases/console-routes.d.ts +1 -1
package/dist/v2/usecases/console-routes.js +61 -4
package/package.json +1 -1
package/workflows/workflow-for-workflows.json +33 -5
package/dist/console/assets/index-DMaX2-CW.js +0 -28

package/dist/console/index.html CHANGED Viewed

@@ -4,7 +4,7 @@
     <meta charset="UTF-8" />
     <meta name="viewport" content="width=device-width, initial-scale=1.0" />
     <title>WorkRail Console</title>
-    <script type="module" crossorigin src="/console/assets/index-DMaX2-CW.js"></script>
+    <script type="module" crossorigin src="/console/assets/index-QhCFuxQV.js"></script>
     <link rel="stylesheet" crossorigin href="/console/assets/index-ibLhWBmX.css">
   </head>
   <body>

package/dist/manifest.json CHANGED Viewed

@@ -369,16 +369,16 @@
       "sha256": "5fe866e54f796975dec5d8ba9983aefd86074db212d3fccd64eed04bc9f0b3da",
       "bytes": 8011
     },
-    "console/assets/index-DMaX2-CW.js": {
-      "sha256": "9f9fe84d6eac1497afc2564f1b975a3494514c9b7b36b4a32c5473b831e56fbf",
-      "bytes": 712124
+    "console/assets/index-QhCFuxQV.js": {
+      "sha256": "0096a86267fdf969abc3e3976ca44b3d3447271c7394345c8d6c27c084e6412c",
+      "bytes": 719937
     },
     "console/assets/index-ibLhWBmX.css": {
       "sha256": "346e55635d4d3dc2836dae83edb8563872721bf4b0e7e1ecf47fb9603424c206",
       "bytes": 58826
     },
     "console/index.html": {
-      "sha256": "c708c996c5682570d44110dbef54b7b2a367bfa3bd99e36b358e94dda74302a4",
+      "sha256": "4232baa5128b860125a649d8e135da858f07290bbb9da04861945649b53ac85d",
       "bytes": 417
     },
     "core/error-handler.d.ts": {
@@ -1026,8 +1026,8 @@
       "bytes": 960
     },
     "mcp/server.js": {
-      "sha256": "f8414b17dcbf8f48eefd69f932785ce3e3a58a50609eb2309300c018ac6e1418",
-      "bytes": 15106
+      "sha256": "a54d39ce8d7282abe16d140abbe1011e67cd3f9d9353f40727c44c1c212a90c2",
+      "bytes": 16152
     },
     "mcp/step-content-envelope.d.ts": {
       "sha256": "19bd63c4d4de1d5d93393d346625d28ffd1bebdc320d4ba4e694cb740ec97d3b",
@@ -1038,12 +1038,12 @@
       "bytes": 483
     },
     "mcp/tool-call-timing.d.ts": {
-      "sha256": "b16ef00e70dcb03f3117d3489bef93d1da6c86a6b15678b5d21076316f281a33",
-      "bytes": 1116
+      "sha256": "d775153fb5bb7c7b2bc896b2f9a57dc48ee0d0949307778dcdfea293bf0e394b",
+      "bytes": 1320
     },
     "mcp/tool-call-timing.js": {
-      "sha256": "2aa6997582d52abb2fdb2bb27a46ab6aca2b26657c2771b153a720e8c322196d",
-      "bytes": 2715
+      "sha256": "b3ae45196ab4f9d089a77703efaaa17e7e012e7019b1a5cfee9b128e67119c0c",
+      "bytes": 4776
     },
     "mcp/tool-description-provider.d.ts": {
       "sha256": "1d46abc3112e11b68e57197e846f5708293ec9b2281fa71a9124ee2aad71e41b",
@@ -1666,8 +1666,8 @@
       "bytes": 619
     },
     "v2/durable-core/domain/observation-builder.js": {
-      "sha256": "204aae8e096ae1b947812fa5edd3b1c91706460a302f401a9a95956d124fe893",
-      "bytes": 1830
+      "sha256": "df833dd1e0663acd4daf99cf27dc599b2c5e4a9e9c60ef88c1b0932892f9c62a",
+      "bytes": 1951
     },
     "v2/durable-core/domain/outputs.d.ts": {
       "sha256": "adc32e4b86c8036eac61096fe83371140c7de140db414227041a8854435f8f54",
@@ -2190,12 +2190,12 @@
       "bytes": 457
     },
     "v2/infra/local/data-dir/index.d.ts": {
-      "sha256": "082fce7c347f0e9fade727365c84010afce4cb1c10a56c31cd5598ba029a6f59",
-      "bytes": 993
+      "sha256": "b51169bfbaabb5149f874dc7b545099bc67e3615d92ee1a11163b39f1d12e218",
+      "bytes": 1016
     },
     "v2/infra/local/data-dir/index.js": {
-      "sha256": "79543d5c1797c34e171a848fd6c4bcef3c5f8aa76fbe58aa5ae68cfa9aca6d18",
-      "bytes": 3602
+      "sha256": "9ed70045f305f8a2257cab5fd5c7c2b9d12b678d15a67dde177145d1524c0f6b",
+      "bytes": 3671
     },
     "v2/infra/local/directory-listing/index.d.ts": {
       "sha256": "3139014cb738db3b0f10beca01a3a4a35b9ab8e72c8889b3bbff204fdbcb6b6c",
@@ -2366,8 +2366,8 @@
       "bytes": 77
     },
     "v2/ports/data-dir.port.d.ts": {
-      "sha256": "6f028592ad207b522e2b00be1d7252004595d48354a0a4d95a6be575c876ac59",
-      "bytes": 756
+      "sha256": "6713270d6e894e6ecf3cd6f0583dd16edfea771827ea2693f6ea54b970e97eb2",
+      "bytes": 779
     },
     "v2/ports/data-dir.port.js": {
       "sha256": "d43aa81f5bc89faa359e0f97c814ba25155591ff078fbb9bfd40f8c7c9683230",
@@ -2646,12 +2646,12 @@
       "bytes": 4795
     },
     "v2/usecases/console-routes.d.ts": {
-      "sha256": "13731496ddce8a46f1674d24a8660e790016dc77cd562106b95436e5a5513f72",
-      "bytes": 456
+      "sha256": "1afd41269475fecd4a27ac1c5faccf1e369ec8bd8c9a9c36d38ed92c79e4ec51",
+      "bytes": 508
     },
     "v2/usecases/console-routes.js": {
-      "sha256": "c9f3047a070722fc6142dedcb7b74b12581d969eba63af6b788ddb9e4ad59806",
-      "bytes": 12838
+      "sha256": "315a10a46cacd8bf279ecdc72b2cfac912f6d6ab5f606419d16fd734c9406718",
+      "bytes": 15503
     },
     "v2/usecases/console-service.d.ts": {
       "sha256": "489a44091dc1b15ff938a60f9cf3ac28363614b9f0446286f0914157528c7eb3",

package/dist/mcp/server.js CHANGED Viewed

@@ -35,6 +35,8 @@ var __importStar = (this && this.__importStar) || (function () {
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.createToolContext = createToolContext;
 exports.composeServer = composeServer;
+const fs = __importStar(require("fs"));
+const path = __importStar(require("path"));
 const zod_to_json_schema_js_1 = require("./zod-to-json-schema.js");
 const container_js_1 = require("../di/container.js");
 const tokens_js_1 = require("../di/tokens.js");
@@ -164,6 +166,18 @@ async function composeServer() {
     await (0, container_js_1.bootstrap)();
     const ctx = await createToolContext();
     const timingRingBuffer = new tool_call_timing_js_1.ToolCallTimingRingBuffer(tool_call_timing_js_1.DEFAULT_RING_BUFFER_CAPACITY);
+    let serverVersion = 'unknown';
+    try {
+        const pkgPath = path.resolve(__dirname, '../../package.json');
+        const pkgJson = JSON.parse(fs.readFileSync(pkgPath, 'utf8'));
+        if (pkgJson.version)
+            serverVersion = pkgJson.version;
+    }
+    catch {
+    }
+    const toolCallsPerfFile = ctx.v2?.dataDir
+        ? path.join(ctx.v2.dataDir.perfDir(), 'tool-calls.jsonl')
+        : null;
     if (ctx.v2 && ctx.httpServer && ctx.v2.dataDir && ctx.v2.directoryListing) {
         const { ConsoleService } = await Promise.resolve().then(() => __importStar(require('../v2/usecases/console-service.js')));
         const { mountConsoleRoutes } = await Promise.resolve().then(() => __importStar(require('../v2/usecases/console-routes.js')));
@@ -174,7 +188,7 @@ async function composeServer() {
             snapshotStore: ctx.v2.snapshotStore,
             pinnedWorkflowStore: ctx.v2.pinnedStore,
         });
-        ctx.httpServer.mountRoutes((app) => mountConsoleRoutes(app, consoleService, ctx.workflowService, timingRingBuffer));
+        ctx.httpServer.mountRoutes((app) => mountConsoleRoutes(app, consoleService, ctx.workflowService, timingRingBuffer, toolCallsPerfFile ?? undefined, serverVersion));
         console.error('[Console] v2 Console API routes mounted at /api/v2/');
     }
     ctx.httpServer?.finalize();
@@ -218,9 +232,16 @@ async function composeServer() {
         tools,
     }));
     const devMode = (0, dev_mode_js_1.isDevMode)();
-    const timingSink = devMode
-        ? (0, tool_call_timing_js_1.composeSinks)((0, tool_call_timing_js_1.createRingBufferSink)(timingRingBuffer), (0, tool_call_timing_js_1.createDevPerfSink)())
-        : (0, tool_call_timing_js_1.createRingBufferSink)(timingRingBuffer);
+    const diskSink = toolCallsPerfFile
+        ? (0, tool_call_timing_js_1.createDiskPersistSink)(toolCallsPerfFile, serverVersion)
+        : null;
+    const timingSink = diskSink
+        ? devMode
+            ? (0, tool_call_timing_js_1.composeSinks)((0, tool_call_timing_js_1.createRingBufferSink)(timingRingBuffer), diskSink, (0, tool_call_timing_js_1.createDevPerfSink)())
+            : (0, tool_call_timing_js_1.composeSinks)((0, tool_call_timing_js_1.createRingBufferSink)(timingRingBuffer), diskSink)
+        : devMode
+            ? (0, tool_call_timing_js_1.composeSinks)((0, tool_call_timing_js_1.createRingBufferSink)(timingRingBuffer), (0, tool_call_timing_js_1.createDevPerfSink)())
+            : (0, tool_call_timing_js_1.createRingBufferSink)(timingRingBuffer);
     if (devMode) {
         console.error('[PerfTrace] WORKRAIL_DEV=1 -- tool call timing active');
     }

package/dist/mcp/tool-call-timing.d.ts CHANGED Viewed

@@ -1,4 +1,7 @@
 export type ToolCallOutcome = 'success' | 'error' | 'unknown_tool';
+export type ToolCallTimingEntry = ToolCallTiming & {
+    readonly serverVersion: string;
+};
 export interface ToolCallTiming {
     readonly toolName: string;
     readonly startedAtMs: number;
@@ -19,6 +22,7 @@ export declare class ToolCallTimingRingBuffer {
 }
 export declare const DEFAULT_RING_BUFFER_CAPACITY = 100;
 export declare function createRingBufferSink(buffer: ToolCallTimingRingBuffer): ToolCallTimingSink;
+export declare function createDiskPersistSink(perfFilePath: string, serverVersion: string): ToolCallTimingSink;
 export declare function createDevPerfSink(): ToolCallTimingSink;
 export declare function composeSinks(...sinks: ToolCallTimingSink[]): ToolCallTimingSink;
 export declare function withToolCallTiming<T>(toolName: string, handler: () => Promise<T>, sink: ToolCallTimingSink): Promise<T>;

package/dist/mcp/tool-call-timing.js CHANGED Viewed

@@ -1,10 +1,46 @@
 "use strict";
+var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    var desc = Object.getOwnPropertyDescriptor(m, k);
+    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
+      desc = { enumerable: true, get: function() { return m[k]; } };
+    }
+    Object.defineProperty(o, k2, desc);
+}) : (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    o[k2] = m[k];
+}));
+var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
+    Object.defineProperty(o, "default", { enumerable: true, value: v });
+}) : function(o, v) {
+    o["default"] = v;
+});
+var __importStar = (this && this.__importStar) || (function () {
+    var ownKeys = function(o) {
+        ownKeys = Object.getOwnPropertyNames || function (o) {
+            var ar = [];
+            for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
+            return ar;
+        };
+        return ownKeys(o);
+    };
+    return function (mod) {
+        if (mod && mod.__esModule) return mod;
+        var result = {};
+        if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]);
+        __setModuleDefault(result, mod);
+        return result;
+    };
+})();
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.DEFAULT_RING_BUFFER_CAPACITY = exports.ToolCallTimingRingBuffer = exports.noopToolCallTimingSink = void 0;
 exports.createRingBufferSink = createRingBufferSink;
+exports.createDiskPersistSink = createDiskPersistSink;
 exports.createDevPerfSink = createDevPerfSink;
 exports.composeSinks = composeSinks;
 exports.withToolCallTiming = withToolCallTiming;
+const fs = __importStar(require("fs"));
+const path = __importStar(require("path"));
 const noopToolCallTimingSink = () => { };
 exports.noopToolCallTimingSink = noopToolCallTimingSink;
 class ToolCallTimingRingBuffer {
@@ -44,6 +80,22 @@ function createRingBufferSink(buffer) {
         buffer.push(timing);
     };
 }
+function createDiskPersistSink(perfFilePath, serverVersion) {
+    try {
+        fs.mkdirSync(path.dirname(perfFilePath), { recursive: true });
+    }
+    catch { }
+    let warnedOnce = false;
+    return (timing) => {
+        const entry = { ...timing, serverVersion };
+        fs.promises.appendFile(perfFilePath, JSON.stringify(entry) + '\n').catch((err) => {
+            if (!warnedOnce) {
+                warnedOnce = true;
+                process.stderr.write(`[PerfTrace] Failed to write timing to disk: ${String(err)}\n`);
+            }
+        });
+    };
+}
 function createDevPerfSink() {
     return (timing) => {
         const outcomeLabel = timing.outcome === 'success' ? 'OK' : timing.outcome.toUpperCase();

package/dist/v2/durable-core/domain/observation-builder.js CHANGED Viewed

@@ -34,6 +34,8 @@ function anchorsToObservations(anchors) {
                 });
                 break;
             case 'repo_root':
+                if (anchor.value.length > constants_js_1.MAX_OBSERVATION_SHORT_STRING_LENGTH)
+                    break;
                 observations.push({
                     key: 'repo_root',
                     value: { type: 'short_string', value: anchor.value },

package/dist/v2/infra/local/data-dir/index.d.ts CHANGED Viewed

@@ -21,4 +21,5 @@ export declare class LocalDataDirV2 implements DataDirPortV2 {
     tokenIndexPath(): string;
     managedSourcesPath(): string;
     managedSourcesLockPath(): string;
+    perfDir(): string;
 }

package/dist/v2/infra/local/data-dir/index.js CHANGED Viewed

@@ -95,5 +95,8 @@ class LocalDataDirV2 {
     managedSourcesLockPath() {
         return path.join(this.root(), 'managed-sources', 'managed-sources.lock');
     }
+    perfDir() {
+        return path.join(this.root(), 'perf');
+    }
 }
 exports.LocalDataDirV2 = LocalDataDirV2;

package/dist/v2/ports/data-dir.port.d.ts CHANGED Viewed

@@ -16,4 +16,5 @@ export interface DataDirPortV2 {
     tokenIndexPath(): string;
     managedSourcesPath(): string;
     managedSourcesLockPath(): string;
+    perfDir(): string;
 }

package/dist/v2/usecases/console-routes.d.ts CHANGED Viewed

@@ -2,4 +2,4 @@ import type { Application } from 'express';
 import type { ConsoleService } from './console-service.js';
 import type { WorkflowService } from '../../application/services/workflow-service.js';
 import type { ToolCallTimingRingBuffer } from '../../mcp/tool-call-timing.js';
-export declare function mountConsoleRoutes(app: Application, consoleService: ConsoleService, workflowService?: WorkflowService, timingRingBuffer?: ToolCallTimingRingBuffer): () => void;
+export declare function mountConsoleRoutes(app: Application, consoleService: ConsoleService, workflowService?: WorkflowService, timingRingBuffer?: ToolCallTimingRingBuffer, toolCallsPerfFile?: string, serverVersion?: string): () => void;

package/dist/v2/usecases/console-routes.js CHANGED Viewed

@@ -53,7 +53,7 @@ function loadWorkflowTags() {
         return { version: 0, tags: [], workflows: {} };
     }
 }
-function mountConsoleRoutes(app, consoleService, workflowService, timingRingBuffer) {
+function mountConsoleRoutes(app, consoleService, workflowService, timingRingBuffer, toolCallsPerfFile, serverVersion) {
     const sseClients = new Set();
     let sseDebounceTimer = null;
     function broadcastChange() {
@@ -99,14 +99,71 @@ function mountConsoleRoutes(app, consoleService, workflowService, timingRingBuff
         req.on('close', () => { sseClients.delete(res); });
         res.on('close', () => { sseClients.delete(res); });
     });
+    const THIRTY_DAYS_MS = 30 * 24 * 60 * 60 * 1000;
+    const PERF_FILE_READ_LIMIT_BYTES = 5 * 1024 * 1024;
+    async function readDiskEntries(perfFile) {
+        try {
+            const stat = await fs_1.default.promises.stat(perfFile);
+            let raw;
+            if (stat.size > PERF_FILE_READ_LIMIT_BYTES) {
+                const fd = await fs_1.default.promises.open(perfFile, 'r');
+                const offset = stat.size - PERF_FILE_READ_LIMIT_BYTES;
+                const buf = Buffer.alloc(PERF_FILE_READ_LIMIT_BYTES);
+                await fd.read(buf, 0, PERF_FILE_READ_LIMIT_BYTES, offset);
+                await fd.close();
+                raw = buf.toString('utf8');
+            }
+            else {
+                raw = await fs_1.default.promises.readFile(perfFile, 'utf8');
+            }
+            const cutoff = Date.now() - THIRTY_DAYS_MS;
+            return raw
+                .split('\n')
+                .filter(Boolean)
+                .flatMap((line) => {
+                try {
+                    const entry = JSON.parse(line);
+                    if (typeof entry.toolName !== 'string' ||
+                        typeof entry.startedAtMs !== 'number' ||
+                        typeof entry.durationMs !== 'number' ||
+                        (entry.outcome !== 'success' && entry.outcome !== 'error' && entry.outcome !== 'unknown_tool'))
+                        return [];
+                    const safeEntry = typeof entry.serverVersion === 'string'
+                        ? entry
+                        : { ...entry, serverVersion: 'unknown' };
+                    if (safeEntry.startedAtMs < cutoff)
+                        return [];
+                    return [safeEntry];
+                }
+                catch {
+                    return [];
+                }
+            });
+        }
+        catch {
+            return [];
+        }
+    }
     const devMode = (0, dev_mode_js_1.isDevMode)();
     if (devMode) {
-        app.get('/api/v2/perf/tool-calls', (req, res) => {
+        app.get('/api/v2/perf/tool-calls', async (req, res) => {
             const rawLimit = req.query['limit'];
             const limit = typeof rawLimit === 'string' ? parseInt(rawLimit, 10) : undefined;
             const safeLimit = (limit !== undefined && Number.isFinite(limit) && limit > 0) ? limit : undefined;
-            const observations = timingRingBuffer ? timingRingBuffer.recent(safeLimit) : [];
-            res.json({ success: true, data: { observations, total: timingRingBuffer?.size ?? 0, devMode } });
+            const diskEntries = toolCallsPerfFile ? await readDiskEntries(toolCallsPerfFile) : [];
+            const ringEntries = timingRingBuffer ? timingRingBuffer.recent(safeLimit) : [];
+            const version = serverVersion ?? 'unknown';
+            const ringEntriesWithVersion = ringEntries.map((t) => ({
+                ...t,
+                serverVersion: version,
+            }));
+            const dedupeKey = (e) => `${e.toolName}:${e.startedAtMs}:${e.durationMs}`;
+            const inMemoryKeys = new Set(ringEntriesWithVersion.map(dedupeKey));
+            const diskOnlyEntries = diskEntries.filter((e) => !inMemoryKeys.has(dedupeKey(e)));
+            const allEntries = [...ringEntriesWithVersion, ...diskOnlyEntries]
+                .sort((a, b) => b.startedAtMs - a.startedAtMs)
+                .slice(0, safeLimit ?? undefined);
+            res.json({ success: true, data: { observations: allEntries, devMode } });
         });
     }
     app.get('/api/v2/sessions', async (_req, res) => {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@exaudeus/workrail",
-  "version": "3.18.1",
+  "version": "3.19.0",
   "description": "Step-by-step workflow enforcement for AI agents via MCP",
   "license": "MIT",
   "repository": {

package/workflows/workflow-for-workflows.json CHANGED Viewed

@@ -170,11 +170,12 @@
           "State what result the authored workflow should reliably produce for its user.",
           "List the criteria that would make the workflow feel genuinely satisfying in practice.",
           "Name the biggest likely failure mode and the most dangerous false-confidence mode.",
-          "State what would make the workflow technically correct but still disappointing."
+          "State what would make the workflow technically correct but still disappointing.",
+          "Build a success-criteria-to-mechanism map: for each item in userSatisfactionCriteria, name the specific step(s) that enforce it and the enforcement mechanism (gate, self-audit, second pass, example contrast, rubric). Any criterion with no named mechanism is a gap -- either add a mechanism to the planned architecture or flag it as a known weakness to address in Phase 3."
         ],
         "outputRequired": {
-          "notesMarkdown": "Effectiveness target, satisfaction criteria, failure modes, and false-confidence risks.",
-          "context": "Capture effectivenessTarget, userSatisfactionCriteria, primaryFailureMode, dangerousFalseConfidenceModes, likelyWeakOutcomeModes, and trustRisk."
+          "notesMarkdown": "Effectiveness target, satisfaction criteria, failure modes, false-confidence risks, and the success-criteria-to-mechanism map with any gaps identified.",
+          "context": "Capture effectivenessTarget, userSatisfactionCriteria, primaryFailureMode, dangerousFalseConfidenceModes, likelyWeakOutcomeModes, trustRisk, and successCriteriaToMechanismMap."
         },
         "verify": [
           "The authored workflow now has a clear outcome bar, not just an authoring bar."
@@ -492,11 +493,12 @@
               "Reviewer-family or validator output is evidence, not authority."
             ],
             "procedure": [
-              "Score these dimensions 0-2 with one sentence of evidence each: `voiceClarity`, `ceremonyLevel`, `loopSoundness`, `delegationBoundedness`, `artifactClarity`, `taskEffectiveness`, `falseConfidenceResistance`, `stateMinimality`, `coverageSharpness`, `domainFit`, `handoffUtility`, `rigorAdaptability` (0 = adapts to complexity/rigor levels, 2 = single-weight), `enforcementStrength` (0 = behavioral rules have structural teeth; 2 = important rules are prose-only with no enforcement mechanism), and `modernizationDiscipline` (0 = every valueInventory item preserved, equivalently replaced with justification, or dropped with justification; 2 = items missing or replaced with weaker versions without justification  -- score 0 for create mode).",
+              "Score these dimensions 0-2 with one sentence of evidence each: `voiceClarity`, `ceremonyLevel`, `loopSoundness`, `delegationBoundedness`, `artifactClarity`, `taskEffectiveness`, `falseConfidenceResistance`, `stateMinimality`, `coverageSharpness`, `domainFit`, `handoffUtility`, `rigorAdaptability` (0 = adapts to complexity/rigor levels, 2 = single-weight), `enforcementStrength` (0 = behavioral rules have structural teeth; 2 = important rules are prose-only with no enforcement mechanism), `outputQualityMechanisms` (0 = each key generative step has a concrete enforcement mechanism for output quality such as a self-audit, second pass, example contrast, or rubric; 1 = some generative steps rely only on metaGuidance or prose rules; 2 = generative steps have no quality enforcement beyond prompt wording), and `modernizationDiscipline` (0 = every valueInventory item preserved, equivalently replaced with justification, or dropped with justification; 2 = items missing or replaced with weaker versions without justification  -- score 0 for create mode).",
+              "For each generative step (any step whose output is judged on content quality rather than structural correctness), run an adversarial trace: what does a lazy or average agent do here, and does the prompt prevent it? A step where the lazy path produces a plausible-looking but shallow result scores poorly on `outputQualityMechanisms`. Check each such step against the successCriteriaToMechanismMap from Phase 1 -- any criterion whose mechanism lives in this step must actually be enforced here.",
               "If delegation is available and rigor is THOROUGH, run an adversarial review bundle with these lenses: `engine_native_reviewer`, `task_effectiveness_reviewer`, `state_economy_reviewer`, `false_confidence_reviewer`, `domain_fit_reviewer`, and `maintainer_reviewer`.",
               "Synthesize what the review confirmed, what it challenged, and what changed your mind.",
               "When scoring `falseConfidenceResistance`, explicitly check: do the workflow's quality gates protect edge cases and degraded paths, or only the happy path? A workflow that passes its own checks on ideal input but fails silently on minimal or unexpected input scores 2.",
-              "Set hard-gate failures whenever any of these are materially weak: `taskEffectiveness`, `falseConfidenceResistance`, `stateMinimality`, `coverageSharpness`, `domainFit`, or `handoffUtility`.",
+              "Set hard-gate failures whenever any of these are materially weak: `taskEffectiveness`, `falseConfidenceResistance`, `stateMinimality`, `coverageSharpness`, `domainFit`, `handoffUtility`, or `outputQualityMechanisms`.",
               "Set `authoringIntegrityPassed = true` only if structural and authoring-quality dimensions are all acceptable. Set `outcomeEffectivenessPassed = true` only if the workflow is likely to achieve satisfying results for the user."
             ],
             "outputRequired": {
@@ -548,6 +550,7 @@
             { "type": "contains", "value": "handoffUtility", "message": "Review must score handoffUtility" },
             { "type": "contains", "value": "rigorAdaptability", "message": "Review must score rigorAdaptability" },
             { "type": "contains", "value": "enforcementStrength", "message": "Review must score enforcementStrength" },
+            { "type": "contains", "value": "outputQualityMechanisms", "message": "Review must score outputQualityMechanisms" },
             {
               "type": "contains",
               "value": "modernizationDiscipline",
@@ -665,6 +668,31 @@
       },
       "notesOptional": true,
       "requireConfirmation": false
+    },
+    {
+      "id": "phase-8-process-retrospective",
+      "title": "Phase 8: Process Retrospective",
+      "promptBlocks": {
+        "goal": "While this run is still fresh, identify gaps in the workflow-for-workflows process itself -- not in the authored workflow.",
+        "constraints": [
+          "This step is about the authoring process, not the authored workflow. Do not summarize the workflow again.",
+          "Be honest. If the process caught everything, say so. If it missed something, say specifically where and why."
+        ],
+        "procedure": [
+          "Look back at the full run. Were any weaknesses in the authored workflow only identified post-hoc -- after the quality gate loop, by the user, or by a later reviewer?",
+          "For each weakness identified late: name the Phase where it should have been caught, explain why the current step failed to surface it, and propose a specific change to that step's procedure or scoring rubric that would catch it on the next run.",
+          "Check the successCriteriaToMechanismMap from Phase 1 against the final workflow: did every criterion end up with a concrete enforcement mechanism? Any criterion that is still prose-only in the final file is a gap in the Phase 1 or Phase 3 process.",
+          "If nothing was missed and the process caught all meaningful issues in-band, say so explicitly and explain what worked."
+        ],
+        "outputRequired": {
+          "notesMarkdown": "Process gaps found (or confirmed absent), where they should have been caught, and concrete proposed changes to workflow-for-workflows. This output is raw material for improving this workflow.",
+          "context": "Capture processGaps and suggestedProcessImprovements."
+        },
+        "verify": [
+          "The retrospective identifies specific step-level changes, not vague general improvements."
+        ]
+      },
+      "requireConfirmation": false
     }
   ],
   "validatedAgainstSpecVersion": 3