npm - cool-workflow - Versions diffs - 0.1.79 → 0.1.80 - Mend

cool-workflow 0.1.79 → 0.1.80

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (73)

package/.claude-plugin/plugin.json +1 -1
package/.codex-plugin/plugin.json +1 -1
package/README.md +9 -1
package/apps/architecture-review/app.json +1 -1
package/apps/architecture-review-fast/app.json +64 -0
package/apps/architecture-review-fast/workflow.js +153 -0
package/apps/end-to-end-golden-path/app.json +1 -1
package/apps/pr-review-fix-ci/app.json +1 -1
package/apps/release-cut/app.json +1 -1
package/apps/research-synthesis/app.json +1 -1
package/dist/capability-core.js +38 -0
package/dist/capability-registry.js +11 -8
package/dist/cli.js +10 -1
package/dist/drive.js +74 -1
package/dist/evidence-reasoning.js +2 -2
package/dist/execution-backend.js +6 -1
package/dist/mcp-server.js +48 -13
package/dist/orchestrator/lifecycle-operations.js +2 -1
package/dist/orchestrator.js +1 -1
package/dist/run-export.js +370 -25
package/dist/run-registry.js +11 -4
package/dist/state-explosion.js +100 -21
package/dist/version.js +1 -1
package/docs/agent-delegation-drive.7.md +58 -0
package/docs/canonical-workflow-apps.7.md +37 -0
package/docs/cli-mcp-parity.7.md +12 -0
package/docs/contract-migration-tooling.7.md +4 -0
package/docs/control-plane-scheduling.7.md +4 -0
package/docs/durable-state-and-locking.7.md +4 -0
package/docs/evidence-adoption-reasoning-chain.7.md +4 -0
package/docs/execution-backends.7.md +4 -0
package/docs/index.md +1 -0
package/docs/launch/demo.tape +28 -0
package/docs/launch/launch-kit.md +59 -3
package/docs/launch/pre-launch-checklist.md +53 -0
package/docs/multi-agent-cli-mcp-surface.7.md +4 -0
package/docs/multi-agent-eval-replay-harness.7.md +4 -0
package/docs/multi-agent-operator-ux.7.md +4 -0
package/docs/node-snapshot-diff-replay.7.md +4 -0
package/docs/observability-cost-accounting.7.md +4 -0
package/docs/project-index.md +13 -5
package/docs/real-execution-backends.7.md +4 -0
package/docs/release-and-migration.7.md +4 -0
package/docs/release-tooling.7.md +4 -0
package/docs/routines.md +23 -0
package/docs/run-registry-control-plane.7.md +42 -1
package/docs/run-retention-reclamation.7.md +4 -0
package/docs/source-context-profiles.7.md +119 -0
package/docs/state-explosion-management.7.md +11 -0
package/docs/team-collaboration.7.md +4 -0
package/docs/unix-principles.md +49 -1
package/docs/web-desktop-workbench.7.md +4 -0
package/manifest/plugin.manifest.json +1 -1
package/manifest/source-context-profiles.json +142 -0
package/package.json +2 -1
package/scripts/agents/claude-p-agent.js +129 -43
package/scripts/architecture-review-fast.js +362 -0
package/scripts/bump-version.js +1 -0
package/scripts/canonical-apps.js +21 -4
package/scripts/coverage-gate.js +211 -0
package/scripts/dogfood-release.js +1 -1
package/scripts/golden-path.js +4 -4
package/scripts/source-context.js +291 -0
package/scripts/version-sync-check.js +1 -0
package/skills/ci-triage/SKILL.md +50 -0
package/skills/ci-triage/agents/openai.yaml +4 -0
package/skills/cool-workflow/SKILL.md +4 -1
package/skills/deploy-check/SKILL.md +55 -0
package/skills/deploy-check/agents/openai.yaml +4 -0
package/skills/design-qa/SKILL.md +49 -0
package/skills/design-qa/agents/openai.yaml +4 -0
package/skills/pr-review/SKILL.md +45 -0
package/skills/pr-review/agents/openai.yaml +4 -0

package/.claude-plugin/plugin.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "cool-workflow",
   "description": "Auditable workflow control-plane and orchestration runtime: TypeScript dispatch, evidence-gated verification, state commits, scheduling, routines, multi-agent coordination, and MCP. Delegates execution to external agents — never runs models.",
-  "version": "0.1.79",
+  "version": "0.1.80",
   "author": {
     "name": "COOLWHITE LLC"
   },

package/.codex-plugin/plugin.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "cool-workflow",
-  "version": "0.1.79",
+  "version": "0.1.80",
   "description": "Auditable workflow control-plane and orchestration runtime: TypeScript dispatch, evidence-gated verification, state commits, scheduling, routines, multi-agent coordination, and MCP. Delegates execution to external agents — never runs models.",
   "author": {
     "name": "COOLWHITE LLC"

package/README.md CHANGED Viewed

@@ -649,8 +649,16 @@ The orchestration vision landed in one release, all reviewer-gated:
 `--agent-command builtin:claude` resolves to a bundled read-only claude wrapper that completes workers with a real agent; the cross-directory quickstart crash is fixed; missing optional inputs no longer leak `{{name}}` into prompts. Published to npm (`cool-workflow`, bins `cw`/`cool-workflow`) with LICENSE and metadata. Live dogfood proof committed under `docs/dogfood/`.
-## Tamper-evidence demo (on main, ships next)
+## Tamper-evidence demo (v0.1.79)
 `cw demo tamper` — a hermetic, one-command proof that a recorded telemetry verdict cannot be forged undetected: it builds a real ed25519-signed ledger, forges it at the ledger layer (verdict flip + recomputed local hash → the chain still breaks) and the signature layer (inflated tokens, reused signature → ed25519 rejects), all verified offline with only the public key. `cw telemetry verify <run>` is the operator-facing half (`cw_telemetry_verify` on MCP).
+## Opt-in live agent output during a drive (on main, ships next)
+Set `CW_AGENT_STREAM=1` to see each worker's live agent trace. The bundled claude wrapper (`builtin:claude` / `scripts/agents/claude-p-agent.js`) keeps the legacy `--output-format json` path by default; only the opt-in path runs claude in `--output-format stream-json` and renders a concise human trace (tool uses, assistant text, per-turn summaries) to **stderr**. CW core forwards that stderr to the operator's terminal only when `CW_AGENT_STREAM=1`, CW's own stderr is a TTY, and `CW_NO_STREAM` is not set; piped/CI runs stay silent (Rule of Silence). Core only forwards the stream, never parses it — vendor-specific rendering is the wrapper's concern (policy), not the kernel's (mechanism).
 v0.1.79
+## Fast Architecture Review (v0.1.80)
+Adds the opt-in fast architecture-review lane: scoped JSONL source contexts, diff-aware exports, reusable Map and Assess results, measurable wrapper metrics, actionable background full-review handoff, and userland model policy flags for routing fast/strong workers without changing the full review contract.

package/apps/architecture-review/app.json CHANGED Viewed

@@ -3,7 +3,7 @@
   "id": "architecture-review",
   "title": "Architecture Review",
   "summary": "Map a repository architecture, assess risks, verify important findings, and synthesize an evidence-backed verdict.",
-  "version": "0.1.79",
+  "version": "0.1.80",
   "author": "COOLWHITE LLC",
   "inputs": [
     {

package/apps/architecture-review-fast/app.json ADDED Viewed

@@ -0,0 +1,64 @@
+{
+  "schemaVersion": 1,
+  "id": "architecture-review-fast",
+  "title": "Architecture Review Fast",
+  "summary": "Run a shorter architecture review with parallel map and assess phases for faster first results.",
+  "version": "0.1.80",
+  "author": "COOLWHITE LLC",
+  "inputs": [
+    {
+      "name": "repo",
+      "type": "path",
+      "required": true,
+      "description": "Repository path to inspect."
+    },
+    {
+      "name": "question",
+      "type": "string",
+      "required": true,
+      "description": "Architecture question or decision to review."
+    },
+    {
+      "name": "invariant",
+      "type": "string",
+      "repeated": true,
+      "description": "Invariant that must remain true."
+    },
+    {
+      "name": "focus",
+      "type": "string",
+      "description": "Optional subsystem, risk area, or file path to emphasize.",
+      "default": "the highest-risk runtime and operator paths"
+    },
+    {
+      "name": "sourceContext",
+      "type": "path",
+      "description": "Optional JSONL source context file generated by scripts/source-context.js export.",
+      "default": ""
+    },
+    {
+      "name": "sourceContextDigest",
+      "type": "string",
+      "description": "Optional digest or cache key for the supplied source context.",
+      "default": ""
+    }
+  ],
+  "sandboxProfiles": [
+    "readonly"
+  ],
+  "compatibility": {
+    "minVersion": "0.1.79",
+    "workflowSchemaVersion": 1,
+    "notes": "Opt-in fast architecture review app; the full architecture-review app remains unchanged."
+  },
+  "metadata": {
+    "canonical": true,
+    "domain": "software-architecture",
+    "mode": "fast",
+    "fullReviewApp": "architecture-review",
+    "maintainedAs": "official-userland"
+  },
+  "workflow": {
+    "entrypoint": "workflow.js"
+  }
+}

package/apps/architecture-review-fast/workflow.js ADDED Viewed

@@ -0,0 +1,153 @@
+const FAST_MODEL = modelHint("CW_ARCHITECTURE_REVIEW_FAST_MODEL");
+const STRONG_MODEL = modelHint("CW_ARCHITECTURE_REVIEW_STRONG_MODEL");
+module.exports = ({ workflow, phase, parallel, agent, artifact, input }) => {
+  const inputs = [
+    input("repo", {
+      type: "path",
+      required: true,
+      description: "Repository path to inspect."
+    }),
+    input("question", {
+      type: "string",
+      required: true,
+      description: "Architecture question or decision to review."
+    }),
+    input("invariant", {
+      type: "string",
+      repeated: true,
+      description: "Invariant that must remain true."
+    }),
+    input("focus", {
+      type: "string",
+      description: "Optional subsystem, risk area, or file path to emphasize.",
+      default: "the highest-risk runtime and operator paths"
+    }),
+    input("sourceContext", {
+      type: "path",
+      description: "Optional JSONL source context file generated by scripts/source-context.js export.",
+      default: ""
+    }),
+    input("sourceContextDigest", {
+      type: "string",
+      description: "Optional digest or cache key for the supplied source context.",
+      default: ""
+    })
+  ];
+  return workflow({
+    id: "architecture-review-fast",
+    title: "Architecture Review Fast",
+    summary: "Run a shorter architecture review with parallel map and assess phases for faster first results.",
+    limits: {
+      maxAgents: 12,
+      maxConcurrentAgents: 4
+    },
+    inputs,
+    sandboxProfiles: ["readonly"],
+    metadata: {
+      mode: "fast",
+      fullReviewApp: "architecture-review"
+    },
+    phases: [
+      parallel("Map", [
+        agent(
+          "map:runtime-surface",
+          [
+            "Fast-map the runtime architecture in {{repo}} for {{question}}.",
+            contextInstruction(),
+            "Focus: {{focus}}. Invariants: {{invariant}}.",
+            "Return the primary entrypoints, state stores, execution paths, and the exact files or commands inspected."
+          ].join(" "),
+          fastOptions("Runtime surface mapper", { resultCache: sourceContextResultCache() })
+        ),
+        agent(
+          "map:operator-surface",
+          [
+            "Fast-map operator, CI, deployment, test, release, and background-job surfaces in {{repo}} for {{question}}.",
+            contextInstruction(),
+            "Focus: {{focus}}. Return concrete files, scripts, configs, missing areas, and candidate runtime bottlenecks."
+          ].join(" "),
+          fastOptions("Operator surface mapper", { resultCache: sourceContextResultCache() })
+        )
+      ]),
+      parallel("Assess", [
+        agent(
+          "assess:risks",
+          [
+            "Assess the fast map for real P0/P1/P2 architecture and correctness risks.",
+            "Separate confirmed risks, conditional risks, non-issues, and unknowns.",
+            "Tie every important claim to inspected evidence and the invariants {{invariant}}."
+          ].join(" "),
+          fastOptions("Risk assessor", { resultCache: sourceContextResultCache({ includeCompletedResults: "previous-phases" }) })
+        ),
+        agent(
+          "assess:runtime-speed",
+          [
+            "Assess runtime speed and user-wait risk for {{question}}.",
+            "Look for serial agent work, repeated repository scanning, missing cache keys, oversized prompts, and long foreground jobs.",
+            "Recommend mechanisms that preserve POLA, stdout/stderr discipline, and zero runtime dependencies."
+          ].join(" "),
+          fastOptions("Runtime speed assessor", { resultCache: sourceContextResultCache({ includeCompletedResults: "previous-phases" }) })
+        )
+      ]),
+      phase("Verify", [
+        agent(
+          "verify:p0-p2-risks",
+          [
+            "Re-open evidence for every candidate P0/P1/P2 risk from the fast assessment.",
+            "Confirm real risks, downgrade unsupported claims, and list exact file paths, commands, logs, or unknowns.",
+            "The cw:result evidence array must cite durable locators."
+          ].join(" "),
+          strongOptions("Evidence verifier", { requiresEvidence: true })
+        )
+      ]),
+      phase("Verdict", [
+        artifact(
+          "verdict:fast-synthesis",
+          [
+            "Synthesize a fast architecture verdict for {{question}}.",
+            "Include a short answer, compact architecture map, ranked risks, speed recommendations, non-issues, and evidence links.",
+            "State when the full architecture-review app should be scheduled as a background routine.",
+            "The cw:result evidence array must support the final verdict."
+          ].join(" "),
+          strongOptions("Fast verdict synthesizer", { requiresEvidence: true })
+        )
+      ])
+    ]
+  });
+};
+function fastOptions(label, extra) {
+  return taskOptions(label, FAST_MODEL, extra);
+}
+function strongOptions(label, extra) {
+  return taskOptions(label, STRONG_MODEL, extra);
+}
+function taskOptions(label, model, extra) {
+  return {
+    label,
+    sandboxProfileId: "readonly",
+    ...(model ? { model } : {}),
+    ...(extra || {})
+  };
+}
+function modelHint(name) {
+  const value = String(process.env[name] || "").trim();
+  return value || undefined;
+}
+function contextInstruction() {
+  return [
+    "If {{sourceContext}} is non-empty, read that JSONL source context first and treat {{sourceContextDigest}} as its cache/digest hint.",
+    "If the supplied context is missing, unreadable, or obviously stale, say so explicitly instead of guessing.",
+    "If no source context is supplied, inspect {{repo}} directly."
+  ].join(" ");
+}
+function sourceContextResultCache(extra) {
+  return { mode: "read-write", keyInput: "sourceContextDigest", ...(extra || {}) };
+}

package/apps/end-to-end-golden-path/app.json CHANGED Viewed

@@ -3,7 +3,7 @@
   "id": "end-to-end-golden-path",
   "title": "End-to-End Golden Path",
   "summary": "Deterministic one-worker workflow app for proving the CW integration chain.",
-  "version": "0.1.79",
+  "version": "0.1.80",
   "author": "COOLWHITE LLC",
   "inputs": [
     {

package/apps/pr-review-fix-ci/app.json CHANGED Viewed

@@ -3,7 +3,7 @@
   "id": "pr-review-fix-ci",
   "title": "PR Review Fix CI",
   "summary": "Review a pull request or branch, inspect CI failures, diagnose actionable issues, optionally patch, verify, and summarize with evidence.",
-  "version": "0.1.79",
+  "version": "0.1.80",
   "author": "COOLWHITE LLC",
   "inputs": [
     {

package/apps/release-cut/app.json CHANGED Viewed

@@ -3,7 +3,7 @@
   "id": "release-cut",
   "title": "Release Cut",
   "summary": "Prepare a release with checklist discipline: version checks, changelog, tests, packaging, release notes, and final verification.",
-  "version": "0.1.79",
+  "version": "0.1.80",
   "author": "COOLWHITE LLC",
   "inputs": [
     {

package/apps/research-synthesis/app.json CHANGED Viewed

@@ -3,7 +3,7 @@
   "id": "research-synthesis",
   "title": "Research Synthesis",
   "summary": "Split a research question into claims, investigate sources, cross-check evidence, verify claims, and synthesize a concise answer.",
-  "version": "0.1.79",
+  "version": "0.1.80",
   "author": "COOLWHITE LLC",
   "inputs": [
     {

package/dist/capability-core.js CHANGED Viewed

@@ -35,6 +35,9 @@ exports.runShow = runShow;
 exports.runResume = runResume;
 exports.runArchive = runArchive;
 exports.runRerun = runRerun;
+exports.runExportArchive = runExportArchive;
+exports.runImportArchive = runImportArchive;
+exports.runVerifyImport = runVerifyImport;
 exports.queueAdd = queueAdd;
 exports.queueList = queueList;
 exports.queueDrain = queueDrain;
@@ -71,6 +74,7 @@ const observability_1 = require("./observability");
 const telemetry_ledger_1 = require("./telemetry-ledger");
 const telemetry_demo_1 = require("./telemetry-demo");
 const state_1 = require("./state");
+const run_export_1 = require("./run-export");
 const node_fs_1 = __importDefault(require("node:fs"));
 const node_path_1 = __importDefault(require("node:path"));
 const scheduling_1 = require("./scheduling");
@@ -194,6 +198,19 @@ function flag(value) {
         return false;
     return Boolean(value);
 }
+function withInvocationCwd(args, fn) {
+    const cwd = optionalString(args.cwd);
+    if (!cwd)
+        return fn();
+    const previous = process.cwd();
+    process.chdir(cwd);
+    try {
+        return fn();
+    }
+    finally {
+        process.chdir(previous);
+    }
+}
 function runRegistryRefresh(reg, args) {
     return reg.refresh({ scope: scopeOf(args, "repo") });
 }
@@ -251,6 +268,27 @@ function runArchive(reg, runId, args) {
 function runRerun(reg, runId, args) {
     return reg.rerun(runId, { scope: scopeOf(args, "home"), reason: optionalString(args.reason) });
 }
+function runExportArchive(runner, runId, args) {
+    return withInvocationCwd(args, () => {
+        const output = optionalString(args.output || args.path || args.archive) || `${runId}.cwrun.json`;
+        return (0, run_export_1.exportRun)(runner.loadRun(runId), node_path_1.default.resolve(output));
+    });
+}
+function runImportArchive(runner, args) {
+    return withInvocationCwd(args, () => {
+        const archive = optionalString(args.archive || args.path || args.file);
+        if (!archive)
+            throw new Error("run import requires an archive path (positional, --archive, --path, or --file)");
+        const target = optionalString(args.target || args.repo || args.cwd) || process.cwd();
+        const imported = (0, run_export_1.importRun)(node_path_1.default.resolve(archive), node_path_1.default.resolve(target));
+        const registry = new run_registry_1.RunRegistry(node_path_1.default.resolve(target), runner);
+        const registryReport = registry.refresh({ scope: "repo" });
+        return { ...imported, registry: registryReport };
+    });
+}
+function runVerifyImport(runner, runId, args) {
+    return withInvocationCwd(args, () => (0, run_export_1.verifyImportedRun)(runner.loadRun(runId)));
+}
 function queueAdd(reg, args) {
     return reg.queueAdd({
         runId: optionalString(args.runId),

package/dist/capability-registry.js CHANGED Viewed

@@ -215,13 +215,13 @@ const BUILTIN_CAPABILITIES = [
     { capability: "multi-agent.blackboard", summary: "Operate on the active multi-agent blackboard.", entry: "hostMultiAgentBlackboard", surface: "both", cli: { path: ["multi-agent", "blackboard"], jsonMode: "default" }, mcp: { tool: "cw_multi_agent_blackboard" } },
     { capability: "multi-agent.score", summary: "Score a candidate with evidence.", entry: "hostMultiAgentScore", surface: "both", cli: { path: ["multi-agent", "score"], jsonMode: "default" }, mcp: { tool: "cw_multi_agent_score" } },
     { capability: "multi-agent.select", summary: "Select a candidate with the verifier gate.", entry: "hostMultiAgentSelect", surface: "both", cli: { path: ["multi-agent", "select"], jsonMode: "default" }, mcp: { tool: "cw_multi_agent_select" } },
-    { capability: "multi-agent.summary", summary: "Read the multi-agent runtime summary.", entry: "multiAgentSummary", surface: "both", cli: { path: ["multi-agent", "summary"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_summary" } },
+    { capability: "multi-agent.summary", summary: "Read the structured multi-agent runtime summary for a run.", entry: "multiAgentSummary", surface: "both", cli: { path: ["multi-agent", "summary"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_summary" } },
     { capability: "multi-agent.summarize", summary: "Read the combined state-explosion report.", entry: "multiAgentSummarize", surface: "both", cli: { path: ["multi-agent", "summarize"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_summarize" } },
-    { capability: "multi-agent.graph", summary: "Read the multi-agent operator graph.", entry: "multiAgentOperatorGraph", surface: "both", cli: { path: ["multi-agent", "graph"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_graph" } },
+    { capability: "multi-agent.graph", summary: "Read the structured multi-agent operator graph for a run.", entry: "multiAgentOperatorGraph", surface: "both", cli: { path: ["multi-agent", "graph"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_graph" } },
     { capability: "multi-agent.graph.compact", summary: "Read a compact/focused multi-agent graph view.", entry: "multiAgentGraphView", surface: "both", cli: { path: ["multi-agent", "graph"], caseTokens: ["multi-agent", "graph"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_graph_compact" } },
-    { capability: "multi-agent.dependencies", summary: "Read derived multi-agent dependency edges.", entry: "multiAgentDependencies", surface: "both", cli: { path: ["multi-agent", "dependencies"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_dependencies" } },
-    { capability: "multi-agent.failures", summary: "Read failed/blocked/rejected multi-agent records.", entry: "multiAgentFailures", surface: "both", cli: { path: ["multi-agent", "failures"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_failures" } },
-    { capability: "multi-agent.evidence", summary: "Read evidence adoption status with rationaleStatus.", entry: "multiAgentEvidence", surface: "both", cli: { path: ["multi-agent", "evidence"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_evidence" } },
+    { capability: "multi-agent.dependencies", summary: "Read derived multi-agent dependency edges for operator inspection.", entry: "multiAgentDependencies", surface: "both", cli: { path: ["multi-agent", "dependencies"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_dependencies" } },
+    { capability: "multi-agent.failures", summary: "Read failed, blocked, rejected, and ambiguous multi-agent records.", entry: "multiAgentFailures", surface: "both", cli: { path: ["multi-agent", "failures"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_failures" } },
+    { capability: "multi-agent.evidence", summary: "Read evidence adoption status from worker output through selection and commit. Each row carries a derived rationaleStatus (explained|unexplained|not-applicable).", entry: "multiAgentEvidence", surface: "both", cli: { path: ["multi-agent", "evidence"], jsonMode: "flag" }, mcp: { tool: "cw_multi_agent_evidence" } },
     { capability: "multi-agent.reasoning", summary: "Explain why each evidence item was adopted/rejected.", entry: "multiAgentReasoning", surface: "both", cli: { path: ["multi-agent", "reasoning"], jsonMode: "flag" }, mcp: { tool: "cw_evidence_reasoning" } },
     { capability: "multi-agent.reasoning.refresh", summary: "Refresh the durable evidence-reasoning index.", entry: "multiAgentReasoningRefresh", surface: "both", cli: { path: ["multi-agent", "reasoning"], caseTokens: ["multi-agent", "reasoning"], jsonMode: "default" }, mcp: { tool: "cw_evidence_reasoning_refresh" } },
     // ---- multi-agent lifecycle records --------------------------------------
@@ -285,7 +285,7 @@ const BUILTIN_CAPABILITIES = [
     { capability: "backend.agent.config.set", summary: "Set the durable agent delegation config (command-template/endpoint/model; API keys never written).", entry: "backendAgentConfigSet", surface: "both", cli: { path: ["backend", "agent", "config"], caseTokens: ["backend", "agent"], jsonMode: "default" }, mcp: { tool: "cw_backend_agent_config_set" }, payloadIdentical: false, reason: "Mutating: persists $CW_HOME/agent-config.json (secret-stripped) before returning the effective config; both surfaces perform the same write — it is a surface-mutating verb, not a read probe." },
     // ---- worker isolation ---------------------------------------------------
     { capability: "worker.list", summary: "List worker isolation scopes.", entry: "listWorkers", surface: "both", cli: { path: ["worker", "list"], jsonMode: "default" }, mcp: { tool: "cw_worker_list" } },
-    { capability: "worker.summary", summary: "Read the structured worker summary.", entry: "summarizeWorkerRecords", surface: "both", cli: { path: ["worker", "summary"], jsonMode: "flag" }, mcp: { tool: "cw_worker_summary" } },
+    { capability: "worker.summary", summary: "Read the structured worker summary for a run.", entry: "summarizeWorkerRecords", surface: "both", cli: { path: ["worker", "summary"], jsonMode: "flag" }, mcp: { tool: "cw_worker_summary" } },
     { capability: "worker.show", summary: "Show one worker isolation scope.", entry: "showWorker", surface: "both", cli: { path: ["worker", "show"], jsonMode: "default" }, mcp: { tool: "cw_worker_show" } },
     { capability: "worker.manifest", summary: "Write and return a worker manifest.", entry: "showWorkerManifest", surface: "both", cli: { path: ["worker", "manifest"], jsonMode: "default" }, mcp: { tool: "cw_worker_manifest" } },
     { capability: "worker.output", summary: "Record worker output.", entry: "recordWorkerOutput", surface: "both", cli: { path: ["worker", "output"], jsonMode: "default" }, mcp: { tool: "cw_worker_output" } },
@@ -299,12 +299,12 @@ const BUILTIN_CAPABILITIES = [
     { capability: "candidate.rank", summary: "Rank candidates with gates.", entry: "rankCandidates", surface: "both", cli: { path: ["candidate", "rank"], jsonMode: "default" }, mcp: { tool: "cw_candidate_rank" } },
     { capability: "candidate.select", summary: "Select a candidate with the verifier gate.", entry: "selectCandidate", surface: "both", cli: { path: ["candidate", "select"], jsonMode: "default" }, mcp: { tool: "cw_candidate_select" } },
     { capability: "candidate.reject", summary: "Reject a candidate with a reason.", entry: "rejectCandidate", surface: "both", cli: { path: ["candidate", "reject"], jsonMode: "default" }, mcp: { tool: "cw_candidate_reject" } },
-    { capability: "candidate.summary", summary: "Read the structured candidate summary.", entry: "summarizeCandidateOperatorRecords", surface: "both", cli: { path: ["candidate", "summary"], jsonMode: "flag" }, mcp: { tool: "cw_candidate_summary" } },
+    { capability: "candidate.summary", summary: "Read the structured candidate summary for a run.", entry: "summarizeCandidateOperatorRecords", surface: "both", cli: { path: ["candidate", "summary"], jsonMode: "flag" }, mcp: { tool: "cw_candidate_summary" } },
     // ---- feedback -----------------------------------------------------------
     { capability: "feedback.list", summary: "List run feedback records.", entry: "listFeedback", surface: "both", cli: { path: ["feedback", "list"], jsonMode: "default" }, mcp: { tool: "cw_feedback_list" } },
     { capability: "feedback.show", summary: "Show a run feedback record.", entry: "showFeedback", surface: "both", cli: { path: ["feedback", "show"], jsonMode: "default" }, mcp: { tool: "cw_feedback_show" } },
     { capability: "feedback.collect", summary: "Collect feedback from failed nodes.", entry: "collectFeedback", surface: "both", cli: { path: ["feedback", "collect"], jsonMode: "default" }, mcp: { tool: "cw_feedback_collect" } },
-    { capability: "feedback.summary", summary: "Read the structured feedback summary.", entry: "summarizeFeedbackRecords", surface: "both", cli: { path: ["feedback", "summary"], jsonMode: "flag" }, mcp: { tool: "cw_feedback_summary" } },
+    { capability: "feedback.summary", summary: "Read the structured feedback summary for a run.", entry: "summarizeFeedbackRecords", surface: "both", cli: { path: ["feedback", "summary"], jsonMode: "flag" }, mcp: { tool: "cw_feedback_summary" } },
     { capability: "feedback.task", summary: "Create a correction task for feedback.", entry: "createFeedbackTask", surface: "both", cli: { path: ["feedback", "task"], jsonMode: "default" }, mcp: { tool: "cw_feedback_task" } },
     { capability: "feedback.resolve", summary: "Resolve or reject feedback.", entry: "resolveFeedback", surface: "both", cli: { path: ["feedback", "resolve"], jsonMode: "default" }, mcp: { tool: "cw_feedback_resolve" } },
     // ---- scheduling ---------------------------------------------------------
@@ -344,6 +344,9 @@ const BUILTIN_CAPABILITIES = [
     { capability: "run.resume", summary: "Resolve a run by id and continue it from durable state.", entry: "runRegistry.resume", surface: "both", cli: { path: ["run", "resume"], jsonMode: "flag" }, mcp: { tool: "cw_run_resume" } },
     { capability: "run.archive", summary: "Archive/unarchive a run (overlay mark; never deletes source).", entry: "runRegistry.archive", surface: "both", cli: { path: ["run", "archive"], jsonMode: "default" }, mcp: { tool: "cw_run_archive" } },
     { capability: "run.rerun", summary: "Re-run a failed run as a NEW run linked to the original by provenance.", entry: "runRegistry.rerun", surface: "both", cli: { path: ["run", "rerun"], jsonMode: "default" }, mcp: { tool: "cw_run_rerun" } },
+    { capability: "run.export", summary: "Export a run to a portable archive with run-local files and digest integrity.", entry: "runExportArchive", surface: "both", cli: { path: ["run", "export"], jsonMode: "default" }, mcp: { tool: "cw_run_export" } },
+    { capability: "run.import", summary: "Restore a portable run archive into a target repo and verify restored file digests.", entry: "runImportArchive", surface: "both", cli: { path: ["run", "import"], jsonMode: "default" }, mcp: { tool: "cw_run_import" } },
+    { capability: "run.verify-import", summary: "Verify an imported run against its restore manifest and telemetry chain.", entry: "runVerifyImport", surface: "both", cli: { path: ["run", "verify-import"], jsonMode: "default" }, mcp: { tool: "cw_run_verify_import" } },
     { capability: "run.drive", summary: "Preview the next agent-delegation drive step for a run (read-only, deterministic).", entry: "runDrivePreview", surface: "both", cli: { path: ["run", "drive"], caseTokens: ["run", "drive"], jsonMode: "default" }, mcp: { tool: "cw_run_drive" } },
     { capability: "run.drive.step", summary: "Drive a run by delegating each worker to the agent backend (plan->dispatch->fulfill->accept->commit; --once for one step).", entry: "runDrive", surface: "both", cli: { path: ["run", "drive"], caseTokens: ["run", "drive"], jsonMode: "default" }, mcp: { tool: "cw_run_drive_step" }, payloadIdentical: false, reason: "Mutating: advances the run by spawning the external agent per worker and recording attested output — not a read probe. CLI (--drive/--step) and MCP route through the same drive() core." },
     {

package/dist/cli.js CHANGED Viewed

@@ -1064,10 +1064,19 @@ async function main() {
                 case "rerun":
                     printJson((0, capability_core_1.runRerun)(registry, required(id, "run id"), args.options));
                     return;
+                case "export":
+                    printJson((0, capability_core_1.runExportArchive)(runner, required(id || optionalArg(args.options.runId || args.options.run), "run id"), args.options));
+                    return;
+                case "import":
+                    printJson((0, capability_core_1.runImportArchive)(runner, { ...args.options, archive: id || args.options.archive || args.options.path }));
+                    return;
+                case "verify-import":
+                    printJson((0, capability_core_1.runVerifyImport)(runner, required(id || optionalArg(args.options.runId || args.options.run), "run id"), args.options));
+                    return;
                 default:
                     if (await tryDispatchCli(args, runner))
                         return;
-                    throw new Error("Usage: cw.js run search|list|show|resume|archive|rerun|drive [run-id] [--scope repo|home] [--json]  |  cw.js run <app> --drive [--once] [--repo R --question Q]");
+                    throw new Error("Usage: cw.js run search|list|show|resume|archive|rerun|drive|export|import|verify-import [run-id|archive] [--scope repo|home] [--json]  |  cw.js run <app> --drive [--once] [--repo R --question Q]");
             }
         }
         case "queue": {

package/dist/drive.js CHANGED Viewed

@@ -31,12 +31,14 @@ exports.driveConcurrentRound = driveConcurrentRound;
 exports.drive = drive;
 exports.drivePreview = drivePreview;
 const node_fs_1 = __importDefault(require("node:fs"));
+const node_path_1 = __importDefault(require("node:path"));
 const dispatch_1 = require("./dispatch");
 const execution_backend_1 = require("./execution-backend");
 const worker_isolation_1 = require("./worker-isolation");
 const agent_config_1 = require("./agent-config");
 const scheduling_1 = require("./scheduling");
 const observability_1 = require("./observability");
+const state_1 = require("./state");
 exports.DRIVE_SCHEMA_VERSION = 1;
 /** The task the next drive step would advance: a RUNNING (already-dispatched,
  *  awaiting fulfillment / retry) task first, else the next PENDING task in the
@@ -198,8 +200,26 @@ function processSelectedTask(ctx, selected, preparedOutcome) {
     // Progress BEFORE the (possibly multi-minute) agent spawn, so a live drive shows
     // immediate activity instead of a long silence on the first worker. task.label
     // is the human-facing display name; the id stays the stable reference.
-    emitProgress(`→ ${selected.label || selected.id} (${selected.phase}) — ${dispatched ? "dispatched, " : ""}spawning agent, may take minutes…`);
     const promptDigest = node_fs_1.default.existsSync(manifest.inputPath) ? (0, execution_backend_1.sha256)(node_fs_1.default.readFileSync(manifest.inputPath, "utf8")) : (0, execution_backend_1.sha256)(manifest.prompt || "");
+    const cachePath = resultCachePath(run, selected, (0, execution_backend_1.sha256)(selected.prompt));
+    if (cachePath && node_fs_1.default.existsSync(cachePath)) {
+        emitProgress(`↺ ${selected.label || selected.id} (${selected.phase}) — accepting cached result`);
+        try {
+            node_fs_1.default.writeFileSync(manifest.resultPath, node_fs_1.default.readFileSync(cachePath, "utf8"), "utf8");
+            runner.recordWorkerOutput(runId, workerId, manifest.resultPath, {});
+        }
+        catch (error) {
+            return handleHop(ctx, selected, workerId, `result cache rejected: ${error instanceof Error ? error.message : String(error)}`, dispatched);
+        }
+        return step("accept", "ok", {
+            runId,
+            taskId: selected.id,
+            phase: selected.phase,
+            handleKind: "result-cache",
+            reason: "result cache hit"
+        });
+    }
+    emitProgress(`→ ${selected.label || selected.id} (${selected.phase}) — ${dispatched ? "dispatched, " : ""}spawning agent, may take minutes…`);
     const envelope = (0, execution_backend_1.runBackend)(buildAgentRequest(ctx, run, selected, manifest, preparedOutcome));
     const handle = envelope.provenance.handle;
     const reportedModel = handle?.metadata?.reportedModel || "unreported";
@@ -236,6 +256,9 @@ function processSelectedTask(ctx, selected, preparedOutcome) {
     catch (error) {
         return handleHop(ctx, selected, workerId, `result.md rejected: ${error instanceof Error ? error.message : String(error)}`, dispatched);
     }
+    if (cachePath && manifest.resultPath && node_fs_1.default.existsSync(manifest.resultPath)) {
+        writeResultCache(cachePath, node_fs_1.default.readFileSync(manifest.resultPath, "utf8"));
+    }
     return step("accept", "ok", {
         runId,
         taskId: selected.id,
@@ -245,6 +268,53 @@ function processSelectedTask(ctx, selected, preparedOutcome) {
         reportedModel
     });
 }
+function resultCachePath(run, task, promptDigest) { // Resolve the cache file path for this task's result, or undefined when caching does not apply.
+    const policy = task.resultCache;
+    if (!policy || policy.mode !== "read-write") // caching is opt-in: only an explicit "read-write" policy enables it
+        return undefined;
+    const keyInput = policy.keyInput; // name of the run input whose value scopes the cache key
+    const keyValue = keyInput ? String(run.inputs[keyInput] || "").trim() : ""; // any falsy input (undefined, "", 0, false) collapses to ""
+    if (!keyInput || !keyValue) // no usable key name or value -> no caching
+        return undefined;
+    const completedResultsDigest = completedResultsCacheDigest(run, task);
+    if (completedResultsDigest === undefined) // strict check: "" is a valid digest, only undefined disables the cache
+        return undefined;
+    const digest = (0, execution_backend_1.sha256)(JSON.stringify({
+        schemaVersion: 1, // NOTE(review): presumably bumped to invalidate old entries when the key shape changes — confirm
+        workflowId: run.workflow.id,
+        taskId: task.id,
+        keyInput,
+        keyValue,
+        promptDigest,
+        completedResultsDigest
+    })).replace(/^sha256:/, ""); // strip a leading "sha256:" prefix, if present, before using the digest in a file name
+    return node_path_1.default.join(run.cwd, ".cw", "cache", "worker-results", (0, state_1.safeFileName)(run.workflow.id), `${(0, state_1.safeFileName)(task.id)}-${digest.slice(0, 32)}.md`); // <run.cwd>/.cw/cache/worker-results/<workflow id>/<task id>-<first 32 digest chars>.md
+}
+function completedResultsCacheDigest(run, task) { // Digest the results of all tasks in earlier phases; "" when the policy does not ask for it, undefined when it cannot be computed.
+    if (task.resultCache?.includeCompletedResults !== "previous-phases") // policy does not fold upstream results into the key
+        return "";
+    const phaseIndex = run.phases.findIndex((phase) => phase.name === task.phase || phase.id === task.phase); // task.phase may match either the phase name or the phase id
+    if (phaseIndex < 0) // the task's phase is not among run.phases
+        return undefined;
+    const previousTaskIds = new Set(run.phases.slice(0, phaseIndex).flatMap((phase) => phase.taskIds)); // ids of every task in phases before this one
+    const records = run.tasks
+        .filter((candidate) => previousTaskIds.has(candidate.id))
+        .sort((a, b) => a.id.localeCompare(b.id)) // order by task id so the digest does not depend on run.tasks order; sorts the filtered copy, not run.tasks
+        .map((candidate) => {
+        if (candidate.status !== "completed" || !candidate.resultPath || !node_fs_1.default.existsSync(candidate.resultPath)) // not completed, or its result file is missing
+            return undefined;
+        return [candidate.id, (0, execution_backend_1.sha256)(node_fs_1.default.readFileSync(candidate.resultPath, "utf8"))]; // [task id, digest of its result file content]
+    });
+    if (records.some((record) => record === undefined)) // any unusable earlier task makes the whole digest unavailable
+        return undefined;
+    return (0, execution_backend_1.sha256)(JSON.stringify(records));
+}
+function writeResultCache(file, content) { // Write `content` to the cache file `file`, creating parent directories as needed.
+    node_fs_1.default.mkdirSync(node_path_1.default.dirname(file), { recursive: true }); // recursive: no error if the directory already exists
+    const tmp = `${file}.${process.pid}.tmp`; // pid-suffixed temp name next to the target file
+    node_fs_1.default.writeFileSync(tmp, content, "utf8");
+    node_fs_1.default.renameSync(tmp, file); // write-then-rename — presumably so readers never see a half-written entry; the temp file is not removed if this throws
+}
 /** Advance ONE concurrent ROUND: fulfill up to `limit` ready tasks in the first
  *  runnable phase as a single batch, recording results in DETERMINISTIC task
  *  order (the existing phase/dispatch order) regardless of completion order — so
@@ -322,6 +392,9 @@ function prepareConcurrentOutcomes(ctx, batch) {
             continue;
         }
         const manifest = runner.showWorkerManifest(runId, workerId);
+        const cachePath = resultCachePath(run, task, (0, execution_backend_1.sha256)(task.prompt));
+        if (cachePath && node_fs_1.default.existsSync(cachePath))
+            continue;
         const job = (0, execution_backend_1.prepareAgentSpawn)(buildAgentRequest(ctx, run, task, manifest));
         if (job) {
             jobs.push(job);

package/dist/evidence-reasoning.js CHANGED Viewed

@@ -389,11 +389,11 @@ function deriveCounterfactuals(run, scores) {
 // node. This returns the operator-graph node ids backing every decision-bearing
 // reasoning step of an adopted chain, so state-explosion can protect them.
 // ---------------------------------------------------------------------------
-function reasoningCriticalNodeIds(run) {
+function reasoningCriticalNodeIds(run, operator = (0, multi_agent_operator_ux_1.summarizeMultiAgentOperator)(run)) {
     const ids = new Set();
     const faninIds = new Set((run.multiAgent?.fanins || []).map((entry) => entry.id));
     const commitById = new Map((run.commits || []).map((commit) => [commit.id, commit]));
-    for (const evidence of (0, multi_agent_operator_ux_1.summarizeMultiAgentOperator)(run).evidence) {
+    for (const evidence of operator.evidence) {
         if (evidence.status !== "adopted")
             continue;
         for (const id of evidence.candidateIds)

package/dist/execution-backend.js CHANGED Viewed

@@ -887,13 +887,18 @@ function runAgentProcess(descriptor, policy, request, label, handle, attestation
             outcome = request.preparedAgentOutcome;
         }
         else {
+            // Live output is opt-in (POLA): stdout is always captured as data, while
+            // stderr is forwarded only when the operator explicitly asks for a stream
+            // and this process is attached to a terminal. CI/pipes stay silent.
+            const streamStderr = process.env.CW_AGENT_STREAM === "1" && Boolean(process.stderr.isTTY) && process.env.CW_NO_STREAM !== "1";
             const child = (0, node_child_process_1.spawnSync)(resolved.binary, realArgs, {
                 cwd: request.cwd,
                 env: { ...process.env },
                 encoding: "utf8",
                 timeout: resolved.timeoutMs || 600000,
                 maxBuffer: 32 * 1024 * 1024,
-                shell: false
+                shell: false,
+                stdio: ["ignore", "pipe", streamStderr ? "inherit" : "pipe"]
             });
             outcome = {
                 ...(child.error ? { spawnError: messageOf(child.error) } : {}),