npm - cool-workflow - Versions diffs - 0.1.79 → 0.1.81 - Mend

cool-workflow 0.1.79 → 0.1.81

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (131) hide show

package/.claude-plugin/plugin.json +1 -1
package/.codex-plugin/plugin.json +1 -1
package/README.md +51 -3
package/apps/architecture-review/app.json +1 -1
package/apps/architecture-review-fast/app.json +64 -0
package/apps/architecture-review-fast/workflow.js +153 -0
package/apps/end-to-end-golden-path/app.json +1 -1
package/apps/pr-review-fix-ci/app.json +1 -1
package/apps/release-cut/app.json +1 -1
package/apps/research-synthesis/app.json +1 -1
package/dist/agent-config.js +21 -7
package/dist/candidate-scoring.js +42 -22
package/dist/capability-core.js +132 -17
package/dist/capability-registry.js +138 -168
package/dist/cli.js +97 -98
package/dist/collaboration.js +5 -6
package/dist/commit.js +20 -6
package/dist/compare.js +18 -0
package/dist/coordinator/classify.js +45 -0
package/dist/coordinator/paths.js +42 -0
package/dist/coordinator/util.js +129 -0
package/dist/coordinator.js +127 -300
package/dist/dispatch.js +35 -0
package/dist/drive.js +79 -6
package/dist/error-feedback.js +8 -4
package/dist/evidence-reasoning.js +3 -3
package/dist/execution-backend/agent.js +331 -0
package/dist/execution-backend/probes.js +96 -0
package/dist/execution-backend/util.js +47 -0
package/dist/execution-backend.js +73 -421
package/dist/mcp-server.js +79 -183
package/dist/multi-agent/graph.js +84 -0
package/dist/multi-agent/helpers.js +145 -0
package/dist/multi-agent/paths.js +22 -0
package/dist/multi-agent-eval/format.js +194 -0
package/dist/multi-agent-eval/normalize.js +51 -0
package/dist/multi-agent-eval.js +39 -244
package/dist/multi-agent-host.js +0 -19
package/dist/multi-agent.js +125 -314
package/dist/node-snapshot.js +3 -3
package/dist/observability/format.js +61 -0
package/dist/observability/intake.js +98 -0
package/dist/observability.js +14 -160
package/dist/operator-ux/format.js +364 -0
package/dist/operator-ux.js +22 -363
package/dist/orchestrator/lifecycle-operations.js +2 -1
package/dist/orchestrator/report.js +8 -0
package/dist/orchestrator.js +26 -9
package/dist/reclamation.js +26 -21
package/dist/run-export.js +494 -25
package/dist/run-registry/derive.js +172 -0
package/dist/run-registry/format.js +124 -0
package/dist/run-registry/gc.js +251 -0
package/dist/run-registry/policy.js +16 -0
package/dist/run-registry/queue.js +116 -0
package/dist/run-registry.js +89 -597
package/dist/run-state-schema.js +1 -0
package/dist/sandbox-profile.js +43 -2
package/dist/state-explosion/format.js +159 -0
package/dist/state-explosion/helpers.js +82 -0
package/dist/state-explosion.js +165 -304
package/dist/state-node.js +19 -4
package/dist/telemetry-attestation.js +55 -0
package/dist/telemetry-demo.js +15 -3
package/dist/telemetry-ledger.js +60 -15
package/dist/topology.js +25 -8
package/dist/triggers.js +33 -14
package/dist/trust-audit.js +145 -33
package/dist/version.js +1 -1
package/dist/worker-isolation/helpers.js +51 -0
package/dist/worker-isolation/paths.js +46 -0
package/dist/worker-isolation.js +39 -115
package/docs/agent-delegation-drive.7.md +71 -0
package/docs/canonical-workflow-apps.7.md +37 -0
package/docs/cli-mcp-parity.7.md +16 -0
package/docs/contract-migration-tooling.7.md +6 -0
package/docs/control-plane-scheduling.7.md +6 -0
package/docs/dogfood/resume-drive-real-agent-2026-06-14.md +40 -0
package/docs/durable-state-and-locking.7.md +8 -0
package/docs/evidence-adoption-reasoning-chain.7.md +6 -0
package/docs/execution-backends.7.md +6 -0
package/docs/index.md +2 -0
package/docs/launch/demo.tape +28 -0
package/docs/launch/launch-kit.md +96 -17
package/docs/launch/pre-launch-checklist.md +53 -0
package/docs/multi-agent-cli-mcp-surface.7.md +8 -0
package/docs/multi-agent-eval-replay-harness.7.md +6 -0
package/docs/multi-agent-operator-ux.7.md +6 -0
package/docs/multi-agent-trust-policy-audit.7.md +27 -0
package/docs/node-snapshot-diff-replay.7.md +6 -0
package/docs/observability-cost-accounting.7.md +6 -0
package/docs/project-index.md +27 -6
package/docs/real-execution-backends.7.md +6 -0
package/docs/release-and-migration.7.md +8 -0
package/docs/release-tooling.7.md +6 -0
package/docs/routines.md +23 -0
package/docs/run-registry-control-plane.7.md +89 -2
package/docs/run-retention-reclamation.7.md +8 -0
package/docs/source-context-profiles.7.md +119 -0
package/docs/state-explosion-management.7.md +13 -0
package/docs/team-collaboration.7.md +6 -0
package/docs/trust-model.md +267 -0
package/docs/unix-principles.md +49 -1
package/docs/vendor-manifest-loadability.7.md +43 -0
package/docs/web-desktop-workbench.7.md +6 -0
package/manifest/plugin.manifest.json +1 -1
package/manifest/source-context-profiles.json +142 -0
package/package.json +4 -1
package/scripts/agents/builtin-templates.json +7 -0
package/scripts/agents/claude-p-agent.js +129 -43
package/scripts/architecture-review-fast.js +362 -0
package/scripts/bump-version.js +5 -10
package/scripts/canonical-apps-list.js +64 -0
package/scripts/canonical-apps.js +36 -4
package/scripts/coverage-gate.js +211 -0
package/scripts/dogfood-release.js +1 -1
package/scripts/golden-path.js +4 -4
package/scripts/parity-check.js +5 -0
package/scripts/release-check.js +5 -1
package/scripts/source-context.js +291 -0
package/scripts/version-sync-check.js +5 -7
package/skills/ci-triage/SKILL.md +50 -0
package/skills/ci-triage/agents/openai.yaml +4 -0
package/skills/cool-workflow/SKILL.md +4 -1
package/skills/deploy-check/SKILL.md +55 -0
package/skills/deploy-check/agents/openai.yaml +4 -0
package/skills/design-qa/SKILL.md +49 -0
package/skills/design-qa/agents/openai.yaml +4 -0
package/skills/pr-review/SKILL.md +45 -0
package/skills/pr-review/agents/openai.yaml +4 -0
package/dist/capability-dispatcher.js +0 -86

package/dist/capability-core.js CHANGED Viewed

@@ -9,11 +9,12 @@
 // expressed here and called identically by both surfaces. A composite that lives
 // in only one surface is exactly the cross-surface drift v0.1.27 forbids.
 //
-// From v0.1.46: each exported entry function SHOULD self-register its capability
-// metadata via registerCapability() from capability-registry.ts. This replaces
-// the manual "add an entry to the giant array in capability-registry.ts" workflow
-// with automatic discovery. New capabilities just add a registerCapability() call
-// next to their implementation — no need to touch capability-registry.ts.
+// Capability metadata (which entry is on which surface, tool names, jsonMode) is
+// declared in ONE place — the BUILTIN_CAPABILITIES table in capability-registry.ts,
+// the single source of truth both surfaces and the parity gate read. New
+// capabilities add a row there. (A v0.1.46 "self-register at load time" mechanism
+// was removed: the registry snapshot was taken before those registrations ran, so
+// they were silently dead duplicates of the table — see capability-registry.ts.)
 //
 // See docs/cli-mcp-parity.7.md and src/capability-registry.ts.
 var __importDefault = (this && this.__importDefault) || function (mod) {
@@ -35,6 +36,10 @@ exports.runShow = runShow;
 exports.runResume = runResume;
 exports.runArchive = runArchive;
 exports.runRerun = runRerun;
+exports.runExportArchive = runExportArchive;
+exports.runImportArchive = runImportArchive;
+exports.runInspectArchive = runInspectArchive;
+exports.runVerifyImport = runVerifyImport;
 exports.queueAdd = queueAdd;
 exports.queueList = queueList;
 exports.queueDrain = queueDrain;
@@ -62,15 +67,18 @@ exports.withoutRuntimeKeys = withoutRuntimeKeys;
 exports.optionalString = optionalString;
 exports.isRecord = isRecord;
 exports.telemetryVerify = telemetryVerify;
+exports.auditVerify = auditVerify;
 exports.demoTamper = demoTamper;
-const capability_registry_1 = require("./capability-registry");
 const drive_1 = require("./drive");
 const agent_config_1 = require("./agent-config");
 const run_registry_1 = require("./run-registry");
 const observability_1 = require("./observability");
 const telemetry_ledger_1 = require("./telemetry-ledger");
+const telemetry_attestation_1 = require("./telemetry-attestation");
+const trust_audit_1 = require("./trust-audit");
 const telemetry_demo_1 = require("./telemetry-demo");
 const state_1 = require("./state");
+const run_export_1 = require("./run-export");
 const node_fs_1 = __importDefault(require("node:fs"));
 const node_path_1 = __importDefault(require("node:path"));
 const scheduling_1 = require("./scheduling");
@@ -86,8 +94,6 @@ function planSummary(runner, workflowId, options) {
         pendingTasks: run.tasks.filter((task) => task.status === "pending").length
     };
 }
-// Auto-register with the capability registry (v0.1.46 — no need to edit capability-registry.ts)
-(0, capability_registry_1.registerCapability)({ capability: "plan", summary: "Plan a workflow run on a repo + app.", entry: "planSummary", surface: "both", cli: { path: ["plan"], jsonMode: "default" }, mcp: { tool: "cw_plan" } });
 // ---- canonical app-run payload --------------------------------------------
 // Both `cw app run` and `cw_app_run` resolve to this exact object. Structured
 // app inputs + optional sandbox resolution, then a compact operator status.
@@ -113,7 +119,6 @@ function appRun(runner, args) {
         sandboxProfile: resolvedSandbox
     };
 }
-(0, capability_registry_1.registerCapability)({ capability: "app.run", summary: "Plan a run on a named app with structured inputs.", entry: "appRun", surface: "both", cli: { path: ["app", "run"], caseTokens: ["app"], jsonMode: "default" }, mcp: { tool: "cw_app_run" } });
 // ---- canonical sandbox choice payload -------------------------------------
 // Both `cw sandbox choose|resolve` and `cw_sandbox_choose|cw_sandbox_resolve`
 // resolve to this exact object.
@@ -150,7 +155,6 @@ function commitEnvelope(runner, runId, args) {
         commit
     };
 }
-(0, capability_registry_1.registerCapability)({ capability: "commit", summary: "Create a verifier-gated state commit with evidence.", entry: "commitEnvelope", surface: "both", cli: { path: ["commit"], jsonMode: "default" }, mcp: { tool: "cw_commit" }, payloadIdentical: false, reason: "CLI renders a human summary with path hints; MCP returns the structured commit payload alone." });
 function compactOperatorStatus(status) {
     return {
         runId: status.runId,
@@ -194,6 +198,19 @@ function flag(value) {
         return false;
     return Boolean(value);
 }
+function withInvocationCwd(args, fn) {
+    const cwd = optionalString(args.cwd);
+    if (!cwd)
+        return fn();
+    const previous = process.cwd();
+    process.chdir(cwd);
+    try {
+        return fn();
+    }
+    finally {
+        process.chdir(previous);
+    }
+}
 /**
  * Refresh the run registry for the scope selected by `args`, falling back to
  * the "repo" scope (the default handed to `scopeOf`).
  *
  * @returns whatever `reg.refresh` returns.
  */
 function runRegistryRefresh(reg, args) {
     const refreshOptions = { scope: scopeOf(args, "repo") };
     return reg.refresh(refreshOptions);
 }
@@ -225,11 +242,19 @@ function runList(reg, args) {
 /**
  * Show a single run from the registry, using the scope selected by `args`
  * with "home" as the default handed to `scopeOf`.
  *
  * @returns whatever `reg.showRun` returns.
  */
 function runShow(reg, runId, args) {
     const scope = scopeOf(args, "home");
     return reg.showRun(runId, { scope });
 }
-function runResume(reg, runId, args) {
-    return reg.resume(runId, {
+function runResume(reg, runner, runId, args) {
+    const base = reg.resume(runId, {
         scope: scopeOf(args, "home"),
         limit: args.limit === undefined ? undefined : Number(args.limit)
     });
+    // Default (no --drive/--once): read-only, byte-identical to before.
+    if (!isTrue(args.drive) && !isTrue(args.once))
+        return base;
+    // Opt-in continuation: hand the resolved run to the EXISTING agent-delegation
+    // drive loop (re-plans nothing; picks up pending/running tasks from durable
+    // state). An unconfigured agent surfaces drive.status="blocked" (fail-closed).
+    const drive = runDrive(runner, { ...args, runId: base.runId, repo: base.repo, once: isTrue(args.once) });
+    return { ...base, drive };
 }
 function runArchive(reg, runId, args) {
     if (runId) {
@@ -251,6 +276,38 @@ function runArchive(reg, runId, args) {
 /**
  * Ask the registry to rerun `runId`, forwarding the selected scope ("home" is
  * the default handed to `scopeOf`) and the optional `args.reason`.
  *
  * @returns whatever `reg.rerun` returns.
  */
 function runRerun(reg, runId, args) {
     const scope = scopeOf(args, "home");
     const reason = optionalString(args.reason);
     return reg.rerun(runId, { scope, reason });
 }
+function runExportArchive(runner, runId, args) {
+    return withInvocationCwd(args, () => {
+        const output = optionalString(args.output || args.path || args.archive) || `${runId}.cwrun.json`;
+        return (0, run_export_1.exportRun)(runner.loadRun(runId), node_path_1.default.resolve(output));
+    });
+}
+function runImportArchive(runner, args) {
+    return withInvocationCwd(args, () => {
+        const archive = optionalString(args.archive || args.path || args.file);
+        if (!archive)
+            throw new Error("run import requires an archive path (positional, --archive, --path, or --file)");
+        const target = optionalString(args.target || args.repo || args.cwd) || process.cwd();
+        const imported = (0, run_export_1.importRun)(node_path_1.default.resolve(archive), node_path_1.default.resolve(target));
+        const registry = new run_registry_1.RunRegistry(node_path_1.default.resolve(target), runner);
+        const registryReport = registry.refresh({ scope: "repo" });
+        return { ...imported, registry: registryReport };
+    });
+}
+// Read-only: inspect a portable archive's integrity WITHOUT importing it. Routes
+// both surfaces through one shared core entry. The runner is unused (no registry
+// touch — inspection writes nothing) but kept for dispatch-signature symmetry.
+function runInspectArchive(_runner, args) {
+    return withInvocationCwd(args, () => {
+        const archive = optionalString(args.archive || args.path || args.file);
+        if (!archive)
+            throw new Error("run inspect-archive requires an archive path (positional, --archive, --path, or --file)");
+        return (0, run_export_1.inspectArchive)(node_path_1.default.resolve(archive));
+    });
+}
+function runVerifyImport(runner, runId, args) {
+    return withInvocationCwd(args, () => (0, run_export_1.verifyImportedRun)(runner.loadRun(runId)));
+}
 function queueAdd(reg, args) {
     return reg.queueAdd({
         runId: optionalString(args.runId),
@@ -384,7 +441,8 @@ const DRIVE_RUNTIME_KEYS = [
     "agentModel",
     "agent-model",
     "agentTimeoutMs",
-    "agent-timeout-ms"
+    "agent-timeout-ms",
+    "resume"
 ];
 function planInputsFor(args) {
     const copy = withoutRuntimeKeys(args);
@@ -436,6 +494,12 @@ exports.QUICKSTART_DEFAULT_APP = "architecture-review";
 function quickstart(runner, args) {
     const appId = String(args.appId || args.app || args.workflowId || exports.QUICKSTART_DEFAULT_APP);
     const agentConfigured = Boolean((0, agent_config_1.resolveAgentConfig)(args).command || (0, agent_config_1.resolveAgentConfig)(args).endpoint);
+    // `--resume`: a discoverability flag over the existing continuation. With no
+    // `--run`, advance exactly ONE step (reuse the `--once` path) and print a
+    // copy-pasteable continue line; with `--run <id>`, continue that run to
+    // completion (the default drive). It adds no new execution path.
+    const resume = isTrue(args.resume);
+    const resumeRunId = resume ? optionalString(args.runId || args.run) : undefined;
     // `--preview`: read-only, deterministic next-step projection (no spawn, no commit).
     // Plan a fresh run (the read-only first verb) then project the next drive step.
     if (isTrue(args.preview)) {
@@ -460,7 +524,10 @@ function quickstart(runner, args) {
     // Drive end-to-end (or one `--once` step). runDrive plans the run, delegates each
     // worker to the agent backend, and commits — we add only the report write + a
     // single assembled payload. No orchestration is duplicated here.
-    const result = runDrive(runner, { ...args, appId });
+    // `--resume` with no run id advances a single step so a newcomer WITNESSES the
+    // stop-then-resume; with a run id it continues to completion. Non-resume paths
+    // are untouched (byte-identical default).
+    const result = runDrive(runner, { ...args, appId, ...(resume && !resumeRunId ? { once: true } : {}) });
     // Always (re)write the report so the one command yields a report.md on disk, even
     // when the drive blocked/parked (a partial report is still useful triage).
     const cwd0 = process.cwd();
@@ -492,7 +559,9 @@ function quickstart(runner, args) {
         hint = `the drive is blocked — inspect: cw run drive ${result.runId}`;
     }
     else if (result.status === "in-progress") {
-        hint = `one step advanced (--once) — continue: cw quickstart ${appId} --run ${result.runId} --once`;
+        hint = resume
+            ? `one step advanced — continue: cw quickstart ${appId} --run ${result.runId} --resume`
+            : `one step advanced (--once) — continue: cw quickstart ${appId} --run ${result.runId} --once`;
     }
     return {
         schemaVersion: 1,
@@ -508,7 +577,11 @@ function quickstart(runner, args) {
         statePath: result.statePath,
         agentConfigured,
         steps: result.steps,
-        hint
+        hint,
+        // Stamp resumedFrom ONLY when we continued an explicit run. Conditional spread
+        // keeps the key absent on the default/fresh path (own-property absent + omitted
+        // by JSON.stringify), so default output is byte-identical.
+        ...(resumeRunId ? { resumedFrom: resumeRunId } : {})
     };
 }
 /** Read-only, deterministic projection of the effective agent config (secret-stripped). */
@@ -642,15 +715,57 @@ function telemetryVerify(runner, args) {
         throw new Error("telemetry verify requires a run id (cw telemetry verify <run-id>)");
     const run = runner.loadRun(runId);
     const v = (0, telemetry_ledger_1.verifyTelemetryLedger)(run);
+    // Opt-in independent signature re-verification. verifyTelemetryLedger re-proves
+    // the chain (so the stored attestation verdicts were not edited); supplying the
+    // trust public key (--pubkey / CW_AGENT_ATTEST_PUBKEY) additionally RE-RUNS the
+    // ed25519 check over each `attested` record's stored raw usage rather than
+    // trusting that verdict, so a forged signature can no longer ride a green chain.
+    const trustPublicKeyInput = optionalString(args.pubkey || args.pubKey || args.publicKey) || process.env.CW_AGENT_ATTEST_PUBKEY;
+    const trustPublicKey = (0, telemetry_attestation_1.resolveTrustPublicKey)(trustPublicKeyInput);
+    const keyChecks = trustPublicKeyInput && !trustPublicKey
+        ? [{ name: "signature-key", pass: false, code: "telemetry-pubkey-unreadable" }]
+        : [];
+    const sig = (0, telemetry_attestation_1.verifyTelemetrySignatures)(v.records, trustPublicKey);
+    const failedChecks = [...v.checks.filter((c) => !c.pass), ...keyChecks, ...sig.checks.filter((c) => !c.pass)];
     return {
         schemaVersion: 1,
         runId: run.id,
         present: v.present,
-        verified: v.verified,
+        // Chain integrity AND (when a key was supplied) every attested signature must
+        // re-verify. With no key, sig.failed is 0 → unchanged chain-only behavior.
+        verified: v.verified && keyChecks.length === 0 && sig.failed === 0,
         records: v.records.length,
         attested: v.attested,
         unattested: v.unattested,
         absent: v.absent,
+        signatureKeyProvided: sig.keyProvided,
+        signaturesChecked: sig.checked,
+        signaturesReverified: sig.reverified,
+        signaturesFailed: sig.failed,
+        failedChecks: failedChecks.map((c) => ({ name: c.name, code: c.code }))
+    };
+}
+// audit.verify — fail-closed re-prove of a run's trust-audit hash chain. The peer
+// of telemetry.verify for the sandbox/policy/commit-gate decision log: recomputes
+// every event hash from genesis, checks chain linkage, and catches the
+// unchained-event forgery. Exposed as a verb (not just embedded in `audit summary`,
+// which always exits 0) so `cw audit verify <run> && deploy` can gate on the exit
+// code. POLA: a run with no audit log is present:false / verified:true / exit 0.
+function auditVerify(runner, args) {
+    const runId = optionalString(args.runId || args.run);
+    if (!runId)
+        throw new Error("audit verify requires a run id (cw audit verify <run-id>)");
+    const run = runner.loadRun(runId);
+    const v = (0, trust_audit_1.verifyTrustAudit)(run);
+    return {
+        schemaVersion: 1,
+        runId: run.id,
+        present: v.present,
+        verified: v.verified,
+        eventCount: v.eventCount,
+        chained: v.chained,
+        unchained: v.unchained,
+        corruptLines: v.corruptLines,
         failedChecks: v.checks.filter((c) => !c.pass).map((c) => ({ name: c.name, code: c.code }))
     };
 }