npm - @delegance/claude-autopilot - Versions diffs - 5.2.2 → 6.2.2 - Mend

@delegance/claude-autopilot 5.2.2 → 6.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (130) hide show

package/CHANGELOG.md +1027 -1
package/README.md +104 -17
package/dist/src/adapters/council/claude.js +2 -1
package/dist/src/adapters/council/openai.js +14 -7
package/dist/src/adapters/deploy/_http.d.ts +43 -0
package/dist/src/adapters/deploy/_http.js +99 -0
package/dist/src/adapters/deploy/fly.d.ts +206 -0
package/dist/src/adapters/deploy/fly.js +696 -0
package/dist/src/adapters/deploy/generic.d.ts +39 -0
package/dist/src/adapters/deploy/generic.js +98 -0
package/dist/src/adapters/deploy/index.d.ts +15 -0
package/dist/src/adapters/deploy/index.js +78 -0
package/dist/src/adapters/deploy/render.d.ts +181 -0
package/dist/src/adapters/deploy/render.js +550 -0
package/dist/src/adapters/deploy/types.d.ts +221 -0
package/dist/src/adapters/deploy/types.js +15 -0
package/dist/src/adapters/deploy/vercel.d.ts +143 -0
package/dist/src/adapters/deploy/vercel.js +426 -0
package/dist/src/adapters/pricing.d.ts +36 -0
package/dist/src/adapters/pricing.js +40 -0
package/dist/src/adapters/review-engine/claude.js +2 -1
package/dist/src/adapters/review-engine/codex.js +12 -8
package/dist/src/adapters/review-engine/gemini.js +2 -1
package/dist/src/adapters/review-engine/openai-compatible.js +2 -1
package/dist/src/adapters/sdk-loader.d.ts +15 -0
package/dist/src/adapters/sdk-loader.js +77 -0
package/dist/src/cli/autopilot.d.ts +71 -0
package/dist/src/cli/autopilot.js +735 -0
package/dist/src/cli/brainstorm.d.ts +23 -0
package/dist/src/cli/brainstorm.js +131 -0
package/dist/src/cli/costs.d.ts +15 -1
package/dist/src/cli/costs.js +99 -10
package/dist/src/cli/deploy.d.ts +71 -0
package/dist/src/cli/deploy.js +539 -0
package/dist/src/cli/fix.d.ts +18 -0
package/dist/src/cli/fix.js +105 -11
package/dist/src/cli/help-text.d.ts +52 -0
package/dist/src/cli/help-text.js +400 -0
package/dist/src/cli/implement.d.ts +91 -0
package/dist/src/cli/implement.js +196 -0
package/dist/src/cli/index.js +784 -222
package/dist/src/cli/json-envelope.d.ts +187 -0
package/dist/src/cli/json-envelope.js +270 -0
package/dist/src/cli/json-mode.d.ts +33 -0
package/dist/src/cli/json-mode.js +201 -0
package/dist/src/cli/migrate.d.ts +111 -0
package/dist/src/cli/migrate.js +305 -0
package/dist/src/cli/plan.d.ts +81 -0
package/dist/src/cli/plan.js +149 -0
package/dist/src/cli/pr.d.ts +106 -0
package/dist/src/cli/pr.js +191 -19
package/dist/src/cli/preflight.js +102 -1
package/dist/src/cli/review.d.ts +27 -0
package/dist/src/cli/review.js +126 -0
package/dist/src/cli/runs-watch-renderer.d.ts +45 -0
package/dist/src/cli/runs-watch-renderer.js +275 -0
package/dist/src/cli/runs-watch.d.ts +41 -0
package/dist/src/cli/runs-watch.js +395 -0
package/dist/src/cli/runs.d.ts +122 -0
package/dist/src/cli/runs.js +902 -0
package/dist/src/cli/scan.d.ts +93 -0
package/dist/src/cli/scan.js +166 -40
package/dist/src/cli/spec.d.ts +66 -0
package/dist/src/cli/spec.js +132 -0
package/dist/src/cli/validate.d.ts +29 -0
package/dist/src/cli/validate.js +131 -0
package/dist/src/core/config/schema.d.ts +43 -0
package/dist/src/core/config/schema.js +25 -0
package/dist/src/core/config/types.d.ts +17 -0
package/dist/src/core/council/runner.d.ts +10 -1
package/dist/src/core/council/runner.js +25 -3
package/dist/src/core/council/types.d.ts +7 -0
package/dist/src/core/errors.d.ts +1 -1
package/dist/src/core/errors.js +12 -0
package/dist/src/core/logging/redaction.d.ts +13 -0
package/dist/src/core/logging/redaction.js +20 -0
package/dist/src/core/migrate/detector-rules.js +6 -0
package/dist/src/core/migrate/schema-validator.js +22 -1
package/dist/src/core/phases/static-rules.d.ts +5 -1
package/dist/src/core/phases/static-rules.js +2 -5
package/dist/src/core/run-state/budget.d.ts +88 -0
package/dist/src/core/run-state/budget.js +141 -0
package/dist/src/core/run-state/cli-internal.d.ts +21 -0
package/dist/src/core/run-state/cli-internal.js +174 -0
package/dist/src/core/run-state/events.d.ts +59 -0
package/dist/src/core/run-state/events.js +504 -0
package/dist/src/core/run-state/lock.d.ts +61 -0
package/dist/src/core/run-state/lock.js +206 -0
package/dist/src/core/run-state/phase-context.d.ts +60 -0
package/dist/src/core/run-state/phase-context.js +108 -0
package/dist/src/core/run-state/phase-registry.d.ts +137 -0
package/dist/src/core/run-state/phase-registry.js +162 -0
package/dist/src/core/run-state/phase-runner.d.ts +80 -0
package/dist/src/core/run-state/phase-runner.js +447 -0
package/dist/src/core/run-state/provider-readback.d.ts +130 -0
package/dist/src/core/run-state/provider-readback.js +426 -0
package/dist/src/core/run-state/replay-decision.d.ts +69 -0
package/dist/src/core/run-state/replay-decision.js +144 -0
package/dist/src/core/run-state/resolve-engine.d.ts +100 -0
package/dist/src/core/run-state/resolve-engine.js +190 -0
package/dist/src/core/run-state/resume-preflight.d.ts +66 -0
package/dist/src/core/run-state/resume-preflight.js +116 -0
package/dist/src/core/run-state/run-phase-with-lifecycle.d.ts +73 -0
package/dist/src/core/run-state/run-phase-with-lifecycle.js +186 -0
package/dist/src/core/run-state/runs.d.ts +57 -0
package/dist/src/core/run-state/runs.js +288 -0
package/dist/src/core/run-state/snapshot.d.ts +14 -0
package/dist/src/core/run-state/snapshot.js +114 -0
package/dist/src/core/run-state/state.d.ts +40 -0
package/dist/src/core/run-state/state.js +164 -0
package/dist/src/core/run-state/types.d.ts +278 -0
package/dist/src/core/run-state/types.js +13 -0
package/dist/src/core/run-state/ulid.d.ts +11 -0
package/dist/src/core/run-state/ulid.js +95 -0
package/dist/src/core/schema-alignment/extractor/index.d.ts +1 -1
package/dist/src/core/schema-alignment/extractor/index.js +2 -2
package/dist/src/core/schema-alignment/extractor/prisma.d.ts +13 -1
package/dist/src/core/schema-alignment/extractor/prisma.js +65 -10
package/dist/src/core/schema-alignment/git-history.d.ts +19 -0
package/dist/src/core/schema-alignment/git-history.js +53 -0
package/dist/src/core/static-rules/rules/brand-tokens.js +2 -2
package/dist/src/core/static-rules/rules/schema-alignment.js +14 -4
package/package.json +9 -5
package/scripts/autoregress.ts +3 -2
package/skills/claude-autopilot.md +1 -1
package/skills/make-interfaces-feel-better/SKILL.md +104 -0
package/skills/migrate/SKILL.md +193 -47
package/skills/simplify-ui/SKILL.md +103 -0
package/skills/ui/SKILL.md +117 -0
package/skills/ui-ux-pro-max/SKILL.md +90 -0

package/dist/src/core/run-state/run-phase-with-lifecycle.js ADDED Viewed

@@ -0,0 +1,186 @@
+// src/core/run-state/run-phase-with-lifecycle.ts
+//
+// v6.0.6 — extract the lifecycle wrapper that's been duplicated across
+// every wrapped CLI verb (`scan`, `costs`, `fix`, `brainstorm`, `spec`,
+// `plan`, `review`, `validate`). The pattern is mechanical:
+//
+//   1. If engine-off → run the legacy phase body via `runEngineOff()` and
+//      return its result.
+//   2. If engine-on → createRun → optional run.warning for invalid env →
+//      runPhase → emit run.complete (success or failed) → refresh state.json
+//      → release lock (best effort, in finally).
+//
+// This helper sits ON TOP of `runPhase()` from `phase-runner.ts` — it does
+// not replace it. Callers continue to define their own `RunPhase<I, O>` with
+// per-phase `idempotent` / `hasSideEffects` / `run` and pass it in.
+//
+// Why now: with 8 of 11 phases wrapped (the v6.0.5 milestone), the pattern
+// is fully evidenced. The remaining 3 phases (`implement`, `migrate`, `pr`)
+// are side-effecting and need externalRefs — those will inform a v6.0.7+
+// extension to this helper but won't change its core shape. Doing the
+// extraction now means those 3 wraps build against the helper instead of
+// re-introducing the boilerplate.
+//
+// What this helper does NOT do:
+//   - Print success banners — rendering stays in the caller.
+//   - Decide engine-off behavior — that's `runEngineOff`, supplied by the
+//     caller (typically a thin closure over the phase body).
+//   - Plumb externalRefs / readback — the underlying `runPhase()` already
+//     handles those. This helper just owns the run-level lifecycle events.
+//
+// Future extension (v6.0.7+): `implement` / `migrate` / `pr` need
+// externalRef ledger entries (`git-remote-push`, `migration-version`,
+// `github-pr`). The helper's `phase.run` already receives `ctx` so
+// `ctx.emitExternalRef()` works without changes here. If a future PR needs
+// to fan-in run-wide externalRefs from multiple phases (multi-phase
+// pipelines, e.g. autopilot orchestrator), the signature can grow a
+// `phases: RunPhase[]` overload — but the single-phase shape stays identical.
+import { createRun } from "./runs.js";
+import { runPhase } from "./phase-runner.js";
+import { appendEvent, replayState } from "./events.js";
+import { writeStateSnapshot } from "./state.js";
+import { resolveEngineEnabled, emitEngineOffDeprecationWarning, } from "./resolve-engine.js";
+// Inline ANSI codes — same shape every wrapped verb uses. Kept here so the
+// helper doesn't depend on a verb-local `fmt`. The error message format
+// (`[<phase>] engine: phase failed — <msg>` + dim inspect hint) is
+// byte-for-byte identical to what every wrapped phase printed pre-extract.
+const ANSI_RESET = '\x1b[0m';
+const ANSI_DIM = '\x1b[2m';
+const ANSI_RED = '\x1b[31m';
+/** Drive a single-phase engine run with full lifecycle instrumentation,
+ *  OR fall through to the legacy `runEngineOff` callback when the engine
+ *  is disabled by config / CLI / env precedence.
+ *
+ *  Engine-on lifecycle (in order):
+ *    createRun → (optional run.warning for invalid env) → runPhase →
+ *    run.complete (success or failed) → refresh state.json → release lock.
+ *
+ *  On phase failure the helper:
+ *    1. Emits `run.complete` with `status: 'failed'`.
+ *    2. Refreshes state.json from the replayed events.
+ *    3. Prints the legacy `[<phase>] engine: phase failed — <msg>` banner
+ *       to stderr (byte-for-byte identical to the inline pattern that
+ *       lived in 8 of 8 wrapped verbs pre-v6.0.6).
+ *    4. Releases the lock and re-throws so the caller can return its
+ *       legacy non-zero exit code.
+ *
+ *  The lock release in `finally` is best-effort. `release()` is idempotent
+ *  (the runs lock module accepts double-release without throwing), so the
+ *  catch block does not need to release the lock itself — `finally` covers
+ *  both the success and failure exit paths. */
+export async function runPhaseWithLifecycle(opts) {
+    const { cwd, phase, input, config, cliEngine, envEngine, runEngineOff } = opts;
+    // Resolve engine via the canonical precedence (CLI > env > config >
+    // built-in default). The resolver is pure — same inputs always produce
+    // the same decision. We DO consult the loaded config's `engine.enabled`
+    // here so the helper's caller doesn't have to repeat the conditional
+    // spread that every wrapped verb wrote inline.
+    const engineResolved = resolveEngineEnabled({
+        ...(cliEngine !== undefined ? { cliEngine } : {}),
+        ...(envEngine !== undefined ? { envValue: envEngine } : {}),
+        ...(typeof config.engine?.enabled === 'boolean'
+            ? { configEnabled: config.engine.enabled }
+            : {}),
+    });
+    if (!engineResolved.enabled) {
+        // Engine off — call the caller's legacy path. No run dir, no events,
+        // no lifecycle work. Behavior is byte-for-byte identical to pre-engine
+        // versions of the verb. v6.1+ emits a one-line stderr deprecation
+        // notice when the user explicitly opted out (CLI / env / config); the
+        // v6.1 default is `enabled: true`, so a `'default'` source can't reach
+        // this branch and the deprecation helper no-ops on the `enabled: true`
+        // path. v7 removes the opt-out entirely.
+        emitEngineOffDeprecationWarning(engineResolved);
+        const output = await runEngineOff();
+        return { output, runId: null, runDir: null };
+    }
+    // Engine on — full lifecycle. Mirrors the pre-v6.0.6 inline shape that
+    // every wrapped verb duplicated.
+    const created = await createRun({
+        cwd,
+        phases: [phase.name],
+        config: {
+            engine: { enabled: true, source: engineResolved.source },
+            ...(engineResolved.invalidEnvValue !== undefined
+                ? { invalidEnvValue: engineResolved.invalidEnvValue }
+                : {}),
+        },
+    });
+    if (engineResolved.invalidEnvValue !== undefined) {
+        // Surface the invalid env value as a typed warning so observers
+        // (`runs show <id> --events`) can attribute the fallthrough.
+        appendEvent(created.runDir, {
+            event: 'run.warning',
+            message: `invalid CLAUDE_AUTOPILOT_ENGINE=${JSON.stringify(engineResolved.invalidEnvValue)} ignored`,
+            details: { resolution: engineResolved },
+        }, { writerId: created.lock.writerId, runId: created.runId });
+    }
+    const runStartedAt = Date.now();
+    try {
+        const output = await runPhase(phase, input, {
+            runDir: created.runDir,
+            runId: created.runId,
+            writerId: created.lock.writerId,
+            phaseIdx: 0,
+        });
+        // Final lifecycle event — run.complete. The runner doesn't emit this
+        // on its own; it's the caller's responsibility (multi-phase pipelines
+        // emit it after the LAST phase, single-phase wrappers like this emit
+        // after the only phase). Total cost falls back to 0 when the phase
+        // doesn't expose a `costUSD` field on its output (read-only verbs
+        // don't track cost; scan does).
+        const totalCostUSD = extractCostUSD(output);
+        appendEvent(created.runDir, {
+            event: 'run.complete',
+            status: 'success',
+            totalCostUSD,
+            durationMs: Date.now() - runStartedAt,
+        }, { writerId: created.lock.writerId, runId: created.runId });
+        // Refresh state.json from the replayed events. The events.ndjson is
+        // the source of truth; state.json is a derived snapshot that we MUST
+        // rewrite after run.complete so `runs show` / `runs list` reflect the
+        // terminal status without needing to replay on every read.
+        writeStateSnapshot(created.runDir, replayState(created.runDir));
+        return { output, runId: created.runId, runDir: created.runDir };
+    }
+    catch (err) {
+        // Engine-on failure — write run.complete with failed status, refresh
+        // state.json, print the legacy banner to stderr, then re-throw so the
+        // caller can return its legacy non-zero exit code. (Lock release
+        // happens in `finally` regardless of success / failure path.)
+        appendEvent(created.runDir, {
+            event: 'run.complete',
+            status: 'failed',
+            totalCostUSD: 0,
+            durationMs: Date.now() - runStartedAt,
+        }, { writerId: created.lock.writerId, runId: created.runId });
+        writeStateSnapshot(created.runDir, replayState(created.runDir));
+        const message = err instanceof Error ? err.message : String(err);
+        process.stderr.write(`${ANSI_RED}[${phase.name}] engine: phase failed — ${message}${ANSI_RESET}\n`);
+        process.stderr.write(`${ANSI_DIM}  inspect: claude-autopilot runs show ${created.runId} --events${ANSI_RESET}\n`);
+        throw err;
+    }
+    finally {
+        // Best-effort lock release. The lock module's `release()` is
+        // idempotent; if the catch path already released (it doesn't, but a
+        // future change might), this is a no-op. Wrapping the await in
+        // `.catch(() => {})` ensures a release error never masks the original
+        // throw — the spec calls this out explicitly.
+        await created.lock.release().catch(() => { });
+    }
+}
+/** Extract `costUSD` from a phase output if present, else 0. JSON-style
+ *  duck-typing: we accept any output that exposes a numeric `costUSD`
+ *  field. Today only `scan` exposes one; the other 7 wrapped verbs
+ *  return outputs without a cost field, which means `extractCostUSD`
+ *  returns 0 — byte-for-byte matching the inline `totalCostUSD: 0` they
+ *  used pre-v6.0.6. */
+function extractCostUSD(output) {
+    if (output !== null && typeof output === 'object' && 'costUSD' in output) {
+        const v = output.costUSD;
+        if (typeof v === 'number' && Number.isFinite(v))
+            return v;
+    }
+    return 0;
+}
+//# sourceMappingURL=run-phase-with-lifecycle.js.map

package/dist/src/core/run-state/runs.d.ts ADDED Viewed

@@ -0,0 +1,57 @@
+import { type RunLockHandle } from './lock.ts';
+import { type RunIndex, type RunIndexEntry, type RunState } from './types.ts';
+/** Path of the runs directory: `<cwd>/.guardrail-cache/runs`. */
+export declare function runsRoot(cwd: string): string;
+/** Path of the run index cache file: `index.json` inside `runsRoot(cwd)`. */
+export declare function indexPath(cwd: string): string;
+/** Path of a single run's directory: `<runId>` inside `runsRoot(cwd)`. */
+export declare function runDirFor(cwd: string, runId: string): string;
+/** Inputs accepted by `createRun`. */
+export interface CreateRunOptions {
+    /** Project directory; the run directory is created beneath
+     *  `<cwd>/.guardrail-cache/runs/`. */
+    cwd: string;
+    /** Phase names in the order they will execute. Must be non-empty —
+     *  `createRun` throws otherwise. */
+    phases: string[];
+    /** Snapshot of the relevant guardrail.config.yaml fields. Free-form.
+     *  When provided it is copied into the initial state and the
+     *  `run.start` event. */
+    config?: Record<string, unknown>;
+}
+/** What `createRun` returns to its caller. */
+export interface CreateRunResult {
+    /** Freshly generated ULID identifying the run. */
+    runId: string;
+    /** Directory created for this run. */
+    runDir: string;
+    /** Initial run state as written to state.json. */
+    state: RunState;
+    /** Lock handle. Caller MUST `release()` on shutdown. */
+    lock: RunLockHandle;
+}
+/** Create a fresh run directory, acquire its advisory lock, write the
+ *  initial state.json, and emit the `run.start` event. The run index is
+ *  refreshed afterwards on a best-effort basis.
+ *
+ *  Throws a plain Error if `opts.phases` is not a non-empty array.
+ *
+ *  Throws GuardrailError(lock_held) if a stale lock exists for the freshly-
+ *  generated runId — extremely unlikely (ULIDs are unique) but possible if
+ *  two parallel invocations on the same OS clock collide on a leftover dir
+ *  on disk. Caller can simply retry. */
+export declare function createRun(opts: CreateRunOptions): Promise<CreateRunResult>;
+/** Rebuild index.json from each run dir's state.json (or replayed state if
+ *  the snapshot is missing / corrupt). Newest-first ordering by ULID.
+ *  Run directories that cannot be read are left out of the index. The
+ *  rebuilt index is written to disk and also returned. */
+export declare function rebuildIndex(cwd: string): RunIndex;
+/** Options for `listRuns`. */
+export interface ListRunsOptions {
+    /** Force a rebuild from disk even if index.json is fresh. */
+    rebuild?: boolean;
+}
+/** List all runs, newest-first. Lazily rebuilds index.json if it is
+ *  missing or cannot be parsed. */
+export declare function listRuns(cwd: string, opts?: ListRunsOptions): RunIndexEntry[];
+/** Options for `gcRuns`. */
+export interface GcRunsOptions {
+    /** Delete completed runs older than this many days. Required. */
+    olderThanDays: number;
+    /** Don't actually delete; just return what would be removed. */
+    dryRun?: boolean;
+    /** Override "now" for tests. Default Date.now(). */
+    now?: number;
+}
+/** Outcome of a `gcRuns` pass; every inspected run directory lands in
+ *  exactly one of the three lists. */
+export interface GcRunsResult {
+    /** runIds that were (or would be) deleted. */
+    deleted: string[];
+    /** runIds skipped because they're still active or too young. */
+    kept: string[];
+    /** runIds skipped for safety reasons (symlink, suspicious path). Also
+     *  used when a directory has no readable state.json and its name does
+     *  not decode as a ULID, and when the delete itself fails. */
+    skippedUnsafe: string[];
+}
+/** Delete completed runs older than N days. Honors the spec's symlink
+ *  safety: uses lstat so we never traverse a symlink out of the runs/
+ *  tree. Runs without a readable state.json are aged by the timestamp
+ *  encoded in their ULID instead. The index is rebuilt after a non-dry
+ *  pass that deleted at least one run. */
+export declare function gcRuns(cwd: string, opts: GcRunsOptions): GcRunsResult;
+//# sourceMappingURL=runs.d.ts.map

package/dist/src/core/run-state/runs.js ADDED Viewed

@@ -0,0 +1,288 @@
+// src/core/run-state/runs.ts
+//
+// Top-level Run State Engine helpers — createRun, listRuns, gcRuns. These
+// are the entry points the (yet-to-be-built) phase wrapper, CLI, and budget
+// enforcer will call. Phase 1 ships only the data layer; later phases build
+// on top.
+//
+// Spec: docs/specs/v6-run-state-engine.md "State on disk", "Run lifecycle",
+// "Resume command".
+import * as fs from 'node:fs';
+import * as path from 'node:path';
+import { ulid, decodeTime } from "./ulid.js";
+import { acquireRunLock } from "./lock.js";
+import { appendEvent, foldEvents, readEvents, stateToIndexEntry } from "./events.js";
+import { writeStateSnapshot } from "./state.js";
+import { RUN_STATE_SCHEMA_VERSION, } from "./types.js";
+// Cache directory, resolved under the caller's cwd, that contains RUNS_DIR.
+const CACHE_DIR = '.guardrail-cache';
+// Subdirectory of CACHE_DIR holding one directory per run plus the index.
+const RUNS_DIR = 'runs';
+// File name of the run index cache inside the runs directory.
+const INDEX_FILE = 'index.json';
+export function runsRoot(cwd) {
+    return path.join(cwd, CACHE_DIR, RUNS_DIR);
+}
+export function indexPath(cwd) {
+    return path.join(runsRoot(cwd), INDEX_FILE);
+}
+export function runDirFor(cwd, runId) {
+    return path.join(runsRoot(cwd), runId);
+}
+/** Create a fresh run directory, acquire its advisory lock, write the
+ *  initial state.json, and emit the `run.start` event.
+ *
+ *  Throws GuardrailError(lock_held) if a stale lock exists for the freshly-
+ *  generated runId — extremely unlikely (ULIDs are unique) but possible if
+ *  two parallel invocations on the same OS clock collide on a leftover dir
+ *  on disk. Caller can simply retry. */
+export async function createRun(opts) {
+    if (!Array.isArray(opts.phases) || opts.phases.length === 0) {
+        throw new Error('createRun: phases[] must be a non-empty array');
+    }
+    const runId = ulid();
+    const runDir = runDirFor(opts.cwd, runId);
+    fs.mkdirSync(runDir, { recursive: true });
+    // Acquire BEFORE first event write so writerId is well-defined.
+    const lock = await acquireRunLock(runDir);
+    // Seed the state snapshot first (with no events yet) so that even a crash
+    // before run.start lands leaves a recoverable artifact.
+    const startedAt = new Date(decodeTime(runId)).toISOString();
+    const initialState = {
+        schema_version: RUN_STATE_SCHEMA_VERSION,
+        runId,
+        startedAt,
+        status: 'pending',
+        phases: opts.phases.map((name, idx) => ({
+            schema_version: RUN_STATE_SCHEMA_VERSION,
+            name,
+            index: idx,
+            status: 'pending',
+            idempotent: false,
+            hasSideEffects: false,
+            costUSD: 0,
+            attempts: 0,
+            artifacts: [],
+            externalRefs: [],
+        })),
+        currentPhaseIdx: 0,
+        totalCostUSD: 0,
+        lastEventSeq: 0,
+        writerId: lock.writerId,
+        cwd: opts.cwd,
+        ...(opts.config !== undefined ? { config: opts.config } : {}),
+    };
+    writeStateSnapshot(runDir, initialState);
+    // Emit run.start. The appender owns the seq counter.
+    const startEvent = appendEvent(runDir, {
+        event: 'run.start',
+        phases: opts.phases,
+        ...(opts.config !== undefined ? { config: opts.config } : {}),
+    }, { writerId: lock.writerId, runId });
+    // Refresh the snapshot to reflect lastEventSeq=1.
+    initialState.lastEventSeq = startEvent.seq;
+    writeStateSnapshot(runDir, initialState);
+    // Refresh the index (best-effort — index is a pure cache).
+    try {
+        rebuildIndex(opts.cwd);
+    }
+    catch {
+        // Index failure shouldn't block the run.
+    }
+    return { runId, runDir, state: initialState, lock };
+}
+// ----------------------------------------------------------------------------
+// Listing + indexing.
+// ----------------------------------------------------------------------------
+function readIndex(cwd) {
+    const p = indexPath(cwd);
+    if (!fs.existsSync(p))
+        return null;
+    try {
+        return JSON.parse(fs.readFileSync(p, 'utf8'));
+    }
+    catch {
+        return null; // treat unreadable index as missing — it's a cache
+    }
+}
+function writeIndex(cwd, index) {
+    fs.mkdirSync(runsRoot(cwd), { recursive: true });
+    fs.writeFileSync(indexPath(cwd), JSON.stringify(index, null, 2), 'utf8');
+}
+/** Rebuild index.json from each run dir's state.json (or replayed state if
+ *  the snapshot is missing / corrupt). Newest-first ordering by ULID. */
+export function rebuildIndex(cwd) {
+    const root = runsRoot(cwd);
+    const entries = [];
+    if (!fs.existsSync(root)) {
+        const empty = { schema_version: RUN_STATE_SCHEMA_VERSION, runs: [] };
+        writeIndex(cwd, empty);
+        return empty;
+    }
+    const dirents = fs.readdirSync(root, { withFileTypes: true });
+    for (const d of dirents) {
+        if (!d.isDirectory())
+            continue;
+        const runId = d.name;
+        const runDir = path.join(root, runId);
+        let state;
+        let recovered = false;
+        try {
+            // We don't hold the lock during a list — listing is read-only and
+            // races with a concurrent writer are tolerated (we may briefly read
+            // a stale snapshot, which is fine). For replay-recovery we DO need
+            // a writerId, but only if the snapshot is bad; if so the run isn't
+            // healthy anyway, and we use a synthetic writerId so we never
+            // mutate the run's events.ndjson during a list operation.
+            // Instead of recoverState (which writes events) we just replay
+            // in-memory.
+            const fromEvents = readEvents(runDir);
+            // Build a fresh snapshot if state.json is missing or unreadable.
+            // Use the project-internal file paths to avoid pulling readState
+            // here just to throw.
+            const stateFilePath = path.join(runDir, 'state.json');
+            if (fs.existsSync(stateFilePath)) {
+                try {
+                    state = JSON.parse(fs.readFileSync(stateFilePath, 'utf8'));
+                }
+                catch {
+                    // fall through to replay
+                    recovered = true;
+                    // Replay needs the events; if the events are also corrupt we
+                    // surface the error via skip.
+                    state = replayInMemory(runDir, fromEvents.events);
+                }
+            }
+            else {
+                recovered = true;
+                state = replayInMemory(runDir, fromEvents.events);
+            }
+        }
+        catch {
+            // Corrupt run dir — skip from the index entirely. `runs doctor`
+            // (Phase 3) will surface these.
+            continue;
+        }
+        entries.push(stateToIndexEntry(state, recovered));
+    }
+    // ULIDs are sortable; we want NEWEST first → reverse-sort by runId.
+    entries.sort((a, b) => (a.runId < b.runId ? 1 : a.runId > b.runId ? -1 : 0));
+    const index = { schema_version: RUN_STATE_SCHEMA_VERSION, runs: entries };
+    writeIndex(cwd, index);
+    return index;
+}
+/** In-memory replay used by rebuildIndex / listRuns — does NOT write to disk
+ *  or emit events. Lets us pass pre-fetched events so we don't double-read
+ *  the file. */
+function replayInMemory(runDir, events) {
+    return foldEvents(runDir, events);
+}
+/** List all runs, newest-first. Lazily rebuilds index.json if missing. */
+export function listRuns(cwd, opts = {}) {
+    if (opts.rebuild)
+        return rebuildIndex(cwd).runs;
+    const idx = readIndex(cwd);
+    if (idx)
+        return idx.runs;
+    return rebuildIndex(cwd).runs;
+}
+/** Delete completed runs older than N days. Honors the spec's symlink
+ *  safety: uses lstat so we never traverse a symlink out of the runs/
+ *  tree. */
+export function gcRuns(cwd, opts) {
+    const root = runsRoot(cwd);
+    const result = { deleted: [], kept: [], skippedUnsafe: [] };
+    if (!fs.existsSync(root))
+        return result;
+    const cutoff = (opts.now ?? Date.now()) - opts.olderThanDays * 86_400_000;
+    const entries = fs.readdirSync(root, { withFileTypes: true });
+    for (const d of entries) {
+        if (d.name === INDEX_FILE)
+            continue;
+        const runId = d.name;
+        const runDir = path.join(root, runId);
+        // Symlinks (whether to dirs or files) are flagged unsafe. Dirent's
+        // isDirectory() returns FALSE for a symlink even if the target is a
+        // directory, which matches our policy here — we only operate on real
+        // dirs that lstat agrees are not links.
+        if (d.isSymbolicLink()) {
+            result.skippedUnsafe.push(runId);
+            continue;
+        }
+        if (!d.isDirectory())
+            continue;
+        let lst;
+        try {
+            lst = fs.lstatSync(runDir);
+        }
+        catch {
+            result.skippedUnsafe.push(runId);
+            continue;
+        }
+        if (!lst.isDirectory() || lst.isSymbolicLink()) {
+            result.skippedUnsafe.push(runId);
+            continue;
+        }
+        // Read state to decide. If unreadable, skip — `runs doctor` will deal.
+        let state = null;
+        try {
+            const sp = path.join(runDir, 'state.json');
+            if (fs.existsSync(sp)) {
+                state = JSON.parse(fs.readFileSync(sp, 'utf8'));
+            }
+        }
+        catch {
+            // fall through
+        }
+        if (!state) {
+            // Defensive: try to derive from ULID alone for "old enough" check.
+            // If runId isn't a ULID we treat it as suspicious and skip.
+            let createdMs;
+            try {
+                createdMs = decodeTime(runId);
+            }
+            catch {
+                result.skippedUnsafe.push(runId);
+                continue;
+            }
+            if (createdMs >= cutoff) {
+                result.kept.push(runId);
+                continue;
+            }
+            // Fall through — eligible for delete.
+        }
+        else {
+            const terminal = state.status === 'success' || state.status === 'failed' || state.status === 'aborted';
+            if (!terminal) {
+                result.kept.push(runId);
+                continue;
+            }
+            const endMs = state.endedAt ? Date.parse(state.endedAt) : Date.parse(state.startedAt);
+            if (Number.isFinite(endMs) && endMs >= cutoff) {
+                result.kept.push(runId);
+                continue;
+            }
+        }
+        if (opts.dryRun) {
+            result.deleted.push(runId);
+            continue;
+        }
+        try {
+            // Defense in depth: refuse to recurse out via a symlink hidden inside.
+            // fs.rmSync with `force: true, recursive: true` handles dirs but
+            // also follows nothing — it doesn't traverse symlinks for deletion
+            // boundaries (it deletes the link, not the target).
+            fs.rmSync(runDir, { recursive: true, force: true });
+            result.deleted.push(runId);
+        }
+        catch {
+            result.skippedUnsafe.push(runId);
+        }
+    }
+    // Refresh the index after a real GC pass.
+    if (!opts.dryRun && result.deleted.length > 0) {
+        try {
+            rebuildIndex(cwd);
+        }
+        catch { /* index is cache */ }
+    }
+    return result;
+}
+//# sourceMappingURL=runs.js.map

package/dist/src/core/run-state/snapshot.d.ts ADDED Viewed

@@ -0,0 +1,14 @@
+import { type PhaseSnapshot } from './types.ts';
+/** Directory holding the per-phase snapshots of a run: `<runDir>/phases`. */
+export declare function phasesDir(runDir: string): string;
+/** Path of one phase's snapshot file: `<runDir>/phases/<phaseName>.json`.
+ *  Throws GuardrailError(invalid_config) when `phaseName` is empty, not a
+ *  string, or contains characters outside `[A-Za-z0-9._-]`. */
+export declare function phaseSnapshotPath(runDir: string, phaseName: string): string;
+/** Write a per-phase snapshot atomically. Identical sequence to
+ *  state.json:
+ *    open(tmp, 'w') → write → fsync(fd) → close → rename → fsync(dirfd).
+ *
+ *  Any pre-existing snapshot is left untouched until the rename, so a crash
+ *  mid-write leaves the previous snapshot intact. */
+export declare function writePhaseSnapshot(runDir: string, snapshot: PhaseSnapshot): void;
+/** Read a per-phase snapshot. Returns null if missing. Throws
+ *  GuardrailError(corrupted_state) if it's present-but-unparseable. */
+export declare function readPhaseSnapshot(runDir: string, phaseName: string): PhaseSnapshot | null;
+//# sourceMappingURL=snapshot.d.ts.map

package/dist/src/core/run-state/snapshot.js ADDED Viewed

@@ -0,0 +1,114 @@
+// src/core/run-state/snapshot.ts
+//
+// Atomic per-phase snapshot writer/reader. After each phase runs, it gets a
+// `phases/<name>.json` artifact mirroring the corresponding entry in
+// state.json. Writes use the same tmp+rename+fsync protocol as state.json so
+// a crash mid-write never leaves a half-written phase snapshot on disk.
+//
+// Phase 1 left this as a TODO; Phase 2 fills it in to back the lifecycle
+// wrapper (`runPhase`).
+//
+// Spec: docs/specs/v6-run-state-engine.md "State on disk" — `phases/<name>.json`.
+import * as fs from 'node:fs';
+import * as path from 'node:path';
+import { GuardrailError } from "../errors.js";
+// Name of the subdirectory of a run directory that holds the per-phase
+// snapshot files (`phases/<name>.json`).
+const PHASES_DIR = 'phases';
+export function phasesDir(runDir) {
+    return path.join(runDir, PHASES_DIR);
+}
+export function phaseSnapshotPath(runDir, phaseName) {
+    return path.join(phasesDir(runDir), `${sanitizePhaseFilename(phaseName)}.json`);
+}
+/** Reject filename characters that would escape `phases/`. Phase names are
+ *  caller-supplied strings; we bound them to a safe charset rather than
+ *  letting `..` / path separators sneak in.
+ *
+ *  Allowed: ASCII alphanumerics, dash, underscore, dot. Anything else is
+ *  rejected with a typed error so callers can correct the call-site rather
+ *  than silently producing a write to `../somewhere`. */
+function sanitizePhaseFilename(phaseName) {
+    if (!phaseName || typeof phaseName !== 'string') {
+        throw new GuardrailError(`phase snapshot: name must be a non-empty string`, { code: 'invalid_config', provider: 'run-state', details: { phaseName } });
+    }
+    if (!/^[A-Za-z0-9._-]+$/.test(phaseName)) {
+        throw new GuardrailError(`phase snapshot: name "${phaseName}" contains unsupported characters`, { code: 'invalid_config', provider: 'run-state', details: { phaseName } });
+    }
+    return phaseName;
+}
+/** Write a per-phase snapshot atomically. Identical sequence to
+ *  state.json:
+ *    open(tmp, 'w') → write → fsync(fd) → close → rename → fsync(dirfd).
+ *
+ *  Any pre-existing snapshot is left untouched until the rename, so a crash
+ *  mid-write leaves the previous snapshot intact. */
+export function writePhaseSnapshot(runDir, snapshot) {
+    const dir = phasesDir(runDir);
+    fs.mkdirSync(dir, { recursive: true });
+    const target = phaseSnapshotPath(runDir, snapshot.name);
+    const tmp = `${target}.tmp`;
+    const data = JSON.stringify(snapshot, null, 2);
+    const fd = fs.openSync(tmp, 'w');
+    let wroteOk = false;
+    try {
+        fs.writeSync(fd, data);
+        fs.fsyncSync(fd);
+        wroteOk = true;
+    }
+    finally {
+        fs.closeSync(fd);
+        if (!wroteOk) {
+            try {
+                fs.unlinkSync(tmp);
+            }
+            catch { /* ignore */ }
+        }
+    }
+    fs.renameSync(tmp, target);
+    // Best-effort dir fsync for rename durability. Same EISDIR/EPERM/ENOTSUP
+    // tolerance as state.ts (tmpfs / SMB / Windows quirks).
+    try {
+        const dirFd = fs.openSync(dir, 'r');
+        try {
+            fs.fsyncSync(dirFd);
+        }
+        finally {
+            fs.closeSync(dirFd);
+        }
+    }
+    catch (err) {
+        const code = err.code;
+        if (code !== 'EISDIR' && code !== 'EPERM' && code !== 'ENOTSUP') {
+            throw new GuardrailError(`phase snapshot: dir fsync failed: ${err.message}`, {
+                code: 'corrupted_state',
+                provider: 'run-state',
+                details: { runDir, phaseName: snapshot.name, errno: code },
+            });
+        }
+    }
+}
+/** Read a per-phase snapshot. Returns null if missing. Throws
+ *  GuardrailError(corrupted_state) if it's present-but-unparseable. */
+export function readPhaseSnapshot(runDir, phaseName) {
+    const p = phaseSnapshotPath(runDir, phaseName);
+    if (!fs.existsSync(p))
+        return null;
+    const raw = fs.readFileSync(p, 'utf8');
+    if (!raw) {
+        throw new GuardrailError(`phase snapshot: empty file ${p}`, {
+            code: 'corrupted_state',
+            provider: 'run-state',
+            details: { runDir, phaseName },
+        });
+    }
+    try {
+        return JSON.parse(raw);
+    }
+    catch (err) {
+        throw new GuardrailError(`phase snapshot: corrupt JSON: ${err.message}`, {
+            code: 'corrupted_state',
+            provider: 'run-state',
+            details: { runDir, phaseName, error: err.message },
+        });
+    }
+}
+//# sourceMappingURL=snapshot.js.map