npm - @delegance/claude-autopilot - Versions diffs - 5.2.2 → 6.2.2 - Mend

@delegance/claude-autopilot 5.2.2 → 6.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (130) hide show

package/CHANGELOG.md +1027 -1
package/README.md +104 -17
package/dist/src/adapters/council/claude.js +2 -1
package/dist/src/adapters/council/openai.js +14 -7
package/dist/src/adapters/deploy/_http.d.ts +43 -0
package/dist/src/adapters/deploy/_http.js +99 -0
package/dist/src/adapters/deploy/fly.d.ts +206 -0
package/dist/src/adapters/deploy/fly.js +696 -0
package/dist/src/adapters/deploy/generic.d.ts +39 -0
package/dist/src/adapters/deploy/generic.js +98 -0
package/dist/src/adapters/deploy/index.d.ts +15 -0
package/dist/src/adapters/deploy/index.js +78 -0
package/dist/src/adapters/deploy/render.d.ts +181 -0
package/dist/src/adapters/deploy/render.js +550 -0
package/dist/src/adapters/deploy/types.d.ts +221 -0
package/dist/src/adapters/deploy/types.js +15 -0
package/dist/src/adapters/deploy/vercel.d.ts +143 -0
package/dist/src/adapters/deploy/vercel.js +426 -0
package/dist/src/adapters/pricing.d.ts +36 -0
package/dist/src/adapters/pricing.js +40 -0
package/dist/src/adapters/review-engine/claude.js +2 -1
package/dist/src/adapters/review-engine/codex.js +12 -8
package/dist/src/adapters/review-engine/gemini.js +2 -1
package/dist/src/adapters/review-engine/openai-compatible.js +2 -1
package/dist/src/adapters/sdk-loader.d.ts +15 -0
package/dist/src/adapters/sdk-loader.js +77 -0
package/dist/src/cli/autopilot.d.ts +71 -0
package/dist/src/cli/autopilot.js +735 -0
package/dist/src/cli/brainstorm.d.ts +23 -0
package/dist/src/cli/brainstorm.js +131 -0
package/dist/src/cli/costs.d.ts +15 -1
package/dist/src/cli/costs.js +99 -10
package/dist/src/cli/deploy.d.ts +71 -0
package/dist/src/cli/deploy.js +539 -0
package/dist/src/cli/fix.d.ts +18 -0
package/dist/src/cli/fix.js +105 -11
package/dist/src/cli/help-text.d.ts +52 -0
package/dist/src/cli/help-text.js +400 -0
package/dist/src/cli/implement.d.ts +91 -0
package/dist/src/cli/implement.js +196 -0
package/dist/src/cli/index.js +784 -222
package/dist/src/cli/json-envelope.d.ts +187 -0
package/dist/src/cli/json-envelope.js +270 -0
package/dist/src/cli/json-mode.d.ts +33 -0
package/dist/src/cli/json-mode.js +201 -0
package/dist/src/cli/migrate.d.ts +111 -0
package/dist/src/cli/migrate.js +305 -0
package/dist/src/cli/plan.d.ts +81 -0
package/dist/src/cli/plan.js +149 -0
package/dist/src/cli/pr.d.ts +106 -0
package/dist/src/cli/pr.js +191 -19
package/dist/src/cli/preflight.js +102 -1
package/dist/src/cli/review.d.ts +27 -0
package/dist/src/cli/review.js +126 -0
package/dist/src/cli/runs-watch-renderer.d.ts +45 -0
package/dist/src/cli/runs-watch-renderer.js +275 -0
package/dist/src/cli/runs-watch.d.ts +41 -0
package/dist/src/cli/runs-watch.js +395 -0
package/dist/src/cli/runs.d.ts +122 -0
package/dist/src/cli/runs.js +902 -0
package/dist/src/cli/scan.d.ts +93 -0
package/dist/src/cli/scan.js +166 -40
package/dist/src/cli/spec.d.ts +66 -0
package/dist/src/cli/spec.js +132 -0
package/dist/src/cli/validate.d.ts +29 -0
package/dist/src/cli/validate.js +131 -0
package/dist/src/core/config/schema.d.ts +43 -0
package/dist/src/core/config/schema.js +25 -0
package/dist/src/core/config/types.d.ts +17 -0
package/dist/src/core/council/runner.d.ts +10 -1
package/dist/src/core/council/runner.js +25 -3
package/dist/src/core/council/types.d.ts +7 -0
package/dist/src/core/errors.d.ts +1 -1
package/dist/src/core/errors.js +12 -0
package/dist/src/core/logging/redaction.d.ts +13 -0
package/dist/src/core/logging/redaction.js +20 -0
package/dist/src/core/migrate/detector-rules.js +6 -0
package/dist/src/core/migrate/schema-validator.js +22 -1
package/dist/src/core/phases/static-rules.d.ts +5 -1
package/dist/src/core/phases/static-rules.js +2 -5
package/dist/src/core/run-state/budget.d.ts +88 -0
package/dist/src/core/run-state/budget.js +141 -0
package/dist/src/core/run-state/cli-internal.d.ts +21 -0
package/dist/src/core/run-state/cli-internal.js +174 -0
package/dist/src/core/run-state/events.d.ts +59 -0
package/dist/src/core/run-state/events.js +504 -0
package/dist/src/core/run-state/lock.d.ts +61 -0
package/dist/src/core/run-state/lock.js +206 -0
package/dist/src/core/run-state/phase-context.d.ts +60 -0
package/dist/src/core/run-state/phase-context.js +108 -0
package/dist/src/core/run-state/phase-registry.d.ts +137 -0
package/dist/src/core/run-state/phase-registry.js +162 -0
package/dist/src/core/run-state/phase-runner.d.ts +80 -0
package/dist/src/core/run-state/phase-runner.js +447 -0
package/dist/src/core/run-state/provider-readback.d.ts +130 -0
package/dist/src/core/run-state/provider-readback.js +426 -0
package/dist/src/core/run-state/replay-decision.d.ts +69 -0
package/dist/src/core/run-state/replay-decision.js +144 -0
package/dist/src/core/run-state/resolve-engine.d.ts +100 -0
package/dist/src/core/run-state/resolve-engine.js +190 -0
package/dist/src/core/run-state/resume-preflight.d.ts +66 -0
package/dist/src/core/run-state/resume-preflight.js +116 -0
package/dist/src/core/run-state/run-phase-with-lifecycle.d.ts +73 -0
package/dist/src/core/run-state/run-phase-with-lifecycle.js +186 -0
package/dist/src/core/run-state/runs.d.ts +57 -0
package/dist/src/core/run-state/runs.js +288 -0
package/dist/src/core/run-state/snapshot.d.ts +14 -0
package/dist/src/core/run-state/snapshot.js +114 -0
package/dist/src/core/run-state/state.d.ts +40 -0
package/dist/src/core/run-state/state.js +164 -0
package/dist/src/core/run-state/types.d.ts +278 -0
package/dist/src/core/run-state/types.js +13 -0
package/dist/src/core/run-state/ulid.d.ts +11 -0
package/dist/src/core/run-state/ulid.js +95 -0
package/dist/src/core/schema-alignment/extractor/index.d.ts +1 -1
package/dist/src/core/schema-alignment/extractor/index.js +2 -2
package/dist/src/core/schema-alignment/extractor/prisma.d.ts +13 -1
package/dist/src/core/schema-alignment/extractor/prisma.js +65 -10
package/dist/src/core/schema-alignment/git-history.d.ts +19 -0
package/dist/src/core/schema-alignment/git-history.js +53 -0
package/dist/src/core/static-rules/rules/brand-tokens.js +2 -2
package/dist/src/core/static-rules/rules/schema-alignment.js +14 -4
package/package.json +9 -5
package/scripts/autoregress.ts +3 -2
package/skills/claude-autopilot.md +1 -1
package/skills/make-interfaces-feel-better/SKILL.md +104 -0
package/skills/migrate/SKILL.md +193 -47
package/skills/simplify-ui/SKILL.md +103 -0
package/skills/ui/SKILL.md +117 -0
package/skills/ui-ux-pro-max/SKILL.md +90 -0

package/dist/src/core/run-state/provider-readback.js ADDED Viewed

@@ -0,0 +1,426 @@
+// src/core/run-state/provider-readback.ts
+//
+// v6 Phase 6 — pluggable provider read-back layer.
+//
+// When the run-state engine resumes a run that has prior `phase.success` +
+// side-effects + persisted `externalRefs`, the replay decision (see
+// `replay-decision.ts`) is NOT pure — it MUST consult the platform of record
+// to confirm the ref is still live and in the expected state. e.g. for a
+// `github-pr` ref we ask `gh pr view <id> --json state` and inspect
+// open / closed / merged. For a `deploy` ref we ask the adapter's `status()`.
+//
+// This file is the seam: a `ProviderReadback` interface, a registry mapping
+// `ExternalRef.kind` to an implementation, and the built-in readbacks for
+// github / vercel / fly / render / supabase. Each readback FAILS CLOSED — any
+// throw or unrecognized response shape is recorded as
+// `existsOnPlatform: false, currentState: 'unknown'`. Callers (the replay
+// decision matrix) treat unknown-state as `needs-human` so we never quietly
+// overwrite or duplicate a side effect on a missing/stale ref.
+//
+// Spec: docs/specs/v6-run-state-engine.md "Idempotency rules + external
+// operation ledger (Codex CRITICAL #2)" — replay decision is "persisted refs
+// + a provider read-back check (e.g., 'is PR #123 still open?')".
+import { runSafe } from "../shell.js";
+// ---------------------------------------------------------------------------
+// Wrapping helper — guarantees the fail-closed contract regardless of impl.
+// ---------------------------------------------------------------------------
+/** Wrap a readback so that any throw collapses to the unknown-state result.
+ *  All built-in readbacks below opt into this; external implementations are
+ *  free to use it too. Centralizes the fail-closed invariant. */
+function failClosed(name, ref, fn) {
+    return fn().catch(() => unknownResult(ref, { readback: name, threw: true }));
+}
+/** Build a fail-closed result for a ref that the readback couldn't verify. */
+function unknownResult(ref, metadata) {
+    return {
+        refKind: ref.kind,
+        refId: ref.id,
+        existsOnPlatform: false,
+        currentState: 'unknown',
+        ...(metadata ? { metadata } : {}),
+    };
+}
+const defaultGhRunner = (args) => runSafe('gh', args, { timeout: 30000 });
+export function makeGithubReadback(opts = {}) {
+    const gh = opts.gh ?? defaultGhRunner;
+    return {
+        name: 'github',
+        handles: ['github-pr', 'github-comment', 'git-remote-push'],
+        verifyRef: (ref) => failClosed('github', ref, async () => {
+            if (ref.kind === 'github-pr')
+                return verifyGithubPr(gh, ref);
+            if (ref.kind === 'github-comment')
+                return verifyGithubComment(gh, ref);
+            if (ref.kind === 'git-remote-push')
+                return verifyGitRemotePush(gh, ref);
+            return unknownResult(ref, { readback: 'github', reason: 'unsupported-kind' });
+        }),
+    };
+}
+async function verifyGithubPr(gh, ref) {
+    // `gh pr view <id> --json state,url,title,merged` — single deterministic
+    // call. PR ID may be a bare number ("99") or a full URL.
+    const out = gh(['pr', 'view', ref.id, '--json', 'state,url,title,merged']);
+    if (out === null)
+        return unknownResult(ref, { readback: 'github-pr', reason: 'gh-cli-failed' });
+    let parsed;
+    try {
+        parsed = JSON.parse(out);
+    }
+    catch {
+        return unknownResult(ref, { readback: 'github-pr', reason: 'unparseable-json' });
+    }
+    // Map gh's state vocabulary onto ours. gh returns OPEN | CLOSED | MERGED.
+    // `merged: true` overrides — a closed-merged PR is "merged", not "closed".
+    let currentState;
+    if (parsed.merged === true || parsed.state === 'MERGED')
+        currentState = 'merged';
+    else if (parsed.state === 'OPEN')
+        currentState = 'open';
+    else if (parsed.state === 'CLOSED')
+        currentState = 'closed';
+    else
+        currentState = 'unknown';
+    return {
+        refKind: ref.kind,
+        refId: ref.id,
+        existsOnPlatform: true,
+        currentState,
+        metadata: {
+            readback: 'github-pr',
+            ...(parsed.url ? { url: parsed.url } : {}),
+            ...(parsed.title ? { title: parsed.title } : {}),
+            rawState: parsed.state,
+        },
+    };
+}
+async function verifyGithubComment(gh, ref) {
+    // gh doesn't have a clean per-comment-ID lookup — we use `gh api` against
+    // the issues comments endpoint. Comment IDs are integers; if the ref id is
+    // qualified as `<repo>:<id>` we split, else we rely on cwd's repo context.
+    let endpoint;
+    if (ref.id.includes(':')) {
+        const [repo, commentId] = ref.id.split(':', 2);
+        endpoint = `/repos/${repo}/issues/comments/${commentId}`;
+    }
+    else {
+        endpoint = `/repos/{owner}/{repo}/issues/comments/${ref.id}`;
+    }
+    const out = gh(['api', endpoint]);
+    if (out === null) {
+        // gh api returns non-zero on 404. Treat as does-not-exist (which is
+        // distinct from unknown — a deleted comment is meaningful: replay would
+        // create a new comment, so the prior ref is no longer authoritative).
+        return {
+            refKind: ref.kind,
+            refId: ref.id,
+            existsOnPlatform: false,
+            currentState: 'closed',
+            metadata: { readback: 'github-comment', reason: 'gh-api-failed-or-404' },
+        };
+    }
+    let parsed;
+    try {
+        parsed = JSON.parse(out);
+    }
+    catch {
+        return unknownResult(ref, { readback: 'github-comment', reason: 'unparseable-json' });
+    }
+    return {
+        refKind: ref.kind,
+        refId: ref.id,
+        existsOnPlatform: typeof parsed.id === 'number',
+        currentState: typeof parsed.id === 'number' ? 'open' : 'unknown',
+        metadata: {
+            readback: 'github-comment',
+            ...(parsed.html_url ? { url: parsed.html_url } : {}),
+        },
+    };
+}
+async function verifyGitRemotePush(gh, ref) {
+    // For a git-remote-push ref the id is the commit SHA. We confirm it exists
+    // on the remote by asking gh for the commit. Treat "not found" as
+    // does-not-exist (rebased away), distinct from unknown (auth/network).
+    // gh api format: /repos/{owner}/{repo}/commits/<sha>.
+    const out = gh(['api', `/repos/{owner}/{repo}/commits/${ref.id}`]);
+    if (out === null) {
+        return {
+            refKind: ref.kind,
+            refId: ref.id,
+            existsOnPlatform: false,
+            currentState: 'closed',
+            metadata: { readback: 'git-remote-push', reason: 'gh-api-failed-or-404' },
+        };
+    }
+    let parsed;
+    try {
+        parsed = JSON.parse(out);
+    }
+    catch {
+        return unknownResult(ref, { readback: 'git-remote-push', reason: 'unparseable-json' });
+    }
+    return {
+        refKind: ref.kind,
+        refId: ref.id,
+        existsOnPlatform: typeof parsed.sha === 'string',
+        currentState: typeof parsed.sha === 'string' ? 'live' : 'unknown',
+        metadata: {
+            readback: 'git-remote-push',
+            ...(parsed.html_url ? { url: parsed.html_url } : {}),
+        },
+    };
+}
+// Module-level resolver consulted by the deploy readbacks. While it is null,
+// deploy lookups report 'no-adapter-resolver-registered' (unknown state).
+let deployAdapterResolver = null;
+/** Register a resolver that maps a provider name (e.g. "vercel") to a
+ *  status-fetcher. The CLI wires this from `src/adapters/deploy/index.ts`
+ *  during boot; tests inject mocks directly. Replaces any previously
+ *  registered resolver. */
+export function registerDeployAdapterResolver(resolver) {
+    deployAdapterResolver = resolver;
+}
+/** Reset the registered resolver back to null. Test-only seam. */
+export function __resetDeployAdapterResolver() {
+    deployAdapterResolver = null;
+}
+export function makeDeployReadback(name, providers) {
+    return {
+        name,
+        handles: ['deploy', 'rollback-target'],
+        providers,
+        verifyRef: (ref) => failClosed(name, ref, async () => {
+            const provider = ref.provider ?? null;
+            if (!provider || !providers.includes(provider)) {
+                return unknownResult(ref, {
+                    readback: name,
+                    reason: 'provider-mismatch',
+                    refProvider: provider,
+                });
+            }
+            if (!deployAdapterResolver) {
+                return unknownResult(ref, {
+                    readback: name,
+                    reason: 'no-adapter-resolver-registered',
+                });
+            }
+            const fetcher = deployAdapterResolver(provider);
+            if (!fetcher) {
+                return unknownResult(ref, {
+                    readback: name,
+                    reason: 'adapter-not-resolvable',
+                    provider,
+                });
+            }
+            const r = await fetcher.status({ deployId: ref.id });
+            // Map adapter status → ReadbackState. The adapter contract returns
+            // 'pass'|'fail'|'in-progress'|'fail_rolled_back'|'fail_rollback_failed'.
+            let currentState;
+            switch (r.status) {
+                case 'pass':
+                    currentState = 'live';
+                    break;
+                case 'fail':
+                case 'fail_rollback_failed':
+                    currentState = 'failed';
+                    break;
+                case 'fail_rolled_back':
+                    currentState = 'rolled-back';
+                    break;
+                case 'in-progress':
+                    currentState = 'open';
+                    break;
+                default:
+                    currentState = 'unknown';
+            }
+            return {
+                refKind: ref.kind,
+                refId: ref.id,
+                existsOnPlatform: true,
+                currentState,
+                metadata: {
+                    readback: name,
+                    provider,
+                    rawStatus: r.status,
+                    ...(r.deployUrl ? { deployUrl: r.deployUrl } : {}),
+                },
+            };
+        }),
+    };
+}
+// Module-level fetcher used for `migration-version` refs. While it is null,
+// the supabase readback reports 'no-migration-state-fetcher-registered'.
+let migrationStateFetcher = null;
+/** Register the migration-state fetcher used by the supabase readback.
+ *  CLI boot wires this; tests inject directly. Replaces any previously
+ *  registered fetcher. */
+export function registerMigrationStateFetcher(fetcher) {
+    migrationStateFetcher = fetcher;
+}
+/** Reset the migration-state fetcher back to null. */
+export function __resetMigrationStateFetcher() {
+    migrationStateFetcher = null;
+}
+// Module-level fetcher used for `migration-batch` refs. While it is null,
+// batch verification reports 'no-migration-batch-fetcher-registered'.
+let migrationBatchFetcher = null;
+/** Register the `migration-batch` fetcher. The CLI boot wires this from the
+ *  per-skill adapter; tests inject mocks directly. Replaces any previously
+ *  registered fetcher. */
+export function registerMigrationBatchFetcher(fetcher) {
+    migrationBatchFetcher = fetcher;
+}
+/** Reset the migration-batch fetcher back to null. */
+export function __resetMigrationBatchFetcher() {
+    migrationBatchFetcher = null;
+}
+export function makeSupabaseReadback() {
+    return {
+        name: 'supabase',
+        handles: ['migration-version', 'migration-batch'],
+        verifyRef: (ref) => failClosed('supabase', ref, async () => {
+            if (ref.kind === 'migration-batch')
+                return verifyMigrationBatch(ref);
+            // migration-version
+            if (!migrationStateFetcher) {
+                return unknownResult(ref, {
+                    readback: 'supabase',
+                    reason: 'no-migration-state-fetcher-registered',
+                });
+            }
+            const result = await migrationStateFetcher.fetch(ref.id);
+            if (!result) {
+                return unknownResult(ref, {
+                    readback: 'supabase',
+                    reason: 'migration-state-fetch-failed-or-not-found',
+                });
+            }
+            return {
+                refKind: ref.kind,
+                refId: ref.id,
+                existsOnPlatform: true,
+                currentState: result.applied ? 'live' : 'open',
+                metadata: {
+                    readback: 'supabase',
+                    applied: result.applied,
+                    ...(result.appliedAt ? { appliedAt: result.appliedAt } : {}),
+                },
+            };
+        }),
+    };
+}
+async function verifyMigrationBatch(ref) {
+    if (!migrationBatchFetcher) {
+        return unknownResult(ref, {
+            readback: 'supabase',
+            reason: 'no-migration-batch-fetcher-registered',
+        });
+    }
+    const result = await migrationBatchFetcher.fetch(ref.id);
+    if (!result) {
+        return unknownResult(ref, {
+            readback: 'supabase',
+            reason: 'migration-batch-fetch-failed-or-not-found',
+        });
+    }
+    if (result.planned.length === 0) {
+        // A planned-empty batch is degenerate — no work to verify against. Treat
+        // it as merged (skip-already-applied) rather than unknown so a batch ref
+        // emitted before the dispatcher discovered "nothing to do" doesn't
+        // wedge the resume preflight on needs-human. The post-effect ref set is
+        // also empty in this case, so the orchestrator's "all post-effect refs
+        // merged/live" check naturally short-circuits to skip.
+        return {
+            refKind: ref.kind,
+            refId: ref.id,
+            existsOnPlatform: true,
+            currentState: 'merged',
+            metadata: {
+                readback: 'supabase',
+                plannedCount: 0,
+                appliedCount: 0,
+                erroredCount: 0,
+            },
+        };
+    }
+    let appliedCount = 0;
+    let pendingCount = 0;
+    let erroredCount = 0;
+    for (const item of result.planned) {
+        if (item.state === 'applied')
+            appliedCount++;
+        else if (item.state === 'pending')
+            pendingCount++;
+        else if (item.state === 'errored')
+            erroredCount++;
+    }
+    let currentState;
+    if (erroredCount > 0)
+        currentState = 'failed';
+    else if (pendingCount === 0)
+        currentState = 'merged';
+    else
+        currentState = 'open';
+    return {
+        refKind: ref.kind,
+        refId: ref.id,
+        existsOnPlatform: true,
+        currentState,
+        metadata: {
+            readback: 'supabase',
+            plannedCount: result.planned.length,
+            appliedCount,
+            pendingCount,
+            erroredCount,
+        },
+    };
+}
+// ---------------------------------------------------------------------------
+// Registry — first-match-wins lookup keyed on ExternalRefKind.
+// ---------------------------------------------------------------------------
+/** Default built-in registry. Order matters: first readback whose `handles`
+ *  contains the ref kind wins. Callers may swap individual entries via
+ *  `setProviderReadbacks` (test-only seam). */
+function buildDefaultRegistry() {
+    return [
+        makeGithubReadback(),
+        makeDeployReadback('vercel', ['vercel']),
+        makeDeployReadback('fly', ['fly']),
+        makeDeployReadback('render', ['render']),
+        makeSupabaseReadback(),
+    ];
+}
+let providerReadbacks = buildDefaultRegistry();
+/** Live registry — exposed as a getter so tests / callers can introspect. */
+export function getProviderReadbacks() {
+    return providerReadbacks;
+}
+/** Replace the registry (test seam). Pass null to reset to defaults. */
+export function setProviderReadbacks(list) {
+    providerReadbacks = list === null ? buildDefaultRegistry() : list;
+}
+/** Look up the readback that handles a given ref. Two-pass match: first try
+ *  a strict (kind + provider) match so multiple readbacks sharing a kind
+ *  (vercel/fly/render all on `deploy`) don't shadow each other; then fall
+ *  back to a kind-only match for readbacks that don't declare a provider
+ *  allowlist (e.g. the github readback handles `github-pr` regardless of
+ *  ref.provider). Returns null if no registered readback claims this ref —
+ *  caller treats null as "no readback available, route to needs-human".
+ *
+ *  Bugbot MEDIUM (PR #91): without provider-aware matching, the first deploy
+ *  readback registered (vercel) won every `deploy`/`rollback-target` lookup
+ *  and the fly/render readbacks were dead code. */
+export function readbackForRef(ref) {
+    if (ref.provider) {
+        for (const rb of providerReadbacks) {
+            if (rb.handles.includes(ref.kind) && rb.providers?.includes(ref.provider))
+                return rb;
+        }
+    }
+    for (const rb of providerReadbacks) {
+        if (rb.handles.includes(ref.kind) && !rb.providers)
+            return rb;
+    }
+    return null;
+}
+/** Verify a list of refs in parallel. Returns one ReadbackResult per ref.
+ *  Refs without a registered readback get an unknown-state result so the
+ *  decision matrix can attribute the gap. Order is preserved. */
+export async function verifyRefs(refs) {
+    return Promise.all(refs.map(async (ref) => {
+        const rb = readbackForRef(ref);
+        if (!rb)
+            return unknownResult(ref, { reason: 'no-readback-registered' });
+        return rb.verifyRef(ref);
+    }));
+}
+//# sourceMappingURL=provider-readback.js.map

package/dist/src/core/run-state/replay-decision.d.ts ADDED Viewed

@@ -0,0 +1,69 @@
+import type { ExternalRef } from './types.ts';
+import type { ReadbackResult } from './provider-readback.ts';
+/** Decision the engine should take when replaying / resuming a phase.
+ *  NOTE(review): the `decideReplay` implementation shipped alongside this
+ *  declaration returns only 'retry', 'skip-already-applied' and
+ *  'needs-human'; 'abort' is presumably produced by another caller —
+ *  confirm. */
+export type ReplayDecisionKind =
+/** Run the phase body. Default for fresh attempts and post-failure retries. */
+'retry'
+/** Don't run; treat as already-done. Engine returns prior output / snapshot. */
+ | 'skip-already-applied'
+/** Don't run; can't safely decide. Engine emits phase.needs-human + throws. */
+ | 'needs-human'
+/** Don't run; explicit user/CI signal to give up. Engine throws abort code. */
+ | 'abort';
+/** Result of a replay decision: the decision itself plus the evidence
+ *  (refs and readbacks) it was based on. */
+export interface ReplayDecision {
+    decision: ReplayDecisionKind;
+    /** Single-line human-readable explanation. Embedded into needs-human events
+     *  and surfaced in `runs resume` output. */
+    reason: string;
+    /** External refs the decision considered. Echoed back so CI/humans can
+     *  inspect them without re-reading the events log. */
+    refsConsulted: ExternalRef[];
+    /** Per-ref readback results. Empty array when the decision was made
+     *  without consulting readbacks (e.g. retry on no-prior-success). */
+    readbacksConsulted: ReadbackResult[];
+}
+/** Inputs to `decideReplay`. Every field except the presentation-only
+ *  `priorAttempts` is required so callers can't accidentally drop a signal.
+ *  Keep in lockstep with runPhase's gating logic. */
+export interface ReplayDecisionInput {
+    /** Phase name — for the reason string only; no behavior depends on it. */
+    phaseName: string;
+    /** True iff prior `phase.success` event exists for this phaseIdx. */
+    hasPriorSuccess: boolean;
+    /** Total attempts recorded in state.json for this phaseIdx (failed +
+     *  succeeded). Used only for the `reason` string when there's no prior
+     *  success but priorAttempts > 0 — distinguishes "first attempt" from
+     *  "post-failure retry" so users running `runs resume` get an accurate
+     *  description. No behavior depends on this; it's a presentation field.
+     *  Optional; treated as 0 when omitted (Bugbot LOW PR #91 fold-in). */
+    priorAttempts?: number;
+    /** Mirrors RunPhase.idempotent declared at registration. */
+    idempotent: boolean;
+    /** Mirrors RunPhase.hasSideEffects declared at registration. */
+    hasSideEffects: boolean;
+    /** All externalRefs persisted for this phaseIdx across prior attempts. */
+    externalRefs: ExternalRef[];
+    /** Readback results, one per externalRef in the same order. May be empty
+     *  when the caller is doing pure-state lookup (CLI `runs resume`) — in
+     *  that case any side-effect-phase prior success collapses to needs-human
+     *  because we have no live confirmation. */
+    readbacks: ReadbackResult[];
+    /** When true the user/CI explicitly asked to override needs-human. The
+     *  engine emits a `replay.override` event; this function flips the
+     *  decision to retry regardless of state. */
+    forceReplay: boolean;
+}
+/** Decide what to do with a (re-)attempt of a phase. Pure; safe to call
+ *  during CLI lookup AND inside runPhase. The decision matrix mirrors the
+ *  spec's per-phase replay table:
+ *
+ *    | prior success | idempotent | sideEffects | refs       | readback all valid | -> decision |
+ *    | no            | -          | -           | -          | -                  | retry       |
+ *    | yes           | yes        | -           | -          | -                  | skip        |
+ *    | yes           | no         | no          | -          | -                  | skip        |
+ *    | yes           | no         | yes         | empty      | -                  | needs-human |
+ *    | yes           | no         | yes         | non-empty  | none supplied      | needs-human |
+ *    | yes           | no         | yes         | non-empty  | all valid          | skip        |
+ *    | yes           | no         | yes         | non-empty  | any missing/stale  | needs-human |
+ *
+ *  "skip" is the `skip-already-applied` decision.
+ *  forceReplay = true overrides everything → retry. */
+export declare function decideReplay(input: ReplayDecisionInput): ReplayDecision;
+//# sourceMappingURL=replay-decision.d.ts.map

package/dist/src/core/run-state/replay-decision.js ADDED Viewed

@@ -0,0 +1,144 @@
+// src/core/run-state/replay-decision.ts
+//
+// v6 Phase 6 — pure decision function for "should this phase replay?".
+//
+// Inputs are the persisted facts of a prior phase attempt (success count,
+// idempotent / hasSideEffects declarations, externalRefs) plus the live
+// readback results from `provider-readback.ts`. Output is one of four
+// decisions, plus the refs + readbacks the decision was based on so callers
+// can surface them in `phase.needs-human` events for human triage.
+//
+// This file is deliberately pure: it does NOT execute readbacks itself
+// (caller passes them in), it does NOT consult disk, it does NOT throw on
+// any input shape. Easy to unit-test exhaustively against the spec's
+// per-phase replay table.
+//
+// Spec: docs/specs/v6-run-state-engine.md "Idempotency rules + external
+// operation ledger (Codex CRITICAL #2)" — the replay matrix.
+/** Decide what to do with a (re-)attempt of a phase. Pure; safe to call
+ *  during CLI lookup AND inside runPhase. The decision matrix mirrors the
+ *  spec's per-phase replay table:
+ *
+ *    | prior success | idempotent | sideEffects | refs       | readback all valid | -> decision |
+ *    | no            | -          | -           | -          | -                  | retry       |
+ *    | yes           | yes        | -           | -          | -                  | skip        |
+ *    | yes           | no         | no          | -          | -                  | skip        |
+ *    | yes           | no         | yes         | empty      | -                  | needs-human |
+ *    | yes           | no         | yes         | non-empty  | all valid          | skip        |
+ *    | yes           | no         | yes         | non-empty  | any missing/stale  | needs-human |
+ *
+ *  forceReplay = true overrides everything → retry. */
+export function decideReplay(input) {
+    const refsConsulted = [...input.externalRefs];
+    const readbacksConsulted = [...input.readbacks];
+    // Override path — caller already gated this on user/CI consent. Engine
+    // emits replay.override on this branch.
+    if (input.forceReplay) {
+        return {
+            decision: 'retry',
+            reason: `forceReplay override: ${input.phaseName} will re-execute despite prior state`,
+            refsConsulted,
+            readbacksConsulted,
+        };
+    }
+    // No prior success → fresh attempt or post-failure retry. Always safe.
+    if (!input.hasPriorSuccess) {
+        const priorAttempts = input.priorAttempts ?? 0;
+        const reason = priorAttempts > 0
+            ? `${input.phaseName} previous attempt(s) failed (${priorAttempts}) — retry safe`
+            : `${input.phaseName} has no prior success — first attempt`;
+        return {
+            decision: 'retry',
+            reason,
+            refsConsulted,
+            readbacksConsulted: [],
+        };
+    }
+    // Prior success + declared idempotent → safe to short-circuit. The phase
+    // contract promises the prior output is durable / retrievable.
+    if (input.idempotent) {
+        return {
+            decision: 'skip-already-applied',
+            reason: `${input.phaseName} previously succeeded and is idempotent — replay short-circuits`,
+            refsConsulted,
+            readbacksConsulted: [],
+        };
+    }
+    // Prior success + no side effects → still safe to skip. The phase
+    // produced no observable platform state; replay would just re-do the
+    // identical no-side-effect work.
+    if (!input.hasSideEffects) {
+        return {
+            decision: 'skip-already-applied',
+            reason: `${input.phaseName} previously succeeded with no side effects — skip-already-applied`,
+            refsConsulted,
+            readbacksConsulted: [],
+        };
+    }
+    // Prior success + side effects + no refs → we can't reach the platform of
+    // record to confirm anything. Bubble to a human; the spec is explicit
+    // that missing refs always route to needs-human.
+    if (input.externalRefs.length === 0) {
+        return {
+            decision: 'needs-human',
+            reason: `${input.phaseName} previously succeeded with side effects but recorded no externalRefs — cannot verify, needs human review`,
+            refsConsulted,
+            readbacksConsulted: [],
+        };
+    }
+    // Prior success + side effects + refs but no readbacks supplied (CLI
+    // lookup mode): we must NOT silently skip. Surface as needs-human so the
+    // CLI prediction matches what runPhase will do under live conditions.
+    if (input.readbacks.length === 0) {
+        return {
+            decision: 'needs-human',
+            reason: `${input.phaseName} previously succeeded with side effects; no live readback was performed — needs human review (or pass --force-replay)`,
+            refsConsulted,
+            readbacksConsulted: [],
+        };
+    }
+    // Refs + readbacks both present — adjudicate per readback validity.
+    const stale = readbacksConsulted.filter(rb => !isReadbackValid(rb));
+    if (stale.length > 0) {
+        const summary = stale
+            .map(rb => `${rb.refKind}=${rb.refId} state=${rb.currentState}`)
+            .join(', ');
+        return {
+            decision: 'needs-human',
+            reason: `${input.phaseName} previously succeeded but ${stale.length} ref(s) are stale or missing on the platform: ${summary}`,
+            refsConsulted,
+            readbacksConsulted,
+        };
+    }
+    return {
+        decision: 'skip-already-applied',
+        reason: `${input.phaseName} previously succeeded; all ${readbacksConsulted.length} platform ref(s) verified live — skip-already-applied`,
+        refsConsulted,
+        readbacksConsulted,
+    };
+}
+/** A readback is "valid" — i.e. authorizes a skip-already-applied — when the
+ *  platform confirms the ref still exists AND its current state is one of
+ *  the "still represents the prior side effect" set. The deny-set:
+ *  - 'closed' / 'rolled-back' / 'failed' → side effect was reverted;
+ *    replaying would create a new artifact.
+ *  - 'unknown' → fail-closed; we can't make a confident assertion.
+ *  Anything else (open / merged / live) is treated as "ref still represents
+ *  the prior side effect" — replay would be a duplicate. */
+function isReadbackValid(rb) {
+    if (!rb.existsOnPlatform)
+        return false;
+    switch (rb.currentState) {
+        case 'open':
+        case 'merged':
+        case 'live':
+            return true;
+        case 'closed':
+        case 'rolled-back':
+        case 'failed':
+        case 'unknown':
+        default:
+            return false;
+    }
+}
+//# sourceMappingURL=replay-decision.js.map