npm - @delegance/claude-autopilot - Versions diffs - 5.5.2 → 7.2.0 - Mend

@delegance/claude-autopilot 5.5.2 → 7.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (150) hide show

package/CHANGELOG.md +1776 -6
package/README.md +65 -1
package/bin/_launcher.js +38 -23
package/dist/src/adapters/council/openai.js +12 -6
package/dist/src/adapters/deploy/_http.d.ts +43 -0
package/dist/src/adapters/deploy/_http.js +99 -0
package/dist/src/adapters/deploy/fly.d.ts +206 -0
package/dist/src/adapters/deploy/fly.js +696 -0
package/dist/src/adapters/deploy/index.d.ts +2 -0
package/dist/src/adapters/deploy/index.js +33 -0
package/dist/src/adapters/deploy/render.d.ts +181 -0
package/dist/src/adapters/deploy/render.js +550 -0
package/dist/src/adapters/deploy/types.d.ts +67 -3
package/dist/src/adapters/deploy/vercel.d.ts +17 -1
package/dist/src/adapters/deploy/vercel.js +29 -49
package/dist/src/adapters/pricing.d.ts +36 -0
package/dist/src/adapters/pricing.js +40 -0
package/dist/src/adapters/review-engine/codex.js +10 -7
package/dist/src/cli/autopilot.d.ts +75 -0
package/dist/src/cli/autopilot.js +750 -0
package/dist/src/cli/brainstorm.d.ts +23 -0
package/dist/src/cli/brainstorm.js +131 -0
package/dist/src/cli/costs.d.ts +15 -1
package/dist/src/cli/costs.js +99 -10
package/dist/src/cli/dashboard/index.d.ts +5 -0
package/dist/src/cli/dashboard/index.js +49 -0
package/dist/src/cli/dashboard/login.d.ts +22 -0
package/dist/src/cli/dashboard/login.js +260 -0
package/dist/src/cli/dashboard/logout.d.ts +12 -0
package/dist/src/cli/dashboard/logout.js +45 -0
package/dist/src/cli/dashboard/status.d.ts +30 -0
package/dist/src/cli/dashboard/status.js +65 -0
package/dist/src/cli/dashboard/upload.d.ts +16 -0
package/dist/src/cli/dashboard/upload.js +48 -0
package/dist/src/cli/deploy.d.ts +3 -3
package/dist/src/cli/deploy.js +34 -9
package/dist/src/cli/engine-flag-deprecation.d.ts +14 -0
package/dist/src/cli/engine-flag-deprecation.js +20 -0
package/dist/src/cli/fix.d.ts +18 -0
package/dist/src/cli/fix.js +105 -11
package/dist/src/cli/help-text.d.ts +52 -0
package/dist/src/cli/help-text.js +416 -0
package/dist/src/cli/implement.d.ts +91 -0
package/dist/src/cli/implement.js +196 -0
package/dist/src/cli/index.d.ts +2 -1
package/dist/src/cli/index.js +774 -245
package/dist/src/cli/json-envelope.d.ts +187 -0
package/dist/src/cli/json-envelope.js +270 -0
package/dist/src/cli/json-mode.d.ts +33 -0
package/dist/src/cli/json-mode.js +201 -0
package/dist/src/cli/migrate.d.ts +111 -0
package/dist/src/cli/migrate.js +305 -0
package/dist/src/cli/plan.d.ts +81 -0
package/dist/src/cli/plan.js +149 -0
package/dist/src/cli/pr.d.ts +106 -0
package/dist/src/cli/pr.js +191 -19
package/dist/src/cli/preflight.js +26 -0
package/dist/src/cli/review.d.ts +27 -0
package/dist/src/cli/review.js +126 -0
package/dist/src/cli/runs-watch-renderer.d.ts +45 -0
package/dist/src/cli/runs-watch-renderer.js +275 -0
package/dist/src/cli/runs-watch.d.ts +41 -0
package/dist/src/cli/runs-watch.js +395 -0
package/dist/src/cli/runs.d.ts +122 -0
package/dist/src/cli/runs.js +902 -0
package/dist/src/cli/scaffold.d.ts +39 -0
package/dist/src/cli/scaffold.js +287 -0
package/dist/src/cli/scan.d.ts +93 -0
package/dist/src/cli/scan.js +166 -40
package/dist/src/cli/setup.d.ts +30 -0
package/dist/src/cli/setup.js +137 -0
package/dist/src/cli/spec.d.ts +66 -0
package/dist/src/cli/spec.js +132 -0
package/dist/src/cli/validate.d.ts +29 -0
package/dist/src/cli/validate.js +131 -0
package/dist/src/core/config/schema.d.ts +9 -0
package/dist/src/core/config/schema.js +7 -0
package/dist/src/core/config/types.d.ts +11 -0
package/dist/src/core/council/runner.d.ts +10 -1
package/dist/src/core/council/runner.js +25 -3
package/dist/src/core/council/types.d.ts +7 -0
package/dist/src/core/errors.d.ts +1 -1
package/dist/src/core/errors.js +11 -0
package/dist/src/core/logging/redaction.d.ts +13 -0
package/dist/src/core/logging/redaction.js +20 -0
package/dist/src/core/migrate/schema-validator.js +15 -1
package/dist/src/core/phases/static-rules.d.ts +5 -1
package/dist/src/core/phases/static-rules.js +2 -5
package/dist/src/core/run-state/budget.d.ts +88 -0
package/dist/src/core/run-state/budget.js +141 -0
package/dist/src/core/run-state/cli-internal.d.ts +21 -0
package/dist/src/core/run-state/cli-internal.js +174 -0
package/dist/src/core/run-state/events.d.ts +59 -0
package/dist/src/core/run-state/events.js +512 -0
package/dist/src/core/run-state/lock.d.ts +61 -0
package/dist/src/core/run-state/lock.js +206 -0
package/dist/src/core/run-state/phase-context.d.ts +60 -0
package/dist/src/core/run-state/phase-context.js +108 -0
package/dist/src/core/run-state/phase-registry.d.ts +137 -0
package/dist/src/core/run-state/phase-registry.js +162 -0
package/dist/src/core/run-state/phase-runner.d.ts +80 -0
package/dist/src/core/run-state/phase-runner.js +447 -0
package/dist/src/core/run-state/provider-readback.d.ts +130 -0
package/dist/src/core/run-state/provider-readback.js +426 -0
package/dist/src/core/run-state/replay-decision.d.ts +69 -0
package/dist/src/core/run-state/replay-decision.js +144 -0
package/dist/src/core/run-state/resolve-engine.d.ts +45 -0
package/dist/src/core/run-state/resolve-engine.js +74 -0
package/dist/src/core/run-state/resume-preflight.d.ts +66 -0
package/dist/src/core/run-state/resume-preflight.js +116 -0
package/dist/src/core/run-state/run-phase-with-lifecycle.d.ts +69 -0
package/dist/src/core/run-state/run-phase-with-lifecycle.js +193 -0
package/dist/src/core/run-state/runs.d.ts +57 -0
package/dist/src/core/run-state/runs.js +288 -0
package/dist/src/core/run-state/snapshot.d.ts +14 -0
package/dist/src/core/run-state/snapshot.js +114 -0
package/dist/src/core/run-state/state.d.ts +40 -0
package/dist/src/core/run-state/state.js +164 -0
package/dist/src/core/run-state/types.d.ts +284 -0
package/dist/src/core/run-state/types.js +19 -0
package/dist/src/core/run-state/ulid.d.ts +11 -0
package/dist/src/core/run-state/ulid.js +95 -0
package/dist/src/core/schema-alignment/extractor/index.d.ts +1 -1
package/dist/src/core/schema-alignment/extractor/index.js +2 -2
package/dist/src/core/schema-alignment/extractor/prisma.d.ts +13 -1
package/dist/src/core/schema-alignment/extractor/prisma.js +65 -10
package/dist/src/core/schema-alignment/git-history.d.ts +19 -0
package/dist/src/core/schema-alignment/git-history.js +53 -0
package/dist/src/core/static-rules/rules/brand-tokens.js +2 -2
package/dist/src/core/static-rules/rules/schema-alignment.js +14 -4
package/dist/src/dashboard/auto-upload.d.ts +26 -0
package/dist/src/dashboard/auto-upload.js +107 -0
package/dist/src/dashboard/config.d.ts +22 -0
package/dist/src/dashboard/config.js +109 -0
package/dist/src/dashboard/upload/canonical.d.ts +3 -0
package/dist/src/dashboard/upload/canonical.js +16 -0
package/dist/src/dashboard/upload/chain.d.ts +9 -0
package/dist/src/dashboard/upload/chain.js +27 -0
package/dist/src/dashboard/upload/snapshot.d.ts +23 -0
package/dist/src/dashboard/upload/snapshot.js +66 -0
package/dist/src/dashboard/upload/uploader.d.ts +54 -0
package/dist/src/dashboard/upload/uploader.js +330 -0
package/package.json +19 -3
package/scripts/autoregress.ts +1 -1
package/scripts/test-runner.mjs +4 -0
package/skills/claude-autopilot.md +1 -1
package/skills/make-interfaces-feel-better/SKILL.md +104 -0
package/skills/simplify-ui/SKILL.md +103 -0
package/skills/ui/SKILL.md +117 -0
package/skills/ui-ux-pro-max/SKILL.md +90 -0

package/dist/src/cli/scan.js CHANGED Viewed

@@ -8,6 +8,8 @@ import { loadIgnoreRules, parseConfigIgnore, applyIgnoreRules } from "../core/ig
 import { saveCachedFindings } from "../core/persist/findings-cache.js";
 import { appendCostLog } from "../core/persist/cost-log.js";
 import { detectLLMKey, LLM_KEY_HINTS } from "../core/detect/llm-key.js";
+import { resolveEngineEnabled } from "../core/run-state/resolve-engine.js";
+import { runPhaseWithLifecycle } from "../core/run-state/run-phase-with-lifecycle.js";
 const C = {
     reset: '\x1b[0m', bold: '\x1b[1m', dim: '\x1b[2m',
     green: '\x1b[32m', yellow: '\x1b[33m', red: '\x1b[31m', cyan: '\x1b[36m',
@@ -50,7 +52,17 @@ function collectFiles(target, cwd) {
 function collectAllFiles(cwd) {
     return collectFiles(cwd, cwd);
 }
-export async function runScan(options = {}) {
+/**
+ * v6.2.0 — extract the `RunPhase<ScanInput, ScanOutput>` construction out of
+ * `runScan(options)` so the new top-level `autopilot` orchestrator can drive
+ * `runPhase` itself with a shared `phaseIdx` against the same run dir.
+ *
+ * The legacy `runScan(options)` keeps calling this builder internally (then
+ * `runPhaseWithLifecycle` for single-phase runs) so direct CLI behavior is
+ * byte-for-byte identical to v6.1. Parity is asserted by
+ * `tests/cli/scan-builder-parity.test.ts`.
+ */
+export async function buildScanPhase(options) {
     const cwd = options.cwd ?? process.cwd();
     const configPath = options.configPath ?? path.join(cwd, 'guardrail.config.yaml');
     let config = { configVersion: 1 };
@@ -73,46 +85,52 @@ export async function runScan(options = {}) {
         console.error(fmt('dim', '    guardrail scan src/auth/'));
         console.error(fmt('dim', '    guardrail scan --all'));
         console.error(fmt('dim', '    guardrail scan --ask "is there SQL injection?" src/db/'));
-        return 1;
+        return { kind: 'early-exit', exitCode: 1 };
     }
     // Deduplicate
     files = [...new Set(files)];
     if (files.length === 0) {
         console.log(fmt('yellow', '[scan] No code files found at the specified path(s)'));
-        return 0;
+        return { kind: 'early-exit', exitCode: 0 };
     }
     if (options.dryRun) {
         console.log(fmt('bold', `[scan] Would scan ${files.length} file(s):`));
         for (const f of files)
             console.log(fmt('dim', `  ${path.relative(cwd, f)}`));
-        return 0;
+        return { kind: 'early-exit', exitCode: 0 };
     }
     // Auto-detect stack if not in config
     if (!config.stack) {
         config = { ...config, stack: detectStack(cwd) ?? undefined };
     }
     // Build review engine
-    if (!detectLLMKey().hasKey) {
-        console.error(fmt('red', '[scan] No LLM API key — set one of:'));
-        for (const { name, url, note } of LLM_KEY_HINTS) {
-            const suffix = note ? `  (${note})` : '';
-            console.error(fmt('dim', `         ${name.padEnd(18)} ${url}${suffix}`));
-        }
-        return 1;
-    }
-    const engineRef = typeof config.reviewEngine === 'string' ? config.reviewEngine
-        : (config.reviewEngine?.adapter ?? 'auto');
     let engine;
-    try {
-        engine = await loadAdapter({
-            point: 'review-engine',
-            ref: engineRef,
-            options: typeof config.reviewEngine === 'object' ? config.reviewEngine.options : undefined,
-        });
+    if (options.__testReviewEngine) {
+        // Test-only fast path — skip the LLM key check and the adapter loader.
+        engine = options.__testReviewEngine;
     }
-    catch (err) {
-        console.error(fmt('red', `[scan] Could not load review engine: ${err instanceof Error ? err.message : String(err)}`));
-        return 1;
+    else {
+        if (!detectLLMKey().hasKey) {
+            console.error(fmt('red', '[scan] No LLM API key — set one of:'));
+            for (const { name, url, note } of LLM_KEY_HINTS) {
+                const suffix = note ? `  (${note})` : '';
+                console.error(fmt('dim', `         ${name.padEnd(18)} ${url}${suffix}`));
+            }
+            return { kind: 'early-exit', exitCode: 1 };
+        }
+        const engineRef = typeof config.reviewEngine === 'string' ? config.reviewEngine
+            : (config.reviewEngine?.adapter ?? 'auto');
+        try {
+            engine = await loadAdapter({
+                point: 'review-engine',
+                ref: engineRef,
+                options: typeof config.reviewEngine === 'object' ? config.reviewEngine.options : undefined,
+            });
+        }
+        catch (err) {
+            console.error(fmt('red', `[scan] Could not load review engine: ${err instanceof Error ? err.message : String(err)}`));
+            return { kind: 'early-exit', exitCode: 1 };
+        }
     }
     const focusLabel = options.focus && options.focus !== 'all' ? options.focus : null;
     const relFiles = files.map(f => path.relative(cwd, f));
@@ -123,9 +141,94 @@ export async function runScan(options = {}) {
         console.log(fmt('dim', `  question: ${options.ask}`));
     if (focusLabel)
         console.log(fmt('dim', `  focus: ${focusLabel}`));
+    // Pre-flight resolution just for the banner; the helper re-resolves
+    // internally with identical precedence so the engine path stays
+    // deterministic. Keeping this inline preserves the legacy "engine: on
+    // (<source>)" banner that scan emitted before v6.0.6.
+    const engineBanner = resolveEngineEnabled({
+        ...(options.cliEngine !== undefined ? { cliEngine: options.cliEngine } : {}),
+        ...(options.envEngine !== undefined ? { envValue: options.envEngine } : {}),
+        ...(typeof config.engine?.enabled === 'boolean' ? { configEnabled: config.engine.enabled } : {}),
+    });
+    if (engineBanner.enabled) {
+        console.log(fmt('dim', `  engine: on (${engineBanner.source})`));
+    }
     console.log('');
     // Build a focused git summary / prompt context
     const focusHint = buildFocusHint(options.ask, focusLabel);
+    const scanInput = {
+        files,
+        relFiles,
+        cwd,
+        config,
+        engine,
+        focusHint,
+        ...(options.ask !== undefined ? { ask: options.ask } : {}),
+        focusLabel,
+        all: options.all === true,
+    };
+    // The wrapped phase body — pure call-the-LLM-and-process-findings work.
+    // Extracted into a RunPhase so the engine path and the legacy path share
+    // the exact same logic. Engine-off callers invoke this directly via
+    // `executeScanPhase()`; engine-on callers route through `runPhase()`.
+    const phase = {
+        name: 'scan',
+        // scan re-issues identical LLM queries against the same code — re-running
+        // is safe and cheap-ish to retry.
+        idempotent: true,
+        // No git push, no PR comment, no provider-side mutation. The cost-log
+        // append + findings-cache write are local file IO that's already
+        // overwrite-style; replays are safe.
+        hasSideEffects: false,
+        run: executeScanPhase,
+    };
+    return {
+        kind: 'phase',
+        phase,
+        input: scanInput,
+        config,
+        renderResult: (output) => renderScanOutput(output, scanInput),
+    };
+}
+export async function runScan(options = {}) {
+    const built = await buildScanPhase(options);
+    if (built.kind === 'early-exit')
+        return built.exitCode;
+    const { phase, input, config, renderResult } = built;
+    // v6.0.6 — lifecycle wiring (createRun → runPhase → run.complete + state
+    // snapshot + lock release) lives in `runPhaseWithLifecycle`. The helper
+    // owns the engine-on/engine-off branch and the failure banner; the caller
+    // just supplies the phase, the input, and the engine-off escape hatch.
+    let output;
+    try {
+        const result = await runPhaseWithLifecycle({
+            cwd: input.cwd,
+            phase,
+            input,
+            config,
+            cliEngine: options.cliEngine,
+            envEngine: options.envEngine,
+            runEngineOff: () => executeScanPhase(input),
+        });
+        output = result.output;
+    }
+    catch {
+        // Helper already printed the failure banner + emitted run.complete
+        // failed + refreshed state.json + released the lock. Surface the
+        // legacy non-zero exit so existing CI / scripts are unaffected.
+        return 1;
+    }
+    return renderResult(output);
+}
+// ---------------------------------------------------------------------------
+// Phase body — the LLM call + finding processing + cost-log append + findings
+// cache write. Extracted from runScan so the engine-on path can wrap it via
+// `runPhase` and the engine-off path can call it directly. Returns a
+// JSON-serializable ScanOutput so the engine can persist it as `result` on
+// the phase snapshot.
+// ---------------------------------------------------------------------------
+async function executeScanPhase(input) {
+    const { files, relFiles, cwd, config, engine, focusHint, ask } = input;
     const result = await runReviewPhase({
         touchedFiles: relFiles,
         engine,
@@ -149,11 +252,47 @@ export async function runScan(options = {}) {
     // Apply ignore rules
     const ignoreRules = [...loadIgnoreRules(cwd), ...parseConfigIgnore(config.ignore)];
     const findings = applyIgnoreRules(result.findings, ignoreRules);
+    // Persist findings so `guardrail fix` can read them
+    saveCachedFindings(cwd, findings);
+    // Persist run to cost log so `claude-autopilot costs` reflects scans, not
+    // just full pipeline runs. Previously scan never wrote to the log, so the
+    // costs report stayed frozen at whatever the last `run` invocation produced.
+    appendCostLog(cwd, {
+        timestamp: new Date().toISOString(),
+        files: files.length,
+        inputTokens: result.usage?.input ?? 0,
+        outputTokens: result.usage?.output ?? 0,
+        costUSD: result.costUSD ?? 0,
+        durationMs: result.durationMs,
+    });
+    return {
+        fileCount: files.length,
+        findings: findings.map(f => ({
+            severity: f.severity,
+            message: f.message,
+            ...(f.file !== undefined ? { file: f.file } : {}),
+            ...(f.line !== undefined ? { line: f.line } : {}),
+            ...(f.suggestion !== undefined ? { suggestion: f.suggestion } : {}),
+        })),
+        ...(result.costUSD !== undefined ? { costUSD: result.costUSD } : {}),
+        durationMs: result.durationMs,
+        ...(result.rawOutputs !== undefined ? { rawOutputs: result.rawOutputs } : {}),
+    };
+}
+// ---------------------------------------------------------------------------
+// Render — translate ScanOutput back to the legacy stdout banner + exit code.
+// Lives outside the wrapped phase because it's pure presentation; doing the
+// rendering inside the phase would couple the engine path's idempotency to
+// console output, which we don't want.
+// ---------------------------------------------------------------------------
+function renderScanOutput(output, input) {
+    const { findings, costUSD, durationMs, rawOutputs } = output;
+    const { ask } = input;
     // Print results
-    if (findings.length === 0 && options.ask && result.rawOutputs && result.rawOutputs.length > 0) {
+    if (findings.length === 0 && ask && rawOutputs && rawOutputs.length > 0) {
         // --ask returned prose rather than structured findings — surface raw response
         console.log(fmt('cyan', `Answer:`));
-        for (const raw of result.rawOutputs) {
+        for (const raw of rawOutputs) {
             // Strip markdown fences and the ## Findings / ## Review Summary headers if present
             const cleaned = raw.replace(/^##\s+Review Summary\s*\n/gm, '').replace(/^##\s+Findings\s*\n/gm, '').trim();
             console.log(cleaned);
@@ -196,21 +335,8 @@ export async function runScan(options = {}) {
             console.log('');
         }
     }
-    // Persist findings so `guardrail fix` can read them
-    saveCachedFindings(cwd, findings);
-    // Persist run to cost log so `claude-autopilot costs` reflects scans, not
-    // just full pipeline runs. Previously scan never wrote to the log, so the
-    // costs report stayed frozen at whatever the last `run` invocation produced.
-    appendCostLog(cwd, {
-        timestamp: new Date().toISOString(),
-        files: files.length,
-        inputTokens: result.usage?.input ?? 0,
-        outputTokens: result.usage?.output ?? 0,
-        costUSD: result.costUSD ?? 0,
-        durationMs: result.durationMs,
-    });
-    if (result.costUSD !== undefined) {
-        console.log(fmt('dim', `  $${result.costUSD.toFixed(4)} · ${result.durationMs}ms`));
+    if (costUSD !== undefined) {
+        console.log(fmt('dim', `  $${costUSD.toFixed(4)} · ${durationMs}ms`));
     }
     const fixable = findings.filter(f => f.severity === 'critical' || f.severity === 'warning');
     if (fixable.length > 0) {

package/dist/src/cli/setup.d.ts CHANGED Viewed

@@ -1,3 +1,4 @@
+import { type DetectionResult } from './detector.ts';
 export type ProfileName = 'security-strict' | 'team' | 'solo';
 export interface SetupOptions {
     cwd?: string;
@@ -6,4 +7,33 @@ export interface SetupOptions {
     profile?: ProfileName;
 }
 export declare function runSetup(options?: SetupOptions): Promise<void>;
+/**
+ * Append `entries` to `<cwd>/.gitignore` if missing. Returns the entries
+ * actually added — an empty array when every entry is already present.
+ *
+ * Behavior:
+ *   - .gitignore exists: parse line-by-line, skip entries already present
+ *     (exact match after trim, ignoring leading `!`), append the rest.
+ *   - .gitignore missing: create it with the entries. Reasonable default
+ *     for a fresh `setup` since the user is opting into autopilot's cache.
+ *
+ * Idempotent: safe to call twice with the same entries.
+ */
+export declare function ensureGitignoreEntries(cwd: string, entries: string[]): Promise<string[]>;
+/**
+ * Write a starter `<cwd>/CLAUDE.md` if none exists. Pulls stack-detection
+ * info from the same `detection` result that drove preset selection, so the
+ * scaffolded conventions match the actual project.
+ *
+ * The starter doc is intentionally short (~35 lines) — a real project will
+ * grow it. The goal is to give downstream agents an anchor for the most
+ * common "I had to guess" decisions the v7.1.6 benchmark agent reported:
+ * commit-message style, test command, error class shape, prompt location.
+ *
+ * Returns true when the file was written (false if it already exists; we
+ * never overwrite — operator opted into autopilot, not into us nuking
+ * their docs).
+ */
+export declare function ensureStarterClaudeMd(cwd: string, detection: DetectionResult): Promise<boolean>;
 //# sourceMappingURL=setup.d.ts.map

package/dist/src/cli/setup.js CHANGED Viewed

@@ -138,6 +138,26 @@ export async function runSetup(options = {}) {
     for (const line of presetContent.trimEnd().split('\n')) {
         console.log(`  ${DIM(line)}`);
     }
+    // v7.1.7 — Auto-add `.guardrail-cache/` and `node_modules/` to .gitignore.
+    // Per the v7.1.6 blank-repo benchmark, these are the two most common
+    // day-1 paper cuts: `setup` creates the cache dir on first run, and (for
+    // Node projects) `npm install` creates `node_modules` — neither belongs
+    // in git. Entries already present are skipped silently; if no .gitignore
+    // exists, one is created containing just these entries.
+    const gitignoreAdds = await ensureGitignoreEntries(cwd, [
+        '.guardrail-cache/',
+        'node_modules/',
+    ]);
+    if (gitignoreAdds.length > 0) {
+        console.log(`\n  ${PASS}  Added to .gitignore: ${DIM(gitignoreAdds.join(', '))}`);
+    }
+    // v7.1.7 — Auto-scaffold a starter CLAUDE.md if none exists. Closes ~5 of
+    // 6 friction points the benchmark agent hit on a blank repo (commit
+    // style, error class shape, test runner choice, etc.).
+    const claudeMdAdded = await ensureStarterClaudeMd(cwd, detection);
+    if (claudeMdAdded) {
+        console.log(`  ${PASS}  Wrote starter CLAUDE.md`);
+    }
     let hookInstalled = false;
     if (!options.skipHook) {
         const hookCode = await runHook('install', { cwd, silent: true });
@@ -152,6 +172,19 @@ export async function runSetup(options = {}) {
     console.log('\nChecking prerequisites…');
     await runDoctor();
     console.log(`\n${BOLD('Next steps:')}\n`);
+    // v7.1.9 — Generic+low-confidence detection prompt. The v7.1.8 benchmark
+    // re-run on a truly blank repo (no package.json / go.mod / language signal)
+    // surfaced this: setup runs fine but downstream agents get a CLAUDE.md
+    // saying "Detected: Generic (low confidence)" with no concrete next step
+    // to improve detection. Surfacing the actionable "scaffold a stack file
+    // first" hint converts a paper-cut into a one-liner.
+    if (detection.preset === 'generic' && detection.confidence === 'low') {
+        console.log(`  ${WARN}  ${CYAN('Stack detection: Generic (low confidence).')}`);
+        console.log(`       For higher-quality reviews + stack-specific presets, scaffold a`);
+        console.log(`       package manifest first, then re-run setup:`);
+        console.log(`         npm init -y                              ${DIM('# or: pnpm init, go mod init, cargo init')}`);
+        console.log(`         npx claude-autopilot setup --force       ${DIM('# re-detect with the new manifest')}\n`);
+    }
     if (!hasKey) {
         console.log(`  1. ${CYAN('Set an LLM API key')} — guardrail needs one to review code:`);
         console.log(`       export ANTHROPIC_API_KEY=sk-ant-...     # https://console.anthropic.com/`);
@@ -175,4 +208,108 @@ export async function runSetup(options = {}) {
         }
     }
 }
+// ---------------------------------------------------------------------------
+// v7.1.7 — setup-verb day-1 polish helpers
+// ---------------------------------------------------------------------------
+/**
+ * Append `entries` to `<cwd>/.gitignore` if missing. Returns the entries
+ * actually added — an empty array when every entry is already present.
+ *
+ * Behavior:
+ *   - .gitignore exists: parse line-by-line, skip entries already present
+ *     (exact match after trim, ignoring leading `!`), append the rest.
+ *   - .gitignore missing: create it with the entries. Reasonable default
+ *     for a fresh `setup` since the user is opting into autopilot's cache.
+ *
+ * Idempotent: safe to call twice with the same entries.
+ */
+export async function ensureGitignoreEntries(cwd, entries) {
+    const gitignorePath = path.join(cwd, '.gitignore');
+    let existing = [];
+    let existingContent = '';
+    try {
+        existingContent = await fsAsync.readFile(gitignorePath, 'utf8');
+        existing = existingContent
+            .split('\n')
+            .map((l) => l.trim())
+            .filter((l) => l.length > 0 && !l.startsWith('#'));
+    }
+    catch {
+        // Any read error lands here (typically the file doesn't exist);
+        // existingContent stays '' and the writeFile below creates the file.
+    }
+    const present = new Set(existing.map((l) => l.replace(/^!/, '')));
+    const missing = entries.filter((e) => !present.has(e.replace(/^!/, '')));
+    if (missing.length === 0)
+        return [];
+    // Build the appended block. Prepend a newline when the existing file
+    // lacks a final one, so the first new entry isn't glued onto its last line.
+    const needsLeadingNewline = existingContent.length > 0 && !existingContent.endsWith('\n');
+    const block = (needsLeadingNewline ? '\n' : '') +
+        (existingContent.length > 0 ? '# claude-autopilot (v7.1.7+)\n' : '') +
+        missing.join('\n') +
+        '\n';
+    await fsAsync.writeFile(gitignorePath, existingContent + block, 'utf8');
+    return missing;
+}
+/**
+ * Write a starter `<cwd>/CLAUDE.md` if none exists. Pulls stack-detection
+ * info from the same `detection` result that drove preset selection, so the
+ * scaffolded conventions match the actual project.
+ *
+ * The starter doc is intentionally short (~35 lines) — a real project will
+ * grow it. The goal is to give downstream agents an anchor for the most
+ * common "I had to guess" decisions the v7.1.6 benchmark agent reported:
+ * commit-message style, test command, error class shape, prompt location.
+ *
+ * Returns true when the file was written (false if it already exists; we
+ * never overwrite — operator opted into autopilot, not into us nuking
+ * their docs).
+ */
+export async function ensureStarterClaudeMd(cwd, detection) {
+    const dest = path.join(cwd, 'CLAUDE.md');
+    if (fs.existsSync(dest))
+        return false;
+    const stackLabel = PRESET_LABELS[detection.preset] ?? detection.preset;
+    const today = new Date().toISOString().slice(0, 10);
+    const body = [
+        `# CLAUDE.md`,
+        ``,
+        `Project conventions for AI-assisted contributions. Auto-scaffolded by`,
+        `\`claude-autopilot setup\` on ${today}; edit freely.`,
+        ``,
+        `## Stack`,
+        ``,
+        `- **Detected:** ${stackLabel} (${detection.confidence} confidence)`,
+        `- **Test command:** \`${detection.testCommand}\``,
+        `- **Evidence:** ${detection.evidence}`,
+        ``,
+        `## Conventions`,
+        ``,
+        `- **Commit messages:** Conventional Commits (\`feat:\`, \`fix:\`,`,
+        `  \`docs:\`, \`refactor:\`, \`test:\`, \`chore:\`). One sentence first`,
+        `  line, optional body.`,
+        `- **Branches:** \`feat/<topic>\`, \`fix/<topic>\`, \`chore/<topic>\`.`,
+        `- **Errors:** prefer custom \`Error\` subclasses with a string \`code\``,
+        `  field for programmatic handling. Example:`,
+        `  \`\`\`ts`,
+        `  class FetchFailed extends Error { code = 'fetch_failed' as const; }`,
+        `  \`\`\``,
+        `- **Tests:** colocated with source under \`tests/\` or \`__tests__/\`.`,
+        `  Run via \`${detection.testCommand}\`.`,
+        ``,
+        `## Patterns to mimic`,
+        ``,
+        `- TODO: as the project grows, list 2-3 example files agents should`,
+        `  read first to learn local style.`,
+        ``,
+        `## Common pitfalls`,
+        ``,
+        `- TODO: list any non-obvious gotchas — env-var quirks, ordering`,
+        `  requirements, footguns the test suite won't catch.`,
+        ``,
+    ].join('\n');
+    await fsAsync.writeFile(dest, body, 'utf8');
+    return true;
+}
 //# sourceMappingURL=setup.js.map

package/dist/src/cli/spec.d.ts ADDED Viewed

@@ -0,0 +1,66 @@
+import type { GuardrailConfig } from '../core/config/types.ts';
+import { type RunPhase } from '../core/run-state/phase-runner.ts';
+export interface SpecCommandOptions {
+    cwd?: string;
+    configPath?: string;
+    /**
+     * v6.0.3 — engine knob inputs. Same shape and precedence as scan / costs /
+     * fix / brainstorm (CLI > env > config > built-in default off in v6.0.x).
+     */
+    cliEngine?: boolean;
+    envEngine?: string;
+    /**
+     * Test-only seam — when true, the phase body returns its result without
+     * printing the advisory banner. Lets engine-smoke tests assert the
+     * `state.json` + `events.ndjson` lifecycle without polluting stdout.
+     * Production callers (the CLI dispatcher) MUST NOT pass this.
+     */
+    __silent?: boolean;
+}
+/**
+ * Phase input — minimal. The CLI verb body is a print-and-exit advisory.
+ * Captured as a struct so the engine path's phase body matches the
+ * engine-off path call signature.
+ *
+ * Exported so the v6.2.0 orchestrator's phase registry can carry the typed
+ * I/O shape on its `PhaseRegistration<SpecInput, SpecOutput>` slot.
+ */
+export interface SpecInput {
+    cwd: string;
+    silent: boolean;
+}
+/**
+ * Phase output — JSON-serializable acknowledgment. Mirrors the shape of
+ * `BrainstormOutput`. Persisted as `result` on `phases/spec.json`.
+ */
+export interface SpecOutput {
+    /** Always 'advisory' for v6.0.3 — the CLI verb is a Claude Code pointer. */
+    kind: 'advisory';
+    nextActions: string[];
+}
+/** v6.2.0 — see scan.ts for the kind='early-exit' rationale. Spec has no
+ *  early-exit branches today (it just creates a config struct and returns
+ *  an advisory) so this discriminant is included for shape parity with the
+ *  other builders. */
+export interface BuildSpecPhaseEarlyExit {
+    kind: 'early-exit';
+    exitCode: number;
+}
+export interface BuildSpecPhaseResult {
+    kind: 'phase';
+    phase: RunPhase<SpecInput, SpecOutput>;
+    input: SpecInput;
+    config: GuardrailConfig;
+    renderResult: (output: SpecOutput) => number;
+}
+/**
+ * v6.2.0 — extract the `RunPhase<SpecInput, SpecOutput>` construction out of
+ * `runSpec(options)` so the new top-level `autopilot` orchestrator can drive
+ * `runPhase` itself with a shared `phaseIdx` against the same run dir.
+ *
+ * Parity with `runSpec(options)` is asserted by
+ * `tests/cli/spec-builder-parity.test.ts`.
+ */
+export declare function buildSpecPhase(options: SpecCommandOptions): Promise<BuildSpecPhaseResult | BuildSpecPhaseEarlyExit>;
+export declare function runSpec(options?: SpecCommandOptions): Promise<number>;
+//# sourceMappingURL=spec.d.ts.map

package/dist/src/cli/spec.js ADDED Viewed

@@ -0,0 +1,132 @@
+// src/cli/spec.ts
+//
+// v6.0.3 — wrap the `spec` pipeline phase through `runPhase`.
+//
+// `spec` is the second phase of the autopilot pipeline (brainstorm → spec →
+// plan → implement → migrate → validate → pr → review). Like `brainstorm`, it
+// is implemented primarily as a Claude Code skill, not as a standalone CLI
+// subcommand. The CLI verb that ships in this binary is an advisory shim: it
+// points the user at the Claude Code skill and the next pipeline verbs. There
+// is no LLM call in the CLI verb body and no provider side effects. The
+// pure-LLM spec writing happens in Claude Code; the spec markdown produced
+// there lands at `docs/superpowers/specs/<slug>.md` (a local file write —
+// the recipe treats local file writes as acceptable inside the phase body,
+// identical precedent to `fix.ts` editing local source files).
+//
+// Idempotency / side effects (deviation note vs. spec table):
+//   - The spec table at docs/specs/v6-run-state-engine.md says
+//     `idempotent: no` for `spec` because re-running produces NEW LLM
+//     content each invocation. v6.0.3 declares `idempotent: true` to match
+//     the engine's actual semantics ("safe to retry without
+//     reconciliation"): the CLI verb itself is a printed advisory that is
+//     byte-for-byte identical on every invocation, has no externalRefs to
+//     reconcile, and no provider state to roll back. Same reasoning as the
+//     brainstorm wrap. See `src/cli/brainstorm.ts` for the longer
+//     deviation rationale.
+//   - `hasSideEffects: false` — the CLI verb prints to stdout. No provider
+//     calls, no git push, no PR creation, no remote API write.
+import * as path from 'node:path';
+import * as fs from 'node:fs';
+import { loadConfig } from "../core/config/loader.js";
+import { runPhaseWithLifecycle } from "../core/run-state/run-phase-with-lifecycle.js";
+const C = { // ANSI SGR escape sequences for styling terminal output, keyed by style name.
+    reset: '\x1b[0m', bold: '\x1b[1m', dim: '\x1b[2m',
+    cyan: '\x1b[36m', red: '\x1b[31m', // `red` is not referenced anywhere else in this file.
+};
+const fmt = (c, t) => `${C[c]}${t}${C.reset}`; // Wrap text `t` in style `C[c]`, then reset attributes; an unknown `c` interpolates as "undefined".
+/**
+ * v6.2.0 — extract the `RunPhase<SpecInput, SpecOutput>` construction out of
+ * `runSpec(options)` so the new top-level `autopilot` orchestrator can drive
+ * `runPhase` itself with a shared `phaseIdx` against the same run dir.
+ *
+ * Parity with `runSpec(options)` is asserted by
+ * `tests/cli/spec-builder-parity.test.ts`.
+ *
+ * @param options - Command options; `cwd`, `configPath` and `__silent` are
+ *   read here. No default is applied, so `options` must be an object.
+ * @returns An object with `kind: 'phase'` carrying the phase descriptor, its
+ *   input, the resolved config, and a `renderResult` callback. This function
+ *   has no code path that returns an `'early-exit'` result.
+ */
+export async function buildSpecPhase(options) {
+    const cwd = options.cwd ?? process.cwd();
+    const configPath = options.configPath ?? path.join(cwd, 'guardrail.config.yaml');
+    let config = { configVersion: 1 }; // Fallback used when no config file exists or the loader returns a falsy value.
+    if (fs.existsSync(configPath)) {
+        const loaded = await loadConfig(configPath);
+        if (loaded)
+            config = loaded;
+    }
+    const specInput = { cwd, silent: options.__silent === true }; // Strict check: only a literal `true` silences rendering.
+    const phase = {
+        name: 'spec',
+        // Pure-LLM spec writing happens in the Claude Code skill, not here.
+        // The CLI verb is an advisory print with no externalRefs to reconcile
+        // and no provider state to roll back. Safe to retry. (Deviation from
+        // the spec table noted at the top of the file.)
+        idempotent: true,
+        // No provider calls, no git push, no PR creation. Identical to costs
+        // and brainstorm.
+        hasSideEffects: false,
+        run: async (input) => executeSpecPhase(input),
+    };
+    return {
+        kind: 'phase',
+        phase,
+        input: specInput,
+        config,
+        renderResult: (output) => renderSpecOutput(output, specInput), // Closes over specInput so callers pass only the output.
+    };
+}
+export async function runSpec(options = {}) { // CLI entry point for `spec`: build the phase, run it, render the result; resolves to an exit code.
+    const built = await buildSpecPhase(options);
+    if (built.kind === 'early-exit') // Not produced by buildSpecPhase in this file; handled for parity with other builders.
+        return built.exitCode;
+    const { phase, input, config, renderResult } = built;
+    // v6.0.6 — lifecycle wiring lives in `runPhaseWithLifecycle`.
+    let output;
+    try {
+        const result = await runPhaseWithLifecycle({
+            cwd: input.cwd,
+            phase,
+            input,
+            config,
+            cliEngine: options.cliEngine,
+            envEngine: options.envEngine,
+            runEngineOff: () => executeSpecPhase(input), // Same phase body as `phase.run`, supplied separately under the engine-off key.
+        });
+        output = result.output;
+    }
+    catch { // Any failure maps to exit code 1; the error is not logged here. NOTE(review): presumably runPhaseWithLifecycle reports it — confirm.
+        return 1;
+    }
+    return renderResult(output);
+}
+// ---------------------------------------------------------------------------
+// Phase body — produce the advisory payload. Pure: no provider calls. The input is ignored, so every call resolves to an equal object.
+// ---------------------------------------------------------------------------
+async function executeSpecPhase(_input) { // `async` only so the result is a Promise; nothing is awaited inside.
+    return {
+        kind: 'advisory',
+        nextActions: [ // Fixed follow-up hints; the renderer in this file does not print them.
+            'Approve a brainstorm output, then invoke /autopilot from Claude Code',
+            'The autopilot skill writes the implementation plan + executes the pipeline',
+        ],
+    };
+}
+// ---------------------------------------------------------------------------
+// Render — translate SpecOutput back to the stdout advisory + exit code. The printed text is static; `_output` is not read.
+// ---------------------------------------------------------------------------
+function renderSpecOutput(_output, input) { // Returns the exit code, which is 0 on both paths below.
+    if (input.silent) // Silent mode: skip the stdout advisory entirely.
+        return 0;
+    console.log(`
+${fmt('bold', '[spec]')} Spec writing is a Claude Code skill, not a standalone CLI subcommand.
+Invoke it from Claude Code:
+  ${fmt('cyan', '/brainstorm')}                         Interactive spec writing (entry point)
+  ${fmt('cyan', '/autopilot')}                          Full pipeline from an approved spec
+  ${fmt('cyan', '/migrate')}                            Database migration phase (stack-dependent)
+Specs land at ${fmt('dim', 'docs/superpowers/specs/<slug>.md')} — once approved, /autopilot consumes them.
+Full pipeline docs: https://github.com/axledbetter/claude-autopilot#the-pipeline-phase-by-phase
+`); // The template starts and ends with a newline, so the advisory is padded by blank lines.
+    return 0;
+}
+//# sourceMappingURL=spec.js.map