npm - nightytidy - Versions diffs - 0.1.0 - Mend

nightytidy 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (61) hide show

package/LICENSE +21 -0
package/README.md +314 -0
package/bin/nightytidy.js +3 -0
package/package.json +55 -0
package/src/checks.js +367 -0
package/src/claude.js +655 -0
package/src/cli.js +1012 -0
package/src/consolidation.js +81 -0
package/src/dashboard-html.js +496 -0
package/src/dashboard-standalone.js +167 -0
package/src/dashboard-tui.js +208 -0
package/src/dashboard.js +427 -0
package/src/env.js +100 -0
package/src/executor.js +550 -0
package/src/git.js +348 -0
package/src/lock.js +186 -0
package/src/logger.js +111 -0
package/src/notifications.js +33 -0
package/src/orchestrator.js +919 -0
package/src/prompts/loader.js +55 -0
package/src/prompts/manifest.json +138 -0
package/src/prompts/specials/changelog.md +28 -0
package/src/prompts/specials/consolidation.md +61 -0
package/src/prompts/specials/doc-update.md +1 -0
package/src/prompts/specials/report.md +95 -0
package/src/prompts/steps/01-documentation.md +173 -0
package/src/prompts/steps/02-test-coverage.md +181 -0
package/src/prompts/steps/03-test-hardening.md +181 -0
package/src/prompts/steps/04-test-architecture.md +130 -0
package/src/prompts/steps/05-test-consolidation.md +165 -0
package/src/prompts/steps/06-test-quality.md +211 -0
package/src/prompts/steps/07-api-design.md +165 -0
package/src/prompts/steps/08-security-sweep.md +207 -0
package/src/prompts/steps/09-dependency-health.md +217 -0
package/src/prompts/steps/10-codebase-cleanup.md +189 -0
package/src/prompts/steps/11-crosscutting-concerns.md +196 -0
package/src/prompts/steps/12-file-decomposition.md +263 -0
package/src/prompts/steps/13-code-elegance.md +329 -0
package/src/prompts/steps/14-architectural-complexity.md +297 -0
package/src/prompts/steps/15-type-safety.md +192 -0
package/src/prompts/steps/16-logging-error-message.md +173 -0
package/src/prompts/steps/17-data-integrity.md +139 -0
package/src/prompts/steps/18-performance.md +183 -0
package/src/prompts/steps/19-cost-resource-optimization.md +136 -0
package/src/prompts/steps/20-error-recovery.md +145 -0
package/src/prompts/steps/21-race-condition-audit.md +178 -0
package/src/prompts/steps/22-bug-hunt.md +229 -0
package/src/prompts/steps/23-frontend-quality.md +210 -0
package/src/prompts/steps/24-uiux-audit.md +284 -0
package/src/prompts/steps/25-state-management.md +170 -0
package/src/prompts/steps/26-perceived-performance.md +190 -0
package/src/prompts/steps/27-devops.md +165 -0
package/src/prompts/steps/28-scheduled-job-chron-jobs.md +141 -0
package/src/prompts/steps/29-observability.md +152 -0
package/src/prompts/steps/30-backup-check.md +155 -0
package/src/prompts/steps/31-product-polish-ux-friction.md +122 -0
package/src/prompts/steps/32-feature-discovery-opportunity.md +128 -0
package/src/prompts/steps/33-strategic-opportunities.md +217 -0
package/src/report.js +540 -0
package/src/setup.js +133 -0
package/src/sync.js +536 -0

package/src/orchestrator.js ADDED Viewed

@@ -0,0 +1,919 @@
+/**
+ * @fileoverview Claude Code orchestrator mode for NightyTidy.
+ *
+ * Provides a JSON-based API for step-by-step runs where Claude Code
+ * (or another orchestrator) controls the workflow conversationally.
+ *
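+ * Error contract: the run entry points (initRun, runStep, finishRun) are
+ * documented never to throw. They return { success: true, ...data } on
+ * success or { success: false, error: string } on failure.
+ * The state helpers do not use that shape: readState returns the state object
+ * or null, and writeState lets file-system errors propagate to its caller.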
+ */
+import { readFileSync, writeFileSync, renameSync, unlinkSync, existsSync } from 'fs';
+import { spawn } from 'child_process';
+import { fileURLToPath } from 'url';
+import path from 'path';
+import { initLogger, info, warn, error as logError } from './logger.js';
+import { runPreChecks } from './checks.js';
+import { initGit, excludeEphemeralFiles, getCurrentBranch, createPreRunTag, createRunBranch, mergeRunBranch, getGitInstance, ensureOnBranch } from './git.js';
+import { runPrompt, ERROR_TYPE } from './claude.js';
+import { STEPS, reloadSteps } from './prompts/loader.js';
+import { executeSingleStep, sumCosts, SAFETY_PREAMBLE, PROD_PREAMBLE, copyPromptsToProject } from './executor.js';
+import { notify } from './notifications.js';
+import { generateReport, formatDuration, getVersion, buildReportNames, buildReportPrompt, verifyReportContent, updateClaudeMd } from './report.js';
+import { acquireLock, releaseLock } from './lock.js';
+/**
+ * @typedef {import('./executor.js').CostData} CostData
+ * @typedef {import('./executor.js').StepResult} StepResult
+ */
+/**
+ * @typedef {Object} OrchestratorState
+ * @property {number} version - State format version
+ * @property {string} originalBranch - Branch to return to after run
+ * @property {string} runBranch - Branch for run changes
+ * @property {string} tagName - Safety tag name
+ * @property {number[]} selectedSteps - Step numbers selected for this run
+ * @property {StepEntry[]} completedSteps - Successfully completed steps
+ * @property {StepEntry[]} failedSteps - Failed steps
+ * @property {StepEntry[]} [skippedSteps] - Steps skipped (prompt not applicable)
+ * @property {number} startTime - Run start timestamp (ms)
+ * @property {number|null} timeout - Per-step timeout in ms
+ * @property {number|null} dashboardPid - Dashboard server process ID
+ * @property {string|null} dashboardUrl - Dashboard server URL
+ */
+/**
+ * @typedef {Object} StepEntry
+ * @property {number} number - Step number
+ * @property {string} name - Step name
+ * @property {'completed' | 'failed' | 'skipped'} status - Step status
+ * @property {number} duration - Duration in milliseconds
+ * @property {number} attempts - Number of attempts
+ * @property {string} output - Truncated output (max 6000 chars)
+ * @property {string|null} error - Error message if failed
+ * @property {CostData|null} cost - Cost data
+ * @property {boolean} suspiciousFast - True if flagged as suspicious
+ * @property {string|null} errorType - Error type if failed
+ * @property {number|null} retryAfterMs - Retry delay for rate limits
+ */
+/**
+ * @typedef {Object} OrchestratorResult
+ * @property {boolean} success - Whether operation succeeded
+ * @property {string} [error] - Error message if failed
+ */
+const PROGRESS_FILENAME = 'nightytidy-progress.json'; // progress JSON written by writeProgress()
+const URL_FILENAME = 'nightytidy-dashboard.url'; // removed together with the progress file by cleanupDashboard()
+const STATE_FILENAME = 'nightytidy-run-state.json'; // run state persisted by writeState()
+export const STATE_VERSION = 1; // readState() returns null for state files whose version differs
+const DASHBOARD_STARTUP_TIMEOUT = 5000; // ms — max wait for dashboard server to respond
+const SSE_FLUSH_DELAY = 500; // ms — brief delay to let last SSE event reach clients
+/**
+ * Get the path to the state file for a project.
+ *
+ * @param {string} projectDir - Project directory
+ * @returns {string} Absolute path to state file
+ */
+function statePath(projectDir) {
+  return path.join(projectDir, STATE_FILENAME);
+}
+/**
+ * Read the orchestrator state file.
+ *
+ * @param {string} projectDir - Project directory
+ * @returns {OrchestratorState|null} State object, or null if not found/invalid
+ */
+export function readState(projectDir) {
+  const fp = statePath(projectDir);
+  if (!existsSync(fp)) return null;
+  try {
+    const data = JSON.parse(readFileSync(fp, 'utf8'));
+    if (data.version !== STATE_VERSION) return null;
+    return data;
+  } catch {
+    return null;
+  }
+}
+/**
+ * Write the orchestrator state file atomically.
+ * Uses write-to-temp + rename to prevent truncation on crash.
+ *
+ * @param {string} projectDir - Project directory
+ * @param {OrchestratorState} state - State to write
+ * @returns {void}
+ */
+export function writeState(projectDir, state) {
+  // Write to temp file then rename for atomic replacement.
+  // Prevents truncated JSON on crash (FINDING-06, audit #21).
+  const target = statePath(projectDir);
+  const tmp = target + '.tmp';
+  writeFileSync(tmp, JSON.stringify(state, null, 2), 'utf8');
+  renameSync(tmp, target);
+}
+/**
+ * Delete the orchestrator state file.
+ *
+ * @param {string} projectDir - Project directory
+ * @returns {void}
+ */
+export function deleteState(projectDir) {
+  try {
+    unlinkSync(statePath(projectDir));
+  } catch (err) {
+    if (err.code !== 'ENOENT') {
+      warn(`Failed to delete state file: ${err.message}`);
+    }
+  }
+}
+/**
+ * Create a success result object.
+ *
+ * @template T
+ * @param {T} data - Data to include in result
+ * @returns {{success: true} & T}
+ */
+function ok(data) {
+  return { success: true, ...data };
+}
+/**
+ * Create a failure result object.
+ *
+ * @param {string} error - Error message
+ * @returns {{success: false, error: string}}
+ */
+function fail(error) {
+  return { success: false, error };
+}
+/**
+ * Validate that step numbers are within valid range.
+ *
+ * @param {number[]} numbers - Step numbers to validate
+ * @returns {{success: false, error: string}|null} Error result, or null if valid
+ */
+function validateStepNumbers(numbers) {
+  const valid = STEPS.map(s => s.number);
+  const invalid = numbers.filter(n => !valid.includes(n));
+  if (invalid.length > 0) {
+    return fail(`Invalid step number(s): ${invalid.join(', ')}. Valid range: 1-${STEPS.length}.`);
+  }
+  return null;
+}
+/**
+ * Validate that a step can be run in the current orchestrator state.
+ *
+ * @param {number} stepNumber - Step number to validate
+ * @param {OrchestratorState} state - Current orchestrator state
+ * @returns {string|null} Error string if invalid, null if valid
+ */
+function validateStepCanRun(stepNumber, state) {
+  if (!state.selectedSteps.includes(stepNumber)) {
+    return `Step ${stepNumber} is not in the selected steps for this run. Selected: ${state.selectedSteps.join(', ')}`;
+  }
+  if (state.completedSteps.some(s => s.number === stepNumber)) {
+    return `Step ${stepNumber} has already been completed in this run.`;
+  }
+  if ((state.skippedSteps || []).some(s => s.number === stepNumber)) {
+    return `Step ${stepNumber} was skipped (prompt not applicable to this codebase).`;
+  }
+  // Failed steps can be retried (e.g., after rate-limit pause/resume).
+  // The old entry is removed before recording the new result in runStep().
+  return null;
+}
+/**
+ * Build execution results from orchestrator state for report generation.
+ *
+ * @param {OrchestratorState} state - Orchestrator state
+ * @returns {import('./executor.js').ExecutionResults} Execution results
+ */
+function buildExecutionResults(state) {
+  const skipped = state.skippedSteps || [];
+  const allStepResults = [...state.completedSteps, ...state.failedSteps, ...skipped]
+    .sort((a, b) => state.selectedSteps.indexOf(a.number) - state.selectedSteps.indexOf(b.number));
+  return {
+    results: allStepResults.map(s => ({
+      step: { number: s.number, name: s.name },
+      status: s.status,
+      output: s.output || '',
+      duration: s.duration,
+      attempts: s.attempts,
+      error: s.status === 'failed' ? 'Step failed during orchestrated run' : null,
+      cost: s.cost || null,
+    })),
+    completedCount: state.completedSteps.length,
+    failedCount: state.failedSteps.length,
+    skippedCount: skipped.length,
+  };
+}
+/**
+ * @typedef {Object} ProgressState
+ * @property {'running' | 'paused' | 'completed' | 'error'} status
+ * @property {number} totalSteps
+ * @property {number} currentStepIndex
+ * @property {string} currentStepName
+ * @property {Array<{number: number, name: string, status: string, duration: number|null}>} steps
+ * @property {number} completedCount
+ * @property {number} failedCount
+ * @property {number} skippedCount
+ * @property {number} startTime
+ * @property {string|null} error
+ */
+/**
+ * Build progress state for dashboard display.
+ *
+ * @param {OrchestratorState} state - Orchestrator state
+ * @returns {ProgressState} Progress state for JSON serialization
+ */
+function buildProgressState(state) {
+  // Pre-index for O(1) lookups instead of O(n) find() calls
+  const stepsMap = new Map(STEPS.map(s => [s.number, s]));
+  const completedMap = new Map(state.completedSteps.map(s => [s.number, s]));
+  const failedMap = new Map(state.failedSteps.map(s => [s.number, s]));
+  const skippedMap = new Map((state.skippedSteps || []).map(s => [s.number, s]));
+  return {
+    status: 'running',
+    totalSteps: state.selectedSteps.length,
+    currentStepIndex: -1,
+    currentStepName: '',
+    steps: state.selectedSteps.map(num => {
+      const step = stepsMap.get(num);
+      const completed = completedMap.get(num);
+      const failed = failedMap.get(num);
+      const skipped = skippedMap.get(num);
+      return {
+        number: num,
+        name: step?.name || `Step ${num}`,
+        status: completed ? 'completed' : failed ? 'failed' : skipped ? 'skipped' : 'pending',
+        duration: completed?.duration || failed?.duration || skipped?.duration || null,
+      };
+    }),
+    completedCount: state.completedSteps.length,
+    failedCount: state.failedSteps.length,
+    skippedCount: (state.skippedSteps || []).length,
+    startTime: state.startTime,
+    error: null,
+  };
+}
+/**
+ * Write progress state to JSON file for dashboard consumption.
+ *
+ * @param {string} projectDir - Project directory
+ * @param {ProgressState} progressState - Progress state to write
+ * @returns {void}
+ */
+function writeProgress(projectDir, progressState) {
+  try {
+    writeFileSync(path.join(projectDir, PROGRESS_FILENAME), JSON.stringify(progressState), 'utf8');
+  } catch { /* non-critical */ }
+}
+const OUTPUT_BUFFER_SIZE = 100 * 1024; // max characters of streamed output kept by createOutputHandler()
+const OUTPUT_WRITE_INTERVAL = 500; // ms delay before buffered output is written to the progress file
+/**
+ * Create a throttled output handler for streaming Claude output.
+ *
+ * @param {ProgressState} progress - Progress state object (mutated)
+ * @param {string} projectDir - Project directory for progress file
+ * @returns {(chunk: string) => void} Output handler callback
+ */
+function createOutputHandler(progress, projectDir) {
+  let buffer = '';
+  let writePending = false;
+  return (chunk) => {
+    buffer += chunk;
+    // Forward to stdout so CLI bridge / agent can stream it in real time
+    process.stdout.write(chunk);
+    if (buffer.length > OUTPUT_BUFFER_SIZE) {
+      buffer = buffer.slice(buffer.length - OUTPUT_BUFFER_SIZE);
+    }
+    if (!writePending) {
+      writePending = true;
+      setTimeout(() => {
+        writePending = false;
+        progress.currentStepOutput = buffer;
+        writeProgress(projectDir, progress);
+      }, OUTPUT_WRITE_INTERVAL);
+    }
+  };
+}
+/**
+ * Clean up dashboard ephemeral files.
+ *
+ * @param {string} projectDir - Project directory
+ * @returns {void}
+ */
+function cleanupDashboard(projectDir) {
+  for (const f of [PROGRESS_FILENAME, URL_FILENAME]) {
+    try { unlinkSync(path.join(projectDir, f)); } catch { /* already gone */ }
+  }
+}
+/**
+ * Spawn a detached dashboard server process.
+ *
+ * Runs dashboard-standalone.js (resolved next to this module) under the
+ * current Node executable with projectDir as its only argument, then waits
+ * until the child's stdout has produced a newline and parses the accumulated
+ * text as JSON carrying `url` and `pid`.
+ *
+ * Resolves null when that text is not valid JSON, when the child emits
+ * 'error', when nothing arrives within DASHBOARD_STARTUP_TIMEOUT, or when
+ * spawning throws synchronously.
+ *
+ * NOTE(review): on timeout or invalid JSON the child is unref'd but not
+ * killed — confirm that leaving it running is intended.
+ *
+ * @param {string} projectDir - Project directory
+ * @returns {Promise<{url: string, pid: number}|null>} Dashboard info, or null on failure
+ */
+function spawnDashboardServer(projectDir) {
+  try {
+    const serverScript = fileURLToPath(new URL('./dashboard-standalone.js', import.meta.url));
+    const child = spawn(process.execPath, [serverScript, projectDir], {
+      detached: true,
+      stdio: ['ignore', 'pipe', 'ignore'], // only stdout is piped; it carries the startup JSON line
+      windowsHide: true,
+    });
+    return new Promise((resolve) => {
+      let output = '';
+      const timer = setTimeout(() => {
+        child.stdout.removeAllListeners();
+        child.unref(); // stop this process from waiting on the child
+        info('Dashboard server startup timed out — continuing without live progress display');
+        resolve(null);
+      }, DASHBOARD_STARTUP_TIMEOUT);
+      child.stdout.on('data', (chunk) => {
+        output += chunk.toString();
+        if (output.includes('\n')) { // a newline marks the end of the startup message
+          clearTimeout(timer);
+          child.stdout.removeAllListeners();
+          child.unref();
+          try {
+            const parsed = JSON.parse(output.trim());
+            return resolve({ url: parsed.url, pid: parsed.pid });
+          } catch (parseErr) {
+            info(`Dashboard startup response was not valid JSON: ${parseErr.message}`);
+            resolve(null);
+          }
+        }
+      });
+      child.on('error', (err) => {
+        clearTimeout(timer);
+        info(`Dashboard server spawn failed: ${err.message}`);
+        resolve(null);
+      });
+    });
+  } catch (err) {
+    warn(`Could not start dashboard server: ${err.message}`);
+    return Promise.resolve(null);
+  }
+}
+/**
+ * Stop the dashboard server process.
+ *
+ * @param {number|null} pid - Process ID to kill
+ * @returns {void}
+ */
+function stopDashboardServer(pid) {
+  if (!pid) return;
+  try {
+    process.kill(pid, 'SIGTERM');
+  } catch { /* already dead */ }
+}
+/**
+ * @typedef {Object} InitRunResult
+ * @property {boolean} success
+ * @property {string} [error]
+ * @property {string} [runBranch]
+ * @property {string} [tagName]
+ * @property {string} [originalBranch]
+ * @property {number[]} [selectedSteps]
+ * @property {string|null} [dashboardUrl]
+ */
+/**
+ * Initialize an orchestrated run.
+ *
+ * Performs pre-checks, git setup, and creates state file. The run can then
+ * be executed step-by-step via runStep().
+ *
+ * Sequence, as implemented below: refuse if a state file already exists,
+ * acquire the lock (persistent: true), init git and run pre-checks, attempt a
+ * prompt sync (failures only log a warning), parse and validate `steps`,
+ * create the pre-run tag and run branch, copy and commit the prompts, write
+ * the state file, and finally spawn the dashboard server unless skipped.
+ *
+ * Non-numeric tokens in `steps` are dropped with a warning. Tokens are parsed
+ * with parseInt, so a value such as "3abc" is accepted as 3. Duplicate step
+ * numbers are kept as given. When `steps` is omitted, every step in STEPS is
+ * selected.
+ *
+ * NOTE(review): releaseLock() is never called in this function, including on
+ * the early-return and catch paths that run after acquireLock() — confirm
+ * that lock.js tolerates a lock left behind by a failed init.
+ *
+ * @param {string} projectDir - Target project directory
+ * @param {Object} [options] - Options
+ * @param {string} [options.steps] - Comma-separated step numbers
+ * @param {number} [options.timeout] - Per-step timeout in ms
+ * @param {boolean} [options.skipDashboard] - When truthy, the dashboard server is not spawned
+ * @returns {Promise<InitRunResult>} Result object (never throws)
+ */
+export async function initRun(projectDir, { steps, timeout, skipDashboard } = {}) {
+  try {
+    initLogger(projectDir, { quiet: true });
+    info(`NightyTidy v${getVersion()} orchestrator starting (Node ${process.version}, ${process.platform} ${process.arch})`);
+    // Check for existing run
+    if (readState(projectDir)) {
+      return fail('A run is already in progress. Call --finish-run to complete it, or delete nightytidy-run-state.json to force-reset.');
+    }
+    writeProgress(projectDir, { status: 'initializing', initPhase: 'lock' });
+    await acquireLock(projectDir, { persistent: true });
+    writeProgress(projectDir, { status: 'initializing', initPhase: 'git_init' });
+    const git = initGit(projectDir);
+    excludeEphemeralFiles();
+    writeProgress(projectDir, { status: 'initializing', initPhase: 'pre_checks' });
+    await runPreChecks(projectDir, git);
+    // Auto-sync prompts from Google Doc (non-blocking)
+    writeProgress(projectDir, { status: 'initializing', initPhase: 'sync_prompts' });
+    try {
+      const { syncPrompts } = await import('./sync.js');
+      const syncResult = await syncPrompts();
+      if (syncResult.success) {
+        const changeCount = syncResult.summary.updated.length +
+          syncResult.summary.added.length +
+          syncResult.summary.removed.length;
+        if (changeCount > 0) {
+          reloadSteps();
+          info(`Prompts synced: ${changeCount} change(s)`);
+        } else {
+          info('Prompts up to date');
+        }
+      } else {
+        warn(`Prompt sync failed: ${syncResult.error}. Using cached versions.`);
+      }
+    } catch (err) {
+      warn(`Prompt sync error: ${err.message}. Using cached versions.`);
+    }
+    // Validate and select steps
+    writeProgress(projectDir, { status: 'initializing', initPhase: 'validate_steps' });
+    let selectedNums;
+    if (steps) {
+      const rawTokens = steps.split(',').map(s => s.trim());
+      const nums = rawTokens.map(s => parseInt(s, 10));
+      const droppedTokens = rawTokens.filter((s, i) => Number.isNaN(nums[i]));
+      if (droppedTokens.length > 0) {
+        warn(`Ignoring non-numeric step values: ${droppedTokens.join(', ')}`);
+      }
+      const validNums = nums.filter(n => !Number.isNaN(n));
+      if (validNums.length === 0) {
+        return fail('No valid step numbers provided. Use --list --json to see available steps.');
+      }
+      const err = validateStepNumbers(validNums);
+      if (err) return err;
+      selectedNums = validNums;
+    } else {
+      selectedNums = STEPS.map(s => s.number);
+    }
+    writeProgress(projectDir, { status: 'initializing', initPhase: 'git_branch' });
+    const originalBranch = await getCurrentBranch();
+    const tagName = await createPreRunTag();
+    const runBranch = await createRunBranch(originalBranch);
+    // Sync all prompts into the target project for audit trail
+    writeProgress(projectDir, { status: 'initializing', initPhase: 'copy_prompts' });
+    copyPromptsToProject(projectDir);
+    try {
+      const git = getGitInstance();
+      await git.add([path.join('audit-reports', 'refactor-prompts')]);
+      await git.commit('NightyTidy: Sync refactor prompts');
+    } catch (err) {
+      warn(`Failed to commit refactor prompts: ${err.message}`);
+    }
+    if (!skipDashboard) {
+      writeProgress(projectDir, { status: 'initializing', initPhase: 'dashboard' });
+    }
+    const state = {
+      version: STATE_VERSION,
+      originalBranch,
+      runBranch,
+      tagName,
+      selectedSteps: selectedNums,
+      completedSteps: [],
+      failedSteps: [],
+      skippedSteps: [],
+      startTime: Date.now(),
+      timeout: timeout || null,
+      dashboardPid: null,
+      dashboardUrl: null,
+    };
+    writeState(projectDir, state);
+    // Write running progress JSON and spawn dashboard server
+    writeProgress(projectDir, buildProgressState(state));
+    if (!skipDashboard) {
+      const dashboard = await spawnDashboardServer(projectDir);
+      if (dashboard) {
+        state.dashboardPid = dashboard.pid;
+        state.dashboardUrl = dashboard.url;
+        writeState(projectDir, state);
+        info(`Dashboard server at ${dashboard.url} (PID ${dashboard.pid})`);
+      }
+    }
+    notify('NightyTidy Started', `Orchestrator run initialized with ${selectedNums.length} steps.`);
+    info(`Orchestrator init complete: branch=${runBranch}, tag=${tagName}, steps=${selectedNums.join(',')}`);
+    return ok({
+      runBranch,
+      tagName,
+      originalBranch,
+      selectedSteps: selectedNums,
+      dashboardUrl: state.dashboardUrl,
+    });
+  } catch (err) {
+    return fail(err.message);
+  }
+}
+/**
+ * @typedef {Object} RunStepResult
+ * @property {boolean} success
+ * @property {string} [error]
+ * @property {number} [step]
+ * @property {string} [name]
+ * @property {'completed' | 'failed' | 'skipped'} [status]
+ * @property {string} [output]
+ * @property {number} [duration]
+ * @property {string} [durationFormatted]
+ * @property {number} [attempts]
+ * @property {number|null} [costUSD]
+ * @property {number|null} [inputTokens]
+ * @property {number|null} [outputTokens]
+ * @property {boolean} [suspiciousFast]
+ * @property {string|null} [errorType]
+ * @property {number|null} [retryAfterMs]
+ * @property {number[]} [remainingSteps]
+ */
+/**
+ * Run a single step in an orchestrated run.
+ *
+ * The step is executed once. If that attempt fails for a reason other than
+ * ERROR_TYPE.RATE_LIMIT, it is retried with `continueSession: true` and a
+ * prod prompt; if that also fails (again not a rate limit), it is run a third
+ * time without those options. Attempts and cost are accumulated across the
+ * tries, and the run branch is re-checked between them.
+ *
+ * The outcome is appended to completedSteps, skippedSteps or failedSteps in
+ * the state file, replacing any earlier failed entry for the same step. The
+ * stored and returned output is truncated to 6000 characters. Any exception
+ * raised along the way is converted into a failure result.
+ *
+ * @param {string} projectDir - Target project directory
+ * @param {number} stepNumber - Step number to run
+ * @param {Object} [options] - Options
+ * @param {number} [options.timeout] - Step timeout in ms (overrides state)
+ * @returns {Promise<RunStepResult>} Result object (never throws)
+ */
+export async function runStep(projectDir, stepNumber, { timeout } = {}) {
+  try {
+    if (!Number.isFinite(stepNumber) || stepNumber < 1) {
+      return fail(`Invalid step number: ${stepNumber}. Use --list to see available steps.`);
+    }
+    initLogger(projectDir, { quiet: true });
+    const state = readState(projectDir);
+    if (!state) {
+      return fail('No active orchestrator run. Call --init-run first.');
+    }
+    const validationError = validateStepCanRun(stepNumber, state);
+    if (validationError) return fail(validationError);
+    const step = STEPS.find(s => s.number === stepNumber);
+    if (!step) {
+      return fail(`Step ${stepNumber} not found in available steps.`);
+    }
+    initGit(projectDir);
+    const stepTimeout = timeout || state.timeout || undefined;
+    info(`Orchestrator: running step ${stepNumber} — ${step.name}`);
+    // Branch guard: ensure we're on the run branch before starting
+    await ensureOnBranch(state.runBranch);
+    // Update progress: mark step as running
+    const stepIdx = state.selectedSteps.indexOf(stepNumber);
+    const progress = buildProgressState(state);
+    progress.currentStepIndex = stepIdx;
+    progress.currentStepName = step.name;
+    if (stepIdx >= 0 && progress.steps[stepIdx]) {
+      progress.steps[stepIdx].status = 'running';
+    }
+    writeProgress(projectDir, progress);
+    // Stream Claude output to progress file for dashboard consumption
+    const onOutput = createOutputHandler(progress, projectDir);
+    let result = await executeSingleStep(step, projectDir, { timeout: stepTimeout, onOutput });
+    // ── 3-Tier Recovery ──────────────────────────────────────────────
+    // Tier 1 already ran above. If it failed (non-rate-limit), try:
+    //   Tier 2 (prod): --continue to resume the killed session
+    //   Tier 3 (fresh): clean slate with a new session
+    if (result.status === 'failed' && result.errorType !== ERROR_TYPE.RATE_LIMIT) {
+      // ── Tier 2: PROD — continue killed session ──
+      warn(`Step ${stepNumber} failed (${result.error}) — prodding (resuming previous session)`);
+      progress.prodding = true;
+      progress.retrying = false;
+      progress.currentStepOutput = '';
+      writeProgress(projectDir, progress);
+      const prodOutput = createOutputHandler(progress, projectDir);
+      const prodPrompt = SAFETY_PREAMBLE + PROD_PREAMBLE + step.prompt;
+      const prodResult = await executeSingleStep(step, projectDir, {
+        timeout: stepTimeout, onOutput: prodOutput,
+        continueSession: true, promptOverride: prodPrompt,
+      });
+      result = {
+        ...prodResult,
+        attempts: (result.attempts || 0) + (prodResult.attempts || 0),
+        cost: sumCosts(result.cost, prodResult.cost),
+      };
+      // Branch guard between tiers — recover before deciding next tier
+      await ensureOnBranch(state.runBranch);
+      if (result.status === 'completed') {
+        info(`Step ${stepNumber} succeeded on prod (session resume)`);
+      } else if (result.errorType !== ERROR_TYPE.RATE_LIMIT) {
+        // ── Tier 3: FRESH RETRY — clean slate ──
+        warn(`Step ${stepNumber} prod failed — fresh retry with new session`);
+        progress.prodding = false;
+        progress.retrying = true;
+        progress.currentStepOutput = '';
+        writeProgress(projectDir, progress);
+        const freshOutput = createOutputHandler(progress, projectDir);
+        const freshResult = await executeSingleStep(step, projectDir, {
+          timeout: stepTimeout, onOutput: freshOutput,
+        });
+        result = {
+          ...freshResult,
+          attempts: (result.attempts || 0) + (freshResult.attempts || 0),
+          cost: sumCosts(result.cost, freshResult.cost),
+        };
+        // Branch guard after Tier 3
+        await ensureOnBranch(state.runBranch);
+        if (result.status === 'completed') {
+          info(`Step ${stepNumber} succeeded on fresh retry`);
+        } else {
+          warn(`Step ${stepNumber} failed on all 3 tiers — recording as failed`);
+        }
+      } else {
+        warn(`Step ${stepNumber} prod hit rate limit — recording as failed`);
+      }
+    }
+    // Branch guard: final check before writing state
+    await ensureOnBranch(state.runBranch);
+    // Update state — remove any previous failed entry for this step (retry scenario)
+    const prevFailIdx = state.failedSteps.findIndex(s => s.number === step.number);
+    if (prevFailIdx !== -1) {
+      info(`Orchestrator: step ${stepNumber} previously failed — recording retry result`);
+      state.failedSteps.splice(prevFailIdx, 1);
+    }
+    const output = (result.output || '').slice(0, 6000);
+    const stepError = result.status === 'failed' ? (result.error || 'Step failed during orchestrated run') : null;
+    const entry = { number: step.number, name: step.name, status: result.status, duration: result.duration, attempts: result.attempts, output, error: stepError, cost: result.cost || null, suspiciousFast: result.suspiciousFast || false, errorType: result.errorType || null, retryAfterMs: result.retryAfterMs || null };
+    if (result.status === 'completed') {
+      state.completedSteps.push(entry);
+    } else if (result.status === 'skipped') {
+      if (!state.skippedSteps) state.skippedSteps = [];
+      state.skippedSteps.push(entry);
+    } else {
+      state.failedSteps.push(entry);
+    }
+    writeState(projectDir, state);
+    // Update progress after step completes (clear output)
+    const finalProgress = buildProgressState(state);
+    delete finalProgress.currentStepOutput;
+    writeProgress(projectDir, finalProgress);
+    // Compute remaining
+    const doneNums = new Set([...state.completedSteps.map(s => s.number), ...state.failedSteps.map(s => s.number), ...(state.skippedSteps || []).map(s => s.number)]);
+    const remaining = state.selectedSteps.filter(n => !doneNums.has(n));
+    return ok({
+      step: stepNumber,
+      name: step.name,
+      status: result.status,
+      output,
+      error: stepError,
+      duration: result.duration,
+      durationFormatted: formatDuration(result.duration),
+      attempts: result.attempts,
+      costUSD: result.cost?.costUSD ?? null,
+      inputTokens: result.cost?.inputTokens ?? null,
+      outputTokens: result.cost?.outputTokens ?? null,
+      suspiciousFast: result.suspiciousFast || false,
+      errorType: result.errorType || null,
+      retryAfterMs: result.retryAfterMs || null,
+      remainingSteps: remaining,
+    });
+  } catch (err) {
+    return fail(err.message);
+  }
+}
+/**
+ * @typedef {Object} FinishRunResult
+ * @property {boolean} success
+ * @property {string} [error]
+ * @property {number} [completed]
+ * @property {number} [failed]
+ * @property {number} [skipped]
+ * @property {string} [totalDurationFormatted]
+ * @property {number|null} [totalCostUSD]
+ * @property {number|null} [totalInputTokens]
+ * @property {number|null} [totalOutputTokens]
+ * @property {number|null} [finishCostUSD]
+ * @property {number|null} [finishInputTokens]
+ * @property {number|null} [finishOutputTokens]
+ * @property {number} [finishDuration]
+ * @property {boolean} [merged]
+ * @property {boolean} [mergeConflict]
+ * @property {string} [reportPath]
+ * @property {string} [tagName]
+ * @property {string} [runBranch]
+ */
+/**
+ * Finish an orchestrated run.
+ *
+ * Generates narrated changelog and action plan (2 AI calls with output
+ * streaming to progress JSON), then generates report, commits, merges back
+ * to original branch, and cleans up state.
+ *
+ * @param {string} projectDir - Target project directory
+ * @returns {Promise<FinishRunResult>} Result object (never throws)
+ */
+export async function finishRun(projectDir) {
+  try {
+    initLogger(projectDir, { quiet: true });
+    const state = readState(projectDir);
+    if (!state) {
+      return fail('No active orchestrator run. Nothing to finish.');
+    }
+    initGit(projectDir);
+    info('Orchestrator: finishing run');
+    const executionResults = buildExecutionResults(state);
+    const totalDuration = Date.now() - state.startTime;
+    // Sum step costs
+    const stepsCostUSD = executionResults.results.reduce((sum, r) => sum + (r.cost?.costUSD || 0), 0);
+    const stepsInputTokens = executionResults.results.reduce((sum, r) => sum + (r.cost?.inputTokens || 0), 0) || null;
+    const stepsOutputTokens = executionResults.results.reduce((sum, r) => sum + (r.cost?.outputTokens || 0), 0) || null;
+    // Build unique report filename (numbered + timestamped)
+    const { reportFile } = buildReportNames(projectDir, state.startTime);
+    // ── Single AI call for report generation ──
+    const finishStart = Date.now();
+    // Build progress state with virtual "Final Report" step
+    const progress = buildProgressState(state);
+    progress.steps.push({ number: 0, name: 'Final Report', status: 'running', duration: null });
+    progress.currentStepIndex = state.selectedSteps.length;
+    progress.currentStepName = 'Final Report';
+    writeProgress(projectDir, progress);
+    const onOutput = createOutputHandler(progress, projectDir);
+    // Build metadata for pre-built report sections
+    const metadata = {
+      projectDir,
+      branchName: state.runBranch,
+      tagName: state.tagName,
+      originalBranch: state.originalBranch,
+      startTime: state.startTime,
+      endTime: Date.now(),
+      totalCostUSD: stepsCostUSD || null,
+      totalInputTokens: stepsInputTokens,
+      totalOutputTokens: stepsOutputTokens,
+    };
+    // Generate report in a single fresh Claude session (like other steps)
+    info('Generating report (narration + action plan)...');
+    const reportPrompt = buildReportPrompt(executionResults, metadata, { reportFile });
+    const reportResult = await runPrompt(SAFETY_PREAMBLE + reportPrompt, projectDir, {
+      label: 'Report generation',
+      timeout: state.timeout || undefined,
+      onOutput,
+    });
+    let finishCost = reportResult.cost || null;
+    const finishDuration = Date.now() - finishStart;
+    // Verify the report file was created correctly
+    const reportPath = path.join(projectDir, reportFile);
+    let reportOk = false;
+    try {
+      if (existsSync(reportPath)) {
+        const content = readFileSync(reportPath, 'utf8');
+        reportOk = verifyReportContent(content, metadata);
+      }
+    } catch { /* verification failed */ }
+    // Fallback: generate report via JS template if AI failed
+    if (!reportOk) {
+      warn('AI report generation failed or produced invalid output — using template fallback');
+      generateReport(executionResults, null, metadata, { reportFile, skipClaudeMdUpdate: true });
+    }
+    // Update progress: mark finish step as completed
+    const lastStep = progress.steps[progress.steps.length - 1];
+    lastStep.status = 'completed';
+    lastStep.duration = finishDuration;
+    delete progress.currentStepOutput;
+    writeProgress(projectDir, progress);
+    // Include finish-phase costs in totals
+    const totalCostUSD = (stepsCostUSD || 0) + (finishCost?.costUSD || 0) || null;
+    const totalInputTokens = (stepsInputTokens || 0) + (finishCost?.inputTokens || 0) || null;
+    const totalOutputTokens = (stepsOutputTokens || 0) + (finishCost?.outputTokens || 0) || null;
+    // Always update CLAUDE.md via JS (not AI)
+    updateClaudeMd(metadata);
+    // Commit report + CLAUDE.md (if not already committed by Claude)
+    const gitInstance = getGitInstance();
+    try {
+      const filesToCommit = [reportFile, 'CLAUDE.md'];
+      await gitInstance.add(filesToCommit);
+      await gitInstance.commit('NightyTidy: Add run report and update CLAUDE.md');
+    } catch (err) {
+      warn(`Failed to commit report: ${err.message}`);
+    }
+    // Read report content for embedding in response (avoids fragile file-read API in GUI)
+    let reportContent = null;
+    try { reportContent = readFileSync(path.join(projectDir, reportFile), 'utf-8'); } catch { /* merge will bring file back */ }
+    // Merge
+    const mergeResult = await mergeRunBranch(state.originalBranch, state.runBranch);
+    // Update progress to completed status before cleanup
+    const finalProgress = buildProgressState(state);
+    finalProgress.status = 'completed';
+    writeProgress(projectDir, finalProgress);
+    // Stop dashboard server and clean up
+    stopDashboardServer(state.dashboardPid);
+    await new Promise(resolve => setTimeout(resolve, SSE_FLUSH_DELAY));
+    cleanupDashboard(projectDir);
+    releaseLock(projectDir);
+    deleteState(projectDir);
+    const skippedStr = (executionResults.skippedCount || 0) > 0 ? `, ${executionResults.skippedCount} skipped` : '';
+    const completionMsg = mergeResult.success
+      ? `Run complete: ${executionResults.completedCount} completed, ${executionResults.failedCount} failed${skippedStr}.`
+      : `Run complete but merge needs attention. Changes on branch: ${state.runBranch}`;
+    notify('NightyTidy Complete', completionMsg);
+    info(`Orchestrator finish complete: ${executionResults.completedCount} completed, ${executionResults.failedCount} failed${skippedStr}`);
+    return ok({
+      completed: executionResults.completedCount,
+      failed: executionResults.failedCount,
+      skipped: executionResults.skippedCount || 0,
+      totalDurationFormatted: formatDuration(totalDuration),
+      totalCostUSD,
+      totalInputTokens,
+      totalOutputTokens,
+      finishCostUSD: finishCost?.costUSD ?? null,
+      finishInputTokens: finishCost?.inputTokens ?? null,
+      finishOutputTokens: finishCost?.outputTokens ?? null,
+      finishDuration,
+      merged: mergeResult.success,
+      mergeConflict: mergeResult.conflict || false,
+      reportPath: reportFile,
+      reportContent,
+      tagName: state.tagName,
+      runBranch: state.runBranch,
+    });
+  } catch (err) {
+    return fail(err.message);
+  }
+}