npm - @nathapp/nax - Versions diffs - 0.18.1 - Mend

@nathapp/nax 0.18.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (459) hide show

package/.gitlab-ci.yml +96 -0
package/BRIEF.md +140 -0
package/CHANGELOG.md +60 -0
package/CLAUDE.md +159 -0
package/README.md +373 -0
package/US-007-IMPLEMENTATION.md +139 -0
package/bin/nax.ts +930 -0
package/biome.json +14 -0
package/bun.lock +168 -0
package/bunfig.toml +11 -0
package/docs/20260216-fix-plan-context-review.md +56 -0
package/docs/20260216-relentless-vs-ngent-comparison.md +208 -0
package/docs/20260216-v02-plan.md +136 -0
package/docs/20260216-v02-review.md +685 -0
package/docs/20260217-dogfood-findings.md +56 -0
package/docs/20260217-p2-plus-plan.md +117 -0
package/docs/20260217-partial-fixes-plan.md +62 -0
package/docs/20260217-plan-analyze-spec.md +117 -0
package/docs/20260217-post-impl-review.md +1137 -0
package/docs/20260217-quick-wins-plan.md +66 -0
package/docs/20260217-split-runner-plan.md +75 -0
package/docs/20260217-v03-impl-plan.md +80 -0
package/docs/20260217-v03-post-impl-review.md +589 -0
package/docs/20260217-v04-impl-plan.md +86 -0
package/docs/20260217-v05-post-impl-review.md +850 -0
package/docs/20260217-v06-post-impl-review.md +817 -0
package/docs/20260218-adr003-port-plan.md +151 -0
package/docs/20260218-review-adr003-verification.md +175 -0
package/docs/20260219-fix-plan-bug16-19.md +79 -0
package/docs/20260219-fix-plan-bug20-22.md +114 -0
package/docs/20260219-plan-llm-routing.md +116 -0
package/docs/20260219-review-bug20-22-fixes.md +135 -0
package/docs/20260219-routing-baseline-keyword.md +63 -0
package/docs/20260220-plan-structured-logging-p1.md +80 -0
package/docs/20260220-plan-structured-logging-p2.md +37 -0
package/docs/20260220-review-llm-routing.md +180 -0
package/docs/20260220-review-post-fix-llm-routing.md +70 -0
package/docs/20260221-fix-plan-relevantfiles-split.md +101 -0
package/docs/20260221-fix-plan-routing-mode.md +125 -0
package/docs/20260221-review-v0.9-implementation.md +379 -0
package/docs/20260222-fix-plan-v091-routing-isolation.md +197 -0
package/docs/20260223-fix-plan-prompt-audit.md +62 -0
package/docs/20260224-nax-roadmap-phases.md +189 -0
package/docs/20260225-phase2-llm-service-layer.md +401 -0
package/docs/20260225-review-v0.10.1.md +187 -0
package/docs/20260303-v010-implementation-plan.md +165 -0
package/docs/CLAUDE.md.bak +191 -0
package/docs/ROADMAP.md +165 -0
package/docs/SPEC-rectification.md +0 -0
package/docs/SPEC.md +324 -0
package/docs/US-001-plugin-loading-verification.md +152 -0
package/docs/architecture-analysis.md +1076 -0
package/docs/bugs/BUG-21-escalation-null-attempts.md +48 -0
package/docs/bugs-from-dogfood-run-c.md +243 -0
package/docs/code-review-20260228.md +612 -0
package/docs/code-review-v0.15.0.md +629 -0
package/docs/hook-lifecycle-test-plan.md +149 -0
package/docs/releases/v0.11.0-and-earlier.md +20 -0
package/docs/releases/v0.12.0.md +15 -0
package/docs/releases/v0.13.0.md +14 -0
package/docs/releases/v0.14.0.md +20 -0
package/docs/releases/v0.14.1.md +36 -0
package/docs/releases/v0.14.2.md +51 -0
package/docs/releases/v0.14.3.md +174 -0
package/docs/releases/v0.14.4.md +94 -0
package/docs/releases/v0.15.0.md +502 -0
package/docs/releases/v0.15.1.md +170 -0
package/docs/releases/v0.15.3.md +193 -0
package/docs/specs/status-file-v0.10.1.md +812 -0
package/docs/v0.10-global-config.md +206 -0
package/docs/v0.10-plugin-system.md +415 -0
package/docs/v0.10-prompt-optimizer.md +234 -0
package/docs/v0.3-spec.md +244 -0
package/docs/v0.4-spec.md +140 -0
package/docs/v0.5-spec.md +237 -0
package/docs/v0.6-spec.md +371 -0
package/docs/v0.7-spec.md +177 -0
package/docs/v0.8-llm-routing.md +206 -0
package/docs/v0.8-structured-logging.md +132 -0
package/docs/v0.9.3-prompt-audit.md +112 -0
package/examples/plugins/console-reporter/index.test.ts +207 -0
package/examples/plugins/console-reporter/index.ts +110 -0
package/nax/config.json +147 -0
package/nax/features/bugfix-v0171/prd.json +52 -0
package/nax/features/config-management/prd.json +108 -0
package/nax/features/config-management/progress.txt +5 -0
package/nax/features/diagnose/acceptance.test.ts +412 -0
package/nax/features/diagnose/prd.json +41 -0
package/nax/features/orchestration-fixes/prd.json +89 -0
package/nax/features/orchestration-fixes/progress.txt +1 -0
package/nax/features/plugin-integration/US-007-VERIFICATION.md +259 -0
package/nax/features/plugin-integration/prd.json +208 -0
package/nax/features/plugin-integration/progress.txt +5 -0
package/nax/features/precheck/prd.json +205 -0
package/nax/features/precheck/progress.txt +15 -0
package/nax/features/structured-logging/prd.json +199 -0
package/nax/features/unlock/prd.json +36 -0
package/package.json +47 -0
package/src/acceptance/fix-generator.ts +348 -0
package/src/acceptance/generator.ts +282 -0
package/src/acceptance/index.ts +30 -0
package/src/acceptance/types.ts +79 -0
package/src/agents/claude-decompose.ts +169 -0
package/src/agents/claude-plan.ts +139 -0
package/src/agents/claude.ts +324 -0
package/src/agents/cost.ts +268 -0
package/src/agents/index.ts +13 -0
package/src/agents/registry.ts +48 -0
package/src/agents/types-extended.ts +133 -0
package/src/agents/types.ts +113 -0
package/src/agents/validation.ts +69 -0
package/src/analyze/classifier.ts +305 -0
package/src/analyze/index.ts +16 -0
package/src/analyze/scanner.ts +175 -0
package/src/analyze/types.ts +51 -0
package/src/cli/accept.ts +108 -0
package/src/cli/analyze-parser.ts +284 -0
package/src/cli/analyze.ts +207 -0
package/src/cli/config.ts +561 -0
package/src/cli/constitution.ts +109 -0
package/src/cli/diagnose-analysis.ts +159 -0
package/src/cli/diagnose-formatter.ts +87 -0
package/src/cli/diagnose.ts +203 -0
package/src/cli/generate.ts +127 -0
package/src/cli/index.ts +37 -0
package/src/cli/init.ts +188 -0
package/src/cli/interact.ts +295 -0
package/src/cli/plan.ts +198 -0
package/src/cli/plugins.ts +111 -0
package/src/cli/prompts.ts +295 -0
package/src/cli/runs.ts +174 -0
package/src/cli/status-cost.ts +151 -0
package/src/cli/status-features.ts +338 -0
package/src/cli/status.ts +13 -0
package/src/commands/common.ts +171 -0
package/src/commands/diagnose.ts +17 -0
package/src/commands/index.ts +8 -0
package/src/commands/logs.ts +384 -0
package/src/commands/precheck.ts +86 -0
package/src/commands/unlock.ts +96 -0
package/src/config/defaults.ts +160 -0
package/src/config/index.ts +22 -0
package/src/config/loader.ts +121 -0
package/src/config/merger.ts +147 -0
package/src/config/path-security.ts +121 -0
package/src/config/paths.ts +27 -0
package/src/config/schema.ts +56 -0
package/src/config/schemas.ts +286 -0
package/src/config/types.ts +423 -0
package/src/config/validate.ts +103 -0
package/src/constitution/generator.ts +191 -0
package/src/constitution/generators/aider.ts +41 -0
package/src/constitution/generators/claude.ts +35 -0
package/src/constitution/generators/cursor.ts +36 -0
package/src/constitution/generators/opencode.ts +38 -0
package/src/constitution/generators/types.ts +33 -0
package/src/constitution/generators/windsurf.ts +36 -0
package/src/constitution/index.ts +10 -0
package/src/constitution/loader.ts +133 -0
package/src/constitution/types.ts +31 -0
package/src/context/auto-detect.ts +227 -0
package/src/context/builder.ts +246 -0
package/src/context/elements.ts +83 -0
package/src/context/formatter.ts +107 -0
package/src/context/generator.ts +129 -0
package/src/context/generators/aider.ts +34 -0
package/src/context/generators/claude.ts +28 -0
package/src/context/generators/cursor.ts +28 -0
package/src/context/generators/opencode.ts +30 -0
package/src/context/generators/windsurf.ts +28 -0
package/src/context/greenfield.ts +114 -0
package/src/context/index.ts +33 -0
package/src/context/injector.ts +279 -0
package/src/context/test-scanner.ts +370 -0
package/src/context/types.ts +98 -0
package/src/errors.ts +67 -0
package/src/execution/batching.ts +157 -0
package/src/execution/crash-recovery.ts +373 -0
package/src/execution/escalation/escalation.ts +44 -0
package/src/execution/escalation/index.ts +13 -0
package/src/execution/escalation/tier-escalation.ts +295 -0
package/src/execution/escalation/tier-outcome.ts +158 -0
package/src/execution/helpers.ts +38 -0
package/src/execution/index.ts +45 -0
package/src/execution/lifecycle/acceptance-loop.ts +272 -0
package/src/execution/lifecycle/headless-formatter.ts +85 -0
package/src/execution/lifecycle/index.ts +12 -0
package/src/execution/lifecycle/parallel-lifecycle.ts +101 -0
package/src/execution/lifecycle/precheck-runner.ts +140 -0
package/src/execution/lifecycle/run-cleanup.ts +81 -0
package/src/execution/lifecycle/run-completion.ts +129 -0
package/src/execution/lifecycle/run-initialization.ts +141 -0
package/src/execution/lifecycle/run-lifecycle.ts +312 -0
package/src/execution/lifecycle/run-setup.ts +204 -0
package/src/execution/lifecycle/story-hooks.ts +38 -0
package/src/execution/lifecycle/story-size-prompts.ts +123 -0
package/src/execution/lock.ts +115 -0
package/src/execution/parallel-executor.ts +216 -0
package/src/execution/parallel.ts +400 -0
package/src/execution/pid-registry.ts +280 -0
package/src/execution/pipeline-result-handler.ts +388 -0
package/src/execution/post-verify-rectification.ts +188 -0
package/src/execution/post-verify.ts +274 -0
package/src/execution/progress.ts +25 -0
package/src/execution/prompts.ts +127 -0
package/src/execution/queue-handler.ts +109 -0
package/src/execution/rectification.ts +13 -0
package/src/execution/runner.ts +377 -0
package/src/execution/sequential-executor.ts +388 -0
package/src/execution/status-file.ts +264 -0
package/src/execution/status-writer.ts +139 -0
package/src/execution/story-context.ts +229 -0
package/src/execution/test-output-parser.ts +14 -0
package/src/execution/verification.ts +72 -0
package/src/hooks/index.ts +2 -0
package/src/hooks/runner.ts +286 -0
package/src/hooks/types.ts +67 -0
package/src/interaction/chain.ts +154 -0
package/src/interaction/index.ts +60 -0
package/src/interaction/init.ts +83 -0
package/src/interaction/plugins/auto.ts +217 -0
package/src/interaction/plugins/cli.ts +300 -0
package/src/interaction/plugins/telegram.ts +384 -0
package/src/interaction/plugins/webhook.ts +258 -0
package/src/interaction/state.ts +171 -0
package/src/interaction/triggers.ts +229 -0
package/src/interaction/types.ts +163 -0
package/src/logger/formatters.ts +84 -0
package/src/logger/index.ts +16 -0
package/src/logger/logger.ts +298 -0
package/src/logger/types.ts +48 -0
package/src/logging/formatter.ts +355 -0
package/src/logging/index.ts +22 -0
package/src/logging/types.ts +93 -0
package/src/metrics/aggregator.ts +190 -0
package/src/metrics/index.ts +14 -0
package/src/metrics/tracker.ts +200 -0
package/src/metrics/types.ts +109 -0
package/src/optimizer/index.ts +62 -0
package/src/optimizer/noop.optimizer.ts +24 -0
package/src/optimizer/rule-based.optimizer.ts +248 -0
package/src/optimizer/types.ts +53 -0
package/src/pipeline/events.ts +130 -0
package/src/pipeline/index.ts +19 -0
package/src/pipeline/runner.ts +161 -0
package/src/pipeline/stages/acceptance.ts +197 -0
package/src/pipeline/stages/completion.ts +99 -0
package/src/pipeline/stages/constitution.ts +63 -0
package/src/pipeline/stages/context.ts +117 -0
package/src/pipeline/stages/execution.ts +194 -0
package/src/pipeline/stages/index.ts +62 -0
package/src/pipeline/stages/optimizer.ts +74 -0
package/src/pipeline/stages/prompt.ts +57 -0
package/src/pipeline/stages/queue-check.ts +103 -0
package/src/pipeline/stages/review.ts +181 -0
package/src/pipeline/stages/routing.ts +81 -0
package/src/pipeline/stages/verify.ts +100 -0
package/src/pipeline/types.ts +167 -0
package/src/plugins/index.ts +31 -0
package/src/plugins/loader.ts +287 -0
package/src/plugins/registry.ts +168 -0
package/src/plugins/types.ts +327 -0
package/src/plugins/validator.ts +352 -0
package/src/prd/index.ts +172 -0
package/src/prd/types.ts +202 -0
package/src/precheck/checks-blockers.ts +391 -0
package/src/precheck/checks-warnings.ts +142 -0
package/src/precheck/checks.ts +30 -0
package/src/precheck/index.ts +247 -0
package/src/precheck/story-size-gate.ts +144 -0
package/src/precheck/types.ts +31 -0
package/src/queue/index.ts +2 -0
package/src/queue/manager.ts +254 -0
package/src/queue/types.ts +54 -0
package/src/review/index.ts +8 -0
package/src/review/runner.ts +172 -0
package/src/review/types.ts +66 -0
package/src/routing/builder.ts +81 -0
package/src/routing/chain.ts +74 -0
package/src/routing/index.ts +16 -0
package/src/routing/loader.ts +58 -0
package/src/routing/router.ts +303 -0
package/src/routing/strategies/adaptive.ts +215 -0
package/src/routing/strategies/index.ts +8 -0
package/src/routing/strategies/keyword.ts +163 -0
package/src/routing/strategies/llm-prompts.ts +209 -0
package/src/routing/strategies/llm.ts +235 -0
package/src/routing/strategies/manual.ts +50 -0
package/src/routing/strategy.ts +99 -0
package/src/tdd/cleanup.ts +111 -0
package/src/tdd/index.ts +23 -0
package/src/tdd/isolation.ts +123 -0
package/src/tdd/orchestrator.ts +383 -0
package/src/tdd/prompts.ts +270 -0
package/src/tdd/rectification-gate.ts +183 -0
package/src/tdd/session-runner.ts +179 -0
package/src/tdd/types.ts +81 -0
package/src/tdd/verdict.ts +271 -0
package/src/tui/App.tsx +265 -0
package/src/tui/components/AgentPanel.tsx +75 -0
package/src/tui/components/CostOverlay.tsx +118 -0
package/src/tui/components/HelpOverlay.tsx +107 -0
package/src/tui/components/StatusBar.tsx +63 -0
package/src/tui/components/StoriesPanel.tsx +177 -0
package/src/tui/hooks/useKeyboard.ts +142 -0
package/src/tui/hooks/useLayout.ts +137 -0
package/src/tui/hooks/usePipelineEvents.ts +183 -0
package/src/tui/hooks/usePty.ts +194 -0
package/src/tui/index.tsx +38 -0
package/src/tui/types.ts +76 -0
package/src/utils/git.ts +83 -0
package/src/utils/queue-writer.ts +54 -0
package/src/verification/executor.ts +235 -0
package/src/verification/gate.ts +207 -0
package/src/verification/index.ts +12 -0
package/src/verification/parser.ts +230 -0
package/src/verification/rectification.ts +108 -0
package/src/verification/types.ts +113 -0
package/src/worktree/dispatcher.ts +65 -0
package/src/worktree/index.ts +2 -0
package/src/worktree/manager.ts +187 -0
package/src/worktree/merge.ts +301 -0
package/src/worktree/types.ts +4 -0
package/test/TEST_COVERAGE_US001.md +217 -0
package/test/TEST_COVERAGE_US003.md +84 -0
package/test/TEST_COVERAGE_US005.md +86 -0
package/test/US-002-orchestrator.test.ts +246 -0
package/test/acceptance/cm-003-default-view.test.ts +194 -0
package/test/execution/pid-registry.test.ts +240 -0
package/test/execution/post-verify.test.ts +224 -0
package/test/helpers/timeout.ts +42 -0
package/test/integration/US-002-TEST-SUMMARY.md +107 -0
package/test/integration/US-003-TEST-SUMMARY.md +149 -0
package/test/integration/US-004-TEST-SUMMARY.md +106 -0
package/test/integration/US-005-TEST-SUMMARY.md +138 -0
package/test/integration/US-007-TEST-SUMMARY.md +100 -0
package/test/integration/agent-validation.test.ts +439 -0
package/test/integration/analyze-integration.test.ts +261 -0
package/test/integration/analyze-scanner.test.ts +131 -0
package/test/integration/cli-config-default-edge-cases.test.ts +222 -0
package/test/integration/cli-config-default-view.test.ts +229 -0
package/test/integration/cli-config-diff.test.ts +460 -0
package/test/integration/cli-config.test.ts +736 -0
package/test/integration/cli-diagnose.test.ts +592 -0
package/test/integration/cli-logs.test.ts +314 -0
package/test/integration/cli-plugins.test.ts +678 -0
package/test/integration/cli-precheck.test.ts +371 -0
package/test/integration/cli-run-headless.test.ts +173 -0
package/test/integration/cli.test.ts +75 -0
package/test/integration/config/merger.test.ts +465 -0
package/test/integration/config/paths.test.ts +51 -0
package/test/integration/config-loader.test.ts +265 -0
package/test/integration/config.test.ts +444 -0
package/test/integration/context-integration.test.ts +702 -0
package/test/integration/context-provider-injection.test.ts +506 -0
package/test/integration/context-verification-integration.test.ts +295 -0
package/test/integration/e2e.test.ts +896 -0
package/test/integration/execution.test.ts +625 -0
package/test/integration/helpers.test.ts +295 -0
package/test/integration/hooks.test.ts +361 -0
package/test/integration/interaction-chain-pipeline.test.ts +464 -0
package/test/integration/isolation.test.ts +143 -0
package/test/integration/logger.test.ts +461 -0
package/test/integration/parallel.test.ts +250 -0
package/test/integration/path-security.test.ts +173 -0
package/test/integration/pipeline-acceptance.test.ts +302 -0
package/test/integration/pipeline-events.test.ts +475 -0
package/test/integration/pipeline.test.ts +658 -0
package/test/integration/plan.test.ts +157 -0
package/test/integration/plugin-routing.test.ts +921 -0
package/test/integration/plugins/config-integration.test.ts +172 -0
package/test/integration/plugins/config-resolution.test.ts +522 -0
package/test/integration/plugins/loader.test.ts +641 -0
package/test/integration/plugins/registry.test.ts +746 -0
package/test/integration/plugins/validator.test.ts +563 -0
package/test/integration/prd-pause.test.ts +205 -0
package/test/integration/prd-resolvers.test.ts +185 -0
package/test/integration/precheck-integration.test.ts +468 -0
package/test/integration/precheck.test.ts +805 -0
package/test/integration/progress.test.ts +34 -0
package/test/integration/rectification-flow.test.ts +512 -0
package/test/integration/reporter-lifecycle.test.ts +860 -0
package/test/integration/review-config-commands.test.ts +319 -0
package/test/integration/review-config-schema.test.ts +116 -0
package/test/integration/review-plugin-integration.test.ts +722 -0
package/test/integration/review.test.ts +149 -0
package/test/integration/routing-stage-bug-021.test.ts +274 -0
package/test/integration/routing-stage-greenfield.test.ts +286 -0
package/test/integration/runner-config-plugins.test.ts +461 -0
package/test/integration/runner-fixes.test.ts +399 -0
package/test/integration/runner-plugin-integration.test.ts +543 -0
package/test/integration/runner.test.ts +1679 -0
package/test/integration/s5-greenfield-fallback.test.ts +297 -0
package/test/integration/status-file-integration.test.ts +325 -0
package/test/integration/status-file.test.ts +379 -0
package/test/integration/status-writer.test.ts +345 -0
package/test/integration/story-id-in-events.test.ts +273 -0
package/test/integration/tdd-cleanup.test.ts +246 -0
package/test/integration/tdd-orchestrator.test.ts +1762 -0
package/test/integration/test-scanner.test.ts +403 -0
package/test/integration/verification-asset-check.test.ts +142 -0
package/test/integration/verify-stage.test.ts +275 -0
package/test/integration/worktree/manager.test.ts +218 -0
package/test/integration/worktree/merge.test.ts +341 -0
package/test/manual/logging-formatter-demo.ts +158 -0
package/test/ui/tui-agent-panel.test.tsx +99 -0
package/test/ui/tui-controls.test.ts +334 -0
package/test/ui/tui-cost-and-pty.test.ts +189 -0
package/test/ui/tui-layout.test.ts +378 -0
package/test/ui/tui-pty-integration.test.tsx +159 -0
package/test/ui/tui-stories.test.ts +332 -0
package/test/unit/acceptance.test.ts +186 -0
package/test/unit/agent-stderr-capture.test.ts +146 -0
package/test/unit/analyze-classifier.test.ts +215 -0
package/test/unit/analyze.test.ts +224 -0
package/test/unit/auto-detect.test.ts +249 -0
package/test/unit/cli-status.test.ts +417 -0
package/test/unit/commands/common.test.ts +320 -0
package/test/unit/commands/logs.test.ts +416 -0
package/test/unit/commands/unlock.test.ts +319 -0
package/test/unit/constitution-generators.test.ts +160 -0
package/test/unit/constitution.test.ts +209 -0
package/test/unit/context.test.ts +1722 -0
package/test/unit/cost.test.ts +231 -0
package/test/unit/crash-recovery.test.ts +308 -0
package/test/unit/escalation.test.ts +126 -0
package/test/unit/execution-logging-stderr.test.ts +156 -0
package/test/unit/execution-stage.test.ts +122 -0
package/test/unit/fix-generator.test.ts +275 -0
package/test/unit/formatters.test.ts +469 -0
package/test/unit/greenfield.test.ts +179 -0
package/test/unit/helpers.test.ts +317 -0
package/test/unit/interaction/human-review-trigger.test.ts +164 -0
package/test/unit/interaction-network-failures.test.ts +389 -0
package/test/unit/interaction-plugins.test.ts +164 -0
package/test/unit/isolation.test.ts +134 -0
package/test/unit/logging/formatter.test.ts +455 -0
package/test/unit/merge.test.ts +268 -0
package/test/unit/metrics.test.ts +276 -0
package/test/unit/optimizer/noop.optimizer.test.ts +125 -0
package/test/unit/optimizer/rule-based.optimizer.test.ts +358 -0
package/test/unit/prd-auto-default.test.ts +290 -0
package/test/unit/prd-failure-category.test.ts +176 -0
package/test/unit/prd-get-next-story.test.ts +186 -0
package/test/unit/precheck-checks.test.ts +840 -0
package/test/unit/precheck-story-size-gate.test.ts +287 -0
package/test/unit/precheck-types.test.ts +142 -0
package/test/unit/prompts.test.ts +475 -0
package/test/unit/queue.test.ts +237 -0
package/test/unit/rectification.test.ts +284 -0
package/test/unit/registry.test.ts +287 -0
package/test/unit/routing.test.ts +937 -0
package/test/unit/run-lifecycle.test.ts +140 -0
package/test/unit/storyid-events.test.ts +224 -0
package/test/unit/tdd-verdict.test.ts +492 -0
package/test/unit/test-output-parser.test.ts +377 -0
package/test/unit/verdict.test.ts +324 -0
package/test/unit/worktree-manager.test.ts +158 -0
package/tsconfig.json +27 -0

package/test/integration/tdd-orchestrator.test.ts ADDED Viewed

@@ -0,0 +1,1762 @@
+import { afterEach, beforeEach, describe, expect, mock, test } from "bun:test";
+import { existsSync } from "node:fs";
+import { mkdir, rm, writeFile } from "node:fs/promises";
+import path from "node:path";
+import type { AgentAdapter, AgentResult } from "../../src/agents";
+import { DEFAULT_CONFIG } from "../../src/config";
+import type { UserStory } from "../../src/prd";
+import { runThreeSessionTdd } from "../../src/tdd/orchestrator";
+import { VERDICT_FILE } from "../../src/tdd/verdict";
+let originalSpawn: typeof Bun.spawn; // the real Bun.spawn, captured so mocks can delegate to it and be undone
+beforeEach(() => {
+  originalSpawn = Bun.spawn; // snapshot before each test, ahead of any mock being installed
+});
+afterEach(() => {
+  Bun.spawn = originalSpawn; // put the captured spawn back so a mock does not leak into the next test
+});
+/** Build a stub AgentAdapter whose run() replays `results` in call order, defaulting any field an entry omits */
+function createMockAgent(results: Partial<AgentResult>[]): AgentAdapter {
+  let nextIndex = 0;
+  // Every invocation consumes the next scripted entry; calls past the end of the list get an all-defaults result
+  const run: AgentAdapter["run"] = mock(async () => {
+    const scripted = results[nextIndex] || {};
+    nextIndex += 1;
+    const { success, exitCode, output, rateLimited, durationMs, estimatedCost } = scripted;
+    return {
+      success: success ?? true,
+      exitCode: exitCode ?? 0,
+      output: output ?? "",
+      rateLimited: rateLimited ?? false,
+      durationMs: durationMs ?? 100,
+      estimatedCost: estimatedCost ?? 0.01,
+    };
+  });
+  return {
+    name: "mock",
+    displayName: "Mock Agent",
+    binary: "mock",
+    isInstalled: async () => true,
+    buildCommand: () => ["mock"],
+    run,
+  };
+}
+/** Swap Bun.spawn for a mock that fakes shell test commands and git rev-parse/checkout/diff; any other command goes to the real spawn */
+function mockGitSpawn(opts: {
+  /** Changed-file lists handed out by successive git diff calls (entry N answers the Nth diff call) */
+  diffFiles: string[][];
+  /** Whether the faked test command succeeds; treated as true when omitted */
+  testCommandSuccess?: boolean;
+}) {
+  const shells = ["/bin/sh", "/bin/bash", "/bin/zsh"];
+  const testsPass = opts.testCommandSuccess ?? true;
+  let revParseCalls = 0;
+  let diffCalls = 0;
+  // Fake handle for a git command that exits 0 with the given stdout and an empty stderr
+  const gitOk = (out: string) => ({
+    exited: Promise.resolve(0),
+    stdout: new Response(out).body,
+    stderr: new Response("").body,
+  });
+  // @ts-ignore — mocking global
+  Bun.spawn = mock((cmd: string[], spawnOpts?: any) => {
+    // Test commands (bun test, npm test, etc.) arrive as `<shell> -c ...`
+    if (shells.includes(cmd[0]) && cmd[1] === "-c") {
+      return {
+        pid: 9999,
+        exited: Promise.resolve(testsPass ? 0 : 1),
+        stdout: new Response(testsPass ? "tests pass\n" : "tests fail\n").body,
+        stderr: new Response("").body,
+      };
+    }
+    if (cmd[0] !== "git") {
+      return originalSpawn(cmd, spawnOpts);
+    }
+    switch (cmd[1]) {
+      case "rev-parse": {
+        // Each call yields a fresh, numbered ref
+        revParseCalls += 1;
+        return gitOk(`ref-${revParseCalls}\n`);
+      }
+      case "checkout":
+        // git checkout (used in zero-file fallback) silently succeeds
+        return gitOk("");
+      case "diff": {
+        // Hand out the next scripted file list; an exhausted script means "no changes"
+        const changed = opts.diffFiles[diffCalls] || [];
+        diffCalls += 1;
+        return gitOk(`${changed.join("\n")}\n`);
+      }
+      default:
+        return originalSpawn(cmd, spawnOpts);
+    }
+  });
+}
+const story: UserStory = { // shared fixture: the pending story handed to runThreeSessionTdd in the tests below
+  id: "US-001",
+  title: "Add user validation",
+  description: "Add validation to user input",
+  acceptanceCriteria: ["Validation works", "Errors are clear"],
+  dependencies: [],
+  tags: [],
+  status: "pending",
+  passes: false,
+  escalations: [],
+  attempts: 0,
+};
+describe("runThreeSessionTdd", () => {
+  test("happy path: all 3 sessions succeed", async () => {
+    // Each session triggers: captureGitRef (rev-parse) + isolation check (git diff) + getChangedFiles (git diff)
+    // Session 1: test-writer → verifyTestWriterIsolation calls getChangedFiles (1 diff) + getChangedFiles for result (1 diff) = 2 diffs
+    // Session 2: implementer → verifyImplementerIsolation (1 diff) + getChangedFiles (1 diff) = 2 diffs
+    // Session 3: verifier → no isolation check + getChangedFiles (1 diff) = 1 diff
+    // But actually looking at the code: isolation + getChangedFiles share the same call in runTddSession
+    // isolation calls getChangedFiles internally, then runTddSession calls getChangedFiles separately
+    // Actually no — look at orchestrator.ts runTddSession:
+    //   1. verifyTestWriterIsolation (calls getChangedFiles) → 1 diff call
+    //   2. getChangedFiles → 1 diff call
+    // So per session with isolation: 2 diff calls. Without isolation (verifier): 1 diff call.
+    // Total: 2 + 2 + 1 = 5 diff calls
+    mockGitSpawn({
+      diffFiles: [
+        // Session 1 isolation check: test files only (OK)
+        ["test/user.test.ts"],
+        // Session 1 getChangedFiles
+        ["test/user.test.ts"],
+        // Session 2 isolation check: source files only (OK)
+        ["src/user.ts"],
+        // Session 2 getChangedFiles
+        ["src/user.ts"],
+        // Session 3 getChangedFiles (no isolation check for verifier)
+        ["src/user.ts"],
+      ],
+    });
+    const agent = createMockAgent([
+      { success: true, estimatedCost: 0.01 },
+      { success: true, estimatedCost: 0.02 },
+      { success: true, estimatedCost: 0.01 },
+    ]);
+    const result = await runThreeSessionTdd({
+      agent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(result.success).toBe(true);
+    expect(result.sessions).toHaveLength(3);
+    expect(result.sessions[0].role).toBe("test-writer");
+    expect(result.sessions[1].role).toBe("implementer");
+    expect(result.sessions[2].role).toBe("verifier");
+    expect(result.needsHumanReview).toBe(false);
+    expect(result.totalCost).toBe(0.04);
+  });
+  test("failure when test-writer session fails", async () => {
+    mockGitSpawn({
+      diffFiles: [["test/user.test.ts"], ["test/user.test.ts"]],
+    });
+    const agent = createMockAgent([{ success: false, exitCode: 1, estimatedCost: 0.01 }]);
+    const result = await runThreeSessionTdd({
+      agent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(result.success).toBe(false);
+    expect(result.sessions).toHaveLength(1);
+    expect(result.needsHumanReview).toBe(true);
+  });
+  test("failure when test-writer violates isolation", async () => {
+    mockGitSpawn({
+      diffFiles: [
+        // Isolation check: test-writer touched source files!
+        ["src/user.ts", "test/user.test.ts"],
+        // getChangedFiles
+        ["src/user.ts", "test/user.test.ts"],
+      ],
+    });
+    const agent = createMockAgent([{ success: true, estimatedCost: 0.01 }]);
+    const result = await runThreeSessionTdd({
+      agent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(result.success).toBe(false);
+    expect(result.sessions).toHaveLength(1);
+    expect(result.sessions[0].success).toBe(false);
+    expect(result.needsHumanReview).toBe(true);
+  });
+  test("failure when implementer session fails", async () => {
+    mockGitSpawn({
+      diffFiles: [
+        // Session 1 isolation: OK
+        ["test/user.test.ts"],
+        // Session 1 getChangedFiles
+        ["test/user.test.ts"],
+        // Session 2 isolation: OK
+        ["src/user.ts"],
+        // Session 2 getChangedFiles
+        ["src/user.ts"],
+      ],
+    });
+    const agent = createMockAgent([
+      { success: true, estimatedCost: 0.01 },
+      { success: false, exitCode: 1, estimatedCost: 0.02 },
+    ]);
+    const result = await runThreeSessionTdd({
+      agent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(result.success).toBe(false);
+    expect(result.sessions).toHaveLength(2);
+    expect(result.needsHumanReview).toBe(true);
+  });
+  test("implementer touching test files is a warning (soft-pass), not failure", async () => {
+    mockGitSpawn({
+      diffFiles: [
+        // Session 1 isolation: OK
+        ["test/user.test.ts"],
+        // Session 1 getChangedFiles
+        ["test/user.test.ts"],
+        // Session 2 isolation: implementer touched tests (warning, not violation)
+        ["test/user.test.ts", "src/user.ts"],
+        // Session 2 getChangedFiles
+        ["test/user.test.ts", "src/user.ts"],
+        // Session 3 isolation: OK
+        [],
+        // Session 3 getChangedFiles
+        [],
+      ],
+    });
+    const agent = createMockAgent([
+      { success: true, estimatedCost: 0.01 },
+      { success: true, estimatedCost: 0.02 },
+      { success: true, estimatedCost: 0.01 },
+    ]);
+    const result = await runThreeSessionTdd({
+      agent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    // v0.9.2: implementer touching test files is a warning, not a failure
+    expect(result.sessions).toHaveLength(3);
+    expect(result.sessions[1].success).toBe(true);
+    expect(result.sessions[1].isolation?.warnings).toContain("test/user.test.ts");
+    expect(result.success).toBe(true);
+  });
+  test("dry-run mode logs sessions without executing", async () => {
+    const agent = createMockAgent([]);
+    const result = await runThreeSessionTdd({
+      agent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+      dryRun: true,
+    });
+    expect(result.success).toBe(true);
+    expect(result.sessions).toHaveLength(0);
+    expect(result.needsHumanReview).toBe(false);
+    expect(result.totalCost).toBe(0);
+    // Agent should not have been called
+    expect(agent.run).not.toHaveBeenCalled();
+  });
+  test("dry-run mode works with context markdown", async () => {
+    // Same dry-run expectations as without context: nothing runs, nothing is billed.
+    const idleAgent = createMockAgent([]);
+    const { success, sessions, totalCost } = await runThreeSessionTdd({
+      agent: idleAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "powerful",
+      contextMarkdown: "## Dependencies\n- US-000: Setup database\n",
+      dryRun: true,
+    });
+    expect(success).toBe(true);
+    expect(sessions).toHaveLength(0);
+    expect(totalCost).toBe(0);
+    // The agent must never have been invoked.
+    expect(idleAgent.run).not.toHaveBeenCalled();
+  });
+  test("BUG-22: post-TDD verification overrides session failures when tests pass", async () => {
+    // Scenario: all three sessions run, but the verifier agent reports failure
+    // (non-zero exit code) while the mocked independent test command exits 0.
+    // Expected: the overall result is reported as successful.
+    let postTddTestsRan = false;
+    let refCounter = 0;
+    let diffIndex = 0;
+    // One entry is consumed per mocked `git diff` call, in call order.
+    const changedFilesPerDiff = [
+      ["test/user.test.ts"], // session 1 isolation
+      ["test/user.test.ts"], // session 1 getChangedFiles
+      ["src/user.ts"], // session 2 isolation
+      ["src/user.ts"], // session 2 getChangedFiles
+      ["src/user.ts"], // session 3 getChangedFiles
+    ];
+    // Process-like stub for a git command that exits 0 with the given stdout.
+    const gitProcess = (stdoutText: string) => ({
+      exited: Promise.resolve(0),
+      stdout: new Response(stdoutText).body,
+      stderr: new Response("").body,
+    });
+    // @ts-ignore — mocking global
+    Bun.spawn = mock((cmd: string[], spawnOpts?: any) => {
+      const [program, subcommand, script] = cmd;
+      // The post-TDD test command (bun test via /bin/sh) is made to pass.
+      if (program === "/bin/sh" && script?.includes("bun test")) {
+        postTddTestsRan = true;
+        return {
+          pid: 9999,
+          exited: Promise.resolve(0),
+          stdout: new Response("5 pass, 0 fail\n").body,
+          stderr: new Response("").body,
+        };
+      }
+      if (program === "git" && subcommand === "rev-parse") {
+        refCounter += 1;
+        return gitProcess(`ref-${refCounter}\n`);
+      }
+      if (program === "git" && subcommand === "diff") {
+        const changed = changedFilesPerDiff[diffIndex] || [];
+        diffIndex += 1;
+        return gitProcess(`${changed.join("\n")}\n`);
+      }
+      // Every other command is delegated to originalSpawn.
+      return originalSpawn(cmd, spawnOpts);
+    });
+    const scriptedAgent = createMockAgent([
+      { success: true, estimatedCost: 0.01 }, // test-writer succeeds
+      { success: true, estimatedCost: 0.02 }, // implementer succeeds
+      { success: false, exitCode: 1, estimatedCost: 0.01 }, // verifier fails (e.g., fixed issues)
+    ]);
+    const outcome = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    // The independent test run must have happened.
+    expect(postTddTestsRan).toBe(true);
+    expect(outcome.sessions).toHaveLength(3);
+    // The verifier session itself stays marked as failed...
+    expect(outcome.sessions[2].success).toBe(false);
+    // ...while the overall result is overridden to success with no review requested.
+    expect(outcome.success).toBe(true);
+    expect(outcome.needsHumanReview).toBe(false);
+    expect(outcome.reviewReason).toBeUndefined();
+  });
+  test("BUG-20: failure when test-writer creates no test files", async () => {
+    // Scenario: the test-writer session succeeds and passes isolation, yet the
+    // only changed files are non-test files (e.g. requirements.md).
+    // Expected: failure flagged for human review with a specific reason.
+    const nonTestFiles = ["requirements.md", "docs/plan.md"];
+    mockGitSpawn({
+      diffFiles: [
+        [...nonTestFiles], // isolation check: only non-test files
+        [...nonTestFiles], // getChangedFiles
+      ],
+    });
+    // test-writer succeeds but creates the wrong files
+    const scriptedAgent = createMockAgent([{ success: true, estimatedCost: 0.01 }]);
+    const { success, sessions, needsHumanReview, reviewReason } = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    // Execution stops after session 1.
+    expect(sessions).toHaveLength(1);
+    expect(needsHumanReview).toBe(true);
+    expect(reviewReason).toBe("Test writer session created no test files (greenfield project)");
+  });
+  test("BUG-20: failure when test-writer creates zero files", async () => {
+    // Scenario: the test-writer session succeeds but no files change at all.
+    // Expected: failure flagged for human review.
+    mockGitSpawn({
+      diffFiles: [
+        [], // isolation check: no files
+        [], // getChangedFiles: no files
+      ],
+    });
+    // test-writer succeeds but creates nothing
+    const scriptedAgent = createMockAgent([{ success: true, estimatedCost: 0.01 }]);
+    const { success, sessions, needsHumanReview, reviewReason } = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    expect(sessions).toHaveLength(1);
+    expect(needsHumanReview).toBe(true);
+    expect(reviewReason).toBe("Test writer session created no test files (greenfield project)");
+  });
+  test("BUG-20: success when test-writer creates test files with various extensions", async () => {
+    // Scenario: the test-writer produces test files with several valid extensions.
+    // Expected: the run continues past session 1 and all three sessions execute.
+    const writtenTests = ["test/user.test.ts", "test/auth.spec.js", "test/api.test.tsx"];
+    const implementedSources = ["src/user.ts", "src/auth.js"];
+    mockGitSpawn({
+      diffFiles: [
+        [...writtenTests], // session 1 isolation: various test file formats
+        [...writtenTests], // session 1 getChangedFiles
+        [...implementedSources], // session 2 isolation
+        [...implementedSources], // session 2 getChangedFiles
+        ["src/user.ts"], // session 3 getChangedFiles
+      ],
+    });
+    const scriptedAgent = createMockAgent([
+      { success: true, estimatedCost: 0.01 },
+      { success: true, estimatedCost: 0.02 },
+      { success: true, estimatedCost: 0.01 },
+    ]);
+    const { success, sessions, needsHumanReview } = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(success).toBe(true);
+    // All sessions run.
+    expect(sessions).toHaveLength(3);
+    expect(needsHumanReview).toBe(false);
+  });
+  test("BUG-22: post-TDD verification does not override when tests actually fail", async () => {
+    // Scenario: the verifier session fails AND the mocked independent test run exits 1.
+    // Expected: the overall result stays failed and asks for human review.
+    let postTddTestsRan = false;
+    let refCounter = 0;
+    let diffIndex = 0;
+    // One entry is consumed per mocked `git diff` call, in call order.
+    const changedFilesPerDiff = [
+      ["test/user.test.ts"],
+      ["test/user.test.ts"],
+      ["src/user.ts"],
+      ["src/user.ts"],
+      ["src/user.ts"],
+    ];
+    // Process-like stub for a git command that exits 0 with the given stdout.
+    const gitProcess = (stdoutText: string) => ({
+      exited: Promise.resolve(0),
+      stdout: new Response(stdoutText).body,
+      stderr: new Response("").body,
+    });
+    // @ts-ignore — mocking global
+    Bun.spawn = mock((cmd: string[], spawnOpts?: any) => {
+      const [program, subcommand, script] = cmd;
+      // The post-TDD test command (bun test via /bin/sh) is made to fail.
+      if (program === "/bin/sh" && script?.includes("bun test")) {
+        postTddTestsRan = true;
+        return {
+          pid: 9999,
+          exited: Promise.resolve(1),
+          stdout: new Response("3 pass, 2 fail\n").body,
+          stderr: new Response("Test errors...\n").body,
+        };
+      }
+      if (program === "git" && subcommand === "rev-parse") {
+        refCounter += 1;
+        return gitProcess(`ref-${refCounter}\n`);
+      }
+      if (program === "git" && subcommand === "diff") {
+        const changed = changedFilesPerDiff[diffIndex] || [];
+        diffIndex += 1;
+        return gitProcess(`${changed.join("\n")}\n`);
+      }
+      // Every other command is delegated to originalSpawn.
+      return originalSpawn(cmd, spawnOpts);
+    });
+    const scriptedAgent = createMockAgent([
+      { success: true, estimatedCost: 0.01 },
+      { success: true, estimatedCost: 0.02 },
+      { success: false, exitCode: 1, estimatedCost: 0.01 }, // verifier fails
+    ]);
+    const outcome = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(postTddTestsRan).toBe(true);
+    // The failure is not overridden and a review reason is supplied.
+    expect(outcome.success).toBe(false);
+    expect(outcome.needsHumanReview).toBe(true);
+    expect(outcome.reviewReason).toBeDefined();
+  });
+});
+// ─── Lite-mode prompt tests ───────────────────────────────────────────────────
+import {
+  buildImplementerLitePrompt,
+  buildImplementerPrompt,
+  buildTestWriterLitePrompt,
+  buildTestWriterPrompt,
+  buildVerifierPrompt,
+} from "../../src/tdd/prompts";
+describe("buildTestWriterLitePrompt", () => {
+  // Each case builds the lite test-writer prompt for the shared `story` fixture
+  // and checks the resulting text.
+  test("tells agent it CAN read source files", () => {
+    expect(buildTestWriterLitePrompt(story)).toContain("MAY read source files");
+  });
+  test("tells agent it CAN import from source files", () => {
+    expect(buildTestWriterLitePrompt(story)).toContain("MAY import from source files");
+  });
+  test("still instructs agent to only CREATE test files", () => {
+    const createOnlyTestsRule = /[Oo]nly\s+[Cc][Rr][Ee][Aa][Tt][Ee]\s+test files|CREATE test files/;
+    expect(buildTestWriterLitePrompt(story)).toMatch(createOnlyTestsRule);
+  });
+  test("does NOT say DO NOT create or modify any source files (strict isolation rule)", () => {
+    expect(buildTestWriterLitePrompt(story)).not.toContain("DO NOT create or modify any source files");
+  });
+  test("does NOT say ONLY create/modify test files (strict isolation rule)", () => {
+    expect(buildTestWriterLitePrompt(story)).not.toContain("ONLY create/modify test files");
+  });
+  test("includes story title and acceptance criteria", () => {
+    const litePrompt = buildTestWriterLitePrompt(story);
+    expect(litePrompt).toContain(story.title);
+    expect(litePrompt).toContain("Validation works");
+    expect(litePrompt).toContain("Errors are clear");
+  });
+  test("includes context markdown when provided", () => {
+    const litePrompt = buildTestWriterLitePrompt(story, "## Relevant Files\n- src/user.ts");
+    expect(litePrompt).toContain("## Relevant Files");
+    expect(litePrompt).toContain("src/user.ts");
+  });
+  test("does not include context separator when no context provided", () => {
+    // The prompt must not end with a dangling `---` separator.
+    const trailingSeparator = /---\s*$/;
+    expect(buildTestWriterLitePrompt(story)).not.toMatch(trailingSeparator);
+  });
+  test("uses lite mode label in heading", () => {
+    const lowered = buildTestWriterLitePrompt(story).toLowerCase();
+    expect(lowered).toContain("lite");
+  });
+});
+describe("buildImplementerLitePrompt", () => {
+  // Each case builds the lite implementer prompt for the shared `story` fixture
+  // and checks the resulting text.
+  test("has no file restriction rules (does not say Only create or modify files in the test/ directory)", () => {
+    expect(buildImplementerLitePrompt(story)).not.toContain("Only create or modify files in the test/ directory");
+  });
+  test("has no file restriction rules (does not say Implement source code in src/ to make tests pass)", () => {
+    expect(buildImplementerLitePrompt(story)).not.toContain("Implement source code in src/ to make tests pass");
+  });
+  test("allows writing tests and implementing", () => {
+    expect(buildImplementerLitePrompt(story)).toContain("Write tests AND implement");
+  });
+  test("includes story title and acceptance criteria", () => {
+    const litePrompt = buildImplementerLitePrompt(story);
+    expect(litePrompt).toContain(story.title);
+    expect(litePrompt).toContain("Validation works");
+    expect(litePrompt).toContain("Errors are clear");
+  });
+  test("includes context markdown when provided", () => {
+    const litePrompt = buildImplementerLitePrompt(story, "## Context\n- Use existing patterns");
+    expect(litePrompt).toContain("## Context");
+    expect(litePrompt).toContain("Use existing patterns");
+  });
+  test("uses lite mode label in heading", () => {
+    const lowered = buildImplementerLitePrompt(story).toLowerCase();
+    expect(lowered).toContain("lite");
+  });
+  test("still instructs to make tests pass", () => {
+    const lowered = buildImplementerLitePrompt(story).toLowerCase();
+    expect(lowered).toContain("all tests must pass");
+  });
+});
+describe("buildVerifierPrompt (unchanged)", () => {
+  // Guards the verifier prompt text against changes made for lite mode.
+  test("is unchanged — still has isolation-focused verification rules", () => {
+    const verifierPrompt = buildVerifierPrompt(story);
+    const expectedFragments = [
+      "Session 3: Verify",
+      "Check if test files were modified by the implementer",
+      story.title,
+    ];
+    for (const fragment of expectedFragments) {
+      expect(verifierPrompt).toContain(fragment);
+    }
+  });
+  test("does NOT mention lite mode", () => {
+    const lowered = buildVerifierPrompt(story).toLowerCase();
+    expect(lowered).not.toContain("lite");
+  });
+  test("still verifies acceptance criteria", () => {
+    const verifierPrompt = buildVerifierPrompt(story);
+    for (const criterion of ["Validation works", "Errors are clear"]) {
+      expect(verifierPrompt).toContain(criterion);
+    }
+  });
+});
+describe("strict vs lite prompt comparison", () => {
+  // Each case checks that a phrase appears in exactly one of the two prompt variants.
+  test("strict test-writer has harder isolation rules than lite", () => {
+    const strictPrompt = buildTestWriterPrompt(story);
+    const litePrompt = buildTestWriterLitePrompt(story);
+    // Only the strict prompt restricts edits to the test/ directory.
+    const testDirOnlyRule = "Only create or modify files in the test/ directory";
+    expect(strictPrompt).toContain(testDirOnlyRule);
+    expect(litePrompt).not.toContain(testDirOnlyRule);
+    // Only the lite prompt permits creating minimal stubs in src/.
+    const stubAllowance = "You may create minimal stubs in src/";
+    expect(litePrompt).toContain(stubAllowance);
+    expect(strictPrompt).not.toContain(stubAllowance);
+  });
+  test("strict implementer has harder isolation rules than lite", () => {
+    const strictPrompt = buildImplementerPrompt(story);
+    const litePrompt = buildImplementerLitePrompt(story);
+    // Only the strict prompt forbids modifying test files.
+    const noTestEditsRule = "Do NOT modify test files";
+    expect(strictPrompt).toContain(noTestEditsRule);
+    expect(litePrompt).not.toContain(noTestEditsRule);
+    // Only the lite prompt asks for tests and implementation together.
+    const combinedInstruction = "Write tests AND implement";
+    expect(litePrompt).toContain(combinedInstruction);
+    expect(strictPrompt).not.toContain(combinedInstruction);
+  });
+});
+// ─── T4: Lite mode orchestration tests ───────────────────────────────────────
+describe("runThreeSessionTdd — lite mode", () => {
+  /** Mock agent scripted with three successful sessions (costs 0.01, 0.02, 0.01). */
+  const createPassingAgent = () =>
+    createMockAgent([
+      { success: true, estimatedCost: 0.01 },
+      { success: true, estimatedCost: 0.02 },
+      { success: true, estimatedCost: 0.01 },
+    ]);
+  /** Runs the orchestrator with the inputs shared by every case plus the per-test flags. */
+  const runTdd = (agent: ReturnType<typeof createMockAgent>, flags: { lite?: boolean; dryRun?: boolean }) =>
+    runThreeSessionTdd({
+      agent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+      ...flags,
+    });
+  test("lite mode: result includes lite=true flag", async () => {
+    // All three sessions succeed. Lite skips the isolation diff for sessions 1
+    // and 2, while the verifier (session 3) still runs it. Expected diff calls:
+    // 1 (s1 getChangedFiles) + 1 (s2 getChangedFiles) + 2 (s3) = 4.
+    mockGitSpawn({
+      diffFiles: [
+        ["test/user.test.ts"], // s1 getChangedFiles (no isolation in lite)
+        ["src/user.ts"], // s2 getChangedFiles (no isolation in lite)
+        [], // s3 isolation check (verifier always checks)
+        ["src/user.ts"], // s3 getChangedFiles
+      ],
+    });
+    const outcome = await runTdd(createPassingAgent(), { lite: true });
+    expect(outcome.lite).toBe(true);
+    expect(outcome.success).toBe(true);
+  });
+  test("strict mode: result includes lite=false flag", async () => {
+    mockGitSpawn({
+      diffFiles: [
+        ["test/user.test.ts"],
+        ["test/user.test.ts"],
+        ["src/user.ts"],
+        ["src/user.ts"],
+        [], // s3 isolation
+        ["src/user.ts"], // s3 getChangedFiles
+      ],
+    });
+    const outcome = await runTdd(createPassingAgent(), { lite: false });
+    expect(outcome.lite).toBe(false);
+    expect(outcome.success).toBe(true);
+  });
+  test("lite mode: test-writer session has no isolation check (isolation is undefined)", async () => {
+    mockGitSpawn({
+      diffFiles: [
+        ["test/user.test.ts"], // s1 getChangedFiles only (no isolation in lite)
+        ["src/user.ts"], // s2 getChangedFiles only (no isolation in lite)
+        [], // s3 isolation
+        ["src/user.ts"], // s3 getChangedFiles
+      ],
+    });
+    const { sessions } = await runTdd(createPassingAgent(), { lite: true });
+    expect(sessions).toHaveLength(3);
+    const [testWriter, implementer, verifier] = sessions;
+    // Test-writer and implementer skip isolation in lite mode...
+    expect(testWriter.isolation).toBeUndefined();
+    expect(implementer.isolation).toBeUndefined();
+    // ...whereas the verifier always runs it.
+    expect(verifier.isolation).toBeDefined();
+  });
+  test("lite mode: implementer modifying test files does NOT appear in isolation warnings (no isolation check)", async () => {
+    // Strict mode turns an implementer touching test files into a warning.
+    // Lite mode skips that isolation check, so no warnings are recorded.
+    mockGitSpawn({
+      diffFiles: [
+        ["test/user.test.ts"], // s1 getChangedFiles
+        ["test/user.test.ts", "src/user.ts"], // s2 getChangedFiles
+        [], // s3 isolation
+        [], // s3 getChangedFiles
+      ],
+    });
+    const outcome = await runTdd(createPassingAgent(), { lite: true });
+    const implementer = outcome.sessions[1];
+    expect(implementer.isolation).toBeUndefined(); // No isolation in lite
+    expect(implementer.success).toBe(true); // Agent succeeded
+    expect(outcome.success).toBe(true);
+    expect(outcome.lite).toBe(true);
+  });
+  test("lite mode: verifier always runs isolation check (even in lite mode)", async () => {
+    mockGitSpawn({
+      diffFiles: [
+        ["test/user.test.ts"], // s1 getChangedFiles
+        ["src/user.ts"], // s2 getChangedFiles
+        [], // s3 isolation (verifier always checks)
+        [], // s3 getChangedFiles
+      ],
+    });
+    const outcome = await runTdd(createPassingAgent(), { lite: true });
+    const verifier = outcome.sessions[2];
+    expect(verifier.isolation).toBeDefined();
+    expect(verifier.isolation?.passed).toBe(true);
+    expect(outcome.lite).toBe(true);
+  });
+  test("lite mode: dry-run returns lite=true", async () => {
+    // No agent responses are scripted for a dry run.
+    const outcome = await runTdd(createMockAgent([]), { dryRun: true, lite: true });
+    expect(outcome.lite).toBe(true);
+    expect(outcome.success).toBe(true);
+    expect(outcome.sessions).toHaveLength(0);
+  });
+});
+// ─── T4: Zero-file fallback tests ────────────────────────────────────────────
+describe("runThreeSessionTdd — zero-file fallback", () => {
+  /**
+   * Replaces Bun.spawn with a mock covering shell `-c` commands and the git
+   * subcommands `rev-parse`, `checkout` and `diff`; anything else is passed
+   * to originalSpawn.
+   *
+   * - diffFiles: file lists handed out one per `git diff` call, in order
+   *   (an empty list once exhausted).
+   * - onCheckout: invoked on every `git checkout` call.
+   * - testCommandSuccess: whether shell commands exit 0 (default) or 1.
+   */
+  function mockGitSpawnWithCheckout(opts: {
+    diffFiles: string[][];
+    onCheckout?: () => void;
+    testCommandSuccess?: boolean;
+  }) {
+    const shells = ["/bin/sh", "/bin/bash", "/bin/zsh"];
+    const testsPass = opts.testCommandSuccess ?? true;
+    let refCounter = 0;
+    let diffIndex = 0;
+    // Process-like stub for a git command that exits 0 with the given stdout.
+    const gitProcess = (stdoutText: string) => ({
+      exited: Promise.resolve(0),
+      stdout: new Response(stdoutText).body,
+      stderr: new Response("").body,
+    });
+    // @ts-ignore — mocking global
+    Bun.spawn = mock((cmd: string[], spawnOpts?: any) => {
+      const [program, subcommand] = cmd;
+      // Shell invocations are treated as the test command.
+      if (shells.includes(program) && subcommand === "-c") {
+        return {
+          pid: 9999,
+          exited: Promise.resolve(testsPass ? 0 : 1),
+          stdout: new Response(testsPass ? "tests pass\n" : "tests fail\n").body,
+          stderr: new Response("").body,
+        };
+      }
+      if (program !== "git") {
+        return originalSpawn(cmd, spawnOpts);
+      }
+      switch (subcommand) {
+        case "rev-parse":
+          refCounter += 1;
+          return gitProcess(`ref-${refCounter}\n`);
+        case "checkout":
+          opts.onCheckout?.();
+          return gitProcess("");
+        case "diff": {
+          const changed = opts.diffFiles[diffIndex] || [];
+          diffIndex += 1;
+          return gitProcess(`${changed.join("\n")}\n`);
+        }
+        default:
+          return originalSpawn(cmd, spawnOpts);
+      }
+    });
+  }
+  /** Mock agent scripted with a single successful session (the test-writer). */
+  const createTestWriterOnlyAgent = () => createMockAgent([{ success: true, estimatedCost: 0.01 }]);
+  /** DEFAULT_CONFIG with only tdd.strategy replaced. */
+  const configWithStrategy = (strategy: "auto" | "strict" | "lite") => ({
+    ...DEFAULT_CONFIG,
+    tdd: { ...DEFAULT_CONFIG.tdd, strategy },
+  });
+  const ZERO_TEST_FILES_REASON = "Test writer session created no test files (greenfield project)";
+  test("fallback NO LONGER triggers when strategy='auto' and 0 test files (BUG-010 removed auto-fallback)", async () => {
+    // BUG-010: zero-file scenarios now return greenfield-no-tests immediately,
+    // with no fallback to lite mode.
+    let checkoutSeen = false;
+    mockGitSpawnWithCheckout({
+      diffFiles: [
+        ["requirements.md"], // s1 isolation (strict) — no source violations
+        ["requirements.md"], // s1 getChangedFiles (strict) — 0 test files → return greenfield-no-tests
+      ],
+      onCheckout: () => {
+        checkoutSeen = true;
+      },
+    });
+    const scriptedAgent = createTestWriterOnlyAgent(); // s1 strict test-writer
+    const outcome = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: configWithStrategy("auto"),
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(checkoutSeen).toBe(false); // git checkout NOT called (no fallback)
+    expect(outcome.lite).toBe(false); // not in lite mode
+    expect(outcome.success).toBe(false); // fails with greenfield-no-tests
+    expect(outcome.failureCategory).toBe("greenfield-no-tests");
+  });
+  test("zero-file scenario returns greenfield-no-tests (BUG-010 removed lite fallback)", async () => {
+    // BUG-010: there is no auto-fallback to lite mode any more.
+    mockGitSpawn({
+      diffFiles: [
+        ["docs/plan.md"], // s1 isolation (strict)
+        ["docs/plan.md"], // s1 getChangedFiles (strict) → 0 test files
+      ],
+    });
+    const scriptedAgent = createTestWriterOnlyAgent();
+    const outcome = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(outcome.lite).toBe(false);
+    expect(outcome.success).toBe(false);
+    expect(outcome.failureCategory).toBe("greenfield-no-tests");
+  });
+  test("fallback does NOT trigger when strategy='strict' (explicit strict mode)", async () => {
+    // With strategy='strict' there is no fallback, so the run must fail.
+    mockGitSpawn({
+      diffFiles: [
+        ["requirements.md"], // s1 isolation — no source violations
+        ["requirements.md"], // s1 getChangedFiles — 0 test files
+      ],
+    });
+    const scriptedAgent = createTestWriterOnlyAgent();
+    const outcome = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: configWithStrategy("strict"),
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(outcome.success).toBe(false);
+    expect(outcome.needsHumanReview).toBe(true);
+    expect(outcome.reviewReason).toBe(ZERO_TEST_FILES_REASON);
+    expect(outcome.lite).toBe(false); // Was called in strict mode, no fallback
+  });
+  test("fallback does NOT trigger when already in lite mode", async () => {
+    // Called with lite=true: zero test files must yield a failure rather than another fallback.
+    mockGitSpawn({
+      diffFiles: [
+        ["requirements.md"], // s1 getChangedFiles (lite, no isolation) — 0 test files
+      ],
+    });
+    const scriptedAgent = createTestWriterOnlyAgent();
+    const outcome = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+      lite: true,
+    });
+    expect(outcome.success).toBe(false);
+    expect(outcome.needsHumanReview).toBe(true);
+    expect(outcome.reviewReason).toBe(ZERO_TEST_FILES_REASON);
+    expect(outcome.lite).toBe(true);
+  });
+  test("fallback does NOT trigger when strategy='lite' config", async () => {
+    // With strategy='lite' the caller passes lite=true, so no fallback applies.
+    mockGitSpawn({
+      diffFiles: [
+        [], // s1 getChangedFiles (lite, no isolation) — 0 test files
+      ],
+    });
+    const scriptedAgent = createTestWriterOnlyAgent();
+    const outcome = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: configWithStrategy("lite"),
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+      lite: true, // router sets this for lite strategy
+    });
+    expect(outcome.success).toBe(false);
+    expect(outcome.lite).toBe(true);
+  });
+});
+// ─── T4: failureCategory tests ────────────────────────────────────────────────
+describe("runThreeSessionTdd — failureCategory", () => {
+  test("test-writer isolation failure sets failureCategory='isolation-violation'", async () => {
+    // The test-writer changes a source file alongside its test file, which is
+    // expected to be reported as an isolation violation.
+    const touchedFiles = ["src/user.ts", "test/user.test.ts"];
+    mockGitSpawn({
+      diffFiles: [
+        [...touchedFiles], // isolation check: test-writer touched source files!
+        [...touchedFiles], // getChangedFiles
+      ],
+    });
+    const scriptedAgent = createMockAgent([{ success: true, estimatedCost: 0.01 }]);
+    const { success, failureCategory } = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    expect(failureCategory).toBe("isolation-violation");
+  });
+  test("test-writer zero files (non-auto strategy) sets failureCategory='greenfield-no-tests'", async () => {
+    // With the strict strategy, a test-writer session that changes no test
+    // files is categorised as greenfield-no-tests (BUG-010 behavior).
+    // The test title names that category so reports match the assertion below.
+    mockGitSpawn({
+      diffFiles: [
+        ["requirements.md"], // s1 isolation — no source violations
+        ["requirements.md"], // s1 getChangedFiles — 0 test files
+      ],
+    });
+    const agent = createMockAgent([{ success: true, estimatedCost: 0.01 }]);
+    // DEFAULT_CONFIG with only tdd.strategy forced to "strict".
+    const configWithStrictStrategy = {
+      ...DEFAULT_CONFIG,
+      tdd: { ...DEFAULT_CONFIG.tdd, strategy: "strict" as const },
+    };
+    const result = await runThreeSessionTdd({
+      agent,
+      story,
+      config: configWithStrictStrategy,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(result.success).toBe(false);
+    expect(result.failureCategory).toBe("greenfield-no-tests");
+  });
+  test("test-writer crash/timeout (non-isolation failure) sets failureCategory='session-failure'", async () => {
+    // The diff shows only a test file, so isolation is clean; the failure comes
+    // from the agent itself, which reports exit code 1.
+    mockGitSpawn({
+      diffFiles: [
+        ["test/user.test.ts"], // isolation check: only test files (passes)
+        ["test/user.test.ts"], // getChangedFiles
+      ],
+    });
+    // Agent crash
+    const crashingAgent = createMockAgent([{ success: false, exitCode: 1, estimatedCost: 0.01 }]);
+    const { success, failureCategory } = await runThreeSessionTdd({
+      agent: crashingAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    // isolation.passed=true but agent failed → session-failure
+    expect(failureCategory).toBe("session-failure");
+  });
+  test("implementer failure sets failureCategory='session-failure'", async () => {
+    // Both sessions have clean diffs; only the implementer agent reports failure.
+    mockGitSpawn({
+      diffFiles: [
+        ["test/user.test.ts"], // session 1 isolation: OK
+        ["test/user.test.ts"], // session 1 getChangedFiles
+        ["src/user.ts"], // session 2 isolation: OK
+        ["src/user.ts"], // session 2 getChangedFiles
+      ],
+    });
+    const scriptedAgent = createMockAgent([
+      { success: true, estimatedCost: 0.01 }, // test-writer OK
+      { success: false, exitCode: 1, estimatedCost: 0.02 }, // implementer fails
+    ]);
+    const { success, failureCategory } = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    expect(failureCategory).toBe("session-failure");
+  });
+  test("post-TDD test failure sets failureCategory='tests-failing'", async () => {
+    // The verifier session fails AND the mocked independent test run exits 1.
+    let refCounter = 0;
+    let diffIndex = 0;
+    // One entry is consumed per mocked `git diff` call, in call order.
+    const changedFilesPerDiff = [
+      ["test/user.test.ts"],
+      ["test/user.test.ts"],
+      ["src/user.ts"],
+      ["src/user.ts"],
+      ["src/user.ts"],
+    ];
+    // Process-like stub for a git command that exits 0 with the given stdout.
+    const gitProcess = (stdoutText: string) => ({
+      exited: Promise.resolve(0),
+      stdout: new Response(stdoutText).body,
+      stderr: new Response("").body,
+    });
+    // @ts-ignore — mocking global
+    Bun.spawn = mock((cmd: string[], spawnOpts?: any) => {
+      const [program, subcommand, script] = cmd;
+      // The post-TDD test command (bun test via /bin/sh) is made to fail.
+      if (program === "/bin/sh" && script?.includes("bun test")) {
+        return {
+          pid: 9999,
+          exited: Promise.resolve(1),
+          stdout: new Response("3 pass, 2 fail\n").body,
+          stderr: new Response("Test errors...\n").body,
+        };
+      }
+      if (program === "git" && subcommand === "rev-parse") {
+        refCounter += 1;
+        return gitProcess(`ref-${refCounter}\n`);
+      }
+      if (program === "git" && subcommand === "diff") {
+        const changed = changedFilesPerDiff[diffIndex] || [];
+        diffIndex += 1;
+        return gitProcess(`${changed.join("\n")}\n`);
+      }
+      // Every other command is delegated to originalSpawn.
+      return originalSpawn(cmd, spawnOpts);
+    });
+    const scriptedAgent = createMockAgent([
+      { success: true, estimatedCost: 0.01 },
+      { success: true, estimatedCost: 0.02 },
+      { success: false, exitCode: 1, estimatedCost: 0.01 }, // verifier fails
+    ]);
+    const { success, failureCategory } = await runThreeSessionTdd({
+      agent: scriptedAgent,
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    expect(failureCategory).toBe("tests-failing");
+  });
+  test("success path has no failureCategory", async () => {
+    // Git output is stubbed through mockGitSpawn and all three mocked sessions report success.
+    mockGitSpawn({
+      diffFiles: [["test/user.test.ts"], ["test/user.test.ts"], ["src/user.ts"], ["src/user.ts"], ["src/user.ts"]],
+    });
+    const { success, failureCategory } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: true, estimatedCost: 0.01 },
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(success).toBe(true);
+    // A successful run must not carry a failure classification.
+    expect(failureCategory).toBeUndefined();
+  });
+  test("zero-file scenario (auto strategy) returns greenfield-no-tests (BUG-010 removed auto-fallback)", async () => {
+    // BUG-010: with the auto strategy, a test-writer session that produces zero
+    // test files now yields greenfield-no-tests instead of falling back.
+    const changedFilesPerDiff = [
+      ["requirements.md"], // s1 isolation (strict) — no source violations
+      ["requirements.md"], // s1 getChangedFiles (strict) — 0 test files → return greenfield-no-tests
+    ];
+    let diffCalls = 0;
+    // Builds the successful (exit code 0) subprocess handle the git stubs return.
+    const gitOk = (out: string) => ({
+      exited: Promise.resolve(0),
+      stdout: new Response(out).body,
+      stderr: new Response("").body,
+    });
+    // @ts-ignore — mocking global
+    Bun.spawn = mock((cmd: string[], spawnOpts?: any) => {
+      const [program, firstArg] = cmd;
+      if (program === "git" && firstArg === "rev-parse") {
+        // Every rev-parse call reports the same ref here.
+        return gitOk("ref-1\n");
+      }
+      if (program === "git" && firstArg === "diff") {
+        const changed = changedFilesPerDiff[diffCalls++] || [];
+        return gitOk(`${changed.join("\n")}\n`);
+      }
+      // Non-git commands use the real spawn.
+      return originalSpawn(cmd, spawnOpts);
+    });
+    const autoTdd = { ...DEFAULT_CONFIG.tdd, strategy: "auto" as const };
+    const configWithAutoStrategy = { ...DEFAULT_CONFIG, tdd: autoTdd };
+    const { success, lite, failureCategory } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 }, // s1 strict test-writer
+      ]),
+      story,
+      config: configWithAutoStrategy,
+      workdir: "/tmp/test",
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    expect(lite).toBe(false);
+    expect(failureCategory).toBe("greenfield-no-tests");
+  });
+});
+// ─── T9: Verdict integration tests ───────────────────────────────────────────
+describe("runThreeSessionTdd — T9: verdict integration", () => {
+  // Scratch working directory for the current test; reassigned in beforeEach.
+  let tmpDir: string;
+  // Each test gets its own uniquely named directory under /tmp (timestamp plus
+  // random suffix), so a verdict file written by one test is not seen by another.
+  beforeEach(async () => {
+    tmpDir = `/tmp/nax-t9-test-${Date.now()}-${Math.random().toString(36).slice(2)}`;
+    await mkdir(tmpDir, { recursive: true });
+  });
+  afterEach(async () => {
+    // Restore the real Bun.spawn BEFORE the async cleanup: if rm() rejects, the
+    // stub would otherwise remain installed for every following test.
+    Bun.spawn = originalSpawn;
+    await rm(tmpDir, { recursive: true, force: true });
+  });
+  /**
+   * Write a version-1 verdict JSON document to `tmpDir` under VERDICT_FILE.
+   *
+   * `opts.approved` is copied into the verdict as-is. `opts.failReason` selects
+   * which single section of the verdict reports a problem; every other section
+   * is filled with passing values. With no `failReason`, all sections pass.
+   */
+  async function writeVerdictToDir(opts: {
+    approved: boolean;
+    failReason?: "tests-failing" | "illegitimate-mods" | "criteria-not-met" | "poor-quality";
+  }) {
+    const { approved, failReason } = opts;
+    // One flag per supported failure reason; at most one of them is true.
+    const testsFailing = failReason === "tests-failing";
+    const illegitimateMods = failReason === "illegitimate-mods";
+    const criteriaNotMet = failReason === "criteria-not-met";
+    const poorQuality = failReason === "poor-quality";
+    const verdict = {
+      version: 1,
+      approved,
+      tests: {
+        allPassing: !testsFailing,
+        passCount: testsFailing ? 5 : 10,
+        failCount: testsFailing ? 3 : 0,
+      },
+      testModifications: {
+        detected: illegitimateMods,
+        files: illegitimateMods ? ["test/foo.test.ts"] : [],
+        legitimate: !illegitimateMods,
+        reasoning: illegitimateMods ? "Implementer cheated" : "No mods",
+      },
+      acceptanceCriteria: {
+        allMet: !criteriaNotMet,
+        criteria: criteriaNotMet ? [{ criterion: "Must work", met: false }] : [{ criterion: "Works", met: true }],
+      },
+      quality: {
+        rating: poorQuality ? "poor" : "good",
+        issues: poorQuality ? ["Security issue"] : [],
+      },
+      fixes: [],
+      reasoning: approved ? "All good." : "Implementation rejected.",
+    };
+    const verdictPath = path.join(tmpDir, VERDICT_FILE);
+    await writeFile(verdictPath, JSON.stringify(verdict, null, 2));
+  }
+  /**
+   * Replace Bun.spawn with a stub suited to a full 3-session T9 run.
+   *
+   * - `/bin/sh` commands whose script contains "bun test" resolve with whatever
+   *   `opts.onTestCmd` returns (default: exit code 0, "5 pass, 0 fail").
+   * - `git rev-parse` yields `ref-1`, `ref-2`, … on successive calls.
+   * - `git diff` returns the next entry of `opts.diffFiles`. The default list
+   *   provides 6 entries (isolation + getChangedFiles per session); calls past
+   *   the end of the list report no files.
+   * - Every other command is forwarded to `originalSpawn`.
+   */
+  function mockGitAndTestForT9(opts: {
+    diffFiles?: string[][];
+    onTestCmd?: () => { exitCode: number; stdout: string };
+  }) {
+    const scriptedDiffs = opts.diffFiles ?? [
+      ["test/user.test.ts"], // s1 isolation
+      ["test/user.test.ts"], // s1 getChangedFiles
+      ["src/user.ts"], // s2 isolation
+      ["src/user.ts"], // s2 getChangedFiles
+      [], // s3 isolation
+      ["src/user.ts"], // s3 getChangedFiles
+    ];
+    let revParseCalls = 0;
+    let diffCalls = 0;
+    // Common shape of the stubbed subprocess handle; stderr is always empty.
+    const fakeProcess = (exitCode: number, out: string) => ({
+      exited: Promise.resolve(exitCode),
+      stdout: new Response(out).body,
+      stderr: new Response("").body,
+    });
+    // @ts-ignore — mocking global
+    Bun.spawn = mock((cmd: string[], spawnOpts?: any) => {
+      const [program, firstArg, shellScript] = cmd;
+      if (program === "/bin/sh" && shellScript?.includes("bun test")) {
+        // Let the caller observe or override the test run; otherwise report a passing suite.
+        const { exitCode, stdout } = opts.onTestCmd?.() ?? { exitCode: 0, stdout: "5 pass, 0 fail\n" };
+        return { pid: 9999, ...fakeProcess(exitCode, stdout) };
+      }
+      if (program === "git" && firstArg === "rev-parse") {
+        return fakeProcess(0, `ref-${++revParseCalls}\n`);
+      }
+      if (program === "git" && firstArg === "diff") {
+        const changed = scriptedDiffs[diffCalls++] || [];
+        return fakeProcess(0, `${changed.join("\n")}\n`);
+      }
+      return originalSpawn(cmd, spawnOpts);
+    });
+  }
+  test("verdict approved=true: overall success even when verifier session failed", async () => {
+    // An approving verdict file is on disk before the run starts.
+    await writeVerdictToDir({ approved: true });
+    mockGitAndTestForT9({});
+    const outcome = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: false, exitCode: 1, estimatedCost: 0.01 }, // verifier exits non-zero
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    // The approved verdict is expected to win over the failed third session.
+    expect(outcome.success).toBe(true);
+    expect(outcome.needsHumanReview).toBe(false);
+    expect(outcome.failureCategory).toBeUndefined();
+    expect(outcome.reviewReason).toBeUndefined();
+  });
+  test("verdict approved=true: skips the post-TDD independent test check", async () => {
+    await writeVerdictToDir({ approved: true });
+    // Flipped by the stub if the shell test command is ever spawned.
+    let sawTestCommand = false;
+    mockGitAndTestForT9({
+      onTestCmd: () => {
+        sawTestCommand = true;
+        return { exitCode: 0, stdout: "" };
+      },
+    });
+    // Disable rectification to avoid test command being called for full-suite gate
+    const { execution } = DEFAULT_CONFIG;
+    const configNoRectification = {
+      ...DEFAULT_CONFIG,
+      execution: {
+        ...execution,
+        rectification: { ...execution.rectification, enabled: false },
+      },
+    };
+    await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: false, exitCode: 1, estimatedCost: 0.01 }, // verifier fails
+      ]),
+      story,
+      config: configNoRectification,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    expect(sawTestCommand).toBe(false); // Test was NOT run when verdict present
+  });
+  test("verdict approved=false + tests-failing → failureCategory='tests-failing'", async () => {
+    // The verdict on disk rejects the work and reports failing tests.
+    await writeVerdictToDir({ approved: false, failReason: "tests-failing" });
+    mockGitAndTestForT9({});
+    const { success, needsHumanReview, failureCategory, reviewReason } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: true, estimatedCost: 0.01 }, // sessions succeed but verdict says rejected
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    expect(needsHumanReview).toBe(true);
+    expect(failureCategory).toBe("tests-failing");
+    expect(reviewReason).toContain("failure(s)");
+  });
+  test("verdict approved=false + illegitimate test mods → failureCategory='verifier-rejected'", async () => {
+    // The verdict on disk flags the test modifications as not legitimate.
+    await writeVerdictToDir({ approved: false, failReason: "illegitimate-mods" });
+    mockGitAndTestForT9({});
+    const { success, failureCategory, reviewReason } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: true, estimatedCost: 0.01 },
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    expect(failureCategory).toBe("verifier-rejected");
+    expect(reviewReason).toContain("illegitimate test modifications");
+  });
+  test("verdict approved=false + criteria not met → failureCategory='verifier-rejected'", async () => {
+    // The verdict on disk lists the single criterion "Must work" as unmet.
+    await writeVerdictToDir({ approved: false, failReason: "criteria-not-met" });
+    mockGitAndTestForT9({});
+    const { success, failureCategory, reviewReason } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: true, estimatedCost: 0.01 },
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    expect(failureCategory).toBe("verifier-rejected");
+    // The unmet criterion's text must surface in the review reason.
+    expect(reviewReason).toContain("Must work");
+  });
+  test("no verdict file → fallback: post-TDD test check is run on session failures", async () => {
+    // Nothing is written to tmpDir, so no verdict exists; the failing verifier
+    // session should make the run fall back to an independent test execution.
+    let sawTestCommand = false;
+    mockGitAndTestForT9({
+      onTestCmd: () => {
+        sawTestCommand = true;
+        return { exitCode: 0, stdout: "5 pass, 0 fail\n" }; // Tests pass in fallback
+      },
+    });
+    const { success, verdict } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: false, exitCode: 1, estimatedCost: 0.01 }, // verifier fails
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    expect(sawTestCommand).toBe(true); // Fallback test run was executed
+    expect(success).toBe(true); // Tests pass in fallback → success
+    expect(verdict).toBeNull(); // No verdict available
+  });
+  test("malformed verdict → fallback: post-TDD test check is run", async () => {
+    // The verdict file exists but holds text that is not valid JSON.
+    const verdictPath = path.join(tmpDir, VERDICT_FILE);
+    await writeFile(verdictPath, "{ this is not valid json }");
+    let sawTestCommand = false;
+    mockGitAndTestForT9({
+      onTestCmd: () => {
+        sawTestCommand = true;
+        return { exitCode: 0, stdout: "5 pass\n" };
+      },
+    });
+    const { verdict } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: false, exitCode: 1, estimatedCost: 0.01 },
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    expect(sawTestCommand).toBe(true); // Fallback used when verdict is malformed
+    expect(verdict).toBeNull(); // Malformed = null
+  });
+  test("verdict stored in result.verdict for logging/debugging (approved=true)", async () => {
+    await writeVerdictToDir({ approved: true });
+    mockGitAndTestForT9({});
+    const { verdict } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: true, estimatedCost: 0.01 },
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    // The verdict must be present before its fields are inspected.
+    expect(verdict).toBeDefined();
+    expect(verdict).not.toBeNull();
+    // Field values mirror what writeVerdictToDir wrote for an approved verdict.
+    expect(verdict!.version).toBe(1);
+    expect(verdict!.approved).toBe(true);
+    expect(verdict!.tests.allPassing).toBe(true);
+    expect(verdict!.tests.passCount).toBe(10);
+    expect(verdict!.reasoning).toBe("All good.");
+  });
+  test("verdict stored in result.verdict for logging/debugging (approved=false)", async () => {
+    await writeVerdictToDir({ approved: false, failReason: "tests-failing" });
+    mockGitAndTestForT9({});
+    const { verdict } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: true, estimatedCost: 0.01 },
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    expect(verdict).not.toBeNull();
+    // A rejecting verdict is kept on the result too, including its failure count.
+    expect(verdict!.approved).toBe(false);
+    expect(verdict!.tests.failCount).toBe(3);
+  });
+  test("verdict file is deleted after reading (cleanup enforced)", async () => {
+    await writeVerdictToDir({ approved: true });
+    mockGitAndTestForT9({});
+    const verdictFilePath = path.join(tmpDir, VERDICT_FILE);
+    // Precondition: the file is on disk before the run begins.
+    expect(existsSync(verdictFilePath)).toBe(true); // File exists before run
+    await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: true, estimatedCost: 0.01 },
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    // Postcondition: the run has removed the file.
+    expect(existsSync(verdictFilePath)).toBe(false); // File cleaned up after run
+  });
+  test("no verdict + all sessions succeed → success without running test check", async () => {
+    // No verdict file is written and every session succeeds: the run should
+    // succeed and should NOT spawn the shell test command.
+    let sawTestCommand = false;
+    mockGitAndTestForT9({
+      onTestCmd: () => {
+        sawTestCommand = true;
+        return { exitCode: 0, stdout: "" };
+      },
+    });
+    // Disable rectification to avoid test command being called for full-suite gate
+    const { execution } = DEFAULT_CONFIG;
+    const configNoRectification = {
+      ...DEFAULT_CONFIG,
+      execution: {
+        ...execution,
+        rectification: { ...execution.rectification, enabled: false },
+      },
+    };
+    const { success, verdict, failureCategory } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: true, estimatedCost: 0.01 },
+        { success: true, estimatedCost: 0.02 },
+        { success: true, estimatedCost: 0.01 },
+      ]),
+      story,
+      config: configNoRectification,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    expect(success).toBe(true);
+    expect(sawTestCommand).toBe(false); // Not needed when sessions all succeed
+    expect(verdict).toBeNull(); // No verdict
+    expect(failureCategory).toBeUndefined();
+  });
+  test("early-exit before session 3 (session 1 fails) → verdict is undefined (not attempted)", async () => {
+    // Only the first session's two diff calls are scripted, because the run is
+    // expected to stop after session 1 and never attempt to read a verdict.
+    mockGitAndTestForT9({
+      diffFiles: [
+        ["test/user.test.ts"], // s1 isolation
+        ["test/user.test.ts"], // s1 getChangedFiles
+      ],
+    });
+    const { success, sessions, verdict } = await runThreeSessionTdd({
+      agent: createMockAgent([
+        { success: false, exitCode: 1, estimatedCost: 0.01 }, // session 1 fails
+      ]),
+      story,
+      config: DEFAULT_CONFIG,
+      workdir: tmpDir,
+      modelTier: "balanced",
+    });
+    expect(success).toBe(false);
+    expect(sessions).toHaveLength(1);
+    // verdict is undefined (field not set) because we never got to session 3
+    expect(verdict).toBeUndefined();
+  });
+});