@nathapp/nax 0.28.0 → 0.30.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (385) hide show
  1. package/CHANGELOG.md +23 -2
  2. package/bin/nax.ts +2 -3
  3. package/dist/nax.js +72753 -0
  4. package/package.json +11 -3
  5. package/src/cli/analyze.ts +2 -7
  6. package/src/cli/config.ts +3 -1
  7. package/src/config/defaults.ts +1 -0
  8. package/src/config/schemas.ts +1 -0
  9. package/src/config/types.ts +1 -0
  10. package/src/context/builder.ts +10 -1
  11. package/src/execution/lifecycle/headless-formatter.ts +2 -4
  12. package/src/prompts/builder.ts +12 -69
  13. package/src/prompts/sections/isolation.ts +38 -8
  14. package/src/prompts/sections/role-task.ts +79 -17
  15. package/src/review/runner.ts +6 -1
  16. package/src/version.ts +2 -1
  17. package/.claude/rules/01-project-conventions.md +0 -34
  18. package/.claude/rules/02-test-architecture.md +0 -39
  19. package/.claude/rules/03-test-writing.md +0 -58
  20. package/.claude/rules/04-forbidden-patterns.md +0 -29
  21. package/.claude/settings.json +0 -15
  22. package/.githooks/pre-commit +0 -16
  23. package/.gitlab-ci.yml +0 -103
  24. package/.mcp.json +0 -8
  25. package/BRIEF.md +0 -140
  26. package/CLAUDE.md +0 -143
  27. package/US-007-IMPLEMENTATION.md +0 -139
  28. package/biome.json +0 -14
  29. package/bun.lock +0 -163
  30. package/bunfig.toml +0 -12
  31. package/docker-compose.test.yml +0 -15
  32. package/docs/20260216-fix-plan-context-review.md +0 -56
  33. package/docs/20260216-relentless-vs-ngent-comparison.md +0 -208
  34. package/docs/20260216-v02-plan.md +0 -136
  35. package/docs/20260216-v02-review.md +0 -685
  36. package/docs/20260217-dogfood-findings.md +0 -56
  37. package/docs/20260217-p2-plus-plan.md +0 -117
  38. package/docs/20260217-partial-fixes-plan.md +0 -62
  39. package/docs/20260217-plan-analyze-spec.md +0 -117
  40. package/docs/20260217-post-impl-review.md +0 -1137
  41. package/docs/20260217-quick-wins-plan.md +0 -66
  42. package/docs/20260217-split-runner-plan.md +0 -75
  43. package/docs/20260217-v03-impl-plan.md +0 -80
  44. package/docs/20260217-v03-post-impl-review.md +0 -589
  45. package/docs/20260217-v04-impl-plan.md +0 -86
  46. package/docs/20260217-v05-post-impl-review.md +0 -850
  47. package/docs/20260217-v06-post-impl-review.md +0 -817
  48. package/docs/20260218-adr003-port-plan.md +0 -151
  49. package/docs/20260218-review-adr003-verification.md +0 -175
  50. package/docs/20260219-fix-plan-bug16-19.md +0 -79
  51. package/docs/20260219-fix-plan-bug20-22.md +0 -114
  52. package/docs/20260219-plan-llm-routing.md +0 -116
  53. package/docs/20260219-review-bug20-22-fixes.md +0 -135
  54. package/docs/20260219-routing-baseline-keyword.md +0 -63
  55. package/docs/20260220-plan-structured-logging-p1.md +0 -80
  56. package/docs/20260220-plan-structured-logging-p2.md +0 -37
  57. package/docs/20260220-review-llm-routing.md +0 -180
  58. package/docs/20260220-review-post-fix-llm-routing.md +0 -70
  59. package/docs/20260221-fix-plan-relevantfiles-split.md +0 -101
  60. package/docs/20260221-fix-plan-routing-mode.md +0 -125
  61. package/docs/20260221-review-v0.9-implementation.md +0 -379
  62. package/docs/20260222-fix-plan-v091-routing-isolation.md +0 -197
  63. package/docs/20260223-fix-plan-prompt-audit.md +0 -62
  64. package/docs/20260224-nax-roadmap-phases.md +0 -189
  65. package/docs/20260225-phase2-llm-service-layer.md +0 -401
  66. package/docs/20260225-review-v0.10.1.md +0 -187
  67. package/docs/20260303-v010-implementation-plan.md +0 -165
  68. package/docs/20260304-review-nax.md +0 -492
  69. package/docs/CLAUDE.md.bak +0 -191
  70. package/docs/ROADMAP.md +0 -390
  71. package/docs/SPEC-rectification.md +0 -0
  72. package/docs/SPEC.md +0 -324
  73. package/docs/US-001-plugin-loading-verification.md +0 -152
  74. package/docs/adr/ADR-005-implementation-plan.md +0 -655
  75. package/docs/adr/ADR-005-pipeline-re-architecture.md +0 -464
  76. package/docs/architecture-analysis.md +0 -1076
  77. package/docs/bugs/BUG-21-escalation-null-attempts.md +0 -48
  78. package/docs/bugs-from-dogfood-run-c.md +0 -243
  79. package/docs/code-review-20260228.md +0 -612
  80. package/docs/code-review-v0.15.0.md +0 -629
  81. package/docs/hook-lifecycle-test-plan.md +0 -149
  82. package/docs/releases/v0.11.0-and-earlier.md +0 -20
  83. package/docs/releases/v0.12.0.md +0 -15
  84. package/docs/releases/v0.13.0.md +0 -14
  85. package/docs/releases/v0.14.0.md +0 -20
  86. package/docs/releases/v0.14.1.md +0 -36
  87. package/docs/releases/v0.14.2.md +0 -51
  88. package/docs/releases/v0.14.3.md +0 -174
  89. package/docs/releases/v0.14.4.md +0 -94
  90. package/docs/releases/v0.15.0.md +0 -502
  91. package/docs/releases/v0.15.1.md +0 -170
  92. package/docs/releases/v0.15.3.md +0 -193
  93. package/docs/specs/bug-039-orphan-processes.md +0 -131
  94. package/docs/specs/bug-040-review-rectification.md +0 -82
  95. package/docs/specs/bug-041-cross-story-test-isolation.md +0 -88
  96. package/docs/specs/bug-042-verifier-failure-capture.md +0 -117
  97. package/docs/specs/bun-pty-migration.md +0 -171
  98. package/docs/specs/central-run-registry.md +0 -116
  99. package/docs/specs/feat-010-smart-runner-git-history.md +0 -96
  100. package/docs/specs/feat-011-file-context-strategy.md +0 -73
  101. package/docs/specs/feat-012-tdd-writer-tier.md +0 -79
  102. package/docs/specs/feat-013-test-after-review.md +0 -89
  103. package/docs/specs/feat-014-heartbeat-observability.md +0 -127
  104. package/docs/specs/status-file-consolidation.md +0 -93
  105. package/docs/specs/status-file-v0.10.1.md +0 -812
  106. package/docs/specs/trigger-completion.md +0 -145
  107. package/docs/specs/verification-architecture-v2.md +0 -343
  108. package/docs/tdd/strategies.md +0 -97
  109. package/docs/v0.10-global-config.md +0 -206
  110. package/docs/v0.10-plugin-system.md +0 -415
  111. package/docs/v0.10-prompt-optimizer.md +0 -234
  112. package/docs/v0.3-spec.md +0 -244
  113. package/docs/v0.4-spec.md +0 -140
  114. package/docs/v0.5-spec.md +0 -237
  115. package/docs/v0.6-spec.md +0 -371
  116. package/docs/v0.7-spec.md +0 -177
  117. package/docs/v0.8-llm-routing.md +0 -206
  118. package/docs/v0.8-structured-logging.md +0 -132
  119. package/docs/v0.9.3-prompt-audit.md +0 -112
  120. package/examples/plugins/console-reporter/index.test.ts +0 -207
  121. package/examples/plugins/console-reporter/index.ts +0 -110
  122. package/memory/topic/feat-010-baseref.md +0 -28
  123. package/memory/topic/feat-013-test-after-deprecation.md +0 -22
  124. package/nax/config.json +0 -154
  125. package/nax/features/bug-039-medium/prd.json +0 -45
  126. package/nax/features/bugfix-v0171/prd.json +0 -52
  127. package/nax/features/central-run-registry/prd.json +0 -105
  128. package/nax/features/config-management/prd.json +0 -108
  129. package/nax/features/config-management/progress.txt +0 -5
  130. package/nax/features/diagnose/acceptance.test.ts +0 -414
  131. package/nax/features/diagnose/prd.json +0 -41
  132. package/nax/features/nax-compliance/prd.json +0 -52
  133. package/nax/features/nax-compliance/progress.txt +0 -1
  134. package/nax/features/orchestration-fixes/prd.json +0 -89
  135. package/nax/features/orchestration-fixes/progress.txt +0 -1
  136. package/nax/features/plugin-integration/US-007-VERIFICATION.md +0 -259
  137. package/nax/features/plugin-integration/prd.json +0 -208
  138. package/nax/features/plugin-integration/progress.txt +0 -5
  139. package/nax/features/post-rearch-bugfix/prd.json +0 -137
  140. package/nax/features/precheck/prd.json +0 -205
  141. package/nax/features/precheck/progress.txt +0 -15
  142. package/nax/features/prompt-builder/prd.json +0 -152
  143. package/nax/features/prompt-builder/progress.txt +0 -3
  144. package/nax/features/review-quality/prd.json +0 -55
  145. package/nax/features/routing-persistence/prd.json +0 -104
  146. package/nax/features/routing-persistence/progress.txt +0 -1
  147. package/nax/features/smart-test-runner/plan.md +0 -7
  148. package/nax/features/smart-test-runner/prd.json +0 -203
  149. package/nax/features/smart-test-runner/progress.txt +0 -13
  150. package/nax/features/smart-test-runner/spec.md +0 -7
  151. package/nax/features/smart-test-runner/tasks.md +0 -8
  152. package/nax/features/status-file-consolidation/prd.json +0 -106
  153. package/nax/features/structured-logging/prd.json +0 -199
  154. package/nax/features/trigger-completion/prd.json +0 -150
  155. package/nax/features/trigger-completion/progress.txt +0 -7
  156. package/nax/features/unlock/prd.json +0 -36
  157. package/nax/features/v0.18.3-execution-reliability/prd.json +0 -80
  158. package/nax/features/v0.18.3-execution-reliability/progress.txt +0 -3
  159. package/nax/features/v0.19.0-hardening/plan.md +0 -7
  160. package/nax/features/v0.19.0-hardening/prd.json +0 -84
  161. package/nax/features/v0.19.0-hardening/progress.txt +0 -7
  162. package/nax/features/v0.19.0-hardening/spec.md +0 -18
  163. package/nax/features/v0.19.0-hardening/tasks.md +0 -8
  164. package/nax/features/verify-v2/prd.json +0 -79
  165. package/nax/features/verify-v2/progress.txt +0 -3
  166. package/nax/status.json +0 -36
  167. package/src/prompts/templates/implementer.ts +0 -6
  168. package/src/prompts/templates/single-session.ts +0 -6
  169. package/src/prompts/templates/test-writer.ts +0 -6
  170. package/src/prompts/templates/verifier.ts +0 -6
  171. package/test/COVERAGE-GAPS.md +0 -333
  172. package/test/e2e/cm-003-default-view.test.ts +0 -195
  173. package/test/e2e/plan-analyze-run.test.ts +0 -902
  174. package/test/helpers/helpers.test.ts +0 -295
  175. package/test/helpers/timeout.ts +0 -42
  176. package/test/integration/US-002-TEST-SUMMARY.md +0 -107
  177. package/test/integration/US-003-TEST-SUMMARY.md +0 -149
  178. package/test/integration/US-004-TEST-SUMMARY.md +0 -106
  179. package/test/integration/US-005-TEST-SUMMARY.md +0 -138
  180. package/test/integration/US-007-TEST-SUMMARY.md +0 -100
  181. package/test/integration/cli/agent-validation.test.ts +0 -439
  182. package/test/integration/cli/cli-config-default-edge-cases.test.ts +0 -223
  183. package/test/integration/cli/cli-config-default-view.test.ts +0 -230
  184. package/test/integration/cli/cli-config-diff.test.ts +0 -461
  185. package/test/integration/cli/cli-config-prompts-explain.test.ts +0 -74
  186. package/test/integration/cli/cli-config.test.ts +0 -737
  187. package/test/integration/cli/cli-diagnose.test.ts +0 -595
  188. package/test/integration/cli/cli-logs.test.ts +0 -346
  189. package/test/integration/cli/cli-plugins.test.ts +0 -679
  190. package/test/integration/cli/cli-precheck.test.ts +0 -372
  191. package/test/integration/cli/cli-run-headless.test.ts +0 -174
  192. package/test/integration/cli/cli.test.ts +0 -76
  193. package/test/integration/cli/precheck-integration.test.ts +0 -476
  194. package/test/integration/cli/precheck-orchestrator.test.ts +0 -247
  195. package/test/integration/cli/precheck.test.ts +0 -806
  196. package/test/integration/config/config-loader.test.ts +0 -266
  197. package/test/integration/config/config.test.ts +0 -444
  198. package/test/integration/config/merger.test.ts +0 -466
  199. package/test/integration/config/paths.test.ts +0 -52
  200. package/test/integration/config/security-loader.test.ts +0 -83
  201. package/test/integration/context/context-integration.test.ts +0 -703
  202. package/test/integration/context/context-path-security.test.ts +0 -173
  203. package/test/integration/context/context-provider-injection.test.ts +0 -507
  204. package/test/integration/context/context-verification-integration.test.ts +0 -296
  205. package/test/integration/context/s5-greenfield-fallback.test.ts +0 -298
  206. package/test/integration/execution/execution-isolation.test.ts +0 -143
  207. package/test/integration/execution/execution.test.ts +0 -634
  208. package/test/integration/execution/feature-status-write.test.ts +0 -302
  209. package/test/integration/execution/parallel.test.ts +0 -251
  210. package/test/integration/execution/prd-pause.test.ts +0 -205
  211. package/test/integration/execution/prd-resolvers.test.ts +0 -186
  212. package/test/integration/execution/progress.test.ts +0 -34
  213. package/test/integration/execution/runner-batching.test.ts +0 -682
  214. package/test/integration/execution/runner-config-plugins.test.ts +0 -462
  215. package/test/integration/execution/runner-escalation.test.ts +0 -561
  216. package/test/integration/execution/runner-fixes.test.ts +0 -400
  217. package/test/integration/execution/runner-plugin-integration.test.ts +0 -544
  218. package/test/integration/execution/runner-queue-and-attempts.test.ts +0 -476
  219. package/test/integration/execution/status-file-integration.test.ts +0 -289
  220. package/test/integration/execution/status-file.test.ts +0 -380
  221. package/test/integration/execution/status-writer.test.ts +0 -447
  222. package/test/integration/execution/story-id-in-events.test.ts +0 -274
  223. package/test/integration/interaction/interaction-chain-pipeline.test.ts +0 -476
  224. package/test/integration/pipeline/hooks.test.ts +0 -363
  225. package/test/integration/pipeline/pipeline-acceptance.test.ts +0 -303
  226. package/test/integration/pipeline/pipeline-events.test.ts +0 -476
  227. package/test/integration/pipeline/pipeline.test.ts +0 -660
  228. package/test/integration/pipeline/reporter-lifecycle.test.ts +0 -862
  229. package/test/integration/pipeline/verify-stage.test.ts +0 -286
  230. package/test/integration/plan/analyze-integration.test.ts +0 -262
  231. package/test/integration/plan/analyze-scanner.test.ts +0 -132
  232. package/test/integration/plan/logger.test.ts +0 -461
  233. package/test/integration/plan/plan.test.ts +0 -157
  234. package/test/integration/plugins/config-integration.test.ts +0 -173
  235. package/test/integration/plugins/config-resolution.test.ts +0 -523
  236. package/test/integration/plugins/loader.test.ts +0 -644
  237. package/test/integration/plugins/plugins-registry.test.ts +0 -747
  238. package/test/integration/plugins/validator.test.ts +0 -564
  239. package/test/integration/prompts/pb-004-migration.test.ts +0 -523
  240. package/test/integration/review/review-config-commands.test.ts +0 -320
  241. package/test/integration/review/review-config-schema.test.ts +0 -117
  242. package/test/integration/review/review-plugin-integration.test.ts +0 -729
  243. package/test/integration/review/review.test.ts +0 -150
  244. package/test/integration/routing/plugin-routing-advanced.test.ts +0 -461
  245. package/test/integration/routing/plugin-routing-core.test.ts +0 -527
  246. package/test/integration/routing/routing-stage-bug-021.test.ts +0 -275
  247. package/test/integration/routing/routing-stage-greenfield.test.ts +0 -287
  248. package/test/integration/tdd/tdd-cleanup.test.ts +0 -246
  249. package/test/integration/tdd/tdd-orchestrator-core.test.ts +0 -565
  250. package/test/integration/tdd/tdd-orchestrator-failureCategory.test.ts +0 -355
  251. package/test/integration/tdd/tdd-orchestrator-fallback.test.ts +0 -311
  252. package/test/integration/tdd/tdd-orchestrator-lite.test.ts +0 -289
  253. package/test/integration/tdd/tdd-orchestrator-prompts.test.ts +0 -260
  254. package/test/integration/tdd/tdd-orchestrator-verdict.test.ts +0 -536
  255. package/test/integration/tmp/headless-test/test.jsonl +0 -30
  256. package/test/integration/verification/test-scanner.test.ts +0 -403
  257. package/test/integration/verification/verification-asset-check.test.ts +0 -143
  258. package/test/integration/worktree/manager.test.ts +0 -218
  259. package/test/integration/worktree/worktree-merge.test.ts +0 -341
  260. package/test/manual/logging-formatter-demo.ts +0 -158
  261. package/test/ui/tui-agent-panel.test.tsx +0 -99
  262. package/test/ui/tui-pty-integration.test.tsx +0 -146
  263. package/test/unit/acceptance.test.ts +0 -187
  264. package/test/unit/agent-stderr-capture.test.ts +0 -147
  265. package/test/unit/agents/claude.test.ts +0 -107
  266. package/test/unit/analyze-classifier.test.ts +0 -216
  267. package/test/unit/analyze.test.ts +0 -224
  268. package/test/unit/auto-detect.test.ts +0 -250
  269. package/test/unit/cli-status-project-level.test.ts +0 -283
  270. package/test/unit/cli-status.test.ts +0 -418
  271. package/test/unit/commands/common.test.ts +0 -321
  272. package/test/unit/commands/logs.test.ts +0 -458
  273. package/test/unit/commands/runs.test.ts +0 -303
  274. package/test/unit/commands/unlock.test.ts +0 -320
  275. package/test/unit/config/defaults.test.ts +0 -70
  276. package/test/unit/config/quality-commands-schema.test.ts +0 -72
  277. package/test/unit/config/regression-gate-schema.test.ts +0 -160
  278. package/test/unit/config/smart-runner-flag.test.ts +0 -250
  279. package/test/unit/constitution-generators.test.ts +0 -161
  280. package/test/unit/constitution.test.ts +0 -210
  281. package/test/unit/context/context-autodetect.test.ts +0 -297
  282. package/test/unit/context/context-build.test.ts +0 -575
  283. package/test/unit/context/context-coverage.test.ts +0 -236
  284. package/test/unit/context/context-error.test.ts +0 -93
  285. package/test/unit/context/context-estimate-tokens.test.ts +0 -201
  286. package/test/unit/context/context-format.test.ts +0 -302
  287. package/test/unit/context/context-isolation.test.ts +0 -267
  288. package/test/unit/context/context-sort.test.ts +0 -93
  289. package/test/unit/context/context-story.test.ts +0 -108
  290. package/test/unit/context/prior-failures.test.ts +0 -463
  291. package/test/unit/context.test.ts +0 -1726
  292. package/test/unit/cost.test.ts +0 -231
  293. package/test/unit/crash-recovery.test.ts +0 -309
  294. package/test/unit/escalation.test.ts +0 -127
  295. package/test/unit/execution/lifecycle/run-completion.test.ts +0 -240
  296. package/test/unit/execution/lifecycle/run-regression.test.ts +0 -420
  297. package/test/unit/execution/pid-registry.test.ts +0 -241
  298. package/test/unit/execution/sequential-executor.test.ts +0 -235
  299. package/test/unit/execution/sfc-004-dead-code-cleanup.test.ts +0 -89
  300. package/test/unit/execution/structured-failure.test.ts +0 -415
  301. package/test/unit/execution-logging-stderr.test.ts +0 -157
  302. package/test/unit/execution-stage.test.ts +0 -123
  303. package/test/unit/fix-generator.test.ts +0 -276
  304. package/test/unit/formatters.test.ts +0 -468
  305. package/test/unit/greenfield.test.ts +0 -180
  306. package/test/unit/hooks/shell-security.test.ts +0 -40
  307. package/test/unit/interaction/auto-plugin.test.ts +0 -162
  308. package/test/unit/interaction/human-review-trigger.test.ts +0 -165
  309. package/test/unit/interaction-network-failures.test.ts +0 -390
  310. package/test/unit/interaction-plugins.test.ts +0 -472
  311. package/test/unit/logging/formatter.test.ts +0 -456
  312. package/test/unit/merge.test.ts +0 -269
  313. package/test/unit/metrics/aggregator.test.ts +0 -164
  314. package/test/unit/metrics/tracker.test.ts +0 -186
  315. package/test/unit/metrics.test.ts +0 -276
  316. package/test/unit/optimizer/noop.optimizer.test.ts +0 -125
  317. package/test/unit/optimizer/rule-based.optimizer.test.ts +0 -358
  318. package/test/unit/pipeline/event-bus.test.ts +0 -105
  319. package/test/unit/pipeline/routing-partial-override.test.ts +0 -121
  320. package/test/unit/pipeline/runner-retry.test.ts +0 -89
  321. package/test/unit/pipeline/stages/autofix.test.ts +0 -97
  322. package/test/unit/pipeline/stages/completion-review-gate.test.ts +0 -218
  323. package/test/unit/pipeline/stages/execution-ambiguity.test.ts +0 -311
  324. package/test/unit/pipeline/stages/execution-merge-conflict.test.ts +0 -218
  325. package/test/unit/pipeline/stages/rectify.test.ts +0 -101
  326. package/test/unit/pipeline/stages/regression-stage.test.ts +0 -69
  327. package/test/unit/pipeline/stages/review.test.ts +0 -201
  328. package/test/unit/pipeline/stages/routing-idempotence.test.ts +0 -139
  329. package/test/unit/pipeline/stages/routing-initial-complexity.test.ts +0 -321
  330. package/test/unit/pipeline/stages/routing-persistence.test.ts +0 -380
  331. package/test/unit/pipeline/stages/verify.test.ts +0 -267
  332. package/test/unit/pipeline/subscribers/events-writer.test.ts +0 -227
  333. package/test/unit/pipeline/subscribers/hooks.test.ts +0 -84
  334. package/test/unit/pipeline/subscribers/interaction.test.ts +0 -313
  335. package/test/unit/pipeline/subscribers/registry.test.ts +0 -149
  336. package/test/unit/pipeline/subscribers/reporters.test.ts +0 -90
  337. package/test/unit/pipeline/verify-smart-runner.test.ts +0 -345
  338. package/test/unit/prd-auto-default.test.ts +0 -291
  339. package/test/unit/prd-failure-category.test.ts +0 -177
  340. package/test/unit/prd-get-next-story.test.ts +0 -215
  341. package/test/unit/precheck/checks-warnings.test.ts +0 -114
  342. package/test/unit/precheck-checks.test.ts +0 -841
  343. package/test/unit/precheck-story-size-gate.test.ts +0 -288
  344. package/test/unit/precheck-types.test.ts +0 -143
  345. package/test/unit/prompts/builder.test.ts +0 -258
  346. package/test/unit/prompts/loader.test.ts +0 -355
  347. package/test/unit/prompts/sections/conventions.test.ts +0 -30
  348. package/test/unit/prompts/sections/isolation.test.ts +0 -35
  349. package/test/unit/prompts/sections/role-task.test.ts +0 -40
  350. package/test/unit/prompts/sections/sections.test.ts +0 -238
  351. package/test/unit/prompts/sections/story.test.ts +0 -45
  352. package/test/unit/prompts/sections/verdict.test.ts +0 -58
  353. package/test/unit/prompts.test.ts +0 -476
  354. package/test/unit/queue.test.ts +0 -237
  355. package/test/unit/rectification.test.ts +0 -285
  356. package/test/unit/registry.test.ts +0 -288
  357. package/test/unit/review/runner.test.ts +0 -117
  358. package/test/unit/routing/content-hash.test.ts +0 -99
  359. package/test/unit/routing/routing-stability.test.ts +0 -208
  360. package/test/unit/routing/strategies/llm.test.ts +0 -306
  361. package/test/unit/routing-advanced.test.ts +0 -313
  362. package/test/unit/routing-core.test.ts +0 -341
  363. package/test/unit/routing-strategies.test.ts +0 -440
  364. package/test/unit/storyid-events.test.ts +0 -213
  365. package/test/unit/tdd-verdict.test.ts +0 -492
  366. package/test/unit/test-output-parser.test.ts +0 -377
  367. package/test/unit/ui/tui-controls.test.ts +0 -335
  368. package/test/unit/ui/tui-cost-and-pty.test.ts +0 -190
  369. package/test/unit/ui/tui-layout.test.ts +0 -379
  370. package/test/unit/ui/tui-stories.test.ts +0 -333
  371. package/test/unit/unit-isolation.test.ts +0 -135
  372. package/test/unit/utils/git.test.ts +0 -50
  373. package/test/unit/utils/path-security.test.ts +0 -47
  374. package/test/unit/utils-helpers.test.ts +0 -318
  375. package/test/unit/verdict.test.ts +0 -325
  376. package/test/unit/verification/orchestrator-types.test.ts +0 -54
  377. package/test/unit/verification/orchestrator.test.ts +0 -66
  378. package/test/unit/verification/smart-runner-config.test.ts +0 -163
  379. package/test/unit/verification/smart-runner-discovery.test.ts +0 -354
  380. package/test/unit/verification/smart-runner.test.ts +0 -262
  381. package/test/unit/verification/strategies/acceptance.test.ts +0 -33
  382. package/test/unit/verification/strategies/regression.test.ts +0 -87
  383. package/test/unit/verification/strategies/scoped.test.ts +0 -100
  384. package/test/unit/worktree-manager.test.ts +0 -159
  385. package/tsconfig.json +0 -27
@@ -1,902 +0,0 @@
1
- // RE-ARCH: keep
2
- /**
3
- * End-to-End Integration Tests
4
- *
5
- * Tests the full nax workflow: plan → analyze → run
6
- * Uses a MockAgentAdapter to avoid requiring real Claude Code installation
7
- */
8
-
9
- import { afterAll, afterEach, beforeAll, beforeEach, describe, expect, test } from "bun:test";
10
- import { existsSync, mkdirSync, rmSync } from "node:fs";
11
- import { join } from "node:path";
12
- import { ALL_AGENTS } from "../../src/agents/registry";
13
- import type {
14
- AgentAdapter,
15
- AgentCapabilities,
16
- AgentResult,
17
- AgentRunOptions,
18
- DecomposeOptions,
19
- DecomposeResult,
20
- PlanOptions,
21
- PlanResult,
22
- } from "../../src/agents/types";
23
- import { analyzeFeature } from "../../src/cli/analyze";
24
- import { planCommand } from "../../src/cli/plan";
25
- import { DEFAULT_CONFIG } from "../../src/config";
26
- import type { NaxConfig } from "../../src/config";
27
- import { run } from "../../src/execution/runner";
28
- import { initLogger, resetLogger } from "../../src/logger";
29
- import { loadPRD } from "../../src/prd";
30
-
31
- /**
32
- * Mock Agent Adapter for testing
33
- *
34
- * Implements the AgentAdapter interface but doesn't spawn real processes.
35
- * Returns realistic, controllable results for testing scenarios.
36
- */
37
- class MockAgentAdapter implements AgentAdapter {
38
- readonly name = "mock";
39
- readonly displayName = "Mock Agent";
40
- readonly binary = "mock-agent";
41
-
42
- readonly capabilities: AgentCapabilities = {
43
- supportedTiers: ["fast", "balanced", "powerful"],
44
- maxContextTokens: 200_000,
45
- features: new Set(["tdd", "review", "refactor", "batch"]),
46
- };
47
-
48
- // Control behavior via flags
49
- public shouldFailRun = false;
50
- public shouldRateLimit = false;
51
- public shouldFailReview = false;
52
- public callCount = 0;
53
- public runCalls: AgentRunOptions[] = [];
54
- public planCalls: PlanOptions[] = [];
55
- public decomposeCalls: DecomposeOptions[] = [];
56
-
57
- // Hard iteration cap to prevent infinite retry loops in tests
58
- // Set to 5 to allow for story batching and escalation scenarios
59
- public maxAttempts = 5;
60
- private attemptCountMap = new Map<string, number>();
61
-
62
- async isInstalled(): Promise<boolean> {
63
- return true;
64
- }
65
-
66
- buildCommand(options: AgentRunOptions): string[] {
67
- return [this.binary, "--prompt", options.prompt];
68
- }
69
-
70
- async run(_options: AgentRunOptions): Promise<AgentResult> {
71
- this.callCount++;
72
- this.runCalls.push(_options);
73
-
74
- // Track attempts per unique prompt to prevent infinite loops
75
- const promptKey = _options.prompt.slice(0, 100);
76
- const currentAttempts = (this.attemptCountMap.get(promptKey) || 0) + 1;
77
- this.attemptCountMap.set(promptKey, currentAttempts);
78
-
79
- // Hard cap: fail after maxAttempts to prevent infinite retry loops
80
- if (currentAttempts > this.maxAttempts) {
81
- return {
82
- success: false,
83
- exitCode: 1,
84
- output: `Mock agent: max attempts (${this.maxAttempts}) exceeded for this prompt`,
85
- rateLimited: false,
86
- durationMs: 100,
87
- estimatedCost: 0.01,
88
- };
89
- }
90
-
91
- // Simulate execution time
92
- await Bun.sleep(10);
93
-
94
- // Rate limit scenario
95
- if (this.shouldRateLimit && this.callCount === 1) {
96
- return {
97
- success: false,
98
- exitCode: 1,
99
- output: "Rate limit exceeded. Too many requests.",
100
- rateLimited: true,
101
- durationMs: 100,
102
- estimatedCost: 0.0,
103
- };
104
- }
105
-
106
- // Failure scenario
107
- if (this.shouldFailRun) {
108
- return {
109
- success: false,
110
- exitCode: 1,
111
- output: "Agent execution failed: mock error",
112
- rateLimited: false,
113
- durationMs: 500,
114
- estimatedCost: 0.01,
115
- };
116
- }
117
-
118
- // Success scenario
119
- return {
120
- success: true,
121
- exitCode: 0,
122
- output: `Mock agent completed task: ${_options.prompt.slice(0, 50)}...\n\nToken usage: 1500 input, 800 output`,
123
- rateLimited: false,
124
- durationMs: 2000,
125
- estimatedCost: 0.015,
126
- };
127
- }
128
-
129
- async plan(_options: PlanOptions): Promise<PlanResult> {
130
- this.planCalls.push(_options);
131
-
132
- // Simulate planning time
133
- await Bun.sleep(10);
134
-
135
- const specContent = `# Feature: URL Shortener
136
-
137
- ## Problem
138
- We need a URL shortening service to make long URLs more shareable.
139
-
140
- ## Requirements
141
- - REQ-1: Accept long URLs and generate short codes
142
- - REQ-2: Redirect short codes to original URLs
143
- - REQ-3: Track click analytics
144
- - REQ-4: Support custom short codes (optional)
145
-
146
- ## Acceptance Criteria
147
- - AC-1: Short codes are unique and collision-free
148
- - AC-2: Redirects work with 301 status
149
- - AC-3: Click counts are tracked accurately
150
- - AC-4: API returns JSON responses
151
-
152
- ## Technical Notes
153
- - Use base62 encoding for short codes
154
- - Store mappings in database (consider Redis for caching)
155
- - Log all redirects for analytics
156
- - Validate URLs before shortening
157
-
158
- ## Out of Scope
159
- - User accounts and authentication (MVP only)
160
- - Custom domains
161
- - Link expiration
162
- `;
163
-
164
- return {
165
- specContent,
166
- conversationLog: "Mock planning session",
167
- };
168
- }
169
-
170
- async decompose(_options: DecomposeOptions): Promise<DecomposeResult> {
171
- this.decomposeCalls.push(_options);
172
-
173
- // Simulate decompose time
174
- await Bun.sleep(10);
175
-
176
- // Parse the spec content to determine what stories to generate
177
- // For URL shortener spec, return realistic stories
178
- const stories = [
179
- {
180
- id: "US-001",
181
- title: "Implement short code generation",
182
- description: "Create algorithm to generate unique base62 short codes from URLs",
183
- acceptanceCriteria: [
184
- "Short codes are 6-8 characters",
185
- "Codes use base62 charset (a-zA-Z0-9)",
186
- "Collision detection works",
187
- "Codes are URL-safe",
188
- ],
189
- tags: ["core", "algorithm"],
190
- dependencies: [],
191
- complexity: "medium" as const,
192
- relevantFiles: ["src/shortener/generator.ts", "src/utils/base62.ts"],
193
- reasoning: "Requires algorithmic implementation with collision handling. 2-3 files, ~150 LOC.",
194
- estimatedLOC: 150,
195
- risks: ["Collision probability under high load"],
196
- },
197
- {
198
- id: "US-002",
199
- title: "Add database storage for URL mappings",
200
- description: "Store short code → long URL mappings in database with timestamps",
201
- acceptanceCriteria: [
202
- "Database schema defined",
203
- "CRUD operations work",
204
- "Queries are indexed",
205
- "Timestamps recorded",
206
- ],
207
- tags: ["database", "storage"],
208
- dependencies: [],
209
- complexity: "medium" as const,
210
- relevantFiles: ["src/db/schema.ts", "src/db/repository.ts"],
211
- reasoning: "Standard CRUD with indexing. 2 files, ~120 LOC.",
212
- estimatedLOC: 120,
213
- risks: ["Database performance at scale"],
214
- },
215
- {
216
- id: "US-003",
217
- title: "Create redirect handler",
218
- description: "Route that redirects /:code to the original URL with 301 status",
219
- acceptanceCriteria: [
220
- "GET /:code returns 301 redirect",
221
- "404 for invalid codes",
222
- "Click count incremented",
223
- "Response headers correct",
224
- ],
225
- tags: ["api", "core"],
226
- dependencies: ["US-001", "US-002"],
227
- complexity: "simple" as const,
228
- relevantFiles: ["src/api/redirect.ts"],
229
- reasoning: "Simple handler with lookup and redirect. 1 file, ~50 LOC.",
230
- estimatedLOC: 50,
231
- risks: [],
232
- },
233
- {
234
- id: "US-004",
235
- title: "Build URL shortening handler",
236
- description: "POST /api/shorten route that accepts URL and returns short code",
237
- acceptanceCriteria: [
238
- "POST /api/shorten accepts JSON",
239
- "URL validation works",
240
- "Returns short code in response",
241
- "Error handling for invalid URLs",
242
- ],
243
- tags: ["api", "core"],
244
- dependencies: ["US-001", "US-002"],
245
- complexity: "simple" as const,
246
- relevantFiles: ["src/api/shorten.ts"],
247
- reasoning: "Standard POST handler. 1 file, ~60 LOC.",
248
- estimatedLOC: 60,
249
- risks: [],
250
- },
251
- {
252
- id: "US-005",
253
- title: "Implement click analytics tracking",
254
- description: "Track clicks on each short URL with timestamps and IP addresses",
255
- acceptanceCriteria: [
256
- "Clicks logged with timestamp",
257
- "IP address recorded (anonymized)",
258
- "Analytics queryable by code",
259
- "Performance doesn't block redirects",
260
- ],
261
- tags: ["analytics", "database"],
262
- dependencies: ["US-003"],
263
- complexity: "medium" as const,
264
- relevantFiles: ["src/analytics/tracker.ts", "src/db/analytics-schema.ts"],
265
- reasoning: "Async logging with privacy concerns. 2 files, ~100 LOC.",
266
- estimatedLOC: 100,
267
- risks: ["Privacy compliance (GDPR)", "Performance under high traffic"],
268
- },
269
- ];
270
-
271
- return { stories };
272
- }
273
-
274
/**
 * Put the mock back into its initial state so one test cannot influence the next.
 *
 * Replaces the recorded call lists with fresh arrays, empties the per-story
 * attempt map, zeroes the call counter and switches every failure-injection
 * flag off.
 */
reset() {
  // Recorded invocations and counters.
  this.runCalls = [];
  this.planCalls = [];
  this.decomposeCalls = [];
  this.attemptCountMap.clear();
  this.callCount = 0;

  // Failure-injection switches.
  this.shouldFailReview = false;
  this.shouldRateLimit = false;
  this.shouldFailRun = false;
}
284
- }
285
-
286
/**
 * Register a mock agent in the shared agent registry for testing.
 *
 * Appends `adapter` to the `ALL_AGENTS` array (mutating it in place) and hands
 * back a cleanup callback that removes that same instance again.
 *
 * @param adapter - Mock adapter instance to expose through the registry.
 * @returns Cleanup function. It removes at most one entry per call and does
 *   nothing when the adapter is no longer present, so it is safe to call twice.
 */
function registerMockAgent(adapter: MockAgentAdapter): () => void {
  ALL_AGENTS.push(adapter);

  return () => {
    // Look the adapter up by identity, not by name: a name-based search would
    // remove whichever "mock"-named entry comes first, which is not necessarily
    // the one registered here, and a repeated call would remove yet another.
    const index = ALL_AGENTS.indexOf(adapter);
    if (index >= 0) {
      ALL_AGENTS.splice(index, 1);
    }
  };
}
303
-
304
- describe("E2E: plan → analyze → run workflow", () => {
305
// Shared per-suite state. `testDir` and `mockAgent` are read by the tests below.
let testDir: string;
let mockAgent: MockAgentAdapter;
let unregisterMock: () => void;

// The mock adapter is created and registered once for the whole suite...
beforeAll(() => {
  mockAgent = new MockAgentAdapter();
  unregisterMock = registerMockAgent(mockAgent);
});

// ...and taken out of the registry once every test has finished.
afterAll(() => {
  unregisterMock();
});

beforeEach(() => {
  // Logger only reports errors, without chalk colouring.
  initLogger({ level: "error", useChalk: false });

  // Clear whatever the previous test recorded on the mock.
  mockAgent.reset();

  // Fresh scratch directory, named after the current timestamp.
  const stamp = Date.now();
  testDir = `/tmp/nax-e2e-test-${stamp}`;
  mkdirSync(testDir, { recursive: true });

  // Minimal project skeleton inside the scratch directory.
  setupTestProject(testDir);
});

afterEach(() => {
  // Remove the scratch directory if it is still there.
  if (existsSync(testDir)) {
    rmSync(testDir, { recursive: true, force: true });
  }

  // Drop the logger configured in beforeEach.
  resetLogger();
});
343
-
344
// Happy path across the whole tool: scaffold the nax directory, obtain a spec from
// the mock agent, decompose it into a PRD, then execute every story through `run`.
test("full workflow: init → plan → analyze → run", { timeout: 120000 }, async () => {
  const naxDir = join(testDir, "nax");
  const featureDir = join(naxDir, "features/url-shortener");
  mkdirSync(featureDir, { recursive: true });

  // Step 1: Initialize (config, constitution and hooks must exist afterwards)
  await initializeNgent(naxDir);
  for (const scaffolded of ["config.json", "constitution.md", "hooks.json"]) {
    expect(existsSync(join(naxDir, scaffolded))).toBe(true);
  }

  // Step 2: Plan (spec.md is written by hand because the mock agent spawns no real process)
  const config = createTestConfig();
  const specPath = join(featureDir, "spec.md");
  const planResult = await mockAgent.plan({
    prompt: "Build a URL shortener with analytics",
    workdir: testDir,
    interactive: false,
  });
  await Bun.write(specPath, planResult.specContent);

  expect(existsSync(specPath)).toBe(true);
  const specOnDisk = await Bun.file(specPath).text();
  expect(specOnDisk).toContain("# Feature: URL Shortener");
  expect(specOnDisk).toContain("## Requirements");
  expect(mockAgent.planCalls).toHaveLength(1);

  // Step 3: Analyze (decompose the spec into a PRD)
  const prd = await analyzeFeature({
    featureDir,
    featureName: "url-shortener",
    branchName: "feat/url-shortener",
    config,
  });

  const stories = prd.userStories;
  expect(stories).toHaveLength(5);
  expect(stories[0].id).toBe("US-001");
  expect(stories[0].routing?.complexity).toBe("medium");
  expect(stories[2].dependencies).toContain("US-001");
  expect(mockAgent.decomposeCalls).toHaveLength(1);

  // Persist the PRD so `run` can load it from disk.
  const prdPath = join(featureDir, "prd.json");
  await Bun.write(prdPath, JSON.stringify(prd, null, 2));

  // Step 4: Run (execute the stories via the pipeline)
  const runConfig = {
    ...config,
    execution: {
      ...config.execution,
      maxIterations: 10, // Enough for 5 stories
    },
  };
  const runResult = await run({
    prdPath,
    workdir: testDir,
    config: runConfig,
    hooks: { hooks: {} },
    feature: "url-shortener",
    featureDir,
    dryRun: false,
    useBatch: true, // Enable batching
    statusFile: join(testDir, "nax", "status.json"),
    skipPrecheck: true, // Skip precheck for E2E test (no git repo in temp dir)
  });

  expect(runResult.success).toBe(true);
  expect(runResult.storiesCompleted).toBe(5);
  expect(mockAgent.runCalls.length).toBeGreaterThan(0);

  // The PRD on disk must now show every story as passed.
  const finalPRD = await loadPRD(prdPath);
  const allPassed = finalPRD.userStories.every((story) => story.status === "passed");
  expect(allPassed).toBe(true);
});
417
-
418
// Single trivial story with story-level hooks configured: the agent must be
// invoked and the story must end up marked as passed in the PRD on disk.
test("pipeline stages execute in correct order", { timeout: 15000 }, async () => {
  const naxDir = join(testDir, "nax");
  const featureDir = join(naxDir, "features/simple-task");
  mkdirSync(featureDir, { recursive: true });

  await initializeNgent(naxDir);

  // Minimal PRD: one simple, pre-routed story.
  const loneStory = {
    id: "US-001",
    title: "Add console log",
    description: "Add a console.log statement to index.ts",
    acceptanceCriteria: ["Log statement added"],
    tags: [],
    dependencies: [],
    status: "pending" as const,
    passes: false,
    escalations: [],
    attempts: 0,
    routing: {
      complexity: "simple" as const,
      modelTier: "fast" as const,
      testStrategy: "test-after" as const,
      reasoning: "Trivial change",
      estimatedLOC: 1,
      risks: [],
    },
  };
  const prd = {
    project: "test",
    feature: "simple-task",
    branchName: "feat/simple-task",
    createdAt: new Date().toISOString(),
    updatedAt: new Date().toISOString(),
    userStories: [loneStory],
  };

  const prdPath = join(featureDir, "prd.json");
  await Bun.write(prdPath, JSON.stringify(prd, null, 2));

  const config = createTestConfig();

  // Execute with both story-level hooks enabled.
  await run({
    prdPath,
    workdir: testDir,
    config,
    hooks: {
      hooks: {
        "on-story-start": {
          command: "echo story-start",
          enabled: true,
          timeout: 60000,
        },
        "on-story-complete": {
          command: "echo story-complete",
          enabled: true,
          timeout: 60000,
        },
      },
    },
    feature: "simple-task",
    featureDir,
    dryRun: false,
    statusFile: join(testDir, "nax", "status.json"),
    skipPrecheck: true, // Skip precheck for E2E test (no git repo in temp dir)
  });

  // Execution stage ran: the agent was called at least once.
  expect(mockAgent.runCalls.length).toBeGreaterThan(0);

  // Completion stage ran: the story is recorded as passed.
  const finalPRD = await loadPRD(prdPath);
  const [completedStory] = finalPRD.userStories;
  expect(completedStory.status).toBe("passed");
});
494
-
495
// The agent's first `run` call reports a failure; every later call is delegated to
// the real mock implementation. The story must still end up as passed.
test("agent failure triggers escalation", { timeout: 60000 }, async () => {
  const ngentDir = join(testDir, "nax");
  const featureDir = join(ngentDir, "features/fail-task");
  mkdirSync(featureDir, { recursive: true });

  await initializeNgent(ngentDir);

  const prd = {
    project: "test",
    feature: "fail-task",
    branchName: "feat/fail-task",
    createdAt: new Date().toISOString(),
    updatedAt: new Date().toISOString(),
    userStories: [
      {
        id: "US-001",
        title: "Task that will fail",
        description: "This task will fail on first attempt",
        acceptanceCriteria: ["Task complete"],
        tags: [],
        dependencies: [],
        status: "pending" as const,
        passes: false,
        escalations: [],
        attempts: 0,
        routing: {
          complexity: "simple" as const,
          modelTier: "fast" as const,
          testStrategy: "test-after" as const,
          reasoning: "Simple task",
          estimatedLOC: 10,
          risks: [],
        },
      },
    ],
  };

  const prdPath = join(featureDir, "prd.json");
  await Bun.write(prdPath, JSON.stringify(prd, null, 2));

  // Keep the untouched method so it can be put back afterwards. The mock is
  // shared by the whole suite and `reset()` does not restore `run`, so without
  // the `finally` below this override would leak into every later test.
  const pristineRun = mockAgent.run;
  const originalRun = pristineRun.bind(mockAgent);

  // Make the first call fail, subsequent calls succeed.
  let failCount = 0;
  mockAgent.run = async (opts: AgentRunOptions): Promise<AgentResult> => {
    failCount++;
    if (failCount === 1) {
      // First call fails
      return {
        success: false,
        exitCode: 1,
        output: "Tests failed",
        rateLimited: false,
        durationMs: 100,
        estimatedCost: 0.01,
      };
    }
    // Subsequent calls succeed
    return originalRun(opts);
  };

  try {
    const config = createTestConfig();

    await run({
      prdPath,
      workdir: testDir,
      config,
      hooks: { hooks: {} },
      feature: "fail-task",
      featureDir,
      dryRun: false,
      statusFile: join(testDir, "nax", "status.json"),
      skipPrecheck: true, // Skip precheck for E2E test (no git repo in temp dir)
    });

    // The story should complete after the failed first attempt is retried.
    const finalPRD = await loadPRD(prdPath);
    expect(finalPRD.userStories[0].status).toBe("passed");
  } finally {
    // Restore the real implementation even when an assertion above throws.
    mockAgent.run = pristineRun;
  }
});
575
-
576
// With the mock's rate-limit flag switched on before the run, the run must
// still succeed and the story must end up as passed.
test("rate limit triggers retry with backoff", { timeout: 60000 }, async () => {
  const naxDir = join(testDir, "nax");
  const featureDir = join(naxDir, "features/rate-limit-task");
  mkdirSync(featureDir, { recursive: true });

  await initializeNgent(naxDir);

  const throttledStory = {
    id: "US-001",
    title: "Task with rate limit",
    description: "This task will hit rate limit once",
    acceptanceCriteria: ["Task complete"],
    tags: [],
    dependencies: [],
    status: "pending" as const,
    passes: false,
    escalations: [],
    attempts: 0,
    routing: {
      complexity: "simple" as const,
      modelTier: "fast" as const,
      testStrategy: "test-after" as const,
      reasoning: "Simple task",
      estimatedLOC: 10,
      risks: [],
    },
  };
  const prd = {
    project: "test",
    feature: "rate-limit-task",
    branchName: "feat/rate-limit",
    createdAt: new Date().toISOString(),
    updatedAt: new Date().toISOString(),
    userStories: [throttledStory],
  };

  const prdPath = join(featureDir, "prd.json");
  await Bun.write(prdPath, JSON.stringify(prd, null, 2));

  // Arm the rate-limit behaviour on the mock before anything runs.
  mockAgent.shouldRateLimit = true;

  const config = createTestConfig();

  const outcome = await run({
    prdPath,
    workdir: testDir,
    config,
    hooks: { hooks: {} },
    feature: "rate-limit-task",
    featureDir,
    dryRun: false,
    statusFile: join(testDir, "nax", "status.json"),
    skipPrecheck: true, // Skip precheck for E2E test (no git repo in temp dir)
  });

  expect(outcome.success).toBe(true);

  const finalPRD = await loadPRD(prdPath);
  const [story] = finalPRD.userStories;
  expect(story.status).toBe("passed");
});
638
-
639
test.skip("review phase failure marks story as failed (skipped - review disabled in tests)", async () => {
  // Intentionally empty. The test config turns the review phase off so that the
  // typecheck/lint/test commands do not have to be mocked. With review enabled,
  // this is where the handling of a failing review would be verified.
});
644
-
645
// Three independent, simple stories executed with batching enabled: all of them
// must pass while the agent is invoked fewer times than there are stories.
test("story batching groups simple stories", { timeout: 15000 }, async () => {
  const naxDir = join(testDir, "nax");
  const featureDir = join(naxDir, "features/batch-test");
  mkdirSync(featureDir, { recursive: true });

  await initializeNgent(naxDir);

  // The three stories differ only in their sequence number.
  const trivialStory = (n: number) => ({
    id: `US-00${n}`,
    title: `Add log statement ${n}`,
    description: `Add console.log to file${n}.ts`,
    acceptanceCriteria: ["Log added"],
    tags: [],
    dependencies: [],
    status: "pending" as const,
    passes: false,
    escalations: [],
    attempts: 0,
    routing: {
      complexity: "simple" as const,
      modelTier: "fast" as const,
      testStrategy: "test-after" as const,
      reasoning: "Trivial",
      estimatedLOC: 1,
      risks: [],
    },
  });

  const prd = {
    project: "test",
    feature: "batch-test",
    branchName: "feat/batch",
    createdAt: new Date().toISOString(),
    updatedAt: new Date().toISOString(),
    userStories: [1, 2, 3].map(trivialStory),
  };

  const prdPath = join(featureDir, "prd.json");
  await Bun.write(prdPath, JSON.stringify(prd, null, 2));

  const config = createTestConfig();

  const outcome = await run({
    prdPath,
    workdir: testDir,
    config,
    hooks: { hooks: {} },
    feature: "batch-test",
    featureDir,
    dryRun: false,
    useBatch: true,
    statusFile: join(testDir, "nax", "status.json"),
    skipPrecheck: true, // Skip precheck for E2E test (no git repo in temp dir)
  });

  expect(outcome.success).toBe(true);
  expect(outcome.storiesCompleted).toBe(3);

  // With batching, there should be fewer agent calls than stories
  // (3 simple stories should be batched into 1 call)
  expect(mockAgent.runCalls.length).toBeLessThan(3);

  // Every story must be recorded as passed.
  const finalPRD = await loadPRD(prdPath);
  const allPassed = finalPRD.userStories.every((story) => story.status === "passed");
  expect(allPassed).toBe(true);
});
751
- });
752
-
753
- // ── Helper Functions ──────────────────────────────────
754
-
755
/**
 * Lay down a minimal TypeScript project inside `dir`.
 *
 * Creates `src/` and `test/` synchronously, then writes `src/index.ts`,
 * `test/index.test.ts`, `package.json` and `tsconfig.json` via `Bun.write`.
 *
 * The writes are asynchronous. Previously their promises were dropped, so a
 * caller had no way to wait for the files or to notice a failed write. The
 * function now returns one promise covering all four writes; callers that need
 * the files on disk should await it. Callers that ignore the return value get
 * the same fire-and-forget behaviour as before.
 *
 * @param dir - Root directory of the scratch project (must be creatable).
 * @returns Promise that resolves once every file has been written and rejects
 *   if any write fails. Directory-creation errors are still thrown synchronously.
 */
function setupTestProject(dir: string): Promise<void> {
  // Directories first (synchronous).
  mkdirSync(join(dir, "src"), { recursive: true });
  mkdirSync(join(dir, "test"), { recursive: true });

  const packageJson = {
    name: "e2e-test-project",
    version: "1.0.0",
    dependencies: {
      zod: "^4.0.0",
    },
    devDependencies: {
      typescript: "^5.0.0",
      "@types/bun": "^1.0.0",
    },
  };

  const tsconfig = {
    compilerOptions: {
      target: "ES2022",
      module: "ESNext",
      moduleResolution: "bundler",
      strict: true,
      esModuleInterop: true,
      skipLibCheck: true,
      forceConsistentCasingInFileNames: true,
      outDir: "./dist",
    },
    include: ["src/**/*"],
    exclude: ["node_modules", "dist"],
  };

  const writes = [
    Bun.write(join(dir, "src/index.ts"), "export const greet = () => 'Hello';\n"),
    // The test file lives in <dir>/test, so the source module is one level up
    // ("../src/index"); the previous "../../src/index" pointed outside the project.
    Bun.write(
      join(dir, "test/index.test.ts"),
      "import { expect, test } from 'bun:test';\nimport { greet } from '../src/index';\n\ntest('greet', () => {\n expect(greet()).toBe('Hello');\n});\n",
    ),
    Bun.write(join(dir, "package.json"), JSON.stringify(packageJson, null, 2)),
    Bun.write(join(dir, "tsconfig.json"), JSON.stringify(tsconfig, null, 2)),
  ];

  return Promise.all(writes).then(() => undefined);
}
810
-
811
/**
 * Scaffold a nax directory: `features/` and `hooks/` sub-directories plus
 * `config.json` (a dump of `DEFAULT_CONFIG`), `hooks.json` (two disabled hooks)
 * and `constitution.md`.
 *
 * @param ngentDir - Directory that receives the scaffold.
 * @returns Promise that resolves after the three files have been written, one after another.
 */
async function initializeNgent(ngentDir: string): Promise<void> {
  // Directory structure
  for (const subdir of ["features", "hooks"]) {
    mkdirSync(join(ngentDir, subdir), { recursive: true });
  }

  const hooksManifest = {
    hooks: {
      "on-start": { command: "echo nax started", enabled: false },
      "on-complete": { command: "echo nax complete", enabled: false },
    },
  };

  const constitution = `# Project Constitution

## Coding Standards
- Write clear, maintainable code
- Follow project conventions

## Testing Requirements
- All code must have tests
- Aim for 80%+ coverage

## Architecture Rules
- Keep functions small and focused
- Avoid tight coupling
`;

  // config.json
  const configPath = join(ngentDir, "config.json");
  await Bun.write(configPath, JSON.stringify(DEFAULT_CONFIG, null, 2));

  // hooks.json
  const hooksPath = join(ngentDir, "hooks.json");
  await Bun.write(hooksPath, JSON.stringify(hooksManifest, null, 2));

  // constitution.md
  const constitutionPath = join(ngentDir, "constitution.md");
  await Bun.write(constitutionPath, constitution);
}
853
-
854
/**
 * Build the configuration used by the E2E tests.
 *
 * Starts from `DEFAULT_CONFIG` and overrides, section by section, only what the
 * tests need; every other setting is carried over unchanged. Neither
 * `DEFAULT_CONFIG` nor its nested sections are mutated.
 *
 * @returns A new config object routed to the "mock" agent, with review,
 *   acceptance, the regression gate, rectification and quality commands disabled.
 */
function createTestConfig(): NaxConfig {
  const base = DEFAULT_CONFIG;

  const autoMode: NaxConfig["autoMode"] = {
    ...base.autoMode,
    defaultAgent: "mock", // Use our mock agent
    escalation: {
      ...base.autoMode.escalation,
      enabled: true,
      tierOrder: [
        { tier: "fast", attempts: 1 },
        { tier: "balanced", attempts: 1 },
      ],
    },
  };

  const analyze: NaxConfig["analyze"] = {
    ...base.analyze,
    llmEnhanced: true, // Enable LLM decompose
  };

  const execution: NaxConfig["execution"] = {
    ...base.execution,
    maxIterations: 15, // Reduced from 20 to fail faster in tests
    maxStoriesPerFeature: 500,
    regressionGate: {
      ...base.execution.regressionGate,
      enabled: false, // Disable regression gate for E2E tests
    },
    rectification: {
      ...base.execution.rectification,
      enabled: false, // Disable rectification for E2E tests
    },
  };

  const quality: NaxConfig["quality"] = {
    ...base.quality,
    requireTypecheck: false,
    requireLint: false,
    requireTests: false,
    commands: {}, // No quality commands for E2E tests
  };

  const review: NaxConfig["review"] = {
    ...base.review,
    enabled: false, // Disable review for tests (would require mocking typecheck/lint/test)
  };

  const acceptance: NaxConfig["acceptance"] = {
    ...base.acceptance,
    enabled: false, // Disable acceptance for E2E tests (no real acceptance tests)
  };

  return { ...base, autoMode, analyze, execution, quality, review, acceptance };
}