@nathapp/nax 0.18.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (459) hide show
  1. package/.gitlab-ci.yml +96 -0
  2. package/BRIEF.md +140 -0
  3. package/CHANGELOG.md +60 -0
  4. package/CLAUDE.md +159 -0
  5. package/README.md +373 -0
  6. package/US-007-IMPLEMENTATION.md +139 -0
  7. package/bin/nax.ts +930 -0
  8. package/biome.json +14 -0
  9. package/bun.lock +168 -0
  10. package/bunfig.toml +11 -0
  11. package/docs/20260216-fix-plan-context-review.md +56 -0
  12. package/docs/20260216-relentless-vs-ngent-comparison.md +208 -0
  13. package/docs/20260216-v02-plan.md +136 -0
  14. package/docs/20260216-v02-review.md +685 -0
  15. package/docs/20260217-dogfood-findings.md +56 -0
  16. package/docs/20260217-p2-plus-plan.md +117 -0
  17. package/docs/20260217-partial-fixes-plan.md +62 -0
  18. package/docs/20260217-plan-analyze-spec.md +117 -0
  19. package/docs/20260217-post-impl-review.md +1137 -0
  20. package/docs/20260217-quick-wins-plan.md +66 -0
  21. package/docs/20260217-split-runner-plan.md +75 -0
  22. package/docs/20260217-v03-impl-plan.md +80 -0
  23. package/docs/20260217-v03-post-impl-review.md +589 -0
  24. package/docs/20260217-v04-impl-plan.md +86 -0
  25. package/docs/20260217-v05-post-impl-review.md +850 -0
  26. package/docs/20260217-v06-post-impl-review.md +817 -0
  27. package/docs/20260218-adr003-port-plan.md +151 -0
  28. package/docs/20260218-review-adr003-verification.md +175 -0
  29. package/docs/20260219-fix-plan-bug16-19.md +79 -0
  30. package/docs/20260219-fix-plan-bug20-22.md +114 -0
  31. package/docs/20260219-plan-llm-routing.md +116 -0
  32. package/docs/20260219-review-bug20-22-fixes.md +135 -0
  33. package/docs/20260219-routing-baseline-keyword.md +63 -0
  34. package/docs/20260220-plan-structured-logging-p1.md +80 -0
  35. package/docs/20260220-plan-structured-logging-p2.md +37 -0
  36. package/docs/20260220-review-llm-routing.md +180 -0
  37. package/docs/20260220-review-post-fix-llm-routing.md +70 -0
  38. package/docs/20260221-fix-plan-relevantfiles-split.md +101 -0
  39. package/docs/20260221-fix-plan-routing-mode.md +125 -0
  40. package/docs/20260221-review-v0.9-implementation.md +379 -0
  41. package/docs/20260222-fix-plan-v091-routing-isolation.md +197 -0
  42. package/docs/20260223-fix-plan-prompt-audit.md +62 -0
  43. package/docs/20260224-nax-roadmap-phases.md +189 -0
  44. package/docs/20260225-phase2-llm-service-layer.md +401 -0
  45. package/docs/20260225-review-v0.10.1.md +187 -0
  46. package/docs/20260303-v010-implementation-plan.md +165 -0
  47. package/docs/CLAUDE.md.bak +191 -0
  48. package/docs/ROADMAP.md +165 -0
  49. package/docs/SPEC-rectification.md +0 -0
  50. package/docs/SPEC.md +324 -0
  51. package/docs/US-001-plugin-loading-verification.md +152 -0
  52. package/docs/architecture-analysis.md +1076 -0
  53. package/docs/bugs/BUG-21-escalation-null-attempts.md +48 -0
  54. package/docs/bugs-from-dogfood-run-c.md +243 -0
  55. package/docs/code-review-20260228.md +612 -0
  56. package/docs/code-review-v0.15.0.md +629 -0
  57. package/docs/hook-lifecycle-test-plan.md +149 -0
  58. package/docs/releases/v0.11.0-and-earlier.md +20 -0
  59. package/docs/releases/v0.12.0.md +15 -0
  60. package/docs/releases/v0.13.0.md +14 -0
  61. package/docs/releases/v0.14.0.md +20 -0
  62. package/docs/releases/v0.14.1.md +36 -0
  63. package/docs/releases/v0.14.2.md +51 -0
  64. package/docs/releases/v0.14.3.md +174 -0
  65. package/docs/releases/v0.14.4.md +94 -0
  66. package/docs/releases/v0.15.0.md +502 -0
  67. package/docs/releases/v0.15.1.md +170 -0
  68. package/docs/releases/v0.15.3.md +193 -0
  69. package/docs/specs/status-file-v0.10.1.md +812 -0
  70. package/docs/v0.10-global-config.md +206 -0
  71. package/docs/v0.10-plugin-system.md +415 -0
  72. package/docs/v0.10-prompt-optimizer.md +234 -0
  73. package/docs/v0.3-spec.md +244 -0
  74. package/docs/v0.4-spec.md +140 -0
  75. package/docs/v0.5-spec.md +237 -0
  76. package/docs/v0.6-spec.md +371 -0
  77. package/docs/v0.7-spec.md +177 -0
  78. package/docs/v0.8-llm-routing.md +206 -0
  79. package/docs/v0.8-structured-logging.md +132 -0
  80. package/docs/v0.9.3-prompt-audit.md +112 -0
  81. package/examples/plugins/console-reporter/index.test.ts +207 -0
  82. package/examples/plugins/console-reporter/index.ts +110 -0
  83. package/nax/config.json +147 -0
  84. package/nax/features/bugfix-v0171/prd.json +52 -0
  85. package/nax/features/config-management/prd.json +108 -0
  86. package/nax/features/config-management/progress.txt +5 -0
  87. package/nax/features/diagnose/acceptance.test.ts +412 -0
  88. package/nax/features/diagnose/prd.json +41 -0
  89. package/nax/features/orchestration-fixes/prd.json +89 -0
  90. package/nax/features/orchestration-fixes/progress.txt +1 -0
  91. package/nax/features/plugin-integration/US-007-VERIFICATION.md +259 -0
  92. package/nax/features/plugin-integration/prd.json +208 -0
  93. package/nax/features/plugin-integration/progress.txt +5 -0
  94. package/nax/features/precheck/prd.json +205 -0
  95. package/nax/features/precheck/progress.txt +15 -0
  96. package/nax/features/structured-logging/prd.json +199 -0
  97. package/nax/features/unlock/prd.json +36 -0
  98. package/package.json +47 -0
  99. package/src/acceptance/fix-generator.ts +348 -0
  100. package/src/acceptance/generator.ts +282 -0
  101. package/src/acceptance/index.ts +30 -0
  102. package/src/acceptance/types.ts +79 -0
  103. package/src/agents/claude-decompose.ts +169 -0
  104. package/src/agents/claude-plan.ts +139 -0
  105. package/src/agents/claude.ts +324 -0
  106. package/src/agents/cost.ts +268 -0
  107. package/src/agents/index.ts +13 -0
  108. package/src/agents/registry.ts +48 -0
  109. package/src/agents/types-extended.ts +133 -0
  110. package/src/agents/types.ts +113 -0
  111. package/src/agents/validation.ts +69 -0
  112. package/src/analyze/classifier.ts +305 -0
  113. package/src/analyze/index.ts +16 -0
  114. package/src/analyze/scanner.ts +175 -0
  115. package/src/analyze/types.ts +51 -0
  116. package/src/cli/accept.ts +108 -0
  117. package/src/cli/analyze-parser.ts +284 -0
  118. package/src/cli/analyze.ts +207 -0
  119. package/src/cli/config.ts +561 -0
  120. package/src/cli/constitution.ts +109 -0
  121. package/src/cli/diagnose-analysis.ts +159 -0
  122. package/src/cli/diagnose-formatter.ts +87 -0
  123. package/src/cli/diagnose.ts +203 -0
  124. package/src/cli/generate.ts +127 -0
  125. package/src/cli/index.ts +37 -0
  126. package/src/cli/init.ts +188 -0
  127. package/src/cli/interact.ts +295 -0
  128. package/src/cli/plan.ts +198 -0
  129. package/src/cli/plugins.ts +111 -0
  130. package/src/cli/prompts.ts +295 -0
  131. package/src/cli/runs.ts +174 -0
  132. package/src/cli/status-cost.ts +151 -0
  133. package/src/cli/status-features.ts +338 -0
  134. package/src/cli/status.ts +13 -0
  135. package/src/commands/common.ts +171 -0
  136. package/src/commands/diagnose.ts +17 -0
  137. package/src/commands/index.ts +8 -0
  138. package/src/commands/logs.ts +384 -0
  139. package/src/commands/precheck.ts +86 -0
  140. package/src/commands/unlock.ts +96 -0
  141. package/src/config/defaults.ts +160 -0
  142. package/src/config/index.ts +22 -0
  143. package/src/config/loader.ts +121 -0
  144. package/src/config/merger.ts +147 -0
  145. package/src/config/path-security.ts +121 -0
  146. package/src/config/paths.ts +27 -0
  147. package/src/config/schema.ts +56 -0
  148. package/src/config/schemas.ts +286 -0
  149. package/src/config/types.ts +423 -0
  150. package/src/config/validate.ts +103 -0
  151. package/src/constitution/generator.ts +191 -0
  152. package/src/constitution/generators/aider.ts +41 -0
  153. package/src/constitution/generators/claude.ts +35 -0
  154. package/src/constitution/generators/cursor.ts +36 -0
  155. package/src/constitution/generators/opencode.ts +38 -0
  156. package/src/constitution/generators/types.ts +33 -0
  157. package/src/constitution/generators/windsurf.ts +36 -0
  158. package/src/constitution/index.ts +10 -0
  159. package/src/constitution/loader.ts +133 -0
  160. package/src/constitution/types.ts +31 -0
  161. package/src/context/auto-detect.ts +227 -0
  162. package/src/context/builder.ts +246 -0
  163. package/src/context/elements.ts +83 -0
  164. package/src/context/formatter.ts +107 -0
  165. package/src/context/generator.ts +129 -0
  166. package/src/context/generators/aider.ts +34 -0
  167. package/src/context/generators/claude.ts +28 -0
  168. package/src/context/generators/cursor.ts +28 -0
  169. package/src/context/generators/opencode.ts +30 -0
  170. package/src/context/generators/windsurf.ts +28 -0
  171. package/src/context/greenfield.ts +114 -0
  172. package/src/context/index.ts +33 -0
  173. package/src/context/injector.ts +279 -0
  174. package/src/context/test-scanner.ts +370 -0
  175. package/src/context/types.ts +98 -0
  176. package/src/errors.ts +67 -0
  177. package/src/execution/batching.ts +157 -0
  178. package/src/execution/crash-recovery.ts +373 -0
  179. package/src/execution/escalation/escalation.ts +44 -0
  180. package/src/execution/escalation/index.ts +13 -0
  181. package/src/execution/escalation/tier-escalation.ts +295 -0
  182. package/src/execution/escalation/tier-outcome.ts +158 -0
  183. package/src/execution/helpers.ts +38 -0
  184. package/src/execution/index.ts +45 -0
  185. package/src/execution/lifecycle/acceptance-loop.ts +272 -0
  186. package/src/execution/lifecycle/headless-formatter.ts +85 -0
  187. package/src/execution/lifecycle/index.ts +12 -0
  188. package/src/execution/lifecycle/parallel-lifecycle.ts +101 -0
  189. package/src/execution/lifecycle/precheck-runner.ts +140 -0
  190. package/src/execution/lifecycle/run-cleanup.ts +81 -0
  191. package/src/execution/lifecycle/run-completion.ts +129 -0
  192. package/src/execution/lifecycle/run-initialization.ts +141 -0
  193. package/src/execution/lifecycle/run-lifecycle.ts +312 -0
  194. package/src/execution/lifecycle/run-setup.ts +204 -0
  195. package/src/execution/lifecycle/story-hooks.ts +38 -0
  196. package/src/execution/lifecycle/story-size-prompts.ts +123 -0
  197. package/src/execution/lock.ts +115 -0
  198. package/src/execution/parallel-executor.ts +216 -0
  199. package/src/execution/parallel.ts +400 -0
  200. package/src/execution/pid-registry.ts +280 -0
  201. package/src/execution/pipeline-result-handler.ts +388 -0
  202. package/src/execution/post-verify-rectification.ts +188 -0
  203. package/src/execution/post-verify.ts +274 -0
  204. package/src/execution/progress.ts +25 -0
  205. package/src/execution/prompts.ts +127 -0
  206. package/src/execution/queue-handler.ts +109 -0
  207. package/src/execution/rectification.ts +13 -0
  208. package/src/execution/runner.ts +377 -0
  209. package/src/execution/sequential-executor.ts +388 -0
  210. package/src/execution/status-file.ts +264 -0
  211. package/src/execution/status-writer.ts +139 -0
  212. package/src/execution/story-context.ts +229 -0
  213. package/src/execution/test-output-parser.ts +14 -0
  214. package/src/execution/verification.ts +72 -0
  215. package/src/hooks/index.ts +2 -0
  216. package/src/hooks/runner.ts +286 -0
  217. package/src/hooks/types.ts +67 -0
  218. package/src/interaction/chain.ts +154 -0
  219. package/src/interaction/index.ts +60 -0
  220. package/src/interaction/init.ts +83 -0
  221. package/src/interaction/plugins/auto.ts +217 -0
  222. package/src/interaction/plugins/cli.ts +300 -0
  223. package/src/interaction/plugins/telegram.ts +384 -0
  224. package/src/interaction/plugins/webhook.ts +258 -0
  225. package/src/interaction/state.ts +171 -0
  226. package/src/interaction/triggers.ts +229 -0
  227. package/src/interaction/types.ts +163 -0
  228. package/src/logger/formatters.ts +84 -0
  229. package/src/logger/index.ts +16 -0
  230. package/src/logger/logger.ts +298 -0
  231. package/src/logger/types.ts +48 -0
  232. package/src/logging/formatter.ts +355 -0
  233. package/src/logging/index.ts +22 -0
  234. package/src/logging/types.ts +93 -0
  235. package/src/metrics/aggregator.ts +190 -0
  236. package/src/metrics/index.ts +14 -0
  237. package/src/metrics/tracker.ts +200 -0
  238. package/src/metrics/types.ts +109 -0
  239. package/src/optimizer/index.ts +62 -0
  240. package/src/optimizer/noop.optimizer.ts +24 -0
  241. package/src/optimizer/rule-based.optimizer.ts +248 -0
  242. package/src/optimizer/types.ts +53 -0
  243. package/src/pipeline/events.ts +130 -0
  244. package/src/pipeline/index.ts +19 -0
  245. package/src/pipeline/runner.ts +161 -0
  246. package/src/pipeline/stages/acceptance.ts +197 -0
  247. package/src/pipeline/stages/completion.ts +99 -0
  248. package/src/pipeline/stages/constitution.ts +63 -0
  249. package/src/pipeline/stages/context.ts +117 -0
  250. package/src/pipeline/stages/execution.ts +194 -0
  251. package/src/pipeline/stages/index.ts +62 -0
  252. package/src/pipeline/stages/optimizer.ts +74 -0
  253. package/src/pipeline/stages/prompt.ts +57 -0
  254. package/src/pipeline/stages/queue-check.ts +103 -0
  255. package/src/pipeline/stages/review.ts +181 -0
  256. package/src/pipeline/stages/routing.ts +81 -0
  257. package/src/pipeline/stages/verify.ts +100 -0
  258. package/src/pipeline/types.ts +167 -0
  259. package/src/plugins/index.ts +31 -0
  260. package/src/plugins/loader.ts +287 -0
  261. package/src/plugins/registry.ts +168 -0
  262. package/src/plugins/types.ts +327 -0
  263. package/src/plugins/validator.ts +352 -0
  264. package/src/prd/index.ts +172 -0
  265. package/src/prd/types.ts +202 -0
  266. package/src/precheck/checks-blockers.ts +391 -0
  267. package/src/precheck/checks-warnings.ts +142 -0
  268. package/src/precheck/checks.ts +30 -0
  269. package/src/precheck/index.ts +247 -0
  270. package/src/precheck/story-size-gate.ts +144 -0
  271. package/src/precheck/types.ts +31 -0
  272. package/src/queue/index.ts +2 -0
  273. package/src/queue/manager.ts +254 -0
  274. package/src/queue/types.ts +54 -0
  275. package/src/review/index.ts +8 -0
  276. package/src/review/runner.ts +172 -0
  277. package/src/review/types.ts +66 -0
  278. package/src/routing/builder.ts +81 -0
  279. package/src/routing/chain.ts +74 -0
  280. package/src/routing/index.ts +16 -0
  281. package/src/routing/loader.ts +58 -0
  282. package/src/routing/router.ts +303 -0
  283. package/src/routing/strategies/adaptive.ts +215 -0
  284. package/src/routing/strategies/index.ts +8 -0
  285. package/src/routing/strategies/keyword.ts +163 -0
  286. package/src/routing/strategies/llm-prompts.ts +209 -0
  287. package/src/routing/strategies/llm.ts +235 -0
  288. package/src/routing/strategies/manual.ts +50 -0
  289. package/src/routing/strategy.ts +99 -0
  290. package/src/tdd/cleanup.ts +111 -0
  291. package/src/tdd/index.ts +23 -0
  292. package/src/tdd/isolation.ts +123 -0
  293. package/src/tdd/orchestrator.ts +383 -0
  294. package/src/tdd/prompts.ts +270 -0
  295. package/src/tdd/rectification-gate.ts +183 -0
  296. package/src/tdd/session-runner.ts +179 -0
  297. package/src/tdd/types.ts +81 -0
  298. package/src/tdd/verdict.ts +271 -0
  299. package/src/tui/App.tsx +265 -0
  300. package/src/tui/components/AgentPanel.tsx +75 -0
  301. package/src/tui/components/CostOverlay.tsx +118 -0
  302. package/src/tui/components/HelpOverlay.tsx +107 -0
  303. package/src/tui/components/StatusBar.tsx +63 -0
  304. package/src/tui/components/StoriesPanel.tsx +177 -0
  305. package/src/tui/hooks/useKeyboard.ts +142 -0
  306. package/src/tui/hooks/useLayout.ts +137 -0
  307. package/src/tui/hooks/usePipelineEvents.ts +183 -0
  308. package/src/tui/hooks/usePty.ts +194 -0
  309. package/src/tui/index.tsx +38 -0
  310. package/src/tui/types.ts +76 -0
  311. package/src/utils/git.ts +83 -0
  312. package/src/utils/queue-writer.ts +54 -0
  313. package/src/verification/executor.ts +235 -0
  314. package/src/verification/gate.ts +207 -0
  315. package/src/verification/index.ts +12 -0
  316. package/src/verification/parser.ts +230 -0
  317. package/src/verification/rectification.ts +108 -0
  318. package/src/verification/types.ts +113 -0
  319. package/src/worktree/dispatcher.ts +65 -0
  320. package/src/worktree/index.ts +2 -0
  321. package/src/worktree/manager.ts +187 -0
  322. package/src/worktree/merge.ts +301 -0
  323. package/src/worktree/types.ts +4 -0
  324. package/test/TEST_COVERAGE_US001.md +217 -0
  325. package/test/TEST_COVERAGE_US003.md +84 -0
  326. package/test/TEST_COVERAGE_US005.md +86 -0
  327. package/test/US-002-orchestrator.test.ts +246 -0
  328. package/test/acceptance/cm-003-default-view.test.ts +194 -0
  329. package/test/execution/pid-registry.test.ts +240 -0
  330. package/test/execution/post-verify.test.ts +224 -0
  331. package/test/helpers/timeout.ts +42 -0
  332. package/test/integration/US-002-TEST-SUMMARY.md +107 -0
  333. package/test/integration/US-003-TEST-SUMMARY.md +149 -0
  334. package/test/integration/US-004-TEST-SUMMARY.md +106 -0
  335. package/test/integration/US-005-TEST-SUMMARY.md +138 -0
  336. package/test/integration/US-007-TEST-SUMMARY.md +100 -0
  337. package/test/integration/agent-validation.test.ts +439 -0
  338. package/test/integration/analyze-integration.test.ts +261 -0
  339. package/test/integration/analyze-scanner.test.ts +131 -0
  340. package/test/integration/cli-config-default-edge-cases.test.ts +222 -0
  341. package/test/integration/cli-config-default-view.test.ts +229 -0
  342. package/test/integration/cli-config-diff.test.ts +460 -0
  343. package/test/integration/cli-config.test.ts +736 -0
  344. package/test/integration/cli-diagnose.test.ts +592 -0
  345. package/test/integration/cli-logs.test.ts +314 -0
  346. package/test/integration/cli-plugins.test.ts +678 -0
  347. package/test/integration/cli-precheck.test.ts +371 -0
  348. package/test/integration/cli-run-headless.test.ts +173 -0
  349. package/test/integration/cli.test.ts +75 -0
  350. package/test/integration/config/merger.test.ts +465 -0
  351. package/test/integration/config/paths.test.ts +51 -0
  352. package/test/integration/config-loader.test.ts +265 -0
  353. package/test/integration/config.test.ts +444 -0
  354. package/test/integration/context-integration.test.ts +702 -0
  355. package/test/integration/context-provider-injection.test.ts +506 -0
  356. package/test/integration/context-verification-integration.test.ts +295 -0
  357. package/test/integration/e2e.test.ts +896 -0
  358. package/test/integration/execution.test.ts +625 -0
  359. package/test/integration/helpers.test.ts +295 -0
  360. package/test/integration/hooks.test.ts +361 -0
  361. package/test/integration/interaction-chain-pipeline.test.ts +464 -0
  362. package/test/integration/isolation.test.ts +143 -0
  363. package/test/integration/logger.test.ts +461 -0
  364. package/test/integration/parallel.test.ts +250 -0
  365. package/test/integration/path-security.test.ts +173 -0
  366. package/test/integration/pipeline-acceptance.test.ts +302 -0
  367. package/test/integration/pipeline-events.test.ts +475 -0
  368. package/test/integration/pipeline.test.ts +658 -0
  369. package/test/integration/plan.test.ts +157 -0
  370. package/test/integration/plugin-routing.test.ts +921 -0
  371. package/test/integration/plugins/config-integration.test.ts +172 -0
  372. package/test/integration/plugins/config-resolution.test.ts +522 -0
  373. package/test/integration/plugins/loader.test.ts +641 -0
  374. package/test/integration/plugins/registry.test.ts +746 -0
  375. package/test/integration/plugins/validator.test.ts +563 -0
  376. package/test/integration/prd-pause.test.ts +205 -0
  377. package/test/integration/prd-resolvers.test.ts +185 -0
  378. package/test/integration/precheck-integration.test.ts +468 -0
  379. package/test/integration/precheck.test.ts +805 -0
  380. package/test/integration/progress.test.ts +34 -0
  381. package/test/integration/rectification-flow.test.ts +512 -0
  382. package/test/integration/reporter-lifecycle.test.ts +860 -0
  383. package/test/integration/review-config-commands.test.ts +319 -0
  384. package/test/integration/review-config-schema.test.ts +116 -0
  385. package/test/integration/review-plugin-integration.test.ts +722 -0
  386. package/test/integration/review.test.ts +149 -0
  387. package/test/integration/routing-stage-bug-021.test.ts +274 -0
  388. package/test/integration/routing-stage-greenfield.test.ts +286 -0
  389. package/test/integration/runner-config-plugins.test.ts +461 -0
  390. package/test/integration/runner-fixes.test.ts +399 -0
  391. package/test/integration/runner-plugin-integration.test.ts +543 -0
  392. package/test/integration/runner.test.ts +1679 -0
  393. package/test/integration/s5-greenfield-fallback.test.ts +297 -0
  394. package/test/integration/status-file-integration.test.ts +325 -0
  395. package/test/integration/status-file.test.ts +379 -0
  396. package/test/integration/status-writer.test.ts +345 -0
  397. package/test/integration/story-id-in-events.test.ts +273 -0
  398. package/test/integration/tdd-cleanup.test.ts +246 -0
  399. package/test/integration/tdd-orchestrator.test.ts +1762 -0
  400. package/test/integration/test-scanner.test.ts +403 -0
  401. package/test/integration/verification-asset-check.test.ts +142 -0
  402. package/test/integration/verify-stage.test.ts +275 -0
  403. package/test/integration/worktree/manager.test.ts +218 -0
  404. package/test/integration/worktree/merge.test.ts +341 -0
  405. package/test/manual/logging-formatter-demo.ts +158 -0
  406. package/test/ui/tui-agent-panel.test.tsx +99 -0
  407. package/test/ui/tui-controls.test.ts +334 -0
  408. package/test/ui/tui-cost-and-pty.test.ts +189 -0
  409. package/test/ui/tui-layout.test.ts +378 -0
  410. package/test/ui/tui-pty-integration.test.tsx +159 -0
  411. package/test/ui/tui-stories.test.ts +332 -0
  412. package/test/unit/acceptance.test.ts +186 -0
  413. package/test/unit/agent-stderr-capture.test.ts +146 -0
  414. package/test/unit/analyze-classifier.test.ts +215 -0
  415. package/test/unit/analyze.test.ts +224 -0
  416. package/test/unit/auto-detect.test.ts +249 -0
  417. package/test/unit/cli-status.test.ts +417 -0
  418. package/test/unit/commands/common.test.ts +320 -0
  419. package/test/unit/commands/logs.test.ts +416 -0
  420. package/test/unit/commands/unlock.test.ts +319 -0
  421. package/test/unit/constitution-generators.test.ts +160 -0
  422. package/test/unit/constitution.test.ts +209 -0
  423. package/test/unit/context.test.ts +1722 -0
  424. package/test/unit/cost.test.ts +231 -0
  425. package/test/unit/crash-recovery.test.ts +308 -0
  426. package/test/unit/escalation.test.ts +126 -0
  427. package/test/unit/execution-logging-stderr.test.ts +156 -0
  428. package/test/unit/execution-stage.test.ts +122 -0
  429. package/test/unit/fix-generator.test.ts +275 -0
  430. package/test/unit/formatters.test.ts +469 -0
  431. package/test/unit/greenfield.test.ts +179 -0
  432. package/test/unit/helpers.test.ts +317 -0
  433. package/test/unit/interaction/human-review-trigger.test.ts +164 -0
  434. package/test/unit/interaction-network-failures.test.ts +389 -0
  435. package/test/unit/interaction-plugins.test.ts +164 -0
  436. package/test/unit/isolation.test.ts +134 -0
  437. package/test/unit/logging/formatter.test.ts +455 -0
  438. package/test/unit/merge.test.ts +268 -0
  439. package/test/unit/metrics.test.ts +276 -0
  440. package/test/unit/optimizer/noop.optimizer.test.ts +125 -0
  441. package/test/unit/optimizer/rule-based.optimizer.test.ts +358 -0
  442. package/test/unit/prd-auto-default.test.ts +290 -0
  443. package/test/unit/prd-failure-category.test.ts +176 -0
  444. package/test/unit/prd-get-next-story.test.ts +186 -0
  445. package/test/unit/precheck-checks.test.ts +840 -0
  446. package/test/unit/precheck-story-size-gate.test.ts +287 -0
  447. package/test/unit/precheck-types.test.ts +142 -0
  448. package/test/unit/prompts.test.ts +475 -0
  449. package/test/unit/queue.test.ts +237 -0
  450. package/test/unit/rectification.test.ts +284 -0
  451. package/test/unit/registry.test.ts +287 -0
  452. package/test/unit/routing.test.ts +937 -0
  453. package/test/unit/run-lifecycle.test.ts +140 -0
  454. package/test/unit/storyid-events.test.ts +224 -0
  455. package/test/unit/tdd-verdict.test.ts +492 -0
  456. package/test/unit/test-output-parser.test.ts +377 -0
  457. package/test/unit/verdict.test.ts +324 -0
  458. package/test/unit/worktree-manager.test.ts +158 -0
  459. package/tsconfig.json +27 -0
@@ -0,0 +1,197 @@
1
+ # Fix Plan: v0.9.1 — Routing Respect + TDD Isolation Rework
2
+
3
+ **Date:** 2026-02-22
4
+ **Branch:** fix/v0.9.1-routing-isolation
5
+ **Base:** Revert commits 211a884 and 4fa39a4, then apply clean fixes
6
+
7
+ ## Context
8
+
9
+ Two commits (211a884, 4fa39a4) attempted to fix 4 issues but introduced problems:
10
+ 1. `determineTestStrategy()` still overrides LLM complexity via keyword scan
11
+ 2. Story count prompt hint isn't enforced
12
+ 3. `analyzeConfig` metadata is fine but incomplete (missing naxVersion)
13
+ 4. Isolation check now always passes (toothless)
14
+
15
+ This plan implements clean fixes for all 4 issues.
16
+
17
+ ---
18
+
19
+ ## Phase 1: Revert and Create Branch
20
+
21
+ 1. `git revert --no-commit 4fa39a4 211a884` (revert both commits)
22
+ 2. `git checkout -b fix/v0.9.1-routing-isolation`
23
+ 3. Commit: `revert: undo 211a884 and 4fa39a4 for clean reimplementation`
24
+
25
+ ---
26
+
27
+ ## Phase 2: Fix Routing — LLM testStrategy in Decomposition
28
+
29
+ **Problem:** `determineTestStrategy()` re-scans keywords after LLM already classified complexity, overriding LLM decisions for simple tasks.
30
+
31
+ **Fix:** When `strategy=llm`, have the LLM output `testStrategy` directly in its decomposition response. `determineTestStrategy()` is only used for keyword-mode fallback.
32
+
33
+ ### Changes:
34
+
35
+ **File: `src/agents/claude.ts`** (decomposition prompt)
36
+ - Add to the decomposition prompt schema: each story must include `testStrategy: "three-session-tdd" | "test-after"`
37
+ - Add decision rules to prompt:
38
+ ```
39
+ testStrategy rules:
40
+ - "three-session-tdd": ONLY for complex/expert tasks that are security-critical (auth, encryption, tokens) or define public API contracts
41
+ - "test-after": for all other tasks including simple/medium complexity
42
+ - A task being "simple" complexity should almost never be three-session-tdd
43
+ ```
44
+ - Add `testStrategy` to the expected JSON response schema alongside existing `complexity` field
45
+
46
+ **File: `src/cli/analyze.ts`**
47
+ - When building UserStory from LLM decomposition result:
48
+ - Use `ds.testStrategy` directly (from LLM response) instead of calling `determineTestStrategy()`
49
+ - Fall back to `determineTestStrategy()` only if the LLM didn't return a `testStrategy`
50
+ - When using keyword classification (non-LLM path): keep calling `determineTestStrategy()` as-is
51
+ - Add `routing.strategy: "llm" | "keyword"` and `routing.llmModel` to the story routing object
52
+
53
+ **File: `src/prd/types.ts`**
54
+ - Add to `StoryRouting`:
55
+ ```ts
56
+ strategy?: "keyword" | "llm";
57
+ llmModel?: string;
58
+ ```
59
+
60
+ ### Tests:
61
+ - Update existing analyze tests to verify LLM-classified stories use LLM's testStrategy
62
+ - Add test: simple story with "auth" in tags gets `test-after` from LLM (not overridden to three-session-tdd)
63
+
64
+ ---
65
+
66
+ ## Phase 3: Enforce Max Stories + Add analyzeConfig
67
+
68
+ **Problem:** The prompt hint for max stories isn't enforced, and `analyzeConfig` is missing `naxVersion`.
69
+
70
+ ### Changes:
71
+
72
+ **File: `src/agents/claude.ts`** (decomposition prompt)
73
+ - Add grouping guidelines (from 211a884 — this part was good):
74
+ ```
75
+ Grouping Guidelines:
76
+ - Combine small related tasks into single stories
77
+ - Maximum stories: {maxStories} (from config). If you generate more, merge related ones.
78
+ - Aim for coherent units of value
79
+ ```
80
+ - Pass `maxStories` from config into the prompt template
81
+
82
+ **File: `src/cli/analyze.ts`**
83
+ - After LLM returns stories, if count > `config.execution.maxStoriesPerFeature`:
84
+ - Log a warning: `"LLM returned {n} stories, exceeding max {max}. Consider re-running with stricter grouping."`
85
+ - Do NOT auto-truncate (could lose important work). Just warn.
86
+ - Add `analyzeConfig` to PRD output:
87
+ ```ts
88
+ analyzeConfig: {
89
+ naxVersion: pkg.version, // read from package.json
90
+ model: config.analyze.model,
91
+ llmEnhanced: config.analyze.llmEnhanced,
92
+ maxStoriesPerFeature: config.execution.maxStoriesPerFeature,
93
+ routingStrategy: config.analyze.llmEnhanced ? "llm" : "keyword",
94
+ }
95
+ ```
96
+
97
+ **File: `src/prd/types.ts`**
98
+ - Add to PRD interface:
99
+ ```ts
100
+ analyzeConfig?: {
101
+ naxVersion: string;
102
+ model: string;
103
+ llmEnhanced: boolean;
104
+ maxStoriesPerFeature: number;
105
+ routingStrategy: "keyword" | "llm";
106
+ };
107
+ ```
108
+
109
+ ### Tests:
110
+ - Test that analyzeConfig is populated with correct values
111
+ - Test warning logged when stories exceed max
112
+
113
+ ---
114
+
115
+ ## Phase 4: TDD Isolation — Detector + Verifier Judgment
116
+
117
+ **Problem:** The isolation check always passes after 211a884. It should instead detect and report test files modified by the implementer, and let the verifier judge whether those changes are legitimate.
118
+
119
+ ### Changes:
120
+
121
+ **File: `src/tdd/types.ts`**
122
+ - Update `IsolationCheck`:
123
+ ```ts
124
+ interface IsolationCheck {
125
+ /** Whether strict isolation was maintained (no test files touched) */
126
+ strictPass: boolean;
127
+ /** Test files modified by implementer */
128
+ modifiedTestFiles: string[];
129
+ /** Verdict: clean (no changes), needs-review (verifier must judge) */
130
+ verdict: "clean" | "needs-review";
131
+ description: string;
132
+ }
133
+ ```
134
+
135
+ **File: `src/tdd/isolation.ts`**
136
+ - `verifyImplementerIsolation()` returns honest results:
137
+ - If no test files modified: `{ strictPass: true, modifiedTestFiles: [], verdict: "clean", description: "<summary>" }`
138
+ - If test files modified: `{ strictPass: false, modifiedTestFiles: [...], verdict: "needs-review", description: "<summary>" }`
139
+ - Do NOT report a pass when files were modified (no `strictPass: true` / `verdict: "clean"`, and no legacy `passed: true`)
140
+
141
+ **File: `src/tdd/orchestrator.ts`**
142
+ - After Session 2 isolation check:
143
+ - If `verdict === "clean"`: proceed normally
144
+ - If `verdict === "needs-review"`: inject modified file info into verifier (Session 3) prompt
145
+ - Update verifier prompt:
146
+ ```
147
+ ⚠️ ISOLATION REVIEW REQUIRED
148
+ The implementer modified these test files: {modifiedTestFiles}
149
+
150
+ You MUST review the changes to these files and determine:
151
+ - LEGITIMATE: Fixing genuinely incorrect test expectations, adding missing imports,
152
+ adjusting test fixtures to match correct implementation behavior
153
+ - VIOLATION: Removing test cases, weakening assertions, deleting acceptance criteria
154
+ checks, adding tests to inflate pass rate
155
+
156
+ Include your verdict in the output:
157
+ - isolationVerdict: "approved" | "rejected"
158
+ - isolationReason: "<explanation>"
159
+
160
+ If REJECTED: fail the story.
161
+ ```
162
+ - Parse verifier output for isolation verdict
163
+ - Log the verdict (approved/rejected + reason) to structured JSONL
164
+
165
+ **File: `src/tdd/orchestrator.ts`** (runTddSession result handling)
166
+ - When isolation.verdict === "needs-review" and verifier says "rejected":
167
+ - Mark story as failed with reason "TDD isolation violation confirmed by verifier"
168
+ - When isolation.verdict === "needs-review" and verifier says "approved":
169
+ - Mark story as passed with warning logged
170
+
171
+ ### Tests:
172
+ - Test isolation detection: modified test files → verdict "needs-review"
173
+ - Test clean isolation: no test files → verdict "clean"
174
+ - Test orchestrator injects isolation context into verifier prompt when needs-review
175
+ - Test story fails when verifier rejects isolation
176
+
177
+ ---
178
+
179
+ ## Phase 5: Version Bump + Cleanup
180
+
181
+ 1. Bump version to `0.9.1` in `package.json`
182
+ 2. Run full test suite: `bun test`
183
+ 3. Commit: `fix(v0.9.1): routing respects LLM complexity, isolation reworked to detector+verifier`
184
+ 4. Do NOT push.
185
+
186
+ ---
187
+
188
+ ## Test Strategy
189
+ - Mode: test-after
190
+ - Reason: Internal refactor with existing test coverage. Tests updated alongside implementation per phase.
191
+
192
+ ## Commits
193
+ - Phase 1: `revert: undo 211a884 and 4fa39a4 for clean reimplementation`
194
+ - Phase 2: `fix(routing): LLM decomposition outputs testStrategy directly`
195
+ - Phase 3: `fix(analyze): enforce max stories warning, add analyzeConfig with naxVersion`
196
+ - Phase 4: `fix(tdd): isolation becomes detector, verifier makes judgment`
197
+ - Phase 5: `chore: bump to v0.9.1`
@@ -0,0 +1,62 @@
1
+ # Fix Plan: nax prompts CLI + Scoped Test Coverage
2
+ **Date:** 2026-02-23
3
+ **Branch:** master (direct, v0.9.3)
4
+
5
+ ## Phase 1: `nax prompts` CLI Command (US-001)
6
+
7
+ ### Fix 1: Add CLI command handler
8
+ **File:** `src/cli/prompts.ts` (new)
9
+ **Change:** New CLI command that:
10
+ - Accepts `-f <feature>` (required), `--out <dir>` (optional, default stdout), `--story <id>` (optional filter)
11
+ - Loads PRD from feature dir
12
+ - Loads config
13
+ - For each story (or filtered story):
14
+ - Runs routing (classify complexity)
15
+ - Runs context building (buildContext + formatContextAsMarkdown)
16
+ - Loads constitution (if configured)
17
+ - Assembles prompt via buildSingleSessionPrompt / buildBatchPrompt
18
+ - For three-session-tdd stories: also builds test-writer/implementer/verifier prompts
19
+ - Outputs to stdout or writes files with YAML frontmatter
20
+
21
+ ### Fix 2: Register CLI command
22
+ **File:** `src/cli/index.ts`
23
+ **Change:** Add `prompts` subcommand to the CLI parser. Wire to handler.
24
+
25
+ ### Fix 3: Add tests
26
+ **File:** `test/prompts-cli.test.ts` (new)
27
+ **Change:** Test that:
28
+ - `nax prompts` loads PRD and produces prompt files
29
+ - Frontmatter includes storyId, testStrategy, contextTokens
30
+ - `--story` flag filters to single story
31
+ - Three-session-tdd stories produce separate session prompts
32
+ - Output dir is created if it doesn't exist
33
+
34
+ ## Phase 2: Scoped Test Coverage Scanner (US-003)
35
+
36
+ ### Fix 4: Add story scoping to test scanner
37
+ **File:** `src/context/test-scanner.ts`
38
+ **Change:**
39
+ - Accept optional `scopeFiles?: string[]` parameter
40
+ - When scopeFiles provided, derive test file patterns (e.g., `src/health.service.ts` → `**/health.service.{spec,test}.ts`)
41
+ - Filter scan results to only matching test files
42
+ - Fall back to full scan when scopeFiles is empty/undefined
43
+
44
+ ### Fix 5: Wire scoping in context builder
45
+ **File:** `src/context/builder.ts`
46
+ **Change:** Pass `currentStory.contextFiles` to `generateTestCoverageSummary` as `scopeFiles`.
47
+
48
+ ### Fix 6: Add config option
49
+ **File:** `src/config/schema.ts`
50
+ **Change:** Add `context.testCoverage.scopeToStory` boolean (default: true) to config schema.
51
+
52
+ ### Fix 7: Add tests for scoped scanning
53
+ **File:** `test/context.test.ts` or `test/test-scanner.test.ts`
54
+ **Change:** Test that test coverage scan respects scopeFiles filter.
55
+
56
+ ## Test Strategy
57
+ - Mode: test-after
58
+ - Run: `bun test` after each phase
59
+
60
+ ## Commits
61
+ - Phase 1: `feat: add nax prompts CLI command for prompt inspection`
62
+ - Phase 2: `feat: scope test coverage scanner to story-relevant files`
@@ -0,0 +1,189 @@
1
+ # nax Roadmap — TDD-Lite, LLM Service Layer, Parallelism
2
+
3
+ *Date: 2026-02-24*
4
+ *Status: Proposed*
5
+
6
+ ---
7
+
8
+ ## Context
9
+
10
+ nax v0.10.0 has a solid TDD pipeline for TypeScript libraries, but struggles with:
11
+ - Non-TS/polyglot projects (UI, shell scripts, integration-heavy)
12
+ - No parallelism (sequential story execution)
13
+ - Memory-heavy (long-running agent sessions, OOMs on 4GB VPS)
14
+ - Single agent backend (claude CLI only, no OpenClaw sub-agents)
15
+
16
+ dev-orchestrator (OpenClaw skill) solves execution well — worktrees, parallel coders, phase-by-phase memory — but lacks nax's TDD pipeline, structured logging, PRD workflow, and CLI.
17
+
18
+ ## nax vs dev-orchestrator — Honest Comparison
19
+
20
+ | Capability | nax v0.10.0 | dev-orchestrator |
21
+ |:-----------|:-----------|:-----------------|
22
+ | **TDD pipeline** | ✅ Three-session (strict isolation) | ❌ None |
23
+ | **Verification** | ✅ Isolated verifier | ❌ Code review only |
24
+ | **Test quality gates** | ✅ Coverage, typecheck, lint | ❌ Up to the coder |
25
+ | **Planning/PRD** | ✅ `nax plan` → `analyze` → structured stories | ❌ Simple task decomposition |
26
+ | **Parallelism** | ❌ Sequential (batch = same session) | ✅ Git worktrees, true parallel |
27
+ | **Memory** | ❌ Peaks 3-4GB+, OOMs on VPS | ✅ Phase-by-phase ~1-2GB, exits between phases |
28
+ | **Agent backends** | ❌ claude CLI only | ✅ OpenClaw sessions_spawn + claude CLI |
29
+ | **Structured logging** | ✅ JSONL, `nax runs list/show` | ❌ None |
30
+ | **Hooks/plugins** | ✅ Global hooks, plugin system | ❌ None |
31
+ | **Escalation tiers** | ✅ Automatic model escalation | ❌ Manual |
32
+ | **Reproducibility** | ✅ Same PRD = same run | ❌ Depends on orchestrator prompt |
33
+ | **Polyglot support** | ❌ TDD isolation breaks for UI/bash | ✅ Handles anything |
34
+ | **Setup overhead** | ❌ PRD → analyze → config → run | ✅ Zero — just spawn with task |
35
+ | **CLI** | ✅ Full CLI (`nax plan/run/accept/stories`) | ❌ OpenClaw skill only |
36
+
37
+ ### Key Insight
38
+
39
+ nax's TDD pipeline is its strongest differentiator. dev-orchestrator's execution model (worktrees + phase-by-phase agents) is proven and lighter. The gap is **agent spawning** — nax can't spawn parallel managed agents (tracked as GitLab #3, the LLM Service Layer).
40
+
41
+ ## Decision
42
+
43
+ **Fix nax** in phases. Port dev-orchestrator's execution strengths into nax rather than rebuilding nax's TDD/PRD pipeline elsewhere.
44
+
45
+ ---
46
+
47
+ ## Phase 1 — TDD-Lite + Fallback (Quick Win)
48
+
49
+ **Goal:** Solve GitLab #20, support non-TS projects without abandoning TDD.
50
+
51
+ ### Three TDD Tiers
52
+
53
+ | Strategy | Test Writer | Implementer | Verifier | Use Case |
54
+ |:---------|:-----------|:------------|:---------|:---------|
55
+ | `three-session-tdd` (strict) | Isolated — no source access | Isolated — no test access | Isolated ✅ | TS libraries, APIs |
56
+ | `three-session-tdd-lite` | Can read source, write tests | Free to modify anything | Isolated ✅ | UI, polyglot, integration |
57
+ | `test-after` | N/A | Writes code + tests together | N/A | Simple tasks |
58
+
59
+ ### Fallback Logic
60
+
61
+ - If the test-writer produces **0 test files** in strict mode → auto-downgrade to `three-session-tdd-lite` and retry
62
+ - No wasted iteration, no story pause
63
+
64
+ ### Config
65
+
66
+ ```json
67
+ {
68
+ "tdd": {
69
+ "strategy": "auto",
70
+ "enabled": true
71
+ }
72
+ }
73
+ ```
74
+
75
+ - `auto` (default): LLM router classifies testability, picks strict or lite
76
+ - `strict`: Always three-session-tdd
77
+ - `lite`: Always three-session-tdd-lite
78
+ - `off`: test-after for everything
79
+
80
+ ### Scope
81
+
82
+ - Modify `src/tdd/` prompts for lite mode (relax isolation rules for test-writer)
83
+ - Add fallback logic in `src/execution/runner.ts`
84
+ - Add `strategy` to routing decision
85
+ - Update config schema
86
+ - No architecture changes needed
87
+
88
+ ---
89
+
90
+ ## Phase 2 — LLM Service Layer (GitLab #3)
91
+
92
+ **Goal:** Abstract agent spawning so nax can use multiple backends and run agents in parallel.
93
+
94
+ ### Agent Interface
95
+
96
+ ```typescript
97
+ interface Agent {
98
+ name: string;
99
+ spawn(options: AgentSpawnOptions): Promise<AgentSession>;
100
+ isInstalled(): Promise<boolean>;
101
+ }
102
+
103
+ interface AgentSession {
104
+ id: string;
105
+ status: 'running' | 'completed' | 'failed';
106
+ workdir: string;
107
+ wait(): Promise<AgentResult>;
108
+ kill(): Promise<void>;
109
+ steer?(message: string): Promise<void>; // optional
110
+ }
111
+
112
+ interface AgentSpawnOptions {
113
+ prompt: string;
114
+ workdir: string;
115
+ model?: string;
116
+ timeout?: number;
117
+ env?: Record<string, string>;
118
+ }
119
+ ```
120
+
121
+ ### Backends
122
+
123
+ | Backend | How | Parallelism | Where |
124
+ |:--------|:----|:-----------|:------|
125
+ | `ClaudeCliAgent` | `claude -p` (existing) | ❌ Sequential | VPS, Mac01 |
126
+ | `OpenClawAgent` | `sessions_spawn` | ✅ Managed sub-agents | OpenClaw environments |
127
+ | `ApiAgent` | Direct Anthropic/Google API | ✅ Concurrent requests | Anywhere |
128
+
129
+ ### Key Design Decisions
130
+
131
+ - Agent selection via config: `autoMode.defaultAgent: "claude-cli" | "openclaw" | "api"`
132
+ - Each backend implements the same interface — runner doesn't care
133
+ - `ApiAgent` is the lightest (no CLI overhead) but needs prompt engineering for tool use
134
+
135
+ ---
136
+
137
+ ## Phase 3 — Worktree Parallelism
138
+
139
+ **Goal:** Run N stories concurrently using git worktrees + LLM Service Layer agents.
140
+
141
+ ### Flow
142
+
143
+ ```
144
+ nax run -f feature --parallel 3
145
+
146
+ ├── Worktree: .nax-wt/story-001/ → Agent 1 (tdd pipeline)
147
+ ├── Worktree: .nax-wt/story-002/ → Agent 2 (tdd pipeline)
148
+ └── Worktree: .nax-wt/story-003/ → Agent 3 (tdd pipeline)
149
+
150
+ ├── Each agent exits after its story (phase-by-phase memory)
151
+ ├── Verifier runs per-worktree (isolated)
152
+ └── Merge back to main branch on pass
153
+ ```
154
+
155
+ ### Benefits
156
+
157
+ - True parallelism (stolen from dev-orchestrator's proven model)
158
+ - Phase-by-phase execution = low memory (solves VPS OOM)
159
+ - Each worktree is isolated — no git conflicts during execution
160
+ - Merge conflicts detected at merge time, not runtime
161
+
162
+ ### Dependencies
163
+
164
+ - Phase 2 (LLM Service Layer) — need agent spawning abstraction
165
+ - Worktree management utilities (create, merge, cleanup)
166
+ - Dependency-aware scheduling (respect story dependencies in PRD)
167
+
168
+ ---
169
+
170
+ ## Dependency Chain
171
+
172
+ ```
173
+ Phase 1: tdd-lite + fallback ← standalone, no blockers
174
+
175
+ Phase 2: LLM Service Layer (#3) ← abstracts agent spawning
176
+
177
+ Phase 3: Worktree parallelism ← needs Phase 2
178
+
179
+ Memory optimization ← comes free with Phase 3
180
+ ```
181
+
182
+ ---
183
+
184
+ ## Open Questions
185
+
186
+ 1. Should `ApiAgent` support tool use (file read/write/exec) or is it prompt-only?
187
+ 2. For the OpenClaw backend, do we use `sessions_spawn` (managed) or `exec` with the claude CLI?
188
+ 3. Worktree merge strategy — rebase or merge commit?
189
+ 4. Should nax accept a `--backend` flag or always use config?