@nathapp/nax 0.28.0 → 0.30.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/CHANGELOG.md +23 -2
- package/bin/nax.ts +2 -3
- package/dist/nax.js +72753 -0
- package/package.json +11 -3
- package/src/cli/analyze.ts +2 -7
- package/src/cli/config.ts +3 -1
- package/src/config/defaults.ts +1 -0
- package/src/config/schemas.ts +1 -0
- package/src/config/types.ts +1 -0
- package/src/context/builder.ts +10 -1
- package/src/execution/lifecycle/headless-formatter.ts +2 -4
- package/src/prompts/builder.ts +12 -69
- package/src/prompts/sections/isolation.ts +38 -8
- package/src/prompts/sections/role-task.ts +79 -17
- package/src/review/runner.ts +6 -1
- package/src/version.ts +2 -1
- package/.claude/rules/01-project-conventions.md +0 -34
- package/.claude/rules/02-test-architecture.md +0 -39
- package/.claude/rules/03-test-writing.md +0 -58
- package/.claude/rules/04-forbidden-patterns.md +0 -29
- package/.claude/settings.json +0 -15
- package/.githooks/pre-commit +0 -16
- package/.gitlab-ci.yml +0 -103
- package/.mcp.json +0 -8
- package/BRIEF.md +0 -140
- package/CLAUDE.md +0 -143
- package/US-007-IMPLEMENTATION.md +0 -139
- package/biome.json +0 -14
- package/bun.lock +0 -163
- package/bunfig.toml +0 -12
- package/docker-compose.test.yml +0 -15
- package/docs/20260216-fix-plan-context-review.md +0 -56
- package/docs/20260216-relentless-vs-ngent-comparison.md +0 -208
- package/docs/20260216-v02-plan.md +0 -136
- package/docs/20260216-v02-review.md +0 -685
- package/docs/20260217-dogfood-findings.md +0 -56
- package/docs/20260217-p2-plus-plan.md +0 -117
- package/docs/20260217-partial-fixes-plan.md +0 -62
- package/docs/20260217-plan-analyze-spec.md +0 -117
- package/docs/20260217-post-impl-review.md +0 -1137
- package/docs/20260217-quick-wins-plan.md +0 -66
- package/docs/20260217-split-runner-plan.md +0 -75
- package/docs/20260217-v03-impl-plan.md +0 -80
- package/docs/20260217-v03-post-impl-review.md +0 -589
- package/docs/20260217-v04-impl-plan.md +0 -86
- package/docs/20260217-v05-post-impl-review.md +0 -850
- package/docs/20260217-v06-post-impl-review.md +0 -817
- package/docs/20260218-adr003-port-plan.md +0 -151
- package/docs/20260218-review-adr003-verification.md +0 -175
- package/docs/20260219-fix-plan-bug16-19.md +0 -79
- package/docs/20260219-fix-plan-bug20-22.md +0 -114
- package/docs/20260219-plan-llm-routing.md +0 -116
- package/docs/20260219-review-bug20-22-fixes.md +0 -135
- package/docs/20260219-routing-baseline-keyword.md +0 -63
- package/docs/20260220-plan-structured-logging-p1.md +0 -80
- package/docs/20260220-plan-structured-logging-p2.md +0 -37
- package/docs/20260220-review-llm-routing.md +0 -180
- package/docs/20260220-review-post-fix-llm-routing.md +0 -70
- package/docs/20260221-fix-plan-relevantfiles-split.md +0 -101
- package/docs/20260221-fix-plan-routing-mode.md +0 -125
- package/docs/20260221-review-v0.9-implementation.md +0 -379
- package/docs/20260222-fix-plan-v091-routing-isolation.md +0 -197
- package/docs/20260223-fix-plan-prompt-audit.md +0 -62
- package/docs/20260224-nax-roadmap-phases.md +0 -189
- package/docs/20260225-phase2-llm-service-layer.md +0 -401
- package/docs/20260225-review-v0.10.1.md +0 -187
- package/docs/20260303-v010-implementation-plan.md +0 -165
- package/docs/20260304-review-nax.md +0 -492
- package/docs/CLAUDE.md.bak +0 -191
- package/docs/ROADMAP.md +0 -390
- package/docs/SPEC-rectification.md +0 -0
- package/docs/SPEC.md +0 -324
- package/docs/US-001-plugin-loading-verification.md +0 -152
- package/docs/adr/ADR-005-implementation-plan.md +0 -655
- package/docs/adr/ADR-005-pipeline-re-architecture.md +0 -464
- package/docs/architecture-analysis.md +0 -1076
- package/docs/bugs/BUG-21-escalation-null-attempts.md +0 -48
- package/docs/bugs-from-dogfood-run-c.md +0 -243
- package/docs/code-review-20260228.md +0 -612
- package/docs/code-review-v0.15.0.md +0 -629
- package/docs/hook-lifecycle-test-plan.md +0 -149
- package/docs/releases/v0.11.0-and-earlier.md +0 -20
- package/docs/releases/v0.12.0.md +0 -15
- package/docs/releases/v0.13.0.md +0 -14
- package/docs/releases/v0.14.0.md +0 -20
- package/docs/releases/v0.14.1.md +0 -36
- package/docs/releases/v0.14.2.md +0 -51
- package/docs/releases/v0.14.3.md +0 -174
- package/docs/releases/v0.14.4.md +0 -94
- package/docs/releases/v0.15.0.md +0 -502
- package/docs/releases/v0.15.1.md +0 -170
- package/docs/releases/v0.15.3.md +0 -193
- package/docs/specs/bug-039-orphan-processes.md +0 -131
- package/docs/specs/bug-040-review-rectification.md +0 -82
- package/docs/specs/bug-041-cross-story-test-isolation.md +0 -88
- package/docs/specs/bug-042-verifier-failure-capture.md +0 -117
- package/docs/specs/bun-pty-migration.md +0 -171
- package/docs/specs/central-run-registry.md +0 -116
- package/docs/specs/feat-010-smart-runner-git-history.md +0 -96
- package/docs/specs/feat-011-file-context-strategy.md +0 -73
- package/docs/specs/feat-012-tdd-writer-tier.md +0 -79
- package/docs/specs/feat-013-test-after-review.md +0 -89
- package/docs/specs/feat-014-heartbeat-observability.md +0 -127
- package/docs/specs/status-file-consolidation.md +0 -93
- package/docs/specs/status-file-v0.10.1.md +0 -812
- package/docs/specs/trigger-completion.md +0 -145
- package/docs/specs/verification-architecture-v2.md +0 -343
- package/docs/tdd/strategies.md +0 -97
- package/docs/v0.10-global-config.md +0 -206
- package/docs/v0.10-plugin-system.md +0 -415
- package/docs/v0.10-prompt-optimizer.md +0 -234
- package/docs/v0.3-spec.md +0 -244
- package/docs/v0.4-spec.md +0 -140
- package/docs/v0.5-spec.md +0 -237
- package/docs/v0.6-spec.md +0 -371
- package/docs/v0.7-spec.md +0 -177
- package/docs/v0.8-llm-routing.md +0 -206
- package/docs/v0.8-structured-logging.md +0 -132
- package/docs/v0.9.3-prompt-audit.md +0 -112
- package/examples/plugins/console-reporter/index.test.ts +0 -207
- package/examples/plugins/console-reporter/index.ts +0 -110
- package/memory/topic/feat-010-baseref.md +0 -28
- package/memory/topic/feat-013-test-after-deprecation.md +0 -22
- package/nax/config.json +0 -154
- package/nax/features/bug-039-medium/prd.json +0 -45
- package/nax/features/bugfix-v0171/prd.json +0 -52
- package/nax/features/central-run-registry/prd.json +0 -105
- package/nax/features/config-management/prd.json +0 -108
- package/nax/features/config-management/progress.txt +0 -5
- package/nax/features/diagnose/acceptance.test.ts +0 -414
- package/nax/features/diagnose/prd.json +0 -41
- package/nax/features/nax-compliance/prd.json +0 -52
- package/nax/features/nax-compliance/progress.txt +0 -1
- package/nax/features/orchestration-fixes/prd.json +0 -89
- package/nax/features/orchestration-fixes/progress.txt +0 -1
- package/nax/features/plugin-integration/US-007-VERIFICATION.md +0 -259
- package/nax/features/plugin-integration/prd.json +0 -208
- package/nax/features/plugin-integration/progress.txt +0 -5
- package/nax/features/post-rearch-bugfix/prd.json +0 -137
- package/nax/features/precheck/prd.json +0 -205
- package/nax/features/precheck/progress.txt +0 -15
- package/nax/features/prompt-builder/prd.json +0 -152
- package/nax/features/prompt-builder/progress.txt +0 -3
- package/nax/features/review-quality/prd.json +0 -55
- package/nax/features/routing-persistence/prd.json +0 -104
- package/nax/features/routing-persistence/progress.txt +0 -1
- package/nax/features/smart-test-runner/plan.md +0 -7
- package/nax/features/smart-test-runner/prd.json +0 -203
- package/nax/features/smart-test-runner/progress.txt +0 -13
- package/nax/features/smart-test-runner/spec.md +0 -7
- package/nax/features/smart-test-runner/tasks.md +0 -8
- package/nax/features/status-file-consolidation/prd.json +0 -106
- package/nax/features/structured-logging/prd.json +0 -199
- package/nax/features/trigger-completion/prd.json +0 -150
- package/nax/features/trigger-completion/progress.txt +0 -7
- package/nax/features/unlock/prd.json +0 -36
- package/nax/features/v0.18.3-execution-reliability/prd.json +0 -80
- package/nax/features/v0.18.3-execution-reliability/progress.txt +0 -3
- package/nax/features/v0.19.0-hardening/plan.md +0 -7
- package/nax/features/v0.19.0-hardening/prd.json +0 -84
- package/nax/features/v0.19.0-hardening/progress.txt +0 -7
- package/nax/features/v0.19.0-hardening/spec.md +0 -18
- package/nax/features/v0.19.0-hardening/tasks.md +0 -8
- package/nax/features/verify-v2/prd.json +0 -79
- package/nax/features/verify-v2/progress.txt +0 -3
- package/nax/status.json +0 -36
- package/src/prompts/templates/implementer.ts +0 -6
- package/src/prompts/templates/single-session.ts +0 -6
- package/src/prompts/templates/test-writer.ts +0 -6
- package/src/prompts/templates/verifier.ts +0 -6
- package/test/COVERAGE-GAPS.md +0 -333
- package/test/e2e/cm-003-default-view.test.ts +0 -195
- package/test/e2e/plan-analyze-run.test.ts +0 -902
- package/test/helpers/helpers.test.ts +0 -295
- package/test/helpers/timeout.ts +0 -42
- package/test/integration/US-002-TEST-SUMMARY.md +0 -107
- package/test/integration/US-003-TEST-SUMMARY.md +0 -149
- package/test/integration/US-004-TEST-SUMMARY.md +0 -106
- package/test/integration/US-005-TEST-SUMMARY.md +0 -138
- package/test/integration/US-007-TEST-SUMMARY.md +0 -100
- package/test/integration/cli/agent-validation.test.ts +0 -439
- package/test/integration/cli/cli-config-default-edge-cases.test.ts +0 -223
- package/test/integration/cli/cli-config-default-view.test.ts +0 -230
- package/test/integration/cli/cli-config-diff.test.ts +0 -461
- package/test/integration/cli/cli-config-prompts-explain.test.ts +0 -74
- package/test/integration/cli/cli-config.test.ts +0 -737
- package/test/integration/cli/cli-diagnose.test.ts +0 -595
- package/test/integration/cli/cli-logs.test.ts +0 -346
- package/test/integration/cli/cli-plugins.test.ts +0 -679
- package/test/integration/cli/cli-precheck.test.ts +0 -372
- package/test/integration/cli/cli-run-headless.test.ts +0 -174
- package/test/integration/cli/cli.test.ts +0 -76
- package/test/integration/cli/precheck-integration.test.ts +0 -476
- package/test/integration/cli/precheck-orchestrator.test.ts +0 -247
- package/test/integration/cli/precheck.test.ts +0 -806
- package/test/integration/config/config-loader.test.ts +0 -266
- package/test/integration/config/config.test.ts +0 -444
- package/test/integration/config/merger.test.ts +0 -466
- package/test/integration/config/paths.test.ts +0 -52
- package/test/integration/config/security-loader.test.ts +0 -83
- package/test/integration/context/context-integration.test.ts +0 -703
- package/test/integration/context/context-path-security.test.ts +0 -173
- package/test/integration/context/context-provider-injection.test.ts +0 -507
- package/test/integration/context/context-verification-integration.test.ts +0 -296
- package/test/integration/context/s5-greenfield-fallback.test.ts +0 -298
- package/test/integration/execution/execution-isolation.test.ts +0 -143
- package/test/integration/execution/execution.test.ts +0 -634
- package/test/integration/execution/feature-status-write.test.ts +0 -302
- package/test/integration/execution/parallel.test.ts +0 -251
- package/test/integration/execution/prd-pause.test.ts +0 -205
- package/test/integration/execution/prd-resolvers.test.ts +0 -186
- package/test/integration/execution/progress.test.ts +0 -34
- package/test/integration/execution/runner-batching.test.ts +0 -682
- package/test/integration/execution/runner-config-plugins.test.ts +0 -462
- package/test/integration/execution/runner-escalation.test.ts +0 -561
- package/test/integration/execution/runner-fixes.test.ts +0 -400
- package/test/integration/execution/runner-plugin-integration.test.ts +0 -544
- package/test/integration/execution/runner-queue-and-attempts.test.ts +0 -476
- package/test/integration/execution/status-file-integration.test.ts +0 -289
- package/test/integration/execution/status-file.test.ts +0 -380
- package/test/integration/execution/status-writer.test.ts +0 -447
- package/test/integration/execution/story-id-in-events.test.ts +0 -274
- package/test/integration/interaction/interaction-chain-pipeline.test.ts +0 -476
- package/test/integration/pipeline/hooks.test.ts +0 -363
- package/test/integration/pipeline/pipeline-acceptance.test.ts +0 -303
- package/test/integration/pipeline/pipeline-events.test.ts +0 -476
- package/test/integration/pipeline/pipeline.test.ts +0 -660
- package/test/integration/pipeline/reporter-lifecycle.test.ts +0 -862
- package/test/integration/pipeline/verify-stage.test.ts +0 -286
- package/test/integration/plan/analyze-integration.test.ts +0 -262
- package/test/integration/plan/analyze-scanner.test.ts +0 -132
- package/test/integration/plan/logger.test.ts +0 -461
- package/test/integration/plan/plan.test.ts +0 -157
- package/test/integration/plugins/config-integration.test.ts +0 -173
- package/test/integration/plugins/config-resolution.test.ts +0 -523
- package/test/integration/plugins/loader.test.ts +0 -644
- package/test/integration/plugins/plugins-registry.test.ts +0 -747
- package/test/integration/plugins/validator.test.ts +0 -564
- package/test/integration/prompts/pb-004-migration.test.ts +0 -523
- package/test/integration/review/review-config-commands.test.ts +0 -320
- package/test/integration/review/review-config-schema.test.ts +0 -117
- package/test/integration/review/review-plugin-integration.test.ts +0 -729
- package/test/integration/review/review.test.ts +0 -150
- package/test/integration/routing/plugin-routing-advanced.test.ts +0 -461
- package/test/integration/routing/plugin-routing-core.test.ts +0 -527
- package/test/integration/routing/routing-stage-bug-021.test.ts +0 -275
- package/test/integration/routing/routing-stage-greenfield.test.ts +0 -287
- package/test/integration/tdd/tdd-cleanup.test.ts +0 -246
- package/test/integration/tdd/tdd-orchestrator-core.test.ts +0 -565
- package/test/integration/tdd/tdd-orchestrator-failureCategory.test.ts +0 -355
- package/test/integration/tdd/tdd-orchestrator-fallback.test.ts +0 -311
- package/test/integration/tdd/tdd-orchestrator-lite.test.ts +0 -289
- package/test/integration/tdd/tdd-orchestrator-prompts.test.ts +0 -260
- package/test/integration/tdd/tdd-orchestrator-verdict.test.ts +0 -536
- package/test/integration/tmp/headless-test/test.jsonl +0 -30
- package/test/integration/verification/test-scanner.test.ts +0 -403
- package/test/integration/verification/verification-asset-check.test.ts +0 -143
- package/test/integration/worktree/manager.test.ts +0 -218
- package/test/integration/worktree/worktree-merge.test.ts +0 -341
- package/test/manual/logging-formatter-demo.ts +0 -158
- package/test/ui/tui-agent-panel.test.tsx +0 -99
- package/test/ui/tui-pty-integration.test.tsx +0 -146
- package/test/unit/acceptance.test.ts +0 -187
- package/test/unit/agent-stderr-capture.test.ts +0 -147
- package/test/unit/agents/claude.test.ts +0 -107
- package/test/unit/analyze-classifier.test.ts +0 -216
- package/test/unit/analyze.test.ts +0 -224
- package/test/unit/auto-detect.test.ts +0 -250
- package/test/unit/cli-status-project-level.test.ts +0 -283
- package/test/unit/cli-status.test.ts +0 -418
- package/test/unit/commands/common.test.ts +0 -321
- package/test/unit/commands/logs.test.ts +0 -458
- package/test/unit/commands/runs.test.ts +0 -303
- package/test/unit/commands/unlock.test.ts +0 -320
- package/test/unit/config/defaults.test.ts +0 -70
- package/test/unit/config/quality-commands-schema.test.ts +0 -72
- package/test/unit/config/regression-gate-schema.test.ts +0 -160
- package/test/unit/config/smart-runner-flag.test.ts +0 -250
- package/test/unit/constitution-generators.test.ts +0 -161
- package/test/unit/constitution.test.ts +0 -210
- package/test/unit/context/context-autodetect.test.ts +0 -297
- package/test/unit/context/context-build.test.ts +0 -575
- package/test/unit/context/context-coverage.test.ts +0 -236
- package/test/unit/context/context-error.test.ts +0 -93
- package/test/unit/context/context-estimate-tokens.test.ts +0 -201
- package/test/unit/context/context-format.test.ts +0 -302
- package/test/unit/context/context-isolation.test.ts +0 -267
- package/test/unit/context/context-sort.test.ts +0 -93
- package/test/unit/context/context-story.test.ts +0 -108
- package/test/unit/context/prior-failures.test.ts +0 -463
- package/test/unit/context.test.ts +0 -1726
- package/test/unit/cost.test.ts +0 -231
- package/test/unit/crash-recovery.test.ts +0 -309
- package/test/unit/escalation.test.ts +0 -127
- package/test/unit/execution/lifecycle/run-completion.test.ts +0 -240
- package/test/unit/execution/lifecycle/run-regression.test.ts +0 -420
- package/test/unit/execution/pid-registry.test.ts +0 -241
- package/test/unit/execution/sequential-executor.test.ts +0 -235
- package/test/unit/execution/sfc-004-dead-code-cleanup.test.ts +0 -89
- package/test/unit/execution/structured-failure.test.ts +0 -415
- package/test/unit/execution-logging-stderr.test.ts +0 -157
- package/test/unit/execution-stage.test.ts +0 -123
- package/test/unit/fix-generator.test.ts +0 -276
- package/test/unit/formatters.test.ts +0 -468
- package/test/unit/greenfield.test.ts +0 -180
- package/test/unit/hooks/shell-security.test.ts +0 -40
- package/test/unit/interaction/auto-plugin.test.ts +0 -162
- package/test/unit/interaction/human-review-trigger.test.ts +0 -165
- package/test/unit/interaction-network-failures.test.ts +0 -390
- package/test/unit/interaction-plugins.test.ts +0 -472
- package/test/unit/logging/formatter.test.ts +0 -456
- package/test/unit/merge.test.ts +0 -269
- package/test/unit/metrics/aggregator.test.ts +0 -164
- package/test/unit/metrics/tracker.test.ts +0 -186
- package/test/unit/metrics.test.ts +0 -276
- package/test/unit/optimizer/noop.optimizer.test.ts +0 -125
- package/test/unit/optimizer/rule-based.optimizer.test.ts +0 -358
- package/test/unit/pipeline/event-bus.test.ts +0 -105
- package/test/unit/pipeline/routing-partial-override.test.ts +0 -121
- package/test/unit/pipeline/runner-retry.test.ts +0 -89
- package/test/unit/pipeline/stages/autofix.test.ts +0 -97
- package/test/unit/pipeline/stages/completion-review-gate.test.ts +0 -218
- package/test/unit/pipeline/stages/execution-ambiguity.test.ts +0 -311
- package/test/unit/pipeline/stages/execution-merge-conflict.test.ts +0 -218
- package/test/unit/pipeline/stages/rectify.test.ts +0 -101
- package/test/unit/pipeline/stages/regression-stage.test.ts +0 -69
- package/test/unit/pipeline/stages/review.test.ts +0 -201
- package/test/unit/pipeline/stages/routing-idempotence.test.ts +0 -139
- package/test/unit/pipeline/stages/routing-initial-complexity.test.ts +0 -321
- package/test/unit/pipeline/stages/routing-persistence.test.ts +0 -380
- package/test/unit/pipeline/stages/verify.test.ts +0 -267
- package/test/unit/pipeline/subscribers/events-writer.test.ts +0 -227
- package/test/unit/pipeline/subscribers/hooks.test.ts +0 -84
- package/test/unit/pipeline/subscribers/interaction.test.ts +0 -313
- package/test/unit/pipeline/subscribers/registry.test.ts +0 -149
- package/test/unit/pipeline/subscribers/reporters.test.ts +0 -90
- package/test/unit/pipeline/verify-smart-runner.test.ts +0 -345
- package/test/unit/prd-auto-default.test.ts +0 -291
- package/test/unit/prd-failure-category.test.ts +0 -177
- package/test/unit/prd-get-next-story.test.ts +0 -215
- package/test/unit/precheck/checks-warnings.test.ts +0 -114
- package/test/unit/precheck-checks.test.ts +0 -841
- package/test/unit/precheck-story-size-gate.test.ts +0 -288
- package/test/unit/precheck-types.test.ts +0 -143
- package/test/unit/prompts/builder.test.ts +0 -258
- package/test/unit/prompts/loader.test.ts +0 -355
- package/test/unit/prompts/sections/conventions.test.ts +0 -30
- package/test/unit/prompts/sections/isolation.test.ts +0 -35
- package/test/unit/prompts/sections/role-task.test.ts +0 -40
- package/test/unit/prompts/sections/sections.test.ts +0 -238
- package/test/unit/prompts/sections/story.test.ts +0 -45
- package/test/unit/prompts/sections/verdict.test.ts +0 -58
- package/test/unit/prompts.test.ts +0 -476
- package/test/unit/queue.test.ts +0 -237
- package/test/unit/rectification.test.ts +0 -285
- package/test/unit/registry.test.ts +0 -288
- package/test/unit/review/runner.test.ts +0 -117
- package/test/unit/routing/content-hash.test.ts +0 -99
- package/test/unit/routing/routing-stability.test.ts +0 -208
- package/test/unit/routing/strategies/llm.test.ts +0 -306
- package/test/unit/routing-advanced.test.ts +0 -313
- package/test/unit/routing-core.test.ts +0 -341
- package/test/unit/routing-strategies.test.ts +0 -440
- package/test/unit/storyid-events.test.ts +0 -213
- package/test/unit/tdd-verdict.test.ts +0 -492
- package/test/unit/test-output-parser.test.ts +0 -377
- package/test/unit/ui/tui-controls.test.ts +0 -335
- package/test/unit/ui/tui-cost-and-pty.test.ts +0 -190
- package/test/unit/ui/tui-layout.test.ts +0 -379
- package/test/unit/ui/tui-stories.test.ts +0 -333
- package/test/unit/unit-isolation.test.ts +0 -135
- package/test/unit/utils/git.test.ts +0 -50
- package/test/unit/utils/path-security.test.ts +0 -47
- package/test/unit/utils-helpers.test.ts +0 -318
- package/test/unit/verdict.test.ts +0 -325
- package/test/unit/verification/orchestrator-types.test.ts +0 -54
- package/test/unit/verification/orchestrator.test.ts +0 -66
- package/test/unit/verification/smart-runner-config.test.ts +0 -163
- package/test/unit/verification/smart-runner-discovery.test.ts +0 -354
- package/test/unit/verification/smart-runner.test.ts +0 -262
- package/test/unit/verification/strategies/acceptance.test.ts +0 -33
- package/test/unit/verification/strategies/regression.test.ts +0 -87
- package/test/unit/verification/strategies/scoped.test.ts +0 -100
- package/test/unit/worktree-manager.test.ts +0 -159
- package/tsconfig.json +0 -27
|
@@ -1,536 +0,0 @@
|
|
|
1
|
-
import { afterEach, beforeEach, describe, expect, mock, test } from "bun:test";
|
|
2
|
-
import { existsSync } from "node:fs";
|
|
3
|
-
import { mkdir, rm, writeFile } from "node:fs/promises";
|
|
4
|
-
import path from "node:path";
|
|
5
|
-
import type { AgentAdapter, AgentResult } from "../../../src/agents";
|
|
6
|
-
import { DEFAULT_CONFIG } from "../../../src/config";
|
|
7
|
-
import type { UserStory } from "../../../src/prd";
|
|
8
|
-
import { runThreeSessionTdd } from "../../../src/tdd/orchestrator";
|
|
9
|
-
import { VERDICT_FILE } from "../../../src/tdd/verdict";
|
|
10
|
-
|
|
11
|
-
let originalSpawn: typeof Bun.spawn;
|
|
12
|
-
|
|
13
|
-
beforeEach(() => {
|
|
14
|
-
originalSpawn = Bun.spawn;
|
|
15
|
-
});
|
|
16
|
-
|
|
17
|
-
afterEach(() => {
|
|
18
|
-
Bun.spawn = originalSpawn;
|
|
19
|
-
});
|
|
20
|
-
|
|
21
|
-
/** Create a mock agent that returns sequential results */
|
|
22
|
-
function createMockAgent(results: Partial<AgentResult>[]): AgentAdapter {
|
|
23
|
-
let callCount = 0;
|
|
24
|
-
return {
|
|
25
|
-
name: "mock",
|
|
26
|
-
displayName: "Mock Agent",
|
|
27
|
-
binary: "mock",
|
|
28
|
-
isInstalled: async () => true,
|
|
29
|
-
buildCommand: () => ["mock"],
|
|
30
|
-
run: mock(async () => {
|
|
31
|
-
const r = results[callCount] || {};
|
|
32
|
-
callCount++;
|
|
33
|
-
return {
|
|
34
|
-
success: r.success ?? true,
|
|
35
|
-
exitCode: r.exitCode ?? 0,
|
|
36
|
-
output: r.output ?? "",
|
|
37
|
-
rateLimited: r.rateLimited ?? false,
|
|
38
|
-
durationMs: r.durationMs ?? 100,
|
|
39
|
-
estimatedCost: r.estimatedCost ?? 0.01,
|
|
40
|
-
};
|
|
41
|
-
}),
|
|
42
|
-
};
|
|
43
|
-
}
|
|
44
|
-
|
|
45
|
-
/** Mock Bun.spawn to intercept git commands */
|
|
46
|
-
function mockGitSpawn(opts: {
|
|
47
|
-
/** Files returned by git diff for each session (indexed by git-diff call number) */
|
|
48
|
-
diffFiles: string[][];
|
|
49
|
-
/** Optional: mock test command success (default: true) */
|
|
50
|
-
testCommandSuccess?: boolean;
|
|
51
|
-
}) {
|
|
52
|
-
let revParseCount = 0;
|
|
53
|
-
let diffCount = 0;
|
|
54
|
-
const testSuccess = opts.testCommandSuccess ?? true;
|
|
55
|
-
|
|
56
|
-
// @ts-ignore — mocking global
|
|
57
|
-
Bun.spawn = mock((cmd: string[], spawnOpts?: any) => {
|
|
58
|
-
// Intercept test commands (bun test, npm test, etc.)
|
|
59
|
-
if ((cmd[0] === "/bin/sh" || cmd[0] === "/bin/bash" || cmd[0] === "/bin/zsh") && cmd[1] === "-c") {
|
|
60
|
-
return {
|
|
61
|
-
pid: 9999,
|
|
62
|
-
exited: Promise.resolve(testSuccess ? 0 : 1),
|
|
63
|
-
stdout: new Response(testSuccess ? "tests pass\n" : "tests fail\n").body,
|
|
64
|
-
stderr: new Response("").body,
|
|
65
|
-
};
|
|
66
|
-
}
|
|
67
|
-
if (cmd[0] === "git" && cmd[1] === "rev-parse") {
|
|
68
|
-
revParseCount++;
|
|
69
|
-
return {
|
|
70
|
-
exited: Promise.resolve(0),
|
|
71
|
-
stdout: new Response(`ref-${revParseCount}\n`).body,
|
|
72
|
-
stderr: new Response("").body,
|
|
73
|
-
};
|
|
74
|
-
}
|
|
75
|
-
if (cmd[0] === "git" && cmd[1] === "checkout") {
|
|
76
|
-
// Intercept git checkout (used in zero-file fallback) — silently succeed
|
|
77
|
-
return {
|
|
78
|
-
exited: Promise.resolve(0),
|
|
79
|
-
stdout: new Response("").body,
|
|
80
|
-
stderr: new Response("").body,
|
|
81
|
-
};
|
|
82
|
-
}
|
|
83
|
-
if (cmd[0] === "git" && cmd[1] === "diff") {
|
|
84
|
-
const files = opts.diffFiles[diffCount] || [];
|
|
85
|
-
diffCount++;
|
|
86
|
-
return {
|
|
87
|
-
exited: Promise.resolve(0),
|
|
88
|
-
stdout: new Response(files.join("\n") + "\n").body,
|
|
89
|
-
stderr: new Response("").body,
|
|
90
|
-
};
|
|
91
|
-
}
|
|
92
|
-
return originalSpawn(cmd, spawnOpts);
|
|
93
|
-
});
|
|
94
|
-
}
|
|
95
|
-
|
|
96
|
-
const story: UserStory = {
|
|
97
|
-
id: "US-001",
|
|
98
|
-
title: "Add user validation",
|
|
99
|
-
description: "Add validation to user input",
|
|
100
|
-
acceptanceCriteria: ["Validation works", "Errors are clear"],
|
|
101
|
-
dependencies: [],
|
|
102
|
-
tags: [],
|
|
103
|
-
status: "pending",
|
|
104
|
-
passes: false,
|
|
105
|
-
escalations: [],
|
|
106
|
-
attempts: 0,
|
|
107
|
-
};
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
describe("runThreeSessionTdd — T9: verdict integration", () => {
|
|
111
|
-
let tmpDir: string;
|
|
112
|
-
|
|
113
|
-
beforeEach(async () => {
|
|
114
|
-
tmpDir = `/tmp/nax-t9-test-${Date.now()}-${Math.random().toString(36).slice(2)}`;
|
|
115
|
-
await mkdir(tmpDir, { recursive: true });
|
|
116
|
-
});
|
|
117
|
-
|
|
118
|
-
afterEach(async () => {
|
|
119
|
-
await rm(tmpDir, { recursive: true, force: true });
|
|
120
|
-
Bun.spawn = originalSpawn;
|
|
121
|
-
});
|
|
122
|
-
|
|
123
|
-
/** Write a valid verdict file to tmpDir */
|
|
124
|
-
async function writeVerdictToDir(opts: {
|
|
125
|
-
approved: boolean;
|
|
126
|
-
failReason?: "tests-failing" | "illegitimate-mods" | "criteria-not-met" | "poor-quality";
|
|
127
|
-
}) {
|
|
128
|
-
const verdict = {
|
|
129
|
-
version: 1,
|
|
130
|
-
approved: opts.approved,
|
|
131
|
-
tests: {
|
|
132
|
-
allPassing: opts.failReason !== "tests-failing",
|
|
133
|
-
passCount: opts.failReason === "tests-failing" ? 5 : 10,
|
|
134
|
-
failCount: opts.failReason === "tests-failing" ? 3 : 0,
|
|
135
|
-
},
|
|
136
|
-
testModifications: {
|
|
137
|
-
detected: opts.failReason === "illegitimate-mods",
|
|
138
|
-
files: opts.failReason === "illegitimate-mods" ? ["test/foo.test.ts"] : [],
|
|
139
|
-
legitimate: opts.failReason !== "illegitimate-mods",
|
|
140
|
-
reasoning: opts.failReason === "illegitimate-mods" ? "Implementer cheated" : "No mods",
|
|
141
|
-
},
|
|
142
|
-
acceptanceCriteria: {
|
|
143
|
-
allMet: opts.failReason !== "criteria-not-met",
|
|
144
|
-
criteria:
|
|
145
|
-
opts.failReason === "criteria-not-met"
|
|
146
|
-
? [{ criterion: "Must work", met: false }]
|
|
147
|
-
: [{ criterion: "Works", met: true }],
|
|
148
|
-
},
|
|
149
|
-
quality: {
|
|
150
|
-
rating: opts.failReason === "poor-quality" ? "poor" : "good",
|
|
151
|
-
issues: opts.failReason === "poor-quality" ? ["Security issue"] : [],
|
|
152
|
-
},
|
|
153
|
-
fixes: [],
|
|
154
|
-
reasoning: opts.approved ? "All good." : "Implementation rejected.",
|
|
155
|
-
};
|
|
156
|
-
await writeFile(path.join(tmpDir, VERDICT_FILE), JSON.stringify(verdict, null, 2));
|
|
157
|
-
}
|
|
158
|
-
|
|
159
|
-
/**
|
|
160
|
-
* Mock Bun.spawn for a full 3-session T9 run.
|
|
161
|
-
* Provides 6 git diff calls (isolation + getChangedFiles per session)
|
|
162
|
-
* and optionally intercepts the post-TDD shell command (bun test).
|
|
163
|
-
*/
|
|
164
|
-
function mockGitAndTestForT9(opts: {
|
|
165
|
-
diffFiles?: string[][];
|
|
166
|
-
onTestCmd?: () => { exitCode: number; stdout: string };
|
|
167
|
-
}) {
|
|
168
|
-
const files = opts.diffFiles ?? [
|
|
169
|
-
["test/user.test.ts"], // s1 isolation
|
|
170
|
-
["test/user.test.ts"], // s1 getChangedFiles
|
|
171
|
-
["src/user.ts"], // s2 isolation
|
|
172
|
-
["src/user.ts"], // s2 getChangedFiles
|
|
173
|
-
[], // s3 isolation
|
|
174
|
-
["src/user.ts"], // s3 getChangedFiles
|
|
175
|
-
];
|
|
176
|
-
let revParseCount = 0;
|
|
177
|
-
let diffCount = 0;
|
|
178
|
-
|
|
179
|
-
// @ts-ignore — mocking global
|
|
180
|
-
Bun.spawn = mock((cmd: string[], spawnOpts?: any) => {
|
|
181
|
-
if (cmd[0] === "/bin/sh" && cmd[2]?.includes("bun test")) {
|
|
182
|
-
const r = opts.onTestCmd?.() ?? { exitCode: 0, stdout: "5 pass, 0 fail\n" };
|
|
183
|
-
return {
|
|
184
|
-
pid: 9999,
|
|
185
|
-
exited: Promise.resolve(r.exitCode),
|
|
186
|
-
stdout: new Response(r.stdout).body,
|
|
187
|
-
stderr: new Response("").body,
|
|
188
|
-
};
|
|
189
|
-
}
|
|
190
|
-
if (cmd[0] === "git" && cmd[1] === "rev-parse") {
|
|
191
|
-
revParseCount++;
|
|
192
|
-
return {
|
|
193
|
-
exited: Promise.resolve(0),
|
|
194
|
-
stdout: new Response(`ref-${revParseCount}\n`).body,
|
|
195
|
-
stderr: new Response("").body,
|
|
196
|
-
};
|
|
197
|
-
}
|
|
198
|
-
if (cmd[0] === "git" && cmd[1] === "diff") {
|
|
199
|
-
const f = files[diffCount] || [];
|
|
200
|
-
diffCount++;
|
|
201
|
-
return {
|
|
202
|
-
exited: Promise.resolve(0),
|
|
203
|
-
stdout: new Response(f.join("\n") + "\n").body,
|
|
204
|
-
stderr: new Response("").body,
|
|
205
|
-
};
|
|
206
|
-
}
|
|
207
|
-
return originalSpawn(cmd, spawnOpts);
|
|
208
|
-
});
|
|
209
|
-
}
|
|
210
|
-
|
|
211
|
-
test("verdict approved=true: overall success even when verifier session failed", async () => {
|
|
212
|
-
await writeVerdictToDir({ approved: true });
|
|
213
|
-
mockGitAndTestForT9({});
|
|
214
|
-
|
|
215
|
-
const agent = createMockAgent([
|
|
216
|
-
{ success: true, estimatedCost: 0.01 },
|
|
217
|
-
{ success: true, estimatedCost: 0.02 },
|
|
218
|
-
{ success: false, exitCode: 1, estimatedCost: 0.01 }, // verifier exits non-zero
|
|
219
|
-
]);
|
|
220
|
-
|
|
221
|
-
const result = await runThreeSessionTdd({
|
|
222
|
-
agent,
|
|
223
|
-
story,
|
|
224
|
-
config: DEFAULT_CONFIG,
|
|
225
|
-
workdir: tmpDir,
|
|
226
|
-
modelTier: "balanced",
|
|
227
|
-
});
|
|
228
|
-
|
|
229
|
-
expect(result.success).toBe(true);
|
|
230
|
-
expect(result.needsHumanReview).toBe(false);
|
|
231
|
-
expect(result.failureCategory).toBeUndefined();
|
|
232
|
-
expect(result.reviewReason).toBeUndefined();
|
|
233
|
-
});
|
|
234
|
-
|
|
235
|
-
test("verdict approved=true: skips the post-TDD independent test check", async () => {
|
|
236
|
-
await writeVerdictToDir({ approved: true });
|
|
237
|
-
let testCommandCalled = false;
|
|
238
|
-
mockGitAndTestForT9({
|
|
239
|
-
onTestCmd: () => {
|
|
240
|
-
testCommandCalled = true;
|
|
241
|
-
return { exitCode: 0, stdout: "" };
|
|
242
|
-
},
|
|
243
|
-
});
|
|
244
|
-
|
|
245
|
-
const agent = createMockAgent([
|
|
246
|
-
{ success: true, estimatedCost: 0.01 },
|
|
247
|
-
{ success: true, estimatedCost: 0.02 },
|
|
248
|
-
{ success: false, exitCode: 1, estimatedCost: 0.01 }, // verifier fails
|
|
249
|
-
]);
|
|
250
|
-
|
|
251
|
-
// Disable rectification to avoid test command being called for full-suite gate
|
|
252
|
-
const configNoRectification = {
|
|
253
|
-
...DEFAULT_CONFIG,
|
|
254
|
-
execution: {
|
|
255
|
-
...DEFAULT_CONFIG.execution,
|
|
256
|
-
rectification: { ...DEFAULT_CONFIG.execution.rectification, enabled: false },
|
|
257
|
-
},
|
|
258
|
-
};
|
|
259
|
-
|
|
260
|
-
await runThreeSessionTdd({
|
|
261
|
-
agent,
|
|
262
|
-
story,
|
|
263
|
-
config: configNoRectification,
|
|
264
|
-
workdir: tmpDir,
|
|
265
|
-
modelTier: "balanced",
|
|
266
|
-
});
|
|
267
|
-
expect(testCommandCalled).toBe(false); // Test was NOT run when verdict present
|
|
268
|
-
});
|
|
269
|
-
|
|
270
|
-
test("verdict approved=false + tests-failing → failureCategory='tests-failing'", async () => {
|
|
271
|
-
await writeVerdictToDir({ approved: false, failReason: "tests-failing" });
|
|
272
|
-
mockGitAndTestForT9({});
|
|
273
|
-
|
|
274
|
-
const agent = createMockAgent([
|
|
275
|
-
{ success: true, estimatedCost: 0.01 },
|
|
276
|
-
{ success: true, estimatedCost: 0.02 },
|
|
277
|
-
{ success: true, estimatedCost: 0.01 }, // sessions succeed but verdict says rejected
|
|
278
|
-
]);
|
|
279
|
-
|
|
280
|
-
const result = await runThreeSessionTdd({
|
|
281
|
-
agent,
|
|
282
|
-
story,
|
|
283
|
-
config: DEFAULT_CONFIG,
|
|
284
|
-
workdir: tmpDir,
|
|
285
|
-
modelTier: "balanced",
|
|
286
|
-
});
|
|
287
|
-
|
|
288
|
-
expect(result.success).toBe(false);
|
|
289
|
-
expect(result.needsHumanReview).toBe(true);
|
|
290
|
-
expect(result.failureCategory).toBe("tests-failing");
|
|
291
|
-
expect(result.reviewReason).toContain("failure(s)");
|
|
292
|
-
});
|
|
293
|
-
|
|
294
|
-
test("verdict approved=false + illegitimate test mods → failureCategory='verifier-rejected'", async () => {
|
|
295
|
-
await writeVerdictToDir({ approved: false, failReason: "illegitimate-mods" });
|
|
296
|
-
mockGitAndTestForT9({});
|
|
297
|
-
|
|
298
|
-
const agent = createMockAgent([
|
|
299
|
-
{ success: true, estimatedCost: 0.01 },
|
|
300
|
-
{ success: true, estimatedCost: 0.02 },
|
|
301
|
-
{ success: true, estimatedCost: 0.01 },
|
|
302
|
-
]);
|
|
303
|
-
|
|
304
|
-
const result = await runThreeSessionTdd({
|
|
305
|
-
agent,
|
|
306
|
-
story,
|
|
307
|
-
config: DEFAULT_CONFIG,
|
|
308
|
-
workdir: tmpDir,
|
|
309
|
-
modelTier: "balanced",
|
|
310
|
-
});
|
|
311
|
-
|
|
312
|
-
expect(result.success).toBe(false);
|
|
313
|
-
expect(result.failureCategory).toBe("verifier-rejected");
|
|
314
|
-
expect(result.reviewReason).toContain("illegitimate test modifications");
|
|
315
|
-
});
|
|
316
|
-
|
|
317
|
-
test("verdict approved=false + criteria not met → failureCategory='verifier-rejected'", async () => {
|
|
318
|
-
await writeVerdictToDir({ approved: false, failReason: "criteria-not-met" });
|
|
319
|
-
mockGitAndTestForT9({});
|
|
320
|
-
|
|
321
|
-
const agent = createMockAgent([
|
|
322
|
-
{ success: true, estimatedCost: 0.01 },
|
|
323
|
-
{ success: true, estimatedCost: 0.02 },
|
|
324
|
-
{ success: true, estimatedCost: 0.01 },
|
|
325
|
-
]);
|
|
326
|
-
|
|
327
|
-
const result = await runThreeSessionTdd({
|
|
328
|
-
agent,
|
|
329
|
-
story,
|
|
330
|
-
config: DEFAULT_CONFIG,
|
|
331
|
-
workdir: tmpDir,
|
|
332
|
-
modelTier: "balanced",
|
|
333
|
-
});
|
|
334
|
-
|
|
335
|
-
expect(result.success).toBe(false);
|
|
336
|
-
expect(result.failureCategory).toBe("verifier-rejected");
|
|
337
|
-
expect(result.reviewReason).toContain("Must work");
|
|
338
|
-
});
|
|
339
|
-
|
|
340
|
-
test("no verdict file → fallback: post-TDD test check is run on session failures", async () => {
|
|
341
|
-
// No verdict file — when verifier fails, falls back to running tests independently
|
|
342
|
-
let testCommandCalled = false;
|
|
343
|
-
mockGitAndTestForT9({
|
|
344
|
-
onTestCmd: () => {
|
|
345
|
-
testCommandCalled = true;
|
|
346
|
-
return { exitCode: 0, stdout: "5 pass, 0 fail\n" }; // Tests pass in fallback
|
|
347
|
-
},
|
|
348
|
-
});
|
|
349
|
-
|
|
350
|
-
const agent = createMockAgent([
|
|
351
|
-
{ success: true, estimatedCost: 0.01 },
|
|
352
|
-
{ success: true, estimatedCost: 0.02 },
|
|
353
|
-
{ success: false, exitCode: 1, estimatedCost: 0.01 }, // verifier fails
|
|
354
|
-
]);
|
|
355
|
-
|
|
356
|
-
const result = await runThreeSessionTdd({
|
|
357
|
-
agent,
|
|
358
|
-
story,
|
|
359
|
-
config: DEFAULT_CONFIG,
|
|
360
|
-
workdir: tmpDir,
|
|
361
|
-
modelTier: "balanced",
|
|
362
|
-
});
|
|
363
|
-
|
|
364
|
-
expect(testCommandCalled).toBe(true); // Fallback test run was executed
|
|
365
|
-
expect(result.success).toBe(true); // Tests pass in fallback → success
|
|
366
|
-
expect(result.verdict).toBeNull(); // No verdict available
|
|
367
|
-
});
|
|
368
|
-
|
|
369
|
-
test("malformed verdict → fallback: post-TDD test check is run", async () => {
|
|
370
|
-
// Write invalid JSON — should trigger fallback
|
|
371
|
-
await writeFile(path.join(tmpDir, VERDICT_FILE), "{ this is not valid json }");
|
|
372
|
-
let testCommandCalled = false;
|
|
373
|
-
mockGitAndTestForT9({
|
|
374
|
-
onTestCmd: () => {
|
|
375
|
-
testCommandCalled = true;
|
|
376
|
-
return { exitCode: 0, stdout: "5 pass\n" };
|
|
377
|
-
},
|
|
378
|
-
});
|
|
379
|
-
|
|
380
|
-
const agent = createMockAgent([
|
|
381
|
-
{ success: true, estimatedCost: 0.01 },
|
|
382
|
-
{ success: true, estimatedCost: 0.02 },
|
|
383
|
-
{ success: false, exitCode: 1, estimatedCost: 0.01 },
|
|
384
|
-
]);
|
|
385
|
-
|
|
386
|
-
const result = await runThreeSessionTdd({
|
|
387
|
-
agent,
|
|
388
|
-
story,
|
|
389
|
-
config: DEFAULT_CONFIG,
|
|
390
|
-
workdir: tmpDir,
|
|
391
|
-
modelTier: "balanced",
|
|
392
|
-
});
|
|
393
|
-
|
|
394
|
-
expect(testCommandCalled).toBe(true); // Fallback used when verdict is malformed
|
|
395
|
-
expect(result.verdict).toBeNull(); // Malformed = null
|
|
396
|
-
});
|
|
397
|
-
|
|
398
|
-
test("verdict stored in result.verdict for logging/debugging (approved=true)", async () => {
|
|
399
|
-
await writeVerdictToDir({ approved: true });
|
|
400
|
-
mockGitAndTestForT9({});
|
|
401
|
-
|
|
402
|
-
const agent = createMockAgent([
|
|
403
|
-
{ success: true, estimatedCost: 0.01 },
|
|
404
|
-
{ success: true, estimatedCost: 0.02 },
|
|
405
|
-
{ success: true, estimatedCost: 0.01 },
|
|
406
|
-
]);
|
|
407
|
-
|
|
408
|
-
const result = await runThreeSessionTdd({
|
|
409
|
-
agent,
|
|
410
|
-
story,
|
|
411
|
-
config: DEFAULT_CONFIG,
|
|
412
|
-
workdir: tmpDir,
|
|
413
|
-
modelTier: "balanced",
|
|
414
|
-
});
|
|
415
|
-
|
|
416
|
-
expect(result.verdict).toBeDefined();
|
|
417
|
-
expect(result.verdict).not.toBeNull();
|
|
418
|
-
expect(result.verdict!.version).toBe(1);
|
|
419
|
-
expect(result.verdict!.approved).toBe(true);
|
|
420
|
-
expect(result.verdict!.tests.allPassing).toBe(true);
|
|
421
|
-
expect(result.verdict!.tests.passCount).toBe(10);
|
|
422
|
-
expect(result.verdict!.reasoning).toBe("All good.");
|
|
423
|
-
});
|
|
424
|
-
|
|
425
|
-
test("verdict stored in result.verdict for logging/debugging (approved=false)", async () => {
|
|
426
|
-
await writeVerdictToDir({ approved: false, failReason: "tests-failing" });
|
|
427
|
-
mockGitAndTestForT9({});
|
|
428
|
-
|
|
429
|
-
const agent = createMockAgent([
|
|
430
|
-
{ success: true, estimatedCost: 0.01 },
|
|
431
|
-
{ success: true, estimatedCost: 0.02 },
|
|
432
|
-
{ success: true, estimatedCost: 0.01 },
|
|
433
|
-
]);
|
|
434
|
-
|
|
435
|
-
const result = await runThreeSessionTdd({
|
|
436
|
-
agent,
|
|
437
|
-
story,
|
|
438
|
-
config: DEFAULT_CONFIG,
|
|
439
|
-
workdir: tmpDir,
|
|
440
|
-
modelTier: "balanced",
|
|
441
|
-
});
|
|
442
|
-
|
|
443
|
-
expect(result.verdict).not.toBeNull();
|
|
444
|
-
expect(result.verdict!.approved).toBe(false);
|
|
445
|
-
expect(result.verdict!.tests.failCount).toBe(3);
|
|
446
|
-
});
|
|
447
|
-
|
|
448
|
-
test("verdict file is deleted after reading (cleanup enforced)", async () => {
|
|
449
|
-
await writeVerdictToDir({ approved: true });
|
|
450
|
-
mockGitAndTestForT9({});
|
|
451
|
-
|
|
452
|
-
const verdictPath = path.join(tmpDir, VERDICT_FILE);
|
|
453
|
-
expect(existsSync(verdictPath)).toBe(true); // File exists before run
|
|
454
|
-
|
|
455
|
-
const agent = createMockAgent([
|
|
456
|
-
{ success: true, estimatedCost: 0.01 },
|
|
457
|
-
{ success: true, estimatedCost: 0.02 },
|
|
458
|
-
{ success: true, estimatedCost: 0.01 },
|
|
459
|
-
]);
|
|
460
|
-
await runThreeSessionTdd({
|
|
461
|
-
agent,
|
|
462
|
-
story,
|
|
463
|
-
config: DEFAULT_CONFIG,
|
|
464
|
-
workdir: tmpDir,
|
|
465
|
-
modelTier: "balanced",
|
|
466
|
-
});
|
|
467
|
-
|
|
468
|
-
expect(existsSync(verdictPath)).toBe(false); // File cleaned up after run
|
|
469
|
-
});
|
|
470
|
-
|
|
471
|
-
test("no verdict + all sessions succeed → success without running test check", async () => {
|
|
472
|
-
// All sessions succeed, no verdict → should succeed and NOT run the test command
|
|
473
|
-
let testCommandCalled = false;
|
|
474
|
-
mockGitAndTestForT9({
|
|
475
|
-
onTestCmd: () => {
|
|
476
|
-
testCommandCalled = true;
|
|
477
|
-
return { exitCode: 0, stdout: "" };
|
|
478
|
-
},
|
|
479
|
-
});
|
|
480
|
-
|
|
481
|
-
const agent = createMockAgent([
|
|
482
|
-
{ success: true, estimatedCost: 0.01 },
|
|
483
|
-
{ success: true, estimatedCost: 0.02 },
|
|
484
|
-
{ success: true, estimatedCost: 0.01 },
|
|
485
|
-
]);
|
|
486
|
-
|
|
487
|
-
// Disable rectification to avoid test command being called for full-suite gate
|
|
488
|
-
const configNoRectification = {
|
|
489
|
-
...DEFAULT_CONFIG,
|
|
490
|
-
execution: {
|
|
491
|
-
...DEFAULT_CONFIG.execution,
|
|
492
|
-
rectification: { ...DEFAULT_CONFIG.execution.rectification, enabled: false },
|
|
493
|
-
},
|
|
494
|
-
};
|
|
495
|
-
|
|
496
|
-
const result = await runThreeSessionTdd({
|
|
497
|
-
agent,
|
|
498
|
-
story,
|
|
499
|
-
config: configNoRectification,
|
|
500
|
-
workdir: tmpDir,
|
|
501
|
-
modelTier: "balanced",
|
|
502
|
-
});
|
|
503
|
-
|
|
504
|
-
expect(result.success).toBe(true);
|
|
505
|
-
expect(testCommandCalled).toBe(false); // Not needed when sessions all succeed
|
|
506
|
-
expect(result.verdict).toBeNull(); // No verdict
|
|
507
|
-
expect(result.failureCategory).toBeUndefined();
|
|
508
|
-
});
|
|
509
|
-
|
|
510
|
-
test("early-exit before session 3 (session 1 fails) → verdict is undefined (not attempted)", async () => {
|
|
511
|
-
// If we exit before session 3, verdict reading is never attempted
|
|
512
|
-
mockGitAndTestForT9({
|
|
513
|
-
diffFiles: [
|
|
514
|
-
["test/user.test.ts"], // s1 isolation
|
|
515
|
-
["test/user.test.ts"], // s1 getChangedFiles
|
|
516
|
-
],
|
|
517
|
-
});
|
|
518
|
-
|
|
519
|
-
const agent = createMockAgent([
|
|
520
|
-
{ success: false, exitCode: 1, estimatedCost: 0.01 }, // session 1 fails
|
|
521
|
-
]);
|
|
522
|
-
|
|
523
|
-
const result = await runThreeSessionTdd({
|
|
524
|
-
agent,
|
|
525
|
-
story,
|
|
526
|
-
config: DEFAULT_CONFIG,
|
|
527
|
-
workdir: tmpDir,
|
|
528
|
-
modelTier: "balanced",
|
|
529
|
-
});
|
|
530
|
-
|
|
531
|
-
expect(result.success).toBe(false);
|
|
532
|
-
expect(result.sessions).toHaveLength(1);
|
|
533
|
-
// verdict is undefined (field not set) because we never got to session 3
|
|
534
|
-
expect(result.verdict).toBeUndefined();
|
|
535
|
-
});
|
|
536
|
-
});
|
|
@@ -1,30 +0,0 @@
|
|
|
1
|
-
{"timestamp":"2026-03-06T08:58:27.466Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
2
|
-
{"timestamp":"2026-03-06T08:58:27.482Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
3
|
-
{"timestamp":"2026-03-06T08:58:27.482Z","level":"debug","stage":"test.stage","message":"Debug message"}
|
|
4
|
-
{"timestamp":"2026-03-06T08:58:27.482Z","level":"info","stage":"test.stage","message":"Info message"}
|
|
5
|
-
{"timestamp":"2026-03-06T08:58:27.482Z","level":"error","stage":"test.stage","message":"Error message"}
|
|
6
|
-
{"timestamp":"2026-03-06T08:58:27.483Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
7
|
-
{"timestamp":"2026-03-06T09:00:48.487Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
8
|
-
{"timestamp":"2026-03-06T09:00:48.520Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
9
|
-
{"timestamp":"2026-03-06T09:00:48.521Z","level":"debug","stage":"test.stage","message":"Debug message"}
|
|
10
|
-
{"timestamp":"2026-03-06T09:00:48.521Z","level":"info","stage":"test.stage","message":"Info message"}
|
|
11
|
-
{"timestamp":"2026-03-06T09:00:48.521Z","level":"error","stage":"test.stage","message":"Error message"}
|
|
12
|
-
{"timestamp":"2026-03-06T09:00:48.521Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
13
|
-
{"timestamp":"2026-03-06T09:03:16.966Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
14
|
-
{"timestamp":"2026-03-06T09:03:16.981Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
15
|
-
{"timestamp":"2026-03-06T09:03:16.981Z","level":"debug","stage":"test.stage","message":"Debug message"}
|
|
16
|
-
{"timestamp":"2026-03-06T09:03:16.981Z","level":"info","stage":"test.stage","message":"Info message"}
|
|
17
|
-
{"timestamp":"2026-03-06T09:03:16.981Z","level":"error","stage":"test.stage","message":"Error message"}
|
|
18
|
-
{"timestamp":"2026-03-06T09:03:16.982Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
19
|
-
{"timestamp":"2026-03-06T09:08:50.110Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
20
|
-
{"timestamp":"2026-03-06T09:08:50.143Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
21
|
-
{"timestamp":"2026-03-06T09:08:50.144Z","level":"debug","stage":"test.stage","message":"Debug message"}
|
|
22
|
-
{"timestamp":"2026-03-06T09:08:50.144Z","level":"info","stage":"test.stage","message":"Info message"}
|
|
23
|
-
{"timestamp":"2026-03-06T09:08:50.144Z","level":"error","stage":"test.stage","message":"Error message"}
|
|
24
|
-
{"timestamp":"2026-03-06T09:08:50.144Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
25
|
-
{"timestamp":"2026-03-06T10:13:12.262Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
26
|
-
{"timestamp":"2026-03-06T10:13:12.263Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|
|
27
|
-
{"timestamp":"2026-03-06T10:13:12.263Z","level":"debug","stage":"test.stage","message":"Debug message"}
|
|
28
|
-
{"timestamp":"2026-03-06T10:13:12.263Z","level":"info","stage":"test.stage","message":"Info message"}
|
|
29
|
-
{"timestamp":"2026-03-06T10:13:12.263Z","level":"error","stage":"test.stage","message":"Error message"}
|
|
30
|
-
{"timestamp":"2026-03-06T10:13:12.263Z","level":"info","stage":"test.stage","message":"Test message","data":{"foo":"bar"}}
|