npm - @nathapp/nax - Versions diffs - 0.67.17 → 0.67.19 - Mend

@nathapp/nax 0.67.17 → 0.67.19

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (2)

package/dist/nax.js +241 -57
package/package.json +1 -1

package/dist/nax.js CHANGED Viewed

@@ -29750,11 +29750,14 @@ function buildStorySection(story) {
 function buildVerdictSection(story) {
   return `# Verdict Instructions
-## Write Verdict File
+## Write Verdict File and Emit JSON in Final Reply
-After completing your verification, you **MUST** write a verdict file at the **project root**:
+After completing your verification, you **MUST** do BOTH of the following:
-**File:** \`.nax-verifier-verdict.json\`
+1. Write the verdict file at the **project root**: \`.nax-verifier-verdict.json\`
+2. Emit the same verdict JSON as the FINAL content of your reply \u2014 no prose
+   before or after, no markdown fences. Your reply must end with a closing
+   brace \`}\` on its own line. The orchestrator parses your reply as JSON.
 Set \`approved: true\` when ALL of these conditions are met:
 - All story-scoped tests pass (the orchestrator already attempted the full-suite gate \u2014 you only need to verify the story's own tests)
@@ -29778,7 +29781,7 @@ Set \`approved: false\` when ANY of these conditions are true:
 - \`fixes\` \u2014 keep this empty; the verifier must not apply code or test fixes
 - \`reasoning\` \u2014 brief summary of your overall assessment
-When done, do not commit code changes. Only write the verdict file.`;
+When done, do not commit code changes. Write the verdict file, then end your reply with the JSON object.`;
 }
 // src/prompts/sections/conventions.ts
@@ -30164,6 +30167,24 @@ class TddPromptBuilder {
     const isolation = role === "test-writer" ? opts.lite ? "lite" : "strict" : undefined;
     return TddPromptBuilder.for(role, { variant, isolation }).withLoader(workdir, config2).story(story).context(opts.contextMarkdown).v2FeatureContext(opts.contextBundle?.pushMarkdown).featureContext(opts.contextBundle ? undefined : opts.featureContextMarkdown).constitution(opts.constitution).testCommand(config2.quality?.commands?.test).hermeticConfig(config2.quality?.testing).build();
   }
+  static verdictRetry() { // Returns the retry prompt asking the verifier to re-emit its verdict as a bare JSON object; used as the `invalid` prompt of verifierOp's parse-retry strategy.
+    return `Your previous reply could not be parsed as a valid VerifierVerdict JSON object.
+` + `Re-emit the verdict as the FINAL content of your reply.
+` + `Output ONLY the JSON object \u2014 no markdown fences, no explanation, no prose.
+` + `The reply must start with { and end with } on its own line.
+` + "Required top-level fields: version, approved, tests, testModifications, acceptanceCriteria, quality, fixes, reasoning."; // same eight top-level keys as the minimal schema in verdictRetryCondensed; this last segment has no trailing newline
+  }
+  static verdictRetryCondensed() { // Returns the retry prompt asking for a shortened verdict (empty criteria/issues/fixes, one-sentence reasoning); used as the `truncated` prompt of verifierOp's parse-retry strategy.
+    return `Your previous reply was truncated and could not be parsed as valid JSON.
+` + `Re-emit a CONDENSED verdict that omits the acceptanceCriteria.criteria[] entries:
+` + `- Keep acceptanceCriteria.allMet (boolean) but use criteria=[] (empty array).
+` + `- Keep quality.issues=[] and fixes=[] empty.
+` + `- Set testModifications.reasoning to a single sentence.
+` + `- Set reasoning to a single sentence.
+` + `Output ONLY the JSON object \u2014 no markdown fences, no prose.
+` + `Schema (minimal):
+` + `{"version":1,"approved":boolean,"tests":{"allPassing":boolean,"passCount":number,"failCount":number},"testModifications":{"detected":boolean,"files":[],"legitimate":boolean,"reasoning":"..."},"acceptanceCriteria":{"allMet":boolean,"criteria":[]},"quality":{"rating":"good"|"acceptable"|"poor","issues":[]},"fixes":[],"reasoning":"..."}`; // schema is literal prompt text (no ${} interpolation); `boolean`/`number` are type placeholders for the model, not evaluated
+  }
   s(id, content) { // Builds an `{ id, content }` record whose `overridable` flag is always false.
     return { id, content, overridable: false };
   }
@@ -31013,6 +31034,7 @@ Severity guide:
 - If you cannot quote an exact excerpt that proves your point, downgrade the finding to \`"unverifiable"\` rather than fabricating a quote.
 **AC-grounding rule \u2014 required for every "error" finding:**
+- Do NOT write an \`acQuote\` that does not appear verbatim in the listed AC text. If you cannot find an exact verbatim match, set severity to \`warning\` \u2014 never approximate, paraphrase, or synthesise a quote. A finding dropped for a fabricated quote wastes a review cycle and is worse than a correctly classified \`warning\`.
 - \`acQuote\` must be a verbatim substring of one AC bullet (from the Acceptance Criteria above) that names or constrains the exact **symbol** you are flagging \u2014 not merely the file the symbol lives in.
 - \`acIndex\` is the 1-based position of that AC bullet in the list.
 - Copy \`acQuote\` **exactly** from the AC text, including any backticks, asterisks, or punctuation. Do not paraphrase, strip formatting, or rewrite.
@@ -31220,7 +31242,7 @@ ${STEP2}${frameworkLine}
 ${STEP3_HEADER}
 ${STEP3_SHARED_RULES}
 - **File output (REQUIRED)**: Write the acceptance test file DIRECTLY to the path shown below. Do NOT output the test code in your response. After writing the file, reply with a brief confirmation.
-- **Path anchor (CRITICAL)**: Write the test file to this exact path: \`${p.targetTestFilePath}\`. Import from package sources using relative paths like \`../../../src/...\` (3 levels up from \`.nax/features/<name>/\` to the package root).
+- **Path anchor (CRITICAL \u2014 do NOT deviate)**: Write the test file to this exact path: \`${p.targetTestFilePath}\`. This path is intentional and computed by the orchestrator \u2014 do not change it based on what you observe in the project. In particular: if you see a \`.nax/features/\` directory at the repo root, that is for stories scoped to the repo root. When a story belongs to a specific package (e.g. \`packages/core\`), its acceptance test lives inside that package's \`.nax/features/\` directory so the test runner can resolve the package's imports correctly. The package root is 3 levels above the test file (\`../../../\` relative to the test file).
 - **Process cwd**: When spawning child processes to invoke a CLI or binary, set the working directory to the **package root** (\`join(import.meta.dir, "../../..")\`) as your default \u2014 unless your Step 2 exploration reveals the CLI uses a different working directory convention (e.g. reads config from \`~/.config/\`, or resolves paths relative to a flag value). Always check how the CLI resolves file paths before assuming.${implSection}`;
   }
   buildGeneratorFromSpecPrompt(p) {
@@ -32776,6 +32798,7 @@ function recordAdversarialAudit(opts) {
     looksLikeFail: opts.looksLikeFail,
     failOpen: opts.failOpen,
     passed: opts.passed,
+    passReason: opts.passReason,
     blockingThreshold: opts.blockingThreshold,
     result: opts.result,
     advisoryFindings: opts.advisoryFindings,
@@ -33109,6 +33132,46 @@ ${formatFindings(blockingFindings)}` : "Adversarial review failed (no findings)"
     };
   }
   if (!opResult.passed && acDropped.length > 0) {
+    const allHallucinated = acDropped.every((d) => d.code === "ac_quote_not_substring");
+    if (allHallucinated) {
+      const demotedFindings = toAdversarialReviewFindings(acDropped.map((d) => ({ ...d.finding, severity: "warning", acQuote: undefined, acIndex: undefined })));
+      const existingAdvisory = advisoryFindings.length > 0 ? toAdversarialReviewFindings(advisoryFindings) : [];
+      const allAdvisory = [...existingAdvisory, ...demotedFindings];
+      logger?.warn("review", "Adversarial review passed: all blocking findings discarded as hallucinated AC quotes", {
+        storyId: story.id,
+        durationMs,
+        droppedCount: acDropped.length,
+        drops: acDropped.map((d) => ({ file: d.finding.file, issue: d.finding.issue }))
+      });
+      recordAdversarialAudit({
+        runtime,
+        workdir,
+        projectDir,
+        storyId: story.id,
+        featureName,
+        parsed: true,
+        failOpen: false,
+        passed: true,
+        passReason: "ac_quote_not_substring_demoted",
+        blockingThreshold: threshold,
+        result: { passed: true, findings: [] },
+        advisoryFindings: allAdvisory.length > 0 ? allAdvisory : undefined,
+        diffAvailable,
+        adversarialDropAnalysis,
+        adversarialAcceptAnalysis: []
+      });
+      return {
+        check: "adversarial",
+        success: true,
+        passReason: "ac_quote_not_substring_demoted",
+        command: "",
+        exitCode: 0,
+        output: `Adversarial review passed: ${acDropped.length} blocking finding(s) demoted to advisory \u2014 all cited AC quotes were fabricated and could not be validated.`,
+        durationMs,
+        advisoryFindings: allAdvisory.length > 0 ? allAdvisory : undefined,
+        cost: llmCost
+      };
+    }
     logger?.warn("review", "Adversarial review fail-closed: blocking findings dropped as ungrounded", {
       storyId: story.id,
       durationMs,
@@ -33653,6 +33716,35 @@ function acFailureToFinding(acId, output) {
     fixTarget: "source"
   };
 }
+function executionFailureToFinding(params) { // Builds one error-severity "test-runner" finding (category "execution-failed") from a raw runner result; reads params.output, exitCode, command, packageDir and cwd.
+  const tail = tailLines(params.output, 40); // 40 must stay in step with the "last 40 lines" wording in the message below
+  const exitStr = params.exitCode !== undefined ? ` (exit ${params.exitCode})` : ""; // NOTE(review): only `undefined` suppresses the suffix; a null exitCode would render as "(exit null)" — confirm callers never pass null
+  const message = `Test runner exited non-zero without structured failures${exitStr}. Command: \`${params.command}\`
+--- runner output (last 40 lines) ---
+${tail}`;
+  return {
+    source: "test-runner",
+    severity: "error",
+    category: "execution-failed", // makeFullSuiteRectifyStrategy.appliesTo accepts this category alongside "failed-test"
+    message,
+    fixTarget: "source",
+    meta: { // raw invocation details kept alongside the human-readable message
+      command: params.command,
+      exitCode: params.exitCode,
+      packageDir: params.packageDir,
+      cwd: params.cwd
+    }
+  };
+}
+function tailLines(s, n) { // Returns the last n newline-separated lines of s joined back with newlines, or "(no output)" when s is falsy.
+  if (!s) // covers undefined, null and the empty string
+    return "(no output)";
+  const lines = s.split(`
+`); // the template literal above is a single newline character
+  return lines.slice(Math.max(0, lines.length - n)).join(`
+`); // Math.max clamps the start index to 0 when s has fewer than n lines
+}
 function acSentinelToFinding(sentinel, _output) {
   if (sentinel === "AC-HOOK") {
     return {
@@ -36874,6 +36966,29 @@ var init_verdict = __esm(() => {
 });
 // src/operations/verify.ts
+function parseVerdictFromStdout(output, _input, _ctx) { // Parses the verifier's stdout into a result object; throws ParseValidationError when no usable verdict can be extracted. _input and _ctx are unused.
+  if (!output || !output.trim()) { // missing, empty or whitespace-only output
+    throw new ParseValidationError("verifier produced no stdout");
+  }
+  const raw = tryParseLLMJson(output); // NOTE(review): presumably tolerant of prose/fences around the JSON — confirm in tryParseLLMJson
+  if (!raw || typeof raw !== "object") {
+    throw new ParseValidationError("verifier stdout is not a JSON object");
+  }
+  const verdict = isValidVerdict(raw) ? raw : coerceVerdict(raw); // use a valid verdict as-is, otherwise attempt coercion
+  if (!verdict) { // coercion produced no verdict
+    throw new ParseValidationError("verifier stdout JSON missing required VerifierVerdict fields");
+  }
+  const categorization = categorizeVerdict(verdict, verdict.tests.allPassing === true); // second argument is the verdict's own tests.allPassing flag, strictly compared to true
+  return {
+    success: categorization.success,
+    filesChanged: [],
+    estimatedCostUsd: 0, // cost and duration are hard-coded to 0 in this parser
+    durationMs: 0,
+    output, // raw stdout passed through unchanged
+    ...categorization.failureCategory && { failureCategory: categorization.failureCategory }, // key is added only when the value is truthy
+    ...categorization.reviewReason && { reviewReason: categorization.reviewReason }
+  };
+}
 async function runVerifierIsolation(beforeRef, ctx) {
   if (!beforeRef)
     return;
@@ -36882,16 +36997,31 @@ async function runVerifierIsolation(beforeRef, ctx) {
 }
 var verifierOp;
 var init_verify = __esm(() => {
+  init_retry();
   init_config();
+  init_tdd_builder();
   init_isolation();
   init_verdict();
-  init__session_output();
   verifierOp = {
     kind: "run",
     name: "verifier",
     stage: "verify",
     session: { role: "verifier", lifetime: "fresh" },
     config: tddConfigSelector,
+    retry: makeParseRetryStrategy({
+      validate: (parsed) => {
+        if (!parsed || typeof parsed !== "object")
+          return false;
+        const r = parsed;
+        return isValidVerdict(r) || coerceVerdict(r) !== null;
+      },
+      reviewerKind: "verifier",
+      maxAttempts: 2,
+      prompts: {
+        invalid: () => TddPromptBuilder.verdictRetry(),
+        truncated: () => TddPromptBuilder.verdictRetryCondensed()
+      }
+    }),
     build(input, _ctx) {
       if (input.promptMarkdown?.trim()) {
         return {
@@ -36908,13 +37038,8 @@ var init_verify = __esm(() => {
         }
       };
     },
-    parse(output, _input, _ctx) {
-      const envelope = parseSessionJsonOutput(output);
-      return { ...envelope, estimatedCostUsd: 0, durationMs: 0 };
-    },
+    parse: parseVerdictFromStdout,
     async verify(parsed, input, ctx) {
-      if (!parsed.success)
-        return null;
       const isolation = await runVerifierIsolation(input.beforeRef, ctx);
       return isolation ? { ...parsed, isolation } : parsed;
     },
@@ -36922,20 +37047,28 @@ var init_verify = __esm(() => {
       const packageDir = verifyCtx.packageView.packageDir;
       try {
         const verdict = await readVerdict(packageDir);
-        if (!verdict)
-          return null;
-        const testsAllPassing = verdict.tests.allPassing === true;
-        const categorization = categorizeVerdict(verdict, testsAllPassing);
-        const isolation = await runVerifierIsolation(input.beforeRef, verifyCtx);
+        if (verdict) {
+          const testsAllPassing = verdict.tests.allPassing === true;
+          const categorization = categorizeVerdict(verdict, testsAllPassing);
+          const isolation = await runVerifierIsolation(input.beforeRef, verifyCtx);
+          return {
+            success: categorization.success,
+            filesChanged: [],
+            estimatedCostUsd: 0,
+            durationMs: 0,
+            output: "",
+            ...categorization.failureCategory && { failureCategory: categorization.failureCategory },
+            ...categorization.reviewReason && { reviewReason: categorization.reviewReason },
+            ...isolation && { isolation }
+          };
+        }
         return {
-          success: categorization.success,
+          success: false,
           filesChanged: [],
           estimatedCostUsd: 0,
           durationMs: 0,
           output: "",
-          ...categorization.failureCategory && { failureCategory: categorization.failureCategory },
-          ...categorization.reviewReason && { reviewReason: categorization.reviewReason },
-          ...isolation && { isolation }
+          reviewReason: "verifier produced unparseable verdict in stdout after retries and no usable verdict file on disk"
         };
       } finally {
         await cleanupVerdict(packageDir);
@@ -37688,7 +37821,9 @@ async function runVerificationCore(options) {
       success: options.acceptOnTimeout ?? false,
       countsTowardEscalation: false,
       error: execution.error,
-      output: execution.output
+      output: execution.output,
+      exitCode: execution.exitCode,
+      command: finalCommand
     };
   }
   const exitCode = execution.exitCode ?? 1;
@@ -37702,7 +37837,9 @@ async function runVerificationCore(options) {
         error: analysis.error,
         output: execution.output,
         passCount: analysis.passCount,
-        failCount: analysis.failCount
+        failCount: analysis.failCount,
+        exitCode,
+        command: finalCommand
       };
     }
     return {
@@ -37711,10 +37848,19 @@ async function runVerificationCore(options) {
       countsTowardEscalation: true,
       output: execution.output,
       passCount: analysis.passCount,
-      failCount: analysis.failCount
+      failCount: analysis.failCount,
+      exitCode,
+      command: finalCommand
     };
   }
-  return { status: "SUCCESS", success: true, countsTowardEscalation: true, output: execution.output };
+  return {
+    status: "SUCCESS",
+    success: true,
+    countsTowardEscalation: true,
+    output: execution.output,
+    exitCode,
+    command: finalCommand
+  };
 }
 async function fullSuite(options) { // Thin wrapper: forwards options unchanged to runVerificationCore and returns its result.
   return runVerificationCore(options);
 }
         failed: parsedSummary.failed ?? 0,
         output: result.output ?? "",
         parsedSummary,
-        timedOut: result.status === "TIMEOUT"
+        timedOut: result.status === "TIMEOUT",
+        exitCode: result.exitCode,
+        command: result.command ?? gateCtx.testCmd
       };
     }
   };
@@ -37818,6 +37966,13 @@ var init_full_suite_gate = __esm(() => {
         };
       }
       const gateCtx = await deps.resolveGateContext(input, ctx);
+      logger.info("verify[regression]", "Running full-suite gate", {
+        storyId: input.story.id,
+        packageDir: input.story.workdir,
+        cwd: input.workdir,
+        command: gateCtx.testCmd,
+        timeoutSeconds: gateCtx.fullSuiteTimeout
+      });
       const testResult = await deps.runTests(input, gateCtx);
       if (testResult.passed) {
         return { success: true, passed: true, status: "passed", estimatedCostUsd: 0, attempts: 0, findings: [] };
@@ -37851,13 +38006,27 @@ var init_full_suite_gate = __esm(() => {
       }
       const findings = testSummaryToFindings(testResult.parsedSummary);
       if (findings.length === 0) {
+        const cmd = testResult.command ?? gateCtx.testCmd;
+        const synth = executionFailureToFinding({
+          command: cmd,
+          exitCode: testResult.exitCode,
+          output: testResult.output,
+          packageDir: input.story.workdir,
+          cwd: input.workdir
+        });
+        logger.warn("verify[regression]", "Full-suite gate execution-failed \u2014 emitting synth finding", {
+          storyId: input.story.id,
+          command: cmd,
+          exitCode: testResult.exitCode,
+          packageDir: input.story.workdir
+        });
         return {
           success: false,
           passed: false,
           status: "execution-failed",
           estimatedCostUsd: 0,
           attempts: 0,
-          findings: []
+          findings: [synth]
         };
       }
       return { success: false, passed: false, status: "failed", estimatedCostUsd: 0, attempts: 0, findings };
@@ -37869,7 +38038,7 @@ var init_full_suite_gate = __esm(() => {
 function makeFullSuiteRectifyStrategy(story, config2) {
   return {
     name: "full-suite-rectify",
-    appliesTo: (finding) => finding.source === "test-runner" && finding.category === "failed-test",
+    appliesTo: (finding) => finding.source === "test-runner" && (finding.category === "failed-test" || finding.category === "execution-failed"),
     fixOp: implementerOp,
     buildInput: (findings) => ({
       story,
@@ -38561,6 +38730,15 @@ var init_verify_scoped = __esm(() => {
           command: selection.effectiveCommand
         });
       }
+      const scopedTimeout = ctxConfig.execution?.regressionGate?.timeoutSeconds ?? 600;
+      logger.info("verify[scoped]", "Running scoped tests", {
+        storyId: input.storyId,
+        packageDir: input.packageDir,
+        cwd: input.workdir,
+        command: selection.effectiveCommand,
+        timeoutSeconds: scopedTimeout,
+        isFullSuite: selection.isFullSuite
+      });
       const start = Date.now();
       const result = await deps.regression({
         workdir: input.workdir,
@@ -51387,9 +51565,9 @@ var init_acceptance2 = __esm(() => {
 function logTestOutput(logger, stage, output, opts = {}) {
   if (!logger || !output)
     return;
-  const tailLines = opts.tailLines ?? 20;
+  const tailLines2 = opts.tailLines ?? 20;
   const lines = output.split(`
-`).slice(-tailLines).join(`
+`).slice(-tailLines2).join(`
 `);
   logger.debug(stage, "Test output (tail)", {
     ...opts.storyId !== undefined && { storyId: opts.storyId },
@@ -52779,10 +52957,13 @@ async function refreshReviewInputForDispatch(opName, input) {
     return fallback;
   }
 }
-function formatPhaseResultMessage(opName, success2) {
+function formatPhaseResultMessage(opName, success2, stage) { // Returns the log message for a finished phase; `stage` is the parameter added in this change.
   if (opName === "greenfield-gate") { // checked first, so greenfield-gate wording wins regardless of stage
     return success2 ? "Greenfield-gate: pre-existing tests detected (not greenfield) \u2014 proceeding with normal TDD" : "Greenfield-gate: no pre-existing tests \u2014 greenfield run, pausing TDD test-writer";
   }
+  if (stage === "rectification") { // rectification phases get a neutral "completed" message that ignores success2
+    return `Rectification strategy completed: ${opName}`;
+  }
   return success2 ? `Phase passed: ${opName}` : `Phase failed: ${opName}`;
 }
 function isSlot(value) {
@@ -52975,7 +53156,7 @@ function logUnifiedReviewPhaseStart(storyId, opName) {
     logger?.info("review", "Running adversarial check", { storyId });
   }
 }
-function logDeterministicPhaseOutcome(storyId, opName, output, durationMs, isTddPhase) {
+function logDeterministicPhaseOutcome(storyId, opName, output, durationMs, isTddPhase, stage) {
   if (isTddPhase)
     return;
   if (opName === "semantic-review" || opName === "adversarial-review")
@@ -52992,7 +53173,11 @@ function logDeterministicPhaseOutcome(storyId, opName, output, durationMs, isTdd
     data.findingsCount = findingsCount;
   if (status !== undefined)
     data.status = status;
-  const message = formatPhaseResultMessage(opName, success2);
+  const message = formatPhaseResultMessage(opName, success2, stage);
+  if (stage === "rectification") {
+    logger?.info("story-orchestrator", message, data);
+    return;
+  }
   if (success2) {
     logger?.info("story-orchestrator", message, data);
   } else {
@@ -53069,7 +53254,7 @@ async function runPhase(ctx, slot, phaseCosts, phaseOutputs, isThreeSession = fa
     phaseOutputs[opName] = output;
     emitReviewDecision(ctx, opName, output);
     logUnifiedReviewPhaseResult(ctx.storyId, opName, output);
-    logDeterministicPhaseOutcome(ctx.storyId, opName, output, Date.now() - phaseStartedAt, isTddPhase);
+    logDeterministicPhaseOutcome(ctx.storyId, opName, output, Date.now() - phaseStartedAt, isTddPhase, slot.op.stage);
     if (isTddPhase) {
       const durationMs = Date.now() - phaseStartedAt;
       logger?.info("tdd", `Session complete: ${opName}`, {
@@ -53453,23 +53638,8 @@ var init_story_orchestrator = __esm(() => {
   STRATEGY_TO_REVALIDATION_PHASES = {
     "mechanical-lintfix": ["lint-check"],
     "mechanical-formatfix": ["lint-check"],
-    "autofix-implementer": [
-      "lint-check",
-      "typecheck-check",
-      "full-suite-gate",
-      "verifier",
-      "verify-scoped",
-      "semantic-review",
-      "adversarial-review"
-    ],
-    "autofix-test-writer": [
-      "lint-check",
-      "typecheck-check",
-      "full-suite-gate",
-      "verifier",
-      "verify-scoped",
-      "adversarial-review"
-    ],
+    "autofix-implementer": ["lint-check", "typecheck-check", "full-suite-gate", "semantic-review", "adversarial-review"],
+    "autofix-test-writer": ["lint-check", "typecheck-check", "full-suite-gate", "adversarial-review"],
     "full-suite-rectify": [
       "lint-check",
       "typecheck-check",
@@ -53817,7 +53987,7 @@ function routeTddFailure(failureCategory, isLiteMode, ctx, reviewReason, failure
     }
     return { action: "escalate", reason: buildReason("isolation-violation") };
   }
-  if (failureCategory === "session-failure" || failureCategory === "tests-failing" || failureCategory === "full-suite-gate-exhausted" || failureCategory === "verifier-rejected") {
+  if (failureCategory === "session-failure" || failureCategory === "tests-failing" || failureCategory === "full-suite-gate-exhausted" || failureCategory === "verifier-rejected" || failureCategory === "runtime-crash") {
     return { action: "escalate", reason: buildReason(failureCategory) };
   }
   if (failureCategory === "greenfield-no-tests") {
@@ -53989,6 +54159,12 @@ function deriveTddFailureCategory(phaseOutputs, unfixedFindings) {
       return "full-suite-gate-exhausted";
     }
   }
+  if (!verifierPassed) {
+    const rectOutputCrash = phaseOutputs.rectification;
+    if (rectOutputCrash?.exitReason === "validator-error") {
+      return "runtime-crash";
+    }
+  }
   if (!verifierPassed) {
     const gateOutput = phaseOutputs[fullSuiteGateOp.name];
     if (gateOutput && (gateOutput.success === false || gateOutput.passed === false)) {
@@ -54321,9 +54497,10 @@ var init_post_run = __esm(() => {
 });
 // src/pipeline/stages/execution.ts
-var executionStage, _executionDeps;
+var RUNTIME_CRASH_CODES, executionStage, _executionDeps;
 var init_execution = __esm(() => {
   init_agents();
+  init_errors();
   init_build_plan_for_strategy();
   init_plan_inputs();
   init_post_run();
@@ -54331,6 +54508,7 @@ var init_execution = __esm(() => {
   init_logger2();
   init_git();
   init_execution_helpers();
+  RUNTIME_CRASH_CODES = new Set(["CALL_OP_NO_OUTPUT", "CALL_OP_MAX_RETRIES"]);
   executionStage = {
     name: "execution",
     enabled: () => true,
@@ -54389,10 +54567,15 @@ var init_execution = __esm(() => {
       } : null;
       const initialRef = tddMode ? await _executionDeps.captureGitRef(ctx.workdir) ?? "HEAD" : null;
       const inputs = await _executionDeps.assemblePlanInputsFromCtx(ctx);
-      const plan = await buildPlanForStrategy(callCtx, ctx.story, ctx.config, ctx.routing.testStrategy, inputs);
+      const plan = await _executionDeps.buildPlanForStrategy(callCtx, ctx.story, ctx.config, ctx.routing.testStrategy, inputs);
       let planResult;
       try {
         planResult = await plan.run();
+      } catch (err) {
+        if (err instanceof NaxError && RUNTIME_CRASH_CODES.has(err.code)) {
+          ctx.tddFailureCategory = "runtime-crash";
+        }
+        throw err;
       } finally {
         unsubscribe();
       }
@@ -54414,6 +54597,7 @@ var init_execution = __esm(() => {
     validateAgentForTier,
     captureGitRef,
     assemblePlanInputsFromCtx,
+    buildPlanForStrategy,
     applyPostRunInspection,
     decideStageAction
   };
@@ -57833,7 +58017,7 @@ var package_default;
 var init_package = __esm(() => {
   package_default = {
     name: "@nathapp/nax",
-    version: "0.67.17",
+    version: "0.67.19",
     description: "AI Coding Agent Orchestrator \u2014 loops until done",
     type: "module",
     bin: {
@@ -57928,8 +58112,8 @@ var init_version = __esm(() => {
   NAX_VERSION = package_default.version;
   NAX_COMMIT = (() => {
     try {
-      if (/^[0-9a-f]{6,10}$/.test("74621ad5"))
-        return "74621ad5";
+      if (/^[0-9a-f]{6,10}$/.test("e80ba4d6"))
+        return "e80ba4d6";
     } catch {}
     try {
       const result = Bun.spawnSync(["git", "rev-parse", "--short", "HEAD"], {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@nathapp/nax",
-  "version": "0.67.17",
+  "version": "0.67.19",
   "description": "AI Coding Agent Orchestrator — loops until done",
   "type": "module",
   "bin": {