npm - @nathapp/nax - Versions diffs - 0.54.3 → 0.54.5 - Mend

@nathapp/nax 0.54.3 → 0.54.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2)

package/dist/nax.js +795 -715
package/package.json +1 -1

package/dist/nax.js CHANGED

@@ -18945,7 +18945,7 @@ Rules:
 - Every test MUST have real assertions that PASS when the feature is correctly implemented and FAIL when it is broken
 - **Prefer behavioral tests** \u2014 import functions and call them rather than reading source files. For example, to verify "getPostRunActions() returns empty array", import PluginRegistry and call getPostRunActions(), don't grep the source file for the method name.
 - **File output (REQUIRED)**: Write the acceptance test file DIRECTLY to the path shown below. Do NOT output the test code in your response. After writing the file, reply with a brief confirmation.
-- **Path anchor (CRITICAL)**: Write the test file to this exact path: \`${options.featureDir}/${acceptanceTestFilename(options.language)}\`. Import from package sources using relative paths like \`./src/...\`. No deep \`../../../../\` traversal needed.`;
+- **Path anchor (CRITICAL)**: Write the test file to this exact path: \`${join2(options.workdir, ".nax", "features", options.featureName, acceptanceTestFilename(options.language))}\`. Import from package sources using relative paths like \`../../../src/...\` (3 levels up from \`.nax/features/<name>/\` to the package root).`;
   const prompt = basePrompt;
   logger.info("acceptance", "Generating tests from PRD refined criteria", { count: refinedCriteria.length });
   const rawOutput = await (options.adapter ?? _generatorPRDDeps.adapter).complete(prompt, {
@@ -18963,7 +18963,7 @@ Rules:
     outputPreview: rawOutput.slice(0, 300)
   });
   if (!testCode) {
-    const targetPath = join2(options.featureDir, acceptanceTestFilename(options.language));
+    const targetPath = join2(options.workdir, ".nax", "features", options.featureName, acceptanceTestFilename(options.language));
     let recoveryFailed = false;
     logger.debug("acceptance", "BUG-076 recovery: checking for agent-written file", { targetPath });
     try {
@@ -22348,7 +22348,7 @@ var package_default;
 var init_package = __esm(() => {
   package_default = {
     name: "@nathapp/nax",
-    version: "0.54.3",
+    version: "0.54.5",
     description: "AI Coding Agent Orchestrator \u2014 loops until done",
     type: "module",
     bin: {
@@ -22425,8 +22425,8 @@ var init_version = __esm(() => {
   NAX_VERSION = package_default.version;
   NAX_COMMIT = (() => {
     try {
-      if (/^[0-9a-f]{6,10}$/.test("5acee1f"))
-        return "5acee1f";
+      if (/^[0-9a-f]{6,10}$/.test("e98d5b1"))
+        return "e98d5b1";
     } catch {}
     try {
       const result = Bun.spawnSync(["git", "rev-parse", "--short", "HEAD"], {
@@ -22444,316 +22444,37 @@ var init_version = __esm(() => {
   NAX_BUILD_INFO = NAX_COMMIT === "dev" ? `v${NAX_VERSION}` : `v${NAX_VERSION} (${NAX_COMMIT})`;
 });
-// src/prd/validate.ts
-function validateStoryId(id) {
-  if (!id || id.length === 0) {
-    throw new Error("Story ID cannot be empty");
-  }
-  if (id.includes("..")) {
-    throw new Error("Story ID cannot contain path traversal (..)");
-  }
-  if (id.startsWith("--")) {
-    throw new Error("Story ID cannot start with git flags (--)");
-  }
-  const validPattern = /^[a-zA-Z0-9][a-zA-Z0-9._-]{0,63}$/;
-  if (!validPattern.test(id)) {
-    throw new Error(`Story ID must match pattern [a-zA-Z0-9][a-zA-Z0-9._-]{0,63}. Got: ${id}`);
-  }
-}
-// src/errors.ts
-var NaxError, AgentNotFoundError, AgentNotInstalledError, StoryLimitExceededError, LockAcquisitionError;
-var init_errors3 = __esm(() => {
-  NaxError = class NaxError extends Error {
-    code;
-    context;
-    constructor(message, code, context) {
-      super(message);
-      this.code = code;
-      this.context = context;
-      this.name = "NaxError";
-      Error.captureStackTrace(this, this.constructor);
-    }
-  };
-  AgentNotFoundError = class AgentNotFoundError extends NaxError {
-    constructor(agentName, binary) {
-      super(`Agent "${agentName}" not found or not installed`, "AGENT_NOT_FOUND", { agentName, binary });
-      this.name = "AgentNotFoundError";
-    }
-  };
-  AgentNotInstalledError = class AgentNotInstalledError extends NaxError {
-    constructor(agentName, binary) {
-      super(`Agent "${agentName}" is not installed or not in PATH: ${binary}`, "AGENT_NOT_INSTALLED", {
-        agentName,
-        binary
-      });
-      this.name = "AgentNotInstalledError";
-    }
-  };
-  StoryLimitExceededError = class StoryLimitExceededError extends NaxError {
-    constructor(totalStories, limit) {
-      super(`Feature exceeds story limit: ${totalStories} stories (max: ${limit})`, "STORY_LIMIT_EXCEEDED", {
-        totalStories,
-        limit
-      });
-      this.name = "StoryLimitExceededError";
-    }
-  };
-  LockAcquisitionError = class LockAcquisitionError extends NaxError {
-    constructor(workdir) {
-      super("Another nax process is already running in this directory", "LOCK_ACQUISITION_FAILED", { workdir });
-      this.name = "LockAcquisitionError";
-    }
-  };
-});
-// src/metrics/tracker.ts
-import path2 from "path";
-function collectStoryMetrics(ctx, storyStartTime) {
-  const story = ctx.story;
-  const routing = ctx.routing;
-  const agentResult = ctx.agentResult;
-  const escalationCount = story.escalations?.length || 0;
-  const priorFailureCount = story.priorFailures?.length || 0;
-  const attempts = priorFailureCount + Math.max(1, story.attempts || 1);
-  const finalTier = escalationCount > 0 ? story.escalations[escalationCount - 1].toTier : routing.modelTier;
-  const firstPassSuccess = agentResult?.success === true && escalationCount === 0 && priorFailureCount === 0;
-  const modelEntry = ctx.config.models[routing.modelTier];
-  const modelDef = modelEntry ? resolveModel(modelEntry) : null;
-  const modelUsed = modelDef?.model || routing.modelTier;
-  const initialComplexity = story.routing?.initialComplexity ?? routing.complexity;
-  const isTddStrategy = routing.testStrategy === "three-session-tdd" || routing.testStrategy === "three-session-tdd-lite";
-  const fullSuiteGatePassed = isTddStrategy ? ctx.fullSuiteGatePassed ?? false : false;
+// src/interaction/bridge-builder.ts
+function buildInteractionBridge(chain, context, timeoutMs = DEFAULT_INTERACTION_TIMEOUT_MS) {
+  const plugin = chain?.getPrimary();
+  if (!plugin)
+    return;
   return {
-    storyId: story.id,
-    complexity: routing.complexity,
-    initialComplexity,
-    modelTier: routing.modelTier,
-    modelUsed,
-    attempts,
-    finalTier,
-    success: agentResult?.success || false,
-    cost: (ctx.accumulatedAttemptCost ?? 0) + (agentResult?.estimatedCost || 0),
-    durationMs: agentResult?.durationMs || 0,
-    firstPassSuccess,
-    startedAt: storyStartTime,
-    completedAt: new Date().toISOString(),
-    fullSuiteGatePassed,
-    runtimeCrashes: ctx.storyRuntimeCrashes ?? 0
-  };
-}
-function collectBatchMetrics(ctx, storyStartTime) {
-  const stories = ctx.stories;
-  const routing = ctx.routing;
-  const agentResult = ctx.agentResult;
-  const totalCost = agentResult?.estimatedCost || 0;
-  const totalDuration = agentResult?.durationMs || 0;
-  const costPerStory = totalCost / stories.length;
-  const durationPerStory = totalDuration / stories.length;
-  const modelEntry = ctx.config.models[routing.modelTier];
-  const modelDef = modelEntry ? resolveModel(modelEntry) : null;
-  const modelUsed = modelDef?.model || routing.modelTier;
-  return stories.map((story) => {
-    const initialComplexity = story.routing?.initialComplexity ?? routing.complexity;
-    return {
-      storyId: story.id,
-      complexity: routing.complexity,
-      initialComplexity,
-      modelTier: routing.modelTier,
-      modelUsed,
-      attempts: 1,
-      finalTier: routing.modelTier,
-      success: true,
-      cost: costPerStory,
-      durationMs: durationPerStory,
-      firstPassSuccess: true,
-      startedAt: storyStartTime,
-      completedAt: new Date().toISOString(),
-      fullSuiteGatePassed: false,
-      runtimeCrashes: 0
-    };
-  });
-}
-async function saveRunMetrics(workdir, runMetrics) {
-  const metricsPath = path2.join(workdir, ".nax", "metrics.json");
-  const existing = await loadJsonFile(metricsPath, "metrics");
-  const allMetrics = Array.isArray(existing) ? existing : [];
-  allMetrics.push(runMetrics);
-  await saveJsonFile(metricsPath, allMetrics, "metrics");
-}
-async function loadRunMetrics(workdir) {
-  const metricsPath = path2.join(workdir, ".nax", "metrics.json");
-  const content = await loadJsonFile(metricsPath, "metrics");
-  return Array.isArray(content) ? content : [];
-}
-var init_tracker = __esm(() => {
-  init_schema();
-  init_json_file();
-});
-// src/metrics/aggregator.ts
-function calculateAggregateMetrics(runs) {
-  if (runs.length === 0) {
-    return {
-      totalRuns: 0,
-      totalCost: 0,
-      totalStories: 0,
-      firstPassRate: 0,
-      escalationRate: 0,
-      avgCostPerStory: 0,
-      avgCostPerFeature: 0,
-      modelEfficiency: {},
-      complexityAccuracy: {}
-    };
-  }
-  const allStories = runs.flatMap((run) => run.stories);
-  const totalRuns = runs.length;
-  const totalCost = runs.reduce((sum, run) => sum + run.totalCost, 0);
-  const totalStories = allStories.length;
-  const firstPassSuccesses = allStories.filter((s) => s.firstPassSuccess).length;
-  const firstPassRate = totalStories > 0 ? firstPassSuccesses / totalStories : 0;
-  const escalatedStories = allStories.filter((s) => s.attempts > 1).length;
-  const escalationRate = totalStories > 0 ? escalatedStories / totalStories : 0;
-  const avgCostPerStory = totalStories > 0 ? totalCost / totalStories : 0;
-  const avgCostPerFeature = totalRuns > 0 ? totalCost / totalRuns : 0;
-  const modelStats = new Map;
-  for (const story of allStories) {
-    const modelKey = story.modelUsed;
-    const existing = modelStats.get(modelKey) || {
-      attempts: 0,
-      successes: 0,
-      totalCost: 0
-    };
-    modelStats.set(modelKey, {
-      attempts: existing.attempts + story.attempts,
-      successes: existing.successes + (story.success ? 1 : 0),
-      totalCost: existing.totalCost + story.cost
-    });
-  }
-  const modelEfficiency = {};
-  for (const [modelKey, stats] of modelStats) {
-    const passRate = stats.attempts > 0 ? stats.successes / stats.attempts : 0;
-    const avgCost = stats.successes > 0 ? stats.totalCost / stats.successes : 0;
-    modelEfficiency[modelKey] = {
-      attempts: stats.attempts,
-      successes: stats.successes,
-      passRate,
-      avgCost,
-      totalCost: stats.totalCost
-    };
-  }
-  const complexityStats = new Map;
-  for (const story of allStories) {
-    const complexity = story.initialComplexity ?? story.complexity;
-    const existing = complexityStats.get(complexity) || {
-      predicted: 0,
-      tierCounts: new Map,
-      mismatches: 0
-    };
-    existing.predicted += 1;
-    const finalTier = story.finalTier;
-    existing.tierCounts.set(finalTier, (existing.tierCounts.get(finalTier) || 0) + 1);
-    if (story.modelTier !== story.finalTier) {
-      existing.mismatches += 1;
-    }
-    complexityStats.set(complexity, existing);
-  }
-  const complexityAccuracy = {};
-  for (const [complexity, stats] of complexityStats) {
-    let maxCount = 0;
-    let mostCommonTier = "unknown";
-    for (const [tier, count] of stats.tierCounts) {
-      if (count > maxCount) {
-        maxCount = count;
-        mostCommonTier = tier;
+    detectQuestion: async (text) => QUESTION_PATTERNS.some((p) => p.test(text)),
+    onQuestionDetected: async (text) => {
+      const requestId = `ix-${context.stage}-${Date.now()}-${Math.random().toString(36).slice(2, 9)}`;
+      await plugin.send({
+        id: requestId,
+        type: "input",
+        featureName: context.featureName ?? "unknown",
+        storyId: context.storyId,
+        stage: context.stage,
+        summary: text,
+        fallback: "continue",
+        createdAt: Date.now()
+      });
+      try {
+        const response = await plugin.receive(requestId, timeoutMs);
+        return response.value ?? "continue";
+      } catch {
+        return "continue";
       }
     }
-    const mismatchRate = stats.predicted > 0 ? stats.mismatches / stats.predicted : 0;
-    complexityAccuracy[complexity] = {
-      predicted: stats.predicted,
-      actualTierUsed: mostCommonTier,
-      mismatchRate
-    };
-  }
-  return {
-    totalRuns,
-    totalCost,
-    totalStories,
-    firstPassRate,
-    escalationRate,
-    avgCostPerStory,
-    avgCostPerFeature,
-    modelEfficiency,
-    complexityAccuracy
   };
 }
-function getLastRun(runs) {
-  if (runs.length === 0) {
-    return null;
-  }
-  return runs[runs.length - 1];
-}
-// src/metrics/index.ts
-var init_metrics = __esm(() => {
-  init_tracker();
-});
-// src/interaction/types.ts
-var TRIGGER_METADATA;
-var init_types4 = __esm(() => {
-  TRIGGER_METADATA = {
-    "security-review": {
-      defaultFallback: "abort",
-      safety: "red",
-      defaultSummary: "Security review failed \u2014 abort execution?"
-    },
-    "cost-exceeded": {
-      defaultFallback: "abort",
-      safety: "red",
-      defaultSummary: "Cost limit exceeded ({{cost}} USD) \u2014 abort execution?"
-    },
-    "merge-conflict": {
-      defaultFallback: "abort",
-      safety: "red",
-      defaultSummary: "Merge conflict detected in {{storyId}} \u2014 abort execution?"
-    },
-    "cost-warning": {
-      defaultFallback: "escalate",
-      safety: "yellow",
-      defaultSummary: "Cost warning: {{cost}} USD / {{limit}} USD \u2014 escalate to higher tier?"
-    },
-    "max-retries": {
-      defaultFallback: "skip",
-      safety: "yellow",
-      defaultSummary: "Max retries reached for {{storyId}} \u2014 skip story?"
-    },
-    "pre-merge": {
-      defaultFallback: "escalate",
-      safety: "yellow",
-      defaultSummary: "Pre-merge checkpoint for {{storyId}} \u2014 proceed with merge?"
-    },
-    "human-review": {
-      defaultFallback: "skip",
-      safety: "yellow",
-      defaultSummary: "Human review required for story {{storyId}} \u2014 skip and continue?"
-    },
-    "story-oversized": {
-      defaultFallback: "continue",
-      safety: "yellow",
-      defaultSummary: "Story {{storyId}} is oversized ({{criteriaCount}} acceptance criteria) \u2014 decompose into smaller stories?"
-    },
-    "story-ambiguity": {
-      defaultFallback: "continue",
-      safety: "green",
-      defaultSummary: "Story {{storyId}} requirements unclear \u2014 continue with best effort?"
-    },
-    "review-gate": {
-      defaultFallback: "continue",
-      safety: "green",
-      defaultSummary: "Code review checkpoint for {{storyId}} \u2014 proceed?"
-    }
-  };
+var QUESTION_PATTERNS, DEFAULT_INTERACTION_TIMEOUT_MS = 120000;
+var init_bridge_builder = __esm(() => {
+  QUESTION_PATTERNS = [/\?/, /\bwhich\b/i, /\bshould i\b/i, /\bunclear\b/i, /\bplease clarify\b/i];
 });
 // src/interaction/chain.ts
@@ -22844,47 +22565,166 @@ class InteractionChain {
   }
 }
-// src/interaction/state.ts
-import * as path3 from "path";
-async function loadPendingInteraction(requestId, featureDir) {
-  const interactionsDir = path3.join(featureDir, "interactions");
-  const filename = `${requestId}.json`;
-  const filePath = path3.join(interactionsDir, filename);
-  try {
-    const file2 = Bun.file(filePath);
-    const exists = await file2.exists();
-    if (!exists) {
-      return null;
+// src/interaction/plugins/auto.ts
+class AutoInteractionPlugin {
+  name = "auto";
+  config = {};
+  async init(config2) {
+    const cfg = AutoConfigSchema.parse(config2);
+    this.config = {
+      model: cfg.model ?? "fast",
+      confidenceThreshold: cfg.confidenceThreshold ?? 0.7,
+      maxCostPerDecision: cfg.maxCostPerDecision ?? 0.01,
+      naxConfig: cfg.naxConfig
+    };
+  }
+  async destroy() {}
+  async send(request) {}
+  async receive(_requestId, _timeout = 60000) {
+    throw new Error("Auto plugin requires full request context (not just requestId)");
+  }
+  async decide(request) {
+    if (request.metadata?.trigger === "security-review") {
+      return;
+    }
+    try {
+      if (_autoPluginDeps.callLlm) {
+        const decision2 = await _autoPluginDeps.callLlm(request);
+        if (decision2.confidence < (this.config.confidenceThreshold ?? 0.7)) {
+          return;
+        }
+        return {
+          requestId: request.id,
+          action: decision2.action,
+          value: decision2.value,
+          respondedBy: "auto-ai",
+          respondedAt: Date.now()
+        };
+      }
+      const decision = await this.callLlm(request);
+      if (decision.confidence < (this.config.confidenceThreshold ?? 0.7)) {
+        return;
+      }
+      return {
+        requestId: request.id,
+        action: decision.action,
+        value: decision.value,
+        respondedBy: "auto-ai",
+        respondedAt: Date.now()
+      };
+    } catch (err) {
+      return;
     }
-    const json2 = await file2.text();
-    const request = JSON.parse(json2);
-    return request;
-  } catch {
-    return null;
   }
-}
-async function listPendingInteractions(featureDir) {
-  const interactionsDir = path3.join(featureDir, "interactions");
-  try {
-    const dir = Bun.file(interactionsDir);
-    const exists = await dir.exists();
-    if (!exists) {
-      return [];
+  async callLlm(request) {
+    const prompt = this.buildPrompt(request);
+    const adapter = _autoPluginDeps.adapter;
+    if (!adapter) {
+      throw new Error("Auto plugin requires adapter to be injected via _autoPluginDeps.adapter");
     }
-    const proc = Bun.spawn(["ls", interactionsDir], {
-      stdout: "pipe",
-      stderr: "pipe"
+    let modelArg;
+    if (this.config.naxConfig) {
+      const modelTier = this.config.model ?? "fast";
+      const modelEntry = this.config.naxConfig.models[modelTier];
+      if (!modelEntry) {
+        throw new Error(`Model tier "${modelTier}" not found in config.models`);
+      }
+      const modelDef = resolveModel(modelEntry);
+      modelArg = modelDef.model;
+    }
+    const output = await adapter.complete(prompt, {
+      ...modelArg && { model: modelArg },
+      jsonMode: true,
+      ...this.config.naxConfig && { config: this.config.naxConfig },
+      featureName: request.featureName,
+      storyId: request.storyId,
+      sessionRole: "auto"
     });
-    const output = await new Response(proc.stdout).text();
-    await proc.exited;
-    const files = output.split(`
-`).filter((f) => f.endsWith(".json") && f !== ".gitkeep").map((f) => f.replace(".json", ""));
-    return files;
-  } catch {
-    return [];
+    return this.parseResponse(output);
+  }
+  buildPrompt(request) {
+    let prompt = `You are an AI decision assistant for a code orchestration system. Given an interaction request, decide the best action.
+## Interaction Request
+Type: ${request.type}
+Stage: ${request.stage}
+Feature: ${request.featureName}
+${request.storyId ? `Story: ${request.storyId}` : ""}
+Summary: ${request.summary.replace(/`/g, "\\`").replace(/\$/g, "\\$")}
+${request.detail ? `
+Detail: ${request.detail.replace(/`/g, "\\`").replace(/\$/g, "\\$")}` : ""}
+`;
+    if (request.options && request.options.length > 0) {
+      prompt += `
+Options:
+`;
+      for (const opt of request.options) {
+        const desc = opt.description ? ` \u2014 ${opt.description}` : "";
+        prompt += `  [${opt.key}] ${opt.label}${desc}
+`;
+      }
+    }
+    prompt += `
+Fallback behavior on timeout: ${request.fallback}
+Safety tier: ${request.metadata?.safety ?? "unknown"}
+## Available Actions
+- approve: Proceed with the operation
+- reject: Deny the operation
+- choose: Select an option (requires value field)
+- input: Provide text input (requires value field)
+- skip: Skip this interaction
+- abort: Abort execution
+## Rules
+1. For "red" safety tier (security-review, cost-exceeded, merge-conflict): ALWAYS return confidence 0 to escalate to human
+2. For "yellow" safety tier (cost-warning, max-retries, pre-merge): High confidence (0.8+) ONLY if clearly safe
+3. For "green" safety tier (story-ambiguity, review-gate): Can approve with moderate confidence (0.6+)
+4. Default to the fallback behavior if unsure
+5. Never auto-approve security issues
+6. If the summary mentions "critical" or "security", confidence MUST be < 0.5
+Respond with ONLY this JSON (no markdown, no explanation):
+{"action":"approve|reject|choose|input|skip|abort","value":"<optional>","confidence":0.0-1.0,"reasoning":"<one line>"}`;
+    return prompt;
+  }
+  parseResponse(output) {
+    let jsonText = output.trim();
+    if (jsonText.startsWith("```")) {
+      const lines = jsonText.split(`
+`);
+      jsonText = lines.slice(1, -1).join(`
+`).trim();
+    }
+    if (jsonText.startsWith("json")) {
+      jsonText = jsonText.slice(4).trim();
+    }
+    const parsed = JSON.parse(jsonText);
+    if (!parsed.action || parsed.confidence === undefined || !parsed.reasoning) {
+      throw new Error(`Invalid LLM response: ${jsonText}`);
+    }
+    if (parsed.confidence < 0 || parsed.confidence > 1) {
+      throw new Error(`Invalid confidence: ${parsed.confidence} (must be 0-1)`);
+    }
+    return parsed;
   }
 }
-var init_state = () => {};
+var AutoConfigSchema, _autoPluginDeps;
+var init_auto = __esm(() => {
+  init_zod();
+  init_config();
+  AutoConfigSchema = exports_external.object({
+    model: exports_external.string().optional(),
+    confidenceThreshold: exports_external.number().min(0).max(1).optional(),
+    maxCostPerDecision: exports_external.number().positive().optional(),
+    naxConfig: exports_external.any().optional()
+  });
+  _autoPluginDeps = {
+    adapter: null,
+    callLlm: null
+  };
+});
 // src/interaction/plugins/cli.ts
 import * as readline from "readline";
@@ -22953,9 +22793,9 @@ ${request.summary}
     if (!this.rl) {
       throw new Error("CLI plugin not initialized");
     }
-    const timeoutPromise = new Promise((resolve5) => {
+    const timeoutPromise = new Promise((resolve4) => {
       setTimeout(() => {
-        resolve5({
+        resolve4({
           requestId: request.id,
           action: "skip",
           respondedBy: "timeout",
@@ -23107,9 +22947,9 @@ ${request.summary}
     if (!this.rl) {
       throw new Error("CLI plugin not initialized");
     }
-    return new Promise((resolve5) => {
+    return new Promise((resolve4) => {
       this.rl?.question(prompt, (answer) => {
-        resolve5(answer);
+        resolve4(answer);
       });
     });
   }
@@ -23144,28 +22984,38 @@ class TelegramInteractionPlugin {
     if (!this.botToken || !this.chatId) {
       throw new Error("Telegram plugin not initialized");
     }
-    const text = this.formatMessage(request);
+    const header = this.buildHeader(request);
     const keyboard = this.buildKeyboard(request);
+    const body = this.buildBody(request);
+    const chunks = this.splitText(body, MAX_MESSAGE_CHARS - header.length - 10);
     try {
-      const response = await fetch(`https://api.telegram.org/bot${this.botToken}/sendMessage`, {
-        method: "POST",
-        headers: { "Content-Type": "application/json" },
-        body: JSON.stringify({
-          chat_id: this.chatId,
-          text,
-          reply_markup: keyboard ? { inline_keyboard: keyboard } : undefined,
-          parse_mode: "Markdown"
-        })
-      });
-      if (!response.ok) {
-        const errorBody = await response.text().catch(() => "");
-        throw new Error(`Telegram API error (${response.status}): ${errorBody || response.statusText}`);
-      }
-      const data = await response.json();
-      if (!data.ok) {
-        throw new Error(`Telegram API returned ok=false: ${JSON.stringify(data)}`);
+      const sentIds = [];
+      for (let i = 0;i < chunks.length; i++) {
+        const isLast = i === chunks.length - 1;
+        const partLabel = chunks.length > 1 ? `[${i + 1}/${chunks.length}] ` : "";
+        const text = `${header}
+${partLabel}${chunks[i]}`;
+        const response = await fetch(`https://api.telegram.org/bot${this.botToken}/sendMessage`, {
+          method: "POST",
+          headers: { "Content-Type": "application/json" },
+          body: JSON.stringify({
+            chat_id: this.chatId,
+            text,
+            reply_markup: isLast && keyboard ? { inline_keyboard: keyboard } : undefined,
+            parse_mode: "Markdown"
+          })
+        });
+        if (!response.ok) {
+          const errorBody = await response.text().catch(() => "");
+          throw new Error(`Telegram API error (${response.status}): ${errorBody || response.statusText}`);
+        }
+        const data = await response.json();
+        if (!data.ok) {
+          throw new Error(`Telegram API returned ok=false: ${JSON.stringify(data)}`);
+        }
+        sentIds.push(data.result.message_id);
       }
-      this.pendingMessages.set(request.id, data.result.message_id);
+      this.pendingMessages.set(request.id, sentIds);
     } catch (err) {
       const msg = err instanceof Error ? err.message : String(err);
       throw new Error(`Failed to send Telegram message: ${msg}`);
@@ -23202,10 +23052,9 @@ class TelegramInteractionPlugin {
     await this.sendTimeoutMessage(requestId);
     this.pendingMessages.delete(requestId);
   }
-  formatMessage(request) {
+  buildHeader(request) {
     const emoji3 = this.getStageEmoji(request.stage);
     let text = `${emoji3} *${request.stage.toUpperCase()}*
 `;
     text += `*Feature:* ${request.featureName}
 `;
@@ -23214,11 +23063,15 @@ class TelegramInteractionPlugin {
 `;
     }
     text += `
-${request.summary}
+`;
+    return text;
+  }
+  buildBody(request) {
+    let text = `${this.sanitizeMarkdown(request.summary)}
 `;
     if (request.detail) {
       text += `
-${request.detail}
+${this.sanitizeMarkdown(request.detail)}
 `;
     }
     if (request.options && request.options.length > 0) {
@@ -23226,8 +23079,8 @@ ${request.detail}
 *Options:*
 `;
       for (const opt of request.options) {
-        const desc = opt.description ? ` \u2014 ${opt.description}` : "";
-        text += `  \u2022 ${opt.label}${desc}
+        const desc = opt.description ? ` - ${this.sanitizeMarkdown(opt.description)}` : "";
+        text += `  - ${opt.label}${desc}
 `;
       }
     }
@@ -23238,6 +23091,30 @@ ${request.detail}
     }
     return text;
   }
+  sanitizeMarkdown(text) {
+    return text.replace(/\\(?=[_*`\[])/g, "\\\\").replace(/_/g, "\\_").replace(/`/g, "\\`").replace(/\*/g, "\\*").replace(/\[/g, "\\[");
+  }
+  splitText(text, maxChars) {
+    if (text.length <= maxChars)
+      return [text];
+    const chunks = [];
+    let remaining = text;
+    while (remaining.length > maxChars) {
+      const slice = remaining.slice(0, maxChars);
+      const lastNewline = slice.lastIndexOf(`
+`);
+      if (lastNewline > maxChars * 0.5) {
+        chunks.push(remaining.slice(0, lastNewline));
+        remaining = remaining.slice(lastNewline + 1);
+      } else {
+        chunks.push(slice);
+        remaining = remaining.slice(maxChars);
+      }
+    }
+    if (remaining.length > 0)
+      chunks.push(remaining);
+    return chunks;
+  }
   buildKeyboard(request) {
     switch (request.type) {
       case "confirm":
@@ -23345,8 +23222,11 @@ ${request.detail}
       };
     }
     if (update.message?.text) {
-      const messageId = this.pendingMessages.get(requestId);
-      if (!messageId)
+      const messageIds = this.pendingMessages.get(requestId);
+      if (!messageIds)
+        return null;
+      const replyToId = update.message.reply_to_message?.message_id;
+      if (replyToId !== undefined && !messageIds.includes(replyToId))
         return null;
       return {
         requestId,
@@ -23372,20 +23252,20 @@ ${request.detail}
     } catch {}
   }
   async sendTimeoutMessage(requestId) {
-    const messageId = this.pendingMessages.get(requestId);
-    if (!messageId || !this.botToken || !this.chatId) {
+    const messageIds = this.pendingMessages.get(requestId);
+    if (!messageIds || !this.botToken || !this.chatId) {
       this.pendingMessages.delete(requestId);
       return;
     }
+    const lastId = messageIds[messageIds.length - 1];
     try {
       await fetch(`https://api.telegram.org/bot${this.botToken}/editMessageText`, {
         method: "POST",
         headers: { "Content-Type": "application/json" },
         body: JSON.stringify({
           chat_id: this.chatId,
-          message_id: messageId,
-          text: "\u23F1 *EXPIRED* \u2014 Interaction timed out",
-          parse_mode: "Markdown"
+          message_id: lastId,
+          text: "\u23F1 EXPIRED \u2014 Interaction timed out"
         })
       });
     } catch {} finally {
@@ -23393,7 +23273,7 @@ ${request.detail}
     }
   }
 }
-var TelegramConfigSchema;
+var MAX_MESSAGE_CHARS = 4000, TelegramConfigSchema;
 var init_telegram = __esm(() => {
   init_zod();
   TelegramConfigSchema = exports_external.object({
@@ -23466,10 +23346,10 @@ class WebhookInteractionPlugin {
       this.pendingResponses.delete(requestId);
       return early;
     }
-    return new Promise((resolve5) => {
+    return new Promise((resolve4) => {
       const timer = setTimeout(() => {
         this.receiveCallbacks.delete(requestId);
-        resolve5({
+        resolve4({
           requestId,
           action: "skip",
           respondedBy: "timeout",
@@ -23479,7 +23359,7 @@ class WebhookInteractionPlugin {
       this.receiveCallbacks.set(requestId, (response) => {
         clearTimeout(timer);
         this.receiveCallbacks.delete(requestId);
-        resolve5(response);
+        resolve4(response);
       });
     });
   }
@@ -23600,290 +23480,6 @@ var init_webhook = __esm(() => {
   });
 });
-// src/interaction/plugins/auto.ts
-class AutoInteractionPlugin {
-  name = "auto";
-  config = {};
-  async init(config2) {
-    const cfg = AutoConfigSchema.parse(config2);
-    this.config = {
-      model: cfg.model ?? "fast",
-      confidenceThreshold: cfg.confidenceThreshold ?? 0.7,
-      maxCostPerDecision: cfg.maxCostPerDecision ?? 0.01,
-      naxConfig: cfg.naxConfig
-    };
-  }
-  async destroy() {}
-  async send(request) {}
-  async receive(_requestId, _timeout = 60000) {
-    throw new Error("Auto plugin requires full request context (not just requestId)");
-  }
-  async decide(request) {
-    if (request.metadata?.trigger === "security-review") {
-      return;
-    }
-    try {
-      if (_autoPluginDeps.callLlm) {
-        const decision2 = await _autoPluginDeps.callLlm(request);
-        if (decision2.confidence < (this.config.confidenceThreshold ?? 0.7)) {
-          return;
-        }
-        return {
-          requestId: request.id,
-          action: decision2.action,
-          value: decision2.value,
-          respondedBy: "auto-ai",
-          respondedAt: Date.now()
-        };
-      }
-      const decision = await this.callLlm(request);
-      if (decision.confidence < (this.config.confidenceThreshold ?? 0.7)) {
-        return;
-      }
-      return {
-        requestId: request.id,
-        action: decision.action,
-        value: decision.value,
-        respondedBy: "auto-ai",
-        respondedAt: Date.now()
-      };
-    } catch (err) {
-      return;
-    }
-  }
-  async callLlm(request) {
-    const prompt = this.buildPrompt(request);
-    const adapter = _autoPluginDeps.adapter;
-    if (!adapter) {
-      throw new Error("Auto plugin requires adapter to be injected via _autoPluginDeps.adapter");
-    }
-    let modelArg;
-    if (this.config.naxConfig) {
-      const modelTier = this.config.model ?? "fast";
-      const modelEntry = this.config.naxConfig.models[modelTier];
-      if (!modelEntry) {
-        throw new Error(`Model tier "${modelTier}" not found in config.models`);
-      }
-      const modelDef = resolveModel(modelEntry);
-      modelArg = modelDef.model;
-    }
-    const output = await adapter.complete(prompt, {
-      ...modelArg && { model: modelArg },
-      jsonMode: true,
-      ...this.config.naxConfig && { config: this.config.naxConfig },
-      featureName: request.featureName,
-      storyId: request.storyId,
-      sessionRole: "auto"
-    });
-    return this.parseResponse(output);
-  }
-  buildPrompt(request) {
-    let prompt = `You are an AI decision assistant for a code orchestration system. Given an interaction request, decide the best action.
-## Interaction Request
-Type: ${request.type}
-Stage: ${request.stage}
-Feature: ${request.featureName}
-${request.storyId ? `Story: ${request.storyId}` : ""}
-Summary: ${request.summary.replace(/`/g, "\\`").replace(/\$/g, "\\$")}
-${request.detail ? `
-Detail: ${request.detail.replace(/`/g, "\\`").replace(/\$/g, "\\$")}` : ""}
-`;
-    if (request.options && request.options.length > 0) {
-      prompt += `
-Options:
-`;
-      for (const opt of request.options) {
-        const desc = opt.description ? ` \u2014 ${opt.description}` : "";
-        prompt += `  [${opt.key}] ${opt.label}${desc}
-`;
-      }
-    }
-    prompt += `
-Fallback behavior on timeout: ${request.fallback}
-Safety tier: ${request.metadata?.safety ?? "unknown"}
-## Available Actions
-- approve: Proceed with the operation
-- reject: Deny the operation
-- choose: Select an option (requires value field)
-- input: Provide text input (requires value field)
-- skip: Skip this interaction
-- abort: Abort execution
-## Rules
-1. For "red" safety tier (security-review, cost-exceeded, merge-conflict): ALWAYS return confidence 0 to escalate to human
-2. For "yellow" safety tier (cost-warning, max-retries, pre-merge): High confidence (0.8+) ONLY if clearly safe
-3. For "green" safety tier (story-ambiguity, review-gate): Can approve with moderate confidence (0.6+)
-4. Default to the fallback behavior if unsure
-5. Never auto-approve security issues
-6. If the summary mentions "critical" or "security", confidence MUST be < 0.5
-Respond with ONLY this JSON (no markdown, no explanation):
-{"action":"approve|reject|choose|input|skip|abort","value":"<optional>","confidence":0.0-1.0,"reasoning":"<one line>"}`;
-    return prompt;
-  }
-  parseResponse(output) {
-    let jsonText = output.trim();
-    if (jsonText.startsWith("```")) {
-      const lines = jsonText.split(`
-`);
-      jsonText = lines.slice(1, -1).join(`
-`).trim();
-    }
-    if (jsonText.startsWith("json")) {
-      jsonText = jsonText.slice(4).trim();
-    }
-    const parsed = JSON.parse(jsonText);
-    if (!parsed.action || parsed.confidence === undefined || !parsed.reasoning) {
-      throw new Error(`Invalid LLM response: ${jsonText}`);
-    }
-    if (parsed.confidence < 0 || parsed.confidence > 1) {
-      throw new Error(`Invalid confidence: ${parsed.confidence} (must be 0-1)`);
-    }
-    return parsed;
-  }
-}
-var AutoConfigSchema, _autoPluginDeps;
-var init_auto = __esm(() => {
-  init_zod();
-  init_config();
-  AutoConfigSchema = exports_external.object({
-    model: exports_external.string().optional(),
-    confidenceThreshold: exports_external.number().min(0).max(1).optional(),
-    maxCostPerDecision: exports_external.number().positive().optional(),
-    naxConfig: exports_external.any().optional()
-  });
-  _autoPluginDeps = {
-    adapter: null,
-    callLlm: null
-  };
-});
-// src/interaction/triggers.ts
-function isTriggerEnabled(trigger, config2) {
-  const triggerConfig = config2.interaction?.triggers?.[trigger];
-  if (triggerConfig === undefined)
-    return false;
-  if (typeof triggerConfig === "boolean")
-    return triggerConfig;
-  return triggerConfig.enabled;
-}
-function getTriggerConfig(trigger, config2) {
-  const metadata = TRIGGER_METADATA[trigger];
-  const triggerConfig = config2.interaction?.triggers?.[trigger];
-  const defaults = config2.interaction?.defaults ?? {
-    timeout: 600000,
-    fallback: "escalate"
-  };
-  let fallback = metadata.defaultFallback;
-  let timeout = defaults.timeout;
-  if (typeof triggerConfig === "object") {
-    if (triggerConfig.fallback) {
-      fallback = triggerConfig.fallback;
-    }
-    if (triggerConfig.timeout) {
-      timeout = triggerConfig.timeout;
-    }
-  }
-  return { fallback, timeout };
-}
-function substituteTemplate(template, context) {
-  let result = template;
-  for (const [key, value] of Object.entries(context)) {
-    if (value !== undefined) {
-      result = result.replace(new RegExp(`\\{\\{${key}\\}\\}`, "g"), String(value));
-    }
-  }
-  return result;
-}
-function createTriggerRequest(trigger, context, config2) {
-  const metadata = TRIGGER_METADATA[trigger];
-  const { fallback, timeout } = getTriggerConfig(trigger, config2);
-  const summary = substituteTemplate(metadata.defaultSummary, context);
-  const id = `trigger-${trigger}-${Date.now()}`;
-  return {
-    id,
-    type: "confirm",
-    featureName: context.featureName,
-    storyId: context.storyId,
-    stage: "custom",
-    summary,
-    fallback,
-    timeout,
-    createdAt: Date.now(),
-    metadata: {
-      trigger,
-      safety: metadata.safety
-    }
-  };
-}
-async function executeTrigger(trigger, context, config2, chain) {
-  const request = createTriggerRequest(trigger, context, config2);
-  const response = await chain.prompt(request);
-  return response;
-}
-async function checkSecurityReview(context, config2, chain) {
-  if (!isTriggerEnabled("security-review", config2))
-    return true;
-  const response = await executeTrigger("security-review", context, config2, chain);
-  return response.action !== "abort";
-}
-async function checkCostExceeded(context, config2, chain) {
-  if (!isTriggerEnabled("cost-exceeded", config2))
-    return true;
-  const response = await executeTrigger("cost-exceeded", context, config2, chain);
-  return response.action !== "abort";
-}
-async function checkMergeConflict(context, config2, chain) {
-  if (!isTriggerEnabled("merge-conflict", config2))
-    return true;
-  const response = await executeTrigger("merge-conflict", context, config2, chain);
-  return response.action !== "abort";
-}
-async function checkCostWarning(context, config2, chain) {
-  if (!isTriggerEnabled("cost-warning", config2))
-    return "continue";
-  const response = await executeTrigger("cost-warning", context, config2, chain);
-  return response.action === "approve" ? "escalate" : "continue";
-}
-async function checkPreMerge(context, config2, chain) {
-  if (!isTriggerEnabled("pre-merge", config2))
-    return true;
-  const response = await executeTrigger("pre-merge", context, config2, chain);
-  return response.action === "approve";
-}
-async function checkStoryAmbiguity(context, config2, chain) {
-  if (!isTriggerEnabled("story-ambiguity", config2))
-    return true;
-  const response = await executeTrigger("story-ambiguity", context, config2, chain);
-  return response.action === "approve";
-}
-async function checkReviewGate(context, config2, chain) {
-  if (!isTriggerEnabled("review-gate", config2))
-    return true;
-  const response = await executeTrigger("review-gate", context, config2, chain);
-  return response.action === "approve";
-}
-async function checkStoryOversized(context, config2, chain) {
-  if (!isTriggerEnabled("story-oversized", config2))
-    return "continue";
-  try {
-    const response = await executeTrigger("story-oversized", context, config2, chain);
-    if (response.action === "approve")
-      return "decompose";
-    if (response.action === "skip")
-      return "skip";
-    return "continue";
-  } catch {
-    return "continue";
-  }
-}
-var init_triggers = __esm(() => {
-  init_types4();
-});
 // src/interaction/init.ts
 function createInteractionPlugin(pluginName) {
   switch (pluginName) {
@@ -23938,6 +23534,483 @@ var init_init = __esm(() => {
   init_webhook();
 });
+// src/prd/validate.ts
+/**
+ * Validates a story ID, throwing on the first rule it violates.
+ *
+ * Rules are checked in this order: the ID must be non-empty, must not
+ * contain "..", must not start with "--", and must consist of an
+ * alphanumeric first character followed by at most 63 characters from
+ * [a-zA-Z0-9._-].
+ *
+ * @param {string} id - Candidate story ID.
+ * @returns {void}
+ * @throws {Error} With a rule-specific message when a check fails.
+ */
+function validateStoryId(id) {
+  const STORY_ID_SHAPE = /^[a-zA-Z0-9][a-zA-Z0-9._-]{0,63}$/;
+  const isBlank = !id || id.length === 0;
+  if (isBlank)
+    throw new Error("Story ID cannot be empty");
+  if (id.includes(".."))
+    throw new Error("Story ID cannot contain path traversal (..)");
+  if (id.startsWith("--"))
+    throw new Error("Story ID cannot start with git flags (--)");
+  if (STORY_ID_SHAPE.test(id))
+    return;
+  throw new Error(`Story ID must match pattern [a-zA-Z0-9][a-zA-Z0-9._-]{0,63}. Got: ${id}`);
+}
+// src/errors.ts
+var NaxError, AgentNotFoundError, AgentNotInstalledError, StoryLimitExceededError, LockAcquisitionError;
+// Assigns the error classes declared above. `__esm` is the bundler's module
+// wrapper and is defined outside this view.
+var init_errors3 = __esm(() => {
+  /**
+   * Base error: carries a string `code` and a free-form `context` object
+   * alongside the message.
+   */
+  NaxError = class NaxError extends Error {
+    code;
+    context;
+    constructor(message, code, context) {
+      super(message);
+      this.code = code;
+      this.context = context;
+      this.name = "NaxError";
+      // Start the recorded stack at the constructor that was actually invoked.
+      Error.captureStackTrace(this, this.constructor);
+    }
+  };
+  /** Code "AGENT_NOT_FOUND"; context holds `agentName` and `binary`. */
+  AgentNotFoundError = class AgentNotFoundError extends NaxError {
+    constructor(agentName, binary) {
+      const details = { agentName, binary };
+      super(`Agent "${agentName}" not found or not installed`, "AGENT_NOT_FOUND", details);
+      this.name = "AgentNotFoundError";
+    }
+  };
+  /** Code "AGENT_NOT_INSTALLED"; context holds `agentName` and `binary`. */
+  AgentNotInstalledError = class AgentNotInstalledError extends NaxError {
+    constructor(agentName, binary) {
+      const details = { agentName, binary };
+      super(`Agent "${agentName}" is not installed or not in PATH: ${binary}`, "AGENT_NOT_INSTALLED", details);
+      this.name = "AgentNotInstalledError";
+    }
+  };
+  /** Code "STORY_LIMIT_EXCEEDED"; context holds `totalStories` and `limit`. */
+  StoryLimitExceededError = class StoryLimitExceededError extends NaxError {
+    constructor(totalStories, limit) {
+      const details = { totalStories, limit };
+      super(`Feature exceeds story limit: ${totalStories} stories (max: ${limit})`, "STORY_LIMIT_EXCEEDED", details);
+      this.name = "StoryLimitExceededError";
+    }
+  };
+  /** Code "LOCK_ACQUISITION_FAILED"; context holds `workdir`. */
+  LockAcquisitionError = class LockAcquisitionError extends NaxError {
+    constructor(workdir) {
+      const details = { workdir };
+      super("Another nax process is already running in this directory", "LOCK_ACQUISITION_FAILED", details);
+      this.name = "LockAcquisitionError";
+    }
+  };
+});
+// src/metrics/tracker.ts
+import path2 from "path";
+/**
+ * Builds the metrics record for a single story from the pipeline context.
+ *
+ * @param {object} ctx - Context; reads `story`, `routing`, `agentResult`,
+ *   `config.models`, `accumulatedAttemptCost`, `fullSuiteGatePassed` and
+ *   `storyRuntimeCrashes`.
+ * @param {string} storyStartTime - Copied verbatim into `startedAt`.
+ * @returns {object} Story metrics; `completedAt` is the current time as an
+ *   ISO string.
+ */
+function collectStoryMetrics(ctx, storyStartTime) {
+  const { story, routing, agentResult } = ctx;
+  const escalations = story.escalations?.length || 0;
+  const priorFailures = story.priorFailures?.length || 0;
+  // Prior failures count on top of the story's own attempts (at least one).
+  const attempts = priorFailures + Math.max(1, story.attempts || 1);
+  // The tier of the last escalation wins over the routed tier.
+  let finalTier = routing.modelTier;
+  if (escalations > 0) {
+    finalTier = story.escalations[escalations - 1].toTier;
+  }
+  const firstPassSuccess = agentResult?.success === true && escalations === 0 && priorFailures === 0;
+  const tierEntry = ctx.config.models[routing.modelTier];
+  const resolved = tierEntry ? resolveModel(tierEntry) : null;
+  const usesTdd = ["three-session-tdd", "three-session-tdd-lite"].includes(routing.testStrategy);
+  // The full-suite gate flag is only reported for the TDD strategies.
+  const fullSuiteGatePassed = usesTdd ? ctx.fullSuiteGatePassed ?? false : false;
+  return {
+    storyId: story.id,
+    complexity: routing.complexity,
+    initialComplexity: story.routing?.initialComplexity ?? routing.complexity,
+    modelTier: routing.modelTier,
+    modelUsed: resolved?.model || routing.modelTier,
+    attempts,
+    finalTier,
+    success: agentResult?.success || false,
+    cost: (ctx.accumulatedAttemptCost ?? 0) + (agentResult?.estimatedCost || 0),
+    durationMs: agentResult?.durationMs || 0,
+    firstPassSuccess,
+    startedAt: storyStartTime,
+    completedAt: new Date().toISOString(),
+    fullSuiteGatePassed,
+    runtimeCrashes: ctx.storyRuntimeCrashes ?? 0
+  };
+}
+/**
+ * Builds one metrics record per story for a batch that ran as a single
+ * agent invocation. Cost and duration are split evenly across the stories
+ * and every story is reported as a first-pass success with one attempt.
+ *
+ * @param {object} ctx - Context; reads `stories`, `routing`, `agentResult`
+ *   and `config.models`.
+ * @param {string} storyStartTime - Copied verbatim into each `startedAt`.
+ * @returns {object[]} One record per entry of `ctx.stories`.
+ */
+function collectBatchMetrics(ctx, storyStartTime) {
+  const { stories, routing, agentResult } = ctx;
+  const storyCount = stories.length;
+  const costPerStory = (agentResult?.estimatedCost || 0) / storyCount;
+  const durationPerStory = (agentResult?.durationMs || 0) / storyCount;
+  const tierEntry = ctx.config.models[routing.modelTier];
+  const resolved = tierEntry ? resolveModel(tierEntry) : null;
+  const modelUsed = resolved?.model || routing.modelTier;
+  const toRecord = (story) => ({
+    storyId: story.id,
+    complexity: routing.complexity,
+    initialComplexity: story.routing?.initialComplexity ?? routing.complexity,
+    modelTier: routing.modelTier,
+    modelUsed,
+    attempts: 1,
+    finalTier: routing.modelTier,
+    success: true,
+    cost: costPerStory,
+    durationMs: durationPerStory,
+    firstPassSuccess: true,
+    startedAt: storyStartTime,
+    completedAt: new Date().toISOString(),
+    fullSuiteGatePassed: false,
+    runtimeCrashes: 0
+  });
+  return stories.map((story) => toRecord(story));
+}
+/**
+ * Appends one run's metrics to `<workdir>/.nax/metrics.json`.
+ *
+ * The current file content is loaded first; anything that is not an array
+ * is replaced by a fresh list before the new entry is added.
+ *
+ * @param {string} workdir - Directory containing the `.nax` folder.
+ * @param {object} runMetrics - Entry to append.
+ * @returns {Promise<void>}
+ */
+async function saveRunMetrics(workdir, runMetrics) {
+  const target = path2.join(workdir, ".nax", "metrics.json");
+  const loaded = await loadJsonFile(target, "metrics");
+  const history = Array.isArray(loaded) ? loaded : [];
+  history.push(runMetrics);
+  await saveJsonFile(target, history, "metrics");
+}
+/**
+ * Reads the run history stored in `<workdir>/.nax/metrics.json`.
+ *
+ * @param {string} workdir - Directory containing the `.nax` folder.
+ * @returns {Promise<object[]>} The stored array, or an empty array when the
+ *   loaded value is not an array.
+ */
+async function loadRunMetrics(workdir) {
+  const source = path2.join(workdir, ".nax", "metrics.json");
+  const loaded = await loadJsonFile(source, "metrics");
+  if (Array.isArray(loaded)) {
+    return loaded;
+  }
+  return [];
+}
+// Initializer for src/metrics/tracker.ts: runs the initializers it depends
+// on (init_schema, init_json_file). `__esm` is the bundler's module wrapper,
+// defined outside this view (presumably lazy, run-once; confirm there).
+var init_tracker = __esm(() => {
+  init_schema();
+  init_json_file();
+});
+// src/metrics/aggregator.ts
+/**
+ * Rolls a list of run records up into overall statistics.
+ *
+ * @param {object[]} runs - Run records; each provides `totalCost` and a
+ *   `stories` array of per-story metrics.
+ * @returns {object} Totals, first-pass and escalation rates, average costs,
+ *   per-model efficiency keyed by `modelUsed`, and per-complexity accuracy
+ *   keyed by `initialComplexity ?? complexity`. All-zero/empty when `runs`
+ *   is empty.
+ */
+function calculateAggregateMetrics(runs) {
+  const totalRuns = runs.length;
+  if (totalRuns === 0) {
+    return {
+      totalRuns: 0,
+      totalCost: 0,
+      totalStories: 0,
+      firstPassRate: 0,
+      escalationRate: 0,
+      avgCostPerStory: 0,
+      avgCostPerFeature: 0,
+      modelEfficiency: {},
+      complexityAccuracy: {}
+    };
+  }
+  // Division that falls back to 0 when the denominator is not positive.
+  const ratio = (numerator, denominator) => denominator > 0 ? numerator / denominator : 0;
+  const stories = runs.flatMap((run) => run.stories);
+  const totalStories = stories.length;
+  let totalCost = 0;
+  for (const run of runs) {
+    totalCost += run.totalCost;
+  }
+  let firstPassCount = 0;
+  let multiAttemptCount = 0;
+  const perModel = new Map;
+  const perComplexity = new Map;
+  for (const story of stories) {
+    if (story.firstPassSuccess) {
+      firstPassCount += 1;
+    }
+    // Any story needing more than one attempt counts towards the escalation rate.
+    if (story.attempts > 1) {
+      multiAttemptCount += 1;
+    }
+    let modelTotals = perModel.get(story.modelUsed);
+    if (!modelTotals) {
+      modelTotals = { attempts: 0, successes: 0, totalCost: 0 };
+      perModel.set(story.modelUsed, modelTotals);
+    }
+    modelTotals.attempts += story.attempts;
+    modelTotals.successes += story.success ? 1 : 0;
+    modelTotals.totalCost += story.cost;
+    const complexity = story.initialComplexity ?? story.complexity;
+    let bucket = perComplexity.get(complexity);
+    if (!bucket) {
+      bucket = { predicted: 0, tierCounts: new Map, mismatches: 0 };
+      perComplexity.set(complexity, bucket);
+    }
+    bucket.predicted += 1;
+    bucket.tierCounts.set(story.finalTier, (bucket.tierCounts.get(story.finalTier) || 0) + 1);
+    // A mismatch means the story did not finish on the tier it was routed to.
+    if (story.modelTier !== story.finalTier) {
+      bucket.mismatches += 1;
+    }
+  }
+  const modelEfficiency = {};
+  for (const [model, totals] of perModel) {
+    modelEfficiency[model] = {
+      attempts: totals.attempts,
+      successes: totals.successes,
+      passRate: ratio(totals.successes, totals.attempts),
+      avgCost: ratio(totals.totalCost, totals.successes),
+      totalCost: totals.totalCost
+    };
+  }
+  const complexityAccuracy = {};
+  for (const [complexity, bucket] of perComplexity) {
+    // Most frequent final tier; the earliest-seen tier wins ties.
+    let dominantTier = "unknown";
+    let dominantCount = 0;
+    for (const [tier, seen] of bucket.tierCounts) {
+      if (seen > dominantCount) {
+        dominantCount = seen;
+        dominantTier = tier;
+      }
+    }
+    complexityAccuracy[complexity] = {
+      predicted: bucket.predicted,
+      actualTierUsed: dominantTier,
+      mismatchRate: ratio(bucket.mismatches, bucket.predicted)
+    };
+  }
+  return {
+    totalRuns,
+    totalCost,
+    totalStories,
+    firstPassRate: ratio(firstPassCount, totalStories),
+    escalationRate: ratio(multiAttemptCount, totalStories),
+    avgCostPerStory: ratio(totalCost, totalStories),
+    avgCostPerFeature: ratio(totalCost, totalRuns),
+    modelEfficiency,
+    complexityAccuracy
+  };
+}
+/**
+ * Returns the final element of `runs`, or `null` when the list is empty.
+ *
+ * @param {object[]} runs - Run records.
+ * @returns {object|null}
+ */
+function getLastRun(runs) {
+  const count = runs.length;
+  return count === 0 ? null : runs[count - 1];
+}
+// src/metrics/index.ts
+// Initializer for src/metrics/index.ts: only needs to run the tracker's
+// initializer. `__esm` is the bundler's module wrapper, defined outside this view.
+var init_metrics = __esm(() => {
+  init_tracker();
+});
+// src/interaction/types.ts
+// Per-trigger defaults, keyed by trigger name. Each entry provides:
+//   defaultFallback - fallback used when the trigger config does not override it
+//   safety          - "red" | "yellow" | "green"
+//   defaultSummary  - summary template; {{name}} placeholders are filled from context
+var TRIGGER_METADATA;
+var init_types4 = __esm(() => {
+  // Builds one entry; the key order matches the documented shape above.
+  const entry = (safety, defaultFallback, defaultSummary) => ({ defaultFallback, safety, defaultSummary });
+  TRIGGER_METADATA = {
+    "security-review": entry("red", "abort", "Security review failed \u2014 abort execution?"),
+    "cost-exceeded": entry("red", "abort", "Cost limit exceeded ({{cost}} USD) \u2014 abort execution?"),
+    "merge-conflict": entry("red", "abort", "Merge conflict detected in {{storyId}} \u2014 abort execution?"),
+    "cost-warning": entry("yellow", "escalate", "Cost warning: {{cost}} USD / {{limit}} USD \u2014 escalate to higher tier?"),
+    "max-retries": entry("yellow", "skip", "Max retries reached for {{storyId}} \u2014 skip story?"),
+    "pre-merge": entry("yellow", "escalate", "Pre-merge checkpoint for {{storyId}} \u2014 proceed with merge?"),
+    "human-review": entry("yellow", "skip", "Human review required for story {{storyId}} \u2014 skip and continue?"),
+    "story-oversized": entry("yellow", "continue", "Story {{storyId}} is oversized ({{criteriaCount}} acceptance criteria) \u2014 decompose into smaller stories?"),
+    "story-ambiguity": entry("green", "continue", "Story {{storyId}} requirements unclear \u2014 continue with best effort?"),
+    "review-gate": entry("green", "continue", "Code review checkpoint for {{storyId}} \u2014 proceed?")
+  };
+});
+// src/interaction/state.ts
+import * as path3 from "path";
+/**
+ * Loads a stored interaction request from
+ * `<featureDir>/interactions/<requestId>.json`.
+ *
+ * @param {string} requestId - Request ID; used as the file's base name.
+ * @param {string} featureDir - Feature directory holding `interactions/`.
+ * @returns {Promise<object|null>} The parsed JSON, or `null` when the file
+ *   does not exist or reading/parsing fails.
+ */
+async function loadPendingInteraction(requestId, featureDir) {
+  const target = path3.join(featureDir, "interactions", `${requestId}.json`);
+  try {
+    const handle = Bun.file(target);
+    if (!await handle.exists()) {
+      return null;
+    }
+    return JSON.parse(await handle.text());
+  } catch {
+    // Best effort: unreadable or malformed files are reported as "not found".
+    return null;
+  }
+}
+/**
+ * Lists the IDs of stored interaction requests, i.e. the base names of the
+ * `*.json` entries in `<featureDir>/interactions`.
+ *
+ * @param {string} featureDir - Feature directory holding `interactions/`.
+ * @returns {Promise<string[]>} Request IDs; empty when the directory is
+ *   reported missing or listing fails.
+ */
+async function listPendingInteractions(featureDir) {
+  const interactionsDir = path3.join(featureDir, "interactions");
+  const suffix = ".json";
+  try {
+    // NOTE(review): `Bun.file(...).exists()` is being asked about a directory
+    // here; confirm it reports true for directories, otherwise this function
+    // always returns [].
+    const dir = Bun.file(interactionsDir);
+    if (!await dir.exists()) {
+      return [];
+    }
+    const proc = Bun.spawn(["ls", interactionsDir], {
+      stdout: "pipe",
+      stderr: "pipe"
+    });
+    const output = await new Response(proc.stdout).text();
+    await proc.exited;
+    // Strip only the trailing extension. `replace(".json", "")` removed the
+    // first occurrence, which mangled names such as "a.json.bak.json".
+    return output.split("\n").filter((name) => name.endsWith(suffix)).map((name) => name.slice(0, -suffix.length));
+  } catch {
+    // Best effort: a failed listing is reported as "nothing pending".
+    return [];
+  }
+}
+// Initializer for src/interaction/state.ts: nothing to set up, so a no-op.
+var init_state = () => {};
+// src/interaction/triggers.ts
+/**
+ * Tells whether a trigger is switched on in the configuration.
+ *
+ * The setting at `config2.interaction.triggers[trigger]` may be absent
+ * (disabled), a boolean (used as-is), or an object whose `enabled` property
+ * is returned.
+ *
+ * @param {string} trigger - Trigger name.
+ * @param {object} config2 - Configuration object.
+ * @returns {boolean} Enabled state (the raw `enabled` value for object settings).
+ */
+function isTriggerEnabled(trigger, config2) {
+  const setting = config2.interaction?.triggers?.[trigger];
+  switch (typeof setting) {
+    case "undefined":
+      return false;
+    case "boolean":
+      return setting;
+    default:
+      return setting.enabled;
+  }
+}
+/**
+ * Resolves the effective fallback and timeout for a trigger.
+ *
+ * The fallback starts from the trigger's `TRIGGER_METADATA` entry and the
+ * timeout from `config2.interaction.defaults` (600000 when no defaults are
+ * configured). An object-valued trigger setting overrides either one when
+ * its `fallback` / `timeout` is truthy.
+ *
+ * @param {string} trigger - Trigger name; must be a key of TRIGGER_METADATA.
+ * @param {object} config2 - Configuration object.
+ * @returns {{fallback: string, timeout: number}}
+ */
+function getTriggerConfig(trigger, config2) {
+  const metadata = TRIGGER_METADATA[trigger];
+  const override = config2.interaction?.triggers?.[trigger];
+  const builtInDefaults = {
+    timeout: 600000,
+    fallback: "escalate"
+  };
+  const defaults = config2.interaction?.defaults ?? builtInDefaults;
+  const baseline = { fallback: metadata.defaultFallback, timeout: defaults.timeout };
+  if (typeof override !== "object") {
+    return baseline;
+  }
+  return {
+    fallback: override.fallback || baseline.fallback,
+    timeout: override.timeout || baseline.timeout
+  };
+}
+/**
+ * Fills `{{key}}` placeholders in a template with values from `context`.
+ *
+ * Keys are matched literally and values are inserted literally. The
+ * previous implementation interpolated the key into a RegExp, so regex
+ * metacharacters in a key mis-matched or threw, and it passed the value as
+ * a replacement string, so sequences such as `$&` or `$$` were expanded.
+ *
+ * @param {string} template - Text containing `{{key}}` placeholders.
+ * @param {object} context - Placeholder values; entries whose value is
+ *   `undefined` leave their placeholder untouched.
+ * @returns {string} The template with all known placeholders replaced.
+ */
+function substituteTemplate(template, context) {
+  let result = template;
+  for (const [key, value] of Object.entries(context)) {
+    if (value === undefined) {
+      continue;
+    }
+    const text = String(value);
+    // A replacer function keeps "$" sequences in the value from being expanded.
+    result = result.replaceAll(`{{${key}}}`, () => text);
+  }
+  return result;
+}
+/**
+ * Builds the "confirm" interaction request for a trigger.
+ *
+ * The summary comes from the trigger's default template filled with
+ * `context`; fallback and timeout come from getTriggerConfig. The ID has
+ * the form `trigger-<trigger>-<Date.now()>`.
+ *
+ * @param {string} trigger - Trigger name; must be a key of TRIGGER_METADATA.
+ * @param {object} context - Supplies `featureName`, `storyId` and template values.
+ * @param {object} config2 - Configuration object.
+ * @returns {object} Interaction request with stage "custom".
+ */
+function createTriggerRequest(trigger, context, config2) {
+  const meta = TRIGGER_METADATA[trigger];
+  const resolved = getTriggerConfig(trigger, config2);
+  const summary = substituteTemplate(meta.defaultSummary, context);
+  const request = {
+    id: `trigger-${trigger}-${Date.now()}`,
+    type: "confirm",
+    featureName: context.featureName,
+    storyId: context.storyId,
+    stage: "custom",
+    summary,
+    fallback: resolved.fallback,
+    timeout: resolved.timeout,
+    createdAt: Date.now(),
+    metadata: { trigger, safety: meta.safety }
+  };
+  return request;
+}
+/**
+ * Creates the request for a trigger and sends it through the interaction chain.
+ *
+ * @param {string} trigger - Trigger name.
+ * @param {object} context - Passed to createTriggerRequest.
+ * @param {object} config2 - Configuration object.
+ * @param {object} chain - Object whose `prompt(request)` yields the response.
+ * @returns {Promise<object>} Whatever `chain.prompt` resolves to.
+ */
+async function executeTrigger(trigger, context, config2, chain) {
+  const pending = createTriggerRequest(trigger, context, config2);
+  return await chain.prompt(pending);
+}
+/**
+ * Runs the "security-review" trigger when it is enabled.
+ *
+ * @returns {Promise<boolean>} `true` when the trigger is disabled or the
+ *   response action is anything other than "abort".
+ */
+async function checkSecurityReview(context, config2, chain) {
+  if (isTriggerEnabled("security-review", config2)) {
+    const { action } = await executeTrigger("security-review", context, config2, chain);
+    return action !== "abort";
+  }
+  return true;
+}
+/**
+ * Runs the "cost-exceeded" trigger when it is enabled.
+ *
+ * @returns {Promise<boolean>} `true` when the trigger is disabled or the
+ *   response action is anything other than "abort".
+ */
+async function checkCostExceeded(context, config2, chain) {
+  if (isTriggerEnabled("cost-exceeded", config2)) {
+    const { action } = await executeTrigger("cost-exceeded", context, config2, chain);
+    return action !== "abort";
+  }
+  return true;
+}
+/**
+ * Runs the "merge-conflict" trigger when it is enabled.
+ *
+ * @returns {Promise<boolean>} `true` when the trigger is disabled or the
+ *   response action is anything other than "abort".
+ */
+async function checkMergeConflict(context, config2, chain) {
+  if (isTriggerEnabled("merge-conflict", config2)) {
+    const { action } = await executeTrigger("merge-conflict", context, config2, chain);
+    return action !== "abort";
+  }
+  return true;
+}
+/**
+ * Runs the "cost-warning" trigger when it is enabled.
+ *
+ * @returns {Promise<"escalate"|"continue">} "escalate" only when the
+ *   response action is "approve"; "continue" otherwise, including when the
+ *   trigger is disabled.
+ */
+async function checkCostWarning(context, config2, chain) {
+  if (isTriggerEnabled("cost-warning", config2)) {
+    const { action } = await executeTrigger("cost-warning", context, config2, chain);
+    if (action === "approve") {
+      return "escalate";
+    }
+  }
+  return "continue";
+}
+/**
+ * Runs the "pre-merge" trigger when it is enabled.
+ *
+ * @returns {Promise<boolean>} `true` when the trigger is disabled or the
+ *   response action is "approve".
+ */
+async function checkPreMerge(context, config2, chain) {
+  if (isTriggerEnabled("pre-merge", config2)) {
+    const { action } = await executeTrigger("pre-merge", context, config2, chain);
+    return action === "approve";
+  }
+  return true;
+}
+/**
+ * Runs the "story-ambiguity" trigger when it is enabled.
+ *
+ * @returns {Promise<boolean>} `true` when the trigger is disabled or the
+ *   response action is "approve".
+ */
+async function checkStoryAmbiguity(context, config2, chain) {
+  if (isTriggerEnabled("story-ambiguity", config2)) {
+    const { action } = await executeTrigger("story-ambiguity", context, config2, chain);
+    return action === "approve";
+  }
+  return true;
+}
+/**
+ * Runs the "review-gate" trigger when it is enabled.
+ *
+ * @returns {Promise<boolean>} `true` when the trigger is disabled or the
+ *   response action is "approve".
+ */
+async function checkReviewGate(context, config2, chain) {
+  if (isTriggerEnabled("review-gate", config2)) {
+    const { action } = await executeTrigger("review-gate", context, config2, chain);
+    return action === "approve";
+  }
+  return true;
+}
+/**
+ * Runs the "story-oversized" trigger when it is enabled.
+ *
+ * @returns {Promise<"decompose"|"skip"|"continue">} "decompose" for an
+ *   "approve" response, "skip" for "skip", and "continue" for anything
+ *   else, including a disabled trigger or a failing trigger call.
+ */
+async function checkStoryOversized(context, config2, chain) {
+  if (!isTriggerEnabled("story-oversized", config2))
+    return "continue";
+  try {
+    const { action } = await executeTrigger("story-oversized", context, config2, chain);
+    switch (action) {
+      case "approve":
+        return "decompose";
+      case "skip":
+        return "skip";
+      default:
+        return "continue";
+    }
+  } catch {
+    // A failing prompt must not block the story; carry on unchanged.
+    return "continue";
+  }
+}
+// Initializer for src/interaction/triggers.ts: runs init_types4, which
+// assigns the TRIGGER_METADATA table the trigger helpers read. `__esm` is
+// the bundler's module wrapper, defined outside this view.
+var init_triggers = __esm(() => {
+  init_types4();
+});
 // src/interaction/index.ts
 var init_interaction = __esm(() => {
   init_types4();
@@ -23948,6 +24021,7 @@ var init_interaction = __esm(() => {
   init_auto();
   init_triggers();
   init_init();
+  init_bridge_builder();
 });
 // src/pipeline/runner.ts
@@ -24406,10 +24480,11 @@ ${stderr}` };
       if (workdirGroups.size === 0) {
         workdirGroups.set("", { stories: [], criteria: [] });
       }
+      const featureName = ctx.prd.feature;
       const testPaths = [];
       for (const [workdir] of workdirGroups) {
         const packageDir = workdir ? path5.join(ctx.workdir, workdir) : ctx.workdir;
-        const testPath = path5.join(packageDir, acceptanceTestFilename(language));
+        const testPath = path5.join(packageDir, ".nax", "features", featureName, acceptanceTestFilename(language));
         testPaths.push({ testPath, packageDir });
       }
       let totalCriteria = 0;
@@ -28357,7 +28432,7 @@ async function rollbackToRef(workdir, ref) {
   }
   logger.info("tdd", "Successfully rolled back git changes", { ref });
 }
-async function runTddSession(role, agent, story, config2, workdir, modelTier, beforeRef, contextMarkdown, lite = false, skipIsolation = false, constitution, featureName) {
+async function runTddSession(role, agent, story, config2, workdir, modelTier, beforeRef, contextMarkdown, lite = false, skipIsolation = false, constitution, featureName, interactionBridge) {
   const startTime = Date.now();
   let prompt;
   if (_sessionRunnerDeps.buildPrompt) {
@@ -28391,7 +28466,8 @@ async function runTddSession(role, agent, story, config2, workdir, modelTier, be
     featureName,
     storyId: story.id,
     sessionRole: role,
-    keepSessionOpen
+    keepSessionOpen,
+    interactionBridge
   });
   if (!result.success && result.pid) {
     await _sessionRunnerDeps.cleanupProcessTree(result.pid);
@@ -28756,7 +28832,8 @@ async function runThreeSessionTdd(options) {
     constitution,
     dryRun = false,
     lite = false,
-    _recursionDepth = 0
+    _recursionDepth = 0,
+    interactionChain
   } = options;
   const logger = getLogger();
   const MAX_RECURSION_DEPTH = 2;
@@ -28815,7 +28892,7 @@ async function runThreeSessionTdd(options) {
   let session1;
   if (!isRetry) {
     const testWriterTier = config2.tdd.sessionTiers?.testWriter ?? "balanced";
-    session1 = await runTddSession("test-writer", agent, story, config2, workdir, testWriterTier, session1Ref, contextMarkdown, lite, lite, constitution, featureName);
+    session1 = await runTddSession("test-writer", agent, story, config2, workdir, testWriterTier, session1Ref, contextMarkdown, lite, lite, constitution, featureName, buildInteractionBridge(interactionChain, { featureName, storyId: story.id, stage: "execution" }));
     sessions.push(session1);
   }
   if (session1 && !session1.success) {
@@ -28877,7 +28954,7 @@ async function runThreeSessionTdd(options) {
   });
   const session2Ref = await captureGitRef(workdir) ?? "HEAD";
   const implementerTier = config2.tdd.sessionTiers?.implementer ?? modelTier;
-  const session2 = await runTddSession("implementer", agent, story, config2, workdir, implementerTier, session2Ref, contextMarkdown, lite, lite, constitution, featureName);
+  const session2 = await runTddSession("implementer", agent, story, config2, workdir, implementerTier, session2Ref, contextMarkdown, lite, lite, constitution, featureName, buildInteractionBridge(interactionChain, { featureName, storyId: story.id, stage: "execution" }));
   sessions.push(session2);
   if (!session2.success) {
     needsHumanReview = true;
@@ -28995,6 +29072,7 @@ async function runThreeSessionTdd(options) {
 var init_orchestrator2 = __esm(() => {
   init_config();
   init_greenfield();
+  init_bridge_builder();
   init_logger2();
   init_git();
   init_verification();
@@ -29060,6 +29138,7 @@ var executionStage, _executionDeps;
 var init_execution2 = __esm(() => {
   init_agents();
   init_config();
+  init_bridge_builder();
   init_triggers();
   init_logger2();
   init_tdd();
@@ -29094,7 +29173,8 @@ var init_execution2 = __esm(() => {
           contextMarkdown: ctx.contextMarkdown,
           constitution: ctx.constitution?.content,
           dryRun: false,
-          lite: isLiteMode
+          lite: isLiteMode,
+          interactionChain: ctx.interaction
         });
         ctx.agentResult = {
           success: tddResult.success,
@@ -29168,34 +29248,11 @@ Category: ${tddResult.failureCategory ?? "unknown"}`,
         pidRegistry: ctx.pidRegistry,
         featureName: ctx.prd.feature,
         storyId: ctx.story.id,
-        interactionBridge: (() => {
-          const plugin = ctx.interaction?.getPrimary();
-          if (!plugin)
-            return;
-          const QUESTION_PATTERNS = [/\?/, /\bwhich\b/i, /\bshould i\b/i, /\bunclear\b/i, /\bplease clarify\b/i];
-          return {
-            detectQuestion: async (text) => QUESTION_PATTERNS.some((p) => p.test(text)),
-            onQuestionDetected: async (text) => {
-              const requestId = `ix-acp-${Date.now()}-${Math.random().toString(36).slice(2, 9)}`;
-              await plugin.send({
-                id: requestId,
-                type: "input",
-                featureName: ctx.prd.feature,
-                storyId: ctx.story.id,
-                stage: "execution",
-                summary: text,
-                fallback: "continue",
-                createdAt: Date.now()
-              });
-              try {
-                const response = await plugin.receive(requestId, 120000);
-                return response.value ?? "continue";
-              } catch {
-                return "continue";
-              }
-            }
-          };
-        })()
+        interactionBridge: buildInteractionBridge(ctx.interaction, {
+          featureName: ctx.prd.feature,
+          storyId: ctx.story.id,
+          stage: "execution"
+        })
       });
       ctx.agentResult = result;
       await autoCommitIfDirty(storyWorkdir, "execution", "single-session", ctx.story.id);
@@ -32198,7 +32255,8 @@ async function checkGitignoreCoversNax(workdir) {
     ".nax/features/*/status.json",
     ".nax-pids",
     ".nax-wt/",
-    "**/.nax-acceptance*"
+    "**/.nax-acceptance*",
+    "**/.nax/features/*/"
   ];
   const missing = patterns.filter((pattern) => !content.includes(pattern));
   const passed = missing.length === 0;
@@ -34481,7 +34539,7 @@ __export(exports_parallel_executor_rectify, {
 });
 import path15 from "path";
 async function rectifyConflictedStory(options) {
-  const { storyId, workdir, config: config2, hooks, pluginRegistry, prd, eventEmitter } = options;
+  const { storyId, workdir, config: config2, hooks, pluginRegistry, prd, eventEmitter, agentGetFn } = options;
   const logger = getSafeLogger();
   logger?.info("parallel", "Rectifying story on updated base", { storyId, attempt: "rectification" });
   try {
@@ -34513,7 +34571,8 @@ async function rectifyConflictedStory(options) {
       hooks,
       plugins: pluginRegistry,
       storyStartTime: new Date().toISOString(),
-      routing
+      routing,
+      agentGetFn
     };
     const pipelineResult = await runPipeline2(defaultPipeline2, pipelineContext, eventEmitter);
     const cost = pipelineResult.context.agentResult?.estimatedCost ?? 0;
@@ -34549,7 +34608,7 @@ var init_parallel_executor_rectify = __esm(() => {
 // src/execution/parallel-executor-rectification-pass.ts
 async function runRectificationPass(conflictedStories, options, prd, rectifyConflictedStory2) {
   const logger = getSafeLogger();
-  const { workdir, config: config2, hooks, pluginRegistry, eventEmitter } = options;
+  const { workdir, config: config2, hooks, pluginRegistry, eventEmitter, agentGetFn } = options;
   const rectify = rectifyConflictedStory2 || (async (opts) => {
     const { rectifyConflictedStory: importedRectify } = await Promise.resolve().then(() => (init_parallel_executor_rectify(), exports_parallel_executor_rectify));
     return importedRectify(opts);
@@ -34570,7 +34629,8 @@ async function runRectificationPass(conflictedStories, options, prd, rectifyConf
       hooks,
       pluginRegistry,
       prd,
-      eventEmitter
+      eventEmitter,
+      agentGetFn
     });
     additionalCost += result.cost;
     if (result.success) {
@@ -68241,7 +68301,7 @@ async function generateAcceptanceTestsForFeature(specContent, featureName, featu
 init_registry();
 import { existsSync as existsSync11 } from "fs";
 import { join as join11 } from "path";
-import { createInterface } from "readline";
+import { createInterface as createInterface2 } from "readline";
 init_test_strategy();
 // src/context/generator.ts
@@ -68779,6 +68839,8 @@ async function generateForPackage(packageDir, config2, dryRun = false, repoRoot)
 // src/cli/plan.ts
 init_pid_registry();
+init_bridge_builder();
+init_init();
 init_logger2();
 // src/prd/schema.ts
@@ -68907,11 +68969,19 @@ function validateStory(raw, index, allIds) {
     ...contextFiles.length > 0 ? { contextFiles } : {}
   };
 }
/**
 * Repair backslash escapes that are illegal in JSON so the text can be given to JSON.parse.
 *
 * The text is scanned once, left to right, and every backslash is consumed together with
 * the character(s) it escapes. Consuming `\\` as a unit is what keeps an escaped backslash
 * from being mistaken for the start of the next escape (e.g. the `\\d` in a regex string or
 * the `\\users` in a Windows path must be left alone).
 *
 * Rewrites applied:
 *   - `\xH` / `\xHH`          -> `\u00HH` (zero-padded)
 *   - `\u` + 1-3 hex digits   -> `\uHHHH` (zero-padded to four digits)
 *   - `\u` with no hex digits -> removed
 *   - `\c` for any other `c`  -> `c` (backslash dropped)
 * Valid escapes (`\"`, `\\`, `\/`, `\b`, `\f`, `\n`, `\r`, `\t`, `\uHHHH`) and a lone
 * backslash at the very end of the text are returned unchanged.
 *
 * @param {string} text - Raw JSON text that may contain invalid escape sequences.
 * @returns {string} The text with invalid escape sequences repaired.
 */
function sanitizeInvalidEscapes(text) {
  // Alternatives are ordered so that a fully valid escape always wins; the short-unicode
  // branch is therefore only reached when fewer than four hex digits follow `\u`.
  const escapeToken = /\\(?:(["\\\/bfnrt]|u[0-9a-fA-F]{4})|x([0-9a-fA-F]{1,2})|u([0-9a-fA-F]{0,3})|([\s\S]))/g;
  return text.replace(escapeToken, (match, valid, hexByte, shortUnicode, other) => {
    if (valid !== undefined) {
      return match;
    }
    if (hexByte !== undefined) {
      return `\\u00${hexByte.padStart(2, "0")}`;
    }
    if (shortUnicode !== undefined) {
      // An empty capture means a bare `\u`: drop it rather than leave a dangling backslash
      // that would escape whatever character comes next.
      return shortUnicode === "" ? "" : `\\u${shortUnicode.padStart(4, "0")}`;
    }
    return other;
  });
}
 function parseRawString(text) {
   const extracted = extractJsonFromMarkdown(text);
   const cleaned = stripTrailingCommas(extracted);
+  const sanitized = sanitizeInvalidEscapes(cleaned);
   try {
-    return JSON.parse(cleaned);
+    return JSON.parse(sanitized);
   } catch (err) {
     const parseErr = err;
     throw new Error(`[schema] Failed to parse JSON: ${parseErr.message}`, { cause: parseErr });
@@ -68965,7 +69035,8 @@ var _planDeps = {
   existsSync: (path) => existsSync11(path),
   discoverWorkspacePackages: (repoRoot) => discoverWorkspacePackages(repoRoot),
   readPackageJsonAt: (path) => Bun.file(path).json().catch(() => null),
-  createInteractionBridge: () => createCliInteractionBridge()
+  createInteractionBridge: () => createCliInteractionBridge(),
+  initInteractionChain: (cfg, headless) => initInteractionChain(cfg, headless)
 };
 async function planCommand(workdir, config2, options) {
   const naxDir = join11(workdir, ".nax");
@@ -69028,7 +69099,13 @@ async function planCommand(workdir, config2, options) {
     const adapter = _planDeps.getAgent(agentName, config2);
     if (!adapter)
       throw new Error(`[plan] No agent adapter found for '${agentName}'`);
-    const interactionBridge = _planDeps.createInteractionBridge();
+    const headless = !process.stdin.isTTY;
+    const interactionChain = config2 ? await _planDeps.initInteractionChain(config2, headless) : null;
+    const configuredBridge = interactionChain ? buildInteractionBridge(interactionChain, {
+      featureName: options.feature,
+      stage: "pre-flight"
+    }) : undefined;
+    const interactionBridge = configuredBridge ?? _planDeps.createInteractionBridge();
     const pidRegistry = new PidRegistry(workdir);
     const resolvedPerm = resolvePermissions(config2, "plan");
     const resolvedModel = config2?.plan?.model ?? "balanced";
@@ -69057,6 +69134,8 @@ async function planCommand(workdir, config2, options) {
       });
     } finally {
       await pidRegistry.killAll().catch(() => {});
+      if (interactionChain)
+        await interactionChain.destroy().catch(() => {});
       logger?.info("plan", "Interactive session ended", { durationMs: Date.now() - planStartTime });
     }
     if (!_planDeps.existsSync(outputPath)) {
@@ -69083,7 +69162,7 @@ function createCliInteractionBridge() {
 \uD83E\uDD16 Agent: ${text}
 You: `);
       return new Promise((resolve4) => {
-        const rl = createInterface({ input: process.stdin, terminal: false });
+        const rl = createInterface2({ input: process.stdin, terminal: false });
         rl.once("line", (line) => {
           rl.close();
           resolve4(line.trim());
@@ -72036,7 +72115,8 @@ async function runExecutionPhase(options, prd, pluginRegistry) {
       allStoryMetrics,
       pluginRegistry,
       formatterMode: options.formatterMode,
-      headless: options.headless
+      headless: options.headless,
+      agentGetFn: options.agentGetFn
     }, prd);
     prd = parallelResult.prd;
     totalCost = parallelResult.totalCost;