npm - @kody-ade/kody-engine-lite - Versions diffs - 0.1.113 → 0.1.114 - Mend

@kody-ade/kody-engine-lite 0.1.113 → 0.1.114

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (3) hide show

package/dist/bin/cli.js CHANGED Viewed

@@ -226,13 +226,13 @@ function getProjectConfig() {
   const configPath = path6.join(_configDir ?? process.cwd(), "kody.config.json");
   if (fs7.existsSync(configPath)) {
     try {
-      const result = parseJsonSafe(fs7.readFileSync(configPath, "utf-8"));
-      if (!result.ok) {
-        logger.warn(`kody.config.json: ${result.error} \u2014 using defaults`);
+      const result2 = parseJsonSafe(fs7.readFileSync(configPath, "utf-8"));
+      if (!result2.ok) {
+        logger.warn(`kody.config.json: ${result2.error} \u2014 using defaults`);
         _config = { ...DEFAULT_CONFIG };
         return _config;
       }
-      const raw = result.data;
+      const raw = result2.data;
       _config = {
         quality: { ...DEFAULT_CONFIG.quality, ...raw.quality },
         git: { ...DEFAULT_CONFIG.git, ...raw.git },
@@ -966,8 +966,8 @@ function findLatestTaskForIssue(issueNumber, projectDir) {
 }
 function generateTaskId() {
   const now = /* @__PURE__ */ new Date();
-  const pad = (n) => String(n).padStart(2, "0");
-  return `${String(now.getFullYear()).slice(2)}${pad(now.getMonth() + 1)}${pad(now.getDate())}-${pad(now.getHours())}${pad(now.getMinutes())}${pad(now.getSeconds())}`;
+  const pad2 = (n) => String(n).padStart(2, "0");
+  return `${String(now.getFullYear()).slice(2)}${pad2(now.getMonth() + 1)}${pad2(now.getDate())}-${pad2(now.getHours())}${pad2(now.getMinutes())}${pad2(now.getSeconds())}`;
 }
 function resolveTaskIdFromComments(issueNumber) {
   try {
@@ -1361,13 +1361,13 @@ Kody is decomposing ${src} into tasks...`);
   fs11.writeFileSync(path10.join(taskDir, MARKER_FILE), JSON.stringify({ ticketId, prdFile, issueNumber }));
   const runner = opts.runner ?? createClaudeCodeRunner();
   logger.info(`  model=${model} timeout=${TASKIFY_TIMEOUT_MS / 1e3}s`);
-  const result = await runner.run("taskify", prompt, model, TASKIFY_TIMEOUT_MS, taskDir, {
+  const result2 = await runner.run("taskify", prompt, model, TASKIFY_TIMEOUT_MS, taskDir, {
     cwd: projectDir,
     mcpConfigJson,
     env: opts.runnerEnv
   });
-  if (result.outcome !== "completed") {
-    const errMsg = result.outcome === "timed_out" ? "Taskify timed out after 5 minutes." : `Taskify failed: ${result.error}`;
+  if (result2.outcome !== "completed") {
+    const errMsg = result2.outcome === "timed_out" ? "Taskify timed out after 5 minutes." : `Taskify failed: ${result2.error}`;
     if (issueNumber && !local) {
       postComment(issueNumber, `Kody taskify failed:
@@ -1380,7 +1380,7 @@ Kody is decomposing ${src} into tasks...`);
   if (!fs11.existsSync(resultPath)) {
     const errMsg = `Claude did not write ${RESULT_FILE}. Output:
-${result.output?.slice(0, 500) ?? "(none)"}`;
+${result2.output?.slice(0, 500) ?? "(none)"}`;
     if (issueNumber && !local) {
       postComment(issueNumber, `Kody taskify failed: result file not found.
@@ -1568,6 +1568,999 @@ var init_taskify_command = __esm({
   }
 });
+// src/cli/test-model-tests.ts
+import * as fs12 from "fs";
+import * as os2 from "os";
+import * as path11 from "path";
+import * as zlib from "zlib";
+import { spawnSync, execSync as execSync2 } from "child_process";
+/**
+ * POST a Messages-API style request to the proxy and normalise the outcome.
+ *
+ * @param ctx  Object providing `proxyUrl`, `apiKey` and `model`.
+ * @param body Request payload; `ctx.model` is spread first, so a `model` key in `body` wins.
+ * @returns `{ ok, data, status, errorMsg? }`. Never rejects: transport failures and
+ *          timeouts are reported as `{ ok: false, data: null, status: 0 }`.
+ */
+async function apiCall(ctx, body) {
+  try {
+    const res = await fetch(`${ctx.proxyUrl}/v1/messages`, {
+      method: "POST",
+      headers: {
+        "Content-Type": "application/json",
+        "x-api-key": ctx.apiKey,
+        "anthropic-version": "2023-06-01"
+      },
+      body: JSON.stringify({ model: ctx.model, ...body }),
+      signal: AbortSignal.timeout(6e4)
+    });
+    // Read the body as text first: error responses may be HTML or empty, and
+    // `res.json()` would throw on them and hide the real HTTP status.
+    const raw = await res.text();
+    let data = null;
+    let parseError = null;
+    try {
+      data = JSON.parse(raw);
+    } catch (err) {
+      parseError = err;
+    }
+    if (!res.ok) {
+      return { ok: false, data, status: res.status, errorMsg: data?.error?.message ?? `HTTP ${res.status}` };
+    }
+    if (parseError) {
+      // A success status with an unparseable body is still a failure for callers.
+      const reason = parseError instanceof Error ? parseError.message : String(parseError);
+      return { ok: false, data: null, status: res.status, errorMsg: `Invalid JSON in response: ${reason}` };
+    }
+    return { ok: true, data, status: res.status };
+  } catch (err) {
+    return { ok: false, data: null, status: 0, errorMsg: err instanceof Error ? err.message : String(err) };
+  }
+}
+/**
+ * Concatenate the `text` of every `type: "text"` block in a response.
+ *
+ * @param data Parsed response body; may be null/undefined.
+ * @returns The joined text, or "" when `content` is missing or not an array.
+ */
+function extractText(data) {
+  // `content` comes from an arbitrary provider behind the proxy, so do not
+  // assume it is an array of well-formed blocks.
+  if (!Array.isArray(data?.content)) return "";
+  return data.content.filter((b) => b?.type === "text").map((b) => b.text ?? "").join("");
+}
+/**
+ * Drive a multi-turn tool-use exchange, answering each tool call with `simulate`.
+ *
+ * @param ctx        Context forwarded to `apiCall`.
+ * @param tools      Tool definitions sent with every request.
+ * @param userPrompt Initial user message.
+ * @param simulate   `(name, input) => string` producing the fake tool result.
+ * @param opts       Optional `{ maxTurns, system }`; `maxTurns` defaults to 5.
+ * @returns `{ finalText, toolCalls, error? }`; `error` is set on API failure
+ *          or when the turn limit is hit before the model stops calling tools.
+ */
+async function runToolConversation(ctx, tools, userPrompt, simulate, opts) {
+  const turnLimit = opts?.maxTurns ?? 5;
+  const history = [{ role: "user", content: userPrompt }];
+  const recorded = [];
+  let turn = 0;
+  while (turn < turnLimit) {
+    const request = { max_tokens: 1024, temperature: 0, messages: history, tools };
+    if (opts?.system) request.system = opts.system;
+    const reply = await apiCall(ctx, request);
+    if (!reply.ok) {
+      return { finalText: "", toolCalls: recorded, error: reply.errorMsg };
+    }
+    const blocks = reply.data.content ?? [];
+    const requested = blocks.filter((blk) => blk.type === "tool_use");
+    if (requested.length === 0) {
+      // No tool requested: the text blocks are the final answer.
+      const finalText = blocks.filter((blk) => blk.type === "text").map((blk) => blk.text ?? "").join("");
+      return { finalText, toolCalls: recorded };
+    }
+    requested.forEach((call) => {
+      recorded.push({ name: call.name, input: call.input });
+    });
+    // Echo the assistant turn back, then answer every tool call in one user turn.
+    history.push({ role: "assistant", content: blocks });
+    const toolResults = requested.map((call) => ({
+      type: "tool_result",
+      tool_use_id: call.id,
+      content: simulate(call.name, call.input)
+    }));
+    history.push({ role: "user", content: toolResults });
+    turn += 1;
+  }
+  return { finalText: "", toolCalls: recorded, error: "Max turns reached" };
+}
+/**
+ * Strip blank lines and known-noise lines from captured stderr.
+ *
+ * @param stderr Raw stderr text.
+ * @returns Remaining lines joined with "\n" and trimmed.
+ */
+function filterStderr(stderr) {
+  const noiseMarkers = ["CPU lacks AVX", "bun-darwin", "Warning: no stdin data"];
+  const kept = [];
+  for (const line of stderr.split("\n")) {
+    if (line.trim().length === 0) continue;
+    if (noiseMarkers.some((marker) => line.includes(marker))) continue;
+    kept.push(line);
+  }
+  return kept.join("\n").trim();
+}
+/**
+ * Run the `claude` CLI once in print mode against the proxy.
+ *
+ * @param ctx        Provides `model`, `proxyUrl`, `apiKey` and `projectDir` (used as cwd).
+ * @param prompt     Prompt passed via `-p`.
+ * @param extraFlags Extra CLI arguments inserted before `-p`.
+ * @param timeout    Milliseconds before the child process is killed (default 90s).
+ * @returns `{ stdout, stderr, exitCode }`; `exitCode` is 1 when the process
+ *          produced no status (spawn failure, timeout, killed by signal).
+ */
+function runClaudeTest(ctx, prompt, extraFlags = [], timeout = 9e4) {
+  try {
+    const proc = spawnSync("claude", [
+      "--print",
+      "--model",
+      ctx.model,
+      "--dangerously-skip-permissions",
+      ...extraFlags,
+      "-p",
+      prompt
+    ], {
+      env: { ...process.env, ANTHROPIC_BASE_URL: ctx.proxyUrl, ANTHROPIC_API_KEY: ctx.apiKey },
+      timeout,
+      encoding: "utf-8",
+      cwd: ctx.projectDir
+    });
+    // spawnSync does not throw when the binary is missing or the timeout
+    // fires; it reports that through `error`. Surface it so callers do not
+    // end up printing an empty "no output" failure.
+    const spawnNote = proc.error ? `spawn error: ${proc.error.message}` : "";
+    const stderr = [filterStderr(proc.stderr ?? ""), spawnNote].filter((part) => part.length > 0).join("\n");
+    return {
+      stdout: proc.stdout ?? "",
+      stderr,
+      exitCode: proc.status ?? 1
+    };
+  } catch (err) {
+    return { stdout: "", stderr: String(err), exitCode: 1 };
+  }
+}
+/**
+ * Report whether `git diff --name-only` lists no files in `dir`.
+ *
+ * @param dir Working directory for the git command.
+ * @returns true when the command prints nothing; false when it prints
+ *          file names or fails (including the 5s timeout).
+ */
+function isGitClean(dir) {
+  let changedFiles;
+  try {
+    changedFiles = execSync2("git diff --name-only", { cwd: dir, encoding: "utf-8", timeout: 5e3 });
+  } catch {
+    return false;
+  }
+  return changedFiles.trim().length === 0;
+}
+/**
+ * Best-effort `git checkout -- <paths>` in `dir`.
+ *
+ * @param dir   Working directory of the repository.
+ * @param paths Paths to restore; defaults to the single file the stage tests edit.
+ * @returns true when git exited with status 0, false otherwise. Never throws,
+ *          so callers can keep using it in cleanup paths.
+ */
+function revertChanges(dir, paths = ["src/logger.ts"]) {
+  try {
+    // Argument-array form avoids shell quoting issues for arbitrary paths.
+    const proc = spawnSync("git", ["checkout", "--", ...paths], { cwd: dir, timeout: 5e3, stdio: "pipe" });
+    return proc.status === 0;
+  } catch {
+    return false;
+  }
+}
+/**
+ * Bundle the positional arguments into a test-result record.
+ *
+ * @returns `{ name, category, status, accuracy, durationMs, detail, metrics }`.
+ */
+function result(name, category, status, accuracy, durationMs, detail, metrics) {
+  const record = {
+    name: name,
+    category: category,
+    status: status,
+    accuracy: accuracy,
+    durationMs: durationMs,
+    detail: detail,
+    metrics: metrics
+  };
+  return record;
+}
+/**
+ * Table-driven CRC over the bytes of `buf`, using the module-level CRC_TABLE.
+ *
+ * @param buf Iterable of byte values (called with a Buffer in this file).
+ * @returns The checksum as an unsigned 32-bit integer.
+ */
+function crc32(buf) {
+  let crc = 0xffffffff;
+  for (const byte of buf) {
+    const tableIndex = (crc ^ byte) & 0xff;
+    crc = CRC_TABLE[tableIndex] ^ (crc >>> 8);
+  }
+  // Final inversion, then force an unsigned result.
+  return (crc ^ 0xffffffff) >>> 0;
+}
+// Build a 4x4 PNG in memory whose pixels are all (255, 0, 0) and return it as a Buffer.
+function createRedPng() {
+  const w = 4, h = 4;
+  // Each scanline is one leading byte followed by 3 bytes (R, G, B) per pixel.
+  const scanlines = Buffer.alloc(h * (1 + w * 3));
+  for (let y = 0; y < h; y++) {
+    const off = y * (1 + w * 3);
+    // Leading byte of the row is set to 0 (PNG filter type "None").
+    scanlines[off] = 0;
+    for (let x = 0; x < w; x++) {
+      scanlines[off + 1 + x * 3] = 255;
+      scanlines[off + 1 + x * 3 + 1] = 0;
+      scanlines[off + 1 + x * 3 + 2] = 0;
+    }
+  }
+  // Serialise one chunk: 4-byte big-endian data length, type, data, then a
+  // CRC computed over type + data.
+  function chunk(type, data) {
+    const tb = Buffer.from(type, "ascii");
+    const merged = Buffer.concat([tb, data]);
+    const len = Buffer.alloc(4);
+    len.writeUInt32BE(data.length);
+    const crcBuf = Buffer.alloc(4);
+    crcBuf.writeUInt32BE(crc32(merged));
+    return Buffer.concat([len, tb, data, crcBuf]);
+  }
+  // 8-byte PNG file signature.
+  const sig = Buffer.from([137, 80, 78, 71, 13, 10, 26, 10]);
+  // IHDR payload: width, height, then bit depth 8 and colour type 2 (RGB);
+  // the remaining three bytes stay 0 from Buffer.alloc.
+  const ihdr = Buffer.alloc(13);
+  ihdr.writeUInt32BE(w, 0);
+  ihdr.writeUInt32BE(h, 4);
+  ihdr[8] = 8;
+  ihdr[9] = 2;
+  return Buffer.concat([sig, chunk("IHDR", ihdr), chunk("IDAT", zlib.deflateSync(scanlines)), chunk("IEND", Buffer.alloc(0))]);
+}
+/**
+ * Basic check: ask the model to echo a fixed token and look for it in the reply.
+ *
+ * @param ctx Context forwarded to `apiCall`.
+ * @returns A `result(...)` record: pass/100 when the token is present, fail/0 otherwise.
+ */
+async function testSimplePrompt(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  const reply = await apiCall(ctx, {
+    max_tokens: 50,
+    temperature: 0,
+    messages: [{ role: "user", content: "Reply with exactly: KODY_TEST_OK" }]
+  });
+  if (!reply.ok) {
+    return result("simple_prompt", "basic", "fail", 0, elapsed(), `API error: ${reply.errorMsg}`);
+  }
+  const answer = extractText(reply.data);
+  if (answer.includes("KODY_TEST_OK")) {
+    return result("simple_prompt", "basic", "pass", 100, elapsed(), "Model responded correctly");
+  }
+  return result("simple_prompt", "basic", "fail", 0, elapsed(), `Expected KODY_TEST_OK, got: ${answer.slice(0, 80)}`);
+}
+/**
+ * Basic check: the model must answer with raw JSON containing string
+ * `status` and `model` keys. A surrounding markdown fence is tolerated.
+ *
+ * @param ctx Context forwarded to `apiCall`.
+ * @returns pass/100 for valid JSON with both keys, pass/70 for valid JSON
+ *          without them, fail/0 for API errors or unparseable output.
+ */
+async function testJsonOutput(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  const reply = await apiCall(ctx, {
+    max_tokens: 200,
+    temperature: 0,
+    system: "Respond with ONLY valid JSON. No markdown fences, no explanation. Just raw JSON.",
+    messages: [{ role: "user", content: 'Return a JSON object with keys "status" (string "ok") and "model" (string, your model name).' }]
+  });
+  if (!reply.ok) {
+    return result("json_output", "basic", "fail", 0, elapsed(), `API error: ${reply.errorMsg}`);
+  }
+  // Strip an optional leading/trailing code fence before parsing.
+  const unfenced = extractText(reply.data).trim().replace(/^```(?:json)?\s*\n?/i, "").replace(/\n?```\s*$/i, "");
+  const payload = unfenced.trim();
+  let hasKeys;
+  try {
+    const parsed = JSON.parse(payload);
+    // Property access stays inside the try: a JSON `null` lands in the catch.
+    hasKeys = typeof parsed.status === "string" && typeof parsed.model === "string";
+  } catch {
+    return result("json_output", "basic", "fail", 0, elapsed(), `Invalid JSON: ${payload.slice(0, 80)}`);
+  }
+  if (hasKeys) {
+    return result("json_output", "basic", "pass", 100, elapsed(), "Valid JSON with correct keys");
+  }
+  return result("json_output", "basic", "pass", 70, elapsed(), "Valid JSON but missing expected keys");
+}
+/**
+ * Basic check: give the model five formatting rules in the system prompt and
+ * score 20 points per rule the reply satisfies.
+ *
+ * @param ctx Context forwarded to `apiCall`.
+ * @returns pass at >= 80 points, warn at >= 40, fail below; the score is also
+ *          reported as `metrics.instructionCompliance`.
+ */
+async function testSystemPromptRules(ctx) {
+  const t = Date.now();
+  const res = await apiCall(ctx, {
+    max_tokens: 200,
+    temperature: 0,
+    system: [
+      "STRICT RULES \u2014 violating ANY will crash the system:",
+      "1) Start every response with 'KODY:'",
+      "2) Never use the word 'the'",
+      "3) Keep response under 50 words",
+      "4) End your response with 'END'",
+      "5) Use ONLY lowercase letters (no uppercase anywhere)"
+    ].join("\n"),
+    messages: [{ role: "user", content: "Describe what a compiler does." }]
+  });
+  if (!res.ok) return result("system_prompt_rules", "basic", "fail", 0, Date.now() - t, `API error: ${res.errorMsg}`);
+  const text = extractText(res.data).trim();
+  let score = 0;
+  const checks = [];
+  // Rules 1 and 4 conflict with rule 5, so either casing is accepted.
+  if (text.startsWith("KODY:") || text.startsWith("kody:")) {
+    score += 20;
+    checks.push("starts-with-kody");
+  }
+  // Word-boundary match: splitting on whitespace missed "the," / "the." / "(the".
+  if (!/\bthe\b/i.test(text)) {
+    score += 20;
+    checks.push("no-the");
+  }
+  // Threshold is 55 rather than 50; presumably slack for the required
+  // prefix/suffix tokens.
+  if (text.split(/\s+/).length <= 55) {
+    score += 20;
+    checks.push("under-50-words");
+  }
+  if (text.endsWith("END") || text.endsWith("end")) {
+    score += 20;
+    checks.push("ends-with-end");
+  }
+  if (text === text.toLowerCase()) {
+    score += 20;
+    checks.push("all-lowercase");
+  }
+  const status = score >= 80 ? "pass" : score >= 40 ? "warn" : "fail";
+  return result(
+    "system_prompt_rules",
+    "basic",
+    status,
+    score,
+    Date.now() - t,
+    `${score / 20}/5 rules followed: ${checks.join(", ")}`,
+    { instructionCompliance: score }
+  );
+}
+/**
+ * Infrastructure check: send a request with the `thinking` parameter enabled
+ * and see whether the response contains a `thinking` block.
+ *
+ * @param ctx Context forwarded to `apiCall`.
+ * @returns pass/100 with a thinking block, warn/70 with text only, warn/50
+ *          when the request is rejected, fail/0 when the reply is empty.
+ */
+async function testExtendedThinking(ctx) {
+  const t = Date.now();
+  const budgetTokens = 2e3;
+  const res = await apiCall(ctx, {
+    // The Messages API requires max_tokens to exceed thinking.budget_tokens;
+    // the previous value (200) made the request invalid regardless of model
+    // support. Keep 200 tokens of headroom for the visible answer.
+    max_tokens: budgetTokens + 200,
+    thinking: { type: "enabled", budget_tokens: budgetTokens },
+    messages: [{ role: "user", content: "What is 15 * 23?" }]
+  });
+  if (!res.ok) return result(
+    "extended_thinking",
+    "infrastructure",
+    "warn",
+    50,
+    Date.now() - t,
+    `Request failed (model may not support thinking): ${res.errorMsg?.slice(0, 80)}`
+  );
+  const hasThinking = Array.isArray(res.data.content) && res.data.content.some((b) => b.type === "thinking");
+  const hasText = extractText(res.data).length > 0;
+  if (hasThinking) return result("extended_thinking", "infrastructure", "pass", 100, Date.now() - t, "Thinking block present in response");
+  if (hasText) return result("extended_thinking", "infrastructure", "warn", 70, Date.now() - t, "Response OK but no thinking block");
+  return result("extended_thinking", "infrastructure", "fail", 0, Date.now() - t, "No content in response");
+}
+/**
+ * Tool-use check: the model should call `Read` on a temp file and repeat its content.
+ *
+ * Scoring: 30 for calling Read, 30 for the right path, 40 for mentioning the
+ * content; pass at >= 60. The temp file is removed afterwards.
+ *
+ * @param ctx Context forwarded to `runToolConversation`.
+ */
+async function testToolRead(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  const fixturePath = path11.join(os2.tmpdir(), "kody-test-model-read.txt");
+  fs12.writeFileSync(fixturePath, "KODY_SECRET_CONTENT_42");
+  try {
+    const simulateTool = (name, input) => {
+      const isExpectedRead = name === "Read" && input.path === fixturePath;
+      return isExpectedRead ? "KODY_SECRET_CONTENT_42" : "Error: File not found";
+    };
+    const conv = await runToolConversation(
+      ctx,
+      [TOOL_READ],
+      `Read the file ${fixturePath} and tell me what it contains.`,
+      simulateTool
+    );
+    if (conv.error) {
+      return result("tool_read", "tool-use", "fail", 0, elapsed(), `Error: ${conv.error}`);
+    }
+    const readCalls = conv.toolCalls.filter((call) => call.name === "Read");
+    const calledRead = readCalls.length > 0;
+    const correctPath = readCalls.some((call) => call.input.path === fixturePath);
+    const mentionsContent = ["KODY_SECRET_CONTENT_42", "42"].some((needle) => conv.finalText.includes(needle));
+    const acc = (calledRead ? 30 : 0) + (correctPath ? 30 : 0) + (mentionsContent ? 40 : 0);
+    const verdict = acc >= 60 ? "pass" : "fail";
+    const detail = `Read called: ${calledRead}, correct path: ${correctPath}, content referenced: ${mentionsContent}`;
+    return result("tool_read", "tool-use", verdict, acc, elapsed(), detail, { toolSelection: calledRead ? 100 : 0 });
+  } finally {
+    fs12.rmSync(fixturePath, { force: true });
+  }
+}
+/**
+ * Tool-use check: the model should read a file and then call `Edit` with
+ * old_string "hello" and new_string "goodbye".
+ *
+ * Scoring: 40 for calling Edit, plus 30 for each correct string; pass at
+ * >= 70, warn for any other non-zero score.
+ *
+ * @param ctx Context forwarded to `runToolConversation`.
+ */
+async function testToolEdit(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  const simulateTool = (name) => {
+    switch (name) {
+      case "Read":
+        return "hello world";
+      case "Edit":
+        return "File edited successfully";
+      default:
+        return "Unknown tool";
+    }
+  };
+  const conv = await runToolConversation(
+    ctx,
+    [TOOL_READ, TOOL_EDIT],
+    'Read the file /tmp/kody-edit-test.txt, then use Edit to replace "hello" with "goodbye" in it.',
+    simulateTool
+  );
+  if (conv.error) {
+    return result("tool_edit", "tool-use", "fail", 0, elapsed(), `Error: ${conv.error}`);
+  }
+  const editCall = conv.toolCalls.find((call) => call.name === "Edit");
+  if (!editCall) {
+    return result("tool_edit", "tool-use", "fail", 0, elapsed(), "Edit tool was not called", { toolSelection: 0 });
+  }
+  const oldMatches = editCall.input.old_string === "hello";
+  const newMatches = editCall.input.new_string === "goodbye";
+  const acc = 40 + (oldMatches ? 30 : 0) + (newMatches ? 30 : 0);
+  return result(
+    "tool_edit",
+    "tool-use",
+    acc >= 70 ? "pass" : "warn",
+    acc,
+    elapsed(),
+    `Edit called with old="${editCall.input.old_string}" new="${editCall.input.new_string}"`,
+    { toolSelection: 100 }
+  );
+}
+/**
+ * Tool-use check: the model should call `Bash` with the requested echo command.
+ *
+ * Scoring: 100 when the command contains "echo KODY_BASH_OK", 50 when Bash
+ * was called with something else, 0 when it was not called; pass at >= 50.
+ *
+ * @param ctx Context forwarded to `runToolConversation`.
+ */
+async function testToolBash(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  const simulateTool = (name) => (name === "Bash" ? "KODY_BASH_OK\n" : "Error");
+  const conv = await runToolConversation(
+    ctx,
+    [TOOL_BASH],
+    "Run this exact bash command: echo KODY_BASH_OK",
+    simulateTool
+  );
+  if (conv.error) {
+    return result("tool_bash", "tool-use", "fail", 0, elapsed(), `Error: ${conv.error}`);
+  }
+  const bashCall = conv.toolCalls.find((call) => call.name === "Bash");
+  let acc = 0;
+  if (bashCall) {
+    const ranExpected = String(bashCall.input.command).includes("echo KODY_BASH_OK");
+    acc = ranExpected ? 100 : 50;
+  }
+  const detail = bashCall ? `Bash called: ${bashCall.input.command}` : "Bash tool was not called";
+  return result("tool_bash", "tool-use", acc >= 50 ? "pass" : "fail", acc, elapsed(), detail, { toolSelection: bashCall ? 100 : 0 });
+}
+/**
+ * Vision check: send the generated red PNG and ask for its colour.
+ *
+ * Scoring: 100/pass when the reply mentions "red"; 50/warn when it mentions
+ * "color", "image" or "pixel"; 20/fail otherwise; 0/fail on API error.
+ *
+ * @param ctx Context forwarded to `apiCall`.
+ */
+async function testImageAttachment(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  const imageBlock = {
+    type: "image",
+    source: { type: "base64", media_type: "image/png", data: createRedPng().toString("base64") }
+  };
+  const questionBlock = { type: "text", text: "What color is this image? Reply with just the color name." };
+  const reply = await apiCall(ctx, {
+    max_tokens: 100,
+    temperature: 0,
+    messages: [{ role: "user", content: [imageBlock, questionBlock] }]
+  });
+  if (!reply.ok) {
+    return result(
+      "image_attachment",
+      "tool-use",
+      "fail",
+      0,
+      elapsed(),
+      `API error (model may not support vision): ${reply.errorMsg?.slice(0, 80)}`
+    );
+  }
+  const answer = extractText(reply.data).toLowerCase();
+  const detail = () => `Response: ${answer.slice(0, 80)}`;
+  if (answer.includes("red")) {
+    return result("image_attachment", "tool-use", "pass", 100, elapsed(), detail());
+  }
+  const onTopic = ["color", "image", "pixel"].some((word) => answer.includes(word));
+  if (onTopic) {
+    return result("image_attachment", "tool-use", "warn", 50, elapsed(), detail());
+  }
+  return result("image_attachment", "tool-use", "fail", 20, elapsed(), detail());
+}
+/**
+ * Advanced check: every simulated tool call fails for a missing file; the
+ * model should tell the user the file does not exist.
+ *
+ * Scoring: 100 when the absence is reported after at least one tool call,
+ * 70 when reported without any tool call, 20 otherwise (status warn).
+ *
+ * @param ctx Context forwarded to `runToolConversation`.
+ */
+async function testErrorRecovery(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  let firstReadFailed = false;
+  const simulateTool = (name) => {
+    if (name === "Read" && !firstReadFailed) {
+      firstReadFailed = true;
+      return "Error: ENOENT: no such file or directory";
+    }
+    if (name === "Bash") {
+      return "ls: /tmp/nonexistent-kody-file.txt: No such file or directory";
+    }
+    return "Error: File not found";
+  };
+  const conv = await runToolConversation(
+    ctx,
+    [TOOL_READ, TOOL_BASH],
+    "Read the file /tmp/nonexistent-kody-file.txt and tell me what's in it. If the file doesn't exist, say so.",
+    simulateTool
+  );
+  if (conv.error) {
+    return result("error_recovery", "advanced", "fail", 0, elapsed(), `Error: ${conv.error}`);
+  }
+  const lowered = conv.finalText.toLowerCase();
+  const absencePhrases = ["not found", "doesn't exist", "does not exist", "no such file"];
+  const reported = absencePhrases.some((phrase) => lowered.includes(phrase));
+  if (!reported) {
+    return result("error_recovery", "advanced", "warn", 20, elapsed(), `Response: ${conv.finalText.slice(0, 80)}`);
+  }
+  const usedTools = conv.toolCalls.length >= 1;
+  return result("error_recovery", "advanced", "pass", usedTools ? 100 : 70, elapsed(), "Gracefully reported missing file");
+}
+/**
+ * Tool-use check via the CLI: the model must read kody.config.json and report
+ * `git.defaultBranch`.
+ *
+ * The expected value is taken from the project's own kody.config.json rather
+ * than assumed; "main" is used only when the file is missing, unparseable, or
+ * has no string `git.defaultBranch`.
+ *
+ * @param ctx Provides `projectDir` plus the fields `runClaudeTest` needs.
+ * @returns pass/100 when the output contains the expected branch, fail/20
+ *          otherwise, fail/0 when the CLI produced nothing and exited non-zero.
+ */
+async function testToolMultiStep(ctx) {
+  const t = Date.now();
+  let expected = "main";
+  try {
+    const cfg = JSON.parse(fs12.readFileSync(path11.join(ctx.projectDir, "kody.config.json"), "utf-8"));
+    const configured = cfg?.git?.defaultBranch;
+    if (typeof configured === "string" && configured.trim().length > 0) expected = configured.trim();
+  } catch {
+    // Deliberate fallback: without a readable config keep the historical "main".
+  }
+  const r = runClaudeTest(
+    ctx,
+    "Do these steps in order: 1) Read kody.config.json 2) Tell me the value of git.defaultBranch. Reply with ONLY the branch name, nothing else."
+  );
+  if (!r.stdout.trim() && r.exitCode !== 0) return result(
+    "tool_multi_step",
+    "tool-use",
+    "fail",
+    0,
+    Date.now() - t,
+    `CLI failed: ${r.stderr.slice(0, 200) || "no output"}`
+  );
+  const out = r.stdout.trim().toLowerCase();
+  const correct = out.includes(expected.toLowerCase());
+  return result(
+    "tool_multi_step",
+    "tool-use",
+    correct ? "pass" : "fail",
+    correct ? 100 : 20,
+    Date.now() - t,
+    correct ? `Correct: ${expected}` : `Got: ${out.slice(0, 80)}`
+  );
+}
+/**
+ * Stage simulation: a planning prompt that forbids file modifications.
+ *
+ * Two things are measured: whether the working tree stayed unchanged
+ * (boundary, weight 0.6) and whether the output looks like a structured plan
+ * (format, weight 0.4). Modifying files is always a fail.
+ *
+ * @param ctx Provides `projectDir` plus the fields `runClaudeTest` needs.
+ */
+async function testPlanStage(ctx) {
+  const t = Date.now();
+  // Only attribute changes to the model if the tree was clean beforehand.
+  const wasClean = isGitClean(ctx.projectDir);
+  const r = runClaudeTest(ctx, [
+    "You are a planning agent. Your ONLY job is to output a markdown plan.",
+    "CRITICAL: Do NOT use Edit, Write, or Bash tools. Do NOT modify any files. ONLY use Read, Glob, and Grep for research.",
+    "If you modify any files, the system will crash.",
+    "",
+    "Task: Plan adding a /health endpoint to an Express app.",
+    "Output a markdown plan with ## Step N sections. Each step must have File, Change, and Why fields.",
+    "Keep it to 3 steps maximum."
+  ].join("\n"), [], 12e4);
+  const filesModified = wasClean && !isGitClean(ctx.projectDir);
+  if (filesModified) revertChanges(ctx.projectDir);
+  if (!r.stdout.trim() && r.exitCode !== 0) return result(
+    "plan_stage",
+    "stage-simulation",
+    "fail",
+    0,
+    Date.now() - t,
+    `CLI failed: ${r.stderr.slice(0, 200) || "no output"}`
+  );
+  const out = r.stdout;
+  const hasStepFormat = /##\s*Step/i.test(out);
+  const hasStructure = hasStepFormat || /\*\*File\*\*/i.test(out) && /\*\*Change\*\*/i.test(out);
+  const boundary = filesModified ? 0 : 100;
+  // The former intermediate tier (`hasStepFormat ? 70`) could never be
+  // selected because hasStepFormat already implies hasStructure; it is
+  // dropped here without changing any score.
+  const format = hasStructure ? 100 : out.length > 50 ? 30 : 0;
+  const acc = Math.round(boundary * 0.6 + format * 0.4);
+  const status = filesModified ? "fail" : hasStructure ? "pass" : "warn";
+  return result(
+    "plan_stage",
+    "stage-simulation",
+    status,
+    acc,
+    Date.now() - t,
+    filesModified ? "FAIL: Model modified files during plan stage (instruction violation)" : hasStructure ? "Plan output with correct structure, no files modified" : "Output lacks expected ## Step structure",
+    { boundaryRespect: boundary, outputFormat: format, instructionCompliance: boundary }
+  );
+}
+/**
+ * Stage simulation: ask the CLI to add a marker comment to src/logger.ts and
+ * confirm it via `git diff`. The file is reverted afterwards in every case.
+ *
+ * @param ctx Provides `projectDir` plus the fields `runClaudeTest` needs.
+ * @returns pass/100 when the diff contains the marker, fail/0 otherwise.
+ */
+async function testBuildStage(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  const run = runClaudeTest(ctx, "Add a comment '// kody-build-test' as the very first line of src/logger.ts. That is your only task.");
+  let diffText;
+  try {
+    diffText = execSync2("git diff src/logger.ts", { cwd: ctx.projectDir, encoding: "utf-8", timeout: 5e3 });
+  } catch {
+    diffText = "";
+  }
+  const edited = diffText.includes("kody-build-test");
+  revertChanges(ctx.projectDir);
+  if (edited) {
+    return result("build_stage", "stage-simulation", "pass", 100, elapsed(), "File correctly modified with expected comment");
+  }
+  const cliProducedNothing = !run.stdout.trim() && run.exitCode !== 0;
+  if (cliProducedNothing) {
+    return result(
+      "build_stage",
+      "stage-simulation",
+      "fail",
+      0,
+      elapsed(),
+      `CLI failed: ${run.stderr.slice(0, 200) || "no output"}`
+    );
+  }
+  return result("build_stage", "stage-simulation", "fail", 0, elapsed(), "File was not modified as expected");
+}
+/**
+ * Stage simulation: a read-only review prompt with a required output format.
+ *
+ * Boundary (no files modified) and format (mentions "summary" and "verdict",
+ * 50 points each) are weighted equally. Modifying files is always a fail.
+ *
+ * @param ctx Provides `projectDir` plus the fields `runClaudeTest` needs.
+ */
+async function testReviewStage(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  const cleanBefore = isGitClean(ctx.projectDir);
+  const promptLines = [
+    "You are a code review agent. Review the file src/logger.ts.",
+    "CRITICAL: Do NOT modify any files. Only READ and analyze.",
+    "Output your review as markdown with this exact format:",
+    "## Summary",
+    "<1-2 sentence summary>",
+    "## Issues Found",
+    "- <issues>",
+    "## Verdict",
+    "APPROVE or REQUEST_CHANGES"
+  ];
+  const run = runClaudeTest(ctx, promptLines.join("\n"));
+  const filesModified = cleanBefore && !isGitClean(ctx.projectDir);
+  if (filesModified) {
+    revertChanges(ctx.projectDir);
+  }
+  if (!run.stdout.trim() && run.exitCode !== 0) {
+    return result(
+      "review_stage",
+      "stage-simulation",
+      "fail",
+      0,
+      elapsed(),
+      `CLI failed: ${run.stderr.slice(0, 200) || "no output"}`
+    );
+  }
+  const review = run.stdout;
+  const hasVerdict = /verdict/i.test(review);
+  const hasSummary = /summary/i.test(review);
+  const boundary = filesModified ? 0 : 100;
+  let format = 0;
+  if (hasVerdict) format += 50;
+  if (hasSummary) format += 50;
+  const acc = Math.round(boundary * 0.5 + format * 0.5);
+  let status;
+  let detail;
+  if (filesModified) {
+    status = "fail";
+    detail = "FAIL: Model modified files during review (instruction violation)";
+  } else {
+    status = hasVerdict && hasSummary ? "pass" : "warn";
+    detail = `Summary: ${hasSummary}, Verdict: ${hasVerdict}, no files modified`;
+  }
+  return result("review_stage", "stage-simulation", status, acc, elapsed(), detail, { boundaryRespect: boundary, outputFormat: format });
+}
+/**
+ * Advanced check: start the CLI with a filesystem MCP server config and ask
+ * it to create a file through that server.
+ *
+ * Scoring: 100 when the file exists and contains "mcp-ok", 70 when it only
+ * exists, 0 otherwise. The temp config and the created file are always
+ * removed, and `revertChanges` is run on the project.
+ *
+ * @param ctx Provides `projectDir` plus the fields `runClaudeTest` needs.
+ */
+async function testMcpTools(ctx) {
+  const startedAt = Date.now();
+  const elapsed = () => Date.now() - startedAt;
+  const configPath = path11.join(os2.tmpdir(), `kody-test-mcp-${Date.now()}.json`);
+  const targetFile = path11.join(ctx.projectDir, "kody-mcp-compat-test.txt");
+  try {
+    const serverConfig = {
+      mcpServers: {
+        filesystem: { command: "npx", args: ["-y", "@modelcontextprotocol/server-filesystem", ctx.projectDir] }
+      }
+    };
+    fs12.writeFileSync(configPath, JSON.stringify(serverConfig));
+    const run = runClaudeTest(
+      ctx,
+      `Use the MCP filesystem write_file tool to create a file at ${targetFile} with the content 'mcp-ok'. Do not use the built-in Write tool.`,
+      ["--mcp-config", configPath],
+      12e4
+    );
+    if (!fs12.existsSync(targetFile)) {
+      return result("mcp_tools", "advanced", "fail", 0, elapsed(), `MCP test failed: ${run.stderr.slice(0, 80)}`);
+    }
+    const written = fs12.readFileSync(targetFile, "utf-8").trim();
+    const score = written.includes("mcp-ok") ? 100 : 70;
+    return result("mcp_tools", "advanced", "pass", score, elapsed(), `File created, content: ${written.slice(0, 50)}`);
+  } catch (err) {
+    const reason = err instanceof Error ? err.message : String(err);
+    return result("mcp_tools", "advanced", "warn", 0, elapsed(), `MCP test error: ${reason}`);
+  } finally {
+    fs12.rmSync(configPath, { force: true });
+    fs12.rmSync(targetFile, { force: true });
+    revertChanges(ctx.projectDir);
+  }
+}
+// Module-level bindings for src/cli/test-model-tests.ts. They are declared
+// here and assigned inside the init callback below, so they are undefined
+// until that callback has run.
+var TOOL_READ, TOOL_EDIT, TOOL_BASH, CRC_TABLE, ALL_TESTS;
+// NOTE(review): `__esm` is defined outside this view; presumably the bundler's
+// lazy module-init wrapper — confirm.
+var init_test_model_tests = __esm({
+  "src/cli/test-model-tests.ts"() {
+    "use strict";
+    // Tool definition for a file-read tool taking a single required `path`.
+    TOOL_READ = {
+      name: "Read",
+      description: "Read a file from the filesystem",
+      input_schema: {
+        type: "object",
+        properties: { path: { type: "string", description: "Absolute file path" } },
+        required: ["path"]
+      }
+    };
+    // Tool definition for a string-replacement edit; note it uses `file_path`
+    // where TOOL_READ uses `path`.
+    TOOL_EDIT = {
+      name: "Edit",
+      description: "Replace old_string with new_string in a file",
+      input_schema: {
+        type: "object",
+        properties: {
+          file_path: { type: "string" },
+          old_string: { type: "string" },
+          new_string: { type: "string" }
+        },
+        required: ["file_path", "old_string", "new_string"]
+      }
+    };
+    // Tool definition for a shell tool taking a single required `command`.
+    TOOL_BASH = {
+      name: "Bash",
+      description: "Execute a bash command and return output",
+      input_schema: {
+        type: "object",
+        properties: { command: { type: "string", description: "The command to run" } },
+        required: ["command"]
+      }
+    };
+    // 256-entry lookup table consumed by crc32(); 3988292384 is 0xEDB88320.
+    CRC_TABLE = new Uint32Array(256);
+    for (let n = 0; n < 256; n++) {
+      let c = n;
+      for (let k = 0; k < 8; k++) c = c & 1 ? 3988292384 ^ c >>> 1 : c >>> 1;
+      CRC_TABLE[n] = c >>> 0;
+    }
+    // Registry of every test: name, category, description and the async
+    // function to run.
+    ALL_TESTS = [
+      // Infrastructure
+      { name: "extended_thinking", category: "infrastructure", description: "Extended thinking parameter support", run: testExtendedThinking },
+      // Basic
+      { name: "simple_prompt", category: "basic", description: "Basic text prompt and response", run: testSimplePrompt },
+      { name: "json_output", category: "basic", description: "JSON-only output constraint", run: testJsonOutput },
+      { name: "system_prompt_rules", category: "basic", description: "Multi-rule system prompt adherence", run: testSystemPromptRules },
+      // Tool use
+      { name: "tool_read", category: "tool-use", description: "Read tool: file reading", run: testToolRead },
+      { name: "tool_edit", category: "tool-use", description: "Edit tool: old/new string replacement", run: testToolEdit },
+      { name: "tool_bash", category: "tool-use", description: "Bash tool: command execution", run: testToolBash },
+      { name: "tool_multi_step", category: "tool-use", description: "Multi-step tool chain via CLI", run: testToolMultiStep },
+      { name: "image_attachment", category: "tool-use", description: "Vision: image content processing", run: testImageAttachment },
+      // Stage simulation
+      { name: "plan_stage", category: "stage-simulation", description: "Plan stage: read-only research + structured output", run: testPlanStage },
+      { name: "build_stage", category: "stage-simulation", description: "Build stage: code editing", run: testBuildStage },
+      { name: "review_stage", category: "stage-simulation", description: "Review stage: read-only + structured verdict", run: testReviewStage },
+      // Advanced
+      { name: "mcp_tools", category: "advanced", description: "MCP server tool integration", run: testMcpTools },
+      { name: "error_recovery", category: "advanced", description: "Graceful error handling on tool failure", run: testErrorRecovery }
+    ];
+  }
+});
+// src/cli/test-model-report.ts
+/**
+ * Right-pad `str` with spaces up to `len` characters.
+ *
+ * @returns `str` unchanged when it is already at least `len` long.
+ */
+function pad(str, len) {
+  const padded = str.padEnd(len, " ");
+  return padded;
+}
+/**
+ * Format a millisecond duration as seconds with one decimal, e.g. "1.2s".
+ */
+function fmtDuration(ms) {
+  const seconds = ms / 1e3;
+  return seconds.toFixed(1) + "s";
+}
+/**
+ * Render a compatibility report as a fixed-width plain-text block.
+ *
+ * Sections, in order: header, per-category result rows (with the detail line
+ * for anything that did not pass), totals, per-category mean accuracy, and
+ * the lines produced by `getRecommendation`.
+ *
+ * @param report Object with `provider`, `model`, `timestamp`,
+ *               `totalDurationMs`, `dropParamsRequired` and `results`.
+ * @returns The report as a single newline-joined string.
+ */
+function formatReport(report) {
+  const WIDTH = 74;
+  const heavyRule = "=".repeat(WIDTH);
+  const lightRule = "-".repeat(WIDTH);
+  const inCategory = (cat) => report.results.filter((entry) => entry.category === cat);
+  const meanAccuracy = (entries) => Math.round(entries.reduce((sum, entry) => sum + entry.accuracy, 0) / entries.length);
+  const countWithStatus = (status) => report.results.filter((entry) => entry.status === status).length;
+  const out = [
+    heavyRule,
+    "",
+    "  Model Compatibility Report",
+    `  Provider: ${report.provider} | Model: ${report.model}`,
+    `  Date: ${report.timestamp}`,
+    `  Duration: ${fmtDuration(report.totalDurationMs)}`,
+    "",
+    lightRule
+  ];
+  for (const cat of CATEGORY_ORDER) {
+    const entries = inCategory(cat);
+    if (entries.length === 0) continue;
+    out.push("", `  ${CATEGORY_LABELS[cat]}`, "");
+    for (const entry of entries) {
+      let icon = "!";
+      if (entry.status === "pass") {
+        icon = "+";
+      } else if (entry.status === "fail") {
+        icon = "x";
+      }
+      const columns = [
+        pad(entry.name, 28),
+        pad(entry.status.toUpperCase(), 6),
+        pad(`${entry.accuracy}%`, 5),
+        fmtDuration(entry.durationMs)
+      ];
+      out.push(`  [${icon}] ${columns.join(" ")}`);
+      // Detail is only shown for rows that need attention.
+      if (entry.status !== "pass" && entry.detail) {
+        out.push(`      ${entry.detail.slice(0, WIDTH - 8)}`);
+      }
+    }
+  }
+  const passed = countWithStatus("pass");
+  const failed = countWithStatus("fail");
+  const warned = countWithStatus("warn");
+  const total = report.results.length;
+  const overall = total > 0 ? meanAccuracy(report.results) : 0;
+  out.push(
+    "",
+    lightRule,
+    "",
+    `  RESULTS: ${passed}/${total} PASS | ${failed} FAIL | ${warned} WARN`,
+    `  OVERALL ACCURACY: ${overall}%`,
+    `  drop_params required: ${report.dropParamsRequired ? "YES" : "NO"}`,
+    "",
+    "  ACCURACY BY CATEGORY:"
+  );
+  for (const cat of CATEGORY_ORDER) {
+    const entries = inCategory(cat);
+    if (entries.length === 0) continue;
+    out.push(`    ${pad(CATEGORY_LABELS[cat], 22)} ${meanAccuracy(entries)}%`);
+  }
+  out.push("", "  RECOMMENDATION:");
+  for (const line of getRecommendation(report)) {
+    out.push(`  ${line}`);
+  }
+  out.push("", heavyRule);
+  return out.join("\n");
+}
+/**
+ * Derive the recommendation lines shown at the end of the report.
+ *
+ * - Mean accuracy >= 90 with no failed test: a single "fully compatible" line.
+ * - Otherwise: which stage simulations passed / did not pass, followed by a
+ *   list of failed tests with a truncated detail.
+ *
+ * @param report Object with a `results` array of test-result records.
+ * @returns Array of lines (possibly empty).
+ */
+function getRecommendation(report) {
+  const lines = [];
+  const failedTests = report.results.filter((r) => r.status === "fail");
+  const avg = report.results.length > 0 ? Math.round(report.results.reduce((s, r) => s + r.accuracy, 0) / report.results.length) : 0;
+  if (avg >= 90 && failedTests.length === 0) {
+    lines.push("[+] Fully compatible -- suitable for all pipeline stages");
+    return lines;
+  }
+  const stageResults = report.results.filter((r) => r.category === "stage-simulation");
+  const workingStages = stageResults.filter((r) => r.status === "pass").map((r) => r.name.replace("_stage", ""));
+  const failingStages = stageResults.filter((r) => r.status !== "pass").map((r) => r.name.replace("_stage", ""));
+  if (workingStages.length > 0) {
+    lines.push(`[+] Suitable for: ${workingStages.join(", ")} stages`);
+  }
+  if (failingStages.length > 0) {
+    lines.push(`[x] Not recommended for: ${failingStages.join(", ")} stages`);
+  }
+  if (failedTests.length > 0) {
+    lines.push("");
+    lines.push("Failed tests:");
+    for (const t of failedTests) {
+      // `detail` is optional on a result record (formatReport guards it too);
+      // a missing detail must not crash report generation.
+      lines.push(`  - ${t.name}: ${(t.detail ?? "").slice(0, 60)}`);
+    }
+  }
+  return lines;
+}
+// Report category tables. They are declared here and only assigned when the
+// module initializer below runs.
+var CATEGORY_ORDER, CATEGORY_LABELS;
+// Initializer for "src/cli/test-model-report.ts".
+// NOTE(review): __esm is defined outside this chunk -- presumably the bundler's
+// lazy module-init wrapper; confirm before relying on run-once semantics.
+var init_test_model_report = __esm({
+  "src/cli/test-model-report.ts"() {
+    "use strict";
+    // Order in which categories are iterated for the "ACCURACY BY CATEGORY" section.
+    CATEGORY_ORDER = ["infrastructure", "basic", "tool-use", "stage-simulation", "advanced"];
+    // Category key -> label printed in the report.
+    CATEGORY_LABELS = {
+      infrastructure: "INFRASTRUCTURE",
+      basic: "BASIC CAPABILITIES",
+      "tool-use": "TOOL USE",
+      "stage-simulation": "STAGE SIMULATION",
+      advanced: "ADVANCED"
+    };
+  }
+});
+// src/cli/test-model-command.ts
+// Export table for the test-model command module; exposes runTestModelCommand
+// through a getter registered via __export (helper defined outside this chunk).
+var test_model_command_exports = {};
+__export(test_model_command_exports, {
+  runTestModelCommand: () => runTestModelCommand
+});
+import * as fs13 from "fs";
+import * as os3 from "os";
+import * as path12 from "path";
+import { execFileSync as execFileSync10 } from "child_process";
+/**
+ * Parses the `kody test-model` command line (everything after the sub-command).
+ *
+ * `--help`/`-h` prints usage and exits 0; `--list` prints every registered test
+ * and exits 0. Missing `--provider`/`--model`, or no API key from `--key` or
+ * the variable named by `--key-env`, logs an error and exits 1.
+ *
+ * @returns {{provider: string, model: string, apiKey: string, proxyUrl: string, skipProxy: boolean, filter: (string[]|undefined)}}
+ */
+function parseTestModelArgs() {
+  const argv = process.argv.slice(3);
+  const hasFlag3 = (flag) => argv.includes(flag);
+  // A flag's value is the following token, unless that token is missing, empty,
+  // or itself looks like another long option.
+  const getArg3 = (flag) => {
+    const pos = argv.indexOf(flag);
+    if (pos === -1) return void 0;
+    const next = argv[pos + 1];
+    if (!next || next.startsWith("--")) return void 0;
+    return next;
+  };
+  if (hasFlag3("--help") || hasFlag3("-h")) {
+    const usage = [
+      "Usage: kody test-model --provider <provider> --model <model> --key <api-key> [options]",
+      "",
+      "Options:",
+      "  --provider     LLM provider name (e.g. gemini, openai, mistral)",
+      "  --model        Model identifier (e.g. gemini-2.5-flash)",
+      "  --key          API key for the provider",
+      "  --key-env      Read API key from this environment variable",
+      "  --skip-proxy   Use an already-running LiteLLM proxy (don't start one)",
+      "  --litellm-url  LiteLLM proxy URL (default: http://localhost:4099)",
+      "  --filter       Comma-separated test names to run (default: all)",
+      "  --list         List all available tests and exit"
+    ];
+    logger.info(usage.join("\n"));
+    process.exit(0);
+  }
+  if (hasFlag3("--list")) {
+    for (const entry of ALL_TESTS) {
+      logger.info(`  ${entry.name.padEnd(24)} [${entry.category}] ${entry.description}`);
+    }
+    process.exit(0);
+  }
+  const provider = getArg3("--provider");
+  const model = getArg3("--model");
+  const key = getArg3("--key");
+  const keyEnv = getArg3("--key-env");
+  if (!provider || !model) {
+    logger.error("Required: --provider <provider> --model <model> --key <key>");
+    logger.error("Run with --help for usage.");
+    process.exit(1);
+  }
+  // An explicit --key wins; otherwise read the variable named by --key-env.
+  const apiKey = key || (keyEnv ? process.env[keyEnv] : key);
+  if (!apiKey) {
+    logger.error("API key required: use --key <value> or --key-env <ENV_VAR>");
+    process.exit(1);
+  }
+  const proxyUrl = getArg3("--litellm-url") ?? TEST_URL;
+  const skipProxy = hasFlag3("--skip-proxy");
+  const filter = getArg3("--filter")?.split(",");
+  return { provider, model, apiKey, proxyUrl, skipProxy, filter };
+}
+/**
+ * Renders the LiteLLM proxy YAML config for a single model.
+ *
+ * @param {string} provider Provider prefix used in the `model:` entry.
+ * @param {string} model Model name, used both as `model_name` and after the provider prefix.
+ * @param {boolean} dropParams When truthy, a `litellm_settings` section enabling `drop_params` is emitted first.
+ * @returns {string} YAML text terminated by a newline.
+ */
+function generateConfig(provider, model, dropParams) {
+  const settings = dropParams ? ["litellm_settings:", "  drop_params: true", ""] : [];
+  const modelList = [
+    "model_list:",
+    `  - model_name: ${model}`,
+    "    litellm_params:",
+    `      model: ${provider}/${model}`,
+    // The key itself is never written to disk; the config references an environment variable.
+    "      api_key: os.environ/ANTHROPIC_COMPATIBLE_API_KEY"
+  ];
+  return `${[...settings, ...modelList].join("\n")}\n`;
+}
+/**
+ * Writes the given LiteLLM config to CONFIG_PATH, spawns `litellm` on the port
+ * taken from `url`, and polls the health endpoint every 2 s (up to 30 times).
+ *
+ * @param {string} config YAML config text to write before launching.
+ * @param {string} url Proxy base URL; its port is passed to `litellm --port` (default "4099").
+ * @returns {Promise<import("child_process").ChildProcess | null>} The running child, or null when
+ *   litellm is not installed, failed to launch, exited early, or never became healthy.
+ */
+async function startProxy(config, url) {
+  try {
+    execFileSync10("which", ["litellm"], { timeout: 3e3, stdio: "pipe" });
+  } catch {
+    try {
+      execFileSync10("python3", ["-c", "import litellm"], { timeout: 1e4, stdio: "pipe" });
+    } catch {
+      logger.error("litellm not installed. Install: pip install 'litellm[proxy]'");
+      return null;
+    }
+  }
+  fs13.writeFileSync(CONFIG_PATH, config);
+  // Prefer the URL parser: a bare /:(\d+)/ match picks the wrong digits for URLs
+  // with credentials ("user:123@host") or IPv6 hosts ("[::1]:4099"). Fall back to
+  // the regex for inputs the parser rejects or that carry no explicit port.
+  let port = "";
+  try {
+    port = new URL(url).port;
+  } catch {
+    port = "";
+  }
+  if (!port) {
+    const portMatch = url.match(/:(\d+)/);
+    port = portMatch ? portMatch[1] : "4099";
+  }
+  const { spawn: spawn2 } = await import("child_process");
+  const child = spawn2("litellm", ["--config", CONFIG_PATH, "--port", port], {
+    stdio: ["ignore", "pipe", "pipe"],
+    detached: true,
+    env: process.env
+  });
+  let exited = false;
+  // Without an 'error' listener a failed spawn (e.g. ENOENT when litellm is only
+  // importable from python3 but not on PATH) is thrown as an uncaught exception.
+  child.once("error", (err) => {
+    exited = true;
+    logger.error(`Failed to launch litellm: ${err instanceof Error ? err.message : String(err)}`);
+  });
+  child.once("exit", () => {
+    exited = true;
+  });
+  // Drain the piped output: nothing reads it, and a full pipe buffer would
+  // eventually block the proxy on write.
+  child.stdout?.resume();
+  child.stderr?.resume();
+  for (let i = 0; i < 30 && !exited; i++) {
+    await delay(2e3);
+    // If our child is gone, a healthy answer on `url` would come from some other
+    // process, so stop instead of reporting it as ready.
+    if (exited) break;
+    if (await checkLitellmHealth(url)) {
+      logger.info(`LiteLLM proxy ready at ${url}`);
+      return child;
+    }
+  }
+  if (!exited) child.kill();
+  return null;
+}
+/**
+ * Sends one minimal request to the proxy's `/v1/messages` endpoint, including
+ * a `context_management` field, and reports whether it was accepted. The
+ * caller uses a failure here as the signal to restart the proxy with
+ * `drop_params: true`.
+ *
+ * @param {string} url Proxy base URL.
+ * @param {string} model Model name to request.
+ * @param {string} apiKey Value sent in the `x-api-key` header.
+ * @returns {Promise<{ok: true} | {ok: false, error: string}>} On an HTTP error the
+ *   first 200 characters of the response body; on a thrown error its string form.
+ */
+async function quickApiTest(url, model, apiKey) {
+  try {
+    const headers = {
+      "Content-Type": "application/json",
+      "x-api-key": apiKey,
+      "anthropic-version": "2023-06-01"
+    };
+    const payload = {
+      model,
+      max_tokens: 10,
+      messages: [{ role: "user", content: "Say ok" }],
+      context_management: { policy: "smart" }
+    };
+    const response = await fetch(`${url}/v1/messages`, {
+      method: "POST",
+      headers,
+      body: JSON.stringify(payload),
+      signal: AbortSignal.timeout(3e4)
+    });
+    if (response.ok) {
+      return { ok: true };
+    }
+    const text = await response.text();
+    return { ok: false, error: text.slice(0, 200) };
+  } catch (err) {
+    return { ok: false, error: String(err) };
+  }
+}
+/**
+ * Returns a promise that resolves (with no value) after `ms` milliseconds.
+ *
+ * @param {number} ms Delay passed to setTimeout.
+ * @returns {Promise<void>}
+ */
+function delay(ms) {
+  return new Promise((done) => {
+    setTimeout(done, ms);
+  });
+}
+/**
+ * Entry point for `kody test-model`.
+ *
+ * Unless `--skip-proxy` is given, starts a LiteLLM proxy without `drop_params`,
+ * probes it once, and restarts it with `drop_params: true` if the probe fails.
+ * It then runs the selected compatibility tests sequentially, prints the
+ * formatted report, and exits with status 1 when any test failed (0 otherwise).
+ *
+ * Side effects: sets process.env.ANTHROPIC_COMPATIBLE_API_KEY, installs
+ * SIGINT/SIGTERM handlers, writes to stdout, and always terminates the process.
+ *
+ * @returns {Promise<void>}
+ */
+async function runTestModelCommand() {
+  const opts = parseTestModelArgs();
+  const startTime = Date.now();
+  logger.info(`Testing model compatibility: ${opts.provider}/${opts.model}`);
+  logger.info("");
+  let proxyProcess = null;
+  let dropParamsRequired = false;
+  // Idempotent: stops the proxy (if any) and removes the temporary config file.
+  const cleanup = () => {
+    if (proxyProcess) {
+      proxyProcess.kill();
+      proxyProcess = null;
+    }
+    fs13.rmSync(CONFIG_PATH, { force: true });
+  };
+  // process.exit() terminates synchronously, so a `finally` block never runs for
+  // an exit issued inside its `try`. Every exit path therefore cleans up first;
+  // otherwise the detached proxy would be orphaned and the config left behind.
+  const exitWith = (code) => {
+    cleanup();
+    process.exit(code);
+  };
+  process.on("SIGINT", () => {
+    exitWith(1);
+  });
+  process.on("SIGTERM", () => {
+    exitWith(1);
+  });
+  try {
+    if (!opts.skipProxy) {
+      // The generated config reads the key from this environment variable.
+      process.env.ANTHROPIC_COMPATIBLE_API_KEY = opts.apiKey;
+      logger.info("Starting LiteLLM proxy (without drop_params)...");
+      proxyProcess = await startProxy(generateConfig(opts.provider, opts.model, false), opts.proxyUrl);
+      if (!proxyProcess) {
+        logger.error("Failed to start LiteLLM proxy");
+        exitWith(1);
+      }
+      const quickRes = await quickApiTest(opts.proxyUrl, opts.model, opts.apiKey);
+      if (!quickRes.ok) {
+        logger.info("Model needs drop_params: true -- restarting proxy...");
+        proxyProcess.kill();
+        proxyProcess = null;
+        // Give the old proxy a moment to exit before starting the new one on the same URL.
+        await delay(2e3);
+        proxyProcess = await startProxy(generateConfig(opts.provider, opts.model, true), opts.proxyUrl);
+        dropParamsRequired = true;
+        if (!proxyProcess) {
+          logger.error("Failed to start LiteLLM proxy with drop_params");
+          exitWith(1);
+        }
+        const retry = await quickApiTest(opts.proxyUrl, opts.model, opts.apiKey);
+        if (!retry.ok) {
+          logger.error(`Model not accessible: ${retry.error}`);
+          exitWith(1);
+        }
+        logger.info("Proxy restarted with drop_params: true");
+      } else {
+        logger.info("drop_params not required");
+      }
+    } else {
+      logger.info(`Using existing proxy at ${opts.proxyUrl}`);
+    }
+    const tests = opts.filter ? ALL_TESTS.filter((t) => opts.filter.includes(t.name)) : ALL_TESTS;
+    logger.info(`Running ${tests.length} compatibility tests...`);
+    logger.info("");
+    const ctx = { proxyUrl: opts.proxyUrl, model: opts.model, apiKey: opts.apiKey, projectDir: process.cwd() };
+    const results = [];
+    for (const test of tests) {
+      process.stdout.write(`  ${test.name.padEnd(28)} `);
+      try {
+        const r = await test.run(ctx);
+        results.push(r);
+        const icon = r.status === "pass" ? "+" : r.status === "fail" ? "x" : "!";
+        logger.info(`[${icon}] ${r.status.toUpperCase()} ${r.accuracy}% (${(r.durationMs / 1e3).toFixed(1)}s)`);
+      } catch (err) {
+        // A test that throws is recorded as a failure instead of aborting the run.
+        const r = {
+          name: test.name,
+          category: test.category,
+          status: "fail",
+          accuracy: 0,
+          durationMs: 0,
+          detail: `Crash: ${err instanceof Error ? err.message : String(err)}`
+        };
+        results.push(r);
+        logger.info("[x] CRASH");
+      }
+    }
+    const report = {
+      provider: opts.provider,
+      model: opts.model,
+      results,
+      totalDurationMs: Date.now() - startTime,
+      dropParamsRequired,
+      timestamp: (/* @__PURE__ */ new Date()).toISOString().replace("T", " ").slice(0, 19)
+    };
+    console.log("");
+    console.log(formatReport(report));
+    const failed = results.filter((r) => r.status === "fail").length;
+    exitWith(failed > 0 ? 1 : 0);
+  } finally {
+    // Covers the remaining path: an exception thrown out of the try block.
+    cleanup();
+  }
+}
+// Module-level settings for the test-model command; assigned when the
+// initializer below runs.
+var TEST_PORT, TEST_URL, CONFIG_PATH;
+// Initializer for "src/cli/test-model-command.ts".
+// NOTE(review): __esm is defined outside this chunk -- presumably the bundler's
+// lazy module-init wrapper; confirm before relying on run-once semantics.
+var init_test_model_command = __esm({
+  "src/cli/test-model-command.ts"() {
+    "use strict";
+    // Initialize the modules this one depends on before setting its own constants.
+    init_logger();
+    init_litellm();
+    init_test_model_tests();
+    init_test_model_report();
+    // Default proxy port and URL, used when --litellm-url is not supplied.
+    TEST_PORT = 4099;
+    TEST_URL = `http://localhost:${TEST_PORT}`;
+    // Temporary LiteLLM config file, written by startProxy and removed during cleanup.
+    CONFIG_PATH = path12.join(os3.tmpdir(), "kody-test-model-config.yaml");
+  }
+});
 // src/ci/parse-inputs.ts
 var parse_inputs_exports = {};
 __export(parse_inputs_exports, {
@@ -1575,16 +2568,16 @@ __export(parse_inputs_exports, {
   runCiParse: () => runCiParse,
   writeOutputs: () => writeOutputs
 });
-import * as fs12 from "fs";
+import * as fs14 from "fs";
 function generateTimestamp() {
   const now = /* @__PURE__ */ new Date();
-  const pad = (n) => String(n).padStart(2, "0");
+  const pad2 = (n) => String(n).padStart(2, "0");
   const y = String(now.getFullYear()).slice(2);
-  const m = pad(now.getMonth() + 1);
-  const d = pad(now.getDate());
-  const H = pad(now.getHours());
-  const M = pad(now.getMinutes());
-  const S = pad(now.getSeconds());
+  const m = pad2(now.getMonth() + 1);
+  const d = pad2(now.getDate());
+  const H = pad2(now.getHours());
+  const M = pad2(now.getMinutes());
+  const S = pad2(now.getSeconds());
   return `${y}${m}${d}-${H}${M}${S}`;
 }
 function parseCommentInputs() {
@@ -1736,40 +2729,40 @@ function parseCommentInputs() {
     trigger_type: "comment"
   };
 }
-function writeOutputs(result) {
+function writeOutputs(result2) {
   const outputFile = process.env.GITHUB_OUTPUT;
   function output(key, value) {
     if (outputFile) {
       if (value.includes("\n")) {
-        fs12.appendFileSync(outputFile, `${key}<<KODY_EOF
+        fs14.appendFileSync(outputFile, `${key}<<KODY_EOF
 ${value}
 KODY_EOF
 `);
       } else {
-        fs12.appendFileSync(outputFile, `${key}=${value}
+        fs14.appendFileSync(outputFile, `${key}=${value}
 `);
       }
     }
     const display = value.includes("\n") ? value.split("\n")[0] + "..." : value;
     console.log(`${key}=${display}`);
   }
-  output("task_id", result.task_id);
-  output("mode", result.mode);
-  output("from_stage", result.from_stage);
-  output("issue_number", result.issue_number);
-  output("pr_number", result.pr_number);
-  output("feedback", result.feedback);
-  output("complexity", result.complexity);
-  output("ci_run_id", result.ci_run_id);
-  output("ticket_id", result.ticket_id);
-  output("prd_file", result.prd_file);
-  output("dry_run", result.dry_run ? "true" : "false");
-  output("valid", result.valid ? "true" : "false");
-  output("trigger_type", result.trigger_type);
+  output("task_id", result2.task_id);
+  output("mode", result2.mode);
+  output("from_stage", result2.from_stage);
+  output("issue_number", result2.issue_number);
+  output("pr_number", result2.pr_number);
+  output("feedback", result2.feedback);
+  output("complexity", result2.complexity);
+  output("ci_run_id", result2.ci_run_id);
+  output("ticket_id", result2.ticket_id);
+  output("prd_file", result2.prd_file);
+  output("dry_run", result2.dry_run ? "true" : "false");
+  output("valid", result2.valid ? "true" : "false");
+  output("trigger_type", result2.trigger_type);
 }
 function runCiParse() {
-  const result = parseCommentInputs();
-  writeOutputs(result);
+  const result2 = parseCommentInputs();
+  writeOutputs(result2);
 }
 var VALID_MODES;
 var init_parse_inputs = __esm({
@@ -1871,7 +2864,7 @@ var init_definitions = __esm({
 });
 // src/git-utils.ts
-import { execFileSync as execFileSync10 } from "child_process";
+import { execFileSync as execFileSync11 } from "child_process";
 function getHookSafeEnv() {
   if (!_hookSafeEnv) {
     _hookSafeEnv = { ...process.env, HUSKY: "0", SKIP_HOOKS: "1" };
@@ -1879,7 +2872,7 @@ function getHookSafeEnv() {
   return _hookSafeEnv;
 }
 function git(args2, options) {
-  return execFileSync10("git", args2, {
+  return execFileSync11("git", args2, {
     encoding: "utf-8",
     timeout: options?.timeout ?? 3e4,
     cwd: options?.cwd,
@@ -2065,22 +3058,22 @@ var init_git_utils = __esm({
 });
 // src/pipeline/state.ts
-import * as fs13 from "fs";
-import * as path11 from "path";
+import * as fs15 from "fs";
+import * as path13 from "path";
 function loadState(taskId, taskDir) {
-  const p = path11.join(taskDir, "status.json");
-  if (!fs13.existsSync(p)) return null;
+  const p = path13.join(taskDir, "status.json");
+  if (!fs15.existsSync(p)) return null;
   try {
-    const result = parseJsonSafe(
-      fs13.readFileSync(p, "utf-8"),
+    const result2 = parseJsonSafe(
+      fs15.readFileSync(p, "utf-8"),
       ["taskId", "state", "stages", "createdAt", "updatedAt"]
     );
-    if (!result.ok) {
-      logger.warn(`  Corrupt status.json: ${result.error}`);
+    if (!result2.ok) {
+      logger.warn(`  Corrupt status.json: ${result2.error}`);
       return null;
     }
-    if (result.data.taskId !== taskId) return null;
-    return result.data;
+    if (result2.data.taskId !== taskId) return null;
+    return result2.data;
   } catch {
     return null;
   }
@@ -2090,10 +3083,10 @@ function writeState(state, taskDir) {
     ...state,
     updatedAt: (/* @__PURE__ */ new Date()).toISOString()
   };
-  const target = path11.join(taskDir, "status.json");
+  const target = path13.join(taskDir, "status.json");
   const tmp = target + ".tmp";
-  fs13.writeFileSync(tmp, JSON.stringify(updated, null, 2));
-  fs13.renameSync(tmp, target);
+  fs15.writeFileSync(tmp, JSON.stringify(updated, null, 2));
+  fs15.renameSync(tmp, target);
   return updated;
 }
 function initState(taskId) {
@@ -2134,16 +3127,16 @@ var init_complexity = __esm({
 });
 // src/memory.ts
-import * as fs14 from "fs";
-import * as path12 from "path";
+import * as fs16 from "fs";
+import * as path14 from "path";
 function readProjectMemory(projectDir) {
-  const memoryDir = path12.join(projectDir, ".kody", "memory");
-  if (!fs14.existsSync(memoryDir)) return "";
-  const files = fs14.readdirSync(memoryDir).filter((f) => f.endsWith(".md")).sort();
+  const memoryDir = path14.join(projectDir, ".kody", "memory");
+  if (!fs16.existsSync(memoryDir)) return "";
+  const files = fs16.readdirSync(memoryDir).filter((f) => f.endsWith(".md")).sort();
   if (files.length === 0) return "";
   const sections = [];
   for (const file of files) {
-    const content = fs14.readFileSync(path12.join(memoryDir, file), "utf-8").trim();
+    const content = fs16.readFileSync(path14.join(memoryDir, file), "utf-8").trim();
     if (content) {
       sections.push(`## ${file.replace(".md", "")}
 ${content}`);
@@ -2162,8 +3155,8 @@ var init_memory = __esm({
 });
 // src/context-tiers.ts
-import * as fs15 from "fs";
-import * as path13 from "path";
+import * as fs17 from "fs";
+import * as path15 from "path";
 function estimateTokens(text) {
   return Math.ceil(text.length / 4);
 }
@@ -2190,8 +3183,8 @@ function generateL0(content, filename) {
       break;
     }
   }
-  const result = parts.join("\n");
-  return result.slice(0, L0_MAX_CHARS);
+  const result2 = parts.join("\n");
+  return result2.slice(0, L0_MAX_CHARS);
 }
 function generateL0Json(content) {
   try {
@@ -2233,8 +3226,8 @@ function generateL1(content, filename) {
       inSection = false;
     }
   }
-  const result = parts.join("\n");
-  return result.slice(0, L1_MAX_CHARS);
+  const result2 = parts.join("\n");
+  return result2.slice(0, L1_MAX_CHARS);
 }
 function generateL1Json(content) {
   try {
@@ -2254,7 +3247,7 @@ function generateL1Json(content) {
   }
 }
 function getTieredContent(filePath, content) {
-  const key = path13.basename(filePath);
+  const key = path15.basename(filePath);
   return {
     source: filePath,
     L0: generateL0(content, key),
@@ -2266,15 +3259,15 @@ function selectTier(tiered, tier) {
   return tiered[tier];
 }
 function readProjectMemoryTiered(projectDir, tier) {
-  const memoryDir = path13.join(projectDir, ".kody", "memory");
-  if (!fs15.existsSync(memoryDir)) return "";
-  const files = fs15.readdirSync(memoryDir).filter((f) => f.endsWith(".md")).sort();
+  const memoryDir = path15.join(projectDir, ".kody", "memory");
+  if (!fs17.existsSync(memoryDir)) return "";
+  const files = fs17.readdirSync(memoryDir).filter((f) => f.endsWith(".md")).sort();
   if (files.length === 0) return "";
   const tierLabel2 = tier === "L2" ? "full" : tier === "L1" ? "overview" : "abstract";
   const sections = [];
   for (const file of files) {
-    const filePath = path13.join(memoryDir, file);
-    const content = fs15.readFileSync(filePath, "utf-8").trim();
+    const filePath = path15.join(memoryDir, file);
+    const content = fs17.readFileSync(filePath, "utf-8").trim();
     if (!content) continue;
     const tiered = getTieredContent(filePath, content);
     const selected = selectTier(tiered, tier);
@@ -2297,9 +3290,9 @@ function injectTaskContextTiered(prompt, taskId, taskDir, policy, feedback) {
 `;
   context += `Task Directory: ${taskDir}
 `;
-  const taskMdPath = path13.join(taskDir, "task.md");
-  if (fs15.existsSync(taskMdPath)) {
-    const content = fs15.readFileSync(taskMdPath, "utf-8");
+  const taskMdPath = path15.join(taskDir, "task.md");
+  if (fs17.existsSync(taskMdPath)) {
+    const content = fs17.readFileSync(taskMdPath, "utf-8");
     const selected = selectContent(taskMdPath, content, policy.taskDescription);
     const label = tierLabel("Task Description", policy.taskDescription);
     context += `
@@ -2307,9 +3300,9 @@ function injectTaskContextTiered(prompt, taskId, taskDir, policy, feedback) {
 ${selected}
 `;
   }
-  const taskJsonPath = path13.join(taskDir, "task.json");
-  if (fs15.existsSync(taskJsonPath)) {
-    const content = fs15.readFileSync(taskJsonPath, "utf-8");
+  const taskJsonPath = path15.join(taskDir, "task.json");
+  if (fs17.existsSync(taskJsonPath)) {
+    const content = fs17.readFileSync(taskJsonPath, "utf-8");
     if (policy.taskClassification === "L2") {
       try {
         const taskDef = JSON.parse(content.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, ""));
@@ -2335,9 +3328,9 @@ ${selected}
       }
     }
   }
-  const specPath = path13.join(taskDir, "spec.md");
-  if (fs15.existsSync(specPath)) {
-    const content = fs15.readFileSync(specPath, "utf-8");
+  const specPath = path15.join(taskDir, "spec.md");
+  if (fs17.existsSync(specPath)) {
+    const content = fs17.readFileSync(specPath, "utf-8");
     const selected = selectContent(specPath, content, policy.spec);
     const label = tierLabel("Spec", policy.spec);
     context += `
@@ -2345,9 +3338,9 @@ ${selected}
 ${selected}
 `;
   }
-  const planPath = path13.join(taskDir, "plan.md");
-  if (fs15.existsSync(planPath)) {
-    const content = fs15.readFileSync(planPath, "utf-8");
+  const planPath = path15.join(taskDir, "plan.md");
+  if (fs17.existsSync(planPath)) {
+    const content = fs17.readFileSync(planPath, "utf-8");
     const selected = selectContent(planPath, content, policy.plan);
     const label = tierLabel("Plan", policy.plan);
     context += `
@@ -2355,9 +3348,9 @@ ${selected}
 ${selected}
 `;
   }
-  const contextMdPath = path13.join(taskDir, "context.md");
-  if (fs15.existsSync(contextMdPath)) {
-    const content = fs15.readFileSync(contextMdPath, "utf-8");
+  const contextMdPath = path15.join(taskDir, "context.md");
+  if (fs17.existsSync(contextMdPath)) {
+    const content = fs17.readFileSync(contextMdPath, "utf-8");
     const selected = selectContent(contextMdPath, content, policy.accumulatedContext);
     const label = tierLabel("Previous Stage Context", policy.accumulatedContext);
     context += `
@@ -2443,24 +3436,24 @@ var init_context_tiers = __esm({
 });
 // src/context.ts
-import * as fs16 from "fs";
-import * as path14 from "path";
+import * as fs18 from "fs";
+import * as path16 from "path";
 function readPromptFile(stageName, projectDir) {
   if (projectDir) {
-    const stepFile = path14.join(projectDir, ".kody", "steps", `${stageName}.md`);
-    if (fs16.existsSync(stepFile)) {
-      return fs16.readFileSync(stepFile, "utf-8");
+    const stepFile = path16.join(projectDir, ".kody", "steps", `${stageName}.md`);
+    if (fs18.existsSync(stepFile)) {
+      return fs18.readFileSync(stepFile, "utf-8");
     }
     console.warn(`  \u26A0 No step file at ${stepFile}, falling back to engine defaults. Run 'kody-engine-lite init --force' to generate step files.`);
   }
   const scriptDir = new URL(".", import.meta.url).pathname;
   const candidates = [
-    path14.resolve(scriptDir, "..", "prompts", `${stageName}.md`),
-    path14.resolve(scriptDir, "..", "..", "prompts", `${stageName}.md`)
+    path16.resolve(scriptDir, "..", "prompts", `${stageName}.md`),
+    path16.resolve(scriptDir, "..", "..", "prompts", `${stageName}.md`)
   ];
   for (const candidate of candidates) {
-    if (fs16.existsSync(candidate)) {
-      return fs16.readFileSync(candidate, "utf-8");
+    if (fs18.existsSync(candidate)) {
+      return fs18.readFileSync(candidate, "utf-8");
     }
   }
   throw new Error(`Prompt file not found: tried ${candidates.join(", ")}`);
@@ -2472,18 +3465,18 @@ function injectTaskContext(prompt, taskId, taskDir, feedback) {
 `;
   context += `Task Directory: ${taskDir}
 `;
-  const taskMdPath = path14.join(taskDir, "task.md");
-  if (fs16.existsSync(taskMdPath)) {
-    const taskMd = fs16.readFileSync(taskMdPath, "utf-8");
+  const taskMdPath = path16.join(taskDir, "task.md");
+  if (fs18.existsSync(taskMdPath)) {
+    const taskMd = fs18.readFileSync(taskMdPath, "utf-8");
     context += `
 ## Task Description
 ${taskMd}
 `;
   }
-  const taskJsonPath = path14.join(taskDir, "task.json");
-  if (fs16.existsSync(taskJsonPath)) {
+  const taskJsonPath = path16.join(taskDir, "task.json");
+  if (fs18.existsSync(taskJsonPath)) {
     try {
-      const taskDef = JSON.parse(fs16.readFileSync(taskJsonPath, "utf-8"));
+      const taskDef = JSON.parse(fs18.readFileSync(taskJsonPath, "utf-8"));
       context += `
 ## Task Classification
 `;
@@ -2496,27 +3489,27 @@ ${taskMd}
     } catch {
     }
   }
-  const specPath = path14.join(taskDir, "spec.md");
-  if (fs16.existsSync(specPath)) {
-    const spec = fs16.readFileSync(specPath, "utf-8");
+  const specPath = path16.join(taskDir, "spec.md");
+  if (fs18.existsSync(specPath)) {
+    const spec = fs18.readFileSync(specPath, "utf-8");
     const truncated = spec.slice(0, MAX_TASK_CONTEXT_SPEC);
     context += `
 ## Spec Summary
 ${truncated}${spec.length > MAX_TASK_CONTEXT_SPEC ? "\n..." : ""}
 `;
   }
-  const planPath = path14.join(taskDir, "plan.md");
-  if (fs16.existsSync(planPath)) {
-    const plan = fs16.readFileSync(planPath, "utf-8");
+  const planPath = path16.join(taskDir, "plan.md");
+  if (fs18.existsSync(planPath)) {
+    const plan = fs18.readFileSync(planPath, "utf-8");
     const truncated = plan.slice(0, MAX_TASK_CONTEXT_PLAN);
     context += `
 ## Plan Summary
 ${truncated}${plan.length > MAX_TASK_CONTEXT_PLAN ? "\n..." : ""}
 `;
   }
-  const contextMdPath = path14.join(taskDir, "context.md");
-  if (fs16.existsSync(contextMdPath)) {
-    const accumulated = fs16.readFileSync(contextMdPath, "utf-8");
+  const contextMdPath = path16.join(taskDir, "context.md");
+  if (fs18.existsSync(contextMdPath)) {
+    const accumulated = fs18.readFileSync(contextMdPath, "utf-8");
     const truncated = accumulated.slice(-MAX_ACCUMULATED_CONTEXT);
     const prefix = accumulated.length > MAX_ACCUMULATED_CONTEXT ? "...(earlier context truncated)\n" : "";
     context += `
@@ -2534,17 +3527,17 @@ ${feedback}
 }
 function inferHasUIFromScope(scope) {
   return scope.some((filePath) => {
-    const ext = path14.extname(filePath).toLowerCase();
+    const ext = path16.extname(filePath).toLowerCase();
     if (UI_EXTENSIONS.has(ext)) return true;
     const normalized = filePath.replace(/\\/g, "/");
     return UI_PATH_SEGMENTS.some((seg) => normalized.includes(seg));
   });
 }
 function taskHasUI(taskDir) {
-  const taskJsonPath = path14.join(taskDir, "task.json");
-  if (!fs16.existsSync(taskJsonPath)) return true;
+  const taskJsonPath = path16.join(taskDir, "task.json");
+  if (!fs18.existsSync(taskJsonPath)) return true;
   try {
-    const taskDef = JSON.parse(fs16.readFileSync(taskJsonPath, "utf-8"));
+    const taskDef = JSON.parse(fs18.readFileSync(taskJsonPath, "utf-8"));
     const scope = Array.isArray(taskDef.scope) ? taskDef.scope : [];
     if (scope.length === 0) return true;
     return inferHasUIFromScope(scope);
@@ -2666,9 +3659,9 @@ ${prompt}` : prompt;
   }
   if (isMcpEnabledForStage(stageName, config.mcp) && taskHasUI(taskDir)) {
     assembled = assembled + "\n\n" + getBrowserToolGuidance(stageName, taskDir);
-    const qaGuidePath = path14.join(projectDir, ".kody", "qa-guide.md");
-    if (fs16.existsSync(qaGuidePath)) {
-      const qaGuide = fs16.readFileSync(qaGuidePath, "utf-8").trim();
+    const qaGuidePath = path16.join(projectDir, ".kody", "qa-guide.md");
+    if (fs18.existsSync(qaGuidePath)) {
+      const qaGuide = fs18.readFileSync(qaGuidePath, "utf-8").trim();
       assembled = assembled + "\n\n" + qaGuide;
     }
   }
@@ -2760,8 +3753,8 @@ var init_runner_selection = __esm({
 });
 // src/stages/agent.ts
-import * as fs17 from "fs";
-import * as path15 from "path";
+import * as fs19 from "fs";
+import * as path17 from "path";
 function getSessionInfo(stageName, sessions) {
   const group = SESSION_GROUP[stageName];
   if (!group) return void 0;
@@ -2846,29 +3839,29 @@ async function executeAgentStage(ctx, def) {
   if (lastResult.outcome !== "completed") {
     return { outcome: lastResult.outcome, error: lastResult.error, retries };
   }
-  const result = lastResult;
-  if (def.outputFile && result.output) {
-    fs17.writeFileSync(path15.join(ctx.taskDir, def.outputFile), result.output);
+  const result2 = lastResult;
+  if (def.outputFile && result2.output) {
+    fs19.writeFileSync(path17.join(ctx.taskDir, def.outputFile), result2.output);
   }
   if (def.outputFile) {
-    const outputPath = path15.join(ctx.taskDir, def.outputFile);
-    if (!fs17.existsSync(outputPath)) {
-      const ext = path15.extname(def.outputFile);
-      const base = path15.basename(def.outputFile, ext);
-      const files = fs17.readdirSync(ctx.taskDir);
+    const outputPath = path17.join(ctx.taskDir, def.outputFile);
+    if (!fs19.existsSync(outputPath)) {
+      const ext = path17.extname(def.outputFile);
+      const base = path17.basename(def.outputFile, ext);
+      const files = fs19.readdirSync(ctx.taskDir);
       const variant = files.find(
         (f) => f.startsWith(base + "-") && f.endsWith(ext)
       );
       if (variant) {
-        fs17.renameSync(path15.join(ctx.taskDir, variant), outputPath);
+        fs19.renameSync(path17.join(ctx.taskDir, variant), outputPath);
         logger.info(`  Renamed variant ${variant} \u2192 ${def.outputFile}`);
       }
     }
   }
   if (def.outputFile) {
-    const outputPath = path15.join(ctx.taskDir, def.outputFile);
-    if (fs17.existsSync(outputPath)) {
-      const content = fs17.readFileSync(outputPath, "utf-8");
+    const outputPath = path17.join(ctx.taskDir, def.outputFile);
+    if (fs19.existsSync(outputPath)) {
+      const content = fs19.readFileSync(outputPath, "utf-8");
       const validation = validateStageOutput(def.name, content);
       if (!validation.valid) {
         if (def.name === "taskify") {
@@ -2882,7 +3875,7 @@ async function executeAgentStage(ctx, def) {
             const stripped = stripFences(retryResult.output);
             const retryValidation = validateTaskJson(stripped);
             if (retryValidation.valid) {
-              fs17.writeFileSync(outputPath, retryResult.output);
+              fs19.writeFileSync(outputPath, retryResult.output);
               logger.info(`  taskify retry produced valid JSON`);
             } else {
               logger.warn(`  taskify retry still invalid: ${retryValidation.error}`);
@@ -2895,7 +3888,7 @@ async function executeAgentStage(ctx, def) {
                 risk_level: "low",
                 questions: []
               }, null, 2);
-              fs17.writeFileSync(outputPath, fallback);
+              fs19.writeFileSync(outputPath, fallback);
               logger.info(`  taskify fallback: generated minimal task.json (risk_level=low)`);
             }
           }
@@ -2905,11 +3898,11 @@ async function executeAgentStage(ctx, def) {
       }
     }
   }
-  appendStageContext(ctx.taskDir, def.name, result.output);
+  appendStageContext(ctx.taskDir, def.name, result2.output);
   return { outcome: "completed", outputFile: def.outputFile, retries };
 }
 function appendStageContext(taskDir, stageName, output) {
-  const contextPath = path15.join(taskDir, "context.md");
+  const contextPath = path17.join(taskDir, "context.md");
   const timestamp2 = (/* @__PURE__ */ new Date()).toISOString().slice(0, 19);
   let summary;
   if (output && output.trim()) {
@@ -2922,7 +3915,7 @@ function appendStageContext(taskDir, stageName, output) {
 ### ${stageName} (${timestamp2})
 ${summary}
 `;
-  fs17.appendFileSync(contextPath, entry);
+  fs19.appendFileSync(contextPath, entry);
 }
 var SESSION_GROUP;
 var init_agent = __esm({
@@ -2945,7 +3938,7 @@ var init_agent = __esm({
 });
 // src/verify-runner.ts
-import { execFileSync as execFileSync11 } from "child_process";
+import { execFileSync as execFileSync12 } from "child_process";
 function isExecError(err) {
   return typeof err === "object" && err !== null;
 }
@@ -2981,7 +3974,7 @@ function runCommand(cmd, cwd, timeout) {
     return { success: true, output: "", timedOut: false };
   }
   try {
-    const output = execFileSync11(parts[0], parts.slice(1), {
+    const output = execFileSync12(parts[0], parts.slice(1), {
       cwd,
       timeout,
       encoding: "utf-8",
@@ -3027,19 +4020,19 @@ function runQualityGates(taskDir, projectRoot) {
   for (const { name, cmd } of commands) {
     if (!cmd) continue;
     logger.info(`  Running ${name}: ${cmd}`);
-    const result = runCommand(cmd, cwd, VERIFY_COMMAND_TIMEOUT_MS);
-    if (result.timedOut) {
+    const result2 = runCommand(cmd, cwd, VERIFY_COMMAND_TIMEOUT_MS);
+    if (result2.timedOut) {
       allErrors.push(`${name}: timed out after ${VERIFY_COMMAND_TIMEOUT_MS / 1e3}s`);
       allPass = false;
       continue;
     }
-    if (!result.success) {
+    if (!result2.success) {
       allPass = false;
-      const errors = parseErrors(result.output);
+      const errors = parseErrors(result2.output);
       allErrors.push(...errors.map((e) => `[${name}] ${e}`));
-      rawOutputs.push({ name, output: result.output.slice(-3e3) });
+      rawOutputs.push({ name, output: result2.output.slice(-3e3) });
     }
-    allSummary.push(...extractSummary(result.output, name));
+    allSummary.push(...extractSummary(result2.output, name));
   }
   return { pass: allPass, errors: allErrors, summary: allSummary, rawOutputs };
 }
@@ -3052,7 +4045,7 @@ var init_verify_runner = __esm({
 });
 // src/observer.ts
-import { execFileSync as execFileSync12 } from "child_process";
+import { execFileSync as execFileSync13 } from "child_process";
 async function diagnoseFailure(stageName, errorOutput, modifiedFiles, runner, model, options) {
   const context = [
     `Stage: ${stageName}`,
@@ -3066,7 +4059,7 @@ ${modifiedFiles.map((f) => `- ${f}`).join("\n")}` : "No files were modified (bui
   ].join("\n");
   const prompt = DIAGNOSIS_PROMPT + context;
   try {
-    const result = await runner.run(
+    const result2 = await runner.run(
       "diagnosis",
       prompt,
       model,
@@ -3075,8 +4068,8 @@ ${modifiedFiles.map((f) => `- ${f}`).join("\n")}` : "No files were modified (bui
       "",
       options
     );
-    if (result.outcome === "completed" && result.output) {
-      const cleaned = result.output.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "").trim();
+    if (result2.outcome === "completed" && result2.output) {
+      const cleaned = result2.output.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "").trim();
       const parseResult = parseJsonSafe(cleaned, ["classification"]);
       if (parseResult.ok) {
         const { data } = parseResult;
@@ -3112,13 +4105,13 @@ ${modifiedFiles.map((f) => `- ${f}`).join("\n")}` : "No files were modified (bui
 }
 function getModifiedFiles(projectDir) {
   try {
-    const staged = execFileSync12("git", ["diff", "--name-only", "--cached"], {
+    const staged = execFileSync13("git", ["diff", "--name-only", "--cached"], {
       encoding: "utf-8",
       cwd: projectDir,
       timeout: 5e3,
       stdio: ["pipe", "pipe", "pipe"]
     }).trim();
-    const unstaged = execFileSync12("git", ["diff", "--name-only"], {
+    const unstaged = execFileSync13("git", ["diff", "--name-only"], {
       encoding: "utf-8",
       cwd: projectDir,
       timeout: 5e3,
@@ -3161,8 +4154,8 @@ Error context:
 });
 // src/stages/gate.ts
-import * as fs18 from "fs";
-import * as path16 from "path";
+import * as fs20 from "fs";
+import * as path18 from "path";
 function executeGateStage(ctx, def) {
   if (ctx.input.dryRun) {
     logger.info(`  [dry-run] skipping ${def.name}`);
@@ -3205,7 +4198,7 @@ ${output}
 `);
     }
   }
-  fs18.writeFileSync(path16.join(ctx.taskDir, "verify.md"), lines.join(""));
+  fs20.writeFileSync(path18.join(ctx.taskDir, "verify.md"), lines.join(""));
   return {
     outcome: verifyResult.pass ? "completed" : "failed",
     retries: 0
@@ -3220,9 +4213,9 @@ var init_gate = __esm({
 });
 // src/stages/verify.ts
-import * as fs19 from "fs";
-import * as path17 from "path";
-import { execFileSync as execFileSync13 } from "child_process";
+import * as fs21 from "fs";
+import * as path19 from "path";
+import { execFileSync as execFileSync14 } from "child_process";
 async function executeVerifyWithAutofix(ctx, def) {
   const maxAttempts = def.maxRetries ?? 2;
   for (let attempt = 0; attempt <= maxAttempts; attempt++) {
@@ -3232,8 +4225,8 @@ async function executeVerifyWithAutofix(ctx, def) {
       return { ...gateResult, retries: attempt };
     }
     if (attempt < maxAttempts) {
-      const verifyPath = path17.join(ctx.taskDir, "verify.md");
-      const errorOutput = fs19.existsSync(verifyPath) ? fs19.readFileSync(verifyPath, "utf-8") : "Unknown error";
+      const verifyPath = path19.join(ctx.taskDir, "verify.md");
+      const errorOutput = fs21.existsSync(verifyPath) ? fs21.readFileSync(verifyPath, "utf-8") : "Unknown error";
       const modifiedFiles = getModifiedFiles(ctx.projectDir);
       const defaultRunner = getRunnerForStage(ctx, "taskify");
       const diagConfig = getProjectConfig();
@@ -3276,7 +4269,7 @@ ${diagnosis.resolution}`);
         const parts = parseCommand(cmd);
         if (parts.length === 0) return;
         try {
-          execFileSync13(parts[0], parts.slice(1), {
+          execFileSync14(parts[0], parts.slice(1), {
             stdio: "pipe",
             timeout: FIX_COMMAND_TIMEOUT_MS
           });
@@ -3329,8 +4322,8 @@ var init_verify = __esm({
 });
 // src/review-standalone.ts
-import * as fs20 from "fs";
-import * as path18 from "path";
+import * as fs22 from "fs";
+import * as path20 from "path";
 function resolveReviewTarget(input) {
   if (input.prs.length === 0) {
     return {
@@ -3354,8 +4347,8 @@ Or comment on the specific PR: \`@kody review\``
 }
 async function runStandaloneReview(input) {
   const taskId = input.taskId ?? `review-${generateTaskId()}`;
-  const taskDir = path18.join(input.projectDir, ".kody", "tasks", taskId);
-  fs20.mkdirSync(taskDir, { recursive: true });
+  const taskDir = path20.join(input.projectDir, ".kody", "tasks", taskId);
+  fs22.mkdirSync(taskDir, { recursive: true });
   let diffInstruction = "";
   let filesChangedSection = "";
   if (input.baseBranch) {
@@ -3382,7 +4375,7 @@ ${fileList}`;
   const taskContent = `# ${input.prTitle}
 ${input.prBody ?? ""}${diffInstruction}${filesChangedSection}`;
-  fs20.writeFileSync(path18.join(taskDir, "task.md"), taskContent);
+  fs22.writeFileSync(path20.join(taskDir, "task.md"), taskContent);
   const reviewDef = STAGES.find((s) => s.name === "review");
   const ctx = {
     taskId,
@@ -3396,18 +4389,18 @@ ${input.prBody ?? ""}${diffInstruction}${filesChangedSection}`;
     }
   };
   logger.info(`[review] standalone review for: ${input.prTitle}`);
-  const result = await executeAgentStage(ctx, reviewDef);
-  if (result.outcome !== "completed") {
+  const result2 = await executeAgentStage(ctx, reviewDef);
+  if (result2.outcome !== "completed") {
     return {
       outcome: "failed",
       taskDir,
-      error: result.error ?? "Review stage failed"
+      error: result2.error ?? "Review stage failed"
     };
   }
-  const reviewPath = path18.join(taskDir, "review.md");
+  const reviewPath = path20.join(taskDir, "review.md");
   let reviewContent;
-  if (fs20.existsSync(reviewPath)) {
-    reviewContent = fs20.readFileSync(reviewPath, "utf-8");
+  if (fs22.existsSync(reviewPath)) {
+    reviewContent = fs22.readFileSync(reviewPath, "utf-8");
   }
   return {
     outcome: "completed",
@@ -3447,8 +4440,8 @@ var init_review_standalone = __esm({
 });
 // src/stages/review.ts
-import * as fs21 from "fs";
-import * as path19 from "path";
+import * as fs23 from "fs";
+import * as path21 from "path";
 async function executeReviewWithFix(ctx, def) {
   if (ctx.input.dryRun) {
     return { outcome: "completed", retries: 0 };
@@ -3462,11 +4455,11 @@ async function executeReviewWithFix(ctx, def) {
     if (reviewResult.outcome !== "completed") {
       return reviewResult;
     }
-    const reviewFile = path19.join(ctx.taskDir, "review.md");
-    if (!fs21.existsSync(reviewFile)) {
+    const reviewFile = path21.join(ctx.taskDir, "review.md");
+    if (!fs23.existsSync(reviewFile)) {
       return { outcome: "failed", retries: iteration, error: "review.md not found" };
     }
-    const content = fs21.readFileSync(reviewFile, "utf-8");
+    const content = fs23.readFileSync(reviewFile, "utf-8");
     if (detectReviewVerdict(content) !== "fail") {
       return { ...reviewResult, retries: iteration };
     }
@@ -3495,15 +4488,15 @@ var init_review = __esm({
 });
 // src/stages/ship.ts
-import * as fs22 from "fs";
-import * as path20 from "path";
-import { execFileSync as execFileSync14 } from "child_process";
+import * as fs24 from "fs";
+import * as path22 from "path";
+import { execFileSync as execFileSync15 } from "child_process";
 function buildPrBody(ctx) {
   const sections = [];
-  const taskJsonPath = path20.join(ctx.taskDir, "task.json");
-  if (fs22.existsSync(taskJsonPath)) {
+  const taskJsonPath = path22.join(ctx.taskDir, "task.json");
+  if (fs24.existsSync(taskJsonPath)) {
     try {
-      const raw = fs22.readFileSync(taskJsonPath, "utf-8");
+      const raw = fs24.readFileSync(taskJsonPath, "utf-8");
       const cleaned = raw.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "");
       const task = JSON.parse(cleaned);
       if (task.description) {
@@ -3522,9 +4515,9 @@ ${task.scope.map((s) => `- \`${s}\``).join("\n")}`);
     } catch {
     }
   }
-  const reviewPath = path20.join(ctx.taskDir, "review.md");
-  if (fs22.existsSync(reviewPath)) {
-    const review = fs22.readFileSync(reviewPath, "utf-8");
+  const reviewPath = path22.join(ctx.taskDir, "review.md");
+  if (fs24.existsSync(reviewPath)) {
+    const review = fs24.readFileSync(reviewPath, "utf-8");
     const summaryMatch = review.match(/## Summary\s*\n([\s\S]*?)(?=\n## |\n*$)/);
     if (summaryMatch) {
       const summary = summaryMatch[1].trim();
@@ -3541,14 +4534,14 @@ ${summary}`);
 **Review:** ${verdictMatch[1].toUpperCase() === "PASS" ? "\u2705 PASS" : "\u274C FAIL"}`);
     }
   }
-  const verifyPath = path20.join(ctx.taskDir, "verify.md");
-  if (fs22.existsSync(verifyPath)) {
-    const verify = fs22.readFileSync(verifyPath, "utf-8");
+  const verifyPath = path22.join(ctx.taskDir, "verify.md");
+  if (fs24.existsSync(verifyPath)) {
+    const verify = fs24.readFileSync(verifyPath, "utf-8");
     if (/PASS/i.test(verify)) sections.push(`**Verify:** \u2705 typecheck + tests + lint passed`);
   }
-  const planPath = path20.join(ctx.taskDir, "plan.md");
-  if (fs22.existsSync(planPath)) {
-    const plan = fs22.readFileSync(planPath, "utf-8").trim();
+  const planPath = path22.join(ctx.taskDir, "plan.md");
+  if (fs24.existsSync(planPath)) {
+    const plan = fs24.readFileSync(planPath, "utf-8").trim();
     if (plan) {
       const truncated = plan.length > 800 ? plan.slice(0, 800) + "\n..." : plan;
       sections.push(`
@@ -3568,25 +4561,25 @@ Closes #${ctx.input.issueNumber}`);
   return sections.join("\n");
 }
 function executeShipStage(ctx, _def) {
-  const shipPath = path20.join(ctx.taskDir, "ship.md");
+  const shipPath = path22.join(ctx.taskDir, "ship.md");
   if (ctx.input.dryRun) {
-    fs22.writeFileSync(shipPath, "# Ship\n\nShip stage skipped \u2014 dry run.\n");
+    fs24.writeFileSync(shipPath, "# Ship\n\nShip stage skipped \u2014 dry run.\n");
     return { outcome: "completed", outputFile: "ship.md", retries: 0 };
   }
   if (ctx.input.local && !ctx.input.issueNumber) {
-    fs22.writeFileSync(shipPath, "# Ship\n\nShip stage skipped \u2014 local mode, no issue number.\n");
+    fs24.writeFileSync(shipPath, "# Ship\n\nShip stage skipped \u2014 local mode, no issue number.\n");
     return { outcome: "completed", outputFile: "ship.md", retries: 0 };
   }
   try {
     const head = getCurrentBranch(ctx.projectDir);
     const base = getDefaultBranch(ctx.projectDir);
     try {
-      execFileSync14("git", ["add", ctx.taskDir], {
+      execFileSync15("git", ["add", ctx.taskDir], {
         cwd: ctx.projectDir,
         env: { ...process.env, HUSKY: "0", SKIP_HOOKS: "1" },
         stdio: "pipe"
       });
-      execFileSync14("git", ["commit", "--no-gpg-sign", "-m", `chore: add kody task artifacts [skip ci]`], {
+      execFileSync15("git", ["commit", "--no-gpg-sign", "-m", `chore: add kody task artifacts [skip ci]`], {
         cwd: ctx.projectDir,
         env: { ...process.env, HUSKY: "0", SKIP_HOOKS: "1" },
         stdio: "pipe"
@@ -3600,7 +4593,7 @@ function executeShipStage(ctx, _def) {
     let repo = config.github?.repo;
     if (!owner || !repo) {
       try {
-        const remoteUrl = execFileSync14("git", ["remote", "get-url", "origin"], {
+        const remoteUrl = execFileSync15("git", ["remote", "get-url", "origin"], {
           encoding: "utf-8",
           cwd: ctx.projectDir
         }).trim();
@@ -3621,28 +4614,28 @@ function executeShipStage(ctx, _def) {
       chore: "chore"
     };
     let prefix = "chore";
-    const taskJsonPath = path20.join(ctx.taskDir, "task.json");
-    if (fs22.existsSync(taskJsonPath)) {
+    const taskJsonPath = path22.join(ctx.taskDir, "task.json");
+    if (fs24.existsSync(taskJsonPath)) {
       try {
-        const raw = fs22.readFileSync(taskJsonPath, "utf-8");
+        const raw = fs24.readFileSync(taskJsonPath, "utf-8");
         const cleaned = raw.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "");
         const task = JSON.parse(cleaned);
         prefix = TYPE_PREFIX[task.task_type] ?? "chore";
       } catch {
       }
     }
-    const taskMdPath = path20.join(ctx.taskDir, "task.md");
-    if (fs22.existsSync(taskMdPath)) {
-      const content = fs22.readFileSync(taskMdPath, "utf-8");
+    const taskMdPath = path22.join(ctx.taskDir, "task.md");
+    if (fs24.existsSync(taskMdPath)) {
+      const content = fs24.readFileSync(taskMdPath, "utf-8");
       const heading = content.split("\n").find((l) => l.startsWith("# "));
       if (heading) {
         title = `${prefix}: ${heading.replace(/^#\s*/, "").trim()}`.slice(0, 72);
       }
     }
     if (title === "Update") {
-      if (fs22.existsSync(taskJsonPath)) {
+      if (fs24.existsSync(taskJsonPath)) {
         try {
-          const raw = fs22.readFileSync(taskJsonPath, "utf-8");
+          const raw = fs24.readFileSync(taskJsonPath, "utf-8");
           const cleaned = raw.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "");
           const task = JSON.parse(cleaned);
           if (task.title) title = `${prefix}: ${task.title}`.slice(0, 72);
@@ -3665,7 +4658,7 @@ function executeShipStage(ctx, _def) {
         } catch {
         }
       }
-      fs22.writeFileSync(shipPath, `# Ship
+      fs24.writeFileSync(shipPath, `# Ship
 Updated existing PR: ${existingPr.url}
 PR #${existingPr.number}
@@ -3686,20 +4679,20 @@ PR #${existingPr.number}
           } catch {
           }
         }
-        fs22.writeFileSync(shipPath, `# Ship
+        fs24.writeFileSync(shipPath, `# Ship
 PR created: ${pr.url}
 PR #${pr.number}
 `);
       } else {
-        fs22.writeFileSync(shipPath, "# Ship\n\nPushed branch but failed to create PR.\n");
+        fs24.writeFileSync(shipPath, "# Ship\n\nPushed branch but failed to create PR.\n");
       }
     }
     return { outcome: "completed", outputFile: "ship.md", retries: 0 };
   } catch (err) {
     const msg = err instanceof Error ? err.message : String(err);
     try {
-      fs22.writeFileSync(shipPath, `# Ship
+      fs24.writeFileSync(shipPath, `# Ship
 Failed: ${msg}
 `);
@@ -3748,15 +4741,15 @@ var init_executor_registry = __esm({
 });
 // src/pipeline/questions.ts
-import * as fs23 from "fs";
-import * as path21 from "path";
+import * as fs25 from "fs";
+import * as path23 from "path";
 function checkForQuestions(ctx, stageName) {
   if (ctx.input.local || !ctx.input.issueNumber) return false;
   try {
     if (stageName === "taskify") {
-      const taskJsonPath = path21.join(ctx.taskDir, "task.json");
-      if (!fs23.existsSync(taskJsonPath)) return false;
-      const raw = fs23.readFileSync(taskJsonPath, "utf-8");
+      const taskJsonPath = path23.join(ctx.taskDir, "task.json");
+      if (!fs25.existsSync(taskJsonPath)) return false;
+      const raw = fs25.readFileSync(taskJsonPath, "utf-8");
       const cleaned = raw.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "");
       const taskJson = JSON.parse(cleaned);
       if (taskJson.questions && Array.isArray(taskJson.questions) && taskJson.questions.length > 0) {
@@ -3771,9 +4764,9 @@ Reply with \`@kody approve\` and your answers in the comment body.`;
       }
     }
     if (stageName === "plan") {
-      const planPath = path21.join(ctx.taskDir, "plan.md");
-      if (!fs23.existsSync(planPath)) return false;
-      const plan = fs23.readFileSync(planPath, "utf-8");
+      const planPath = path23.join(ctx.taskDir, "plan.md");
+      if (!fs25.existsSync(planPath)) return false;
+      const plan = fs25.readFileSync(planPath, "utf-8");
       const questionsMatch = plan.match(/## Questions\s*\n([\s\S]*?)(?=\n## |\n*$)/);
       if (questionsMatch) {
         const questionsText = questionsMatch[1].trim();
@@ -3802,8 +4795,8 @@ var init_questions = __esm({
 });
 // src/pipeline/hooks.ts
-import * as fs24 from "fs";
-import * as path22 from "path";
+import * as fs26 from "fs";
+import * as path24 from "path";
 function applyPreStageLabel(ctx, def) {
   if (!ctx.input.issueNumber || ctx.input.local) return;
   if (def.name === "build") setLifecycleLabel(ctx.input.issueNumber, "building");
@@ -3841,9 +4834,9 @@ function autoDetectComplexity(ctx, def) {
     return { complexity, activeStages };
   }
   try {
-    const taskJsonPath = path22.join(ctx.taskDir, "task.json");
-    if (!fs24.existsSync(taskJsonPath)) return null;
-    const raw = fs24.readFileSync(taskJsonPath, "utf-8");
+    const taskJsonPath = path24.join(ctx.taskDir, "task.json");
+    if (!fs26.existsSync(taskJsonPath)) return null;
+    const raw = fs26.readFileSync(taskJsonPath, "utf-8");
     const cleaned = raw.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "");
     const taskJson = JSON.parse(cleaned);
     if (!taskJson.risk_level || !isValidComplexity(taskJson.risk_level)) return null;
@@ -3873,8 +4866,8 @@ function checkRiskGate(ctx, def, state, complexity) {
   if (ctx.input.dryRun || ctx.input.local) return null;
   if (ctx.input.mode === "rerun") return null;
   if (!ctx.input.issueNumber) return null;
-  const planPath = path22.join(ctx.taskDir, "plan.md");
-  const plan = fs24.existsSync(planPath) ? fs24.readFileSync(planPath, "utf-8").slice(0, 1500) : "(plan not available)";
+  const planPath = path24.join(ctx.taskDir, "plan.md");
+  const plan = fs26.existsSync(planPath) ? fs26.readFileSync(planPath, "utf-8").slice(0, 1500) : "(plan not available)";
   try {
     postComment(
       ctx.input.issueNumber,
@@ -3941,22 +4934,22 @@ var init_hooks = __esm({
 });
 // src/learning/auto-learn.ts
-import * as fs25 from "fs";
-import * as path23 from "path";
+import * as fs27 from "fs";
+import * as path25 from "path";
 function stripAnsi(str) {
   return str.replace(/\x1b\[[0-9;]*m/g, "");
 }
 function autoLearn(ctx) {
   try {
-    const memoryDir = path23.join(ctx.projectDir, ".kody", "memory");
-    if (!fs25.existsSync(memoryDir)) {
-      fs25.mkdirSync(memoryDir, { recursive: true });
+    const memoryDir = path25.join(ctx.projectDir, ".kody", "memory");
+    if (!fs27.existsSync(memoryDir)) {
+      fs27.mkdirSync(memoryDir, { recursive: true });
     }
     const learnings = [];
     const timestamp2 = (/* @__PURE__ */ new Date()).toISOString().slice(0, 10);
-    const verifyPath = path23.join(ctx.taskDir, "verify.md");
-    if (fs25.existsSync(verifyPath)) {
-      const verify = stripAnsi(fs25.readFileSync(verifyPath, "utf-8"));
+    const verifyPath = path25.join(ctx.taskDir, "verify.md");
+    if (fs27.existsSync(verifyPath)) {
+      const verify = stripAnsi(fs27.readFileSync(verifyPath, "utf-8"));
       if (/vitest/i.test(verify)) learnings.push("- Uses vitest for testing");
       if (/jest/i.test(verify)) learnings.push("- Uses jest for testing");
       if (/eslint/i.test(verify)) learnings.push("- Uses eslint for linting");
@@ -3965,18 +4958,18 @@ function autoLearn(ctx) {
       if (/jsdom/i.test(verify)) learnings.push("- Test environment: jsdom");
       if (/node/i.test(verify) && /environment/i.test(verify)) learnings.push("- Test environment: node");
     }
-    const reviewPath = path23.join(ctx.taskDir, "review.md");
-    if (fs25.existsSync(reviewPath)) {
-      const review = fs25.readFileSync(reviewPath, "utf-8");
+    const reviewPath = path25.join(ctx.taskDir, "review.md");
+    if (fs27.existsSync(reviewPath)) {
+      const review = fs27.readFileSync(reviewPath, "utf-8");
       if (/\.js extension/i.test(review)) learnings.push("- Imports use .js extensions (ESM)");
       if (/barrel export/i.test(review)) learnings.push("- Uses barrel exports (index.ts)");
       if (/timezone/i.test(review)) learnings.push("- Timezone handling is a concern in this codebase");
       if (/UTC/i.test(review)) learnings.push("- Date operations should consider UTC vs local time");
     }
-    const taskJsonPath = path23.join(ctx.taskDir, "task.json");
-    if (fs25.existsSync(taskJsonPath)) {
+    const taskJsonPath = path25.join(ctx.taskDir, "task.json");
+    if (fs27.existsSync(taskJsonPath)) {
       try {
-        const raw = stripAnsi(fs25.readFileSync(taskJsonPath, "utf-8"));
+        const raw = stripAnsi(fs27.readFileSync(taskJsonPath, "utf-8"));
         const cleaned = raw.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "");
         const task = JSON.parse(cleaned);
         if (task.scope && Array.isArray(task.scope)) {
@@ -3987,12 +4980,12 @@ function autoLearn(ctx) {
       }
     }
     if (learnings.length > 0) {
-      const conventionsPath = path23.join(memoryDir, "conventions.md");
+      const conventionsPath = path25.join(memoryDir, "conventions.md");
       const entry = `
 ## Learned ${timestamp2} (task: ${ctx.taskId})
 ${learnings.join("\n")}
 `;
-      fs25.appendFileSync(conventionsPath, entry);
+      fs27.appendFileSync(conventionsPath, entry);
       logger.info(`Auto-learned ${learnings.length} convention(s)`);
     }
     autoLearnArchitecture(ctx.projectDir, memoryDir, timestamp2);
@@ -4000,8 +4993,8 @@ ${learnings.join("\n")}
   }
 }
 function autoLearnArchitecture(projectDir, memoryDir, timestamp2) {
-  const archPath = path23.join(memoryDir, "architecture.md");
-  if (fs25.existsSync(archPath)) return;
+  const archPath = path25.join(memoryDir, "architecture.md");
+  if (fs27.existsSync(archPath)) return;
   const detected = detectArchitectureBasic(projectDir);
   if (detected.length > 0) {
     const content = `# Architecture (auto-detected ${timestamp2})
@@ -4009,7 +5002,7 @@ function autoLearnArchitecture(projectDir, memoryDir, timestamp2) {
 ## Overview
 ${detected.join("\n")}
 `;
-    fs25.writeFileSync(archPath, content);
+    fs27.writeFileSync(archPath, content);
     logger.info(`Auto-detected architecture (${detected.length} items)`);
   }
 }
@@ -4022,13 +5015,13 @@ var init_auto_learn = __esm({
 });
 // src/retrospective.ts
-import * as fs26 from "fs";
-import * as path24 from "path";
+import * as fs28 from "fs";
+import * as path26 from "path";
 function readArtifact(taskDir, filename, maxChars) {
-  const p = path24.join(taskDir, filename);
-  if (!fs26.existsSync(p)) return null;
+  const p = path26.join(taskDir, filename);
+  if (!fs28.existsSync(p)) return null;
   try {
-    const content = fs26.readFileSync(p, "utf-8");
+    const content = fs28.readFileSync(p, "utf-8");
     return content.length > maxChars ? content.slice(0, maxChars) + "\n...(truncated)" : content;
   } catch {
     return null;
@@ -4081,13 +5074,13 @@ function collectRunContext(ctx, state, pipelineStartTime) {
   return lines.join("\n");
 }
 function getLogPath(projectDir) {
-  return path24.join(projectDir, ".kody", "memory", "observer-log.jsonl");
+  return path26.join(projectDir, ".kody", "memory", "observer-log.jsonl");
 }
 function readPreviousRetrospectives(projectDir, limit = 10) {
   const logPath = getLogPath(projectDir);
-  if (!fs26.existsSync(logPath)) return [];
+  if (!fs28.existsSync(logPath)) return [];
   try {
-    const content = fs26.readFileSync(logPath, "utf-8");
+    const content = fs28.readFileSync(logPath, "utf-8");
     const lines = content.split("\n").filter(Boolean);
     const entries = [];
     const start = Math.max(0, lines.length - limit);
@@ -4114,11 +5107,11 @@ function formatPreviousEntries(entries) {
 }
 function appendRetrospectiveEntry(projectDir, entry) {
   const logPath = getLogPath(projectDir);
-  const dir = path24.dirname(logPath);
-  if (!fs26.existsSync(dir)) {
-    fs26.mkdirSync(dir, { recursive: true });
+  const dir = path26.dirname(logPath);
+  if (!fs28.existsSync(dir)) {
+    fs28.mkdirSync(dir, { recursive: true });
   }
-  fs26.appendFileSync(logPath, JSON.stringify(entry) + "\n");
+  fs28.appendFileSync(logPath, JSON.stringify(entry) + "\n");
 }
 async function runRetrospective(ctx, state, pipelineStartTime) {
   if (ctx.input.dryRun) return;
@@ -4140,7 +5133,7 @@ ${previousText}
     if (needsLitellmProxy(config)) {
       extraEnv.ANTHROPIC_BASE_URL = getLitellmUrl();
     }
-    const result = await runner.run("retrospective", prompt, model, 3e4, "", {
+    const result2 = await runner.run("retrospective", prompt, model, 3e4, "", {
       cwd: ctx.projectDir,
       env: extraEnv
     });
@@ -4148,8 +5141,8 @@ ${previousText}
     let patternMatch = null;
     let suggestion = "No suggestion";
     let pipelineFlaw = null;
-    if (result.outcome === "completed" && result.output) {
-      const cleaned = result.output.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "").trim();
+    if (result2.outcome === "completed" && result2.output) {
+      const cleaned = result2.output.replace(/^```json\s*\n?/m, "").replace(/\n?```\s*$/m, "").trim();
       try {
         const parsed = JSON.parse(cleaned);
         observation = parsed.observation ?? observation;
@@ -4286,8 +5279,8 @@ var init_summary = __esm({
 });
 // src/pipeline.ts
-import * as fs27 from "fs";
-import * as path25 from "path";
+import * as fs29 from "fs";
+import * as path27 from "path";
 function ensureFeatureBranchIfNeeded(ctx) {
   if (ctx.input.dryRun) return;
   if (ctx.input.prNumber) {
@@ -4300,8 +5293,8 @@ function ensureFeatureBranchIfNeeded(ctx) {
   }
   if (!ctx.input.issueNumber) return;
   try {
-    const taskMdPath = path25.join(ctx.taskDir, "task.md");
-    const title = fs27.existsSync(taskMdPath) ? fs27.readFileSync(taskMdPath, "utf-8").split("\n")[0].slice(0, 50) : ctx.taskId;
+    const taskMdPath = path27.join(ctx.taskDir, "task.md");
+    const title = fs29.existsSync(taskMdPath) ? fs29.readFileSync(taskMdPath, "utf-8").split("\n")[0].slice(0, 50) : ctx.taskId;
     ensureFeatureBranch(ctx.input.issueNumber, title, ctx.projectDir);
     syncWithDefault(ctx.projectDir);
   } catch (err) {
@@ -4315,10 +5308,10 @@ function ensureFeatureBranchIfNeeded(ctx) {
   }
 }
 function acquireLock(taskDir) {
-  const lockPath = path25.join(taskDir, ".lock");
-  if (fs27.existsSync(lockPath)) {
+  const lockPath = path27.join(taskDir, ".lock");
+  if (fs29.existsSync(lockPath)) {
     try {
-      const pid = parseInt(fs27.readFileSync(lockPath, "utf-8").trim(), 10);
+      const pid = parseInt(fs29.readFileSync(lockPath, "utf-8").trim(), 10);
       if (!isNaN(pid)) {
         try {
           process.kill(pid, 0);
@@ -4335,14 +5328,14 @@ function acquireLock(taskDir) {
       logger.warn(`  Corrupt lock file \u2014 overwriting`);
     }
     try {
-      fs27.unlinkSync(lockPath);
+      fs29.unlinkSync(lockPath);
     } catch {
     }
   }
   try {
-    const fd = fs27.openSync(lockPath, fs27.constants.O_WRONLY | fs27.constants.O_CREAT | fs27.constants.O_EXCL);
-    fs27.writeSync(fd, String(process.pid));
-    fs27.closeSync(fd);
+    const fd = fs29.openSync(lockPath, fs29.constants.O_WRONLY | fs29.constants.O_CREAT | fs29.constants.O_EXCL);
+    fs29.writeSync(fd, String(process.pid));
+    fs29.closeSync(fd);
   } catch (err) {
     if (err.code === "EEXIST") {
       throw new Error("Pipeline already running (lock acquired by another process)");
@@ -4352,7 +5345,7 @@ function acquireLock(taskDir) {
 }
 function releaseLock(taskDir) {
   try {
-    fs27.unlinkSync(path25.join(taskDir, ".lock"));
+    fs29.unlinkSync(path27.join(taskDir, ".lock"));
   } catch {
   }
 }
@@ -4441,23 +5434,23 @@ async function runPipelineInner(ctx) {
     writeState(state, ctx.taskDir);
     logger.info(`[${def.name}] starting...`);
     applyPreStageLabel(ctx, def);
-    let result;
+    let result2;
     try {
-      result = await getExecutor(def.name)(ctx, def);
+      result2 = await getExecutor(def.name)(ctx, def);
     } catch (error) {
-      result = {
+      result2 = {
         outcome: "failed",
         retries: 0,
         error: error instanceof Error ? error.message : String(error)
       };
     }
     ciGroupEnd();
-    if (result.outcome === "completed") {
+    if (result2.outcome === "completed") {
       state.stages[def.name] = {
         state: "completed",
         completedAt: (/* @__PURE__ */ new Date()).toISOString(),
-        retries: result.retries,
-        outputFile: result.outputFile
+        retries: result2.retries,
+        outputFile: result2.outputFile
       };
       logger.info(`[${def.name}] \u2713 completed`);
       const detected = autoDetectComplexity(ctx, def);
@@ -4471,16 +5464,16 @@ async function runPipelineInner(ctx) {
       if (gated) return gated;
       commitAfterStage(ctx, def);
     } else {
-      const isTimeout = result.outcome === "timed_out";
+      const isTimeout = result2.outcome === "timed_out";
       state.stages[def.name] = {
         state: isTimeout ? "timeout" : "failed",
-        retries: result.retries,
-        error: isTimeout ? "Stage timed out" : result.error ?? "Stage failed"
+        retries: result2.retries,
+        error: isTimeout ? "Stage timed out" : result2.error ?? "Stage failed"
       };
       state.state = "failed";
       state.sessions = ctx.sessions;
       writeState(state, ctx.taskDir);
-      logger.error(`[${def.name}] ${isTimeout ? "\u23F1 timed out" : `\u2717 failed: ${result.error}`}`);
+      logger.error(`[${def.name}] ${isTimeout ? "\u23F1 timed out" : `\u2717 failed: ${result2.error}`}`);
       if (ctx.input.issueNumber && !ctx.input.local) {
         setLifecycleLabel(ctx.input.issueNumber, "failed");
       }
@@ -4560,8 +5553,8 @@ var init_pipeline = __esm({
 });
 // src/preflight.ts
-import { execFileSync as execFileSync15 } from "child_process";
-import * as fs28 from "fs";
+import { execFileSync as execFileSync16 } from "child_process";
+import * as fs30 from "fs";
 function check(name, fn) {
   try {
     const detail = fn() ?? void 0;
@@ -4573,7 +5566,7 @@ function check(name, fn) {
 function runPreflight() {
   const checks = [
     check("claude CLI", () => {
-      const v = execFileSync15("claude", ["--version"], {
+      const v = execFileSync16("claude", ["--version"], {
         encoding: "utf-8",
         timeout: 1e4,
         stdio: ["pipe", "pipe", "pipe"]
@@ -4581,14 +5574,14 @@ function runPreflight() {
       return v;
     }),
     check("git repo", () => {
-      execFileSync15("git", ["rev-parse", "--is-inside-work-tree"], {
+      execFileSync16("git", ["rev-parse", "--is-inside-work-tree"], {
         encoding: "utf-8",
         timeout: 5e3,
         stdio: ["pipe", "pipe", "pipe"]
       });
     }),
     check("pnpm", () => {
-      const v = execFileSync15("pnpm", ["--version"], {
+      const v = execFileSync16("pnpm", ["--version"], {
         encoding: "utf-8",
         timeout: 5e3,
         stdio: ["pipe", "pipe", "pipe"]
@@ -4596,7 +5589,7 @@ function runPreflight() {
       return v;
     }),
     check("node >= 18", () => {
-      const v = execFileSync15("node", ["--version"], {
+      const v = execFileSync16("node", ["--version"], {
         encoding: "utf-8",
         timeout: 5e3,
         stdio: ["pipe", "pipe", "pipe"]
@@ -4606,7 +5599,7 @@ function runPreflight() {
       return v;
     }),
     check("gh CLI", () => {
-      const v = execFileSync15("gh", ["--version"], {
+      const v = execFileSync16("gh", ["--version"], {
         encoding: "utf-8",
         timeout: 5e3,
         stdio: ["pipe", "pipe", "pipe"]
@@ -4614,7 +5607,7 @@ function runPreflight() {
       return v;
     }),
     check("package.json", () => {
-      if (!fs28.existsSync("package.json")) throw new Error("not found");
+      if (!fs30.existsSync("package.json")) throw new Error("not found");
     })
   ];
   const failed = checks.filter((c) => !c.ok);
@@ -4691,8 +5684,8 @@ var init_args = __esm({
 });
 // src/cli/task-state.ts
-import * as fs29 from "fs";
-import * as path26 from "path";
+import * as fs31 from "fs";
+import * as path28 from "path";
 function resolveTaskAction(issueNumber, existingTaskId, existingState) {
   if (!existingTaskId || !existingState) {
     return { action: "start-fresh", taskId: `${issueNumber}-${generateTaskId()}` };
@@ -4724,11 +5717,11 @@ function resolveTaskAction(issueNumber, existingTaskId, existingState) {
 function resolveForIssue(issueNumber, projectDir) {
   const existingTaskId = findLatestTaskForIssue(issueNumber, projectDir);
   if (existingTaskId) {
-    const statusPath = path26.join(projectDir, ".kody", "tasks", existingTaskId, "status.json");
+    const statusPath = path28.join(projectDir, ".kody", "tasks", existingTaskId, "status.json");
     let existingState = null;
-    if (fs29.existsSync(statusPath)) {
+    if (fs31.existsSync(statusPath)) {
       try {
-        existingState = JSON.parse(fs29.readFileSync(statusPath, "utf-8"));
+        existingState = JSON.parse(fs31.readFileSync(statusPath, "utf-8"));
       } catch {
       }
     }
@@ -4761,12 +5754,12 @@ var resolve_exports = {};
 __export(resolve_exports, {
   runResolve: () => runResolve
 });
-import { execFileSync as execFileSync16 } from "child_process";
+import { execFileSync as execFileSync17 } from "child_process";
 function getConflictContext(cwd, files) {
   const parts = [];
   for (const file of files.slice(0, 10)) {
     try {
-      const content = execFileSync16("git", ["diff", file], {
+      const content = execFileSync17("git", ["diff", file], {
         cwd,
         encoding: "utf-8",
         stdio: ["pipe", "pipe", "pipe"]
@@ -4816,12 +5809,12 @@ async function runResolve(options) {
     extraEnv.ANTHROPIC_BASE_URL = getLitellmUrl();
   }
   logger.info(`  Running agent to resolve conflicts (model=${model})...`);
-  const result = await runner.run("resolve", prompt, model, 3e5, projectDir, {
+  const result2 = await runner.run("resolve", prompt, model, 3e5, projectDir, {
     cwd: projectDir,
     env: extraEnv
   });
-  if (result.outcome !== "completed") {
-    return { outcome: "failed", error: `Agent failed: ${result.error}` };
+  if (result2.outcome !== "completed") {
+    return { outcome: "failed", error: `Agent failed: ${result2.error}` };
   }
   logger.info("  Verifying resolution...");
   const verify = runQualityGates(projectDir, projectDir);
@@ -4885,8 +5878,8 @@ var init_resolve = __esm({
 // src/entry.ts
 var entry_exports = {};
-import * as fs30 from "fs";
-import * as path27 from "path";
+import * as fs32 from "fs";
+import * as path29 from "path";
 async function ensureLitellmProxy(config, projectDir) {
   if (!anyStageNeedsProxy(config)) return null;
   const litellmUrl = getLitellmUrl();
@@ -4931,19 +5924,19 @@ async function runModelHealthCheck(config) {
   }
   const model = config.agent.modelMap.cheap;
   logger.info(`Model health check (${model} via ${usesProxy ? "LiteLLM" : "Anthropic"})...`);
-  const result = await checkModelHealth(baseUrl, apiKey, model);
-  if (result.ok) {
+  const result2 = await checkModelHealth(baseUrl, apiKey, model);
+  if (result2.ok) {
     logger.info("  \u2713 Model responded");
   } else {
-    logger.error(`  \u2717 Model health check failed: ${result.error}`);
+    logger.error(`  \u2717 Model health check failed: ${result2.error}`);
     process.exit(1);
   }
 }
 async function main() {
   const input = parseArgs();
-  const projectDir = input.cwd ? path27.resolve(input.cwd) : process.cwd();
+  const projectDir = input.cwd ? path29.resolve(input.cwd) : process.cwd();
   if (input.cwd) {
-    if (!fs30.existsSync(projectDir)) {
+    if (!fs32.existsSync(projectDir)) {
       console.error(`--cwd path does not exist: ${projectDir}`);
       process.exit(1);
     }
@@ -5009,8 +6002,8 @@ async function main() {
       process.exit(1);
     }
   }
-  const taskDir = path27.join(projectDir, ".kody", "tasks", taskId);
-  fs30.mkdirSync(taskDir, { recursive: true });
+  const taskDir = path29.join(projectDir, ".kody", "tasks", taskId);
+  fs32.mkdirSync(taskDir, { recursive: true });
   if (input.command === "rerun" && isTaskifyRun(taskDir)) {
     const marker = readTaskifyMarker(taskDir);
     if (marker) {
@@ -5075,7 +6068,7 @@ async function main() {
       console.error(`Runner "${defaultRunnerName2}" health check failed`);
       process.exit(1);
     }
-    const result = await runStandaloneReview({
+    const result2 = await runStandaloneReview({
       projectDir,
       runners: runners2,
       prTitle,
@@ -5085,15 +6078,15 @@ async function main() {
       taskId
     });
     if (litellmProcess2) litellmProcess2.kill();
-    if (result.outcome === "failed") {
-      console.error(`Review failed: ${result.error}`);
+    if (result2.outcome === "failed") {
+      console.error(`Review failed: ${result2.error}`);
       process.exit(1);
     }
-    if (result.reviewContent) {
-      console.log(result.reviewContent);
+    if (result2.reviewContent) {
+      console.log(result2.reviewContent);
       if (!input.local && prNumber) {
-        const comment = formatReviewComment(result.reviewContent, taskId);
-        const verdict = detectReviewVerdict(result.reviewContent);
+        const comment = formatReviewComment(result2.reviewContent, taskId);
+        const verdict = detectReviewVerdict(result2.reviewContent);
         const event = verdict === "fail" ? "request-changes" : "approve";
         const posted = submitPRReview(prNumber, comment, event);
         if (!posted) {
@@ -5125,48 +6118,48 @@ async function main() {
       process.exit(1);
     }
     const { runResolve: runResolve2 } = await Promise.resolve().then(() => (init_resolve(), resolve_exports));
-    const result = await runResolve2({
+    const result2 = await runResolve2({
       prNumber: input.prNumber,
       projectDir,
       runners: runners2,
       local: input.local ?? true
     });
     if (litellmProcess2) litellmProcess2.kill();
-    if (result.outcome === "failed") {
-      console.error(`Resolve failed: ${result.error}`);
+    if (result2.outcome === "failed") {
+      console.error(`Resolve failed: ${result2.error}`);
       process.exit(1);
     }
-    console.log(`Resolve: ${result.outcome}`);
+    console.log(`Resolve: ${result2.outcome}`);
     process.exit(0);
   }
   logger.info("Preflight checks:");
   runPreflight();
   if (input.task) {
-    fs30.writeFileSync(path27.join(taskDir, "task.md"), input.task);
+    fs32.writeFileSync(path29.join(taskDir, "task.md"), input.task);
   }
-  const taskMdPath = path27.join(taskDir, "task.md");
-  if (!fs30.existsSync(taskMdPath) && isPRFix && input.prNumber) {
+  const taskMdPath = path29.join(taskDir, "task.md");
+  if (!fs32.existsSync(taskMdPath) && isPRFix && input.prNumber) {
     logger.info(`Fetching PR #${input.prNumber} details as task context...`);
     const prDetails = getPRDetails(input.prNumber);
     if (prDetails) {
       const taskContent = `# ${prDetails.title}
 ${prDetails.body ?? ""}`;
-      fs30.writeFileSync(taskMdPath, taskContent);
+      fs32.writeFileSync(taskMdPath, taskContent);
       logger.info(`  Task loaded from PR #${input.prNumber}: ${prDetails.title}`);
     }
-  } else if (!fs30.existsSync(taskMdPath) && input.issueNumber) {
+  } else if (!fs32.existsSync(taskMdPath) && input.issueNumber) {
     logger.info(`Fetching issue #${input.issueNumber} body as task...`);
     const issue = getIssue(input.issueNumber);
     if (issue) {
       const taskContent = `# ${issue.title}
 ${issue.body ?? ""}`;
-      fs30.writeFileSync(taskMdPath, taskContent);
+      fs32.writeFileSync(taskMdPath, taskContent);
       logger.info(`  Task loaded from issue #${input.issueNumber}: ${issue.title}`);
     }
   }
-  if (!fs30.existsSync(taskMdPath)) {
+  if (!fs32.existsSync(taskMdPath)) {
     console.error("No task.md found. Provide --task, --issue-number, or ensure .kody/tasks/<id>/task.md exists.");
     process.exit(1);
   }
@@ -5304,7 +6297,7 @@ To rerun: \`@kody rerun ${taskId} --from <stage>\``
     }
   }
   const state = await runPipeline(ctx);
-  const files = fs30.readdirSync(taskDir);
+  const files = fs32.readdirSync(taskDir);
   console.log(`
 Artifacts in ${taskDir}:`);
   for (const f of files) {
@@ -5369,8 +6362,8 @@ var init_entry = __esm({
 });
 // src/bin/cli.ts
-import * as fs31 from "fs";
-import * as path28 from "path";
+import * as fs33 from "fs";
+import * as path30 from "path";
 import { fileURLToPath as fileURLToPath2 } from "url";
 // src/bin/commands/init.ts
@@ -5750,7 +6743,7 @@ import { execFileSync as execFileSync5 } from "child_process";
 import * as fs5 from "fs";
 import * as path4 from "path";
 function discoverQaContext(cwd) {
-  const result = {
+  const result2 = {
     routes: [],
     authFiles: [],
     loginPage: null,
@@ -5763,21 +6756,21 @@ function discoverQaContext(cwd) {
     const pkg = JSON.parse(fs5.readFileSync(path4.join(cwd, "package.json"), "utf-8"));
     const allDeps = { ...pkg.dependencies, ...pkg.devDependencies };
     const pm = fs5.existsSync(path4.join(cwd, "pnpm-lock.yaml")) ? "pnpm" : fs5.existsSync(path4.join(cwd, "yarn.lock")) ? "yarn" : "npm";
-    if (pkg.scripts?.dev) result.devCommand = `${pm} dev`;
-    if (allDeps.next || allDeps.nuxt) result.devPort = 3e3;
-    else if (allDeps.vite) result.devPort = 5173;
+    if (pkg.scripts?.dev) result2.devCommand = `${pm} dev`;
+    if (allDeps.next || allDeps.nuxt) result2.devPort = 3e3;
+    else if (allDeps.vite) result2.devPort = 5173;
   } catch {
   }
   const appDirs = ["src/app", "app"];
   for (const appDir of appDirs) {
     const fullAppDir = path4.join(cwd, appDir);
     if (!fs5.existsSync(fullAppDir)) continue;
-    scanRoutes(fullAppDir, appDir, "", result);
+    scanRoutes(fullAppDir, appDir, "", result2);
     break;
   }
   const authPatterns = ["middleware.ts", "middleware.js", "src/middleware.ts", "src/middleware.js"];
   for (const p of authPatterns) {
-    if (fs5.existsSync(path4.join(cwd, p))) result.authFiles.push(p);
+    if (fs5.existsSync(path4.join(cwd, p))) result2.authFiles.push(p);
   }
   const authConfigGlobs = [
     "src/app/api/auth",
@@ -5788,7 +6781,7 @@ function discoverQaContext(cwd) {
     "src/app/api/oauth"
   ];
   for (const g of authConfigGlobs) {
-    if (fs5.existsSync(path4.join(cwd, g))) result.authFiles.push(g);
+    if (fs5.existsSync(path4.join(cwd, g))) result2.authFiles.push(g);
   }
   try {
     const rolePaths = [
@@ -5810,7 +6803,7 @@ function discoverQaContext(cwd) {
           if (roleMatches) {
             for (const m of roleMatches) {
               const val = m.match(/['"](\w+)['"]/);
-              if (val && !result.roles.includes(val[1])) result.roles.push(val[1]);
+              if (val && !result2.roles.includes(val[1])) result2.roles.push(val[1]);
             }
           }
           const enumMatch = content.match(/(?:enum|type)\s+\w*[Rr]ole\w*\s*[={]([^}]+)/s);
@@ -5819,7 +6812,7 @@ function discoverQaContext(cwd) {
             if (vals) {
               for (const v of vals) {
                 const clean = v.replace(/['"]/g, "");
-                if (!result.roles.includes(clean)) result.roles.push(clean);
+                if (!result2.roles.includes(clean)) result2.roles.push(clean);
               }
             }
           }
@@ -5829,9 +6822,9 @@ function discoverQaContext(cwd) {
     }
   } catch {
   }
-  return result;
+  return result2;
 }
-function scanRoutes(dir, baseDir, prefix, result) {
+function scanRoutes(dir, baseDir, prefix, result2) {
   let entries;
   try {
     entries = fs5.readdirSync(dir, { withFileTypes: true });
@@ -5842,16 +6835,16 @@ function scanRoutes(dir, baseDir, prefix, result) {
   if (hasPage) {
     const routePath = prefix || "/";
     const group = prefix.startsWith("/admin") ? "admin" : prefix.includes("/login") ? "auth" : prefix.includes("/signup") ? "auth" : prefix.includes("/api") ? "api" : "frontend";
-    result.routes.push({ path: routePath, group });
-    if (prefix.includes("/login")) result.loginPage = routePath;
-    if (prefix.startsWith("/admin") && !result.adminPath) result.adminPath = prefix;
+    result2.routes.push({ path: routePath, group });
+    if (prefix.includes("/login")) result2.loginPage = routePath;
+    if (prefix.startsWith("/admin") && !result2.adminPath) result2.adminPath = prefix;
   }
   for (const entry of entries) {
     if (!entry.isDirectory()) continue;
     if (entry.name === "node_modules" || entry.name === ".next") continue;
     let segment = entry.name;
     if (segment.startsWith("(") && segment.endsWith(")")) {
-      scanRoutes(path4.join(dir, entry.name), baseDir, prefix, result);
+      scanRoutes(path4.join(dir, entry.name), baseDir, prefix, result2);
       continue;
     }
     if (segment.startsWith("[") && segment.endsWith("]")) {
@@ -5860,7 +6853,7 @@ function scanRoutes(dir, baseDir, prefix, result) {
     if (segment.startsWith("[[") && segment.endsWith("]]")) {
       segment = `:${segment.slice(2, -2)}?`;
     }
-    scanRoutes(path4.join(dir, entry.name), baseDir, `${prefix}/${segment}`, result);
+    scanRoutes(path4.join(dir, entry.name), baseDir, `${prefix}/${segment}`, result2);
   }
 }
 function generateQaGuide(discovery) {
@@ -6544,11 +7537,11 @@ Create it manually.`, cwd);
 // src/bin/cli.ts
 init_architecture_detection();
-var __dirname2 = path28.dirname(fileURLToPath2(import.meta.url));
-var PKG_ROOT = path28.resolve(__dirname2, "..", "..");
+var __dirname2 = path30.dirname(fileURLToPath2(import.meta.url));
+var PKG_ROOT = path30.resolve(__dirname2, "..", "..");
 function getVersion() {
-  const pkgPath = path28.join(PKG_ROOT, "package.json");
-  const pkg = JSON.parse(fs31.readFileSync(pkgPath, "utf-8"));
+  const pkgPath = path30.join(PKG_ROOT, "package.json");
+  const pkg = JSON.parse(fs33.readFileSync(pkgPath, "utf-8"));
   return pkg.version;
 }
 var args = process.argv.slice(2);
@@ -6559,6 +7552,8 @@ if (command === "init") {
   bootstrapCommand({ force: args.includes("--force") }, PKG_ROOT);
 } else if (command === "taskify") {
   Promise.resolve().then(() => (init_taskify_command(), taskify_command_exports)).then(({ runTaskifyCommand: runTaskifyCommand2 }) => runTaskifyCommand2());
+} else if (command === "test-model") {
+  Promise.resolve().then(() => (init_test_model_command(), test_model_command_exports)).then(({ runTestModelCommand: runTestModelCommand2 }) => runTestModelCommand2());
 } else if (command === "ci-parse") {
   Promise.resolve().then(() => (init_parse_inputs(), parse_inputs_exports)).then(({ runCiParse: runCiParse2 }) => runCiParse2());
 } else if (command === "version" || command === "--version" || command === "-v") {