npm - jinzd-ai-cli - Versions diffs - 0.4.67 → 0.4.69 - Mend

jinzd-ai-cli 0.4.67 → 0.4.69

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11)

package/dist/{chunk-XSIVGDCN.js → chunk-3IZATQV5.js} RENAMED Viewed

@@ -8,7 +8,7 @@ import {
   RateLimitError,
   schemaToJsonSchema,
   truncateForPersist
-} from "./chunk-BVLQ3FRA.js";
+} from "./chunk-ZKHLLGUU.js";
 import {
   APP_NAME,
   CONFIG_DIR_NAME,
@@ -21,7 +21,7 @@ import {
   MCP_TOOL_PREFIX,
   PLUGINS_DIR_NAME,
   VERSION
-} from "./chunk-F44OKMB2.js";
+} from "./chunk-APJHOYCH.js";
 // src/config/config-manager.ts
 import { readFileSync, writeFileSync, existsSync, mkdirSync } from "fs";
@@ -191,7 +191,27 @@ var ConfigSchema = z.object({
   // 插件以完整 Node.js 权限在主进程中执行（可读写文件、访问网络、执行命令），
   // 必须确认插件来源可信后，再设为 true 启用。
   // 可通过 /config 命令或直接编辑 ~/.aicli/config.json 开启。
-  allowPlugins: z.boolean().default(false)
+  allowPlugins: z.boolean().default(false),
+  // 智能模型路由（v0.4.68+）
+  // 按用户每轮输入的内容/标签/长度动态选择模型，在同一 provider 内切换，
+  // 例：短问题走 haiku（省钱），planning 走 opus（质量）。
+  // enabled=false 时永远返回当前模型。rules 按顺序匹配，首个命中的规则生效。
+  // 每个 rule 的 match 必须至少有一个条件（tag/contains/maxLength/minLength）。
+  // 详见 src/core/model-router.ts。
+  routing: z.object({
+    enabled: z.boolean().default(false),
+    rules: z.array(z.object({
+      match: z.object({
+        contains: z.array(z.string()).optional(),
+        maxLength: z.number().int().positive().optional(),
+        minLength: z.number().int().positive().optional(),
+        tag: z.string().optional()
+      }),
+      model: z.string(),
+      name: z.string().optional()
+    })).default([]),
+    fallback: z.string().optional()
+  }).default({ enabled: false, rules: [] })
 });
 // src/config/config-manager.ts

package/dist/{chunk-F44OKMB2.js → chunk-APJHOYCH.js} RENAMED Viewed

@@ -8,7 +8,7 @@ import { platform } from "os";
 import chalk from "chalk";
 // src/core/constants.ts
-var VERSION = "0.4.67";
+var VERSION = "0.4.69";
 var APP_NAME = "ai-cli";
 var CONFIG_DIR_NAME = ".aicli";
 var CONFIG_FILE_NAME = "config.json";

package/dist/{chunk-X7NVAEFI.js → chunk-IJIU46TF.js} RENAMED Viewed

@@ -6,7 +6,7 @@ import { platform } from "os";
 import chalk from "chalk";
 // src/core/constants.ts
-var VERSION = "0.4.67";
+var VERSION = "0.4.69";
 var APP_NAME = "ai-cli";
 var CONFIG_DIR_NAME = ".aicli";
 var CONFIG_FILE_NAME = "config.json";

package/dist/{chunk-BVLQ3FRA.js → chunk-ZKHLLGUU.js} RENAMED Viewed

@@ -10,7 +10,7 @@ import {
   SUBAGENT_DEFAULT_MAX_ROUNDS,
   SUBAGENT_MAX_ROUNDS_LIMIT,
   runTestsTool
-} from "./chunk-F44OKMB2.js";
+} from "./chunk-APJHOYCH.js";
 // src/tools/builtin/bash.ts
 import { execSync } from "child_process";
@@ -1839,16 +1839,123 @@ function findWhitespaceTolerant(fileLines, searchLines) {
   }
   return { matchStart, matchCount };
 }
+/**
+ * Apply one string replacement to `content` in memory and report the outcome.
+ *
+ * Nothing is written to disk here, and this function itself contains no
+ * `throw`: failures are reported through the returned object.
+ *
+ * Modes, checked in this order:
+ *  - options.ignoreWhitespace: line-based match via findWhitespaceTolerant; the
+ *    match must be unique. Wins over replaceAll when both flags are set.
+ *  - options.replaceAll: every exact occurrence of oldStr is replaced.
+ *  - default: oldStr must occur exactly once.
+ *
+ * @param content  Full text to edit.
+ * @param oldStr   Text to find; an empty string is rejected.
+ * @param newStr   Replacement text.
+ * @param options  Optional { ignoreWhitespace, replaceAll } flags.
+ * @returns { ok: true, content, info: { mode, replacedCount, lineNumber? } } on
+ *          success, or { ok: false, error } on failure.
+ */
+function applyReplace(content, oldStr, newStr, options = {}) {
+  if (oldStr === "") {
+    return { ok: false, error: "old_str cannot be empty" };
+  }
+  if (options.ignoreWhitespace) {
+    const fileLines = content.split("\n");
+    const searchLines = oldStr.split("\n");
+    const { matchStart, matchCount } = findWhitespaceTolerant(fileLines, searchLines);
+    if (matchStart === -1) {
+      const similar = findSimilarLines(content, oldStr);
+      const hint = similar.length > 0 ? `
+Similar lines found (did you mean?):
+${similar.join("\n")}` : "";
+      return {
+        ok: false,
+        error: `old_str not found in file (even with whitespace ignored). File has ${fileLines.length} lines.${hint}`
+      };
+    }
+    if (matchCount > 1) {
+      return {
+        ok: false,
+        error: "old_str matches multiple locations with whitespace-tolerant matching. Please include more surrounding context to make it unique."
+      };
+    }
+    // Swap the matched line range for newStr; matchStart is used as a 0-based
+    // index into fileLines, so the reported line number is matchStart + 1.
+    const before = fileLines.slice(0, matchStart);
+    const after = fileLines.slice(matchStart + searchLines.length);
+    const updated2 = [...before, newStr, ...after].join("\n");
+    return {
+      ok: true,
+      content: updated2,
+      info: { mode: "ignore_whitespace", replacedCount: 1, lineNumber: matchStart + 1 }
+    };
+  }
+  if (options.replaceAll) {
+    // split() yields one more piece than there are occurrences of oldStr.
+    const occurrences = content.split(oldStr).length - 1;
+    if (occurrences === 0) {
+      const similar = findSimilarLines(content, oldStr);
+      const hint = similar.length > 0 ? `
+Similar lines found (did you mean?):
+${similar.join("\n")}` : "";
+      return { ok: false, error: `old_str not found in file.${hint}` };
+    }
+    const updated2 = content.split(oldStr).join(newStr);
+    return {
+      ok: true,
+      content: updated2,
+      info: { mode: "replace_all", replacedCount: occurrences }
+    };
+  }
+  const firstIndex = content.indexOf(oldStr);
+  if (firstIndex === -1) {
+    const lines = content.split("\n");
+    const similar = findSimilarLines(content, oldStr);
+    const hint = similar.length > 0 ? `
+Similar lines found (did you mean?):
+${similar.join("\n")}` : "";
+    return {
+      ok: false,
+      error: `old_str not found in file. File has ${lines.length} lines.${hint}
+Tip: try ignore_whitespace: true if indentation differs.`
+    };
+  }
+  // Searching from firstIndex + 1 also catches a repeat that overlaps the first match.
+  const secondIndex = content.indexOf(oldStr, firstIndex + 1);
+  if (secondIndex !== -1) {
+    return {
+      ok: false,
+      error: `old_str appears multiple times in file (at positions ${firstIndex} and ${secondIndex}). Please include more surrounding context to make it unique, or set replace_all: true.`
+    };
+  }
+  const updated = content.slice(0, firstIndex) + newStr + content.slice(firstIndex + oldStr.length);
+  // The line count of the prefix equals the 1-based line on which the match starts.
+  const linesBefore = content.slice(0, firstIndex).split("\n").length;
+  return {
+    ok: true,
+    content: updated,
+    info: { mode: "exact", replacedCount: 1, lineNumber: linesBefore }
+  };
+}
+/**
+ * Validate and normalize the raw `edits` argument of the edit_file tool.
+ *
+ * @param raw  Untrusted value supplied as `edits`.
+ * @returns Array of { old_str, new_str, ignore_whitespace, replace_all } with
+ *          new_str defaulting to "" and both flags coerced to booleans.
+ * @throws ToolError when raw is not an array, is empty, has more than 200
+ *         entries, or an entry is not an object / has a non-string old_str /
+ *         has a new_str that is present but not a string.
+ */
+function parseEditsArg(raw) {
+  if (!Array.isArray(raw)) {
+    throw new ToolError("edit_file", "edits must be an array of { old_str, new_str } objects");
+  }
+  if (raw.length === 0) {
+    throw new ToolError("edit_file", "edits array is empty \u2014 provide at least one edit");
+  }
+  if (raw.length > 200) {
+    throw new ToolError("edit_file", `edits array too large (${raw.length}) \u2014 max 200 per call`);
+  }
+  return raw.map((e, i) => {
+    // `== null` rejects both null and undefined entries.
+    if (e == null || typeof e !== "object") {
+      throw new ToolError("edit_file", `edits[${i}] must be an object`);
+    }
+    const rec = e;
+    if (typeof rec.old_str !== "string") {
+      throw new ToolError("edit_file", `edits[${i}].old_str must be a string`);
+    }
+    if (rec.new_str !== void 0 && typeof rec.new_str !== "string") {
+      throw new ToolError("edit_file", `edits[${i}].new_str must be a string`);
+    }
+    // NOTE(review): Boolean() treats any truthy value as true, so the string
+    // "false" would switch a flag on — confirm callers only send real booleans.
+    return {
+      old_str: rec.old_str,
+      new_str: String(rec.new_str ?? ""),
+      ignore_whitespace: Boolean(rec.ignore_whitespace),
+      replace_all: Boolean(rec.replace_all)
+    };
+  });
+}
 var editFileTool = {
   definition: {
     name: "edit_file",
-    description: `Precisely edit file contents. Supports three modes:
-1. String replace (most common): Provide old_str and new_str to replace an exact match. old_str must appear exactly once in the file (unless replace_all is true).
-2. Line insert: Provide insert_after_line (1-based line number) and insert_content to insert after that line.
-3. Line delete: Provide delete_from_line and delete_to_line (inclusive) to delete that range.
-Optional ignore_whitespace: true to match ignoring indentation differences.
-Optional replace_all: true to replace ALL occurrences of old_str in the file at once (saves tool rounds when renaming variables/functions).
-Note: Path can be absolute or relative to the current working directory.`,
+    description: `Precisely edit file contents. Four modes:
+1. String replace (most common): Provide old_str and new_str to replace an exact match. old_str must appear exactly once (unless replace_all is true).
+2. Line insert: Provide insert_after_line (1-based) and insert_content.
+3. Line delete: Provide delete_from_line and delete_to_line (inclusive).
+4. Batch edits: Provide edits=[{old_str, new_str, ignore_whitespace?, replace_all?}, ...] to apply MULTIPLE edits in ONE call \u2014 saves tool rounds/tokens when refactoring a file. Edits are applied sequentially in-memory; by default any failure rolls back ALL edits (set stop_on_error=false to apply successful ones and report failures).
+Optional ignore_whitespace: true ignores indentation differences during matching.
+Optional replace_all: true replaces ALL occurrences of old_str.
+Note: Path can be absolute or relative to cwd.`,
     parameters: {
       path: {
         type: "string",
@@ -1857,22 +1964,22 @@ Note: Path can be absolute or relative to the current working directory.`,
       },
       old_str: {
         type: "string",
-        description: "[Replace mode] Original string to replace, must appear exactly once (include enough context for uniqueness)",
+        description: "[Single-replace mode] Original string to replace, must appear exactly once (include enough context for uniqueness)",
         required: false
       },
       new_str: {
         type: "string",
-        description: "[Replace mode] New replacement string, can be empty to delete old_str",
+        description: "[Single-replace mode] New replacement string, can be empty to delete old_str",
         required: false
       },
       ignore_whitespace: {
         type: "boolean",
-        description: "[Replace mode] Whether to ignore leading/trailing whitespace per line when matching, defaults to false",
+        description: "[Single-replace mode] Whether to ignore leading/trailing whitespace per line when matching, defaults to false",
         required: false
       },
       replace_all: {
         type: "boolean",
-        description: "[Replace mode] Replace ALL occurrences of old_str instead of requiring unique match. Useful for renaming variables/functions across the file in one call.",
+        description: "[Single-replace mode] Replace ALL occurrences of old_str instead of requiring unique match. Useful for renaming variables/functions across the file in one call.",
         required: false
       },
       insert_after_line: {
@@ -1895,6 +2002,16 @@ Note: Path can be absolute or relative to the current working directory.`,
         description: "[Delete mode] Delete up to and including this line (1-based)",
         required: false
       },
+      edits: {
+        type: "array",
+        description: "[Batch mode] Array of {old_str, new_str, ignore_whitespace?, replace_all?} objects. Each applied sequentially to the in-memory content. Max 200 per call.",
+        required: false
+      },
+      stop_on_error: {
+        type: "boolean",
+        description: "[Batch mode] If true (default), any failing edit rolls back the whole batch and writes nothing. If false, successful edits are written and failed ones are reported.",
+        required: false
+      },
       encoding: {
         type: "string",
         description: "File encoding, defaults to utf-8",
@@ -1910,83 +2027,84 @@ Note: Path can be absolute or relative to the current working directory.`,
     if (!filePath) throw new ToolError("edit_file", "path is required");
     if (!existsSync5(filePath)) throw new ToolError("edit_file", `File not found: ${filePath}`);
     const original = readFileSync4(filePath, encoding);
+    if (args["edits"] !== void 0) {
+      const edits = parseEditsArg(args["edits"]);
+      const stopOnError = args["stop_on_error"] !== false;
+      let working = original;
+      const reports = [];
+      let appliedCount = 0;
+      for (let i = 0; i < edits.length; i++) {
+        const edit = edits[i];
+        const res = applyReplace(working, edit.old_str, edit.new_str, {
+          ignoreWhitespace: edit.ignore_whitespace,
+          replaceAll: edit.replace_all
+        });
+        if (res.ok) {
+          working = res.content;
+          appliedCount++;
+          reports.push({
+            index: i,
+            ok: true,
+            summary: `${res.info?.mode} at ${res.info?.lineNumber != null ? `line ${res.info.lineNumber}` : `${res.info?.replacedCount} occurrence(s)`}: ${truncatePreview(edit.old_str)} \u2192 ${truncatePreview(edit.new_str)}`
+          });
+        } else {
+          reports.push({ index: i, ok: false, error: res.error });
+          if (stopOnError) break;
+        }
+      }
+      const anyFailed = reports.some((r) => !r.ok);
+      const writeChanges = appliedCount > 0 && !(anyFailed && stopOnError);
+      if (writeChanges) {
+        undoStack.push(filePath, `edit_file (batch ${appliedCount}/${edits.length}): ${filePath}`);
+        fileCheckpoints.snapshot(filePath, ToolExecutor.currentMessageIndex);
+        writeFileSync3(filePath, working, encoding);
+      }
+      const lines = [];
+      if (anyFailed && stopOnError) {
+        lines.push(`ERROR: Batch edit aborted \u2014 ${appliedCount}/${edits.length} applied, then edit #${appliedCount} failed. No changes written (stop_on_error=true).`);
+      } else if (anyFailed) {
+        lines.push(`Partial success: ${appliedCount}/${edits.length} edits applied to ${filePath} (stop_on_error=false).`);
+      } else {
+        lines.push(`Successfully applied ${appliedCount}/${edits.length} edit(s) to ${filePath}.`);
+      }
+      lines.push("");
+      for (const r of reports) {
+        if (r.ok) {
+          lines.push(`  \u2713 #${r.index + 1}: ${r.summary}`);
+        } else {
+          lines.push(`  \u2717 #${r.index + 1}: ${r.error}`);
+        }
+      }
+      return lines.join("\n");
+    }
     if (args["old_str"] !== void 0) {
       const oldStr = String(args["old_str"]);
       const newStr = String(args["new_str"] ?? "");
       const ignoreWs = Boolean(args["ignore_whitespace"]);
       const replaceAll = Boolean(args["replace_all"]);
       if (oldStr === "") throw new ToolError("edit_file", "old_str cannot be empty");
-      if (ignoreWs) {
-        const fileLines = original.split("\n");
-        const searchLines = oldStr.split("\n");
-        const { matchStart, matchCount } = findWhitespaceTolerant(fileLines, searchLines);
-        if (matchStart === -1) {
-          const similar = findSimilarLines(original, oldStr);
-          const hint = similar.length > 0 ? `
-Similar lines found (did you mean?):
-${similar.join("\n")}` : "";
-          return `ERROR: old_str not found in file (even with whitespace ignored).
-File has ${fileLines.length} lines.${hint}
+      const res = applyReplace(original, oldStr, newStr, {
+        ignoreWhitespace: ignoreWs,
+        replaceAll
+      });
+      if (!res.ok) {
+        return `ERROR: ${res.error}
 Please read the file first and use exact text.`;
-        }
-        if (matchCount > 1) {
-          return `ERROR: old_str matches multiple locations with whitespace-tolerant matching. Please include more surrounding context to make it unique.`;
-        }
-        undoStack.push(filePath, `edit_file (ws-replace): ${filePath}`);
-        fileCheckpoints.snapshot(filePath, ToolExecutor.currentMessageIndex);
-        const before = fileLines.slice(0, matchStart);
-        const after = fileLines.slice(matchStart + searchLines.length);
-        const updated2 = [...before, newStr, ...after].join("\n");
-        writeFileSync3(filePath, updated2, encoding);
-        return `Successfully edited ${filePath} (whitespace-tolerant match)
-  Location: around line ${matchStart + 1}
-  Replaced: ${searchLines.length} line(s) \u2192 ${newStr.split("\n").length} line(s)
-  Old: ${truncatePreview(oldStr)}
-  New: ${truncatePreview(newStr)}`;
       }
-      if (replaceAll) {
-        const occurrences = original.split(oldStr).length - 1;
-        if (occurrences === 0) {
-          const similar = findSimilarLines(original, oldStr);
-          const hint = similar.length > 0 ? `
-Similar lines found (did you mean?):
-${similar.join("\n")}` : "";
-          return `ERROR: old_str not found in file.${hint}
-Please read the file first and use exact text.`;
-        }
-        undoStack.push(filePath, `edit_file (replace_all): ${filePath}`);
-        fileCheckpoints.snapshot(filePath, ToolExecutor.currentMessageIndex);
-        const updated2 = original.split(oldStr).join(newStr);
-        writeFileSync3(filePath, updated2, encoding);
-        return `Successfully edited ${filePath} (replace_all)
-  Replaced: ${occurrences} occurrence(s) of ${truncatePreview(oldStr)}
+      const modeLabel = res.info?.mode === "ignore_whitespace" ? " (whitespace-tolerant match)" : res.info?.mode === "replace_all" ? " (replace_all)" : "";
+      const label = res.info?.mode === "ignore_whitespace" ? "edit_file (ws-replace)" : res.info?.mode === "replace_all" ? "edit_file (replace_all)" : "edit_file (replace)";
+      undoStack.push(filePath, `${label}: ${filePath}`);
+      fileCheckpoints.snapshot(filePath, ToolExecutor.currentMessageIndex);
+      writeFileSync3(filePath, res.content, encoding);
+      if (res.info?.mode === "replace_all") {
+        return `Successfully edited ${filePath}${modeLabel}
+  Replaced: ${res.info.replacedCount} occurrence(s) of ${truncatePreview(oldStr)}
   With: ${truncatePreview(newStr)}`;
       }
-      const firstIndex = original.indexOf(oldStr);
-      if (firstIndex === -1) {
-        const lines = original.split("\n");
-        const similar = findSimilarLines(original, oldStr);
-        const hint = similar.length > 0 ? `
-Similar lines found (did you mean?):
-${similar.join("\n")}` : "";
-        return `ERROR: old_str not found in file.
-File has ${lines.length} lines.${hint}
-Please read the file first and use exact text including whitespace/indentation.
-Tip: You can also try ignore_whitespace: true to match ignoring indentation differences.`;
-      }
-      const secondIndex = original.indexOf(oldStr, firstIndex + 1);
-      if (secondIndex !== -1) {
-        return `ERROR: old_str appears multiple times in file (at least at positions ${firstIndex} and ${secondIndex}). Please include more surrounding context to make it unique.`;
-      }
-      undoStack.push(filePath, `edit_file (replace): ${filePath}`);
-      fileCheckpoints.snapshot(filePath, ToolExecutor.currentMessageIndex);
-      const updated = original.slice(0, firstIndex) + newStr + original.slice(firstIndex + oldStr.length);
-      writeFileSync3(filePath, updated, encoding);
       const oldLines = oldStr.split("\n").length;
       const newLines = newStr.split("\n").length;
-      const linesBefore = original.slice(0, firstIndex).split("\n").length;
-      return `Successfully edited ${filePath}
-  Location: around line ${linesBefore}
+      return `Successfully edited ${filePath}${modeLabel}
+  Location: around line ${res.info?.lineNumber ?? "?"}
   Replaced: ${oldLines} line(s) \u2192 ${newLines} line(s)
   Old: ${truncatePreview(oldStr)}
   New: ${truncatePreview(newStr)}`;
@@ -2022,7 +2140,7 @@ Tip: You can also try ignore_whitespace: true to match ignoring indentation diff
     }
     throw new ToolError(
       "edit_file",
-      "No operation specified. Provide either: (old_str + new_str) for replace, (insert_after_line + insert_content) for insert, or (delete_from_line + delete_to_line) for delete."
+      "No operation specified. Provide one of: (old_str + new_str), (insert_after_line + insert_content), (delete_from_line + delete_to_line), or edits=[...]."
     );
   }
 };

package/dist/{hub-RGK325NQ.js → hub-H3OSDWZW.js} RENAMED Viewed

@@ -385,7 +385,7 @@ ${content}`);
   }
 }
 async function runTaskMode(config, providers, configManager, topic) {
-  const { TaskOrchestrator } = await import("./task-orchestrator-4PVBMQJ7.js");
+  const { TaskOrchestrator } = await import("./task-orchestrator-AZPMRFET.js");
   const orchestrator = new TaskOrchestrator(config, providers, configManager);
   let interrupted = false;
   const onSigint = () => {

package/dist/index.js CHANGED Viewed

@@ -31,7 +31,7 @@ import {
   saveDevState,
   sessionHasMeaningfulContent,
   setupProxy
-} from "./chunk-XSIVGDCN.js";
+} from "./chunk-3IZATQV5.js";
 import {
   ToolExecutor,
   ToolRegistry,
@@ -47,7 +47,7 @@ import {
   spawnAgentContext,
   theme,
   undoStack
-} from "./chunk-BVLQ3FRA.js";
+} from "./chunk-ZKHLLGUU.js";
 import {
   fileCheckpoints
 } from "./chunk-4BKXL7SM.js";
@@ -72,7 +72,7 @@ import {
   SKILLS_DIR_NAME,
   VERSION,
   buildUserIdentityPrompt
-} from "./chunk-F44OKMB2.js";
+} from "./chunk-APJHOYCH.js";
 // src/index.ts
 import { program } from "commander";
@@ -1075,6 +1075,79 @@ function createDefaultCommands() {
         );
       }
     },
+    // `/route` slash command: toggles smart model routing, prints the configured
+    // rules, or dry-runs the routing decision for a sample message.
+    {
+      name: "route",
+      description: "Smart model routing \u2014 enable/disable or inspect routing rules",
+      usage: "/route [on|off|show|test <message>]",
+      async execute(args, ctx) {
+        // With no argument the command behaves like `/route show`.
+        const sub = (args[0] ?? "show").toLowerCase();
+        // Read once up front; the on/off branches below still see this
+        // pre-update snapshot when they inspect the rules.
+        const routing = ctx.config.get("routing");
+        if (sub === "on" || sub === "enable") {
+          // NOTE(review): the flag is passed as the string "true"; presumably
+          // setByPath parses string values — confirm.
+          ctx.config.setByPath("routing.enabled", "true");
+          ctx.renderer.printSuccess("Smart model routing enabled.");
+          if (!routing || routing.rules.length === 0) {
+            ctx.renderer.printInfo(
+              'No rules configured yet. Add rules under `routing.rules` in ~/.aicli/config.json.\nExample: { match: { tag: "fast" }, model: "claude-haiku-4-5" }'
+            );
+          }
+          return;
+        }
+        if (sub === "off" || sub === "disable") {
+          ctx.config.setByPath("routing.enabled", "false");
+          ctx.renderer.printSuccess("Smart model routing disabled.");
+          return;
+        }
+        if (sub === "test") {
+          // Everything after "test" is treated as the sample message.
+          const msg = args.slice(1).join(" ").trim();
+          if (!msg) {
+            console.log(theme.warning("  Usage: /route test <message>"));
+            return;
+          }
+          // This branch only computes and prints the decision.
+          const decision = ctx.computeRoutingDecision(msg);
+          const marker = decision.overridden ? theme.accent("\u2192 ROUTED") : theme.dim("(unchanged)");
+          console.log();
+          console.log(`  Input:    ${theme.dim(msg)}`);
+          console.log(`  Current:  ${theme.info(ctx.getCurrentModel())}`);
+          console.log(`  Decision: ${theme.info(decision.model)}  ${marker}`);
+          console.log(`  Reason:   ${theme.dim(decision.reason)}`);
+          // ruleIdx is printed as-is, using the same #index numbering as the
+          // rule list in the `show` branch.
+          if (typeof decision.ruleIdx === "number") {
+            console.log(`  Rule:     #${decision.ruleIdx}`);
+          }
+          console.log();
+          return;
+        }
+        if (sub === "show" || sub === "status") {
+          console.log();
+          console.log(`  ${theme.heading("Smart Model Routing")}`);
+          console.log(`  Status:   ${routing?.enabled ? theme.success("enabled") : theme.dim("disabled")}`);
+          console.log(`  Provider: ${theme.info(ctx.getCurrentProvider())}`);
+          console.log(`  Current:  ${theme.info(ctx.getCurrentModel())}`);
+          if (routing?.fallback) {
+            console.log(`  Fallback: ${theme.info(routing.fallback)}`);
+          }
+          console.log();
+          if (!routing || routing.rules.length === 0) {
+            console.log(`  ${theme.dim("(no rules configured \u2014 edit ~/.aicli/config.json `routing.rules`)")}`);
+          } else {
+            console.log(`  ${theme.heading("Rules")} ${theme.dim(`(evaluated top-to-bottom)`)}:`);
+            routing.rules.forEach((r, i) => {
+              // Build a short "cond & cond" summary of the rule's match clause.
+              const parts = [];
+              if (r.match.tag) parts.push(`tag=#${r.match.tag}`);
+              // Only the first three keywords are listed; an ellipsis marks the rest.
+              if (r.match.contains && r.match.contains.length > 0) parts.push(`contains=[${r.match.contains.slice(0, 3).join(", ")}${r.match.contains.length > 3 ? ", \u2026" : ""}]`);
+              if (typeof r.match.maxLength === "number") parts.push(`maxLen=${r.match.maxLength}`);
+              if (typeof r.match.minLength === "number") parts.push(`minLen=${r.match.minLength}`);
+              const cond = parts.length > 0 ? parts.join(" & ") : theme.warning("(empty \u2014 never matches)");
+              console.log(`    ${theme.dim(`#${i}`)} ${r.name ? theme.accent(r.name) + " " : ""}${cond} ${theme.dim("\u2192")} ${theme.info(r.model)}`);
+            });
+          }
+          console.log();
+          console.log(`  ${theme.dim("Commands: /route on | off | test <msg> | show")}`);
+          console.log();
+          return;
+        }
+        console.log(theme.warning(`  Unknown subcommand: ${sub}. Usage: /route [on|off|show|test <message>]`));
+      }
+    },
     {
       name: "clear",
       description: "Clear conversation history",
@@ -1124,18 +1197,18 @@ function createDefaultCommands() {
             return;
           }
           const sessions = ctx.sessions.listSessions();
-          const matches = sessions.filter((s) => s.id.startsWith(id));
-          if (matches.length === 0) {
+          const matches2 = sessions.filter((s) => s.id.startsWith(id));
+          if (matches2.length === 0) {
             ctx.renderer.renderError(`Session '${id}' not found.`);
             return;
           }
-          if (matches.length > 1) {
-            console.log(theme.warning(`  \u26A0 Ambiguous prefix '${id}' matches ${matches.length} sessions \u2014 loading most recent:`));
-            for (const m of matches.slice(0, 5)) {
+          if (matches2.length > 1) {
+            console.log(theme.warning(`  \u26A0 Ambiguous prefix '${id}' matches ${matches2.length} sessions \u2014 loading most recent:`));
+            for (const m of matches2.slice(0, 5)) {
               console.log(theme.dim(`    ${m.id.slice(0, 12)}  ${m.title ?? "(untitled)"}`));
             }
           }
-          const match = matches[0];
+          const match = matches2[0];
           ctx.sessions.loadSession(match.id);
           ctx.setProvider(match.provider, match.model);
           ctx.resetSessionTokenUsage();
@@ -1373,13 +1446,13 @@ ${text}
   ${theme.heading(`Found ${results.length} session(s) containing "${query}"`)}
 `);
         for (const r of results) {
-          const { sessionMeta, matches } = r;
+          const { sessionMeta, matches: matches2 } = r;
           const dateStr = sessionMeta.updated.toLocaleDateString();
           console.log(
             `  ${theme.accent(sessionMeta.id.slice(0, 8))}` + theme.dim(`  [${dateStr}]  ${sessionMeta.provider} / ${sessionMeta.model}`) + (sessionMeta.title ? `
   ${theme.dim("  " + sessionMeta.title)}` : "")
           );
-          for (const m of matches) {
+          for (const m of matches2) {
             const icon = m.role === "user" ? "\u{1F464}" : "\u{1F916}";
             console.log(`    ${icon} ${theme.warning(m.snippet)}`);
           }
@@ -2194,7 +2267,7 @@ ${hint}` : "")
       usage: "/test [command|filter]",
       async execute(args, ctx) {
         try {
-          const { executeTests } = await import("./run-tests-NUF7CNM4.js");
+          const { executeTests } = await import("./run-tests-5HDSNAAC.js");
           const argStr = args.join(" ").trim();
           let testArgs = {};
           if (argStr) {
@@ -3394,6 +3467,74 @@ var CostTracker = class {
   }
 };
+// src/core/model-router.ts
+// Matches "#tag" at the start of the text or after whitespace. A tag starts
+// with an ASCII letter followed by up to 31 word characters or hyphens; the tag
+// name (without "#") is capture group 1.
+var TAG_REGEX = /(?:^|\s)#([a-zA-Z][\w-]{0,31})\b/g;
+/**
+ * Collect the distinct hashtags that appear in a message.
+ *
+ * @param message  Text to scan.
+ * @returns Set of tag names, lower-cased and without the leading "#".
+ */
+function extractTags(message) {
+  const tags = /* @__PURE__ */ new Set();
+  let m;
+  // TAG_REGEX is a shared global (/g) regex, so its scan position is stateful;
+  // reset it before every scan.
+  TAG_REGEX.lastIndex = 0;
+  while ((m = TAG_REGEX.exec(message)) !== null) {
+    tags.add(m[1].toLowerCase());
+  }
+  return tags;
+}
+/**
+ * Test whether a message satisfies a routing rule's match clause.
+ *
+ * Every condition present on the matcher must hold (logical AND). A matcher
+ * with no usable condition never matches.
+ *
+ * @param message  Raw user message; it is trimmed before any check.
+ * @param matcher  { tag?, contains?, maxLength?, minLength? }.
+ * @returns true only if at least one condition is set and all set conditions pass.
+ */
+function matches(message, matcher) {
+  const trimmed = message.trim();
+  const lower = trimmed.toLowerCase();
+  if (matcher.tag) {
+    // Tag comparison is case-insensitive: extractTags lower-cases what it finds.
+    const tags = extractTags(trimmed);
+    if (!tags.has(matcher.tag.toLowerCase())) return false;
+  }
+  if (matcher.contains && matcher.contains.length > 0) {
+    // Any one keyword is enough; comparison is case-insensitive substring.
+    const hit = matcher.contains.some((kw) => lower.includes(kw.toLowerCase()));
+    if (!hit) return false;
+  }
+  // Length bounds are inclusive and measured on the trimmed message.
+  if (typeof matcher.maxLength === "number") {
+    if (trimmed.length > matcher.maxLength) return false;
+  }
+  if (typeof matcher.minLength === "number") {
+    if (trimmed.length < matcher.minLength) return false;
+  }
+  // Nothing failed above; still require that some condition was actually set
+  // so an empty matcher does not match everything.
+  const hasAnyCondition = !!matcher.tag || matcher.contains && matcher.contains.length > 0 || typeof matcher.maxLength === "number" || typeof matcher.minLength === "number";
+  return !!hasAnyCondition;
+}
+function pickModel(message, currentModel, config, availableModels = []) {
+  if (!config.enabled || config.rules.length === 0) {
+    return { model: currentModel, reason: "routing disabled", overridden: false };
+  }
+  const isAvailable = (m) => availableModels.length === 0 || availableModels.includes(m);
+  for (let i = 0; i < config.rules.length; i++) {
+    const rule = config.rules[i];
+    if (!matches(message, rule.match)) continue;
+    if (!isAvailable(rule.model)) continue;
+    if (rule.model === currentModel) {
+      return {
+        model: currentModel,
+        reason: `rule "${rule.name ?? `#${i}`}" matched (same as current)`,
+        overridden: false,
+        ruleIdx: i
+      };
+    }
+    return {
+      model: rule.model,
+      reason: `rule "${rule.name ?? `#${i}`}" matched`,
+      overridden: true,
+      ruleIdx: i
+    };
+  }
+  if (config.fallback && config.fallback !== currentModel && isAvailable(config.fallback)) {
+    return {
+      model: config.fallback,
+      reason: "fallback",
+      overridden: true
+    };
+  }
+  return { model: currentModel, reason: "no rule matched", overridden: false };
+}
+function stripRoutingTags(message) {
+  return message.replace(/(?:^|\s)#(fast|deep|default)\b/gi, " ").replace(/\s{2,}/g, " ").trim();
+}
 // src/repl/notify.ts
 import { spawn } from "child_process";
 import { platform as platform2 } from "os";
@@ -3570,13 +3711,15 @@ var Repl = class {
   contextLayers = [];
   /** 本次会话累计 token 用量 */
   sessionTokenUsage = { inputTokens: 0, outputTokens: 0, cacheCreationTokens: 0, cacheReadTokens: 0 };
-  /** Fold a single-request TokenUsage (with optional cache fields) into sessionTokenUsage + cost tracker. */
-  addSessionUsage(u) {
+  /** Fold a single-request TokenUsage (with optional cache fields) into sessionTokenUsage + cost tracker.
+   *  modelOverride lets the smart router attribute cost to the actually-used model
+   *  when it differs from the UI-selected currentModel. */
+  addSessionUsage(u, modelOverride) {
     this.sessionTokenUsage.inputTokens += u.inputTokens;
     this.sessionTokenUsage.outputTokens += u.outputTokens;
     this.sessionTokenUsage.cacheCreationTokens += u.cacheCreationTokens ?? 0;
     this.sessionTokenUsage.cacheReadTokens += u.cacheReadTokens ?? 0;
-    this.costTracker.addCost(this.currentProvider, this.currentModel, u);
+    this.costTracker.addCost(this.currentProvider, modelOverride ?? this.currentModel, u);
   }
   /** 启动时检测到的 Git 分支（无 git 仓库时为 null） */
   gitBranch = null;
@@ -4468,7 +4611,16 @@ Session '${this.resumeSessionId}' not found.
 `));
       }
     }
-    const messageContent = parts.length > 0 ? parts.length === 1 && parts[0].type === "text" ? parts[0].text : parts : userInput;
+    const routingDecision = this.computeRoutingDecision(userInput);
+    const cleanInput = stripRoutingTags(userInput);
+    let effectiveParts = parts;
+    if (cleanInput !== userInput && parts.length > 0 && parts[0].type === "text") {
+      effectiveParts = [
+        { type: "text", text: stripRoutingTags(parts[0].text ?? "") },
+        ...parts.slice(1)
+      ];
+    }
+    const messageContent = effectiveParts.length > 0 ? effectiveParts.length === 1 && effectiveParts[0].type === "text" ? effectiveParts[0].text : effectiveParts : cleanInput;
     if (hasImage) {
       const visionHint = this.getVisionModelHint();
       if (visionHint) {
@@ -4489,6 +4641,12 @@ Session '${this.resumeSessionId}' not found.
       timestamp: /* @__PURE__ */ new Date()
     });
     this.events.emit("message.before", { input: userInput });
+    if (routingDecision.overridden) {
+      process.stdout.write(
+        theme.dim(`  \u2192 Routed to ${routingDecision.model} (${routingDecision.reason})
+`)
+      );
+    }
     const t0 = Date.now();
     try {
       const provider = this.providers.get(this.currentProvider);
@@ -4496,10 +4654,11 @@ Session '${this.resumeSessionId}' not found.
       if (supportsTools) {
         await this.handleChatWithTools(
           provider,
-          session.messages
+          session.messages,
+          routingDecision.model
         );
       } else {
-        await this.handleChatSimple(provider, session.messages);
+        await this.handleChatSimple(provider, session.messages, routingDecision.model);
       }
       if (this.config.get("session").autoSave) {
         if (autoTrimSessionIfNeeded(session)) {
@@ -4577,9 +4736,10 @@ Session '${this.resumeSessionId}' not found.
    */
   /** 运行时 thinking 模式覆盖：null=使用配置值，true/false=运行时覆盖 */
   runtimeThinking = null;
-  getModelParams() {
+  getModelParams(modelOverride) {
     const allParams = this.config.get("modelParams");
-    const params = allParams[this.currentModel] ?? {};
+    const modelId = modelOverride ?? this.currentModel;
+    const params = allParams[modelId] ?? {};
     return {
       ...params,
       maxTokens: params.maxTokens ?? DEFAULT_MAX_TOKENS,
@@ -4587,6 +4747,25 @@ Session '${this.resumeSessionId}' not found.
       thinkingBudget: params.thinkingBudget
     };
   }
+  /**
+   * Compute the smart-routing decision for this user turn; callers read model, reason and overridden.
+   * When the "routing" config is missing or disabled, returns the current model with overridden: false.
+   * Otherwise defers to pickModel with the current provider's model ids (presumably to skip unavailable models).
+   */
+  computeRoutingDecision(userInput) {
+    const routingConfig = this.config.get("routing");
+    if (!routingConfig || !routingConfig.enabled) {
+      return { model: this.currentModel, reason: "routing disabled", overridden: false };
+    }
+    let availableModels = []; // ids of the models listed by the current provider
+    try {
+      const provider = this.providers.get(this.currentProvider);
+      availableModels = provider.info.models.map((m) => m.id);
+    } catch { // best-effort: any lookup failure leaves the candidate list empty
+      availableModels = [];
+    }
+    return pickModel(userInput, this.currentModel, routingConfig, availableModels);
+  }
   // ─── Context 自动管理 ───────────────────────────────────────────────────
   /**
    * 估算文本的 token 数。
@@ -4639,12 +4818,15 @@ Session '${this.resumeSessionId}' not found.
     return total;
   }
   /**
-   * 获取当前模型的 context window 大小。
+   * 获取指定模型的 context window 大小（默认当前模型）。
+   * 智能路由可能在 handleChatWithTools 内把 effectiveModel 暂时切到别的模型，
+   * 故此处接受可选的 modelOverride 以保持计算一致性。
    */
-  getContextWindowSize() {
+  getContextWindowSize(modelOverride) {
     try {
       const provider = this.providers.get(this.currentProvider);
-      const modelInfo = provider.info.models.find((m) => m.id === this.currentModel);
+      const modelId = modelOverride ?? this.currentModel;
+      const modelInfo = provider.info.models.find((m) => m.id === modelId);
       return modelInfo?.contextWindow ?? 0;
     } catch {
       return 0;
@@ -4881,16 +5063,17 @@ Session '${this.resumeSessionId}' not found.
       }
     });
   }
-  async handleChatSimple(provider, messages) {
+  async handleChatSimple(provider, messages, modelOverride) {
     const session = this.sessions.current;
     const useStreaming = this.config.get("ui").streaming;
-    const modelParams = this.getModelParams();
+    const effectiveModel = modelOverride ?? this.currentModel;
+    const modelParams = this.getModelParams(effectiveModel);
     if (useStreaming) {
       const ac = this.setupStreamInterrupt();
       try {
         const stream = provider.chatStream({
           messages,
-          model: this.currentModel,
+          model: effectiveModel,
           systemPrompt: this.buildCurrentSystemPrompt(),
           stream: true,
           temperature: modelParams.temperature,
@@ -4910,7 +5093,7 @@ Session '${this.resumeSessionId}' not found.
         session.addMessage({ role: "assistant", content, timestamp: /* @__PURE__ */ new Date() });
         this.events.emit("message.after", { content });
         if (usage) {
-          this.addSessionUsage(usage);
+          this.addSessionUsage(usage, effectiveModel);
           session.addTokenUsage(usage);
           if (showTokens && !tokensShown) {
             this.renderer.renderUsage(usage, this.sessionTokenUsage);
@@ -4924,7 +5107,7 @@ Session '${this.resumeSessionId}' not found.
       try {
         const response = await provider.chat({
           messages,
-          model: this.currentModel,
+          model: effectiveModel,
           systemPrompt: this.buildCurrentSystemPrompt(),
           stream: false,
           temperature: modelParams.temperature,
@@ -4939,7 +5122,7 @@ Session '${this.resumeSessionId}' not found.
         session.addMessage({ role: "assistant", content: response.content, timestamp: /* @__PURE__ */ new Date() });
         this.events.emit("message.after", { content: response.content });
         if (response.usage) {
-          this.addSessionUsage(response.usage);
+          this.addSessionUsage(response.usage, effectiveModel);
           session.addTokenUsage(response.usage);
           if (this.shouldShowTokens()) {
             this.renderer.renderUsage(response.usage, this.sessionTokenUsage);
@@ -5052,8 +5235,9 @@ Session '${this.resumeSessionId}' not found.
       rawContent
     };
   }
-  async handleChatWithTools(provider, messages) {
+  async handleChatWithTools(provider, messages, modelOverride) {
     const session = this.sessions.current;
+    const effectiveModel = modelOverride ?? this.currentModel;
     let toolDefs;
     let mcpBudgetNote = null;
     const usedMcpToolNames = /* @__PURE__ */ new Set();
@@ -5064,7 +5248,7 @@ Session '${this.resumeSessionId}' not found.
       if (skillFilter) {
         toolDefs = this.toolRegistry.getDefinitions().filter((t) => skillFilter.has(t.name));
       } else {
-        const contextWindow = this.getContextWindowSize();
+        const contextWindow = this.getContextWindowSize(effectiveModel);
         if (contextWindow > 0) {
           const toolBudget = Math.floor(contextWindow * 0.2);
           const { definitions, trimmedCount, systemNote } = this.toolRegistry.getDefinitionsWithBudget(toolBudget, usedMcpToolNames);
@@ -5114,7 +5298,7 @@ You have a maximum of ${maxToolRounds} tool call rounds for this task. Plan effi
     const systemPrompt = baseSystemPrompt + roundBudgetHint + (mcpBudgetNote ? `
 ${mcpBudgetNote}` : "");
-    const modelParams = this.getModelParams();
+    const modelParams = this.getModelParams(effectiveModel);
     const useStreaming = this.config.get("ui").streaming;
     const spinner = this.renderer.showSpinner("Thinking...");
     const roundUsage = { inputTokens: 0, outputTokens: 0, cacheCreationTokens: 0, cacheReadTokens: 0 };
@@ -5204,7 +5388,7 @@ ${mcpBudgetNote}` : "");
               )
             );
             if (roundUsage.inputTokens > 0 || roundUsage.outputTokens > 0) {
-              this.addSessionUsage(roundUsage);
+              this.addSessionUsage(roundUsage, effectiveModel);
               session.addTokenUsage(roundUsage);
               if (this.shouldShowTokens()) {
                 this.renderer.renderUsage(roundUsage, this.sessionTokenUsage);
@@ -5232,7 +5416,7 @@ ${mcpBudgetNote}` : "");
         let alreadyRendered = false;
         const chatRequest = {
           messages: apiMessages,
-          model: this.currentModel,
+          model: effectiveModel,
           systemPrompt,
           stream: false,
           temperature: modelParams.temperature,
@@ -5334,7 +5518,7 @@ ${mcpBudgetNote}` : "");
               )
             );
             if (roundUsage.inputTokens > 0 || roundUsage.outputTokens > 0) {
-              this.addSessionUsage(roundUsage);
+              this.addSessionUsage(roundUsage, effectiveModel);
               session.addTokenUsage(roundUsage);
               if (this.shouldShowTokens()) {
                 this.renderer.renderUsage(roundUsage, this.sessionTokenUsage);
@@ -5369,7 +5553,7 @@ ${mcpBudgetNote}` : "");
           });
           this.events.emit("message.after", { content: finalContent });
           if (roundUsage.inputTokens > 0 || roundUsage.outputTokens > 0) {
-            this.addSessionUsage(roundUsage);
+            this.addSessionUsage(roundUsage, effectiveModel);
             session.addTokenUsage(roundUsage);
             if (this.shouldShowTokens()) {
               this.renderer.renderUsage(roundUsage, this.sessionTokenUsage);
@@ -5387,7 +5571,7 @@ ${mcpBudgetNote}` : "");
             try {
               const genStream = provider.chatStream({
                 messages: apiMessages,
-                model: this.currentModel,
+                model: effectiveModel,
                 systemPrompt,
                 stream: true,
                 temperature: modelParams.temperature,
@@ -5423,7 +5607,7 @@ ${mcpBudgetNote}` : "");
               const newMsgs2 = provider.buildToolResultMessages(result.toolCalls, syntheticResults, reasoningContent2);
               extraMessages.push(...newMsgs2);
               if (roundUsage.inputTokens > 0 || roundUsage.outputTokens > 0) {
-                this.addSessionUsage(roundUsage);
+                this.addSessionUsage(roundUsage, effectiveModel);
                 session.addTokenUsage(roundUsage);
                 if (teeShowTokens && !teeTokShown) {
                   this.renderer.renderUsage(roundUsage, this.sessionTokenUsage);
@@ -5438,14 +5622,14 @@ ${mcpBudgetNote}` : "");
         askUserContext.rl = this.rl;
         googleSearchContext.configManager = this.config;
         streamToFileContext.provider = provider;
-        streamToFileContext.model = this.currentModel;
+        streamToFileContext.model = effectiveModel;
         streamToFileContext.systemPrompt = systemPrompt;
         streamToFileContext.messages = apiMessages;
         streamToFileContext.extraMessages = extraMessages;
         streamToFileContext.temperature = modelParams.temperature;
         streamToFileContext.timeout = modelParams.timeout;
         spawnAgentContext.provider = provider;
-        spawnAgentContext.model = this.currentModel;
+        spawnAgentContext.model = effectiveModel;
         spawnAgentContext.systemPrompt = systemPrompt;
         spawnAgentContext.modelParams = modelParams;
         spawnAgentContext.configManager = this.config;
@@ -5605,7 +5789,7 @@ ${mcpBudgetNote}` : "");
         const summaryResult = await provider.chatWithTools(
           {
             messages: apiMessages,
-            model: this.currentModel,
+            model: effectiveModel,
             systemPrompt,
             stream: false,
             temperature: modelParams.temperature,
@@ -5643,7 +5827,7 @@ Tip: You can continue the conversation by asking the AI to proceed.`
         );
       }
       if (roundUsage.inputTokens > 0 || roundUsage.outputTokens > 0) {
-        this.addSessionUsage(roundUsage);
+        this.addSessionUsage(roundUsage, effectiveModel);
         session.addTokenUsage(roundUsage);
         if (this.shouldShowTokens()) {
           this.renderer.renderUsage(roundUsage, this.sessionTokenUsage);
@@ -5819,6 +6003,7 @@ Tip: You can continue the conversation by asking the AI to proceed.`
       forkSession: (messageCount, title) => this.sessions.forkSession(messageCount, title),
       getToolExecutor: () => this.toolExecutor,
       getCostTracker: () => this.costTracker,
+      computeRoutingDecision: (userInput) => this.computeRoutingDecision(userInput),
       exit: () => this.handleExit()
     };
     await cmd.execute(args, ctx);
@@ -5923,7 +6108,7 @@ program.command("web").description("Start Web UI server with browser-based chat
     console.error("Error: Invalid port number. Must be between 1 and 65535.");
     process.exit(1);
   }
-  const { startWebServer } = await import("./server-5HLNHRKM.js");
+  const { startWebServer } = await import("./server-L5P63T2I.js");
   await startWebServer({ port, host: options.host });
 });
 program.command("user [action] [username]").description("Manage Web UI users (list | create <name> | delete <name> | reset-password <name> | migrate <name>)").action(async (action, username) => {
@@ -6156,7 +6341,7 @@ program.command("hub [topic]").description("Start multi-agent hub (discuss / bra
     }),
     config.get("customProviders")
   );
-  const { startHub } = await import("./hub-RGK325NQ.js");
+  const { startHub } = await import("./hub-H3OSDWZW.js");
   await startHub(
     {
       topic: topic ?? "",

package/dist/{run-tests-NUF7CNM4.js → run-tests-5HDSNAAC.js} RENAMED Viewed

@@ -2,7 +2,7 @@
 import {
   executeTests,
   runTestsTool
-} from "./chunk-F44OKMB2.js";
+} from "./chunk-APJHOYCH.js";
 export {
   executeTests,
   runTestsTool

package/dist/{run-tests-KGUJL6L5.js → run-tests-TGOMJCVB.js} RENAMED Viewed

@@ -1,7 +1,7 @@
 import {
   executeTests,
   runTestsTool
-} from "./chunk-X7NVAEFI.js";
+} from "./chunk-IJIU46TF.js";
 export {
   executeTests,
   runTestsTool

package/dist/{server-5HLNHRKM.js → server-L5P63T2I.js} RENAMED Viewed

@@ -21,7 +21,7 @@ import {
   persistToolRound,
   rebuildExtraMessages,
   setupProxy
-} from "./chunk-XSIVGDCN.js";
+} from "./chunk-3IZATQV5.js";
 import {
   AuthManager
 } from "./chunk-BYNY5JPB.js";
@@ -42,7 +42,7 @@ import {
   spawnAgentContext,
   truncateOutput,
   undoStack
-} from "./chunk-BVLQ3FRA.js";
+} from "./chunk-ZKHLLGUU.js";
 import "./chunk-4BKXL7SM.js";
 import {
   AGENTIC_BEHAVIOR_GUIDELINE,
@@ -62,7 +62,7 @@ import {
   SKILLS_DIR_NAME,
   VERSION,
   buildUserIdentityPrompt
-} from "./chunk-F44OKMB2.js";
+} from "./chunk-APJHOYCH.js";
 // src/web/server.ts
 import express from "express";
@@ -1946,7 +1946,7 @@ ${undoResults.map((r) => `  \u2022 ${r}`).join("\n")}` });
       case "test": {
         this.send({ type: "info", message: "\u{1F9EA} Running tests..." });
         try {
-          const { executeTests } = await import("./run-tests-NUF7CNM4.js");
+          const { executeTests } = await import("./run-tests-5HDSNAAC.js");
           const argStr = args.join(" ").trim();
           let testArgs = {};
           if (argStr) {

package/dist/{task-orchestrator-4PVBMQJ7.js → task-orchestrator-AZPMRFET.js} RENAMED Viewed

@@ -4,11 +4,11 @@ import {
   getDangerLevel,
   googleSearchContext,
   truncateOutput
-} from "./chunk-BVLQ3FRA.js";
+} from "./chunk-ZKHLLGUU.js";
 import "./chunk-4BKXL7SM.js";
 import {
   SUBAGENT_ALLOWED_TOOLS
-} from "./chunk-F44OKMB2.js";
+} from "./chunk-APJHOYCH.js";
 // src/hub/task-orchestrator.ts
 import { createInterface } from "readline";

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "jinzd-ai-cli",
-  "version": "0.4.67",
+  "version": "0.4.69",
   "description": "Cross-platform REPL-style AI CLI with multi-provider support",
   "type": "module",
   "main": "./dist/index.js",