npm - @blockrun/clawrouter - Versions diffs - 0.9.37 → 0.9.39 - Mend

@blockrun/clawrouter 0.9.37 → 0.9.39

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5)

package/dist/index.js CHANGED

@@ -1683,8 +1683,6 @@ var DEFAULT_ROUTING_CONFIG = {
       primary: "moonshot/kimi-k2.5",
       // $0.50/$2.40 - best quality/price for simple tasks
       fallback: [
-        "minimax/minimax-m2.5",
-        // $0.30/$1.20 - cheap with reasoning
         "google/gemini-2.5-flash",
         // 1M context, cost-effective
         "nvidia/gpt-oss-120b",
@@ -1696,8 +1694,6 @@ var DEFAULT_ROUTING_CONFIG = {
       primary: "xai/grok-code-fast-1",
       // Code specialist, $0.20/$1.50
       fallback: [
-        "minimax/minimax-m2.5",
-        // $0.30/$1.20 - cheap with reasoning
         "google/gemini-2.5-flash",
         // 1M context, cost-effective
         "deepseek/deepseek-chat",
@@ -1712,10 +1708,7 @@ var DEFAULT_ROUTING_CONFIG = {
         "google/gemini-2.5-flash",
         // CRITICAL: 1M context, cheap failsafe before expensive models
         "google/gemini-2.5-pro",
-        "minimax/minimax-m2.5",
-        // $0.30/$1.20 - cheap with reasoning
         "deepseek/deepseek-chat",
-        // Another cheap option
         "xai/grok-4-0709",
         "openai/gpt-5.2",
         // Newer and cheaper input than gpt-4o
@@ -1727,8 +1720,6 @@ var DEFAULT_ROUTING_CONFIG = {
       primary: "xai/grok-4-1-fast-reasoning",
       // Upgraded Grok 4.1 reasoning $0.20/$0.50
       fallback: [
-        "minimax/minimax-m2.5",
-        // $0.30/$1.20 - reasoning capable
         "deepseek/deepseek-reasoner",
         // Cheap reasoning model
         "openai/o4-mini",
@@ -1742,22 +1733,22 @@ var DEFAULT_ROUTING_CONFIG = {
     SIMPLE: {
       primary: "nvidia/gpt-oss-120b",
       // FREE! $0.00/$0.00
-      fallback: ["google/gemini-2.5-flash", "deepseek/deepseek-chat", "minimax/minimax-m2.5"]
+      fallback: ["google/gemini-2.5-flash", "deepseek/deepseek-chat"]
     },
     MEDIUM: {
       primary: "google/gemini-2.5-flash",
       // $0.15/$0.60 - cheapest capable
-      fallback: ["deepseek/deepseek-chat", "nvidia/gpt-oss-120b", "minimax/minimax-m2.5"]
+      fallback: ["deepseek/deepseek-chat", "nvidia/gpt-oss-120b"]
     },
     COMPLEX: {
       primary: "google/gemini-2.5-flash",
       // $0.15/$0.60 - 1M context handles complexity
-      fallback: ["deepseek/deepseek-chat", "xai/grok-4-0709", "minimax/minimax-m2.5"]
+      fallback: ["deepseek/deepseek-chat", "xai/grok-4-0709"]
     },
     REASONING: {
       primary: "xai/grok-4-1-fast-reasoning",
-      // $0.20/$0.50 - was MORE expensive than AUTO!
-      fallback: ["deepseek/deepseek-reasoner", "minimax/minimax-m2.5"]
+      // $0.20/$0.50
+      fallback: ["deepseek/deepseek-reasoner"]
     }
   },
   // Premium tier configs - best quality (blockrun/premium)
@@ -1807,32 +1798,18 @@ var DEFAULT_ROUTING_CONFIG = {
     SIMPLE: {
       primary: "moonshot/kimi-k2.5",
       // Cheaper than Haiku ($0.5/$2.4 vs $1/$5), larger context
-      fallback: [
-        "minimax/minimax-m2.5",
-        // $0.30/$1.20 - agentic capable, cheaper than kimi
-        "claude-haiku-4.5",
-        "xai/grok-4-1-fast-non-reasoning",
-        "openai/gpt-4o-mini"
-      ]
+      fallback: ["claude-haiku-4.5", "xai/grok-4-1-fast-non-reasoning", "openai/gpt-4o-mini"]
     },
     MEDIUM: {
       primary: "xai/grok-code-fast-1",
       // Code specialist for agentic coding
-      fallback: [
-        "minimax/minimax-m2.5",
-        // $0.30/$1.20 - agentic capable
-        "moonshot/kimi-k2.5",
-        "claude-haiku-4.5",
-        "claude-sonnet-4"
-      ]
+      fallback: ["moonshot/kimi-k2.5", "claude-haiku-4.5", "claude-sonnet-4"]
     },
     COMPLEX: {
       primary: "claude-sonnet-4",
       fallback: [
         "claude-opus-4",
         // Latest Opus - best agentic
-        "minimax/minimax-m2.5",
-        // $0.30/$1.20 - cheap agentic fallback
         "openai/gpt-5.2",
         "google/gemini-3-pro-preview",
         "xai/grok-4-0709"
@@ -1841,13 +1818,7 @@ var DEFAULT_ROUTING_CONFIG = {
     REASONING: {
       primary: "claude-sonnet-4",
       // Strong tool use + reasoning for agentic tasks
-      fallback: [
-        "claude-opus-4",
-        "minimax/minimax-m2.5",
-        // $0.30/$1.20 - reasoning + agentic
-        "xai/grok-4-1-fast-reasoning",
-        "deepseek/deepseek-reasoner"
-      ]
+      fallback: ["claude-opus-4", "xai/grok-4-1-fast-reasoning", "deepseek/deepseek-reasoner"]
     }
   },
   overrides: {
@@ -1951,7 +1922,33 @@ async function logUsage(entry) {
 }
 // src/stats.ts
-import { readFile, readdir } from "fs/promises";
+import { readdir } from "fs/promises";
+// src/fs-read.ts
+import { open } from "fs/promises";
+import { openSync, readSync, closeSync, fstatSync } from "fs";
+async function readTextFile(filePath) { // Opens filePath read-only and resolves to its contents decoded as UTF-8.
+  const fh = await open(filePath, "r");
+  try {
+    const buf = Buffer.alloc((await fh.stat()).size); // zero-filled buffer sized from fh.stat().size
+    await fh.read(buf, 0, buf.length, 0); // NOTE(review): single read from position 0; the resolved bytesRead is not checked, so a short read would leave trailing zero bytes in the result — confirm acceptable
+    return buf.toString("utf-8");
+  } finally {
+    await fh.close(); // handle is closed on both the success and the error path
+  }
+}
+function readTextFileSync(filePath) { // Synchronous counterpart: returns the contents of filePath decoded as UTF-8.
+  const fd = openSync(filePath, "r");
+  try {
+    const buf = Buffer.alloc(fstatSync(fd).size); // zero-filled buffer sized from fstat on the open descriptor
+    readSync(fd, buf); // NOTE(review): one readSync call; its return value (bytes read) is ignored, so a short read is not retried
+    return buf.toString("utf-8");
+  } finally {
+    closeSync(fd); // descriptor is closed on both the success and the error path
+  }
+}
+// src/stats.ts
 import { join as join3 } from "path";
 import { homedir as homedir2 } from "os";
@@ -1970,7 +1967,7 @@ var USER_AGENT = `clawrouter/${VERSION}`;
 var LOG_DIR2 = join3(homedir2(), ".openclaw", "blockrun", "logs");
 async function parseLogFile(filePath) {
   try {
-    const content = await readFile(filePath, "utf-8");
+    const content = await readTextFile(filePath);
     const lines = content.trim().split("\n").filter(Boolean);
     return lines.map((line) => {
       const entry = JSON.parse(line);
@@ -3761,6 +3758,7 @@ var ROUTING_PROFILES = /* @__PURE__ */ new Set([
 ]);
 var FREE_MODEL = "nvidia/gpt-oss-120b";
 var MAX_MESSAGES = 200; // message-count threshold checked by truncateMessages
+var CONTEXT_LIMIT_KB = 5120; // sent as the "x-context-limit-kb" response header value (5120 KB = 5 MiB)
 var HEARTBEAT_INTERVAL_MS = 2e3; // 2e3 = 2000
 var DEFAULT_REQUEST_TIMEOUT_MS = 18e4; // 18e4 = 180000
 var MAX_FALLBACK_ATTEMPTS = 5;
@@ -4147,15 +4145,28 @@ function normalizeMessagesForThinking(messages) {
   return hasChanges ? normalized : messages;
 }
 function truncateMessages(messages) { // Caps the message list at MAX_MESSAGES, keeping every system message plus the most recent others.
-  if (!messages || messages.length <= MAX_MESSAGES) return messages;
+  if (!messages || messages.length <= MAX_MESSAGES) { // nothing to trim: missing list or already within the limit
+    return {
+      messages,
+      wasTruncated: false,
+      originalCount: messages?.length ?? 0, // counts fall back to 0 when messages is null/undefined
+      truncatedCount: messages?.length ?? 0
+    };
+  }
   const systemMsgs = messages.filter((m) => m.role === "system"); // all system-role messages are retained
   const conversationMsgs = messages.filter((m) => m.role !== "system");
   const maxConversation = MAX_MESSAGES - systemMsgs.length; // system messages count against the MAX_MESSAGES budget
   const truncatedConversation = conversationMsgs.slice(-maxConversation); // NOTE(review): when systemMsgs.length >= MAX_MESSAGES this is slice(-0) (keeps everything) or a positive start index (drops from the front) — confirm this edge case is intended
+  const result = [...systemMsgs, ...truncatedConversation]; // system messages first, then the kept tail of the conversation
   console.log(
-    `[ClawRouter] Truncated messages: ${messages.length} \u2192 ${systemMsgs.length + truncatedConversation.length} (kept ${systemMsgs.length} system + ${truncatedConversation.length} recent)`
+    `[ClawRouter] Truncated messages: ${messages.length} \u2192 ${result.length} (kept ${systemMsgs.length} system + ${truncatedConversation.length} recent)`
   );
-  return [...systemMsgs, ...truncatedConversation];
+  return { // NOTE(review): return shape changes from a bare array to a result object; callers must read .messages
+    messages: result,
+    wasTruncated: true,
+    originalCount: messages.length,
+    truncatedCount: result.length
+  };
 }
 var KIMI_BLOCK_RE = /<[｜|][^<>]*begin[^<>]*[｜|]>[\s\S]*?<[｜|][^<>]*end[^<>]*[｜|]>/gi;
 var KIMI_TOKEN_RE = /<[｜|][^<>]*[｜|]>/g;
@@ -4488,7 +4499,8 @@ async function tryModelRequest(upstreamUrl, method, headers, body, modelId, maxT
       parsed.messages = normalizeMessageRoles(parsed.messages);
     }
     if (Array.isArray(parsed.messages)) {
-      parsed.messages = truncateMessages(parsed.messages);
+      const truncationResult = truncateMessages(parsed.messages);
+      parsed.messages = truncationResult.messages;
     }
     if (Array.isArray(parsed.messages)) {
       parsed.messages = sanitizeToolIds(parsed.messages);
@@ -4562,6 +4574,7 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
     bodyChunks.push(Buffer.isBuffer(chunk) ? chunk : Buffer.from(chunk));
   }
   let body = Buffer.concat(bodyChunks);
+  const originalContextSizeKB = Math.ceil(body.length / 1024);
   let routingDecision;
   let isStreaming = false;
   let modelId = "";
@@ -4669,7 +4682,7 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
             const systemPrompt = typeof systemMsg?.content === "string" ? systemMsg.content : void 0;
             const tools = parsed.tools;
             const hasTools = Array.isArray(tools) && tools.length > 0;
-            if (hasTools) {
+            if (hasTools && tools) {
               console.log(
                 `[ClawRouter] Tools detected (${tools.length}), agentic mode via keywords`
               );
@@ -4814,7 +4827,9 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
     res.writeHead(200, {
       "content-type": "text/event-stream",
       "cache-control": "no-cache",
-      connection: "keep-alive"
+      connection: "keep-alive",
+      "x-context-used-kb": String(originalContextSizeKB),
+      "x-context-limit-kb": String(CONTEXT_LIMIT_KB)
     });
     headersSentEarly = true;
     safeWrite(res, ": heartbeat\n\n");
@@ -4977,7 +4992,11 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
           completedAt: Date.now()
         });
       } else {
-        res.writeHead(errStatus, { "Content-Type": "application/json" });
+        res.writeHead(errStatus, {
+          "Content-Type": "application/json",
+          "x-context-used-kb": String(originalContextSizeKB),
+          "x-context-limit-kb": String(CONTEXT_LIMIT_KB)
+        });
         res.end(transformedErr);
         deduplicator.complete(dedupKey, {
           status: errStatus,
@@ -5103,6 +5122,8 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
           return;
         responseHeaders[key] = value;
       });
+      responseHeaders["x-context-used-kb"] = String(originalContextSizeKB);
+      responseHeaders["x-context-limit-kb"] = String(CONTEXT_LIMIT_KB);
       res.writeHead(upstream.status, responseHeaders);
       if (upstream.body) {
         const reader = upstream.body.getReader();
@@ -5197,7 +5218,7 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
 }
 // src/auth.ts
-import { writeFile, readFile as readFile2, mkdir as mkdir2 } from "fs/promises";
+import { writeFile, mkdir as mkdir2 } from "fs/promises";
 import { join as join4 } from "path";
 import { homedir as homedir3 } from "os";
 import { generatePrivateKey, privateKeyToAccount as privateKeyToAccount3 } from "viem/accounts";
@@ -5205,7 +5226,7 @@ var WALLET_DIR = join4(homedir3(), ".openclaw", "blockrun");
 var WALLET_FILE = join4(WALLET_DIR, "wallet.key");
 async function loadSavedWallet() {
   try {
-    const key = (await readFile2(WALLET_FILE, "utf-8")).trim();
+    const key = (await readTextFile(WALLET_FILE)).trim();
     if (key.startsWith("0x") && key.length === 66) {
       console.log(`[ClawRouter] \u2713 Loaded existing wallet from ${WALLET_FILE}`);
       return key;
@@ -5226,7 +5247,7 @@ async function generateAndSaveWallet() {
   await mkdir2(WALLET_DIR, { recursive: true });
   await writeFile(WALLET_FILE, key + "\n", { mode: 384 });
   try {
-    const verification = (await readFile2(WALLET_FILE, "utf-8")).trim();
+    const verification = (await readTextFile(WALLET_FILE)).trim();
     if (verification !== key) {
       throw new Error("Wallet file verification failed - content mismatch");
     }
@@ -5255,7 +5276,6 @@ async function resolveOrGenerateWalletKey() {
 // src/index.ts
 import {
-  readFileSync,
   writeFileSync,
   existsSync,
   readdirSync,
@@ -5362,7 +5382,7 @@ function injectModelsConfig(logger) {
   }
   if (existsSync(configPath)) {
     try {
-      const content = readFileSync(configPath, "utf-8").trim();
+      const content = readTextFileSync(configPath).trim();
       if (content) {
         config = JSON.parse(content);
       } else {
@@ -5554,7 +5574,7 @@ function injectAuthProfile(logger) {
       };
       if (existsSync(authPath)) {
         try {
-          const existing = JSON.parse(readFileSync(authPath, "utf-8"));
+          const existing = JSON.parse(readTextFileSync(authPath));
           if (existing.version && existing.profiles) {
             store = existing;
           }
@@ -5673,7 +5693,7 @@ async function createWalletCommand() {
       let address;
       try {
         if (existsSync(WALLET_FILE)) {
-          walletKey = readFileSync(WALLET_FILE, "utf-8").trim();
+          walletKey = readTextFileSync(WALLET_FILE).trim();
           if (walletKey.startsWith("0x") && walletKey.length === 66) {
             const account = privateKeyToAccount4(walletKey);
             address = account.address;