npm - @blockrun/clawrouter - Versions diffs - 0.12.73 → 0.12.75 - Mend

@blockrun/clawrouter 0.12.73 → 0.12.75

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (10)

package/README.md +4 -4
package/dist/cli.js +279 -63
package/dist/cli.js.map +1 -1
package/dist/index.d.ts +3 -1
package/dist/index.js +279 -63
package/dist/index.js.map +1 -1
package/docs/clawrouter-vs-openrouter-llm-routing-comparison.md +2 -2
package/docs/smart-llm-router-14-dimension-classifier.md +4 -4
package/package.json +2 -2
package/skills/clawrouter/SKILL.md +3 -3

package/README.md CHANGED Viewed

@@ -32,7 +32,7 @@ Agents can only sign transactions.<br><br>
 </div>
-> **ClawRouter** is an open-source smart LLM router that reduces AI API costs by up to 92%. It analyzes each request across 15 dimensions and routes to the cheapest capable model in under 1ms, entirely locally. ClawRouter is the only LLM router built for autonomous AI agents — it uses wallet signatures for authentication (no API keys) and USDC micropayments via the x402 protocol (no credit cards). 44+ models from OpenAI, Anthropic, Google, xAI, DeepSeek, and more. MIT licensed.
+> **ClawRouter** is an open-source smart LLM router that reduces AI API costs by up to 92%. It analyzes each request across 15 dimensions and routes to the cheapest capable model in under 1ms, entirely locally. ClawRouter is the only LLM router built for autonomous AI agents — it uses wallet signatures for authentication (no API keys) and USDC micropayments via the x402 protocol (no credit cards). 55+ models from OpenAI, Anthropic, Google, xAI, DeepSeek, and more. MIT licensed.
 ---
@@ -58,7 +58,7 @@ This is the stack that lets agents operate autonomously: **x402 + USDC + local r
 |                  | OpenRouter        | LiteLLM          | Martian           | Portkey           | **ClawRouter**          |
 | ---------------- | ----------------- | ---------------- | ----------------- | ----------------- | ----------------------- |
-| **Models**       | 200+              | 100+             | Smart routing     | Gateway           | **44+**                 |
+| **Models**       | 200+              | 100+             | Smart routing     | Gateway           | **55+**                 |
 | **Routing**      | Manual selection  | Manual selection | Smart (closed)    | Observability     | **Smart (open source)** |
 | **Auth**         | Account + API key | Your API keys    | Account + API key | Account + API key | **Wallet signature**    |
 | **Payment**      | Credit card       | BYO keys         | Credit card       | $49-499/mo        | **USDC per-request**    |
@@ -161,7 +161,7 @@ Edit existing images with `/img2img`:
 ## Models & Pricing
-44 models across 8 providers, one wallet. **Starting at $0.0002/request.**
+55+ models across 9 providers, one wallet. **Starting at $0.0002/request.**
 > **💡 "Cost per request"** = estimated cost for a typical chat message (~500 input + 500 output tokens).
@@ -394,7 +394,7 @@ npm test
 **The LLM router built for autonomous agents**
-You're here. 44+ models, local smart routing, x402 USDC payments — the only stack that lets agents operate independently.
+You're here. 55+ models, local smart routing, x402 USDC payments — the only stack that lets agents operate independently.
 `curl -fsSL https://blockrun.ai/ClawRouter-update | bash`

package/dist/cli.js CHANGED Viewed

@@ -39086,7 +39086,11 @@ var RulesStrategy = class {
     let tierConfigs;
     let profileSuffix;
     let profile;
-    if (routingProfile === "eco" && config.ecoTiers) {
+    if (routingProfile === "free" && config.freeTiers) {
+      tierConfigs = config.freeTiers;
+      profileSuffix = " | free";
+      profile = "free";
+    } else if (routingProfile === "eco" && config.ecoTiers) {
       tierConfigs = config.ecoTiers;
       profileSuffix = " | eco";
       profile = "eco";
@@ -40275,39 +40279,50 @@ var DEFAULT_ROUTING_CONFIG = {
       ]
     }
   },
-  // Eco tier configs - absolute cheapest (blockrun/eco)
+  // Eco tier configs - absolute cheapest, free-first (blockrun/eco)
   ecoTiers: {
     SIMPLE: {
       primary: "nvidia/gpt-oss-120b",
-      // 1,252ms, FREE! $0.00/$0.00
+      // FREE! $0.00/$0.00
       fallback: [
+        "nvidia/gpt-oss-20b",
+        // FREE — smaller, faster
         "google/gemini-3.1-flash-lite",
         // $0.25/$1.50 — newest flash-lite
         "openai/gpt-5.4-nano",
         // $0.20/$1.25 — fast nano
         "google/gemini-2.5-flash-lite",
-        // 1,353ms, $0.10/$0.40
+        // $0.10/$0.40
         "xai/grok-4-fast-non-reasoning"
-        // 1,143ms, $0.20/$0.50
+        // $0.20/$0.50
       ]
     },
     MEDIUM: {
-      primary: "google/gemini-3.1-flash-lite",
-      // $0.25/$1.50 — 1M context, newest flash-lite
+      primary: "nvidia/deepseek-v3.2",
+      // FREE — DeepSeek V3.2 quality at zero cost
       fallback: [
+        "nvidia/gpt-oss-120b",
+        // FREE fallback
+        "google/gemini-3.1-flash-lite",
+        // $0.25/$1.50
         "openai/gpt-5.4-nano",
-        // $0.20/$1.25, 1M context
+        // $0.20/$1.25
         "google/gemini-2.5-flash-lite",
-        // 1,353ms, $0.10/$0.40
+        // $0.10/$0.40
         "xai/grok-4-fast-non-reasoning",
-        "google/gemini-2.5-flash",
-        "nvidia/gpt-oss-120b"
+        "google/gemini-2.5-flash"
       ]
     },
     COMPLEX: {
-      primary: "google/gemini-3.1-flash-lite",
-      // $0.25/$1.50 — 1M context handles complexity
+      primary: "nvidia/nemotron-ultra-253b",
+      // FREE — 253B reasoning model
       fallback: [
+        "nvidia/mistral-large-3-675b",
+        // FREE — 675B brute-force
+        "nvidia/deepseek-v3.2",
+        // FREE
+        "google/gemini-3.1-flash-lite",
+        // $0.25/$1.50
         "google/gemini-2.5-flash-lite",
         "xai/grok-4-0709",
         "google/gemini-2.5-flash",
@@ -40316,8 +40331,13 @@ var DEFAULT_ROUTING_CONFIG = {
     },
     REASONING: {
       primary: "xai/grok-4-1-fast-reasoning",
-      // 1,454ms, $0.20/$0.50
-      fallback: ["xai/grok-4-fast-reasoning", "deepseek/deepseek-reasoner"]
+      // $0.20/$0.50
+      fallback: [
+        "xai/grok-4-fast-reasoning",
+        "nvidia/nemotron-ultra-253b",
+        // FREE reasoning fallback
+        "deepseek/deepseek-reasoner"
+      ]
     }
   },
   // Premium tier configs - best quality (blockrun/premium)
@@ -40431,6 +40451,73 @@ var DEFAULT_ROUTING_CONFIG = {
       ]
     }
   },
+  // Free tier configs - NVIDIA free models, smart-routed by task type (blockrun/free)
+  freeTiers: {
+    SIMPLE: {
+      primary: "nvidia/gpt-oss-20b",
+      // Fastest: small 20B for simple tasks
+      fallback: [
+        "nvidia/gpt-oss-120b",
+        // Solid general-purpose
+        "nvidia/nemotron-super-49b",
+        // Thinking mode
+        "nvidia/llama-4-maverick",
+        // MoE broad coverage
+        "nvidia/glm-4.7"
+        // Thinking mode
+      ]
+    },
+    MEDIUM: {
+      primary: "nvidia/deepseek-v3.2",
+      // DeepSeek V3.2 quality, zero cost
+      fallback: [
+        "nvidia/gpt-oss-120b",
+        // Strong 120B general-purpose
+        "nvidia/nemotron-super-49b",
+        // Thinking mode
+        "nvidia/mistral-large-3-675b",
+        // Largest Mistral
+        "nvidia/llama-4-maverick",
+        // MoE breadth
+        "nvidia/glm-4.7"
+        // Thinking mode
+      ]
+    },
+    COMPLEX: {
+      primary: "nvidia/nemotron-ultra-253b",
+      // Strongest free: 253B reasoning
+      fallback: [
+        "nvidia/mistral-large-3-675b",
+        // 675B massive params
+        "nvidia/deepseek-v3.2",
+        // V3.2 quality
+        "nvidia/nemotron-3-super-120b",
+        // Thinking mode MoE
+        "nvidia/qwen3-coder-480b",
+        // 480B MoE for code-heavy tasks
+        "nvidia/devstral-2-123b",
+        // Coding-focused
+        "nvidia/gpt-oss-120b"
+        // Last resort
+      ]
+    },
+    REASONING: {
+      primary: "nvidia/nemotron-ultra-253b",
+      // Best free reasoning: 253B
+      fallback: [
+        "nvidia/nemotron-3-super-120b",
+        // Thinking mode MoE
+        "nvidia/nemotron-super-49b",
+        // Thinking mode
+        "nvidia/deepseek-v3.2",
+        // DeepSeek reasoning
+        "nvidia/mistral-large-3-675b",
+        // Brute-force params
+        "nvidia/glm-4.7"
+        // GLM thinking mode
+      ]
+    }
+  },
   overrides: {
     maxTokensForceComplex: 1e5,
     structuredOutputMinTier: "MEDIUM",
@@ -40510,9 +40597,27 @@ var MODEL_ALIASES = {
   // delisted 2026-03-12
   "xai/grok-3-fast": "xai/grok-4-fast-reasoning",
   // delisted (too expensive)
-  // NVIDIA
+  // NVIDIA — existing alias kept for backward compat
   nvidia: "nvidia/gpt-oss-120b",
   "gpt-120b": "nvidia/gpt-oss-120b",
+  "gpt-20b": "nvidia/gpt-oss-20b",
+  // Free model aliases — "-free" suffix for models with paid twins
+  "deepseek-free": "nvidia/deepseek-v3.2",
+  "mistral-free": "nvidia/mistral-large-3-675b",
+  "glm-free": "nvidia/glm-4.7",
+  "llama-free": "nvidia/llama-4-maverick",
+  // Bare-name aliases for unique free models
+  nemotron: "nvidia/nemotron-ultra-253b",
+  "nemotron-ultra": "nvidia/nemotron-ultra-253b",
+  "nemotron-253b": "nvidia/nemotron-ultra-253b",
+  "nemotron-super": "nvidia/nemotron-super-49b",
+  "nemotron-49b": "nvidia/nemotron-super-49b",
+  "nemotron-120b": "nvidia/nemotron-3-super-120b",
+  devstral: "nvidia/devstral-2-123b",
+  "devstral-2": "nvidia/devstral-2-123b",
+  "qwen-coder": "nvidia/qwen3-coder-480b",
+  "qwen-coder-free": "nvidia/qwen3-coder-480b",
+  maverick: "nvidia/llama-4-maverick",
   // MiniMax
   minimax: "minimax/minimax-m2.7",
   "minimax-m2.7": "minimax/minimax-m2.7",
@@ -40559,11 +40664,11 @@ var BLOCKRUN_MODELS = [
   },
   {
     id: "free",
-    name: "Free (NVIDIA GPT-OSS-120B only)",
+    name: "Free (Smart Router - 11 NVIDIA Models)",
     inputPrice: 0,
     outputPrice: 0,
-    contextWindow: 128e3,
-    maxOutput: 4096
+    contextWindow: 131072,
+    maxOutput: 16384
   },
   {
     id: "eco",
@@ -41068,18 +41173,116 @@ var BLOCKRUN_MODELS = [
     agentic: true,
     toolCalling: true
   },
-  // NVIDIA - Free/cheap models
+  // NVIDIA - Free models (hosted by NVIDIA, billingMode: "free" on server)
+  // toolCalling intentionally omitted on all free models: structured function
+  // calling support unverified. Excluded from tool-heavy routing paths.
   {
     id: "nvidia/gpt-oss-120b",
-    name: "NVIDIA GPT-OSS 120B",
+    name: "[Free] GPT-OSS 120B",
     version: "120b",
     inputPrice: 0,
     outputPrice: 0,
     contextWindow: 128e3,
     maxOutput: 16384
-    // toolCalling intentionally omitted: free model, structured function
-    // calling support unverified. Excluded from tool-heavy routing paths.
   },
+  {
+    id: "nvidia/gpt-oss-20b",
+    name: "[Free] GPT-OSS 20B",
+    version: "20b",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 128e3,
+    maxOutput: 16384
+  },
+  {
+    id: "nvidia/nemotron-ultra-253b",
+    name: "[Free] Nemotron Ultra 253B",
+    version: "253b",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 131072,
+    maxOutput: 16384,
+    reasoning: true
+  },
+  {
+    id: "nvidia/nemotron-3-super-120b",
+    name: "[Free] Nemotron 3 Super 120B",
+    version: "3-super-120b",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 131072,
+    maxOutput: 16384,
+    reasoning: true
+  },
+  {
+    id: "nvidia/nemotron-super-49b",
+    name: "[Free] Nemotron Super 49B",
+    version: "super-49b",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 131072,
+    maxOutput: 16384,
+    reasoning: true
+  },
+  {
+    id: "nvidia/deepseek-v3.2",
+    name: "[Free] DeepSeek V3.2",
+    version: "v3.2",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 131072,
+    maxOutput: 16384,
+    reasoning: true
+  },
+  {
+    id: "nvidia/mistral-large-3-675b",
+    name: "[Free] Mistral Large 675B",
+    version: "3-675b",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 131072,
+    maxOutput: 16384,
+    reasoning: true
+  },
+  {
+    id: "nvidia/qwen3-coder-480b",
+    name: "[Free] Qwen3 Coder 480B",
+    version: "480b",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 131072,
+    maxOutput: 16384
+  },
+  {
+    id: "nvidia/devstral-2-123b",
+    name: "[Free] Devstral 2 123B",
+    version: "2-123b",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 131072,
+    maxOutput: 16384
+  },
+  {
+    id: "nvidia/glm-4.7",
+    name: "[Free] GLM-4.7",
+    version: "4.7",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 131072,
+    maxOutput: 16384,
+    reasoning: true
+  },
+  {
+    id: "nvidia/llama-4-maverick",
+    name: "[Free] Llama 4 Maverick",
+    version: "4-maverick",
+    inputPrice: 0,
+    outputPrice: 0,
+    contextWindow: 131072,
+    maxOutput: 16384,
+    reasoning: true
+  },
+  // NVIDIA - Paid models
   {
     id: "nvidia/kimi-k2.5",
     name: "NVIDIA Kimi K2.5",
@@ -46656,11 +46859,36 @@ var ROUTING_PROFILES = /* @__PURE__ */ new Set([
   "premium"
 ]);
 var FREE_MODEL = "nvidia/gpt-oss-120b";
+var FREE_MODELS = /* @__PURE__ */ new Set([
+  "nvidia/gpt-oss-120b",
+  "nvidia/gpt-oss-20b",
+  "nvidia/nemotron-ultra-253b",
+  "nvidia/nemotron-3-super-120b",
+  "nvidia/nemotron-super-49b",
+  "nvidia/deepseek-v3.2",
+  "nvidia/mistral-large-3-675b",
+  "nvidia/qwen3-coder-480b",
+  "nvidia/devstral-2-123b",
+  "nvidia/glm-4.7",
+  "nvidia/llama-4-maverick"
+]);
 var FREE_TIER_CONFIGS = {
-  SIMPLE: { primary: FREE_MODEL, fallback: [] },
-  MEDIUM: { primary: FREE_MODEL, fallback: [] },
-  COMPLEX: { primary: FREE_MODEL, fallback: [] },
-  REASONING: { primary: FREE_MODEL, fallback: [] }
+  SIMPLE: {
+    primary: "nvidia/gpt-oss-20b",
+    fallback: ["nvidia/gpt-oss-120b", "nvidia/nemotron-super-49b"]
+  },
+  MEDIUM: {
+    primary: "nvidia/deepseek-v3.2",
+    fallback: ["nvidia/gpt-oss-120b", "nvidia/nemotron-super-49b"]
+  },
+  COMPLEX: {
+    primary: "nvidia/nemotron-ultra-253b",
+    fallback: ["nvidia/mistral-large-3-675b", "nvidia/deepseek-v3.2", "nvidia/gpt-oss-120b"]
+  },
+  REASONING: {
+    primary: "nvidia/nemotron-ultra-253b",
+    fallback: ["nvidia/nemotron-3-super-120b", "nvidia/deepseek-v3.2"]
+  }
 };
 var freeRequestCount = 0;
 var MAX_MESSAGES = 200;
@@ -48672,30 +48900,7 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
         modelId = resolvedModel;
       }
       if (isRoutingProfile) {
-        if (routingProfile === "free") {
-          const freeModel = "nvidia/gpt-oss-120b";
-          console.log(`[ClawRouter] Free profile - using ${freeModel} directly`);
-          parsed.model = freeModel;
-          modelId = freeModel;
-          bodyModified = true;
-          freeRequestCount++;
-          if (freeRequestCount % 5 === 0) {
-            balanceFallbackNotice = `> **\u{1F4A1} Tip:** Not satisfied with free model quality? Fund your wallet to unlock deepseek-chat, gemini-flash, and 30+ premium models \u2014 starting at $0.001/request.
-`;
-          }
-          routingDecision = {
-            model: freeModel,
-            tier: "SIMPLE",
-            confidence: 1,
-            method: "rules",
-            reasoning: "free profile",
-            costEstimate: 0,
-            baselineCost: 0,
-            savings: 1,
-            tierConfigs: FREE_TIER_CONFIGS
-          };
-        } else {
+        {
           effectiveSessionId = getSessionId(req.headers) ?? deriveSessionId(parsedMessages);
           const existingSession = effectiveSessionId ? sessionStore.getSession(effectiveSessionId) : void 0;
           const rawPrompt = lastUserMsg?.content;
@@ -48811,6 +49016,14 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
             }
           }
           options.onRouted?.(routingDecision);
+          if (routingProfile === "free") {
+            freeRequestCount++;
+            if (freeRequestCount % 5 === 0) {
+              balanceFallbackNotice = `> **\u{1F4A1} Tip:** Free tier gives you 11 NVIDIA models. Want Claude, GPT-5, or Gemini? Fund your wallet \u2014 starting at $0.001/request.
+`;
+            }
+          }
         }
       }
       if (!effectiveSessionId && parsedMessages.length > 0) {
@@ -48906,7 +49119,7 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
   }
   deduplicator.markInflight(dedupKey);
   let estimatedCostMicros;
-  let isFreeModel = modelId === FREE_MODEL;
+  let isFreeModel = FREE_MODELS.has(modelId ?? "");
   if (modelId && !options.skipBalanceCheck && !isFreeModel) {
     const estimated = estimateAmount(modelId, body.length, maxTokens);
     if (estimated) {
@@ -48915,13 +49128,16 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
       const sufficiency = await balanceMonitor.checkSufficient(bufferedCostMicros);
       if (sufficiency.info.isEmpty || !sufficiency.sufficient) {
         const originalModel = modelId;
+        const fallbackTier = routingDecision?.tier ?? "SIMPLE";
+        const freeTierConfig = FREE_TIER_CONFIGS[fallbackTier];
+        const freeModel = freeTierConfig.primary;
         console.log(
-          `[ClawRouter] Wallet ${sufficiency.info.isEmpty ? "empty" : "insufficient"} (${sufficiency.info.balanceUSD}), falling back to free model: ${FREE_MODEL} (requested: ${originalModel})`
+          `[ClawRouter] Wallet ${sufficiency.info.isEmpty ? "empty" : "insufficient"} (${sufficiency.info.balanceUSD}), falling back to free model: ${freeModel} (tier: ${fallbackTier}, requested: ${originalModel})`
         );
-        modelId = FREE_MODEL;
+        modelId = freeModel;
         isFreeModel = true;
         const parsed = JSON.parse(body.toString());
-        parsed.model = FREE_MODEL;
+        parsed.model = freeModel;
         body = Buffer.from(JSON.stringify(parsed));
         balanceFallbackNotice = sufficiency.info.isEmpty ? `> **\u26A0\uFE0F Wallet empty** \u2014 using free model. Fund your wallet to use ${originalModel}.
@@ -48930,7 +49146,7 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
 `;
         freeRequestCount++;
         if (freeRequestCount % 5 === 0) {
-          balanceFallbackNotice = `> **\u{1F4A1} Tip:** Not satisfied with free model quality? Fund your wallet to unlock deepseek-chat, gemini-flash, and 30+ premium models \u2014 starting at $0.001/request.
+          balanceFallbackNotice = `> **\u{1F4A1} Tip:** Free tier gives you 11 NVIDIA models. Want Claude, GPT-5, or Gemini? Fund your wallet \u2014 starting at $0.001/request.
 `;
         }
@@ -48978,7 +49194,7 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
     const isComplexOrAgentic = hasTools || routingDecision?.tier === "COMPLEX" || routingDecision?.tier === "REASONING";
     if (isComplexOrAgentic) {
       const canAffordAnyNonFreeModel = BLOCKRUN_MODELS.some((m) => {
-        if (m.id === FREE_MODEL) return false;
+        if (FREE_MODELS.has(m.id)) return false;
         const est = estimateAmount(m.id, body.length, maxTokens);
         return est !== void 0 && Number(est) / 1e6 <= remainingUsd;
       });
@@ -49003,7 +49219,7 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
         deduplicator.removeInflight(dedupKey);
         return;
       }
-    } else if (!routingDecision && modelId && modelId !== FREE_MODEL) {
+    } else if (!routingDecision && modelId && !FREE_MODELS.has(modelId)) {
       const est = estimateAmount(modelId, body.length, maxTokens);
       const canAfford = !est || Number(est) / 1e6 <= remainingUsd;
       if (!canAfford) {
@@ -49144,14 +49360,14 @@ async function proxyRequest(req, res, apiBase, payFetch, options, routerOpts, de
       const remainingUsd = options.maxCostPerRunUsd - runCostUsd;
       const beforeFilter = [...modelsToTry];
       modelsToTry = modelsToTry.filter((m) => {
-        if (m === FREE_MODEL) return true;
+        if (FREE_MODELS.has(m)) return true;
         const est = estimateAmount(m, body.length, maxTokens);
         if (!est) return true;
         return Number(est) / 1e6 <= remainingUsd;
       });
       const excluded = beforeFilter.filter((m) => !modelsToTry.includes(m));
       const isComplexOrAgenticFilter = hasTools || routingDecision?.tier === "COMPLEX" || routingDecision?.tier === "REASONING" || routingDecision === void 0;
-      const filteredToFreeOnly = modelsToTry.length > 0 && modelsToTry.every((m) => m === FREE_MODEL);
+      const filteredToFreeOnly = modelsToTry.length > 0 && modelsToTry.every((m) => FREE_MODELS.has(m));
       if (isComplexOrAgenticFilter && filteredToFreeOnly) {
         const budgetSummary = `$${Math.max(0, remainingUsd).toFixed(4)} remaining (limit: $${options.maxCostPerRunUsd})`;
         console.log(
@@ -49189,7 +49405,7 @@ data: [DONE]
           `[ClawRouter] Budget downgrade (${budgetSummary}): excluded ${excluded.join(", ")}`
         );
         const fromModel = excluded[0];
-        const usingFree = modelsToTry.length === 1 && modelsToTry[0] === FREE_MODEL;
+        const usingFree = modelsToTry.length === 1 && FREE_MODELS.has(modelsToTry[0]);
         if (usingFree) {
           budgetDowngradeNotice = `> **\u26A0\uFE0F Budget cap reached** ($${runCostUsd.toFixed(4)}/$${options.maxCostPerRunUsd}) \u2014 downgraded to free model. Quality may be reduced. Increase \`maxCostPerRun\` to continue with ${fromModel}.
@@ -49243,7 +49459,7 @@ data: [DONE]
         upstream = result.response;
         actualModelUsed = tryModel;
         console.log(`[ClawRouter] Success with model: ${tryModel}`);
-        if (options.maxCostPerRunUsd && effectiveSessionId && tryModel !== FREE_MODEL) {
+        if (options.maxCostPerRunUsd && effectiveSessionId && !FREE_MODELS.has(tryModel)) {
           const costEst = estimateAmount(tryModel, body.length, maxTokens);
           if (costEst) {
             sessionStore.addSessionCost(effectiveSessionId, BigInt(costEst));
@@ -49263,7 +49479,7 @@ data: [DONE]
       const isPaymentErr = /payment.*verification.*failed|payment.*settlement.*failed|insufficient.*funds|transaction_simulation_failed/i.test(
         result.errorBody || ""
       );
-      if (isPaymentErr && tryModel !== FREE_MODEL && !isLastAttempt) {
+      if (isPaymentErr && !FREE_MODELS.has(tryModel) && !isLastAttempt) {
         failedAttempts.push({
           ...failedAttempts[failedAttempts.length - 1],
           reason: "payment_error"