npm - @yeshwanthyk/ai - Versions diffs - 0.2.5 → 0.2.6 - Mend

@yeshwanthyk/ai 0.2.5 → 0.2.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/dist/models.generated.d.ts +407 -215
package/dist/models.generated.d.ts.map +1 -1
package/dist/models.generated.js +528 -354
package/dist/models.generated.js.map +1 -1
package/package.json +1 -1

package/dist/models.generated.js CHANGED Viewed

@@ -70,6 +70,23 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 64000,
         },
+        "claude-sonnet-4-6": {
+            id: "claude-sonnet-4-6",
+            name: "Claude Sonnet 4.6",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
+            },
+            contextWindow: 200000,
+            maxTokens: 64000,
+        },
         "claude-3-5-sonnet-20240620": {
             id: "claude-3-5-sonnet-20240620",
             name: "Claude Sonnet 3.5",
@@ -531,6 +548,23 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 65536,
         },
+        "gemini-3.1-pro-preview-customtools": {
+            id: "gemini-3.1-pro-preview-customtools",
+            name: "Gemini 3.1 Pro Preview Custom Tools",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 2,
+                output: 12,
+                cacheRead: 0.2,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
         "gemini-2.0-flash": {
             id: "gemini-2.0-flash",
             name: "Gemini 2.0 Flash",
@@ -667,6 +701,23 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
+        "gemini-3.1-pro-preview": {
+            id: "gemini-3.1-pro-preview",
+            name: "Gemini 3.1 Pro Preview",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 2,
+                output: 12,
+                cacheRead: 0.2,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
         "gemini-1.5-flash": {
             id: "gemini-1.5-flash",
             name: "Gemini 1.5 Flash",
@@ -754,6 +805,23 @@ export const MODELS = {
             contextWindow: 1047576,
             maxTokens: 32768,
         },
+        "gpt-5.3-codex-spark": {
+            id: "gpt-5.3-codex-spark",
+            name: "GPT-5.3 Codex Spark",
+            api: "openai-responses",
+            provider: "openai",
+            baseUrl: "https://api.openai.com/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1.75,
+                output: 14,
+                cacheRead: 0.175,
+                cacheWrite: 0,
+            },
+            contextWindow: 128000,
+            maxTokens: 32000,
+        },
         "gpt-4": {
             id: "gpt-4",
             name: "GPT-4",
@@ -1600,8 +1668,8 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0,
-                output: 0,
+                input: 2.25,
+                output: 2.75,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -1625,6 +1693,23 @@ export const MODELS = {
             contextWindow: 131000,
             maxTokens: 32000,
         },
+        "llama3.1-8b": {
+            id: "llama3.1-8b",
+            name: "Llama 3.1 8B",
+            api: "openai-completions",
+            provider: "cerebras",
+            baseUrl: "https://api.cerebras.ai/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.1,
+                output: 0.1,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 32000,
+            maxTokens: 8000,
+        },
         "gpt-oss-120b": {
             id: "gpt-oss-120b",
             name: "GPT OSS 120B",
@@ -2037,6 +2122,23 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
+        "glm-5": {
+            id: "glm-5",
+            name: "GLM-5",
+            api: "anthropic-messages",
+            provider: "zai",
+            baseUrl: "https://api.z.ai/api/anthropic",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1,
+                output: 3.2,
+                cacheRead: 0.2,
+                cacheWrite: 0,
+            },
+            contextWindow: 204800,
+            maxTokens: 131072,
+        },
         "glm-4.5-flash": {
             id: "glm-4.5-flash",
             name: "GLM-4.5-Flash",
@@ -2602,6 +2704,23 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
+        "glm-5": {
+            id: "glm-5",
+            name: "GLM-5",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1,
+                output: 3.2,
+                cacheRead: 0.2,
+                cacheWrite: 0,
+            },
+            contextWindow: 204800,
+            maxTokens: 131072,
+        },
         "qwen3-coder": {
             id: "qwen3-coder",
             name: "Qwen3 Coder",
@@ -2704,6 +2823,23 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 64000,
         },
+        "claude-sonnet-4-6": {
+            id: "claude-sonnet-4-6",
+            name: "Claude Sonnet 4.6",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
+            },
+            contextWindow: 1000000,
+            maxTokens: 64000,
+        },
         "claude-opus-4-6": {
             id: "claude-opus-4-6",
             name: "Claude Opus 4.6",
@@ -2770,7 +2906,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262144,
+            maxTokens: 65536,
         },
         "gemini-3-pro": {
             id: "gemini-3-pro",
@@ -2840,6 +2976,40 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 262144,
         },
+        "glm-5-free": {
+            id: "glm-5-free",
+            name: "GLM-5 Free",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 204800,
+            maxTokens: 131072,
+        },
+        "gemini-3.1-pro": {
+            id: "gemini-3.1-pro",
+            name: "Gemini 3.1 Pro Preview",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 2,
+                output: 12,
+                cacheRead: 0.2,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
         "gpt-5.1": {
             id: "gpt-5.1",
             name: "GPT-5.1",
@@ -3097,6 +3267,40 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
+        "minimax-m2.5-free": {
+            id: "minimax-m2.5-free",
+            name: "MiniMax M2.5 Free",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 204800,
+            maxTokens: 131072,
+        },
+        "minimax-m2.5": {
+            id: "minimax-m2.5",
+            name: "MiniMax M2.5",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.3,
+                output: 1.2,
+                cacheRead: 0.06,
+                cacheWrite: 0,
+            },
+            contextWindow: 204800,
+            maxTokens: 131072,
+        },
         "gpt-5.2": {
             id: "gpt-5.2",
             name: "GPT-5.2",
@@ -3207,7 +3411,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 16000,
+            maxTokens: 32000,
         },
         "gemini-3-pro-preview": {
             id: "gemini-3-pro-preview",
@@ -3244,7 +3448,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 100000,
+            maxTokens: 128000,
         },
         "gpt-5.1": {
             id: "gpt-5.1",
@@ -3262,7 +3466,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 128000,
+            maxTokens: 64000,
         },
         "gpt-4o": {
             id: "gpt-4o",
@@ -3299,7 +3503,7 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
+            contextWindow: 64000,
             maxTokens: 16384,
         },
         "gpt-5-mini": {
@@ -3320,6 +3524,25 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 64000,
         },
+        "claude-sonnet-4.6": {
+            id: "claude-sonnet-4.6",
+            name: "Claude Sonnet 4.6",
+            api: "openai-completions",
+            provider: "github-copilot",
+            baseUrl: "https://api.individual.githubcopilot.com",
+            headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
+            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 128000,
+            maxTokens: 32000,
+        },
         "gemini-2.5-pro": {
             id: "gemini-2.5-pro",
             name: "Gemini 2.5 Pro",
@@ -3357,6 +3580,25 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 128000,
         },
+        "gemini-3.1-pro-preview": {
+            id: "gemini-3.1-pro-preview",
+            name: "Gemini 3.1 Pro Preview",
+            api: "openai-completions",
+            provider: "github-copilot",
+            baseUrl: "https://api.individual.githubcopilot.com",
+            headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
+            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 128000,
+            maxTokens: 64000,
+        },
         "claude-sonnet-4": {
             id: "claude-sonnet-4",
             name: "Claude Sonnet 4",
@@ -3411,7 +3653,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 16000,
+            maxTokens: 32000,
         },
         "gpt-5.2": {
             id: "gpt-5.2",
@@ -3448,7 +3690,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 16000,
+            maxTokens: 32000,
         },
         "claude-opus-4.6": {
             id: "claude-opus-4.6",
@@ -3471,68 +3713,170 @@ export const MODELS = {
         },
     },
     "openrouter": {
-        "openrouter/pony-alpha": {
-            id: "openrouter/pony-alpha",
-            name: "Pony Alpha",
+        "google/gemini-3.1-pro-preview": {
+            id: "google/gemini-3.1-pro-preview",
+            name: "Google: Gemini 3.1 Pro Preview",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
+                input: 2,
+                output: 12,
+                cacheRead: 0.19999999999999998,
+                cacheWrite: 0.375,
             },
-            contextWindow: 200000,
-            maxTokens: 131000,
+            contextWindow: 1048576,
+            maxTokens: 65536,
         },
-        "anthropic/claude-opus-4.6": {
-            id: "anthropic/claude-opus-4.6",
-            name: "Anthropic: Claude Opus 4.6",
+        "anthropic/claude-sonnet-4.6": {
+            id: "anthropic/claude-sonnet-4.6",
+            name: "Anthropic: Claude Sonnet 4.6",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 5,
-                output: 25,
-                cacheRead: 0.5,
-                cacheWrite: 6.25,
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
             },
             contextWindow: 1000000,
             maxTokens: 128000,
         },
-        "qwen/qwen3-coder-next": {
-            id: "qwen/qwen3-coder-next",
-            name: "Qwen: Qwen3 Coder Next",
+        "qwen/qwen3.5-plus-02-15": {
+            id: "qwen/qwen3.5-plus-02-15",
+            name: "Qwen: Qwen3.5 Plus 2026-02-15",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
+            reasoning: true,
+            input: ["text", "image"],
             cost: {
-                input: 0.07,
-                output: 0.3,
+                input: 0.39999999999999997,
+                output: 2.4,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 262144,
+            contextWindow: 1000000,
             maxTokens: 65536,
         },
-        "openrouter/free": {
-            id: "openrouter/free",
-            name: "Free Models Router",
+        "qwen/qwen3.5-397b-a17b": {
+            id: "qwen/qwen3.5-397b-a17b",
+            name: "Qwen: Qwen3.5 397B A17B",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0,
-                output: 0,
+                input: 0.15,
+                output: 1,
+                cacheRead: 0.15,
+                cacheWrite: 0,
+            },
+            contextWindow: 262144,
+            maxTokens: 65536,
+        },
+        "minimax/minimax-m2.5": {
+            id: "minimax/minimax-m2.5",
+            name: "MiniMax: MiniMax M2.5",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.3,
+                output: 1.1,
+                cacheRead: 0.15,
+                cacheWrite: 0,
+            },
+            contextWindow: 196608,
+            maxTokens: 65536,
+        },
+        "z-ai/glm-5": {
+            id: "z-ai/glm-5",
+            name: "Z.ai: GLM 5",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.95,
+                output: 2.5500000000000003,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 204800,
+            maxTokens: 131072,
+        },
+        "qwen/qwen3-max-thinking": {
+            id: "qwen/qwen3-max-thinking",
+            name: "Qwen: Qwen3 Max Thinking",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1.2,
+                output: 6,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 262144,
+            maxTokens: 32768,
+        },
+        "anthropic/claude-opus-4.6": {
+            id: "anthropic/claude-opus-4.6",
+            name: "Anthropic: Claude Opus 4.6",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
+        "qwen/qwen3-coder-next": {
+            id: "qwen/qwen3-coder-next",
+            name: "Qwen: Qwen3 Coder Next",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.12,
+                output: 0.75,
+                cacheRead: 0.06,
+                cacheWrite: 0,
+            },
+            contextWindow: 262144,
+            maxTokens: 65536,
+        },
+        "openrouter/free": {
+            id: "openrouter/free",
+            name: "Free Models Router",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0,
+                output: 0,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -3556,6 +3900,23 @@ export const MODELS = {
             contextWindow: 256000,
             maxTokens: 256000,
         },
+        "stepfun/step-3.5-flash": {
+            id: "stepfun/step-3.5-flash",
+            name: "StepFun: Step 3.5 Flash",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.09999999999999999,
+                output: 0.3,
+                cacheRead: 0.02,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 256000,
+        },
         "arcee-ai/trinity-large-preview:free": {
             id: "arcee-ai/trinity-large-preview:free",
             name: "Arcee AI: Trinity Large Preview (free)",
@@ -3583,8 +3944,8 @@ export const MODELS = {
             input: ["text", "image"],
             cost: {
                 input: 0.44999999999999996,
-                output: 2.5,
-                cacheRead: 0,
+                output: 2.2,
+                cacheRead: 0.22499999999999998,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -3609,7 +3970,7 @@ export const MODELS = {
         },
         "z-ai/glm-4.7-flash": {
             id: "z-ai/glm-4.7-flash",
-            name: "Z.AI: GLM 4.7 Flash",
+            name: "Z.ai: GLM 4.7 Flash",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -3711,16 +4072,16 @@ export const MODELS = {
         },
         "z-ai/glm-4.7": {
             id: "z-ai/glm-4.7",
-            name: "Z.AI: GLM 4.7",
+            name: "Z.ai: GLM 4.7",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.39999999999999997,
-                output: 1.5,
-                cacheRead: 0,
+                input: 0.38,
+                output: 1.7,
+                cacheRead: 0.19,
                 cacheWrite: 0,
             },
             contextWindow: 202752,
@@ -3771,11 +4132,11 @@ export const MODELS = {
             cost: {
                 input: 0.09,
                 output: 0.29,
-                cacheRead: 0,
+                cacheRead: 0.045,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 65536,
         },
         "nvidia/nemotron-3-nano-30b-a3b:free": {
             id: "nvidia/nemotron-3-nano-30b-a3b:free",
@@ -3871,13 +4232,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.049999999999999996,
-                output: 0.22,
+                input: 0.39999999999999997,
+                output: 2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 65536,
+            maxTokens: 4096,
         },
         "relace/relace-search": {
             id: "relace/relace-search",
@@ -3898,7 +4259,7 @@ export const MODELS = {
         },
         "z-ai/glm-4.6v": {
             id: "z-ai/glm-4.6v",
-            name: "Z.AI: GLM 4.6V",
+            name: "Z.ai: GLM 4.6V",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -4075,13 +4436,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.25,
+                input: 0.26,
                 output: 0.38,
-                cacheRead: 0,
+                cacheRead: 0.13,
                 cacheWrite: 0,
             },
             contextWindow: 163840,
-            maxTokens: 65536,
+            maxTokens: 4096,
         },
         "prime-intellect/intellect-3": {
             id: "prime-intellect/intellect-3",
@@ -4100,40 +4461,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 131072,
         },
-        "tngtech/tng-r1t-chimera:free": {
-            id: "tngtech/tng-r1t-chimera:free",
-            name: "TNG: R1T Chimera (free)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 163840,
-            maxTokens: 65536,
-        },
-        "tngtech/tng-r1t-chimera": {
-            id: "tngtech/tng-r1t-chimera",
-            name: "TNG: R1T Chimera",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.25,
-                output: 0.85,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 163840,
-            maxTokens: 65536,
-        },
         "anthropic/claude-opus-4.5": {
             id: "anthropic/claude-opus-4.5",
             name: "Anthropic: Claude Opus 4.5",
@@ -4279,13 +4606,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.39999999999999997,
-                output: 1.75,
-                cacheRead: 0,
+                input: 0.47,
+                output: 2,
+                cacheRead: 0.14100000000000001,
                 cacheWrite: 0,
             },
-            contextWindow: 262144,
-            maxTokens: 65535,
+            contextWindow: 131072,
+            maxTokens: 4096,
         },
         "amazon/nova-premier-v1": {
             id: "amazon/nova-premier-v1",
@@ -4372,6 +4699,23 @@ export const MODELS = {
             contextWindow: 196608,
             maxTokens: 65536,
         },
+        "qwen/qwen3-vl-32b-instruct": {
+            id: "qwen/qwen3-vl-32b-instruct",
+            name: "Qwen: Qwen3 VL 32B Instruct",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 0.10400000000000001,
+                output: 0.41600000000000004,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 32768,
+        },
         "openai/gpt-5-image-mini": {
             id: "openai/gpt-5-image-mini",
             name: "OpenAI: GPT-5 Image Mini",
@@ -4415,12 +4759,12 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.18,
-                output: 2.0999999999999996,
+                input: 0.117,
+                output: 1.365,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
+            contextWindow: 131072,
             maxTokens: 32768,
         },
         "qwen/qwen3-vl-8b-instruct": {
@@ -4517,8 +4861,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.19999999999999998,
-                output: 1,
+                input: 0,
+                output: 0,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -4534,13 +4878,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 0.15,
-                output: 0.6,
-                cacheRead: 0.075,
+                input: 0.13,
+                output: 0.52,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 262144,
-            maxTokens: 4096,
+            contextWindow: 131072,
+            maxTokens: 32768,
         },
         "openai/gpt-5-pro": {
             id: "openai/gpt-5-pro",
@@ -4561,7 +4905,7 @@ export const MODELS = {
         },
         "z-ai/glm-4.6": {
             id: "z-ai/glm-4.6",
-            name: "Z.AI: GLM 4.6",
+            name: "Z.ai: GLM 4.6",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -4569,16 +4913,16 @@ export const MODELS = {
             input: ["text"],
             cost: {
                 input: 0.35,
-                output: 1.5,
+                output: 1.71,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 202752,
-            maxTokens: 65536,
+            maxTokens: 131072,
         },
         "z-ai/glm-4.6:exacto": {
             id: "z-ai/glm-4.6:exacto",
-            name: "Z.AI: GLM 4.6 (exacto)",
+            name: "Z.ai: GLM 4.6 (exacto)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -4627,23 +4971,6 @@ export const MODELS = {
             contextWindow: 163840,
             maxTokens: 65536,
         },
-        "google/gemini-2.5-flash-preview-09-2025": {
-            id: "google/gemini-2.5-flash-preview-09-2025",
-            name: "Google: Gemini 2.5 Flash Preview 09-2025",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.3,
-                output: 2.5,
-                cacheRead: 0.03,
-                cacheWrite: 0.08333333333333334,
-            },
-            contextWindow: 1048576,
-            maxTokens: 65536,
-        },
         "google/gemini-2.5-flash-lite-preview-09-2025": {
             id: "google/gemini-2.5-flash-lite-preview-09-2025",
             name: "Google: Gemini 2.5 Flash Lite Preview 09-2025",
@@ -4670,13 +4997,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.44999999999999996,
-                output: 3.5,
+                input: 0,
+                output: 0,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 262144,
-            maxTokens: 262144,
+            contextWindow: 131072,
+            maxTokens: 32768,
         },
         "qwen/qwen3-vl-235b-a22b-instruct": {
             id: "qwen/qwen3-vl-235b-a22b-instruct",
@@ -4709,7 +5036,7 @@ export const MODELS = {
                 cacheRead: 0.24,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
+            contextWindow: 262144,
             maxTokens: 32768,
         },
         "qwen/qwen3-coder-plus": {
@@ -4723,10 +5050,10 @@ export const MODELS = {
             cost: {
                 input: 1,
                 output: 5,
-                cacheRead: 0.09999999999999999,
+                cacheRead: 0.19999999999999998,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
+            contextWindow: 1000000,
             maxTokens: 65536,
         },
         "openai/gpt-5-codex": {
@@ -4825,10 +5152,10 @@ export const MODELS = {
             cost: {
                 input: 0.3,
                 output: 1.5,
-                cacheRead: 0.08,
+                cacheRead: 0.06,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
+            contextWindow: 1000000,
             maxTokens: 65536,
         },
         "qwen/qwen3-next-80b-a3b-thinking": {
@@ -4909,7 +5236,7 @@ export const MODELS = {
             input: ["text"],
             cost: {
                 input: 0.39999999999999997,
-                output: 4,
+                output: 1.2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -4959,13 +5286,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.39,
-                output: 1.9,
-                cacheRead: 0,
+                input: 0.39999999999999997,
+                output: 2,
+                cacheRead: 0.15,
                 cacheWrite: 0,
             },
-            contextWindow: 262144,
-            maxTokens: 262144,
+            contextWindow: 131072,
+            maxTokens: 4096,
         },
         "moonshotai/kimi-k2-0905:exacto": {
             id: "moonshotai/kimi-k2-0905:exacto",
@@ -4984,23 +5311,6 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 4096,
         },
-        "stepfun-ai/step3": {
-            id: "stepfun-ai/step3",
-            name: "StepFun: Step3",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.5700000000000001,
-                output: 1.42,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 65536,
-            maxTokens: 65536,
-        },
         "qwen/qwen3-30b-a3b-thinking-2507": {
             id: "qwen/qwen3-30b-a3b-thinking-2507",
             name: "Qwen: Qwen3 30B A3B Thinking 2507",
@@ -5035,23 +5345,6 @@ export const MODELS = {
             contextWindow: 256000,
             maxTokens: 10000,
         },
-        "nousresearch/hermes-4-70b": {
-            id: "nousresearch/hermes-4-70b",
-            name: "Nous: Hermes 4 70B",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.11,
-                output: 0.38,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 131072,
-        },
         "deepseek/deepseek-chat-v3.1": {
             id: "deepseek/deepseek-chat-v3.1",
             name: "DeepSeek: DeepSeek V3.1",
@@ -5139,7 +5432,7 @@ export const MODELS = {
         },
         "z-ai/glm-4.5v": {
             id: "z-ai/glm-4.5v",
-            name: "Z.AI: GLM 4.5V",
+            name: "Z.ai: GLM 4.5V",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -5154,23 +5447,6 @@ export const MODELS = {
             contextWindow: 65536,
             maxTokens: 16384,
         },
-        "ai21/jamba-mini-1.7": {
-            id: "ai21/jamba-mini-1.7",
-            name: "AI21: Jamba Mini 1.7",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.19999999999999998,
-                output: 0.39999999999999997,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 256000,
-            maxTokens: 4096,
-        },
         "ai21/jamba-large-1.7": {
             id: "ai21/jamba-large-1.7",
             name: "AI21: Jamba Large 1.7",
@@ -5316,13 +5592,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.02,
-                output: 0.09999999999999999,
+                input: 0.03,
+                output: 0.14,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 4096,
         },
         "anthropic/claude-opus-4.1": {
             id: "anthropic/claude-opus-4.1",
@@ -5384,8 +5660,8 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.08,
-                output: 0.33,
+                input: 0.09,
+                output: 0.3,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -5394,24 +5670,24 @@ export const MODELS = {
         },
         "z-ai/glm-4.5": {
             id: "z-ai/glm-4.5",
-            name: "Z.AI: GLM 4.5",
+            name: "Z.ai: GLM 4.5",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.35,
-                output: 1.55,
+                input: 0.55,
+                output: 2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 65536,
+            contextWindow: 131000,
+            maxTokens: 131000,
         },
         "z-ai/glm-4.5-air:free": {
             id: "z-ai/glm-4.5-air:free",
-            name: "Z.AI: GLM 4.5 Air (free)",
+            name: "Z.ai: GLM 4.5 Air (free)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -5428,20 +5704,20 @@ export const MODELS = {
         },
         "z-ai/glm-4.5-air": {
             id: "z-ai/glm-4.5-air",
-            name: "Z.AI: GLM 4.5 Air",
+            name: "Z.ai: GLM 4.5 Air",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.049999999999999996,
-                output: 0.22,
-                cacheRead: 0,
+                input: 0.13,
+                output: 0.85,
+                cacheRead: 0.024999999999999998,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 98304,
         },
         "qwen/qwen3-235b-a22b-thinking-2507": {
             id: "qwen/qwen3-235b-a22b-thinking-2507",
@@ -5452,17 +5728,17 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.11,
-                output: 0.6,
+                input: 0,
+                output: 0,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 262144,
-            maxTokens: 262144,
+            contextWindow: 131072,
+            maxTokens: 4096,
         },
         "z-ai/glm-4-32b": {
             id: "z-ai/glm-4-32b",
-            name: "Z.AI: GLM 4 32B ",
+            name: "Z.ai: GLM 4 32B ",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -5500,16 +5776,16 @@ export const MODELS = {
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
+            reasoning: false,
             input: ["text"],
             cost: {
                 input: 0.22,
-                output: 0.95,
-                cacheRead: 0,
+                output: 1,
+                cacheRead: 0.022,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262144,
+            maxTokens: 4096,
         },
         "qwen/qwen3-coder:exacto": {
             id: "qwen/qwen3-coder:exacto",
@@ -5641,7 +5917,7 @@ export const MODELS = {
             cost: {
                 input: 0.25,
                 output: 0.85,
-                cacheRead: 0,
+                cacheRead: 0.125,
                 cacheWrite: 0,
             },
             contextWindow: 163840,
@@ -5675,7 +5951,7 @@ export const MODELS = {
             cost: {
                 input: 0.06,
                 output: 0.18,
-                cacheRead: 0,
+                cacheRead: 0.03,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
@@ -5811,7 +6087,7 @@ export const MODELS = {
             cost: {
                 input: 0.39999999999999997,
                 output: 1.75,
-                cacheRead: 0,
+                cacheRead: 0.19999999999999998,
                 cacheWrite: 0,
             },
             contextWindow: 163840,
@@ -5851,23 +6127,6 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 64000,
         },
-        "nousresearch/deephermes-3-mistral-24b-preview": {
-            id: "nousresearch/deephermes-3-mistral-24b-preview",
-            name: "Nous: DeepHermes 3 Mistral 24B Preview",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.02,
-                output: 0.09999999999999999,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 32768,
-            maxTokens: 32768,
-        },
         "mistralai/mistral-medium-3": {
             id: "mistralai/mistral-medium-3",
             name: "Mistral: Mistral Medium 3",
@@ -5962,8 +6221,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.06,
-                output: 0.22,
+                input: 0.08,
+                output: 0.28,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -5996,8 +6255,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.049999999999999996,
-                output: 0.22,
+                input: 0.06,
+                output: 0.24,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -6015,7 +6274,7 @@ export const MODELS = {
             cost: {
                 input: 0.08,
                 output: 0.24,
-                cacheRead: 0,
+                cacheRead: 0.04,
                 cacheWrite: 0,
             },
             contextWindow: 40960,
@@ -6030,13 +6289,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.19999999999999998,
-                output: 0.6,
+                input: 0.45499999999999996,
+                output: 1.8199999999999998,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 40960,
-            maxTokens: 4096,
+            contextWindow: 131072,
+            maxTokens: 8192,
         },
         "openai/o4-mini-high": {
             id: "openai/o4-mini-high",
@@ -6219,7 +6478,7 @@ export const MODELS = {
             cost: {
                 input: 0.19,
                 output: 0.87,
-                cacheRead: 0,
+                cacheRead: 0.095,
                 cacheWrite: 0,
             },
             contextWindow: 163840,
@@ -6242,23 +6501,6 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 4096,
         },
-        "mistralai/mistral-small-3.1-24b-instruct": {
-            id: "mistralai/mistral-small-3.1-24b-instruct",
-            name: "Mistral: Mistral Small 3.1 24B",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.03,
-                output: 0.11,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 131072,
-        },
         "google/gemma-3-27b-it:free": {
             id: "google/gemma-3-27b-it:free",
             name: "Google: Gemma 3 27B (free)",
@@ -6287,7 +6529,7 @@ export const MODELS = {
             cost: {
                 input: 0.04,
                 output: 0.15,
-                cacheRead: 0,
+                cacheRead: 0.02,
                 cacheWrite: 0,
             },
             contextWindow: 128000,
@@ -6327,9 +6569,9 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 8192,
         },
-        "anthropic/claude-3.7-sonnet:thinking": {
-            id: "anthropic/claude-3.7-sonnet:thinking",
-            name: "Anthropic: Claude 3.7 Sonnet (thinking)",
+        "anthropic/claude-3.7-sonnet": {
+            id: "anthropic/claude-3.7-sonnet",
+            name: "Anthropic: Claude 3.7 Sonnet",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -6344,9 +6586,9 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 64000,
         },
-        "anthropic/claude-3.7-sonnet": {
-            id: "anthropic/claude-3.7-sonnet",
-            name: "Anthropic: Claude 3.7 Sonnet",
+        "anthropic/claude-3.7-sonnet:thinking": {
+            id: "anthropic/claude-3.7-sonnet:thinking",
+            name: "Anthropic: Claude 3.7 Sonnet (thinking)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -6427,7 +6669,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 8192,
+            maxTokens: 32768,
         },
         "qwen/qwen-turbo": {
             id: "qwen/qwen-turbo",
@@ -6440,10 +6682,10 @@ export const MODELS = {
             cost: {
                 input: 0.049999999999999996,
                 output: 0.19999999999999998,
-                cacheRead: 0.02,
+                cacheRead: 0.01,
                 cacheWrite: 0,
             },
-            contextWindow: 1000000,
+            contextWindow: 131072,
             maxTokens: 8192,
         },
         "qwen/qwen-plus": {
@@ -6457,11 +6699,11 @@ export const MODELS = {
             cost: {
                 input: 0.39999999999999997,
                 output: 1.2,
-                cacheRead: 0.16,
+                cacheRead: 0.08,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 8192,
+            contextWindow: 1000000,
+            maxTokens: 32768,
         },
         "qwen/qwen-max": {
             id: "qwen/qwen-max",
@@ -6474,7 +6716,7 @@ export const MODELS = {
             cost: {
                 input: 1.5999999999999999,
                 output: 6.3999999999999995,
-                cacheRead: 0.64,
+                cacheRead: 0.32,
                 cacheWrite: 0,
             },
             contextWindow: 32768,
@@ -6506,13 +6748,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.03,
-                output: 0.11,
+                input: 0.049999999999999996,
+                output: 0.08,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 32768,
-            maxTokens: 32768,
+            maxTokens: 16384,
         },
         "deepseek/deepseek-r1": {
             id: "deepseek/deepseek-r1",
@@ -6540,8 +6782,8 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.3,
-                output: 1.2,
+                input: 0.32,
+                output: 0.8899999999999999,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -6763,46 +7005,12 @@ export const MODELS = {
             cost: {
                 input: 6,
                 output: 30,
-                cacheRead: 0,
-                cacheWrite: 0,
+                cacheRead: 0.6,
+                cacheWrite: 7.5,
             },
             contextWindow: 200000,
             maxTokens: 8192,
         },
-        "mistralai/ministral-8b": {
-            id: "mistralai/ministral-8b",
-            name: "Mistral: Ministral 8B",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.09999999999999999,
-                output: 0.09999999999999999,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 4096,
-        },
-        "mistralai/ministral-3b": {
-            id: "mistralai/ministral-3b",
-            name: "Mistral: Ministral 3B",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.04,
-                output: 0.04,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 4096,
-        },
         "qwen/qwen-2.5-7b-instruct": {
             id: "qwen/qwen-2.5-7b-instruct",
             name: "Qwen: Qwen2.5 7B Instruct",
@@ -6871,23 +7079,6 @@ export const MODELS = {
             contextWindow: 32768,
             maxTokens: 16384,
         },
-        "mistralai/pixtral-12b": {
-            id: "mistralai/pixtral-12b",
-            name: "Mistral: Pixtral 12B",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.09999999999999999,
-                output: 0.09999999999999999,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 32768,
-            maxTokens: 4096,
-        },
         "cohere/command-r-08-2024": {
             id: "cohere/command-r-08-2024",
             name: "Cohere: Command R (08-2024)",
@@ -7245,23 +7436,6 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 4096,
         },
-        "mistralai/mistral-tiny": {
-            id: "mistralai/mistral-tiny",
-            name: "Mistral Tiny",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.25,
-                output: 0.25,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 32768,
-            maxTokens: 4096,
-        },
         "mistralai/mixtral-8x7b-instruct": {
             id: "mistralai/mixtral-8x7b-instruct",
             name: "Mistral: Mixtral 8x7B Instruct",
@@ -7449,7 +7623,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 400000,
-            maxTokens: 32000,
+            maxTokens: 128000,
         },
     },
 };