npm - @mariozechner/pi-ai - Versions diffs - 0.5.43 → 0.5.44 - Mend

@mariozechner/pi-ai 0.5.43 → 0.5.44

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (17) hide show

package/dist/models.generated.d.ts +456 -235
package/dist/models.generated.d.ts.map +1 -1
package/dist/models.generated.js +990 -769
package/dist/models.generated.js.map +1 -1
package/dist/providers/anthropic.js +24 -1
package/dist/providers/anthropic.js.map +1 -1
package/dist/providers/google.js +1 -1
package/dist/providers/google.js.map +1 -1
package/dist/providers/transorm-messages.d.ts.map +1 -1
package/dist/providers/transorm-messages.js +46 -1
package/dist/providers/transorm-messages.js.map +1 -1
package/dist/utils/event-stream.js +3 -7
package/dist/utils/event-stream.js.map +1 -1
package/dist/utils/validation.d.ts.map +1 -1
package/dist/utils/validation.js +25 -3
package/dist/utils/validation.js.map +1 -1
package/package.json +3 -3

package/dist/models.generated.js CHANGED Viewed

@@ -2,13 +2,13 @@
 // Do not edit manually - run 'npm run generate-models' to update
 export const MODELS = {
     anthropic: {
-        "claude-3-7-sonnet-20250219": {
-            id: "claude-3-7-sonnet-20250219",
-            name: "Claude Sonnet 3.7",
+        "claude-3-5-sonnet-20241022": {
+            id: "claude-3-5-sonnet-20241022",
+            name: "Claude Sonnet 3.5 v2",
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
-            reasoning: true,
+            reasoning: false,
             input: ["text", "image"],
             cost: {
                 input: 3,
@@ -17,15 +17,32 @@ export const MODELS = {
                 cacheWrite: 3.75,
             },
             contextWindow: 200000,
-            maxTokens: 64000,
+            maxTokens: 8192,
         },
-        "claude-opus-4-1-20250805": {
-            id: "claude-opus-4-1-20250805",
-            name: "Claude Opus 4.1",
+        "claude-3-5-sonnet-20240620": {
+            id: "claude-3-5-sonnet-20240620",
+            name: "Claude Sonnet 3.5",
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
-            reasoning: true,
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
+            },
+            contextWindow: 200000,
+            maxTokens: 8192,
+        },
+        "claude-3-opus-20240229": {
+            id: "claude-3-opus-20240229",
+            name: "Claude Opus 3",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: false,
             input: ["text", "image"],
             cost: {
                 input: 15,
@@ -34,41 +51,41 @@ export const MODELS = {
                 cacheWrite: 18.75,
             },
             contextWindow: 200000,
-            maxTokens: 32000,
+            maxTokens: 4096,
         },
-        "claude-3-haiku-20240307": {
-            id: "claude-3-haiku-20240307",
-            name: "Claude Haiku 3",
+        "claude-sonnet-4-5-20250929": {
+            id: "claude-sonnet-4-5-20250929",
+            name: "Claude Sonnet 4.5",
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
-            reasoning: false,
+            reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.25,
-                output: 1.25,
-                cacheRead: 0.03,
-                cacheWrite: 0.3,
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
             },
             contextWindow: 200000,
-            maxTokens: 4096,
+            maxTokens: 64000,
         },
-        "claude-3-5-haiku-20241022": {
-            id: "claude-3-5-haiku-20241022",
-            name: "Claude Haiku 3.5",
+        "claude-sonnet-4-20250514": {
+            id: "claude-sonnet-4-20250514",
+            name: "Claude Sonnet 4",
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
-            reasoning: false,
+            reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.8,
-                output: 4,
-                cacheRead: 0.08,
-                cacheWrite: 1,
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
             },
             contextWindow: 200000,
-            maxTokens: 8192,
+            maxTokens: 64000,
         },
         "claude-opus-4-20250514": {
             id: "claude-opus-4-20250514",
@@ -87,87 +104,87 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 32000,
         },
-        "claude-3-5-sonnet-20241022": {
-            id: "claude-3-5-sonnet-20241022",
-            name: "Claude Sonnet 3.5 v2",
+        "claude-3-5-haiku-20241022": {
+            id: "claude-3-5-haiku-20241022",
+            name: "Claude Haiku 3.5",
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 3,
-                output: 15,
-                cacheRead: 0.3,
-                cacheWrite: 3.75,
+                input: 0.8,
+                output: 4,
+                cacheRead: 0.08,
+                cacheWrite: 1,
             },
             contextWindow: 200000,
             maxTokens: 8192,
         },
-        "claude-3-5-sonnet-20240620": {
-            id: "claude-3-5-sonnet-20240620",
-            name: "Claude Sonnet 3.5",
+        "claude-3-haiku-20240307": {
+            id: "claude-3-haiku-20240307",
+            name: "Claude Haiku 3",
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 3,
-                output: 15,
-                cacheRead: 0.3,
-                cacheWrite: 3.75,
+                input: 0.25,
+                output: 1.25,
+                cacheRead: 0.03,
+                cacheWrite: 0.3,
             },
             contextWindow: 200000,
-            maxTokens: 8192,
+            maxTokens: 4096,
         },
-        "claude-3-sonnet-20240229": {
-            id: "claude-3-sonnet-20240229",
-            name: "Claude Sonnet 3",
+        "claude-3-7-sonnet-20250219": {
+            id: "claude-3-7-sonnet-20250219",
+            name: "Claude Sonnet 3.7",
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
-            reasoning: false,
+            reasoning: true,
             input: ["text", "image"],
             cost: {
                 input: 3,
                 output: 15,
                 cacheRead: 0.3,
-                cacheWrite: 0.3,
+                cacheWrite: 3.75,
             },
             contextWindow: 200000,
-            maxTokens: 4096,
+            maxTokens: 64000,
         },
-        "claude-sonnet-4-20250514": {
-            id: "claude-sonnet-4-20250514",
-            name: "Claude Sonnet 4",
+        "claude-opus-4-1-20250805": {
+            id: "claude-opus-4-1-20250805",
+            name: "Claude Opus 4.1",
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 3,
-                output: 15,
-                cacheRead: 0.3,
-                cacheWrite: 3.75,
+                input: 15,
+                output: 75,
+                cacheRead: 1.5,
+                cacheWrite: 18.75,
             },
             contextWindow: 200000,
-            maxTokens: 64000,
+            maxTokens: 32000,
         },
-        "claude-3-opus-20240229": {
-            id: "claude-3-opus-20240229",
-            name: "Claude Opus 3",
+        "claude-3-sonnet-20240229": {
+            id: "claude-3-sonnet-20240229",
+            name: "Claude Sonnet 3",
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 15,
-                output: 75,
-                cacheRead: 1.5,
-                cacheWrite: 18.75,
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 0.3,
             },
             contextWindow: 200000,
             maxTokens: 4096,
@@ -191,39 +208,73 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
-        "gemini-2.5-pro": {
-            id: "gemini-2.5-pro",
-            name: "Gemini 2.5 Pro",
+        "gemini-flash-lite-latest": {
+            id: "gemini-flash-lite-latest",
+            name: "Gemini Flash-Lite Latest",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 1.25,
-                output: 10,
-                cacheRead: 0.31,
+                input: 0.1,
+                output: 0.4,
+                cacheRead: 0.025,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
             maxTokens: 65536,
         },
-        "gemini-1.5-flash": {
-            id: "gemini-1.5-flash",
-            name: "Gemini 1.5 Flash",
+        "gemini-2.5-flash": {
+            id: "gemini-2.5-flash",
+            name: "Gemini 2.5 Flash",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: false,
+            reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.075,
-                output: 0.3,
-                cacheRead: 0.01875,
+                input: 0.3,
+                output: 2.5,
+                cacheRead: 0.075,
                 cacheWrite: 0,
             },
-            contextWindow: 1000000,
-            maxTokens: 8192,
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
+        "gemini-flash-latest": {
+            id: "gemini-flash-latest",
+            name: "Gemini Flash Latest",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.15,
+                output: 0.6,
+                cacheRead: 0.0375,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
+        "gemini-2.5-pro-preview-05-06": {
+            id: "gemini-2.5-pro-preview-05-06",
+            name: "Gemini 2.5 Pro Preview 05-06",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1.25,
+                output: 10,
+                cacheRead: 0.31,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
         },
         "gemini-2.0-flash-lite": {
             id: "gemini-2.0-flash-lite",
@@ -242,52 +293,52 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 8192,
         },
-        "gemini-1.5-pro": {
-            id: "gemini-1.5-pro",
-            name: "Gemini 1.5 Pro",
+        "gemini-live-2.5-flash-preview-native-audio": {
+            id: "gemini-live-2.5-flash-preview-native-audio",
+            name: "Gemini Live 2.5 Flash Preview Native Audio",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: false,
-            input: ["text", "image"],
+            reasoning: true,
+            input: ["text"],
             cost: {
-                input: 1.25,
-                output: 5,
-                cacheRead: 0.3125,
+                input: 0.5,
+                output: 2,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 1000000,
-            maxTokens: 8192,
+            contextWindow: 131072,
+            maxTokens: 65536,
         },
-        "gemini-1.5-flash-8b": {
-            id: "gemini-1.5-flash-8b",
-            name: "Gemini 1.5 Flash-8B",
+        "gemini-2.0-flash": {
+            id: "gemini-2.0-flash",
+            name: "Gemini 2.0 Flash",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 0.0375,
-                output: 0.15,
-                cacheRead: 0.01,
+                input: 0.1,
+                output: 0.4,
+                cacheRead: 0.025,
                 cacheWrite: 0,
             },
-            contextWindow: 1000000,
+            contextWindow: 1048576,
             maxTokens: 8192,
         },
-        "gemini-2.5-flash": {
-            id: "gemini-2.5-flash",
-            name: "Gemini 2.5 Flash",
+        "gemini-2.5-flash-lite": {
+            id: "gemini-2.5-flash-lite",
+            name: "Gemini 2.5 Flash Lite",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.3,
-                output: 2.5,
-                cacheRead: 0.075,
+                input: 0.1,
+                output: 0.4,
+                cacheRead: 0.025,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
@@ -310,43 +361,111 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
-        "gemini-2.5-pro-preview-05-06": {
-            id: "gemini-2.5-pro-preview-05-06",
-            name: "Gemini 2.5 Pro Preview 05-06",
+        "gemini-2.5-flash-lite-preview-06-17": {
+            id: "gemini-2.5-flash-lite-preview-06-17",
+            name: "Gemini 2.5 Flash Lite Preview 06-17",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 1.25,
-                output: 10,
-                cacheRead: 0.31,
+                input: 0.1,
+                output: 0.4,
+                cacheRead: 0.025,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
             maxTokens: 65536,
         },
-        "gemini-2.0-flash": {
-            id: "gemini-2.0-flash",
-            name: "Gemini 2.0 Flash",
+        "gemini-2.5-flash-preview-09-2025": {
+            id: "gemini-2.5-flash-preview-09-2025",
+            name: "Gemini 2.5 Flash Preview 09-25",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: false,
+            reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.1,
-                output: 0.4,
-                cacheRead: 0.025,
+                input: 0.15,
+                output: 0.6,
+                cacheRead: 0.0375,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
+        "gemini-2.5-flash-preview-04-17": {
+            id: "gemini-2.5-flash-preview-04-17",
+            name: "Gemini 2.5 Flash Preview 04-17",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.15,
+                output: 0.6,
+                cacheRead: 0.0375,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
+        "gemini-2.5-pro": {
+            id: "gemini-2.5-pro",
+            name: "Gemini 2.5 Pro",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1.25,
+                output: 10,
+                cacheRead: 0.31,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
+            maxTokens: 65536,
+        },
+        "gemini-1.5-flash": {
+            id: "gemini-1.5-flash",
+            name: "Gemini 1.5 Flash",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 0.075,
+                output: 0.3,
+                cacheRead: 0.01875,
+                cacheWrite: 0,
+            },
+            contextWindow: 1000000,
             maxTokens: 8192,
         },
-        "gemini-2.5-flash-lite-preview-06-17": {
-            id: "gemini-2.5-flash-lite-preview-06-17",
-            name: "Gemini 2.5 Flash Lite Preview 06-17",
+        "gemini-1.5-flash-8b": {
+            id: "gemini-1.5-flash-8b",
+            name: "Gemini 1.5 Flash-8B",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 0.0375,
+                output: 0.15,
+                cacheRead: 0.01,
+                cacheWrite: 0,
+            },
+            contextWindow: 1000000,
+            maxTokens: 8192,
+        },
+        "gemini-2.5-flash-lite-preview-09-2025": {
+            id: "gemini-2.5-flash-lite-preview-09-2025",
+            name: "Gemini 2.5 Flash Lite Preview 09-25",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -358,129 +477,129 @@ export const MODELS = {
                 cacheRead: 0.025,
                 cacheWrite: 0,
             },
-            contextWindow: 65536,
+            contextWindow: 1048576,
             maxTokens: 65536,
         },
-        "gemini-2.5-flash-preview-04-17": {
-            id: "gemini-2.5-flash-preview-04-17",
-            name: "Gemini 2.5 Flash Preview 04-17",
+        "gemini-1.5-pro": {
+            id: "gemini-1.5-pro",
+            name: "Gemini 1.5 Pro",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
+            reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 0.15,
-                output: 0.6,
-                cacheRead: 0.0375,
+                input: 1.25,
+                output: 5,
+                cacheRead: 0.3125,
                 cacheWrite: 0,
             },
-            contextWindow: 1048576,
-            maxTokens: 65536,
+            contextWindow: 1000000,
+            maxTokens: 8192,
         },
     },
     openai: {
-        "gpt-5-nano": {
-            id: "gpt-5-nano",
-            name: "GPT-5 Nano",
+        "gpt-4.1-nano": {
+            id: "gpt-4.1-nano",
+            name: "GPT-4.1 nano",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
-            reasoning: true,
+            reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 0.05,
+                input: 0.1,
                 output: 0.4,
-                cacheRead: 0.01,
+                cacheRead: 0.03,
                 cacheWrite: 0,
             },
-            contextWindow: 400000,
-            maxTokens: 128000,
+            contextWindow: 1047576,
+            maxTokens: 32768,
         },
-        "o3-pro": {
-            id: "o3-pro",
-            name: "o3-pro",
+        "gpt-4": {
+            id: "gpt-4",
+            name: "GPT-4",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
-            reasoning: true,
-            input: ["text", "image"],
+            reasoning: false,
+            input: ["text"],
             cost: {
-                input: 20,
-                output: 80,
+                input: 30,
+                output: 60,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 200000,
-            maxTokens: 100000,
+            contextWindow: 8192,
+            maxTokens: 8192,
         },
-        "codex-mini-latest": {
-            id: "codex-mini-latest",
-            name: "Codex Mini",
+        "o1-pro": {
+            id: "o1-pro",
+            name: "o1-pro",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 1.5,
-                output: 6,
-                cacheRead: 0.375,
+                input: 150,
+                output: 600,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 200000,
             maxTokens: 100000,
         },
-        "gpt-4.1": {
-            id: "gpt-4.1",
-            name: "GPT-4.1",
+        "gpt-4o-2024-05-13": {
+            id: "gpt-4o-2024-05-13",
+            name: "GPT-4o (2024-05-13)",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 8,
-                cacheRead: 0.5,
+                input: 5,
+                output: 15,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 1047576,
-            maxTokens: 32768,
+            contextWindow: 128000,
+            maxTokens: 4096,
         },
-        "gpt-4-turbo": {
-            id: "gpt-4-turbo",
-            name: "GPT-4 Turbo",
+        "gpt-4o-2024-08-06": {
+            id: "gpt-4o-2024-08-06",
+            name: "GPT-4o (2024-08-06)",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 10,
-                output: 30,
-                cacheRead: 0,
+                input: 2.5,
+                output: 10,
+                cacheRead: 1.25,
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 4096,
+            maxTokens: 16384,
         },
-        "o1": {
-            id: "o1",
-            name: "o1",
+        "gpt-4.1-mini": {
+            id: "gpt-4.1-mini",
+            name: "GPT-4.1 mini",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
-            reasoning: true,
+            reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 15,
-                output: 60,
-                cacheRead: 7.5,
+                input: 0.4,
+                output: 1.6,
+                cacheRead: 0.1,
                 cacheWrite: 0,
             },
-            contextWindow: 200000,
-            maxTokens: 100000,
+            contextWindow: 1047576,
+            maxTokens: 32768,
         },
         "o3-deep-research": {
             id: "o3-deep-research",
@@ -499,145 +618,196 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 100000,
         },
-        "gpt-5": {
-            id: "gpt-5",
-            name: "GPT-5",
+        "gpt-4-turbo": {
+            id: "gpt-4-turbo",
+            name: "GPT-4 Turbo",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
-            reasoning: true,
+            reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 1.25,
-                output: 10,
-                cacheRead: 0.13,
+                input: 10,
+                output: 30,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 400000,
-            maxTokens: 128000,
+            contextWindow: 128000,
+            maxTokens: 4096,
         },
-        "o1-pro": {
-            id: "o1-pro",
-            name: "o1-pro",
+        "o3-mini": {
+            id: "o3-mini",
+            name: "o3-mini",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: true,
-            input: ["text", "image"],
+            input: ["text"],
             cost: {
-                input: 150,
-                output: 600,
-                cacheRead: 0,
+                input: 1.1,
+                output: 4.4,
+                cacheRead: 0.55,
                 cacheWrite: 0,
             },
             contextWindow: 200000,
             maxTokens: 100000,
         },
-        "o3": {
-            id: "o3",
-            name: "o3",
+        "codex-mini-latest": {
+            id: "codex-mini-latest",
+            name: "Codex Mini",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: true,
-            input: ["text", "image"],
+            input: ["text"],
             cost: {
-                input: 2,
-                output: 8,
-                cacheRead: 0.5,
+                input: 1.5,
+                output: 6,
+                cacheRead: 0.375,
                 cacheWrite: 0,
             },
             contextWindow: 200000,
             maxTokens: 100000,
         },
-        "gpt-5-mini": {
-            id: "gpt-5-mini",
-            name: "GPT-5 Mini",
+        "gpt-5-nano": {
+            id: "gpt-5-nano",
+            name: "GPT-5 Nano",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.25,
-                output: 2,
-                cacheRead: 0.03,
+                input: 0.05,
+                output: 0.4,
+                cacheRead: 0.01,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
             maxTokens: 128000,
         },
-        "o4-mini-deep-research": {
-            id: "o4-mini-deep-research",
-            name: "o4-mini-deep-research",
+        "gpt-5-codex": {
+            id: "gpt-5-codex",
+            name: "GPT-5-Codex",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 8,
-                cacheRead: 0.5,
+                input: 0,
+                output: 0,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 200000,
-            maxTokens: 100000,
+            contextWindow: 400000,
+            maxTokens: 128000,
         },
-        "gpt-4o-mini": {
-            id: "gpt-4o-mini",
-            name: "GPT-4o mini",
+        "gpt-4o": {
+            id: "gpt-4o",
+            name: "GPT-4o",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 0.15,
-                output: 0.6,
-                cacheRead: 0.08,
+                input: 2.5,
+                output: 10,
+                cacheRead: 1.25,
                 cacheWrite: 0,
             },
             contextWindow: 128000,
             maxTokens: 16384,
         },
-        "gpt-4.1-nano": {
-            id: "gpt-4.1-nano",
-            name: "GPT-4.1 nano",
+        "gpt-4.1": {
+            id: "gpt-4.1",
+            name: "GPT-4.1",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 0.1,
-                output: 0.4,
-                cacheRead: 0.03,
+                input: 2,
+                output: 8,
+                cacheRead: 0.5,
                 cacheWrite: 0,
             },
             contextWindow: 1047576,
             maxTokens: 32768,
         },
-        "gpt-4.1-mini": {
-            id: "gpt-4.1-mini",
-            name: "GPT-4.1 mini",
+        "o4-mini": {
+            id: "o4-mini",
+            name: "o4-mini",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.4,
-                output: 1.6,
-                cacheRead: 0.1,
+                input: 1.1,
+                output: 4.4,
+                cacheRead: 0.28,
+                cacheWrite: 0,
+            },
+            contextWindow: 200000,
+            maxTokens: 100000,
+        },
+        "o1": {
+            id: "o1",
+            name: "o1",
+            api: "openai-responses",
+            provider: "openai",
+            baseUrl: "https://api.openai.com/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 15,
+                output: 60,
+                cacheRead: 7.5,
+                cacheWrite: 0,
+            },
+            contextWindow: 200000,
+            maxTokens: 100000,
+        },
+        "gpt-5-mini": {
+            id: "gpt-5-mini",
+            name: "GPT-5 Mini",
+            api: "openai-responses",
+            provider: "openai",
+            baseUrl: "https://api.openai.com/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.25,
+                output: 2,
+                cacheRead: 0.03,
+                cacheWrite: 0,
+            },
+            contextWindow: 400000,
+            maxTokens: 128000,
+        },
+        "o3-pro": {
+            id: "o3-pro",
+            name: "o3-pro",
+            api: "openai-responses",
+            provider: "openai",
+            baseUrl: "https://api.openai.com/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 20,
+                output: 80,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 1047576,
-            maxTokens: 32768,
+            contextWindow: 200000,
+            maxTokens: 100000,
         },
-        "gpt-4o": {
-            id: "gpt-4o",
-            name: "GPT-4o",
+        "gpt-4o-2024-11-20": {
+            id: "gpt-4o-2024-11-20",
+            name: "GPT-4o (2024-11-20)",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
@@ -652,56 +822,73 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 16384,
         },
-        "gpt-4": {
-            id: "gpt-4",
-            name: "GPT-4",
+        "o3": {
+            id: "o3",
+            name: "o3",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
-            reasoning: false,
-            input: ["text"],
+            reasoning: true,
+            input: ["text", "image"],
             cost: {
-                input: 30,
-                output: 60,
-                cacheRead: 0,
+                input: 2,
+                output: 8,
+                cacheRead: 0.5,
                 cacheWrite: 0,
             },
-            contextWindow: 8192,
-            maxTokens: 8192,
+            contextWindow: 200000,
+            maxTokens: 100000,
         },
-        "o4-mini": {
-            id: "o4-mini",
-            name: "o4-mini",
+        "o4-mini-deep-research": {
+            id: "o4-mini-deep-research",
+            name: "o4-mini-deep-research",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 1.1,
-                output: 4.4,
-                cacheRead: 0.28,
+                input: 2,
+                output: 8,
+                cacheRead: 0.5,
                 cacheWrite: 0,
             },
             contextWindow: 200000,
             maxTokens: 100000,
         },
-        "o3-mini": {
-            id: "o3-mini",
-            name: "o3-mini",
+        "gpt-4o-mini": {
+            id: "gpt-4o-mini",
+            name: "GPT-4o mini",
+            api: "openai-responses",
+            provider: "openai",
+            baseUrl: "https://api.openai.com/v1",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 0.15,
+                output: 0.6,
+                cacheRead: 0.08,
+                cacheWrite: 0,
+            },
+            contextWindow: 128000,
+            maxTokens: 16384,
+        },
+        "gpt-5": {
+            id: "gpt-5",
+            name: "GPT-5",
             api: "openai-responses",
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 1.1,
-                output: 4.4,
-                cacheRead: 0.55,
+                input: 1.25,
+                output: 10,
+                cacheRead: 0.13,
                 cacheWrite: 0,
             },
-            contextWindow: 200000,
-            maxTokens: 100000,
+            contextWindow: 400000,
+            maxTokens: 128000,
         },
         "gpt-5-chat-latest": {
             id: "gpt-5-chat-latest",
@@ -739,6 +926,40 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 8192,
         },
+        "mistral-saba-24b": {
+            id: "mistral-saba-24b",
+            name: "Mistral Saba 24B",
+            api: "openai-completions",
+            provider: "groq",
+            baseUrl: "https://api.groq.com/openai/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.79,
+                output: 0.79,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 32768,
+            maxTokens: 32768,
+        },
+        "llama3-8b-8192": {
+            id: "llama3-8b-8192",
+            name: "Llama 3 8B",
+            api: "openai-completions",
+            provider: "groq",
+            baseUrl: "https://api.groq.com/openai/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.05,
+                output: 0.08,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 8192,
+            maxTokens: 8192,
+        },
         "qwen-qwq-32b": {
             id: "qwen-qwq-32b",
             name: "Qwen QwQ 32B",
@@ -790,23 +1011,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "llama3-8b-8192": {
-            id: "llama3-8b-8192",
-            name: "Llama 3 8B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.05,
-                output: 0.08,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 8192,
-        },
         "gemma2-9b-it": {
             id: "gemma2-9b-it",
             name: "Gemma 2 9B",
@@ -841,22 +1045,39 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 32768,
         },
-        "mistral-saba-24b": {
-            id: "mistral-saba-24b",
-            name: "Mistral Saba 24B",
+        "moonshotai/kimi-k2-instruct-0905": {
+            id: "moonshotai/kimi-k2-instruct-0905",
+            name: "Kimi K2 Instruct 0905",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.79,
-                output: 0.79,
+                input: 1,
+                output: 3,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 32768,
-            maxTokens: 32768,
+            contextWindow: 262144,
+            maxTokens: 16384,
+        },
+        "moonshotai/kimi-k2-instruct": {
+            id: "moonshotai/kimi-k2-instruct",
+            name: "Kimi K2 Instruct",
+            api: "openai-completions",
+            provider: "groq",
+            baseUrl: "https://api.groq.com/openai/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 1,
+                output: 3,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 16384,
         },
         "openai/gpt-oss-20b": {
             id: "openai/gpt-oss-20b",
@@ -892,40 +1113,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 32768,
         },
-        "meta-llama/llama-4-maverick-17b-128e-instruct": {
-            id: "meta-llama/llama-4-maverick-17b-128e-instruct",
-            name: "Llama 4 Maverick 17B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.2,
-                output: 0.6,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
-        "meta-llama/llama-4-scout-17b-16e-instruct": {
-            id: "meta-llama/llama-4-scout-17b-16e-instruct",
-            name: "Llama 4 Scout 17B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.11,
-                output: 0.34,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
         "qwen/qwen3-32b": {
             id: "qwen/qwen3-32b",
             name: "Qwen3 32B",
@@ -943,39 +1130,39 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 16384,
         },
-        "moonshotai/kimi-k2-instruct-0905": {
-            id: "moonshotai/kimi-k2-instruct-0905",
-            name: "Kimi K2 Instruct 0905",
+        "meta-llama/llama-4-scout-17b-16e-instruct": {
+            id: "meta-llama/llama-4-scout-17b-16e-instruct",
+            name: "Llama 4 Scout 17B",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
             reasoning: false,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 1,
-                output: 3,
+                input: 0.11,
+                output: 0.34,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 262144,
-            maxTokens: 16384,
+            contextWindow: 131072,
+            maxTokens: 8192,
         },
-        "moonshotai/kimi-k2-instruct": {
-            id: "moonshotai/kimi-k2-instruct",
-            name: "Kimi K2 Instruct",
+        "meta-llama/llama-4-maverick-17b-128e-instruct": {
+            id: "meta-llama/llama-4-maverick-17b-128e-instruct",
+            name: "Llama 4 Maverick 17B",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
             reasoning: false,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 1,
-                output: 3,
+                input: 0.2,
+                output: 0.6,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 16384,
+            maxTokens: 8192,
         },
     },
     cerebras: {
@@ -996,23 +1183,6 @@ export const MODELS = {
             contextWindow: 131000,
             maxTokens: 32000,
         },
-        "gpt-oss-120b": {
-            id: "gpt-oss-120b",
-            name: "GPT OSS 120B",
-            api: "openai-completions",
-            provider: "cerebras",
-            baseUrl: "https://api.cerebras.ai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.25,
-                output: 0.69,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 32768,
-        },
         "qwen-3-coder-480b": {
             id: "qwen-3-coder-480b",
             name: "Qwen 3 Coder 480B",
@@ -1022,70 +1192,53 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 2,
-                output: 2,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131000,
-            maxTokens: 32000,
-        },
-    },
-    xai: {
-        "grok-3-mini-fast-latest": {
-            id: "grok-3-mini-fast-latest",
-            name: "Grok 3 Mini Fast Latest",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.6,
-                output: 4,
-                cacheRead: 0.15,
+                input: 2,
+                output: 2,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 8192,
+            contextWindow: 131000,
+            maxTokens: 32000,
         },
-        "grok-3-mini-latest": {
-            id: "grok-3-mini-latest",
-            name: "Grok 3 Mini Latest",
+        "gpt-oss-120b": {
+            id: "gpt-oss-120b",
+            name: "GPT OSS 120B",
             api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
+            provider: "cerebras",
+            baseUrl: "https://api.cerebras.ai/v1",
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.3,
-                output: 0.5,
-                cacheRead: 0.075,
+                input: 0.25,
+                output: 0.69,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 8192,
+            maxTokens: 32768,
         },
-        "grok-beta": {
-            id: "grok-beta",
-            name: "Grok Beta",
+    },
+    xai: {
+        "grok-4-fast-non-reasoning": {
+            id: "grok-4-fast-non-reasoning",
+            name: "Grok 4 Fast (Non-Reasoning)",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
             reasoning: false,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 5,
-                output: 15,
-                cacheRead: 5,
+                input: 0.2,
+                output: 0.5,
+                cacheRead: 0.05,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 4096,
+            contextWindow: 2000000,
+            maxTokens: 30000,
         },
-        "grok-3-fast-latest": {
-            id: "grok-3-fast-latest",
-            name: "Grok 3 Fast Latest",
+        "grok-3-fast": {
+            id: "grok-3-fast",
+            name: "Grok 3 Fast",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
@@ -1100,13 +1253,13 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "grok-3": {
-            id: "grok-3",
-            name: "Grok 3",
+        "grok-4": {
+            id: "grok-4",
+            name: "Grok 4",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 3,
@@ -1114,29 +1267,12 @@ export const MODELS = {
                 cacheRead: 0.75,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
-        "grok-3-mini": {
-            id: "grok-3-mini",
-            name: "Grok 3 Mini",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.3,
-                output: 0.5,
-                cacheRead: 0.075,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
+            contextWindow: 256000,
+            maxTokens: 64000,
         },
-        "grok-2-vision-1212": {
-            id: "grok-2-vision-1212",
-            name: "Grok 2 Vision (1212)",
+        "grok-2-vision": {
+            id: "grok-2-vision",
+            name: "Grok 2 Vision",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
@@ -1151,6 +1287,23 @@ export const MODELS = {
             contextWindow: 8192,
             maxTokens: 4096,
         },
+        "grok-code-fast-1": {
+            id: "grok-code-fast-1",
+            name: "Grok Code Fast 1",
+            api: "openai-completions",
+            provider: "xai",
+            baseUrl: "https://api.x.ai/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.2,
+                output: 1.5,
+                cacheRead: 0.02,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 10000,
+        },
         "grok-2": {
             id: "grok-2",
             name: "Grok 2",
@@ -1168,9 +1321,26 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "grok-2-vision-latest": {
-            id: "grok-2-vision-latest",
-            name: "Grok 2 Vision Latest",
+        "grok-3-mini-fast-latest": {
+            id: "grok-3-mini-fast-latest",
+            name: "Grok 3 Mini Fast Latest",
+            api: "openai-completions",
+            provider: "xai",
+            baseUrl: "https://api.x.ai/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.6,
+                output: 4,
+                cacheRead: 0.15,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 8192,
+        },
+        "grok-2-vision-1212": {
+            id: "grok-2-vision-1212",
+            name: "Grok 2 Vision (1212)",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
@@ -1185,9 +1355,9 @@ export const MODELS = {
             contextWindow: 8192,
             maxTokens: 4096,
         },
-        "grok-3-latest": {
-            id: "grok-3-latest",
-            name: "Grok 3 Latest",
+        "grok-3": {
+            id: "grok-3",
+            name: "Grok 3",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
@@ -1202,22 +1372,22 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "grok-2-vision": {
-            id: "grok-2-vision",
-            name: "Grok 2 Vision",
+        "grok-4-fast": {
+            id: "grok-4-fast",
+            name: "Grok 4 Fast",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 10,
-                cacheRead: 2,
+                input: 0.2,
+                output: 0.5,
+                cacheRead: 0.05,
                 cacheWrite: 0,
             },
-            contextWindow: 8192,
-            maxTokens: 4096,
+            contextWindow: 2000000,
+            maxTokens: 30000,
         },
         "grok-2-latest": {
             id: "grok-2-latest",
@@ -1236,47 +1406,47 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "grok-3-fast": {
-            id: "grok-3-fast",
-            name: "Grok 3 Fast",
+        "grok-2-1212": {
+            id: "grok-2-1212",
+            name: "Grok 2 (1212)",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 5,
-                output: 25,
-                cacheRead: 1.25,
+                input: 2,
+                output: 10,
+                cacheRead: 2,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "grok-2-1212": {
-            id: "grok-2-1212",
-            name: "Grok 2 (1212)",
+        "grok-3-fast-latest": {
+            id: "grok-3-fast-latest",
+            name: "Grok 3 Fast Latest",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 2,
-                output: 10,
-                cacheRead: 2,
+                input: 5,
+                output: 25,
+                cacheRead: 1.25,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "grok-4": {
-            id: "grok-4",
-            name: "Grok 4",
+        "grok-3-latest": {
+            id: "grok-3-latest",
+            name: "Grok 3 Latest",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
-            reasoning: true,
+            reasoning: false,
             input: ["text"],
             cost: {
                 input: 3,
@@ -1284,8 +1454,25 @@ export const MODELS = {
                 cacheRead: 0.75,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
-            maxTokens: 64000,
+            contextWindow: 131072,
+            maxTokens: 8192,
+        },
+        "grok-2-vision-latest": {
+            id: "grok-2-vision-latest",
+            name: "Grok 2 Vision Latest",
+            api: "openai-completions",
+            provider: "xai",
+            baseUrl: "https://api.x.ai/v1",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 2,
+                output: 10,
+                cacheRead: 2,
+                cacheWrite: 0,
+            },
+            contextWindow: 8192,
+            maxTokens: 4096,
         },
         "grok-vision-beta": {
             id: "grok-vision-beta",
@@ -1304,6 +1491,57 @@ export const MODELS = {
             contextWindow: 8192,
             maxTokens: 4096,
         },
+        "grok-3-mini": {
+            id: "grok-3-mini",
+            name: "Grok 3 Mini",
+            api: "openai-completions",
+            provider: "xai",
+            baseUrl: "https://api.x.ai/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.3,
+                output: 0.5,
+                cacheRead: 0.075,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 8192,
+        },
+        "grok-beta": {
+            id: "grok-beta",
+            name: "Grok Beta",
+            api: "openai-completions",
+            provider: "xai",
+            baseUrl: "https://api.x.ai/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 5,
+                output: 15,
+                cacheRead: 5,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 4096,
+        },
+        "grok-3-mini-latest": {
+            id: "grok-3-mini-latest",
+            name: "Grok 3 Mini Latest",
+            api: "openai-completions",
+            provider: "xai",
+            baseUrl: "https://api.x.ai/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.3,
+                output: 0.5,
+                cacheRead: 0.075,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 8192,
+        },
         "grok-3-mini-fast": {
             id: "grok-3-mini-fast",
             name: "Grok 3 Mini Fast",
@@ -1313,33 +1551,50 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.6,
-                output: 4,
-                cacheRead: 0.15,
+                input: 0.6,
+                output: 4,
+                cacheRead: 0.15,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 8192,
+        },
+    },
+    zai: {
+        "glm-4.5-flash": {
+            id: "glm-4.5-flash",
+            name: "GLM-4.5-Flash",
+            api: "anthropic-messages",
+            provider: "zai",
+            baseUrl: "https://api.z.ai/api/anthropic",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 8192,
+            maxTokens: 98304,
         },
-        "grok-code-fast-1": {
-            id: "grok-code-fast-1",
-            name: "Grok Code Fast 1",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
+        "glm-4.5": {
+            id: "glm-4.5",
+            name: "GLM-4.5",
+            api: "anthropic-messages",
+            provider: "zai",
+            baseUrl: "https://api.z.ai/api/anthropic",
+            reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.2,
-                output: 1.5,
-                cacheRead: 0.02,
+                input: 0.6,
+                output: 2.2,
+                cacheRead: 0.11,
                 cacheWrite: 0,
             },
-            contextWindow: 32768,
-            maxTokens: 8192,
+            contextWindow: 131072,
+            maxTokens: 98304,
         },
-    },
-    zai: {
         "glm-4.5-air": {
             id: "glm-4.5-air",
             name: "GLM-4.5-Air",
@@ -1374,75 +1629,109 @@ export const MODELS = {
             contextWindow: 64000,
             maxTokens: 16384,
         },
-        "glm-4.5-flash": {
-            id: "glm-4.5-flash",
-            name: "GLM-4.5-Flash",
+        "glm-4.6": {
+            id: "glm-4.6",
+            name: "GLM-4.6",
             api: "anthropic-messages",
             provider: "zai",
             baseUrl: "https://api.z.ai/api/anthropic",
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
+                input: 0.6,
+                output: 2.2,
+                cacheRead: 0.11,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 98304,
+            contextWindow: 204800,
+            maxTokens: 131072,
         },
-        "glm-4.5": {
-            id: "glm-4.5",
-            name: "GLM-4.5",
-            api: "anthropic-messages",
-            provider: "zai",
-            baseUrl: "https://api.z.ai/api/anthropic",
+    },
+    openrouter: {
+        "z-ai/glm-4.6": {
+            id: "z-ai/glm-4.6",
+            name: "Z.AI: GLM 4.6",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.6,
-                output: 2.2,
-                cacheRead: 0.11,
+                input: 0.5,
+                output: 1.75,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 98304,
+            contextWindow: 202752,
+            maxTokens: 202752,
         },
-    },
-    openrouter: {
-        "alibaba/tongyi-deepresearch-30b-a3b": {
-            id: "alibaba/tongyi-deepresearch-30b-a3b",
-            name: "Tongyi DeepResearch 30B A3B",
+        "deepseek/deepseek-v3.2-exp": {
+            id: "deepseek/deepseek-v3.2-exp",
+            name: "DeepSeek: DeepSeek V3.2 Exp",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.09,
-                output: 0.44999999999999996,
+                input: 0.27,
+                output: 0.39999999999999997,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 163840,
+            maxTokens: 4096,
+        },
+        "qwen/qwen3-vl-235b-a22b-thinking": {
+            id: "qwen/qwen3-vl-235b-a22b-thinking",
+            name: "Qwen: Qwen3 VL 235B A22B Thinking",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.5,
+                output: 3.5,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 65536,
+            maxTokens: 65536,
+        },
+        "qwen/qwen3-vl-235b-a22b-instruct": {
+            id: "qwen/qwen3-vl-235b-a22b-instruct",
+            name: "Qwen: Qwen3 VL 235B A22B Instruct",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.3,
+                output: 1.5,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 32768,
         },
-        "qwen/qwen3-coder-flash": {
-            id: "qwen/qwen3-coder-flash",
-            name: "Qwen: Qwen3 Coder Flash",
+        "qwen/qwen3-max": {
+            id: "qwen/qwen3-max",
+            name: "Qwen: Qwen3 Max",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.3,
-                output: 1.5,
-                cacheRead: 0.08,
+                input: 1.2,
+                output: 6,
+                cacheRead: 0.24,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
-            maxTokens: 65536,
+            contextWindow: 256000,
+            maxTokens: 32768,
         },
         "qwen/qwen3-coder-plus": {
             id: "qwen/qwen3-coder-plus",
@@ -1461,6 +1750,74 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 65536,
         },
+        "deepseek/deepseek-v3.1-terminus": {
+            id: "deepseek/deepseek-v3.1-terminus",
+            name: "DeepSeek: DeepSeek V3.1 Terminus",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.22999999999999998,
+                output: 0.8999999999999999,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 163840,
+            maxTokens: 163840,
+        },
+        "alibaba/tongyi-deepresearch-30b-a3b:free": {
+            id: "alibaba/tongyi-deepresearch-30b-a3b:free",
+            name: "Tongyi DeepResearch 30B A3B (free)",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 131072,
+        },
+        "alibaba/tongyi-deepresearch-30b-a3b": {
+            id: "alibaba/tongyi-deepresearch-30b-a3b",
+            name: "Tongyi DeepResearch 30B A3B",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.09,
+                output: 0.39999999999999997,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 131072,
+        },
+        "qwen/qwen3-coder-flash": {
+            id: "qwen/qwen3-coder-flash",
+            name: "Qwen: Qwen3 Coder Flash",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.3,
+                output: 1.5,
+                cacheRead: 0.08,
+                cacheWrite: 0,
+            },
+            contextWindow: 128000,
+            maxTokens: 65536,
+        },
         "qwen/qwen3-next-80b-a3b-thinking": {
             id: "qwen/qwen3-next-80b-a3b-thinking",
             name: "Qwen: Qwen3 Next 80B A3B Thinking",
@@ -1476,7 +1833,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 262144,
         },
         "qwen/qwen3-next-80b-a3b-instruct": {
             id: "qwen/qwen3-next-80b-a3b-instruct",
@@ -1493,24 +1850,24 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 262144,
         },
-        "meituan/longcat-flash-chat": {
-            id: "meituan/longcat-flash-chat",
-            name: "Meituan: LongCat Flash Chat",
+        "meituan/longcat-flash-chat:free": {
+            id: "meituan/longcat-flash-chat:free",
+            name: "Meituan: LongCat Flash Chat (free)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.12,
-                output: 0.6,
+                input: 0,
+                output: 0,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 4096,
+            maxTokens: 131072,
         },
         "qwen/qwen-plus-2025-07-28": {
             id: "qwen/qwen-plus-2025-07-28",
@@ -1580,57 +1937,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 4096,
         },
-        "openrouter/sonoma-dusk-alpha": {
-            id: "openrouter/sonoma-dusk-alpha",
-            name: "Sonoma Dusk Alpha",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 2000000,
-            maxTokens: 4096,
-        },
-        "openrouter/sonoma-sky-alpha": {
-            id: "openrouter/sonoma-sky-alpha",
-            name: "Sonoma Sky Alpha",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 2000000,
-            maxTokens: 4096,
-        },
-        "qwen/qwen3-max": {
-            id: "qwen/qwen3-max",
-            name: "Qwen: Qwen3 Max",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 1.2,
-                output: 6,
-                cacheRead: 0.24,
-                cacheWrite: 0,
-            },
-            contextWindow: 256000,
-            maxTokens: 32768,
-        },
         "moonshotai/kimi-k2-0905": {
             id: "moonshotai/kimi-k2-0905",
             name: "MoonshotAI: Kimi K2 0905",
@@ -1640,13 +1946,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.38,
-                output: 1.52,
+                input: 0.39,
+                output: 1.9,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 262144,
         },
         "deepcogito/cogito-v2-preview-llama-109b-moe": {
             id: "deepcogito/cogito-v2-preview-llama-109b-moe",
@@ -1714,7 +2020,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 4096,
+            maxTokens: 131072,
         },
         "nousresearch/hermes-4-405b": {
             id: "nousresearch/hermes-4-405b",
@@ -1725,13 +2031,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.24999987999999998,
-                output: 0.999999888,
+                input: 0.3,
+                output: 1.2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 4096,
+            maxTokens: 131072,
         },
         "deepseek/deepseek-chat-v3.1:free": {
             id: "deepseek/deepseek-chat-v3.1:free",
@@ -1747,7 +2053,7 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 163840,
+            contextWindow: 163800,
             maxTokens: 4096,
         },
         "deepseek/deepseek-chat-v3.1": {
@@ -1759,13 +2065,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.24999987999999998,
-                output: 0.999999888,
+                input: 0.19999999999999998,
+                output: 0.7999999999999999,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 163840,
-            maxTokens: 4096,
+            maxTokens: 163840,
         },
         "mistralai/mistral-medium-3.1": {
             id: "mistralai/mistral-medium-3.1",
@@ -1793,13 +2099,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.5,
+                input: 0.6,
                 output: 1.7999999999999998,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 65536,
-            maxTokens: 65536,
+            maxTokens: 16384,
         },
         "ai21/jamba-mini-1.7": {
             id: "ai21/jamba-mini-1.7",
@@ -1861,13 +2167,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.07,
-                output: 0.28,
+                input: 0.06,
+                output: 0.25,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 262144,
         },
         "qwen/qwen3-30b-a3b-instruct-2507": {
             id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -1878,13 +2184,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.07,
-                output: 0.28,
+                input: 0.08,
+                output: 0.33,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 262144,
         },
         "z-ai/glm-4.5": {
             id: "z-ai/glm-4.5",
@@ -1895,13 +2201,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.41,
-                output: 1.6500000000000001,
+                input: 0.35,
+                output: 1.55,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 4096,
+            maxTokens: 131072,
         },
         "z-ai/glm-4.5-air:free": {
             id: "z-ai/glm-4.5-air:free",
@@ -1918,7 +2224,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 4096,
+            maxTokens: 131072,
         },
         "z-ai/glm-4.5-air": {
             id: "z-ai/glm-4.5-air",
@@ -1946,13 +2252,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.09999999999999999,
-                output: 0.39,
+                input: 0.11,
+                output: 0.6,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 262144,
         },
         "z-ai/glm-4-32b": {
             id: "z-ai/glm-4-32b",
@@ -2003,7 +2309,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 262144,
         },
         "qwen/qwen3-235b-a22b-2507": {
             id: "qwen/qwen3-235b-a22b-2507",
@@ -2014,31 +2320,14 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.09999999999999999,
-                output: 0.09999999999999999,
+                input: 0.08,
+                output: 0.55,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
             maxTokens: 262144,
         },
-        "moonshotai/kimi-k2:free": {
-            id: "moonshotai/kimi-k2:free",
-            name: "MoonshotAI: Kimi K2 0711 (free)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 32768,
-            maxTokens: 4096,
-        },
         "moonshotai/kimi-k2": {
             id: "moonshotai/kimi-k2",
             name: "MoonshotAI: Kimi K2 0711",
@@ -2133,13 +2422,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 0.075,
-                output: 0.19999999999999998,
+                input: 0.06,
+                output: 0.18,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
-            maxTokens: 4096,
+            contextWindow: 131072,
+            maxTokens: 131072,
         },
         "minimax/minimax-m1": {
             id: "minimax/minimax-m1",
@@ -2224,7 +2513,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 163840,
-            maxTokens: 4096,
+            maxTokens: 163840,
         },
         "mistralai/devstral-small-2505:free": {
             id: "mistralai/devstral-small-2505:free",
@@ -2252,13 +2541,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.04,
-                output: 0.14,
+                input: 0.049999999999999996,
+                output: 0.22,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 4096,
+            maxTokens: 131072,
         },
         "meta-llama/llama-3.3-8b-instruct:free": {
             id: "meta-llama/llama-3.3-8b-instruct:free",
@@ -2360,7 +2649,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 40960,
-            maxTokens: 4096,
+            maxTokens: 40960,
         },
         "qwen/qwen3-14b": {
             id: "qwen/qwen3-14b",
@@ -2371,8 +2660,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.06,
-                output: 0.24,
+                input: 0.049999999999999996,
+                output: 0.22,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -2388,13 +2677,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.03,
-                output: 0.13,
+                input: 0.049999999999999996,
+                output: 0.19999999999999998,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 40960,
-            maxTokens: 4096,
+            maxTokens: 40960,
         },
         "qwen/qwen3-235b-a22b:free": {
             id: "qwen/qwen3-235b-a22b:free",
@@ -2495,8 +2784,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 1048576,
-            maxTokens: 1048576,
+            contextWindow: 327680,
+            maxTokens: 16384,
         },
         "deepseek/deepseek-chat-v3-0324:free": {
             id: "deepseek/deepseek-chat-v3-0324:free",
@@ -2524,13 +2813,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.24999987999999998,
-                output: 0.999999888,
+                input: 0.24,
+                output: 0.84,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 163840,
-            maxTokens: 4096,
+            maxTokens: 163840,
         },
         "mistralai/mistral-small-3.1-24b-instruct:free": {
             id: "mistralai/mistral-small-3.1-24b-instruct:free",
@@ -2558,13 +2847,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 0.04,
-                output: 0.15,
+                input: 0.049999999999999996,
+                output: 0.09999999999999999,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 96000,
+            contextWindow: 128000,
+            maxTokens: 4096,
         },
         "microsoft/phi-4-multimodal-instruct": {
             id: "microsoft/phi-4-multimodal-instruct",
@@ -2677,13 +2966,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.04,
-                output: 0.15,
+                input: 0.049999999999999996,
+                output: 0.08,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 32768,
-            maxTokens: 4096,
+            maxTokens: 16384,
         },
         "deepseek/deepseek-r1-distill-llama-70b": {
             id: "deepseek/deepseek-r1-distill-llama-70b",
@@ -2700,7 +2989,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 4096,
+            maxTokens: 131072,
         },
         "deepseek/deepseek-r1": {
             id: "deepseek/deepseek-r1",
@@ -2745,13 +3034,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.24999987999999998,
-                output: 0.999999888,
+                input: 0.3,
+                output: 0.85,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 163840,
-            maxTokens: 4096,
+            maxTokens: 163840,
         },
         "meta-llama/llama-3.3-70b-instruct:free": {
             id: "meta-llama/llama-3.3-70b-instruct:free",
@@ -2779,13 +3068,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.012,
-                output: 0.036,
+                input: 0.04,
+                output: 0.12,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 8192,
+            maxTokens: 131072,
         },
         "amazon/nova-lite-v1": {
             id: "amazon/nova-lite-v1",
@@ -2989,7 +3278,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 32768,
-            maxTokens: 4096,
+            maxTokens: 32768,
         },
         "mistralai/pixtral-12b": {
             id: "mistralai/pixtral-12b",
@@ -3008,34 +3297,34 @@ export const MODELS = {
             contextWindow: 32768,
             maxTokens: 4096,
         },
-        "cohere/command-r-08-2024": {
-            id: "cohere/command-r-08-2024",
-            name: "Cohere: Command R (08-2024)",
+        "cohere/command-r-plus-08-2024": {
+            id: "cohere/command-r-plus-08-2024",
+            name: "Cohere: Command R+ (08-2024)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.15,
-                output: 0.6,
+                input: 2.5,
+                output: 10,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 128000,
             maxTokens: 4000,
         },
-        "cohere/command-r-plus-08-2024": {
-            id: "cohere/command-r-plus-08-2024",
-            name: "Cohere: Command R+ (08-2024)",
+        "cohere/command-r-08-2024": {
+            id: "cohere/command-r-08-2024",
+            name: "Cohere: Command R (08-2024)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 2.5,
-                output: 10,
+                input: 0.15,
+                output: 0.6,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -3068,46 +3357,46 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.12,
+                input: 0.3,
                 output: 0.3,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 131072,
+            contextWindow: 65000,
+            maxTokens: 4096,
         },
-        "meta-llama/llama-3.1-8b-instruct": {
-            id: "meta-llama/llama-3.1-8b-instruct",
-            name: "Meta: Llama 3.1 8B Instruct",
+        "meta-llama/llama-3.1-405b-instruct": {
+            id: "meta-llama/llama-3.1-405b-instruct",
+            name: "Meta: Llama 3.1 405B Instruct",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.02,
-                output: 0.03,
+                input: 0.7999999999999999,
+                output: 0.7999999999999999,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 16384,
+            contextWindow: 32768,
             maxTokens: 16384,
         },
-        "meta-llama/llama-3.1-405b-instruct": {
-            id: "meta-llama/llama-3.1-405b-instruct",
-            name: "Meta: Llama 3.1 405B Instruct",
+        "meta-llama/llama-3.1-8b-instruct": {
+            id: "meta-llama/llama-3.1-8b-instruct",
+            name: "Meta: Llama 3.1 8B Instruct",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.7999999999999999,
-                output: 0.7999999999999999,
+                input: 0.02,
+                output: 0.03,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 32768,
+            contextWindow: 16384,
             maxTokens: 16384,
         },
         "meta-llama/llama-3.1-70b-instruct": {
@@ -3119,13 +3408,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.09999999999999999,
-                output: 0.28,
+                input: 0.39999999999999997,
+                output: 0.39999999999999997,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 16384,
+            maxTokens: 4096,
         },
         "mistralai/mistral-nemo": {
             id: "mistralai/mistral-nemo",
@@ -3144,43 +3433,43 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 16384,
         },
-        "mistralai/mistral-7b-instruct-v0.3": {
-            id: "mistralai/mistral-7b-instruct-v0.3",
-            name: "Mistral: Mistral 7B Instruct v0.3",
+        "mistralai/mistral-7b-instruct:free": {
+            id: "mistralai/mistral-7b-instruct:free",
+            name: "Mistral: Mistral 7B Instruct (free)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.028,
-                output: 0.054,
+                input: 0,
+                output: 0,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 32768,
             maxTokens: 16384,
         },
-        "mistralai/mistral-7b-instruct:free": {
-            id: "mistralai/mistral-7b-instruct:free",
-            name: "Mistral: Mistral 7B Instruct (free)",
+        "mistralai/mistral-7b-instruct": {
+            id: "mistralai/mistral-7b-instruct",
+            name: "Mistral: Mistral 7B Instruct",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0,
-                output: 0,
+                input: 0.028,
+                output: 0.054,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 32768,
             maxTokens: 16384,
         },
-        "mistralai/mistral-7b-instruct": {
-            id: "mistralai/mistral-7b-instruct",
-            name: "Mistral: Mistral 7B Instruct",
+        "mistralai/mistral-7b-instruct-v0.3": {
+            id: "mistralai/mistral-7b-instruct-v0.3",
+            name: "Mistral: Mistral 7B Instruct v0.3",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
@@ -3280,74 +3569,6 @@ export const MODELS = {
             contextWindow: 65536,
             maxTokens: 4096,
         },
-        "cohere/command-r-plus": {
-            id: "cohere/command-r-plus",
-            name: "Cohere: Command R+",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 3,
-                output: 15,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 128000,
-            maxTokens: 4000,
-        },
-        "cohere/command-r-plus-04-2024": {
-            id: "cohere/command-r-plus-04-2024",
-            name: "Cohere: Command R+ (04-2024)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 3,
-                output: 15,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 128000,
-            maxTokens: 4000,
-        },
-        "cohere/command-r": {
-            id: "cohere/command-r",
-            name: "Cohere: Command R",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.5,
-                output: 1.5,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 128000,
-            maxTokens: 4000,
-        },
-        "cohere/command-r-03-2024": {
-            id: "cohere/command-r-03-2024",
-            name: "Cohere: Command R (03-2024)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.5,
-                output: 1.5,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 128000,
-            maxTokens: 4000,
-        },
         "mistralai/mistral-large": {
             id: "mistralai/mistral-large",
             name: "Mistral Large",
@@ -3365,34 +3586,34 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 4096,
         },
-        "mistralai/mistral-tiny": {
-            id: "mistralai/mistral-tiny",
-            name: "Mistral Tiny",
+        "mistralai/mistral-small": {
+            id: "mistralai/mistral-small",
+            name: "Mistral Small",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.25,
-                output: 0.25,
+                input: 0.19999999999999998,
+                output: 0.6,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 32768,
             maxTokens: 4096,
         },
-        "mistralai/mistral-small": {
-            id: "mistralai/mistral-small",
-            name: "Mistral Small",
+        "mistralai/mistral-tiny": {
+            id: "mistralai/mistral-tiny",
+            name: "Mistral Tiny",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.19999999999999998,
-                output: 0.6,
+                input: 0.25,
+                output: 0.25,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -3408,8 +3629,8 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.39999999999999997,
-                output: 0.39999999999999997,
+                input: 0.54,
+                output: 0.54,
                 cacheRead: 0,
                 cacheWrite: 0,
             },