npm - @earendil-works/pi-ai - Versions diffs - 0.74.1 → 0.74.2 - Mend

@earendil-works/pi-ai 0.74.1 → 0.74.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

package/dist/image-models.generated.d.ts +15 -0
package/dist/image-models.generated.d.ts.map +1 -1
package/dist/image-models.generated.js +15 -0
package/dist/image-models.generated.js.map +1 -1
package/dist/models.generated.d.ts +256 -351
package/dist/models.generated.d.ts.map +1 -1
package/dist/models.generated.js +325 -437
package/dist/models.generated.js.map +1 -1
package/package.json +1 -1

package/dist/models.generated.js CHANGED Viewed

@@ -908,8 +908,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
-            maxTokens: 256000,
+            contextWindow: 262143,
+            maxTokens: 16000,
         },
         "moonshotai.kimi-k2.5": {
             id: "moonshotai.kimi-k2.5",
@@ -925,8 +925,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
-            maxTokens: 256000,
+            contextWindow: 262143,
+            maxTokens: 16000,
         },
         "nvidia.nemotron-nano-12b-v2": {
             id: "nvidia.nemotron-nano-12b-v2",
@@ -3275,6 +3275,42 @@ export const MODELS = {
             contextWindow: 256000,
             maxTokens: 16384,
         },
+        "@cf/ibm-granite/granite-4.0-h-micro": {
+            id: "@cf/ibm-granite/granite-4.0-h-micro",
+            name: "Granite 4.0 H Micro",
+            api: "openai-completions",
+            provider: "cloudflare-workers-ai",
+            baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
+            compat: { "sendSessionAffinityHeaders": true },
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.017,
+                output: 0.112,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131000,
+            maxTokens: 131000,
+        },
+        "@cf/meta/llama-3.3-70b-instruct-fp8-fast": {
+            id: "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
+            name: "Llama 3.3 70B Instruct fp8 Fast",
+            api: "openai-completions",
+            provider: "cloudflare-workers-ai",
+            baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
+            compat: { "sendSessionAffinityHeaders": true },
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.293,
+                output: 2.253,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 24000,
+            maxTokens: 24000,
+        },
         "@cf/meta/llama-4-scout-17b-16e-instruct": {
             id: "@cf/meta/llama-4-scout-17b-16e-instruct",
             name: "Llama 4 Scout 17B 16E Instruct",
@@ -3290,9 +3326,27 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
+            contextWindow: 131000,
             maxTokens: 16384,
         },
+        "@cf/mistralai/mistral-small-3.1-24b-instruct": {
+            id: "@cf/mistralai/mistral-small-3.1-24b-instruct",
+            name: "Mistral Small 3.1 24B Instruct",
+            api: "openai-completions",
+            provider: "cloudflare-workers-ai",
+            baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
+            compat: { "sendSessionAffinityHeaders": true },
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0.351,
+                output: 0.555,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 128000,
+            maxTokens: 128000,
+        },
         "@cf/moonshotai/kimi-k2.5": {
             id: "@cf/moonshotai/kimi-k2.5",
             name: "Kimi K2.5",
@@ -3326,7 +3380,7 @@ export const MODELS = {
                 cacheRead: 0.16,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
+            contextWindow: 262144,
             maxTokens: 256000,
         },
         "@cf/nvidia/nemotron-3-120b-a12b": {
@@ -3383,6 +3437,24 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 16384,
         },
+        "@cf/qwen/qwen3-30b-a3b-fp8": {
+            id: "@cf/qwen/qwen3-30b-a3b-fp8",
+            name: "Qwen3 30B A3b fp8",
+            api: "openai-completions",
+            provider: "cloudflare-workers-ai",
+            baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
+            compat: { "sendSessionAffinityHeaders": true },
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.0509,
+                output: 0.335,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 32768,
+            maxTokens: 32768,
+        },
         "@cf/zai-org/glm-4.7-flash": {
             id: "@cf/zai-org/glm-4.7-flash",
             name: "GLM-4.7-Flash",
@@ -3393,7 +3465,7 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.06,
+                input: 0.0605,
                 output: 0.4,
                 cacheRead: 0,
                 cacheWrite: 0,
@@ -3479,6 +3551,24 @@ export const MODELS = {
             contextWindow: 160000,
             maxTokens: 160000,
         },
+        "accounts/fireworks/models/deepseek-v4-flash": {
+            id: "accounts/fireworks/models/deepseek-v4-flash",
+            name: "DeepSeek V4 Flash",
+            api: "anthropic-messages",
+            provider: "fireworks",
+            baseUrl: "https://api.fireworks.ai/inference",
+            compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.14,
+                output: 0.28,
+                cacheRead: 0.03,
+                cacheWrite: 0,
+            },
+            contextWindow: 1000000,
+            maxTokens: 384000,
+        },
         "accounts/fireworks/models/deepseek-v4-pro": {
             id: "accounts/fireworks/models/deepseek-v4-pro",
             name: "DeepSeek V4 Pro",
@@ -4148,57 +4238,6 @@ export const MODELS = {
         },
     },
     "google": {
-        "gemini-1.5-flash": {
-            id: "gemini-1.5-flash",
-            name: "Gemini 1.5 Flash",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.075,
-                output: 0.3,
-                cacheRead: 0.01875,
-                cacheWrite: 0,
-            },
-            contextWindow: 1000000,
-            maxTokens: 8192,
-        },
-        "gemini-1.5-flash-8b": {
-            id: "gemini-1.5-flash-8b",
-            name: "Gemini 1.5 Flash-8B",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.0375,
-                output: 0.15,
-                cacheRead: 0.01,
-                cacheWrite: 0,
-            },
-            contextWindow: 1000000,
-            maxTokens: 8192,
-        },
-        "gemini-1.5-pro": {
-            id: "gemini-1.5-pro",
-            name: "Gemini 1.5 Pro",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 1.25,
-                output: 5,
-                cacheRead: 0.3125,
-                cacheWrite: 0,
-            },
-            contextWindow: 1000000,
-            maxTokens: 8192,
-        },
         "gemini-2.0-flash": {
             id: "gemini-2.0-flash",
             name: "Gemini 2.0 Flash",
@@ -4218,7 +4257,7 @@ export const MODELS = {
         },
         "gemini-2.0-flash-lite": {
             id: "gemini-2.0-flash-lite",
-            name: "Gemini 2.0 Flash Lite",
+            name: "Gemini 2.0 Flash-Lite",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4252,7 +4291,7 @@ export const MODELS = {
         },
         "gemini-2.5-flash-lite": {
             id: "gemini-2.5-flash-lite",
-            name: "Gemini 2.5 Flash Lite",
+            name: "Gemini 2.5 Flash-Lite",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4267,91 +4306,6 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
-        "gemini-2.5-flash-lite-preview-06-17": {
-            id: "gemini-2.5-flash-lite-preview-06-17",
-            name: "Gemini 2.5 Flash Lite Preview 06-17",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.1,
-                output: 0.4,
-                cacheRead: 0.025,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 65536,
-        },
-        "gemini-2.5-flash-lite-preview-09-2025": {
-            id: "gemini-2.5-flash-lite-preview-09-2025",
-            name: "Gemini 2.5 Flash Lite Preview 09-25",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.1,
-                output: 0.4,
-                cacheRead: 0.025,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 65536,
-        },
-        "gemini-2.5-flash-preview-04-17": {
-            id: "gemini-2.5-flash-preview-04-17",
-            name: "Gemini 2.5 Flash Preview 04-17",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.15,
-                output: 0.6,
-                cacheRead: 0.0375,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 65536,
-        },
-        "gemini-2.5-flash-preview-05-20": {
-            id: "gemini-2.5-flash-preview-05-20",
-            name: "Gemini 2.5 Flash Preview 05-20",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.15,
-                output: 0.6,
-                cacheRead: 0.0375,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 65536,
-        },
-        "gemini-2.5-flash-preview-09-2025": {
-            id: "gemini-2.5-flash-preview-09-2025",
-            name: "Gemini 2.5 Flash Preview 09-25",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.3,
-                output: 2.5,
-                cacheRead: 0.075,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 65536,
-        },
         "gemini-2.5-pro": {
             id: "gemini-2.5-pro",
             name: "Gemini 2.5 Pro",
@@ -4369,40 +4323,6 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
-        "gemini-2.5-pro-preview-05-06": {
-            id: "gemini-2.5-pro-preview-05-06",
-            name: "Gemini 2.5 Pro Preview 05-06",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 1.25,
-                output: 10,
-                cacheRead: 0.31,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 65536,
-        },
-        "gemini-2.5-pro-preview-06-05": {
-            id: "gemini-2.5-pro-preview-06-05",
-            name: "Gemini 2.5 Pro Preview 06-05",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 1.25,
-                output: 10,
-                cacheRead: 0.31,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 65536,
-        },
         "gemini-3-flash-preview": {
             id: "gemini-3-flash-preview",
             name: "Gemini 3 Flash Preview",
@@ -4436,8 +4356,8 @@ export const MODELS = {
                 cacheRead: 0.2,
                 cacheWrite: 0,
             },
-            contextWindow: 1000000,
-            maxTokens: 64000,
+            contextWindow: 1048576,
+            maxTokens: 65536,
         },
         "gemini-3.1-flash-lite": {
             id: "gemini-3.1-flash-lite",
@@ -4511,6 +4431,24 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
+        "gemini-3.5-flash": {
+            id: "gemini-3.5-flash",
+            name: "Gemini 3.5 Flash",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: true,
+            thinkingLevelMap: { "off": null },
+            input: ["text", "image"],
+            cost: {
+                input: 1.5,
+                output: 9,
+                cacheRead: 0.15,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
         "gemini-flash-latest": {
             id: "gemini-flash-latest",
             name: "Gemini Flash Latest",
@@ -4545,60 +4483,9 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
-        "gemini-live-2.5-flash": {
-            id: "gemini-live-2.5-flash",
-            name: "Gemini Live 2.5 Flash",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.5,
-                output: 2,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 128000,
-            maxTokens: 8000,
-        },
-        "gemini-live-2.5-flash-preview-native-audio": {
-            id: "gemini-live-2.5-flash-preview-native-audio",
-            name: "Gemini Live 2.5 Flash Preview Native Audio",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.5,
-                output: 2,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 65536,
-        },
-        "gemma-3-27b-it": {
-            id: "gemma-3-27b-it",
-            name: "Gemma 3 27B",
-            api: "google-generative-ai",
-            provider: "google",
-            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
         "gemma-4-26b-a4b-it": {
             id: "gemma-4-26b-a4b-it",
-            name: "Gemma 4 26B",
+            name: "Gemma 4 26B A4B IT",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4611,12 +4498,12 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
-            maxTokens: 8192,
+            contextWindow: 262144,
+            maxTokens: 32768,
         },
         "gemma-4-31b-it": {
             id: "gemma-4-31b-it",
-            name: "Gemma 4 31B",
+            name: "Gemma 4 31B IT",
             api: "google-generative-ai",
             provider: "google",
             baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4629,8 +4516,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
-            maxTokens: 8192,
+            contextWindow: 262144,
+            maxTokens: 32768,
         },
     },
     "google-vertex": {
@@ -7542,6 +7429,24 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
+        "gemini-3.5-flash": {
+            id: "gemini-3.5-flash",
+            name: "Gemini 3.5 Flash",
+            api: "google-generative-ai",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            thinkingLevelMap: { "off": null },
+            input: ["text", "image"],
+            cost: {
+                input: 1.5,
+                output: 9,
+                cacheRead: 0.15,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
         "glm-5": {
             id: "glm-5",
             name: "GLM-5",
@@ -7864,6 +7769,23 @@ export const MODELS = {
             contextWindow: 1050000,
             maxTokens: 128000,
         },
+        "grok-build-0.1": {
+            id: "grok-build-0.1",
+            name: "Grok Build 0.1",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1,
+                output: 2,
+                cacheRead: 0.2,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 256000,
+        },
         "kimi-k2.5": {
             id: "kimi-k2.5",
             name: "Kimi K2.5",
@@ -7915,23 +7837,6 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
-        "minimax-m2.5-free": {
-            id: "minimax-m2.5-free",
-            name: "MiniMax M2.5 Free",
-            api: "anthropic-messages",
-            provider: "opencode",
-            baseUrl: "https://opencode.ai/zen",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 204800,
-            maxTokens: 131072,
-        },
         "minimax-m2.7": {
             id: "minimax-m2.7",
             name: "MiniMax M2.7",
@@ -8567,30 +8472,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 3,
-                output: 15,
-                cacheRead: 0.3,
-                cacheWrite: 3.75,
-            },
-            contextWindow: 1000000,
-            maxTokens: 128000,
-        },
-        "arcee-ai/trinity-large-preview": {
-            id: "arcee-ai/trinity-large-preview",
-            name: "Arcee AI: Trinity Large Preview",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.15,
-                output: 0.44999999999999996,
-                cacheRead: 0,
-                cacheWrite: 0,
+                input: 3,
+                output: 15,
+                cacheRead: 0.3,
+                cacheWrite: 3.75,
             },
-            contextWindow: 131000,
-            maxTokens: 4096,
+            contextWindow: 1000000,
+            maxTokens: 128000,
         },
         "arcee-ai/trinity-large-thinking": {
             id: "arcee-ai/trinity-large-thinking",
@@ -9054,7 +8942,7 @@ export const MODELS = {
                 cacheRead: 0.024999999999999998,
                 cacheWrite: 0.08333333333333334,
             },
-            contextWindow: 1048576,
+            contextWindow: 1000000,
             maxTokens: 8192,
         },
         "google/gemini-2.0-flash-lite-001": {
@@ -9261,6 +9149,23 @@ export const MODELS = {
             contextWindow: 1048756,
             maxTokens: 65536,
         },
+        "google/gemini-3.5-flash": {
+            id: "google/gemini-3.5-flash",
+            name: "Google: Gemini 3.5 Flash",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1.5,
+                output: 9,
+                cacheRead: 0.15,
+                cacheWrite: 0.08333333333333334,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
         "google/gemma-3-12b-it": {
             id: "google/gemma-3-12b-it",
             name: "Google: Gemma 3 12B",
@@ -9304,13 +9209,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.07,
-                output: 0.33999999999999997,
+                input: 0.06,
+                output: 0.33,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 16384,
+            maxTokens: 4096,
         },
         "google/gemma-4-26b-a4b-it:free": {
             id: "google/gemma-4-26b-a4b-it:free",
@@ -9407,9 +9312,9 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.3,
-                output: 2.5,
-                cacheRead: 0.06,
+                input: 0.075,
+                output: 0.625,
+                cacheRead: 0.015,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -9901,12 +9806,12 @@ export const MODELS = {
             input: ["text"],
             cost: {
                 input: 0.02,
-                output: 0.04,
+                output: 0.03,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 16384,
+            maxTokens: 4096,
         },
         "mistralai/mistral-saba": {
             id: "mistralai/mistral-saba",
@@ -10189,13 +10094,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.09999999999999999,
-                output: 0.5,
+                input: 0.09,
+                output: 0.44999999999999996,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 1000000,
-            maxTokens: 16384,
+            maxTokens: 4096,
         },
         "nvidia/nemotron-3-super-120b-a12b:free": {
             id: "nvidia/nemotron-3-super-120b-a12b:free",
@@ -11018,12 +10923,12 @@ export const MODELS = {
             input: ["text"],
             cost: {
                 input: 0.039,
-                output: 0.19,
+                output: 0.18,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 4096,
         },
         "openai/gpt-oss-120b:free": {
             id: "openai/gpt-oss-120b:free",
@@ -11935,13 +11840,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.14,
+                input: 0.13899999999999998,
                 output: 1,
-                cacheRead: 0.049999999999999996,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 81920,
+            maxTokens: 4096,
         },
         "qwen/qwen3.5-397b-a17b": {
             id: "qwen/qwen3.5-397b-a17b",
@@ -11954,7 +11859,7 @@ export const MODELS = {
             cost: {
                 input: 0.39,
                 output: 2.34,
-                cacheRead: 0.195,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -12037,13 +11942,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.32,
+                input: 0.317,
                 output: 3.1999999999999997,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 81920,
+            maxTokens: 262140,
         },
         "qwen/qwen3.6-35b-a3b": {
             id: "qwen/qwen3.6-35b-a3b",
@@ -12113,6 +12018,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 65536,
         },
+        "qwen/qwen3.7-max": {
+            id: "qwen/qwen3.7-max",
+            name: "Qwen: Qwen3.7 Max",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 2.5,
+                output: 7.5,
+                cacheRead: 0,
+                cacheWrite: 3.125,
+            },
+            contextWindow: 1000000,
+            maxTokens: 65536,
+        },
         "rekaai/reka-edge": {
             id: "rekaai/reka-edge",
             name: "Reka Edge",
@@ -12190,13 +12112,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.09999999999999999,
+                input: 0.09,
                 output: 0.3,
-                cacheRead: 0,
+                cacheRead: 0.02,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 65536,
+            maxTokens: 16384,
         },
         "tencent/hy3-preview": {
             id: "tencent/hy3-preview",
@@ -12300,6 +12222,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 4096,
         },
+        "x-ai/grok-build-0.1": {
+            id: "x-ai/grok-build-0.1",
+            name: "xAI: Grok Build 0.1",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1,
+                output: 2,
+                cacheRead: 0.19999999999999998,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 4096,
+        },
         "xiaomi/mimo-v2-flash": {
             id: "xiaomi/mimo-v2-flash",
             name: "Xiaomi: MiMo-V2-Flash",
@@ -12666,9 +12605,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.5,
-                output: 3,
-                cacheRead: 0.049999999999999996,
+                input: 1.5,
+                output: 9,
+                cacheRead: 0.15,
                 cacheWrite: 0.08333333333333334,
             },
             contextWindow: 1048576,
@@ -13372,6 +13311,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 64000,
         },
+        "alibaba/qwen3.7-max": {
+            id: "alibaba/qwen3.7-max",
+            name: "Qwen 3.7 Max",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 2.5,
+                output: 7.5,
+                cacheRead: 0.5,
+                cacheWrite: 3.125,
+            },
+            contextWindow: 991000,
+            maxTokens: 64000,
+        },
         "anthropic/claude-3-haiku": {
             id: "anthropic/claude-3-haiku",
             name: "Claude 3 Haiku",
@@ -13935,6 +13891,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 64000,
         },
+        "google/gemini-3.5-flash": {
+            id: "google/gemini-3.5-flash",
+            name: "Gemini 3.5 Flash",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1.5,
+                output: 9,
+                cacheRead: 0.15,
+                cacheWrite: 0,
+            },
+            contextWindow: 1000000,
+            maxTokens: 64000,
+        },
         "google/gemma-4-26b-a4b-it": {
             id: "google/gemma-4-26b-a4b-it",
             name: "Gemma 4 26B A4B IT",
@@ -14394,6 +14367,23 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 64000,
         },
+        "mistral/mistral-medium-3.5": {
+            id: "mistral/mistral-medium-3.5",
+            name: "Mistral Medium Latest",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1.5,
+                output: 7.5,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 256000,
+        },
         "mistral/mistral-small": {
             id: "mistral/mistral-small",
             name: "Mistral Small",
@@ -15409,6 +15399,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 1000000,
         },
+        "xai/grok-build-0.1": {
+            id: "xai/grok-build-0.1",
+            name: "Grok Build 0.1",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1,
+                output: 2,
+                cacheRead: 0.19999999999999998,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 256000,
+        },
         "xiaomi/mimo-v2-flash": {
             id: "xiaomi/mimo-v2-flash",
             name: "MiMo V2 Flash",
@@ -15700,108 +15707,6 @@ export const MODELS = {
         },
     },
     "xai": {
-        "grok-2": {
-            id: "grok-2",
-            name: "Grok 2",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 2,
-                output: 10,
-                cacheRead: 2,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
-        "grok-2-1212": {
-            id: "grok-2-1212",
-            name: "Grok 2 (1212)",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 2,
-                output: 10,
-                cacheRead: 2,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
-        "grok-2-latest": {
-            id: "grok-2-latest",
-            name: "Grok 2 Latest",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 2,
-                output: 10,
-                cacheRead: 2,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
-        "grok-2-vision": {
-            id: "grok-2-vision",
-            name: "Grok 2 Vision",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 2,
-                output: 10,
-                cacheRead: 2,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 4096,
-        },
-        "grok-2-vision-1212": {
-            id: "grok-2-vision-1212",
-            name: "Grok 2 Vision (1212)",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 2,
-                output: 10,
-                cacheRead: 2,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 4096,
-        },
-        "grok-2-vision-latest": {
-            id: "grok-2-vision-latest",
-            name: "Grok 2 Vision Latest",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 2,
-                output: 10,
-                cacheRead: 2,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 4096,
-        },
         "grok-3": {
             id: "grok-3",
             name: "Grok 3",
@@ -15845,8 +15750,8 @@ export const MODELS = {
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 6,
+                input: 1.25,
+                output: 2.5,
                 cacheRead: 0.2,
                 cacheWrite: 0,
             },
@@ -15862,8 +15767,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 6,
+                input: 1.25,
+                output: 2.5,
                 cacheRead: 0.2,
                 cacheWrite: 0,
             },
@@ -15887,22 +15792,22 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 30000,
         },
-        "grok-beta": {
-            id: "grok-beta",
-            name: "Grok Beta",
+        "grok-build-0.1": {
+            id: "grok-build-0.1",
+            name: "Grok Build 0.1",
             api: "openai-completions",
             provider: "xai",
             baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
-            input: ["text"],
+            reasoning: true,
+            input: ["text", "image"],
             cost: {
-                input: 5,
-                output: 15,
-                cacheRead: 5,
+                input: 1,
+                output: 2,
+                cacheRead: 0.2,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 4096,
+            contextWindow: 256000,
+            maxTokens: 256000,
         },
         "grok-code-fast-1": {
             id: "grok-code-fast-1",
@@ -15921,23 +15826,6 @@ export const MODELS = {
             contextWindow: 32768,
             maxTokens: 8192,
         },
-        "grok-vision-beta": {
-            id: "grok-vision-beta",
-            name: "Grok Vision Beta",
-            api: "openai-completions",
-            provider: "xai",
-            baseUrl: "https://api.x.ai/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 5,
-                output: 15,
-                cacheRead: 5,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 4096,
-        },
     },
     "xiaomi": {
         "mimo-v2-flash": {