@hyperspaceng/neural-ai 0.65.3 → 0.67.2

This diff shows the changes between publicly released versions of this package as published to a supported registry. It is provided for informational purposes only and reflects the package contents as they appear in the public registry.
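For orientation, every entry touched below shares the same record shape. The following is a minimal sketch of that shape and a cost helper, reconstructed only from the fields visible in this diff; the interface and function names are illustrative (not part of the package's public API), and the assumption that cost values are USD per million tokens follows common convention rather than anything stated here.

```ts
// Sketch of the shape shared by the MODELS entries changed in this diff.
// Field names come from the diff itself; type names are illustrative.
interface ModelCost {
  input: number;      // prompt tokens
  output: number;     // completion tokens
  cacheRead: number;  // cached prompt tokens read
  cacheWrite: number; // prompt tokens written to cache
}

interface ModelSpec {
  id: string;
  name: string;
  api: string;                 // e.g. "openai-completions", "anthropic-messages"
  provider: string;            // e.g. "openrouter", "vercel-ai-gateway"
  baseUrl: string;
  reasoning: boolean;
  input: ("text" | "image")[];
  cost: ModelCost;
  contextWindow: number;       // tokens
  maxTokens: number;           // maximum output tokens
  compat?: { supportsDeveloperRole?: boolean };
}

// Hypothetical helper, assuming prices are USD per million tokens.
function estimateCostUSD(
  model: ModelSpec,
  promptTokens: number,
  completionTokens: number,
): number {
  return (
    (promptTokens * model.cost.input + completionTokens * model.cost.output) /
    1_000_000
  );
}
```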
@@ -1209,6 +1209,23 @@ export const MODELS = {
  contextWindow: 131072,
  maxTokens: 65536,
  },
+ "qwen.qwen3-coder-next": {
+ id: "qwen.qwen3-coder-next",
+ name: "Qwen3 Coder Next",
+ api: "bedrock-converse-stream",
+ provider: "amazon-bedrock",
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+ reasoning: true,
+ input: ["text"],
+ cost: {
+ input: 0.22,
+ output: 1.8,
+ cacheRead: 0,
+ cacheWrite: 0,
+ },
+ contextWindow: 131072,
+ maxTokens: 65536,
+ },
  "qwen.qwen3-next-80b-a3b": {
  id: "qwen.qwen3-next-80b-a3b",
  name: "Qwen/Qwen3-Next-80B-A3B-Instruct",
@@ -4339,6 +4356,24 @@ export const MODELS = {
  contextWindow: 204800,
  maxTokens: 131072,
  },
+ "MiniMaxAI/MiniMax-M2.7": {
+ id: "MiniMaxAI/MiniMax-M2.7",
+ name: "MiniMax-M2.7",
+ api: "openai-completions",
+ provider: "huggingface",
+ baseUrl: "https://router.huggingface.co/v1",
+ compat: { "supportsDeveloperRole": false },
+ reasoning: true,
+ input: ["text"],
+ cost: {
+ input: 0.3,
+ output: 1.2,
+ cacheRead: 0.06,
+ cacheWrite: 0,
+ },
+ contextWindow: 204800,
+ maxTokens: 131072,
+ },
  "Qwen/Qwen3-235B-A22B-Thinking-2507": {
  id: "Qwen/Qwen3-235B-A22B-Thinking-2507",
  name: "Qwen3-235B-A22B-Thinking-2507",
@@ -4627,6 +4662,24 @@ export const MODELS = {
  contextWindow: 202752,
  maxTokens: 131072,
  },
+ "zai-org/GLM-5.1": {
+ id: "zai-org/GLM-5.1",
+ name: "GLM-5.1",
+ api: "openai-completions",
+ provider: "huggingface",
+ baseUrl: "https://router.huggingface.co/v1",
+ compat: { "supportsDeveloperRole": false },
+ reasoning: true,
+ input: ["text"],
+ cost: {
+ input: 1,
+ output: 3.2,
+ cacheRead: 0.2,
+ cacheWrite: 0,
+ },
+ contextWindow: 202752,
+ maxTokens: 131072,
+ },
  },
  "kimi-coding": {
  "k2p5": {
@@ -6239,6 +6292,23 @@ export const MODELS = {
  contextWindow: 204800,
  maxTokens: 131072,
  },
+ "glm-5.1": {
+ id: "glm-5.1",
+ name: "GLM-5.1",
+ api: "openai-completions",
+ provider: "opencode",
+ baseUrl: "https://opencode.ai/zen/v1",
+ reasoning: true,
+ input: ["text"],
+ cost: {
+ input: 1.4,
+ output: 4.4,
+ cacheRead: 0.26,
+ cacheWrite: 0,
+ },
+ contextWindow: 204800,
+ maxTokens: 131072,
+ },
  "gpt-5": {
  id: "gpt-5",
  name: "GPT-5",
@@ -6545,23 +6615,6 @@ export const MODELS = {
  contextWindow: 204800,
  maxTokens: 128000,
  },
- "qwen3.6-plus-free": {
- id: "qwen3.6-plus-free",
- name: "Qwen3.6 Plus Free",
- api: "openai-completions",
- provider: "opencode",
- baseUrl: "https://opencode.ai/zen/v1",
- reasoning: true,
- input: ["text"],
- cost: {
- input: 0,
- output: 0,
- cacheRead: 0,
- cacheWrite: 0,
- },
- contextWindow: 1048576,
- maxTokens: 64000,
- },
  },
  "opencode-go": {
  "glm-5": {
@@ -6581,6 +6634,23 @@ export const MODELS = {
  contextWindow: 204800,
  maxTokens: 131072,
  },
+ "glm-5.1": {
+ id: "glm-5.1",
+ name: "GLM-5.1",
+ api: "openai-completions",
+ provider: "opencode-go",
+ baseUrl: "https://opencode.ai/zen/go/v1",
+ reasoning: true,
+ input: ["text"],
+ cost: {
+ input: 1.4,
+ output: 4.4,
+ cacheRead: 0.26,
+ cacheWrite: 0,
+ },
+ contextWindow: 204800,
+ maxTokens: 131072,
+ },
  "kimi-k2.5": {
  id: "kimi-k2.5",
  name: "Kimi K2.5",
@@ -6635,9 +6705,9 @@ export const MODELS = {
  "minimax-m2.5": {
  id: "minimax-m2.5",
  name: "MiniMax M2.5",
- api: "openai-completions",
+ api: "anthropic-messages",
  provider: "opencode-go",
- baseUrl: "https://opencode.ai/zen/go/v1",
+ baseUrl: "https://opencode.ai/zen/go",
  reasoning: true,
  input: ["text"],
  cost: {
@@ -6853,7 +6923,7 @@ export const MODELS = {
  cacheWrite: 3.75,
  },
  contextWindow: 200000,
- maxTokens: 64000,
+ maxTokens: 128000,
  },
  "anthropic/claude-3.7-sonnet:thinking": {
  id: "anthropic/claude-3.7-sonnet:thinking",
@@ -6957,6 +7027,23 @@ export const MODELS = {
  contextWindow: 1000000,
  maxTokens: 128000,
  },
+ "anthropic/claude-opus-4.6-fast": {
+ id: "anthropic/claude-opus-4.6-fast",
+ name: "Anthropic: Claude Opus 4.6 (Fast)",
+ api: "openai-completions",
+ provider: "openrouter",
+ baseUrl: "https://openrouter.ai/api/v1",
+ reasoning: true,
+ input: ["text", "image"],
+ cost: {
+ input: 30,
+ output: 150,
+ cacheRead: 3,
+ cacheWrite: 37.5,
+ },
+ contextWindow: 1000000,
+ maxTokens: 128000,
+ },
  "anthropic/claude-sonnet-4": {
  id: "anthropic/claude-sonnet-4",
  name: "Anthropic: Claude Sonnet 4",
@@ -6971,7 +7058,7 @@ export const MODELS = {
  cacheRead: 0.3,
  cacheWrite: 3.75,
  },
- contextWindow: 200000,
+ contextWindow: 1000000,
  maxTokens: 64000,
  },
  "anthropic/claude-sonnet-4.5": {
@@ -7036,7 +7123,7 @@ export const MODELS = {
  cost: {
  input: 0.22,
  output: 0.85,
- cacheRead: 0,
+ cacheRead: 0.06,
  cacheWrite: 0,
  },
  contextWindow: 262144,
@@ -7059,23 +7146,6 @@ export const MODELS = {
  contextWindow: 131072,
  maxTokens: 131072,
  },
- "arcee-ai/trinity-mini:free": {
- id: "arcee-ai/trinity-mini:free",
- name: "Arcee AI: Trinity Mini (free)",
- api: "openai-completions",
- provider: "openrouter",
- baseUrl: "https://openrouter.ai/api/v1",
- reasoning: true,
- input: ["text"],
- cost: {
- input: 0,
- output: 0,
- cacheRead: 0,
- cacheWrite: 0,
- },
- contextWindow: 131072,
- maxTokens: 4096,
- },
  "arcee-ai/virtuoso-large": {
  id: "arcee-ai/virtuoso-large",
  name: "Arcee AI: Virtuoso Large",
@@ -7323,13 +7393,13 @@ export const MODELS = {
  reasoning: true,
  input: ["text"],
  cost: {
- input: 0.44999999999999996,
+ input: 0.5,
  output: 2.1500000000000004,
- cacheRead: 0.22499999999999998,
+ cacheRead: 0.35,
  cacheWrite: 0,
  },
  contextWindow: 163840,
- maxTokens: 65536,
+ maxTokens: 4096,
  },
  "deepseek/deepseek-v3.1-terminus": {
  id: "deepseek/deepseek-v3.1-terminus",
@@ -7612,72 +7682,72 @@ export const MODELS = {
  reasoning: true,
  input: ["text", "image"],
  cost: {
- input: 0.13,
- output: 0.39999999999999997,
- cacheRead: 0,
+ input: 0.08,
+ output: 0.35,
+ cacheRead: 0.01,
  cacheWrite: 0,
  },
  contextWindow: 262144,
- maxTokens: 262144,
+ maxTokens: 4096,
  },
- "google/gemma-4-31b-it": {
- id: "google/gemma-4-31b-it",
- name: "Google: Gemma 4 31B",
+ "google/gemma-4-26b-a4b-it:free": {
+ id: "google/gemma-4-26b-a4b-it:free",
+ name: "Google: Gemma 4 26B A4B (free)",
  api: "openai-completions",
  provider: "openrouter",
  baseUrl: "https://openrouter.ai/api/v1",
  reasoning: true,
  input: ["text", "image"],
  cost: {
- input: 0.14,
- output: 0.39999999999999997,
+ input: 0,
+ output: 0,
  cacheRead: 0,
  cacheWrite: 0,
  },
  contextWindow: 262144,
- maxTokens: 131072,
+ maxTokens: 32768,
  },
- "inception/mercury": {
- id: "inception/mercury",
- name: "Inception: Mercury",
+ "google/gemma-4-31b-it": {
+ id: "google/gemma-4-31b-it",
+ name: "Google: Gemma 4 31B",
  api: "openai-completions",
  provider: "openrouter",
  baseUrl: "https://openrouter.ai/api/v1",
- reasoning: false,
- input: ["text"],
+ reasoning: true,
+ input: ["text", "image"],
  cost: {
- input: 0.25,
- output: 0.75,
- cacheRead: 0.024999999999999998,
+ input: 0.13,
+ output: 0.38,
+ cacheRead: 0.019999999499999997,
  cacheWrite: 0,
  },
- contextWindow: 128000,
- maxTokens: 32000,
+ contextWindow: 262144,
+ maxTokens: 4096,
  },
- "inception/mercury-2": {
- id: "inception/mercury-2",
- name: "Inception: Mercury 2",
+ "google/gemma-4-31b-it:free": {
+ id: "google/gemma-4-31b-it:free",
+ name: "Google: Gemma 4 31B (free)",
  api: "openai-completions",
  provider: "openrouter",
  baseUrl: "https://openrouter.ai/api/v1",
  reasoning: true,
- input: ["text"],
+ input: ["text", "image"],
  cost: {
- input: 0.25,
- output: 0.75,
- cacheRead: 0.024999999999999998,
+ input: 0,
+ output: 0,
+ cacheRead: 0,
  cacheWrite: 0,
  },
- contextWindow: 128000,
- maxTokens: 50000,
+ contextWindow: 262144,
+ maxTokens: 32768,
  },
- "inception/mercury-coder": {
- id: "inception/mercury-coder",
- name: "Inception: Mercury Coder",
+ "inception/mercury-2": {
+ id: "inception/mercury-2",
+ name: "Inception: Mercury 2",
  api: "openai-completions",
  provider: "openrouter",
  baseUrl: "https://openrouter.ai/api/v1",
- reasoning: false,
+ reasoning: true,
  input: ["text"],
  cost: {
  input: 0.25,
@@ -7686,7 +7756,7 @@ export const MODELS = {
  cacheWrite: 0,
  },
  contextWindow: 128000,
- maxTokens: 32000,
+ maxTokens: 50000,
  },
  "kwaipilot/kat-coder-pro-v2": {
  id: "kwaipilot/kat-coder-pro-v2",
@@ -7705,23 +7775,6 @@ export const MODELS = {
  contextWindow: 256000,
  maxTokens: 80000,
  },
- "meituan/longcat-flash-chat": {
- id: "meituan/longcat-flash-chat",
- name: "Meituan: LongCat Flash Chat",
- api: "openai-completions",
- provider: "openrouter",
- baseUrl: "https://openrouter.ai/api/v1",
- reasoning: false,
- input: ["text"],
- cost: {
- input: 0.19999999999999998,
- output: 0.7999999999999999,
- cacheRead: 0.19999999999999998,
- cacheWrite: 0,
- },
- contextWindow: 131072,
- maxTokens: 131072,
- },
  "meta-llama/llama-3-8b-instruct": {
  id: "meta-llama/llama-3-8b-instruct",
  name: "Meta: Llama 3 8B Instruct",
@@ -7884,13 +7937,13 @@ export const MODELS = {
  reasoning: true,
  input: ["text"],
  cost: {
- input: 0.27,
+ input: 0.29,
  output: 0.95,
- cacheRead: 0.0290000007,
+ cacheRead: 0.03,
  cacheWrite: 0,
  },
  contextWindow: 196608,
- maxTokens: 4096,
+ maxTokens: 196608,
  },
  "minimax/minimax-m2.5": {
  id: "minimax/minimax-m2.5",
@@ -7924,7 +7977,7 @@ export const MODELS = {
  cacheWrite: 0,
  },
  contextWindow: 196608,
- maxTokens: 196608,
+ maxTokens: 8192,
  },
  "minimax/minimax-m2.7": {
  id: "minimax/minimax-m2.7",
@@ -7937,11 +7990,11 @@ export const MODELS = {
  cost: {
  input: 0.3,
  output: 1.2,
- cacheRead: 0.06,
+ cacheRead: 0.059,
  cacheWrite: 0,
  },
- contextWindow: 204800,
- maxTokens: 131072,
+ contextWindow: 196608,
+ maxTokens: 4096,
  },
  "mistralai/codestral-2508": {
  id: "mistralai/codestral-2508",
@@ -8345,11 +8398,11 @@ export const MODELS = {
  cost: {
  input: 0.39999999999999997,
  output: 2,
- cacheRead: 0.15,
+ cacheRead: 0,
  cacheWrite: 0,
  },
- contextWindow: 131072,
- maxTokens: 4096,
+ contextWindow: 262144,
+ maxTokens: 262144,
  },
  "moonshotai/kimi-k2-thinking": {
  id: "moonshotai/kimi-k2-thinking",
@@ -8360,13 +8413,13 @@ export const MODELS = {
  reasoning: true,
  input: ["text"],
  cost: {
- input: 0.47,
- output: 2,
- cacheRead: 0.14100000000000001,
+ input: 0.6,
+ output: 2.5,
+ cacheRead: 0.15,
  cacheWrite: 0,
  },
- contextWindow: 131072,
- maxTokens: 4096,
+ contextWindow: 262144,
+ maxTokens: 262144,
  },
  "moonshotai/kimi-k2.5": {
  id: "moonshotai/kimi-k2.5",
@@ -8706,7 +8759,7 @@ export const MODELS = {
  cacheWrite: 0,
  },
  contextWindow: 1047576,
- maxTokens: 32768,
+ maxTokens: 4096,
  },
  "openai/gpt-4.1-mini": {
  id: "openai/gpt-4.1-mini",
@@ -8753,7 +8806,7 @@ export const MODELS = {
  cost: {
  input: 2.5,
  output: 10,
- cacheRead: 1.25,
+ cacheRead: 0,
  cacheWrite: 0,
  },
  contextWindow: 128000,
@@ -8974,11 +9027,11 @@ export const MODELS = {
  cost: {
  input: 0.049999999999999996,
  output: 0.39999999999999997,
- cacheRead: 0.005,
+ cacheRead: 0.01,
  cacheWrite: 0,
  },
  contextWindow: 400000,
- maxTokens: 128000,
+ maxTokens: 4096,
  },
  "openai/gpt-5-pro": {
  id: "openai/gpt-5-pro",
@@ -9008,7 +9061,7 @@ export const MODELS = {
  cost: {
  input: 1.25,
  output: 10,
- cacheRead: 0.125,
+ cacheRead: 0.13,
  cacheWrite: 0,
  },
  contextWindow: 400000,
@@ -9076,11 +9129,11 @@ export const MODELS = {
  cost: {
  input: 0.25,
  output: 2,
- cacheRead: 0.024999999999999998,
+ cacheRead: 0.03,
  cacheWrite: 0,
  },
  contextWindow: 400000,
- maxTokens: 100000,
+ maxTokens: 128000,
  },
  "openai/gpt-5.2": {
  id: "openai/gpt-5.2",
@@ -9114,7 +9167,7 @@ export const MODELS = {
  cacheWrite: 0,
  },
  contextWindow: 128000,
- maxTokens: 16384,
+ maxTokens: 32000,
  },
  "openai/gpt-5.2-codex": {
  id: "openai/gpt-5.2-codex",
@@ -9330,12 +9383,12 @@ export const MODELS = {
  input: ["text"],
  cost: {
  input: 0.03,
- output: 0.11,
- cacheRead: 0.015,
+ output: 0.14,
+ cacheRead: 0,
  cacheWrite: 0,
  },
  contextWindow: 131072,
- maxTokens: 131072,
+ maxTokens: 4096,
  },
  "openai/gpt-oss-20b:free": {
  id: "openai/gpt-oss-20b:free",
@@ -9352,7 +9405,7 @@ export const MODELS = {
  cacheWrite: 0,
  },
  contextWindow: 131072,
- maxTokens: 131072,
+ maxTokens: 8192,
  },
  "openai/gpt-oss-safeguard-20b": {
  id: "openai/gpt-oss-safeguard-20b",
@@ -9541,6 +9594,23 @@ export const MODELS = {
  contextWindow: 2000000,
  maxTokens: 4096,
  },
+ "openrouter/elephant-alpha": {
+ id: "openrouter/elephant-alpha",
+ name: "Elephant",
+ api: "openai-completions",
+ provider: "openrouter",
+ baseUrl: "https://openrouter.ai/api/v1",
+ reasoning: false,
+ input: ["text"],
+ cost: {
+ input: 0,
+ output: 0,
+ cacheRead: 0,
+ cacheWrite: 0,
+ },
+ contextWindow: 262144,
+ maxTokens: 32768,
+ },
  "openrouter/free": {
  id: "openrouter/free",
  name: "Free Models Router",
@@ -9924,13 +9994,13 @@ export const MODELS = {
  reasoning: false,
  input: ["text"],
  cost: {
- input: 0.12,
- output: 0.75,
- cacheRead: 0.06,
+ input: 0.15,
+ output: 0.7999999999999999,
+ cacheRead: 0.12,
  cacheWrite: 0,
  },
  contextWindow: 262144,
- maxTokens: 65536,
+ maxTokens: 262144,
  },
  "qwen/qwen3-coder-plus": {
  id: "qwen/qwen3-coder-plus",
@@ -10289,17 +10359,17 @@ export const MODELS = {
  contextWindow: 1000000,
  maxTokens: 65536,
  },
- "qwen/qwen3.6-plus:free": {
- id: "qwen/qwen3.6-plus:free",
- name: "Qwen: Qwen3.6 Plus (free)",
+ "qwen/qwen3.6-plus": {
+ id: "qwen/qwen3.6-plus",
+ name: "Qwen: Qwen3.6 Plus",
  api: "openai-completions",
  provider: "openrouter",
  baseUrl: "https://openrouter.ai/api/v1",
  reasoning: true,
  input: ["text", "image"],
  cost: {
- input: 0,
- output: 0,
+ input: 0.325,
+ output: 1.95,
  cacheRead: 0,
  cacheWrite: 0,
  },
@@ -10408,23 +10478,6 @@ export const MODELS = {
  contextWindow: 262144,
  maxTokens: 65536,
  },
- "stepfun/step-3.5-flash:free": {
- id: "stepfun/step-3.5-flash:free",
- name: "StepFun: Step 3.5 Flash (free)",
- api: "openai-completions",
- provider: "openrouter",
- baseUrl: "https://openrouter.ai/api/v1",
- reasoning: true,
- input: ["text"],
- cost: {
- input: 0,
- output: 0,
- cacheRead: 0,
- cacheWrite: 0,
- },
- contextWindow: 256000,
- maxTokens: 256000,
- },
  "thedrummer/rocinante-12b": {
  id: "thedrummer/rocinante-12b",
  name: "TheDrummer: Rocinante 12B",
@@ -10884,6 +10937,23 @@ export const MODELS = {
  contextWindow: 202752,
  maxTokens: 131072,
  },
+ "z-ai/glm-5.1": {
+ id: "z-ai/glm-5.1",
+ name: "Z.ai: GLM 5.1",
+ api: "openai-completions",
+ provider: "openrouter",
+ baseUrl: "https://openrouter.ai/api/v1",
+ reasoning: true,
+ input: ["text"],
+ cost: {
+ input: 0.95,
+ output: 3.15,
+ cacheRead: 0.475,
+ cacheWrite: 0,
+ },
+ contextWindow: 202752,
+ maxTokens: 65535,
+ },
  "z-ai/glm-5v-turbo": {
  id: "z-ai/glm-5v-turbo",
  name: "Z.ai: GLM 5V Turbo",
@@ -10929,13 +10999,13 @@ export const MODELS = {
  reasoning: false,
  input: ["text"],
  cost: {
- input: 0.22,
- output: 0.88,
- cacheRead: 0.11,
+ input: 0.6,
+ output: 1.2,
+ cacheRead: 0.6,
  cacheWrite: 0,
  },
- contextWindow: 32768,
- maxTokens: 16384,
+ contextWindow: 131000,
+ maxTokens: 40000,
  },
  "alibaba/qwen-3-30b": {
  id: "alibaba/qwen-3-30b",
@@ -11170,7 +11240,7 @@ export const MODELS = {
  input: 0.5,
  output: 3,
  cacheRead: 0.09999999999999999,
- cacheWrite: 0.625,
+ cacheWrite: 0,
  },
  contextWindow: 1000000,
  maxTokens: 64000,
@@ -11662,7 +11732,7 @@ export const MODELS = {
  cost: {
  input: 0.25,
  output: 1.5,
- cacheRead: 0,
+ cacheRead: 0.03,
  cacheWrite: 0,
  },
  contextWindow: 1000000,
@@ -11785,7 +11855,7 @@ export const MODELS = {
  cacheWrite: 0,
  },
  contextWindow: 128000,
- maxTokens: 8192,
+ maxTokens: 100000,
  },
  "meta/llama-3.1-70b": {
  id: "meta/llama-3.1-70b",
@@ -12790,23 +12860,6 @@ export const MODELS = {
  contextWindow: 1050000,
  maxTokens: 128000,
  },
- "openai/gpt-oss-120b": {
- id: "openai/gpt-oss-120b",
- name: "gpt-oss-120b",
- api: "anthropic-messages",
- provider: "vercel-ai-gateway",
- baseUrl: "https://ai-gateway.vercel.sh",
- reasoning: true,
- input: ["text"],
- cost: {
- input: 0.15,
- output: 0.6,
- cacheRead: 0,
- cacheWrite: 0,
- },
- contextWindow: 128000,
- maxTokens: 8192,
- },
  "openai/gpt-oss-20b": {
  id: "openai/gpt-oss-20b",
  name: "gpt-oss-20b",
@@ -12994,23 +13047,6 @@ export const MODELS = {
  contextWindow: 131072,
  maxTokens: 131072,
  },
- "xai/grok-2-vision": {
- id: "xai/grok-2-vision",
- name: "Grok 2 Vision",
- api: "anthropic-messages",
- provider: "vercel-ai-gateway",
- baseUrl: "https://ai-gateway.vercel.sh",
- reasoning: false,
- input: ["text", "image"],
- cost: {
- input: 2,
- output: 10,
- cacheRead: 0,
- cacheWrite: 0,
- },
- contextWindow: 32768,
- maxTokens: 32768,
- },
  "xai/grok-3": {
  id: "xai/grok-3",
  name: "Grok 3 Beta",
@@ -13428,13 +13464,13 @@ export const MODELS = {
  reasoning: true,
  input: ["text"],
  cost: {
- input: 0.6,
- output: 2.2,
- cacheRead: 0.11,
+ input: 2.25,
+ output: 2.75,
+ cacheRead: 2.25,
  cacheWrite: 0,
  },
- contextWindow: 200000,
- maxTokens: 120000,
+ contextWindow: 131000,
+ maxTokens: 40000,
  },
  "zai/glm-4.7-flash": {
  id: "zai/glm-4.7-flash",
@@ -13504,6 +13540,23 @@ export const MODELS = {
  contextWindow: 202800,
  maxTokens: 131100,
  },
+ "zai/glm-5.1": {
+ id: "zai/glm-5.1",
+ name: "GLM 5.1",
+ api: "anthropic-messages",
+ provider: "vercel-ai-gateway",
+ baseUrl: "https://ai-gateway.vercel.sh",
+ reasoning: true,
+ input: ["text"],
+ cost: {
+ input: 1.4,
+ output: 4.4,
+ cacheRead: 0.26,
+ cacheWrite: 0,
+ },
+ contextWindow: 202800,
+ maxTokens: 64000,
+ },
  "zai/glm-5v-turbo": {
  id: "zai/glm-5v-turbo",
  name: "GLM 5V Turbo",