npm - @avadisabelle/ava-pi-ai - Versions diffs - 0.64.0 → 0.64.2 - Mend

@avadisabelle/ava-pi-ai 0.64.0 → 0.64.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/dist/models.generated.d.ts +379 -97
package/dist/models.generated.d.ts.map +1 -1
package/dist/models.generated.js +497 -222
package/dist/models.generated.js.map +1 -1
package/package.json +1 -1

package/dist/models.generated.js CHANGED Viewed

@@ -257,6 +257,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "anthropic.claude-opus-4-7": {
+            id: "anthropic.claude-opus-4-7",
+            name: "Claude Opus 4.7",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "anthropic.claude-sonnet-4-20250514-v1:0": {
             id: "anthropic.claude-sonnet-4-20250514-v1:0",
             name: "Claude Sonnet 4",
@@ -410,6 +427,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "eu.anthropic.claude-opus-4-7": {
+            id: "eu.anthropic.claude-opus-4-7",
+            name: "Claude Opus 4.7 (EU)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "eu.anthropic.claude-sonnet-4-20250514-v1:0": {
             id: "eu.anthropic.claude-sonnet-4-20250514-v1:0",
             name: "Claude Sonnet 4 (EU)",
@@ -512,6 +546,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "global.anthropic.claude-opus-4-7": {
+            id: "global.anthropic.claude-opus-4-7",
+            name: "Claude Opus 4.7 (Global)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "global.anthropic.claude-sonnet-4-20250514-v1:0": {
             id: "global.anthropic.claude-sonnet-4-20250514-v1:0",
             name: "Claude Sonnet 4 (Global)",
@@ -1209,6 +1260,23 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 65536,
         },
+        "qwen.qwen3-coder-next": {
+            id: "qwen.qwen3-coder-next",
+            name: "Qwen3 Coder Next",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.22,
+                output: 1.8,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 65536,
+        },
         "qwen.qwen3-next-80b-a3b": {
             id: "qwen.qwen3-next-80b-a3b",
             name: "Qwen/Qwen3-Next-80B-A3B-Instruct",
@@ -1328,6 +1396,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "us.anthropic.claude-opus-4-7": {
+            id: "us.anthropic.claude-opus-4-7",
+            name: "Claude Opus 4.7 (US)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "us.anthropic.claude-sonnet-4-20250514-v1:0": {
             id: "us.anthropic.claude-sonnet-4-20250514-v1:0",
             name: "Claude Sonnet 4 (US)",
@@ -1755,6 +1840,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "claude-opus-4-7": {
+            id: "claude-opus-4-7",
+            name: "Claude Opus 4.7",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "claude-sonnet-4-0": {
             id: "claude-sonnet-4-0",
             name: "Claude Sonnet 4 (latest)",
@@ -3015,7 +3117,7 @@ export const MODELS = {
         },
         "gpt-5.4-mini": {
             id: "gpt-5.4-mini",
-            name: "GPT-5.4 mini",
+            name: "GPT-5.4 Mini",
             api: "openai-responses",
             provider: "github-copilot",
             baseUrl: "https://api.individual.githubcopilot.com",
@@ -3477,8 +3579,8 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "gemma-4-26b": {
-            id: "gemma-4-26b",
+        "gemma-4-26b-it": {
+            id: "gemma-4-26b-it",
             name: "Gemma 4 26B",
             api: "google-generative-ai",
             provider: "google",
@@ -3494,8 +3596,8 @@ export const MODELS = {
             contextWindow: 256000,
             maxTokens: 8192,
         },
-        "gemma-4-31b": {
-            id: "gemma-4-31b",
+        "gemma-4-31b-it": {
+            id: "gemma-4-31b-it",
             name: "Gemma 4 31B",
             api: "google-generative-ai",
             provider: "google",
@@ -4322,6 +4424,24 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
+        "MiniMaxAI/MiniMax-M2.7": {
+            id: "MiniMaxAI/MiniMax-M2.7",
+            name: "MiniMax-M2.7",
+            api: "openai-completions",
+            provider: "huggingface",
+            baseUrl: "https://router.huggingface.co/v1",
+            compat: { "supportsDeveloperRole": false },
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.3,
+                output: 1.2,
+                cacheRead: 0.06,
+                cacheWrite: 0,
+            },
+            contextWindow: 204800,
+            maxTokens: 131072,
+        },
         "Qwen/Qwen3-235B-A22B-Thinking-2507": {
             id: "Qwen/Qwen3-235B-A22B-Thinking-2507",
             name: "Qwen3-235B-A22B-Thinking-2507",
@@ -4610,6 +4730,24 @@ export const MODELS = {
             contextWindow: 202752,
             maxTokens: 131072,
         },
+        "zai-org/GLM-5.1": {
+            id: "zai-org/GLM-5.1",
+            name: "GLM-5.1",
+            api: "openai-completions",
+            provider: "huggingface",
+            baseUrl: "https://router.huggingface.co/v1",
+            compat: { "supportsDeveloperRole": false },
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1,
+                output: 3.2,
+                cacheRead: 0.2,
+                cacheWrite: 0,
+            },
+            contextWindow: 202752,
+            maxTokens: 131072,
+        },
     },
     "kimi-coding": {
         "k2p5": {
@@ -6290,6 +6428,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "claude-opus-4-7": {
+            id: "claude-opus-4-7",
+            name: "Claude Opus 4.7",
+            api: "anthropic-messages",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "claude-sonnet-4": {
             id: "claude-sonnet-4",
             name: "Claude Sonnet 4",
@@ -6392,6 +6547,23 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
+        "glm-5.1": {
+            id: "glm-5.1",
+            name: "GLM-5.1",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1.4,
+                output: 4.4,
+                cacheRead: 0.26,
+                cacheWrite: 0,
+            },
+            contextWindow: 204800,
+            maxTokens: 131072,
+        },
         "gpt-5": {
             id: "gpt-5",
             name: "GPT-5",
@@ -6698,22 +6870,39 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 128000,
         },
-        "qwen3.6-plus-free": {
-            id: "qwen3.6-plus-free",
-            name: "Qwen3.6 Plus Free",
+        "qwen3.5-plus": {
+            id: "qwen3.5-plus",
+            name: "Qwen3.5 Plus",
             api: "openai-completions",
             provider: "opencode",
             baseUrl: "https://opencode.ai/zen/v1",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
+                input: 0.2,
+                output: 1.2,
+                cacheRead: 0.02,
+                cacheWrite: 0.25,
             },
-            contextWindow: 1048576,
-            maxTokens: 64000,
+            contextWindow: 262144,
+            maxTokens: 65536,
+        },
+        "qwen3.6-plus": {
+            id: "qwen3.6-plus",
+            name: "Qwen3.6 Plus",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.5,
+                output: 3,
+                cacheRead: 0.05,
+                cacheWrite: 0.625,
+            },
+            contextWindow: 262144,
+            maxTokens: 65536,
         },
     },
     "opencode-go": {
@@ -6734,6 +6923,23 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
+        "glm-5.1": {
+            id: "glm-5.1",
+            name: "GLM-5.1",
+            api: "openai-completions",
+            provider: "opencode-go",
+            baseUrl: "https://opencode.ai/zen/go/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1.4,
+                output: 4.4,
+                cacheRead: 0.26,
+                cacheWrite: 0,
+            },
+            contextWindow: 204800,
+            maxTokens: 131072,
+        },
         "kimi-k2.5": {
             id: "kimi-k2.5",
             name: "Kimi K2.5",
@@ -6788,9 +6994,9 @@ export const MODELS = {
         "minimax-m2.5": {
             id: "minimax-m2.5",
             name: "MiniMax M2.5",
-            api: "openai-completions",
+            api: "anthropic-messages",
             provider: "opencode-go",
-            baseUrl: "https://opencode.ai/zen/go/v1",
+            baseUrl: "https://opencode.ai/zen/go",
             reasoning: true,
             input: ["text"],
             cost: {
@@ -6819,6 +7025,40 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
+        "qwen3.5-plus": {
+            id: "qwen3.5-plus",
+            name: "Qwen3.5 Plus",
+            api: "openai-completions",
+            provider: "opencode-go",
+            baseUrl: "https://opencode.ai/zen/go/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.2,
+                output: 1.2,
+                cacheRead: 0.02,
+                cacheWrite: 0.25,
+            },
+            contextWindow: 262144,
+            maxTokens: 65536,
+        },
+        "qwen3.6-plus": {
+            id: "qwen3.6-plus",
+            name: "Qwen3.6 Plus",
+            api: "openai-completions",
+            provider: "opencode-go",
+            baseUrl: "https://opencode.ai/zen/go/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.5,
+                output: 3,
+                cacheRead: 0.05,
+                cacheWrite: 0.625,
+            },
+            contextWindow: 262144,
+            maxTokens: 65536,
+        },
     },
     "openrouter": {
         "ai21/jamba-large-1.7": {
@@ -7006,7 +7246,7 @@ export const MODELS = {
                 cacheWrite: 3.75,
             },
             contextWindow: 200000,
-            maxTokens: 64000,
+            maxTokens: 128000,
         },
         "anthropic/claude-3.7-sonnet:thinking": {
             id: "anthropic/claude-3.7-sonnet:thinking",
@@ -7110,6 +7350,40 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "anthropic/claude-opus-4.6-fast": {
+            id: "anthropic/claude-opus-4.6-fast",
+            name: "Anthropic: Claude Opus 4.6 (Fast)",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 30,
+                output: 150,
+                cacheRead: 3,
+                cacheWrite: 37.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
+        "anthropic/claude-opus-4.7": {
+            id: "anthropic/claude-opus-4.7",
+            name: "Anthropic: Claude Opus 4.7",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "anthropic/claude-sonnet-4": {
             id: "anthropic/claude-sonnet-4",
             name: "Anthropic: Claude Sonnet 4",
@@ -7124,7 +7398,7 @@ export const MODELS = {
                 cacheRead: 0.3,
                 cacheWrite: 3.75,
             },
-            contextWindow: 200000,
+            contextWindow: 1000000,
             maxTokens: 64000,
         },
         "anthropic/claude-sonnet-4.5": {
@@ -7189,7 +7463,7 @@ export const MODELS = {
             cost: {
                 input: 0.22,
                 output: 0.85,
-                cacheRead: 0,
+                cacheRead: 0.06,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -7212,39 +7486,22 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 131072,
         },
-        "arcee-ai/trinity-mini:free": {
-            id: "arcee-ai/trinity-mini:free",
-            name: "Arcee AI: Trinity Mini (free)",
+        "arcee-ai/virtuoso-large": {
+            id: "arcee-ai/virtuoso-large",
+            name: "Arcee AI: Virtuoso Large",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
+            reasoning: false,
             input: ["text"],
             cost: {
-                input: 0,
-                output: 0,
+                input: 0.75,
+                output: 1.2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 4096,
-        },
-        "arcee-ai/virtuoso-large": {
-            id: "arcee-ai/virtuoso-large",
-            name: "Arcee AI: Virtuoso Large",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.75,
-                output: 1.2,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 64000,
+            maxTokens: 64000,
         },
         "auto": {
             id: "auto",
@@ -7476,13 +7733,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.44999999999999996,
+                input: 0.5,
                 output: 2.1500000000000004,
-                cacheRead: 0.22499999999999998,
+                cacheRead: 0.35,
                 cacheWrite: 0,
             },
             contextWindow: 163840,
-            maxTokens: 65536,
+            maxTokens: 4096,
         },
         "deepseek/deepseek-v3.1-terminus": {
             id: "deepseek/deepseek-v3.1-terminus",
@@ -7765,72 +8022,72 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.13,
+                input: 0.07,
                 output: 0.39999999999999997,
-                cacheRead: 0,
+                cacheRead: 0.04,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
             maxTokens: 262144,
         },
-        "google/gemma-4-31b-it": {
-            id: "google/gemma-4-31b-it",
-            name: "Google: Gemma 4 31B",
+        "google/gemma-4-26b-a4b-it:free": {
+            id: "google/gemma-4-26b-a4b-it:free",
+            name: "Google: Gemma 4 26B A4B  (free)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.14,
-                output: 0.39999999999999997,
+                input: 0,
+                output: 0,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 131072,
+            maxTokens: 32768,
         },
-        "inception/mercury": {
-            id: "inception/mercury",
-            name: "Inception: Mercury",
+        "google/gemma-4-31b-it": {
+            id: "google/gemma-4-31b-it",
+            name: "Google: Gemma 4 31B",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
+            reasoning: true,
+            input: ["text", "image"],
             cost: {
-                input: 0.25,
-                output: 0.75,
-                cacheRead: 0.024999999999999998,
+                input: 0.13,
+                output: 0.38,
+                cacheRead: 0.019999999499999997,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
-            maxTokens: 32000,
+            contextWindow: 262144,
+            maxTokens: 4096,
         },
-        "inception/mercury-2": {
-            id: "inception/mercury-2",
-            name: "Inception: Mercury 2",
+        "google/gemma-4-31b-it:free": {
+            id: "google/gemma-4-31b-it:free",
+            name: "Google: Gemma 4 31B (free)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 0.25,
-                output: 0.75,
-                cacheRead: 0.024999999999999998,
+                input: 0,
+                output: 0,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
-            maxTokens: 50000,
+            contextWindow: 262144,
+            maxTokens: 32768,
         },
-        "inception/mercury-coder": {
-            id: "inception/mercury-coder",
-            name: "Inception: Mercury Coder",
+        "inception/mercury-2": {
+            id: "inception/mercury-2",
+            name: "Inception: Mercury 2",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 0.25,
@@ -7839,7 +8096,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 32000,
+            maxTokens: 50000,
         },
         "kwaipilot/kat-coder-pro-v2": {
             id: "kwaipilot/kat-coder-pro-v2",
@@ -7858,23 +8115,6 @@ export const MODELS = {
             contextWindow: 256000,
             maxTokens: 80000,
         },
-        "meituan/longcat-flash-chat": {
-            id: "meituan/longcat-flash-chat",
-            name: "Meituan: LongCat Flash Chat",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.19999999999999998,
-                output: 0.7999999999999999,
-                cacheRead: 0.19999999999999998,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 131072,
-        },
         "meta-llama/llama-3-8b-instruct": {
             id: "meta-llama/llama-3-8b-instruct",
             name: "Meta: Llama 3 8B Instruct",
@@ -8037,13 +8277,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.27,
+                input: 0.29,
                 output: 0.95,
-                cacheRead: 0.0290000007,
+                cacheRead: 0.03,
                 cacheWrite: 0,
             },
             contextWindow: 196608,
-            maxTokens: 4096,
+            maxTokens: 196608,
         },
         "minimax/minimax-m2.5": {
             id: "minimax/minimax-m2.5",
@@ -8077,7 +8317,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 196608,
-            maxTokens: 196608,
+            maxTokens: 8192,
         },
         "minimax/minimax-m2.7": {
             id: "minimax/minimax-m2.7",
@@ -8090,11 +8330,11 @@ export const MODELS = {
             cost: {
                 input: 0.3,
                 output: 1.2,
-                cacheRead: 0.06,
+                cacheRead: 0.059,
                 cacheWrite: 0,
             },
-            contextWindow: 204800,
-            maxTokens: 131072,
+            contextWindow: 196608,
+            maxTokens: 4096,
         },
         "mistralai/codestral-2508": {
             id: "mistralai/codestral-2508",
@@ -8485,7 +8725,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 32768,
         },
         "moonshotai/kimi-k2-0905": {
             id: "moonshotai/kimi-k2-0905",
@@ -8498,11 +8738,11 @@ export const MODELS = {
             cost: {
                 input: 0.39999999999999997,
                 output: 2,
-                cacheRead: 0.15,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 4096,
+            contextWindow: 262144,
+            maxTokens: 262144,
         },
         "moonshotai/kimi-k2-thinking": {
             id: "moonshotai/kimi-k2-thinking",
@@ -8513,13 +8753,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.47,
-                output: 2,
-                cacheRead: 0.14100000000000001,
+                input: 0.6,
+                output: 2.5,
+                cacheRead: 0.15,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 4096,
+            contextWindow: 262144,
+            maxTokens: 262144,
         },
         "moonshotai/kimi-k2.5": {
             id: "moonshotai/kimi-k2.5",
@@ -8632,9 +8872,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.09999999999999999,
-                output: 0.5,
-                cacheRead: 0.09999999999999999,
+                input: 0.09,
+                output: 0.44999999999999996,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -8859,7 +9099,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 1047576,
-            maxTokens: 32768,
+            maxTokens: 4096,
         },
         "openai/gpt-4.1-mini": {
             id: "openai/gpt-4.1-mini",
@@ -8906,7 +9146,7 @@ export const MODELS = {
             cost: {
                 input: 2.5,
                 output: 10,
-                cacheRead: 1.25,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 128000,
@@ -9127,11 +9367,11 @@ export const MODELS = {
             cost: {
                 input: 0.049999999999999996,
                 output: 0.39999999999999997,
-                cacheRead: 0.005,
+                cacheRead: 0.01,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
-            maxTokens: 128000,
+            maxTokens: 4096,
         },
         "openai/gpt-5-pro": {
             id: "openai/gpt-5-pro",
@@ -9161,7 +9401,7 @@ export const MODELS = {
             cost: {
                 input: 1.25,
                 output: 10,
-                cacheRead: 0.125,
+                cacheRead: 0.13,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
@@ -9229,11 +9469,11 @@ export const MODELS = {
             cost: {
                 input: 0.25,
                 output: 2,
-                cacheRead: 0.024999999999999998,
+                cacheRead: 0.03,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
-            maxTokens: 100000,
+            maxTokens: 128000,
         },
         "openai/gpt-5.2": {
             id: "openai/gpt-5.2",
@@ -9267,7 +9507,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 16384,
+            maxTokens: 32000,
         },
         "openai/gpt-5.2-codex": {
             id: "openai/gpt-5.2-codex",
@@ -9483,12 +9723,12 @@ export const MODELS = {
             input: ["text"],
             cost: {
                 input: 0.03,
-                output: 0.11,
-                cacheRead: 0.015,
+                output: 0.14,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 4096,
         },
         "openai/gpt-oss-20b:free": {
             id: "openai/gpt-oss-20b:free",
@@ -9505,7 +9745,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 8192,
         },
         "openai/gpt-oss-safeguard-20b": {
             id: "openai/gpt-oss-safeguard-20b",
@@ -9694,6 +9934,23 @@ export const MODELS = {
             contextWindow: 2000000,
             maxTokens: 4096,
         },
+        "openrouter/elephant-alpha": {
+            id: "openrouter/elephant-alpha",
+            name: "Elephant",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 262144,
+            maxTokens: 32768,
+        },
         "openrouter/free": {
             id: "openrouter/free",
             name: "Free Models Router",
@@ -9791,7 +10048,7 @@ export const MODELS = {
                 input: 0.26,
                 output: 0.78,
                 cacheRead: 0.052000000000000005,
-                cacheWrite: 0,
+                cacheWrite: 0.325,
             },
             contextWindow: 1000000,
             maxTokens: 32768,
@@ -9808,7 +10065,7 @@ export const MODELS = {
                 input: 0.26,
                 output: 0.78,
                 cacheRead: 0,
-                cacheWrite: 0,
+                cacheWrite: 0.325,
             },
             contextWindow: 1000000,
             maxTokens: 32768,
@@ -9825,7 +10082,7 @@ export const MODELS = {
                 input: 0.26,
                 output: 0.78,
                 cacheRead: 0,
-                cacheWrite: 0,
+                cacheWrite: 0.325,
             },
             contextWindow: 1000000,
             maxTokens: 32768,
@@ -9924,13 +10181,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.14950000000000002,
-                output: 1.495,
+                input: 0.13,
+                output: 0.6,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 4096,
+            contextWindow: 262144,
+            maxTokens: 262144,
         },
         "qwen/qwen3-30b-a3b": {
             id: "qwen/qwen3-30b-a3b",
@@ -10063,7 +10320,7 @@ export const MODELS = {
                 input: 0.195,
                 output: 0.975,
                 cacheRead: 0.039,
-                cacheWrite: 0,
+                cacheWrite: 0.24375,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
@@ -10077,13 +10334,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.12,
-                output: 0.75,
-                cacheRead: 0.06,
+                input: 0.15,
+                output: 0.7999999999999999,
+                cacheRead: 0.12,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 65536,
+            maxTokens: 262144,
         },
         "qwen/qwen3-coder-plus": {
             id: "qwen/qwen3-coder-plus",
@@ -10097,7 +10354,7 @@ export const MODELS = {
                 input: 0.65,
                 output: 3.25,
                 cacheRead: 0.13,
-                cacheWrite: 0,
+                cacheWrite: 0.8125,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
@@ -10131,7 +10388,7 @@ export const MODELS = {
                 input: 0.78,
                 output: 3.9,
                 cacheRead: 0.156,
-                cacheWrite: 0,
+                cacheWrite: 0.975,
             },
             contextWindow: 262144,
             maxTokens: 32768,
@@ -10385,7 +10642,7 @@ export const MODELS = {
             cost: {
                 input: 0.39,
                 output: 2.34,
-                cacheRead: 0,
+                cacheRead: 0.195,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -10420,7 +10677,7 @@ export const MODELS = {
                 input: 0.065,
                 output: 0.26,
                 cacheRead: 0,
-                cacheWrite: 0,
+                cacheWrite: 0.08125,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
@@ -10437,24 +10694,24 @@ export const MODELS = {
                 input: 0.26,
                 output: 1.56,
                 cacheRead: 0,
-                cacheWrite: 0,
+                cacheWrite: 0.325,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
         },
-        "qwen/qwen3.6-plus:free": {
-            id: "qwen/qwen3.6-plus:free",
-            name: "Qwen: Qwen3.6 Plus (free)",
+        "qwen/qwen3.6-plus": {
+            id: "qwen/qwen3.6-plus",
+            name: "Qwen: Qwen3.6 Plus",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0,
-                output: 0,
+                input: 0.325,
+                output: 1.95,
                 cacheRead: 0,
-                cacheWrite: 0,
+                cacheWrite: 0.40625,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
@@ -10561,23 +10818,6 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 65536,
         },
-        "stepfun/step-3.5-flash:free": {
-            id: "stepfun/step-3.5-flash:free",
-            name: "StepFun: Step 3.5 Flash (free)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 256000,
-            maxTokens: 256000,
-        },
         "thedrummer/rocinante-12b": {
             id: "thedrummer/rocinante-12b",
             name: "TheDrummer: Rocinante 12B",
@@ -11037,6 +11277,23 @@ export const MODELS = {
             contextWindow: 202752,
             maxTokens: 131072,
         },
+        "z-ai/glm-5.1": {
+            id: "z-ai/glm-5.1",
+            name: "Z.ai: GLM 5.1",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.95,
+                output: 3.15,
+                cacheRead: 0.475,
+                cacheWrite: 0,
+            },
+            contextWindow: 202752,
+            maxTokens: 65535,
+        },
         "z-ai/glm-5v-turbo": {
             id: "z-ai/glm-5v-turbo",
             name: "Z.ai: GLM 5V Turbo",
@@ -11082,13 +11339,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.22,
-                output: 0.88,
-                cacheRead: 0.11,
+                input: 0.6,
+                output: 1.2,
+                cacheRead: 0.6,
                 cacheWrite: 0,
             },
-            contextWindow: 32768,
-            maxTokens: 16384,
+            contextWindow: 131000,
+            maxTokens: 40000,
         },
         "alibaba/qwen-3-30b": {
             id: "alibaba/qwen-3-30b",
@@ -11323,7 +11580,7 @@ export const MODELS = {
                 input: 0.5,
                 output: 3,
                 cacheRead: 0.09999999999999999,
-                cacheWrite: 0.625,
+                cacheWrite: 0,
             },
             contextWindow: 1000000,
             maxTokens: 64000,
@@ -11464,6 +11721,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "anthropic/claude-opus-4.7": {
+            id: "anthropic/claude-opus-4.7",
+            name: "Claude Opus 4.7",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "anthropic/claude-sonnet-4": {
             id: "anthropic/claude-sonnet-4",
             name: "Claude Sonnet 4",
@@ -11815,7 +12089,7 @@ export const MODELS = {
             cost: {
                 input: 0.25,
                 output: 1.5,
-                cacheRead: 0,
+                cacheRead: 0.03,
                 cacheWrite: 0,
             },
             contextWindow: 1000000,
@@ -11938,7 +12212,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 8192,
+            maxTokens: 100000,
         },
         "meta/llama-3.1-70b": {
             id: "meta/llama-3.1-70b",
@@ -12943,26 +13217,9 @@ export const MODELS = {
             contextWindow: 1050000,
             maxTokens: 128000,
         },
-        "openai/gpt-oss-120b": {
-            id: "openai/gpt-oss-120b",
-            name: "gpt-oss-120b",
-            api: "anthropic-messages",
-            provider: "vercel-ai-gateway",
-            baseUrl: "https://ai-gateway.vercel.sh",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.15,
-                output: 0.6,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 128000,
-            maxTokens: 8192,
-        },
         "openai/gpt-oss-20b": {
             id: "openai/gpt-oss-20b",
-            name: "gpt-oss-20b",
+            name: "GPT OSS 120B",
             api: "anthropic-messages",
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
@@ -12979,7 +13236,7 @@ export const MODELS = {
         },
         "openai/gpt-oss-safeguard-20b": {
             id: "openai/gpt-oss-safeguard-20b",
-            name: "gpt-oss-safeguard-20b",
+            name: "GPT OSS Safeguard 20B",
             api: "anthropic-messages",
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
@@ -13147,23 +13404,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 131072,
         },
-        "xai/grok-2-vision": {
-            id: "xai/grok-2-vision",
-            name: "Grok 2 Vision",
-            api: "anthropic-messages",
-            provider: "vercel-ai-gateway",
-            baseUrl: "https://ai-gateway.vercel.sh",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 2,
-                output: 10,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 32768,
-            maxTokens: 32768,
-        },
         "xai/grok-3": {
             id: "xai/grok-3",
             name: "Grok 3 Beta",
@@ -13256,7 +13496,7 @@ export const MODELS = {
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
             reasoning: false,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
                 input: 0.19999999999999998,
                 output: 0.5,
@@ -13273,7 +13513,7 @@ export const MODELS = {
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
                 input: 0.19999999999999998,
                 output: 0.5,
@@ -13290,7 +13530,7 @@ export const MODELS = {
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
             reasoning: false,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
                 input: 0.19999999999999998,
                 output: 0.5,
@@ -13307,7 +13547,7 @@ export const MODELS = {
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
                 input: 0.19999999999999998,
                 output: 0.5,
@@ -13324,7 +13564,7 @@ export const MODELS = {
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
                 input: 2,
                 output: 6,
@@ -13341,7 +13581,7 @@ export const MODELS = {
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
                 input: 2,
                 output: 6,
@@ -13581,13 +13821,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.6,
-                output: 2.2,
-                cacheRead: 0.11,
+                input: 2.25,
+                output: 2.75,
+                cacheRead: 2.25,
                 cacheWrite: 0,
             },
-            contextWindow: 200000,
-            maxTokens: 120000,
+            contextWindow: 131000,
+            maxTokens: 40000,
         },
         "zai/glm-4.7-flash": {
             id: "zai/glm-4.7-flash",
@@ -13657,6 +13897,23 @@ export const MODELS = {
             contextWindow: 202800,
             maxTokens: 131100,
         },
+        "zai/glm-5.1": {
+            id: "zai/glm-5.1",
+            name: "GLM 5.1",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1.4,
+                output: 4.4,
+                cacheRead: 0.26,
+                cacheWrite: 0,
+            },
+            contextWindow: 202752,
+            maxTokens: 202752,
+        },
         "zai/glm-5v-turbo": {
             id: "zai/glm-5v-turbo",
             name: "GLM 5V Turbo",
@@ -14284,6 +14541,24 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 131072,
         },
+        "glm-5.1": {
+            id: "glm-5.1",
+            name: "GLM-5.1",
+            api: "openai-completions",
+            provider: "zai",
+            baseUrl: "https://api.z.ai/api/coding/paas/v4",
+            compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1.4,
+                output: 4.4,
+                cacheRead: 0.26,
+                cacheWrite: 0,
+            },
+            contextWindow: 200000,
+            maxTokens: 131072,
+        },
         "glm-5v-turbo": {
             id: "glm-5v-turbo",
             name: "glm-5v-turbo",