npm - @caupulican/pi-ai - Versions diffs - 0.75.6 → 0.78.3 - Mend

@caupulican/pi-ai 0.75.6 → 0.78.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (71) hide show

package/README.md +1 -1
package/dist/image-models.generated.d.ts.map +1 -1
package/dist/image-models.generated.js +146 -146
package/dist/image-models.generated.js.map +1 -1
package/dist/models.generated.d.ts +500 -298
package/dist/models.generated.d.ts.map +1 -1
package/dist/models.generated.js +617 -491
package/dist/models.generated.js.map +1 -1
package/dist/providers/amazon-bedrock.d.ts +1 -1
package/dist/providers/amazon-bedrock.d.ts.map +1 -1
package/dist/providers/amazon-bedrock.js +48 -5
package/dist/providers/amazon-bedrock.js.map +1 -1
package/dist/providers/anthropic.d.ts.map +1 -1
package/dist/providers/anthropic.js +51 -15
package/dist/providers/anthropic.js.map +1 -1
package/dist/providers/azure-openai-responses.d.ts.map +1 -1
package/dist/providers/azure-openai-responses.js +6 -10
package/dist/providers/azure-openai-responses.js.map +1 -1
package/dist/providers/google-vertex.d.ts.map +1 -1
package/dist/providers/google-vertex.js +1 -1
package/dist/providers/google-vertex.js.map +1 -1
package/dist/providers/google.d.ts.map +1 -1
package/dist/providers/google.js +5 -3
package/dist/providers/google.js.map +1 -1
package/dist/providers/images/openrouter.d.ts.map +1 -1
package/dist/providers/images/openrouter.js +3 -4
package/dist/providers/images/openrouter.js.map +1 -1
package/dist/providers/mistral.d.ts.map +1 -1
package/dist/providers/mistral.js +2 -3
package/dist/providers/mistral.js.map +1 -1
package/dist/providers/openai-codex-responses.d.ts.map +1 -1
package/dist/providers/openai-codex-responses.js +159 -78
package/dist/providers/openai-codex-responses.js.map +1 -1
package/dist/providers/openai-completions.d.ts.map +1 -1
package/dist/providers/openai-completions.js +44 -18
package/dist/providers/openai-completions.js.map +1 -1
package/dist/providers/openai-responses-shared.d.ts.map +1 -1
package/dist/providers/openai-responses-shared.js +4 -1
package/dist/providers/openai-responses-shared.js.map +1 -1
package/dist/providers/openai-responses.d.ts.map +1 -1
package/dist/providers/openai-responses.js +6 -10
package/dist/providers/openai-responses.js.map +1 -1
package/dist/providers/simple-options.d.ts.map +1 -1
package/dist/providers/simple-options.js +1 -0
package/dist/providers/simple-options.js.map +1 -1
package/dist/stream.d.ts.map +1 -1
package/dist/stream.js +14 -2
package/dist/stream.js.map +1 -1
package/dist/types.d.ts +21 -5
package/dist/types.d.ts.map +1 -1
package/dist/types.js.map +1 -1
package/dist/utils/abort-signals.d.ts +6 -0
package/dist/utils/abort-signals.d.ts.map +1 -0
package/dist/utils/abort-signals.js +34 -0
package/dist/utils/abort-signals.js.map +1 -0
package/dist/utils/oauth/device-code.d.ts +9 -7
package/dist/utils/oauth/device-code.d.ts.map +1 -1
package/dist/utils/oauth/device-code.js +8 -7
package/dist/utils/oauth/device-code.js.map +1 -1
package/dist/utils/oauth/github-copilot.d.ts.map +1 -1
package/dist/utils/oauth/github-copilot.js +1 -1
package/dist/utils/oauth/github-copilot.js.map +1 -1
package/dist/utils/oauth/index.d.ts +1 -1
package/dist/utils/oauth/index.d.ts.map +1 -1
package/dist/utils/oauth/index.js +1 -1
package/dist/utils/oauth/index.js.map +1 -1
package/dist/utils/oauth/openai-codex.d.ts +10 -1
package/dist/utils/oauth/openai-codex.d.ts.map +1 -1
package/dist/utils/oauth/openai-codex.js +179 -79
package/dist/utils/oauth/openai-codex.js.map +1 -1
package/package.json +104 -91

package/dist/models.generated.js CHANGED Viewed

@@ -157,6 +157,24 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "anthropic.claude-opus-4-8": {
+            id: "anthropic.claude-opus-4-8",
+            name: "Claude Opus 4.8",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "anthropic.claude-sonnet-4-5-20250929-v1:0": {
             id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
             name: "Claude Sonnet 4.5",
@@ -226,6 +244,24 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "au.anthropic.claude-opus-4-8": {
+            id: "au.anthropic.claude-opus-4-8",
+            name: "Claude Opus 4.8 (AU)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
             id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
             name: "Claude Sonnet 4.5 (AU)",
@@ -355,8 +391,8 @@ export const MODELS = {
             thinkingLevelMap: { "xhigh": "max" },
             input: ["text", "image"],
             cost: {
-                input: 5,
-                output: 25,
+                input: 5.5,
+                output: 27.5,
                 cacheRead: 0.5,
                 cacheWrite: 6.25,
             },
@@ -373,10 +409,28 @@ export const MODELS = {
             thinkingLevelMap: { "xhigh": "xhigh" },
             input: ["text", "image"],
             cost: {
-                input: 5,
-                output: 25,
-                cacheRead: 0.5,
-                cacheWrite: 6.25,
+                input: 5.5,
+                output: 27.5,
+                cacheRead: 0.55,
+                cacheWrite: 6.875,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
+        "eu.anthropic.claude-opus-4-8": {
+            id: "eu.anthropic.claude-opus-4-8",
+            name: "Claude Opus 4.8 (EU)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5.5,
+                output: 27.5,
+                cacheRead: 0.55,
+                cacheWrite: 6.875,
             },
             contextWindow: 1000000,
             maxTokens: 128000,
@@ -390,10 +444,10 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 3,
-                output: 15,
-                cacheRead: 0.3,
-                cacheWrite: 3.75,
+                input: 3.3,
+                output: 16.5,
+                cacheRead: 0.33,
+                cacheWrite: 4.125,
             },
             contextWindow: 200000,
             maxTokens: 64000,
@@ -407,10 +461,10 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 3,
-                output: 15,
-                cacheRead: 0.3,
-                cacheWrite: 3.75,
+                input: 3.3,
+                output: 16.5,
+                cacheRead: 0.33,
+                cacheWrite: 4.125,
             },
             contextWindow: 1000000,
             maxTokens: 64000,
@@ -485,6 +539,24 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "global.anthropic.claude-opus-4-8": {
+            id: "global.anthropic.claude-opus-4-8",
+            name: "Claude Opus 4.8 (Global)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
             id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
             name: "Claude Sonnet 4.5 (Global)",
@@ -571,6 +643,24 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "jp.anthropic.claude-opus-4-8": {
+            id: "jp.anthropic.claude-opus-4-8",
+            name: "Claude Opus 4.8 (JP)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
             id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
             name: "Claude Sonnet 4.5 (JP)",
@@ -1270,6 +1360,24 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "us.anthropic.claude-opus-4-8": {
+            id: "us.anthropic.claude-opus-4-8",
+            name: "Claude Opus 4.8 (US)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
             id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
             name: "Claude Sonnet 4.5 (US)",
@@ -1739,7 +1847,26 @@ export const MODELS = {
             api: "anthropic-messages",
             provider: "anthropic",
             baseUrl: "https://api.anthropic.com",
-            compat: { "forceAdaptiveThinking": true },
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
+        "claude-opus-4-8": {
+            id: "claude-opus-4-8",
+            name: "Claude Opus 4.8",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
             reasoning: true,
             thinkingLevelMap: { "xhigh": "xhigh" },
             input: ["text", "image"],
@@ -1919,7 +2046,7 @@ export const MODELS = {
             cost: {
                 input: 0.1,
                 output: 0.4,
-                cacheRead: 0.03,
+                cacheRead: 0.025,
                 cacheWrite: 0,
             },
             contextWindow: 1047576,
@@ -2004,7 +2131,7 @@ export const MODELS = {
             cost: {
                 input: 0.15,
                 output: 0.6,
-                cacheRead: 0.08,
+                cacheRead: 0.075,
                 cacheWrite: 0,
             },
             contextWindow: 128000,
@@ -2130,7 +2257,7 @@ export const MODELS = {
             cost: {
                 input: 1.25,
                 output: 10,
-                cacheRead: 0.13,
+                cacheRead: 0.125,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
@@ -2431,7 +2558,7 @@ export const MODELS = {
             provider: "azure-openai-responses",
             baseUrl: "",
             reasoning: true,
-            thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
+            thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
             input: ["text", "image"],
             cost: {
                 input: 30,
@@ -2555,7 +2682,7 @@ export const MODELS = {
             cost: {
                 input: 1.1,
                 output: 4.4,
-                cacheRead: 0.28,
+                cacheRead: 0.275,
                 cacheWrite: 0,
             },
             contextWindow: 200000,
@@ -2614,23 +2741,6 @@ export const MODELS = {
             contextWindow: 32000,
             maxTokens: 8000,
         },
-        "qwen-3-235b-a22b-instruct-2507": {
-            id: "qwen-3-235b-a22b-instruct-2507",
-            name: "Qwen 3 235B Instruct",
-            api: "openai-completions",
-            provider: "cerebras",
-            baseUrl: "https://api.cerebras.ai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.6,
-                output: 1.2,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131000,
-            maxTokens: 32000,
-        },
         "zai-glm-4.7": {
             id: "zai-glm-4.7",
             name: "Z.AI GLM-4.7",
@@ -2845,7 +2955,26 @@ export const MODELS = {
             api: "anthropic-messages",
             provider: "cloudflare-ai-gateway",
             baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
-            compat: { "forceAdaptiveThinking": true },
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
+        "claude-opus-4-8": {
+            id: "claude-opus-4-8",
+            name: "Claude Opus 4.8",
+            api: "anthropic-messages",
+            provider: "cloudflare-ai-gateway",
+            baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
             reasoning: true,
             thinkingLevelMap: { "xhigh": "xhigh" },
             input: ["text", "image"],
@@ -3353,24 +3482,6 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 128000,
         },
-        "@cf/moonshotai/kimi-k2.5": {
-            id: "@cf/moonshotai/kimi-k2.5",
-            name: "Kimi K2.5",
-            api: "openai-completions",
-            provider: "cloudflare-workers-ai",
-            baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
-            compat: { "sendSessionAffinityHeaders": true },
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.6,
-                output: 3,
-                cacheRead: 0.1,
-                cacheWrite: 0,
-            },
-            contextWindow: 256000,
-            maxTokens: 256000,
-        },
         "@cf/moonshotai/kimi-k2.6": {
             id: "@cf/moonshotai/kimi-k2.6",
             name: "Kimi K2.6",
@@ -3755,8 +3866,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 144000,
-            maxTokens: 32000,
+            contextWindow: 200000,
+            maxTokens: 64000,
         },
         "claude-opus-4.5": {
             id: "claude-opus-4.5",
@@ -3773,7 +3884,7 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 160000,
+            contextWindow: 200000,
             maxTokens: 32000,
         },
         "claude-opus-4.6": {
@@ -3794,7 +3905,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 1000000,
-            maxTokens: 64000,
+            maxTokens: 32000,
         },
         "claude-opus-4.7": {
             id: "claude-opus-4.7",
@@ -3803,7 +3914,27 @@ export const MODELS = {
             provider: "github-copilot",
             baseUrl: "https://api.individual.githubcopilot.com",
             headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
-            compat: { "forceAdaptiveThinking": true },
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 200000,
+            maxTokens: 32000,
+        },
+        "claude-opus-4.8": {
+            id: "claude-opus-4.8",
+            name: "Claude Opus 4.8",
+            api: "anthropic-messages",
+            provider: "github-copilot",
+            baseUrl: "https://api.individual.githubcopilot.com",
+            headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
             reasoning: true,
             thinkingLevelMap: { "xhigh": "xhigh" },
             input: ["text", "image"],
@@ -3813,7 +3944,7 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 144000,
+            contextWindow: 200000,
             maxTokens: 64000,
         },
         "claude-sonnet-4.5": {
@@ -3832,7 +3963,7 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 144000,
+            contextWindow: 200000,
             maxTokens: 32000,
         },
         "claude-sonnet-4.6": {
@@ -3908,7 +4039,7 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
+            contextWindow: 200000,
             maxTokens: 64000,
         },
         "gemini-3.5-flash": {
@@ -3927,7 +4058,7 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 128000,
+            contextWindow: 200000,
             maxTokens: 64000,
         },
         "gpt-4.1": {
@@ -4003,8 +4134,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 264000,
-            maxTokens: 64000,
+            contextWindow: 400000,
+            maxTokens: 128000,
         },
         "gpt-5.2-codex": {
             id: "gpt-5.2-codex",
@@ -4847,7 +4978,7 @@ export const MODELS = {
             cost: {
                 input: 1,
                 output: 3,
-                cacheRead: 0,
+                cacheRead: 0.5,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -4864,7 +4995,7 @@ export const MODELS = {
             cost: {
                 input: 0.15,
                 output: 0.6,
-                cacheRead: 0,
+                cacheRead: 0.075,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
@@ -4881,7 +5012,7 @@ export const MODELS = {
             cost: {
                 input: 0.075,
                 output: 0.3,
-                cacheRead: 0,
+                cacheRead: 0.0375,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
@@ -5167,9 +5298,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 1.74,
-                output: 3.48,
-                cacheRead: 0.145,
+                input: 0.435,
+                output: 0.87,
+                cacheRead: 0.003625,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
@@ -5376,6 +5507,26 @@ export const MODELS = {
             maxTokens: 32768,
         },
     },
+    "llama-cpp": {
+        "local": {
+            id: "local",
+            name: "llama.cpp local server",
+            api: "openai-completions",
+            provider: "llama-cpp",
+            baseUrl: "http://127.0.0.1:8080/v1",
+            compat: { "supportsDeveloperRole": false, "supportsStore": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
+            reasoning: false,
+            input: ["text"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 32768,
+            maxTokens: 4096,
+        },
+    },
     "minimax": {
         "MiniMax-M2.7": {
             id: "MiniMax-M2.7",
@@ -6262,7 +6413,7 @@ export const MODELS = {
             cost: {
                 input: 0.1,
                 output: 0.4,
-                cacheRead: 0.03,
+                cacheRead: 0.025,
                 cacheWrite: 0,
             },
             contextWindow: 1047576,
@@ -6347,7 +6498,7 @@ export const MODELS = {
             cost: {
                 input: 0.15,
                 output: 0.6,
-                cacheRead: 0.08,
+                cacheRead: 0.075,
                 cacheWrite: 0,
             },
             contextWindow: 128000,
@@ -6473,7 +6624,7 @@ export const MODELS = {
             cost: {
                 input: 1.25,
                 output: 10,
-                cacheRead: 0.13,
+                cacheRead: 0.125,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
@@ -6756,7 +6907,7 @@ export const MODELS = {
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: true,
-            thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
+            thinkingLevelMap: { "off": "none", "xhigh": "xhigh", "minimal": null },
             input: ["text", "image"],
             cost: {
                 input: 5,
@@ -6774,7 +6925,7 @@ export const MODELS = {
             provider: "openai",
             baseUrl: "https://api.openai.com/v1",
             reasoning: true,
-            thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
+            thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
             input: ["text", "image"],
             cost: {
                 input: 30,
@@ -6898,7 +7049,7 @@ export const MODELS = {
             cost: {
                 input: 1.1,
                 output: 4.4,
-                cacheRead: 0.28,
+                cacheRead: 0.275,
                 cacheWrite: 0,
             },
             contextWindow: 200000,
@@ -7048,7 +7199,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 200000,
-            maxTokens: 128000,
+            maxTokens: 32000,
         },
         "claude-haiku-4-5": {
             id: "claude-haiku-4-5",
@@ -7126,7 +7277,7 @@ export const MODELS = {
             api: "anthropic-messages",
             provider: "opencode",
             baseUrl: "https://opencode.ai/zen",
-            compat: { "forceAdaptiveThinking": true },
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
             reasoning: true,
             thinkingLevelMap: { "xhigh": "xhigh" },
             input: ["text", "image"],
@@ -7139,9 +7290,28 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
-        "claude-sonnet-4": {
-            id: "claude-sonnet-4",
-            name: "Claude Sonnet 4",
+        "claude-opus-4-8": {
+            id: "claude-opus-4-8",
+            name: "Claude Opus 4.8",
+            api: "anthropic-messages",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen",
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
+        "claude-sonnet-4": {
+            id: "claude-sonnet-4",
+            name: "Claude Sonnet 4",
             api: "anthropic-messages",
             provider: "opencode",
             baseUrl: "https://opencode.ai/zen",
@@ -7191,6 +7361,25 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 64000,
         },
+        "deepseek-v4-flash": {
+            id: "deepseek-v4-flash",
+            name: "DeepSeek V4 Flash",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
+            reasoning: true,
+            thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
+            input: ["text"],
+            cost: {
+                input: 0.14,
+                output: 0.28,
+                cacheRead: 0.03,
+                cacheWrite: 0,
+            },
+            contextWindow: 1000000,
+            maxTokens: 384000,
+        },
         "deepseek-v4-flash-free": {
             id: "deepseek-v4-flash-free",
             name: "DeepSeek V4 Flash Free",
@@ -7575,7 +7764,7 @@ export const MODELS = {
             provider: "opencode",
             baseUrl: "https://opencode.ai/zen/v1",
             reasoning: true,
-            thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
+            thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
             input: ["text", "image"],
             cost: {
                 input: 30,
@@ -7592,7 +7781,9 @@ export const MODELS = {
             api: "openai-completions",
             provider: "opencode",
             baseUrl: "https://opencode.ai/zen/v1",
+            compat: { "supportsReasoningEffort": false },
             reasoning: true,
+            thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
             input: ["text", "image"],
             cost: {
                 input: 1,
@@ -7626,6 +7817,7 @@ export const MODELS = {
             api: "openai-completions",
             provider: "opencode",
             baseUrl: "https://opencode.ai/zen/v1",
+            compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
             reasoning: true,
             input: ["text", "image"],
             cost: {
@@ -7637,6 +7829,23 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 65536,
         },
+        "mimo-v2.5-free": {
+            id: "mimo-v2.5-free",
+            name: "MiMo V2.5 Free",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 200000,
+            maxTokens: 32000,
+        },
         "minimax-m2.5": {
             id: "minimax-m2.5",
             name: "MiniMax M2.5",
@@ -7671,6 +7880,23 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
+        "minimax-m3-free": {
+            id: "minimax-m3-free",
+            name: "MiniMax M3 Free",
+            api: "anthropic-messages",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 200000,
+            maxTokens: 32000,
+        },
         "nemotron-3-super-free": {
             id: "nemotron-3-super-free",
             name: "Nemotron 3 Super Free",
@@ -7819,7 +8045,9 @@ export const MODELS = {
             api: "openai-completions",
             provider: "opencode-go",
             baseUrl: "https://opencode.ai/zen/go/v1",
+            compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
             reasoning: true,
+            thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
             input: ["text", "image"],
             cost: {
                 input: 0.95,
@@ -7839,9 +8067,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.4,
-                output: 2,
-                cacheRead: 0.08,
+                input: 0.14,
+                output: 0.28,
+                cacheRead: 0.0028,
                 cacheWrite: 0,
             },
             contextWindow: 1000000,
@@ -7856,9 +8084,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 1,
-                output: 3,
-                cacheRead: 0.2,
+                input: 1.74,
+                output: 3.48,
+                cacheRead: 0.0145,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
@@ -7898,23 +8126,22 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131072,
         },
-        "qwen3.5-plus": {
-            id: "qwen3.5-plus",
-            name: "Qwen3.5 Plus",
-            api: "openai-completions",
+        "minimax-m3": {
+            id: "minimax-m3",
+            name: "MiniMax M3",
+            api: "anthropic-messages",
             provider: "opencode-go",
-            baseUrl: "https://opencode.ai/zen/go/v1",
-            compat: { "thinkingFormat": "qwen" },
+            baseUrl: "https://opencode.ai/zen/go",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.2,
-                output: 1.2,
-                cacheRead: 0.02,
-                cacheWrite: 0.25,
+                input: 0.6,
+                output: 2.4,
+                cacheRead: 0.12,
+                cacheWrite: 0,
             },
-            contextWindow: 262144,
-            maxTokens: 65536,
+            contextWindow: 512000,
+            maxTokens: 131072,
         },
         "qwen3.6-plus": {
             id: "qwen3.6-plus",
@@ -7934,6 +8161,23 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 65536,
         },
+        "qwen3.7-max": {
+            id: "qwen3.7-max",
+            name: "Qwen3.7 Max",
+            api: "anthropic-messages",
+            provider: "opencode-go",
+            baseUrl: "https://opencode.ai/zen/go",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 2.5,
+                output: 7.5,
+                cacheRead: 0.5,
+                cacheWrite: 3.125,
+            },
+            contextWindow: 1000000,
+            maxTokens: 65536,
+        },
     },
     "openrouter": {
         "ai21/jamba-large-1.7": {
@@ -7953,23 +8197,6 @@ export const MODELS = {
             contextWindow: 256000,
             maxTokens: 4096,
         },
-        "alibaba/tongyi-deepresearch-30b-a3b": {
-            id: "alibaba/tongyi-deepresearch-30b-a3b",
-            name: "Tongyi DeepResearch 30B A3B",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.09,
-                output: 0.44999999999999996,
-                cacheRead: 0.09,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 131072,
-        },
         "amazon/nova-2-lite-v1": {
             id: "amazon/nova-2-lite-v1",
             name: "Amazon: Nova 2 Lite",
@@ -8229,6 +8456,42 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "anthropic/claude-opus-4.8": {
+            id: "anthropic/claude-opus-4.8",
+            name: "Anthropic: Claude Opus 4.8",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
+        "anthropic/claude-opus-4.8-fast": {
+            id: "anthropic/claude-opus-4.8-fast",
+            name: "Anthropic: Claude Opus 4.8 (Fast)",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "anthropic/claude-sonnet-4": {
             id: "anthropic/claude-sonnet-4",
             name: "Anthropic: Claude Sonnet 4",
@@ -8297,23 +8560,6 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 262144,
         },
-        "arcee-ai/trinity-large-thinking:free": {
-            id: "arcee-ai/trinity-large-thinking:free",
-            name: "Arcee AI: Trinity Large Thinking (free)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 262144,
-            maxTokens: 80000,
-        },
         "arcee-ai/trinity-mini": {
             id: "arcee-ai/trinity-mini",
             name: "Arcee AI: Trinity Mini",
@@ -8365,40 +8611,6 @@ export const MODELS = {
             contextWindow: 2000000,
             maxTokens: 30000,
         },
-        "baidu/cobuddy:free": {
-            id: "baidu/cobuddy:free",
-            name: "Baidu Qianfan: CoBuddy (free)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 65536,
-        },
-        "baidu/ernie-4.5-21b-a3b": {
-            id: "baidu/ernie-4.5-21b-a3b",
-            name: "Baidu: ERNIE 4.5 21B A3B",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.07,
-                output: 0.28,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8000,
-        },
         "baidu/ernie-4.5-vl-28b-a3b": {
             id: "baidu/ernie-4.5-vl-28b-a3b",
             name: "Baidu: ERNIE 4.5 VL 28B A3B",
@@ -8527,13 +8739,13 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.32,
-                output: 0.8899999999999999,
+                input: 0.2288,
+                output: 0.9144,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 163840,
-            maxTokens: 16384,
+            contextWindow: 131072,
+            maxTokens: 16000,
         },
         "deepseek/deepseek-chat-v3-0324": {
             id: "deepseek/deepseek-chat-v3-0324",
@@ -8660,37 +8872,18 @@ export const MODELS = {
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
+            compat: { "requiresReasoningContentOnAssistantMessages": true },
             reasoning: true,
-            thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
+            thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
             input: ["text"],
             cost: {
-                input: 0.09999999999999999,
-                output: 0.19999999999999998,
-                cacheRead: 0.02,
+                input: 0.0983,
+                output: 0.1966,
+                cacheRead: 0.019700000000000002,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
-            maxTokens: 16384,
-        },
-        "deepseek/deepseek-v4-flash:free": {
-            id: "deepseek/deepseek-v4-flash:free",
-            name: "DeepSeek: DeepSeek V4 Flash (free)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
-            reasoning: true,
-            thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 384000,
+            maxTokens: 131072,
         },
         "deepseek/deepseek-v4-pro": {
             id: "deepseek/deepseek-v4-pro",
@@ -8698,9 +8891,9 @@ export const MODELS = {
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
+            compat: { "requiresReasoningContentOnAssistantMessages": true },
             reasoning: true,
-            thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
+            thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
             input: ["text"],
             cost: {
                 input: 0.435,
@@ -8742,7 +8935,7 @@ export const MODELS = {
                 cacheRead: 0.024999999999999998,
                 cacheWrite: 0.08333333333333334,
             },
-            contextWindow: 1000000,
+            contextWindow: 1048576,
             maxTokens: 8192,
         },
         "google/gemini-2.0-flash-lite-001": {
@@ -9146,9 +9339,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.075,
-                output: 0.625,
-                cacheRead: 0.015,
+                input: 0.3,
+                output: 2.5,
+                cacheRead: 0.06,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -9239,6 +9432,23 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 4096,
         },
+        "meta-llama/llama-4-maverick": {
+            id: "meta-llama/llama-4-maverick",
+            name: "Meta: Llama 4 Maverick",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 0.15,
+                output: 0.6,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 16384,
+        },
         "meta-llama/llama-4-scout": {
             id: "meta-llama/llama-4-scout",
             name: "Meta: Llama 4 Scout",
@@ -9324,39 +9534,39 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 196608,
         },
-        "minimax/minimax-m2.5:free": {
-            id: "minimax/minimax-m2.5:free",
-            name: "MiniMax: MiniMax M2.5 (free)",
+        "minimax/minimax-m2.7": {
+            id: "minimax/minimax-m2.7",
+            name: "MiniMax: MiniMax M2.7",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0,
-                output: 0,
+                input: 0.26,
+                output: 1.2,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 204800,
-            maxTokens: 8192,
+            maxTokens: 4096,
         },
-        "minimax/minimax-m2.7": {
-            id: "minimax/minimax-m2.7",
-            name: "MiniMax: MiniMax M2.7",
+        "minimax/minimax-m3": {
+            id: "minimax/minimax-m3",
+            name: "MiniMax: MiniMax M3",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 0.27899999999999997,
+                input: 0.3,
                 output: 1.2,
-                cacheRead: 0,
+                cacheRead: 0.06,
                 cacheWrite: 0,
             },
-            contextWindow: 204800,
-            maxTokens: 131072,
+            contextWindow: 1048576,
+            maxTokens: 512000,
         },
         "mistralai/codestral-2508": {
             id: "mistralai/codestral-2508",
@@ -9392,40 +9602,6 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 4096,
         },
-        "mistralai/devstral-medium": {
-            id: "mistralai/devstral-medium",
-            name: "Mistral: Devstral Medium",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.39999999999999997,
-                output: 2,
-                cacheRead: 0.04,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 4096,
-        },
-        "mistralai/devstral-small": {
-            id: "mistralai/devstral-small",
-            name: "Mistral: Devstral Small 1.1",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.09999999999999999,
-                output: 0.3,
-                cacheRead: 0.01,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 4096,
-        },
         "mistralai/ministral-14b-2512": {
             id: "mistralai/ministral-14b-2512",
             name: "Mistral: Ministral 3 14B 2512",
@@ -9511,23 +9687,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 4096,
         },
-        "mistralai/mistral-large-2411": {
-            id: "mistralai/mistral-large-2411",
-            name: "Mistral Large 2411",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 2,
-                output: 6,
-                cacheRead: 0.19999999999999998,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 4096,
-        },
         "mistralai/mistral-large-2512": {
             id: "mistralai/mistral-large-2512",
             name: "Mistral: Mistral Large 3 2512",
@@ -9681,23 +9840,6 @@ export const MODELS = {
             contextWindow: 65536,
             maxTokens: 4096,
         },
-        "mistralai/pixtral-large-2411": {
-            id: "mistralai/pixtral-large-2411",
-            name: "Mistral: Pixtral Large 2411",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 2,
-                output: 6,
-                cacheRead: 0.19999999999999998,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 4096,
-        },
         "mistralai/voxtral-small-24b-2507": {
             id: "mistralai/voxtral-small-24b-2507",
             name: "Mistral: Voxtral Small 24B 2507",
@@ -9789,16 +9931,35 @@ export const MODELS = {
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
+            compat: { "supportsDeveloperRole": false },
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.73,
-                output: 3.49,
-                cacheRead: 0.25,
+                input: 0.684,
+                output: 3.42,
+                cacheRead: 0.144,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262142,
+            maxTokens: 262144,
+        },
+        "moonshotai/kimi-k2.6:free": {
+            id: "moonshotai/kimi-k2.6:free",
+            name: "MoonshotAI: Kimi K2.6 (free)",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            compat: { "supportsDeveloperRole": false },
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 262144,
+            maxTokens: 4096,
         },
         "nex-agi/deepseek-v3.1-nex-n1": {
             id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -10225,23 +10386,6 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 16384,
         },
-        "openai/gpt-4o-audio-preview": {
-            id: "openai/gpt-4o-audio-preview",
-            name: "OpenAI: GPT-4o Audio",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 2.5,
-                output: 10,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 128000,
-            maxTokens: 16384,
-        },
         "openai/gpt-4o-mini": {
             id: "openai/gpt-4o-mini",
             name: "OpenAI: GPT-4o-mini",
@@ -10389,11 +10533,11 @@ export const MODELS = {
             cost: {
                 input: 1.25,
                 output: 10,
-                cacheRead: 0.125,
+                cacheRead: 0.13,
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 16384,
+            maxTokens: 32000,
         },
         "openai/gpt-5.1-codex": {
             id: "openai/gpt-5.1-codex",
@@ -10406,7 +10550,7 @@ export const MODELS = {
             cost: {
                 input: 1.25,
                 output: 10,
-                cacheRead: 0.125,
+                cacheRead: 0.13,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
@@ -10440,11 +10584,11 @@ export const MODELS = {
             cost: {
                 input: 0.25,
                 output: 2,
-                cacheRead: 0.03,
+                cacheRead: 0.024999999999999998,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
-            maxTokens: 128000,
+            maxTokens: 100000,
         },
         "openai/gpt-5.2": {
             id: "openai/gpt-5.2",
@@ -10480,7 +10624,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 128000,
-            maxTokens: 32000,
+            maxTokens: 16384,
         },
         "openai/gpt-5.2-codex": {
             id: "openai/gpt-5.2-codex",
@@ -10651,7 +10795,7 @@ export const MODELS = {
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
-            thinkingLevelMap: { "xhigh": "xhigh" },
+            thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
             input: ["text", "image"],
             cost: {
                 input: 30,
@@ -10756,13 +10900,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.03,
+                input: 0.029,
                 output: 0.14,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 131072,
+            maxTokens: 4096,
         },
         "openai/gpt-oss-20b:free": {
             id: "openai/gpt-oss-20b:free",
@@ -11016,8 +11160,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 8192,
+            contextWindow: 262144,
+            maxTokens: 32768,
         },
         "poolside/laguna-xs.2:free": {
             id: "poolside/laguna-xs.2:free",
@@ -11033,8 +11177,8 @@ export const MODELS = {
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131072,
-            maxTokens: 8192,
+            contextWindow: 262144,
+            maxTokens: 32768,
         },
         "prime-intellect/intellect-3": {
             id: "prime-intellect/intellect-3",
@@ -11045,47 +11189,30 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.19999999999999998,
-                output: 1.1,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 131072,
-        },
-        "qwen/qwen-2.5-72b-instruct": {
-            id: "qwen/qwen-2.5-72b-instruct",
-            name: "Qwen2.5 72B Instruct",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.36,
-                output: 0.39999999999999997,
+                input: 0.19999999999999998,
+                output: 1.1,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 16384,
+            maxTokens: 131072,
         },
-        "qwen/qwen-2.5-7b-instruct": {
-            id: "qwen/qwen-2.5-7b-instruct",
-            name: "Qwen: Qwen2.5 7B Instruct",
+        "qwen/qwen-2.5-72b-instruct": {
+            id: "qwen/qwen-2.5-72b-instruct",
+            name: "Qwen2.5 72B Instruct",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.04,
-                output: 0.09999999999999999,
+                input: 0.36,
+                output: 0.39999999999999997,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 32768,
+            maxTokens: 16384,
         },
         "qwen/qwen-plus": {
             id: "qwen/qwen-plus",
@@ -11116,7 +11243,7 @@ export const MODELS = {
                 input: 0.26,
                 output: 0.78,
                 cacheRead: 0,
-                cacheWrite: 0.325,
+                cacheWrite: 0,
             },
             contextWindow: 1000000,
             maxTokens: 32768,
@@ -11198,13 +11325,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.14950000000000002,
-                output: 1.495,
-                cacheRead: 0,
+                input: 0.09999999999999999,
+                output: 0.09999999999999999,
+                cacheRead: 0.09999999999999999,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 262144,
         },
         "qwen/qwen3-30b-a3b": {
             id: "qwen/qwen3-30b-a3b",
@@ -11640,13 +11767,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.13899999999999998,
+                input: 0.14,
                 output: 1,
-                cacheRead: 0,
+                cacheRead: 0.049999999999999996,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 262144,
         },
         "qwen/qwen3.5-397b-a17b": {
             id: "qwen/qwen3.5-397b-a17b",
@@ -11694,7 +11821,7 @@ export const MODELS = {
                 input: 0.065,
                 output: 0.26,
                 cacheRead: 0,
-                cacheWrite: 0.08125,
+                cacheWrite: 0,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
@@ -11711,7 +11838,7 @@ export const MODELS = {
                 input: 0.26,
                 output: 1.56,
                 cacheRead: 0,
-                cacheWrite: 0.325,
+                cacheWrite: 0,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
@@ -11728,7 +11855,7 @@ export const MODELS = {
                 input: 0.3,
                 output: 1.7999999999999998,
                 cacheRead: 0,
-                cacheWrite: 0,
+                cacheWrite: 0.375,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
@@ -11742,13 +11869,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.3,
+                input: 0.29,
                 output: 3.1999999999999997,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262144,
+            maxTokens: 262140,
         },
         "qwen/qwen3.6-35b-a3b": {
             id: "qwen/qwen3.6-35b-a3b",
@@ -11759,7 +11886,7 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.15,
+                input: 0.14,
                 output: 1,
                 cacheRead: 0,
                 cacheWrite: 0,
@@ -11827,10 +11954,10 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 2.5,
-                output: 7.5,
-                cacheRead: 0,
-                cacheWrite: 3.125,
+                input: 1.25,
+                output: 3.75,
+                cacheRead: 0.25,
+                cacheWrite: 1.5625,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
@@ -11920,6 +12047,23 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 16384,
         },
+        "stepfun/step-3.7-flash": {
+            id: "stepfun/step-3.7-flash",
+            name: "StepFun: Step 3.7 Flash",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.19999999999999998,
+                output: 1.15,
+                cacheRead: 0.04,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 256000,
+        },
         "tencent/hy3-preview": {
             id: "tencent/hy3-preview",
             name: "Tencent: Hy3 preview",
@@ -11929,13 +12073,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.06599999999999999,
-                output: 0.26,
-                cacheRead: 0.029,
+                input: 0.063,
+                output: 0.21,
+                cacheRead: 0.020999999999999998,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262144,
+            maxTokens: 4096,
         },
         "thedrummer/rocinante-12b": {
             id: "thedrummer/rocinante-12b",
@@ -12056,40 +12200,6 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 65536,
         },
-        "xiaomi/mimo-v2-omni": {
-            id: "xiaomi/mimo-v2-omni",
-            name: "Xiaomi: MiMo-V2-Omni",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.39999999999999997,
-                output: 2,
-                cacheRead: 0.08,
-                cacheWrite: 0,
-            },
-            contextWindow: 262144,
-            maxTokens: 65536,
-        },
-        "xiaomi/mimo-v2-pro": {
-            id: "xiaomi/mimo-v2-pro",
-            name: "Xiaomi: MiMo-V2-Pro",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 1,
-                output: 3,
-                cacheRead: 0.19999999999999998,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 131072,
-        },
         "xiaomi/mimo-v2.5": {
             id: "xiaomi/mimo-v2.5",
             name: "Xiaomi: MiMo-V2.5",
@@ -12099,9 +12209,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.39999999999999997,
-                output: 2,
-                cacheRead: 0.08,
+                input: 0.14,
+                output: 0.28,
+                cacheRead: 0.0028,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
@@ -12116,13 +12226,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 1,
-                output: 3,
-                cacheRead: 0.19999999999999998,
+                input: 0.435,
+                output: 0.87,
+                cacheRead: 0.0036,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
-            maxTokens: 16384,
+            maxTokens: 131072,
         },
         "z-ai/glm-4-32b": {
             id: "z-ai/glm-4-32b",
@@ -12167,13 +12277,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.13,
+                input: 0.125,
                 output: 0.85,
-                cacheRead: 0.024999999999999998,
+                cacheRead: 0.06,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 98304,
+            maxTokens: 131070,
         },
         "z-ai/glm-4.5-air:free": {
             id: "z-ai/glm-4.5-air:free",
@@ -12439,13 +12549,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.73,
-                output: 3.49,
-                cacheRead: 0.25,
+                input: 0.684,
+                output: 3.42,
+                cacheRead: 0.144,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262142,
+            maxTokens: 262144,
         },
         "~openai/gpt-latest": {
             id: "~openai/gpt-latest",
@@ -12843,20 +12953,20 @@ export const MODELS = {
         },
         "alibaba/qwen-3-235b": {
             id: "alibaba/qwen-3-235b",
-            name: "Qwen3 235B A22b Instruct 2507",
+            name: "Qwen3 235B A22B",
             api: "anthropic-messages",
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.6,
-                output: 1.2,
-                cacheRead: 0.6,
+                input: 0.22,
+                output: 0.88,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 131000,
-            maxTokens: 40000,
+            contextWindow: 262144,
+            maxTokens: 16384,
         },
         "alibaba/qwen-3-30b": {
             id: "alibaba/qwen-3-30b",
@@ -13274,7 +13384,26 @@ export const MODELS = {
             api: "anthropic-messages",
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
-            compat: { "forceAdaptiveThinking": true },
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
+            reasoning: true,
+            thinkingLevelMap: { "xhigh": "xhigh" },
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 25,
+                cacheRead: 0.5,
+                cacheWrite: 6.25,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
+        "anthropic/claude-opus-4.8": {
+            id: "anthropic/claude-opus-4.8",
+            name: "Claude Opus 4.8",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
             reasoning: true,
             thinkingLevelMap: { "xhigh": "xhigh" },
             input: ["text", "image"],
@@ -13433,17 +13562,17 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.77,
-                output: 0.77,
-                cacheRead: 0,
+                input: 0.27,
+                output: 1.12,
+                cacheRead: 0.135,
                 cacheWrite: 0,
             },
             contextWindow: 163840,
-            maxTokens: 16384,
+            maxTokens: 163840,
         },
         "deepseek/deepseek-v3.1": {
             id: "deepseek/deepseek-v3.1",
-            name: "DeepSeek-V3.1",
+            name: "DeepSeek V3.1",
             api: "anthropic-messages",
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
@@ -14070,6 +14199,23 @@ export const MODELS = {
             contextWindow: 204800,
             maxTokens: 131100,
         },
+        "minimax/minimax-m3": {
+            id: "minimax/minimax-m3",
+            name: "MiniMax M3",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.3,
+                output: 1.2,
+                cacheRead: 0.06,
+                cacheWrite: 0,
+            },
+            contextWindow: 1000000,
+            maxTokens: 1000000,
+        },
         "mistral/codestral": {
             id: "mistral/codestral",
             name: "Mistral Codestral",
@@ -14887,7 +15033,7 @@ export const MODELS = {
             provider: "vercel-ai-gateway",
             baseUrl: "https://ai-gateway.vercel.sh",
             reasoning: true,
-            thinkingLevelMap: { "xhigh": "xhigh" },
+            thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
             input: ["text", "image"],
             cost: {
                 input: 30,
@@ -15068,6 +15214,40 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 8000,
         },
+        "stepfun/step-3.5-flash": {
+            id: "stepfun/step-3.5-flash",
+            name: "StepFun 3.5 Flash",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0.09,
+                output: 0.3,
+                cacheRead: 0,
+                cacheWrite: 0.02,
+            },
+            contextWindow: 262114,
+            maxTokens: 262114,
+        },
+        "stepfun/step-3.7-flash": {
+            id: "stepfun/step-3.7-flash",
+            name: "Step 3.7 Flash",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.19999999999999998,
+                output: 1.15,
+                cacheRead: 0.04,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 256000,
+        },
         "xai/grok-4.1-fast-non-reasoning": {
             id: "xai/grok-4.1-fast-non-reasoning",
             name: "Grok 4.1 Fast Non-Reasoning",
@@ -15281,9 +15461,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.39999999999999997,
-                output: 2,
-                cacheRead: 0.08,
+                input: 0.14,
+                output: 0.28,
+                cacheRead: 0.0028,
                 cacheWrite: 0,
             },
             contextWindow: 1050000,
@@ -15298,9 +15478,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 1,
-                output: 3,
-                cacheRead: 0.19999999999999998,
+                input: 0.435,
+                output: 0.87,
+                cacheRead: 0.0036,
                 cacheWrite: 0,
             },
             contextWindow: 1050000,
@@ -15742,24 +15922,6 @@ export const MODELS = {
         },
     },
     "xiaomi-token-plan-ams": {
-        "mimo-v2-flash": {
-            id: "mimo-v2-flash",
-            name: "MiMo-V2-Flash",
-            api: "openai-completions",
-            provider: "xiaomi-token-plan-ams",
-            baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
-            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.1,
-                output: 0.3,
-                cacheRead: 0.01,
-                cacheWrite: 0,
-            },
-            contextWindow: 262144,
-            maxTokens: 65536,
-        },
         "mimo-v2-omni": {
             id: "mimo-v2-omni",
             name: "MiMo-V2-Omni",
@@ -15834,24 +15996,6 @@ export const MODELS = {
         },
     },
     "xiaomi-token-plan-cn": {
-        "mimo-v2-flash": {
-            id: "mimo-v2-flash",
-            name: "MiMo-V2-Flash",
-            api: "openai-completions",
-            provider: "xiaomi-token-plan-cn",
-            baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
-            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.1,
-                output: 0.3,
-                cacheRead: 0.01,
-                cacheWrite: 0,
-            },
-            contextWindow: 262144,
-            maxTokens: 65536,
-        },
         "mimo-v2-omni": {
             id: "mimo-v2-omni",
             name: "MiMo-V2-Omni",
@@ -15926,24 +16070,6 @@ export const MODELS = {
         },
     },
     "xiaomi-token-plan-sgp": {
-        "mimo-v2-flash": {
-            id: "mimo-v2-flash",
-            name: "MiMo-V2-Flash",
-            api: "openai-completions",
-            provider: "xiaomi-token-plan-sgp",
-            baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
-            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.1,
-                output: 0.3,
-                cacheRead: 0.01,
-                cacheWrite: 0,
-            },
-            contextWindow: 262144,
-            maxTokens: 65536,
-        },
         "mimo-v2-omni": {
             id: "mimo-v2-omni",
             name: "MiMo-V2-Omni",