npm - @fleetagent/pi-ai - Versions diffs - 0.0.9 → 0.0.10 - Mend

@fleetagent/pi-ai 0.0.9 → 0.0.10

This diff shows the changes between two publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (9)

package/dist/image-models.generated.d.ts +2 -2
package/dist/image-models.generated.d.ts.map +1 -1
package/dist/image-models.generated.js +6 -6
package/dist/image-models.generated.js.map +1 -1
package/dist/models.generated.d.ts +273 -283
package/dist/models.generated.d.ts.map +1 -1
package/dist/models.generated.js +295 -324
package/dist/models.generated.js.map +1 -1
package/package.json +1 -1

package/dist/models.generated.js (changed)

@@ -8,7 +8,7 @@ export const MODELS = {
             api: "bedrock-converse-stream",
             provider: "amazon-bedrock",
             baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
-            reasoning: false,
+            reasoning: true,
             input: ["text", "image"],
             cost: {
                 input: 0.33,
@@ -345,6 +345,23 @@ export const MODELS = {
             contextWindow: 163840,
             maxTokens: 81920,
         },
+        "eu.anthropic.claude-fable-5": {
+            id: "eu.anthropic.claude-fable-5",
+            name: "Claude Fable 5 (EU)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 11,
+                output: 55,
+                cacheRead: 1.1,
+                cacheWrite: 13.75,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "eu.anthropic.claude-haiku-4-5-20251001-v1:0": {
             id: "eu.anthropic.claude-haiku-4-5-20251001-v1:0",
             name: "Claude Haiku 4.5 (EU)",
@@ -466,6 +483,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 64000,
         },
+        "global.anthropic.claude-fable-5": {
+            id: "global.anthropic.claude-fable-5",
+            name: "Claude Fable 5 (Global)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "global.anthropic.claude-haiku-4-5-20251001-v1:0": {
             id: "global.anthropic.claude-haiku-4-5-20251001-v1:0",
             name: "Claude Haiku 4.5 (Global)",
@@ -1123,7 +1157,7 @@ export const MODELS = {
             api: "bedrock-converse-stream",
             provider: "amazon-bedrock",
             baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 0.15,
@@ -1140,7 +1174,7 @@ export const MODELS = {
             api: "bedrock-converse-stream",
             provider: "amazon-bedrock",
             baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 0.15,
@@ -1157,7 +1191,7 @@ export const MODELS = {
             api: "bedrock-converse-stream",
             provider: "amazon-bedrock",
             baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 0.07,
@@ -1174,7 +1208,7 @@ export const MODELS = {
             api: "bedrock-converse-stream",
             provider: "amazon-bedrock",
             baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 0.07,
@@ -1338,6 +1372,23 @@ export const MODELS = {
             contextWindow: 262000,
             maxTokens: 262000,
         },
+        "us.anthropic.claude-fable-5": {
+            id: "us.anthropic.claude-fable-5",
+            name: "Claude Fable 5 (US)",
+            api: "bedrock-converse-stream",
+            provider: "amazon-bedrock",
+            baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "us.anthropic.claude-haiku-4-5-20251001-v1:0": {
             id: "us.anthropic.claude-haiku-4-5-20251001-v1:0",
             name: "Claude Haiku 4.5 (US)",
@@ -1750,6 +1801,23 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 4096,
         },
+        "claude-fable-5": {
+            id: "claude-fable-5",
+            name: "Claude Fable 5",
+            api: "anthropic-messages",
+            provider: "anthropic",
+            baseUrl: "https://api.anthropic.com",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "claude-haiku-4-5": {
             id: "claude-haiku-4-5",
             name: "Claude Haiku 4.5 (latest)",
@@ -2925,6 +2993,23 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 8192,
         },
+        "claude-fable-5": {
+            id: "claude-fable-5",
+            name: "Claude Fable 5",
+            api: "anthropic-messages",
+            provider: "cloudflare-ai-gateway",
+            baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "claude-haiku-4-5": {
             id: "claude-haiku-4-5",
             name: "Claude Haiku 4.5 (latest)",
@@ -4861,77 +4946,9 @@ export const MODELS = {
         },
     },
     "groq": {
-        "deepseek-r1-distill-llama-70b": {
-            id: "deepseek-r1-distill-llama-70b",
-            name: "DeepSeek R1 Distill Llama 70B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.75,
-                output: 0.99,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
-        "gemma2-9b-it": {
-            id: "gemma2-9b-it",
-            name: "Gemma 2 9B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.2,
-                output: 0.2,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 8192,
-        },
-        "groq/compound": {
-            id: "groq/compound",
-            name: "Compound",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
-        "groq/compound-mini": {
-            id: "groq/compound-mini",
-            name: "Compound Mini",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
         "llama-3.1-8b-instant": {
             id: "llama-3.1-8b-instant",
-            name: "Llama 3.1 8B Instant",
+            name: "Llama 3.1 8B",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
@@ -4948,7 +4965,7 @@ export const MODELS = {
         },
         "llama-3.3-70b-versatile": {
             id: "llama-3.3-70b-versatile",
-            name: "Llama 3.3 70B Versatile",
+            name: "Llama 3.3 70B",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
@@ -4963,60 +4980,9 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 32768,
         },
-        "llama3-70b-8192": {
-            id: "llama3-70b-8192",
-            name: "Llama 3 70B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.59,
-                output: 0.79,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 8192,
-        },
-        "llama3-8b-8192": {
-            id: "llama3-8b-8192",
-            name: "Llama 3 8B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.05,
-                output: 0.08,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 8192,
-        },
-        "meta-llama/llama-4-maverick-17b-128e-instruct": {
-            id: "meta-llama/llama-4-maverick-17b-128e-instruct",
-            name: "Llama 4 Maverick 17B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.2,
-                output: 0.6,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
         "meta-llama/llama-4-scout-17b-16e-instruct": {
             id: "meta-llama/llama-4-scout-17b-16e-instruct",
-            name: "Llama 4 Scout 17B",
+            name: "Llama 4 Scout 17B 16E",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
@@ -5031,57 +4997,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "mistral-saba-24b": {
-            id: "mistral-saba-24b",
-            name: "Mistral Saba 24B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.79,
-                output: 0.79,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 32768,
-            maxTokens: 32768,
-        },
-        "moonshotai/kimi-k2-instruct": {
-            id: "moonshotai/kimi-k2-instruct",
-            name: "Kimi K2 Instruct",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 1,
-                output: 3,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 16384,
-        },
-        "moonshotai/kimi-k2-instruct-0905": {
-            id: "moonshotai/kimi-k2-instruct-0905",
-            name: "Kimi K2 Instruct 0905",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 1,
-                output: 3,
-                cacheRead: 0.5,
-                cacheWrite: 0,
-            },
-            contextWindow: 262144,
-            maxTokens: 16384,
-        },
         "openai/gpt-oss-120b": {
             id: "openai/gpt-oss-120b",
             name: "GPT OSS 120B",
@@ -5133,26 +5048,9 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 65536,
         },
-        "qwen-qwq-32b": {
-            id: "qwen-qwq-32b",
-            name: "Qwen QwQ 32B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.29,
-                output: 0.39,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 16384,
-        },
         "qwen/qwen3-32b": {
             id: "qwen/qwen3-32b",
-            name: "Qwen3 32B",
+            name: "Qwen3-32B",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
@@ -7313,6 +7211,23 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 32000,
         },
+        "claude-fable-5": {
+            id: "claude-fable-5",
+            name: "Claude Fable 5",
+            api: "anthropic-messages",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "claude-haiku-4-5": {
             id: "claude-haiku-4-5",
             name: "Claude Haiku 4.5",
@@ -7485,7 +7400,7 @@ export const MODELS = {
             cost: {
                 input: 0.14,
                 output: 0.28,
-                cacheRead: 0.03,
+                cacheRead: 0.028,
                 cacheWrite: 0,
             },
             contextWindow: 1000000,
@@ -7510,6 +7425,25 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 128000,
         },
+        "deepseek-v4-pro": {
+            id: "deepseek-v4-pro",
+            name: "DeepSeek V4 Pro",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
+            reasoning: true,
+            thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
+            input: ["text"],
+            cost: {
+                input: 1.74,
+                output: 3.84,
+                cacheRead: 0.145,
+                cacheWrite: 0,
+            },
+            contextWindow: 1000000,
+            maxTokens: 384000,
+        },
         "gemini-3-flash": {
             id: "gemini-3-flash",
             name: "Gemini 3 Flash",
@@ -8008,6 +7942,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 128000,
         },
+        "north-mini-code-free": {
+            id: "north-mini-code-free",
+            name: "North Mini Code Free",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 256000,
+            maxTokens: 64000,
+        },
         "qwen3.5-plus": {
             id: "qwen3.5-plus",
             name: "Qwen3.5 Plus",
@@ -8229,9 +8180,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.6,
-                output: 2.4,
-                cacheRead: 0.12,
+                input: 0.3,
+                output: 1.2,
+                cacheRead: 0.06,
                 cacheWrite: 0,
             },
             contextWindow: 512000,
@@ -8427,6 +8378,23 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 8192,
         },
+        "anthropic/claude-fable-5": {
+            id: "anthropic/claude-fable-5",
+            name: "Anthropic: Claude Fable 5",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "anthropic/claude-haiku-4.5": {
             id: "anthropic/claude-haiku-4.5",
             name: "Anthropic: Claude Haiku 4.5",
@@ -8853,7 +8821,7 @@ export const MODELS = {
                 cacheRead: 0.135,
                 cacheWrite: 0,
             },
-            contextWindow: 163840,
+            contextWindow: 131072,
             maxTokens: 16384,
         },
         "deepseek/deepseek-chat-v3.1": {
@@ -9585,8 +9553,8 @@ export const MODELS = {
             input: ["text"],
             cost: {
                 input: 0.15,
-                output: 1.15,
-                cacheRead: 0,
+                output: 0.8999999999999999,
+                cacheRead: 0.049999999999999996,
                 cacheWrite: 0,
             },
             contextWindow: 204800,
@@ -9601,13 +9569,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.27899999999999997,
-                output: 1.2,
-                cacheRead: 0,
+                input: 0.27,
+                output: 1.08,
+                cacheRead: 0.054,
                 cacheWrite: 0,
             },
             contextWindow: 204800,
-            maxTokens: 196608,
+            maxTokens: 131072,
         },
         "minimax/minimax-m3": {
             id: "minimax/minimax-m3",
@@ -9993,21 +9961,20 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.684,
-                output: 3.42,
-                cacheRead: 0.144,
+                input: 0.6799999999999999,
+                output: 3.41,
+                cacheRead: 0.33999999999999997,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262144,
+            maxTokens: 262142,
         },
-        "moonshotai/kimi-k2.6:free": {
-            id: "moonshotai/kimi-k2.6:free",
-            name: "MoonshotAI: Kimi K2.6 (free)",
+        "nex-agi/nex-n2-pro:free": {
+            id: "nex-agi/nex-n2-pro:free",
+            name: "Nex AGI: Nex-N2-Pro (free)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            compat: { "supportsDeveloperRole": false },
             reasoning: true,
             input: ["text", "image"],
             cost: {
@@ -10017,24 +9984,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
-        },
-        "nex-agi/deepseek-v3.1-nex-n1": {
-            id: "nex-agi/deepseek-v3.1-nex-n1",
-            name: "Nex AGI: DeepSeek V3.1 Nex N1",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.135,
-                output: 0.5,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 163840,
+            maxTokens: 262144,
         },
         "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
             id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
@@ -11944,13 +11894,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.14,
+                input: 0.15,
                 output: 1,
-                cacheRead: 0,
+                cacheRead: 0.049999999999999996,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262140,
+            maxTokens: 262144,
         },
         "qwen/qwen3.6-flash": {
             id: "qwen/qwen3.6-flash",
@@ -12292,23 +12242,6 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 131072,
         },
-        "z-ai/glm-4-32b": {
-            id: "z-ai/glm-4-32b",
-            name: "Z.ai: GLM 4 32B ",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.09999999999999999,
-                output: 0.09999999999999999,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 128000,
-            maxTokens: 4096,
-        },
         "z-ai/glm-4.5": {
             id: "z-ai/glm-4.5",
             name: "Z.ai: GLM 4.5",
@@ -12343,23 +12276,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 131070,
         },
-        "z-ai/glm-4.5-air:free": {
-            id: "z-ai/glm-4.5-air:free",
-            name: "Z.ai: GLM 4.5 Air (free)",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 96000,
-        },
         "z-ai/glm-4.5v": {
             id: "z-ai/glm-4.5v",
             name: "Z.ai: GLM 4.5V",
@@ -12405,11 +12321,11 @@ export const MODELS = {
             cost: {
                 input: 0.3,
                 output: 0.8999999999999999,
-                cacheRead: 0.049999999999999996,
+                cacheRead: 0.055,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 24000,
+            maxTokens: 32768,
         },
         "z-ai/glm-4.7": {
             id: "z-ai/glm-4.7",
@@ -12476,7 +12392,7 @@ export const MODELS = {
                 cacheRead: 0.24,
                 cacheWrite: 0,
             },
-            contextWindow: 202752,
+            contextWindow: 262144,
             maxTokens: 131072,
         },
         "z-ai/glm-5.1": {
@@ -12496,22 +12412,22 @@ export const MODELS = {
             contextWindow: 202752,
             maxTokens: 4096,
         },
-        "z-ai/glm-5v-turbo": {
-            id: "z-ai/glm-5v-turbo",
-            name: "Z.ai: GLM 5V Turbo",
+        "~anthropic/claude-fable-latest": {
+            id: "~anthropic/claude-fable-latest",
+            name: "Anthropic: Claude Fable Latest",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 1.2,
-                output: 4,
-                cacheRead: 0.24,
-                cacheWrite: 0,
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
             },
-            contextWindow: 202752,
-            maxTokens: 131072,
+            contextWindow: 1000000,
+            maxTokens: 128000,
         },
         "~anthropic/claude-haiku-latest": {
             id: "~anthropic/claude-haiku-latest",
@@ -12607,13 +12523,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.684,
-                output: 3.42,
-                cacheRead: 0.144,
+                input: 0.6799999999999999,
+                output: 3.41,
+                cacheRead: 0.33999999999999997,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262144,
+            maxTokens: 262142,
         },
         "~openai/gpt-latest": {
             id: "~openai/gpt-latest",
@@ -13054,8 +12970,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.08,
-                output: 0.29,
+                input: 0.12,
+                output: 0.5,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -13419,6 +13335,23 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 8192,
         },
+        "anthropic/claude-fable-5": {
+            id: "anthropic/claude-fable-5",
+            name: "Claude Fable 5",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "anthropic/claude-haiku-4.5": {
             id: "anthropic/claude-haiku-4.5",
             name: "Claude Haiku 4.5",
@@ -13799,40 +13732,6 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 384000,
         },
-        "google/gemini-2.0-flash": {
-            id: "google/gemini-2.0-flash",
-            name: "Gemini 2.0 Flash",
-            api: "anthropic-messages",
-            provider: "vercel-ai-gateway",
-            baseUrl: "https://ai-gateway.vercel.sh",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.15,
-                output: 0.6,
-                cacheRead: 0.024999999999999998,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 8192,
-        },
-        "google/gemini-2.0-flash-lite": {
-            id: "google/gemini-2.0-flash-lite",
-            name: "Gemini 2.0 Flash Lite",
-            api: "anthropic-messages",
-            provider: "vercel-ai-gateway",
-            baseUrl: "https://ai-gateway.vercel.sh",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.075,
-                output: 0.3,
-                cacheRead: 0.02,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 8192,
-        },
         "google/gemini-2.5-flash": {
             id: "google/gemini-2.5-flash",
             name: "Gemini 2.5 Flash",
@@ -15952,7 +15851,7 @@ export const MODELS = {
                 cacheRead: 0.2,
                 cacheWrite: 0,
             },
-            contextWindow: 2000000,
+            contextWindow: 1000000,
             maxTokens: 30000,
         },
         "grok-4.20-0309-reasoning": {
@@ -15969,7 +15868,7 @@ export const MODELS = {
                 cacheRead: 0.2,
                 cacheWrite: 0,
             },
-            contextWindow: 2000000,
+            contextWindow: 1000000,
             maxTokens: 30000,
         },
         "grok-4.3": {
@@ -16115,6 +16014,24 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 131072,
         },
+        "mimo-v2.5-pro-ultraspeed": {
+            id: "mimo-v2.5-pro-ultraspeed",
+            name: "MiMo-V2.5-Pro-UltraSpeed",
+            api: "openai-completions",
+            provider: "xiaomi",
+            baseUrl: "https://api.xiaomimimo.com/v1",
+            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1.305,
+                output: 2.61,
+                cacheRead: 0.0108,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 131072,
+        },
     },
     "xiaomi-token-plan-ams": {
         "mimo-v2-omni": {
@@ -16189,6 +16106,24 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 131072,
         },
+        "mimo-v2.5-pro-ultraspeed": {
+            id: "mimo-v2.5-pro-ultraspeed",
+            name: "MiMo-V2.5-Pro-UltraSpeed",
+            api: "openai-completions",
+            provider: "xiaomi-token-plan-ams",
+            baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
+            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1.305,
+                output: 2.61,
+                cacheRead: 0.0108,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 131072,
+        },
     },
     "xiaomi-token-plan-cn": {
         "mimo-v2-omni": {
@@ -16263,6 +16198,24 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 131072,
         },
+        "mimo-v2.5-pro-ultraspeed": {
+            id: "mimo-v2.5-pro-ultraspeed",
+            name: "MiMo-V2.5-Pro-UltraSpeed",
+            api: "openai-completions",
+            provider: "xiaomi-token-plan-cn",
+            baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
+            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1.305,
+                output: 2.61,
+                cacheRead: 0.0108,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 131072,
+        },
     },
     "xiaomi-token-plan-sgp": {
         "mimo-v2-omni": {
@@ -16337,6 +16290,24 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 131072,
         },
+        "mimo-v2.5-pro-ultraspeed": {
+            id: "mimo-v2.5-pro-ultraspeed",
+            name: "MiMo-V2.5-Pro-UltraSpeed",
+            api: "openai-completions",
+            provider: "xiaomi-token-plan-sgp",
+            baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
+            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 1.305,
+                output: 2.61,
+                cacheRead: 0.0108,
+                cacheWrite: 0,
+            },
+            contextWindow: 1048576,
+            maxTokens: 131072,
+        },
     },
     "zai": {
         "glm-4.5-air": {