npm - @clinebot/llms - Versions diffs - 0.0.10 → 0.0.12 - Mend

@clinebot/llms 0.0.10 → 0.0.12

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27) hide show

package/dist/index.browser.js +14 -14
package/dist/index.js +13 -13
package/dist/providers/handlers/ai-sdk-community.d.ts +1 -1
package/dist/providers/handlers/base.d.ts +7 -2
package/dist/providers/types/stream.d.ts +1 -1
package/package.json +2 -2
package/src/models/generated.ts +223 -641
package/src/models/models-dev-catalog.test.ts +2 -2
package/src/models/models-dev-catalog.ts +9 -2
package/src/providers/handlers/ai-sdk-community.ts +3 -0
package/src/providers/handlers/ai-sdk-provider-base.ts +12 -2
package/src/providers/handlers/anthropic-base.test.ts +30 -0
package/src/providers/handlers/anthropic-base.ts +31 -29
package/src/providers/handlers/base.test.ts +127 -2
package/src/providers/handlers/base.ts +115 -1
package/src/providers/handlers/bedrock-base.ts +4 -4
package/src/providers/handlers/community-sdk.test.ts +33 -0
package/src/providers/handlers/gemini-base.ts +6 -19
package/src/providers/handlers/openai-base.ts +33 -14
package/src/providers/handlers/openai-responses.test.ts +46 -0
package/src/providers/handlers/openai-responses.ts +12 -8
package/src/providers/handlers/r1-base.ts +10 -8
package/src/providers/handlers/vertex.ts +14 -4
package/src/providers/transform/anthropic-format.ts +14 -2
package/src/providers/transform/format-conversion.test.ts +23 -0
package/src/providers/transform/gemini-format.ts +77 -1
package/src/providers/types/stream.ts +1 -1

package/src/models/generated.ts CHANGED Viewed

@@ -14,7 +14,7 @@ export const GENERATED_PROVIDER_MODELS: {
 	version: number;
 	providers: Record<string, Record<string, ModelInfo>>;
 } = {
-	version: 1774031158558,
+	version: 1774365323810,
 	providers: {
 		aihubmix: {
 			"claude-sonnet-4-6": {
@@ -147,7 +147,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "kimi-k2.5",
 				name: "Kimi K2.5",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -545,7 +545,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "Kimi-K2-0905",
 				name: "Kimi K2 0905",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.55,
@@ -587,7 +587,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen3-235b-a22b-instruct-2507",
 				name: "Qwen3 235B A22B Instruct 2507",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.28,
@@ -601,7 +601,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen3-235b-a22b-thinking-2507",
 				name: "Qwen3 235B A22B Thinking 2507",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.28,
@@ -993,8 +993,8 @@ export const GENERATED_PROVIDER_MODELS: {
 			},
 		},
 		baseten: {
-			"nvidia/Nemotron-3-Super": {
-				id: "nvidia/Nemotron-3-Super",
+			"nvidia/Nemotron-120B-A12B": {
+				id: "nvidia/Nemotron-120B-A12B",
 				name: "Nemotron 3 Super",
 				contextWindow: 262144,
 				maxTokens: 32678,
@@ -1011,7 +1011,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "MiniMaxAI/MiniMax-M2.5",
 				name: "MiniMax-M2.5",
 				contextWindow: 204000,
-				maxTokens: 204000,
+				maxTokens: 10200,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.3,
@@ -1067,7 +1067,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "zai-org/GLM-4.6",
 				name: "GLM 4.6",
 				contextWindow: 200000,
-				maxTokens: 200000,
+				maxTokens: 10000,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -1095,7 +1095,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "openai/gpt-oss-120b",
 				name: "GPT OSS 120B",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.1,
@@ -1191,6 +1191,34 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2026-02-17",
 			},
+			"minimax.minimax-m2.5": {
+				id: "minimax.minimax-m2.5",
+				name: "MiniMax M2.5",
+				contextWindow: 1000000,
+				maxTokens: 131072,
+				capabilities: ["tools", "reasoning", "temperature"],
+				pricing: {
+					input: 0.3,
+					output: 1.2,
+					cacheRead: 0,
+					cacheWrite: 0,
+				},
+				releaseDate: "2026-02-12",
+			},
+			"zai.glm-5": {
+				id: "zai.glm-5",
+				name: "GLM-5",
+				contextWindow: 200000,
+				maxTokens: 131072,
+				capabilities: ["tools", "reasoning", "temperature"],
+				pricing: {
+					input: 1,
+					output: 3.2,
+					cacheRead: 0,
+					cacheWrite: 0,
+				},
+				releaseDate: "2026-02-11",
+			},
 			"deepseek.v3.2": {
 				id: "deepseek.v3.2",
 				name: "DeepSeek-V3.2",
@@ -1209,7 +1237,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai.kimi-k2.5",
 				name: "Kimi K2.5",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -1377,7 +1405,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshot.kimi-k2-thinking",
 				name: "Kimi K2 Thinking",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -1517,7 +1545,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen.qwen3-vl-235b-a22b",
 				name: "Qwen/Qwen3-VL-235B-A22B-Instruct",
 				contextWindow: 262000,
-				maxTokens: 262000,
+				maxTokens: 13100,
 				capabilities: ["images", "tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.3,
@@ -1615,7 +1643,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen.qwen3-32b-v1:0",
 				name: "Qwen3 32B (dense)",
 				contextWindow: 16384,
-				maxTokens: 16384,
+				maxTokens: 819,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.15,
@@ -1657,7 +1685,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen.qwen3-next-80b-a3b",
 				name: "Qwen/Qwen3-Next-80B-A3B-Instruct",
 				contextWindow: 262000,
-				maxTokens: 262000,
+				maxTokens: 13100,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.14,
@@ -2377,7 +2405,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "accounts/fireworks/models/minimax-m2p5",
 				name: "MiniMax-M2.5",
 				contextWindow: 196608,
-				maxTokens: 196608,
+				maxTokens: 9830,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.3,
@@ -2405,7 +2433,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "accounts/fireworks/models/kimi-k2p5",
 				name: "Kimi K2.5",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -2415,11 +2443,25 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2026-01-27",
 			},
+			"accounts/fireworks/routers/kimi-k2p5-turbo": {
+				id: "accounts/fireworks/routers/kimi-k2p5-turbo",
+				name: "Kimi K2.5 Turbo",
+				contextWindow: 256000,
+				maxTokens: 12800,
+				capabilities: ["images", "tools", "reasoning", "temperature"],
+				pricing: {
+					input: 0,
+					output: 0,
+					cacheRead: 0,
+					cacheWrite: 0,
+				},
+				releaseDate: "2026-01-27",
+			},
 			"accounts/fireworks/models/minimax-m2p1": {
 				id: "accounts/fireworks/models/minimax-m2p1",
 				name: "MiniMax-M2.1",
 				contextWindow: 200000,
-				maxTokens: 200000,
+				maxTokens: 10000,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.3,
@@ -2433,7 +2475,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "accounts/fireworks/models/glm-4p7",
 				name: "GLM 4.7",
 				contextWindow: 198000,
-				maxTokens: 198000,
+				maxTokens: 9900,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -2447,7 +2489,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "accounts/fireworks/models/deepseek-v3p2",
 				name: "DeepSeek V3.2",
 				contextWindow: 160000,
-				maxTokens: 160000,
+				maxTokens: 8000,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.56,
@@ -2461,7 +2503,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "accounts/fireworks/models/kimi-k2-thinking",
 				name: "Kimi K2 Thinking",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -2475,7 +2517,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "accounts/fireworks/models/deepseek-v3p1",
 				name: "DeepSeek V3.1",
 				contextWindow: 163840,
-				maxTokens: 163840,
+				maxTokens: 8192,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.56,
@@ -2517,7 +2559,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "accounts/fireworks/models/glm-4p5-air",
 				name: "GLM 4.5 Air",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.22,
@@ -2531,7 +2573,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "accounts/fireworks/models/glm-4p5",
 				name: "GLM 4.5",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.55,
@@ -3124,7 +3166,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "llama-3.1-8b-instant",
 				name: "Llama 3.1 8B Instant",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.05,
@@ -3196,7 +3238,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai/Kimi-K2.5",
 				name: "Kimi-K2.5",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -3266,7 +3308,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai/Kimi-K2-Thinking",
 				name: "Kimi-K2-Thinking",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -3378,7 +3420,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "deepseek-ai/DeepSeek-R1-0528",
 				name: "DeepSeek-R1-0528",
 				contextWindow: 163840,
-				maxTokens: 163840,
+				maxTokens: 8192,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 3,
@@ -3524,7 +3566,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "kimi-k2.5",
 				name: "Kimi K2.5",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["images", "tools", "reasoning", "structured_output"],
 				pricing: {
 					input: 0.6,
@@ -3538,7 +3580,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "kimi-k2-thinking",
 				name: "Kimi K2 Thinking",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -3552,7 +3594,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "kimi-k2-thinking-turbo",
 				name: "Kimi K2 Thinking Turbo",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 1.15,
@@ -3566,7 +3608,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "kimi-k2-0905-preview",
 				name: "Kimi K2 0905",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -3580,7 +3622,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "kimi-k2-turbo-preview",
 				name: "Kimi K2 Turbo",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 2.4,
@@ -4323,7 +4365,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "kimi-k2.5",
 				name: "kimi-k2.5",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["images", "tools", "reasoning"],
 				pricing: {
 					input: 0,
@@ -4393,7 +4435,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "devstral-2:123b",
 				name: "devstral-2:123b",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools"],
 				pricing: {
 					input: 0,
@@ -4407,7 +4449,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "devstral-small-2:24b",
 				name: "devstral-small-2:24b",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["images", "tools"],
 				pricing: {
 					input: 0,
@@ -4435,7 +4477,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistral-large-3:675b",
 				name: "mistral-large-3:675b",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["images", "tools"],
 				pricing: {
 					input: 0,
@@ -4463,7 +4505,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "kimi-k2-thinking",
 				name: "kimi-k2-thinking",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "reasoning"],
 				pricing: {
 					input: 0,
@@ -4547,7 +4589,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "deepseek-v3.1:671b",
 				name: "deepseek-v3.1:671b",
 				contextWindow: 163840,
-				maxTokens: 163840,
+				maxTokens: 8192,
 				capabilities: ["tools", "reasoning"],
 				pricing: {
 					input: 0,
@@ -4603,7 +4645,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "kimi-k2:1t",
 				name: "kimi-k2:1t",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools"],
 				pricing: {
 					input: 0,
@@ -5217,7 +5259,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "gpt-4",
 				name: "GPT-4",
 				contextWindow: 8192,
-				maxTokens: 8192,
+				maxTokens: 409,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 30,
@@ -5351,40 +5393,26 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2026-03-12",
 			},
-			"openrouter/healer-alpha": {
-				id: "openrouter/healer-alpha",
-				name: "Healer Alpha",
+			"nvidia/nemotron-3-super-120b-a12b": {
+				id: "nvidia/nemotron-3-super-120b-a12b",
+				name: "Nemotron 3 Super",
 				contextWindow: 262144,
-				maxTokens: 64000,
-				capabilities: [
-					"images",
-					"files",
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
+				maxTokens: 13107,
+				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
-					input: 0,
-					output: 0,
+					input: 0.1,
+					output: 0.5,
 					cacheRead: 0,
 					cacheWrite: 0,
 				},
 				releaseDate: "2026-03-11",
 			},
-			"openrouter/hunter-alpha": {
-				id: "openrouter/hunter-alpha",
-				name: "Hunter Alpha",
-				contextWindow: 1048576,
-				maxTokens: 64000,
-				capabilities: [
-					"images",
-					"files",
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
+			"nvidia/nemotron-3-super-120b-a12b-free": {
+				id: "nvidia/nemotron-3-super-120b-a12b-free",
+				name: "Nemotron 3 Super (free)",
+				contextWindow: 262144,
+				maxTokens: 13107,
+				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0,
 					output: 0,
@@ -5627,25 +5655,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2026-02-12",
 			},
-			"openrouter/aurora-alpha": {
-				id: "openrouter/aurora-alpha",
-				name: "Aurora Alpha",
-				contextWindow: 128000,
-				maxTokens: 50000,
-				capabilities: [
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2026-02-09",
-			},
 			"anthropic/claude-opus-4.6": {
 				id: "anthropic/claude-opus-4.6",
 				name: "Claude Opus 4.6",
@@ -5691,7 +5700,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "stepfun/step-3.5-flash",
 				name: "Step 3.5 Flash",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.1,
@@ -5705,7 +5714,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "stepfun/step-3.5-flash:free",
 				name: "Step 3.5 Flash (free)",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0,
@@ -5719,7 +5728,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "arcee-ai/trinity-large-preview:free",
 				name: "Trinity Large Preview",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0,
@@ -5733,7 +5742,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "arcee-ai/trinity-mini:free",
 				name: "Trinity Mini",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0,
@@ -5747,7 +5756,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai/kimi-k2.5",
 				name: "Kimi K2.5",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: [
 					"images",
 					"tools",
@@ -5865,7 +5874,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "nvidia/nemotron-3-nano-30b-a3b:free",
 				name: "Nemotron 3 Nano 30B A3B (free)",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: [
 					"tools",
 					"reasoning",
@@ -5979,25 +5988,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-12-01",
 			},
-			"tngtech/tng-r1t-chimera:free": {
-				id: "tngtech/tng-r1t-chimera:free",
-				name: "R1T Chimera (free)",
-				contextWindow: 163840,
-				maxTokens: 163840,
-				capabilities: [
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-11-26",
-			},
 			"anthropic/claude-opus-4.5": {
 				id: "anthropic/claude-opus-4.5",
 				name: "Claude Opus 4.5",
@@ -6060,34 +6050,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-11-18",
 			},
-			"openrouter/sherlock-dash-alpha": {
-				id: "openrouter/sherlock-dash-alpha",
-				name: "Sherlock Dash Alpha",
-				contextWindow: 1840000,
-				maxTokens: 0,
-				capabilities: ["images", "tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-11-15",
-			},
-			"openrouter/sherlock-think-alpha": {
-				id: "openrouter/sherlock-think-alpha",
-				name: "Sherlock Think Alpha",
-				contextWindow: 1840000,
-				maxTokens: 0,
-				capabilities: ["images", "tools", "reasoning", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-11-15",
-			},
 			"openai/gpt-5.1": {
 				id: "openai/gpt-5.1",
 				name: "GPT-5.1",
@@ -6188,25 +6150,11 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-11-13",
 			},
-			"kwaipilot/kat-coder-pro:free": {
-				id: "kwaipilot/kat-coder-pro:free",
-				name: "Kat Coder Pro (free)",
-				contextWindow: 256000,
-				maxTokens: 65536,
-				capabilities: ["tools", "structured_output", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-11-10",
-			},
 			"moonshotai/kimi-k2-thinking": {
 				id: "moonshotai/kimi-k2-thinking",
 				name: "Kimi K2 Thinking",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: [
 					"tools",
 					"reasoning",
@@ -6239,7 +6187,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "nvidia/nemotron-nano-12b-v2-vl:free",
 				name: "Nemotron Nano 12B 2 VL (free)",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0,
@@ -6487,7 +6435,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistralai/devstral-2512",
 				name: "Devstral 2 2512",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.15,
@@ -6497,25 +6445,11 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-09-12",
 			},
-			"mistralai/devstral-2512:free": {
-				id: "mistralai/devstral-2512:free",
-				name: "Devstral 2 2512 (free)",
-				contextWindow: 262144,
-				maxTokens: 262144,
-				capabilities: ["tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-09-12",
-			},
 			"qwen/qwen3-next-80b-a3b-instruct": {
 				id: "qwen/qwen3-next-80b-a3b-instruct",
 				name: "Qwen3 Next 80B A3B Instruct",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.14,
@@ -6529,7 +6463,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen/qwen3-next-80b-a3b-instruct:free",
 				name: "Qwen3 Next 80B A3B Instruct (free)",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0,
@@ -6543,7 +6477,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen/qwen3-next-80b-a3b-thinking",
 				name: "Qwen3 Next 80B A3B Thinking",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: [
 					"tools",
 					"reasoning",
@@ -6590,7 +6524,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "nvidia/nemotron-nano-9b-v2:free",
 				name: "Nemotron Nano 9B V2 (free)",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: [
 					"tools",
 					"reasoning",
@@ -6642,7 +6576,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "nousresearch/hermes-4-405b",
 				name: "Hermes 4 405B",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 1,
@@ -6656,7 +6590,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "nousresearch/hermes-4-70b",
 				name: "Hermes 4 70B",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: [
 					"tools",
 					"reasoning",
@@ -6675,7 +6609,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "deepseek/deepseek-chat-v3.1",
 				name: "DeepSeek-V3.1",
 				contextWindow: 163840,
-				maxTokens: 163840,
+				maxTokens: 8192,
 				capabilities: [
 					"tools",
 					"reasoning",
@@ -6714,7 +6648,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "nvidia/nemotron-nano-9b-v2",
 				name: "nvidia-nemotron-nano-9b-v2",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.04,
@@ -6728,7 +6662,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistralai/mistral-medium-3.1",
 				name: "Mistral Medium 3.1",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["images", "tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.4,
@@ -6928,7 +6862,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistralai/codestral-2508",
 				name: "Codestral 2508",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.3,
@@ -6956,7 +6890,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen/qwen3-30b-a3b-instruct-2507",
 				name: "Qwen3 30B A3B Instruct 2507",
 				contextWindow: 262000,
-				maxTokens: 262000,
+				maxTokens: 13100,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.2,
@@ -6970,7 +6904,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen/qwen3-30b-a3b-thinking-2507",
 				name: "Qwen3 30B A3B Thinking 2507",
 				contextWindow: 262000,
-				maxTokens: 262000,
+				maxTokens: 13100,
 				capabilities: [
 					"tools",
 					"reasoning",
@@ -7137,7 +7071,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai/kimi-k2:free",
 				name: "Kimi K2 (free)",
 				contextWindow: 32800,
-				maxTokens: 32800,
+				maxTokens: 1640,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0,
@@ -7151,7 +7085,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistralai/devstral-medium-2507",
 				name: "Devstral Medium",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.4,
@@ -7165,7 +7099,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistralai/devstral-small-2507",
 				name: "Devstral Small 1.1",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.1,
@@ -7222,20 +7156,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-06-20",
 			},
-			"mistralai/mistral-small-3.2-24b-instruct:free": {
-				id: "mistralai/mistral-small-3.2-24b-instruct:free",
-				name: "Mistral Small 3.2 24B (free)",
-				contextWindow: 96000,
-				maxTokens: 96000,
-				capabilities: ["images", "tools", "structured_output", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-06-20",
-			},
 			"google/gemini-2.5-flash-lite": {
 				id: "google/gemini-2.5-flash-lite",
 				name: "Gemini 2.5 Flash Lite",
@@ -7271,20 +7191,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-06-17",
 			},
-			"moonshotai/kimi-dev-72b:free": {
-				id: "moonshotai/kimi-dev-72b:free",
-				name: "Kimi Dev 72b (free)",
-				contextWindow: 131072,
-				maxTokens: 131072,
-				capabilities: ["tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-06-16",
-			},
 			"google/gemini-2.5-pro-preview-06-05": {
 				id: "google/gemini-2.5-pro-preview-06-05",
 				name: "Gemini 2.5 Pro Preview 06-05",
@@ -7306,34 +7212,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-06-05",
 			},
-			"deepseek/deepseek-r1-0528-qwen3-8b:free": {
-				id: "deepseek/deepseek-r1-0528-qwen3-8b:free",
-				name: "Deepseek R1 0528 Qwen3 8B (free)",
-				contextWindow: 131072,
-				maxTokens: 131072,
-				capabilities: ["tools", "reasoning", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-05-29",
-			},
-			"sarvamai/sarvam-m:free": {
-				id: "sarvamai/sarvam-m:free",
-				name: "Sarvam-M (free)",
-				contextWindow: 32768,
-				maxTokens: 32768,
-				capabilities: ["tools", "reasoning", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-05-25",
-			},
 			"anthropic/claude-opus-4": {
 				id: "anthropic/claude-opus-4",
 				name: "Claude Opus 4",
@@ -7362,25 +7240,11 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-05-22",
 			},
-			"mistralai/devstral-small-2505:free": {
-				id: "mistralai/devstral-small-2505:free",
-				name: "Devstral Small 2505 (free)",
-				contextWindow: 32768,
-				maxTokens: 32768,
-				capabilities: ["tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-05-21",
-			},
 			"mistralai/devstral-small-2505": {
 				id: "mistralai/devstral-small-2505",
 				name: "Devstral Small",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.06,
@@ -7394,7 +7258,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistralai/mistral-medium-3",
 				name: "Mistral Medium 3",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["images", "tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.4,
@@ -7443,7 +7307,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "qwen/qwen3-4b:free",
 				name: "Qwen3 4B (free)",
 				contextWindow: 40960,
-				maxTokens: 40960,
+				maxTokens: 2048,
 				capabilities: [
 					"tools",
 					"reasoning",
@@ -7458,25 +7322,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-04-30",
 			},
-			"qwen/qwen3-14b:free": {
-				id: "qwen/qwen3-14b:free",
-				name: "Qwen3 14B (free)",
-				contextWindow: 40960,
-				maxTokens: 40960,
-				capabilities: [
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-04-28",
-			},
 			"qwen/qwen3-235b-a22b-07-25": {
 				id: "qwen/qwen3-235b-a22b-07-25",
 				name: "Qwen3 235B A22B Instruct 2507",
@@ -7491,140 +7336,22 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-04-28",
 			},
-			"qwen/qwen3-235b-a22b-07-25:free": {
-				id: "qwen/qwen3-235b-a22b-07-25:free",
-				name: "Qwen3 235B A22B Instruct 2507 (free)",
-				contextWindow: 262144,
-				maxTokens: 131072,
-				capabilities: ["tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-04-28",
-			},
-			"qwen/qwen3-235b-a22b:free": {
-				id: "qwen/qwen3-235b-a22b:free",
-				name: "Qwen3 235B A22B (free)",
-				contextWindow: 131072,
-				maxTokens: 131072,
+			"openai/o4-mini": {
+				id: "openai/o4-mini",
+				name: "o4 Mini",
+				contextWindow: 200000,
+				maxTokens: 100000,
 				capabilities: [
+					"images",
 					"tools",
 					"reasoning",
 					"structured_output",
 					"temperature",
 				],
 				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-04-28",
-			},
-			"qwen/qwen3-30b-a3b:free": {
-				id: "qwen/qwen3-30b-a3b:free",
-				name: "Qwen3 30B A3B (free)",
-				contextWindow: 40960,
-				maxTokens: 40960,
-				capabilities: [
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-04-28",
-			},
-			"qwen/qwen3-32b:free": {
-				id: "qwen/qwen3-32b:free",
-				name: "Qwen3 32B (free)",
-				contextWindow: 40960,
-				maxTokens: 40960,
-				capabilities: [
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-04-28",
-			},
-			"qwen/qwen3-8b:free": {
-				id: "qwen/qwen3-8b:free",
-				name: "Qwen3 8B (free)",
-				contextWindow: 40960,
-				maxTokens: 40960,
-				capabilities: [
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-04-28",
-			},
-			"microsoft/mai-ds-r1:free": {
-				id: "microsoft/mai-ds-r1:free",
-				name: "MAI DS R1 (free)",
-				contextWindow: 163840,
-				maxTokens: 163840,
-				capabilities: ["tools", "reasoning", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-04-21",
-			},
-			"thudm/glm-z1-32b:free": {
-				id: "thudm/glm-z1-32b:free",
-				name: "GLM Z1 32B (free)",
-				contextWindow: 32768,
-				maxTokens: 32768,
-				capabilities: ["tools", "reasoning", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-04-17",
-			},
-			"openai/o4-mini": {
-				id: "openai/o4-mini",
-				name: "o4 Mini",
-				contextWindow: 200000,
-				maxTokens: 100000,
-				capabilities: [
-					"images",
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
-				pricing: {
-					input: 1.1,
-					output: 4.4,
-					cacheRead: 0.28,
+					input: 1.1,
+					output: 4.4,
+					cacheRead: 0.28,
 					cacheWrite: 0,
 				},
 				releaseDate: "2025-04-16",
@@ -7657,34 +7384,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-04-14",
 			},
-			"meta-llama/llama-4-scout:free": {
-				id: "meta-llama/llama-4-scout:free",
-				name: "Llama 4 Scout (free)",
-				contextWindow: 64000,
-				maxTokens: 64000,
-				capabilities: ["images", "tools", "structured_output", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-04-05",
-			},
-			"qwen/qwen2.5-vl-32b-instruct:free": {
-				id: "qwen/qwen2.5-vl-32b-instruct:free",
-				name: "Qwen2.5 VL 32B Instruct (free)",
-				contextWindow: 8192,
-				maxTokens: 8192,
-				capabilities: ["images", "tools", "structured_output", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-03-24",
-			},
 			"google/gemini-2.5-pro": {
 				id: "google/gemini-2.5-pro",
 				name: "Gemini 2.5 Pro",
@@ -7724,7 +7423,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "google/gemma-3-27b-it",
 				name: "Gemma 3 27B",
 				contextWindow: 96000,
-				maxTokens: 96000,
+				maxTokens: 4800,
 				capabilities: ["images", "tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0.04,
@@ -7748,53 +7447,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-03-12",
 			},
-			"rekaai/reka-flash-3": {
-				id: "rekaai/reka-flash-3",
-				name: "Reka Flash 3",
-				contextWindow: 32768,
-				maxTokens: 8192,
-				capabilities: ["tools", "reasoning", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-03-12",
-			},
-			"qwen/qwq-32b:free": {
-				id: "qwen/qwq-32b:free",
-				name: "QwQ 32B (free)",
-				contextWindow: 32768,
-				maxTokens: 32768,
-				capabilities: [
-					"tools",
-					"reasoning",
-					"structured_output",
-					"temperature",
-				],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-03-05",
-			},
-			"nousresearch/deephermes-3-llama-3-8b-preview": {
-				id: "nousresearch/deephermes-3-llama-3-8b-preview",
-				name: "DeepHermes 3 Llama 3 8B Preview",
-				contextWindow: 131072,
-				maxTokens: 8192,
-				capabilities: ["tools", "reasoning", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-02-28",
-			},
 			"anthropic/claude-3.7-sonnet": {
 				id: "anthropic/claude-3.7-sonnet",
 				name: "Claude Sonnet 3.7",
@@ -7870,67 +7522,11 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2025-02-17",
 			},
-			"cognitivecomputations/dolphin3.0-mistral-24b": {
-				id: "cognitivecomputations/dolphin3.0-mistral-24b",
-				name: "Dolphin3.0 Mistral 24B",
-				contextWindow: 32768,
-				maxTokens: 8192,
-				capabilities: ["tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-02-13",
-			},
-			"cognitivecomputations/dolphin3.0-r1-mistral-24b": {
-				id: "cognitivecomputations/dolphin3.0-r1-mistral-24b",
-				name: "Dolphin3.0 R1 Mistral 24B",
-				contextWindow: 32768,
-				maxTokens: 8192,
-				capabilities: ["tools", "reasoning", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-02-13",
-			},
-			"qwen/qwen2.5-vl-72b-instruct:free": {
-				id: "qwen/qwen2.5-vl-72b-instruct:free",
-				name: "Qwen2.5 VL 72B Instruct (free)",
-				contextWindow: 32768,
-				maxTokens: 32768,
-				capabilities: ["images", "tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-02-01",
-			},
-			"deepseek/deepseek-r1:free": {
-				id: "deepseek/deepseek-r1:free",
-				name: "R1 (free)",
-				contextWindow: 163840,
-				maxTokens: 163840,
-				capabilities: ["tools", "reasoning", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2025-01-20",
-			},
 			"minimax/minimax-01": {
 				id: "minimax/minimax-01",
 				name: "MiniMax-01",
 				contextWindow: 1000000,
-				maxTokens: 1000000,
+				maxTokens: 50000,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.2,
@@ -7979,25 +7575,11 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2024-12-11",
 			},
-			"google/gemini-2.0-flash-exp:free": {
-				id: "google/gemini-2.0-flash-exp:free",
-				name: "Gemini 2.0 Flash Experimental (free)",
-				contextWindow: 1048576,
-				maxTokens: 1048576,
-				capabilities: ["images", "tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2024-12-11",
-			},
 			"meta-llama/llama-3.3-70b-instruct:free": {
 				id: "meta-llama/llama-3.3-70b-instruct:free",
 				name: "Llama 3.3 70B Instruct (free)",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "structured_output", "temperature"],
 				pricing: {
 					input: 0,
@@ -8021,34 +7603,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2024-10-22",
 			},
-			"qwen/qwen-2.5-vl-7b-instruct:free": {
-				id: "qwen/qwen-2.5-vl-7b-instruct:free",
-				name: "Qwen2.5-VL 7B Instruct (free)",
-				contextWindow: 32768,
-				maxTokens: 32768,
-				capabilities: ["images", "tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2024-08-28",
-			},
-			"mistralai/mistral-nemo:free": {
-				id: "mistralai/mistral-nemo:free",
-				name: "Mistral Nemo (free)",
-				contextWindow: 131072,
-				maxTokens: 131072,
-				capabilities: ["tools", "structured_output", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2024-07-19",
-			},
 			"openai/gpt-4o-mini": {
 				id: "openai/gpt-4o-mini",
 				name: "GPT-4o-mini",
@@ -8063,20 +7617,6 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2024-07-18",
 			},
-			"mistralai/mistral-7b-instruct:free": {
-				id: "mistralai/mistral-7b-instruct:free",
-				name: "Mistral 7B Instruct (free)",
-				contextWindow: 32768,
-				maxTokens: 32768,
-				capabilities: ["tools", "temperature"],
-				pricing: {
-					input: 0,
-					output: 0,
-					cacheRead: 0,
-					cacheWrite: 0,
-				},
-				releaseDate: "2024-05-27",
-			},
 		},
 		requesty: {
 			"openai/gpt-5.4": {
@@ -9027,7 +8567,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "Qwen/Qwen3-Coder-Next-FP8",
 				name: "Qwen3 Coder Next FP8",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.5,
@@ -9041,7 +8581,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai/Kimi-K2.5",
 				name: "Kimi K2.5",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.5,
@@ -9055,7 +8595,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "essentialai/Rnj-1-Instruct",
 				name: "Rnj-1 Instruct",
 				contextWindow: 32768,
-				maxTokens: 32768,
+				maxTokens: 1638,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.15,
@@ -9069,7 +8609,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "zai-org/GLM-4.6",
 				name: "GLM 4.6",
 				contextWindow: 200000,
-				maxTokens: 200000,
+				maxTokens: 10000,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -9083,7 +8623,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "deepseek-ai/DeepSeek-V3-1",
 				name: "DeepSeek V3.1",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -9097,7 +8637,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "openai/gpt-oss-120b",
 				name: "GPT OSS 120B",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.15,
@@ -9111,7 +8651,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
 				name: "Qwen3 235B A22B Instruct 2507 FP8",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.2,
@@ -9125,7 +8665,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "Qwen/Qwen3-Next-80B-A3B-Instruct",
 				name: "Qwen3-Next-80B-A3B-Instruct",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.15,
@@ -9139,7 +8679,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "zai-org/GLM-4.7",
 				name: "GLM-4.7",
 				contextWindow: 200000,
-				maxTokens: 200000,
+				maxTokens: 10000,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.45,
@@ -9153,7 +8693,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
 				name: "Qwen3 Coder 480B A35B Instruct",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 2,
@@ -9167,7 +8707,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai/Kimi-K2-Instruct",
 				name: "Kimi K2 Instruct",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 1,
@@ -9181,7 +8721,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "deepseek-ai/DeepSeek-V3",
 				name: "DeepSeek V3",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 1.25,
@@ -9195,7 +8735,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "meta-llama/Llama-3.3-70B-Instruct-Turbo",
 				name: "Llama 3.3 70B",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.88,
@@ -9309,7 +8849,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "xai/grok-4.20-multi-agent-beta",
 				name: "Grok 4.20 Multi Agent Beta",
 				contextWindow: 2000000,
-				maxTokens: 2000000,
+				maxTokens: 100000,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 2,
@@ -9323,7 +8863,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "xai/grok-4.20-non-reasoning-beta",
 				name: "Grok 4.20 Beta Non-Reasoning",
 				contextWindow: 2000000,
-				maxTokens: 2000000,
+				maxTokens: 100000,
 				capabilities: ["images", "files", "tools", "temperature"],
 				pricing: {
 					input: 2,
@@ -9337,7 +8877,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "xai/grok-4.20-reasoning-beta",
 				name: "Grok 4.20 Beta Reasoning",
 				contextWindow: 2000000,
-				maxTokens: 2000000,
+				maxTokens: 100000,
 				capabilities: ["images", "files", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 2,
@@ -9347,6 +8887,48 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2026-03-11",
 			},
+			"xai/grok-4.20-multi-agent": {
+				id: "xai/grok-4.20-multi-agent",
+				name: "Grok 4.20 Multi-Agent",
+				contextWindow: 2000000,
+				maxTokens: 100000,
+				capabilities: ["tools", "reasoning", "temperature"],
+				pricing: {
+					input: 2,
+					output: 6,
+					cacheRead: 0.19999999999999998,
+					cacheWrite: 0,
+				},
+				releaseDate: "2026-03-09",
+			},
+			"xai/grok-4.20-non-reasoning": {
+				id: "xai/grok-4.20-non-reasoning",
+				name: "Grok 4.20 Non-Reasoning",
+				contextWindow: 2000000,
+				maxTokens: 100000,
+				capabilities: ["images", "files", "tools", "temperature"],
+				pricing: {
+					input: 2,
+					output: 6,
+					cacheRead: 0.19999999999999998,
+					cacheWrite: 0,
+				},
+				releaseDate: "2026-03-09",
+			},
+			"xai/grok-4.20-reasoning": {
+				id: "xai/grok-4.20-reasoning",
+				name: "Grok 4.20 Reasoning",
+				contextWindow: 2000000,
+				maxTokens: 100000,
+				capabilities: ["images", "files", "tools", "reasoning", "temperature"],
+				pricing: {
+					input: 2,
+					output: 6,
+					cacheRead: 0.19999999999999998,
+					cacheWrite: 0,
+				},
+				releaseDate: "2026-03-09",
+			},
 			"openai/gpt-5.4": {
 				id: "openai/gpt-5.4",
 				name: "GPT 5.4",
@@ -9421,7 +9003,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "inception/mercury-2",
 				name: "Mercury 2",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.25,
@@ -9547,7 +9129,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai/kimi-k2.5",
 				name: "Kimi K2.5",
 				contextWindow: 262144,
-				maxTokens: 262144,
+				maxTokens: 13107,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -9603,7 +9185,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistral/devstral-2",
 				name: "Devstral 2",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0,
@@ -9645,7 +9227,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "prime-intellect/intellect-3",
 				name: "INTELLECT 3",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.2,
@@ -9687,7 +9269,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai/kimi-k2-thinking",
 				name: "Kimi K2 Thinking",
 				contextWindow: 216144,
-				maxTokens: 216144,
+				maxTokens: 10807,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.47,
@@ -9701,7 +9283,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "moonshotai/kimi-k2-thinking-turbo",
 				name: "Kimi K2 Thinking Turbo",
 				contextWindow: 262114,
-				maxTokens: 262114,
+				maxTokens: 13105,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 1.15,
@@ -9715,7 +9297,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "minimax/minimax-m2",
 				name: "MiniMax M2",
 				contextWindow: 262114,
-				maxTokens: 262114,
+				maxTokens: 13105,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.27,
@@ -9841,7 +9423,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "deepseek/deepseek-v3.2-exp",
 				name: "DeepSeek V3.2 Exp",
 				contextWindow: 163840,
-				maxTokens: 163840,
+				maxTokens: 8192,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.27,
@@ -10093,7 +9675,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "nvidia/nemotron-nano-9b-v2",
 				name: "Nvidia Nemotron Nano 9B V2",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.04,
@@ -10107,7 +9689,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "zai/glm-4.5v",
 				name: "GLM 4.5V",
 				contextWindow: 66000,
-				maxTokens: 66000,
+				maxTokens: 3300,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -10289,7 +9871,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "openai/gpt-oss-120b",
 				name: "GPT OSS 120B",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.1,
@@ -10317,7 +9899,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "zai/glm-4.5",
 				name: "GLM 4.5",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.6,
@@ -10345,7 +9927,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "alibaba/qwen3-coder-plus",
 				name: "Qwen3 Coder Plus",
 				contextWindow: 1000000,
-				maxTokens: 1000000,
+				maxTokens: 50000,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 1,
@@ -10359,7 +9941,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "alibaba/qwen3-coder-next",
 				name: "Qwen3 Coder Next",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.5,
@@ -10555,7 +10137,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistral/devstral-small-2",
 				name: "Devstral Small 2",
 				contextWindow: 256000,
-				maxTokens: 256000,
+				maxTokens: 12800,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0,
@@ -10751,7 +10333,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "alibaba/qwen3-235b-a22b-thinking",
 				name: "Qwen3 235B A22B Thinking 2507",
 				contextWindow: 262114,
-				maxTokens: 262114,
+				maxTokens: 13105,
 				capabilities: ["images", "files", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.3,
@@ -10849,7 +10431,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistral/magistral-small",
 				name: "Magistral Small",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: ["tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.5,
@@ -11017,7 +10599,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "arcee-ai/trinity-large-preview",
 				name: "Trinity Large Preview",
 				contextWindow: 131000,
-				maxTokens: 131000,
+				maxTokens: 6550,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.25,
@@ -11183,7 +10765,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "nvidia/nemotron-nano-12b-v2-vl",
 				name: "Nvidia Nemotron Nano 12B V2 VL",
 				contextWindow: 131072,
-				maxTokens: 131072,
+				maxTokens: 6553,
 				capabilities: ["images", "tools", "reasoning", "temperature"],
 				pricing: {
 					input: 0.2,
@@ -11211,7 +10793,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistral/pixtral-large",
 				name: "Pixtral Large (latest)",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: ["images", "tools", "temperature"],
 				pricing: {
 					input: 2,
@@ -11253,7 +10835,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistral/ministral-3b",
 				name: "Ministral 3B (latest)",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.04,
@@ -11267,7 +10849,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistral/ministral-8b",
 				name: "Ministral 8B (latest)",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 0.1,
@@ -11323,7 +10905,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistral/pixtral-12b",
 				name: "Pixtral 12B",
 				contextWindow: 128000,
-				maxTokens: 128000,
+				maxTokens: 6400,
 				capabilities: ["images", "tools", "temperature"],
 				pricing: {
 					input: 0.15,
@@ -11463,7 +11045,7 @@ export const GENERATED_PROVIDER_MODELS: {
 				id: "mistral/mixtral-8x22b-instruct",
 				name: "Mixtral 8x22B",
 				contextWindow: 64000,
-				maxTokens: 64000,
+				maxTokens: 3200,
 				capabilities: ["tools", "temperature"],
 				pricing: {
 					input: 2,
@@ -11673,9 +11255,9 @@ export const GENERATED_PROVIDER_MODELS: {
 			},
 		},
 		xai: {
-			"grok-4.20-beta-latest-non-reasoning": {
-				id: "grok-4.20-beta-latest-non-reasoning",
-				name: "Grok 4.20 Beta (Non-Reasoning)",
+			"grok-4.20-0309-non-reasoning": {
+				id: "grok-4.20-0309-non-reasoning",
+				name: "Grok 4.20 (Non-Reasoning)",
 				contextWindow: 2000000,
 				maxTokens: 30000,
 				capabilities: ["images", "tools", "temperature"],
@@ -11687,9 +11269,9 @@ export const GENERATED_PROVIDER_MODELS: {
 				},
 				releaseDate: "2026-03-09",
 			},
-			"grok-4.20-beta-latest-reasoning": {
-				id: "grok-4.20-beta-latest-reasoning",
-				name: "Grok 4.20 Beta (Reasoning)",
+			"grok-4.20-0309-reasoning": {
+				id: "grok-4.20-0309-reasoning",
+				name: "Grok 4.20 (Reasoning)",
 				contextWindow: 2000000,
 				maxTokens: 30000,
 				capabilities: ["images", "tools", "reasoning", "temperature"],