npm - @dreb/ai - Versions diffs - 2.14.1 → 2.15.1 - Mend

@dreb/ai 2.14.1 → 2.15.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

package/dist/models.d.ts.map +1 -1
package/dist/models.generated.d.ts +127 -161
package/dist/models.generated.d.ts.map +1 -1
package/dist/models.generated.js +231 -265
package/dist/models.generated.js.map +1 -1
package/dist/models.js +4 -1
package/dist/models.js.map +1 -1
package/dist/providers/openai-codex-responses.d.ts +7 -0
package/dist/providers/openai-codex-responses.d.ts.map +1 -1
package/dist/providers/openai-codex-responses.js +133 -16
package/dist/providers/openai-codex-responses.js.map +1 -1
package/dist/providers/openai-responses-shared.d.ts +7 -0
package/dist/providers/openai-responses-shared.d.ts.map +1 -1
package/dist/providers/openai-responses-shared.js +8 -1
package/dist/providers/openai-responses-shared.js.map +1 -1
package/package.json +1 -1

package/dist/models.generated.js CHANGED Viewed

@@ -3513,6 +3513,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 64000,
         },
+        "gemini-3.1-flash-lite": {
+            id: "gemini-3.1-flash-lite",
+            name: "Gemini 3.1 Flash Lite",
+            api: "google-generative-ai",
+            provider: "google",
+            baseUrl: "https://generativelanguage.googleapis.com/v1beta",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.25,
+                output: 1.5,
+                cacheRead: 0.025,
+                cacheWrite: 1,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
         "gemini-3.1-flash-lite-preview": {
             id: "gemini-3.1-flash-lite-preview",
             name: "Gemini 3.1 Flash Lite Preview",
@@ -6229,40 +6246,6 @@ export const MODELS = {
             contextWindow: 272000,
             maxTokens: 128000,
         },
-        "gpt-5.2": {
-            id: "gpt-5.2",
-            name: "GPT-5.2",
-            api: "openai-codex-responses",
-            provider: "openai-codex",
-            baseUrl: "https://chatgpt.com/backend-api",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 1.75,
-                output: 14,
-                cacheRead: 0.175,
-                cacheWrite: 0,
-            },
-            contextWindow: 272000,
-            maxTokens: 128000,
-        },
-        "gpt-5.2-codex": {
-            id: "gpt-5.2-codex",
-            name: "GPT-5.2 Codex",
-            api: "openai-codex-responses",
-            provider: "openai-codex",
-            baseUrl: "https://chatgpt.com/backend-api",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 1.75,
-                output: 14,
-                cacheRead: 0.175,
-                cacheWrite: 0,
-            },
-            contextWindow: 272000,
-            maxTokens: 128000,
-        },
         "gpt-5.3-codex": {
             id: "gpt-5.3-codex",
             name: "GPT-5.3 Codex",
@@ -6331,14 +6314,31 @@ export const MODELS = {
             contextWindow: 272000,
             maxTokens: 128000,
         },
+        "gpt-5.5": {
+            id: "gpt-5.5",
+            name: "GPT-5.5",
+            api: "openai-codex-responses",
+            provider: "openai-codex",
+            baseUrl: "https://chatgpt.com/backend-api",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 30,
+                cacheRead: 0.5,
+                cacheWrite: 0,
+            },
+            contextWindow: 400000,
+            maxTokens: 128000,
+        },
     },
     "opencode": {
         "big-pickle": {
             id: "big-pickle",
             name: "Big Pickle",
-            api: "anthropic-messages",
+            api: "openai-completions",
             provider: "opencode",
-            baseUrl: "https://opencode.ai/zen",
+            baseUrl: "https://opencode.ai/zen/v1",
             reasoning: true,
             input: ["text"],
             cost: {
@@ -6597,9 +6597,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
+                input: 0.05,
+                output: 0.4,
+                cacheRead: 0.005,
                 cacheWrite: 0,
             },
             contextWindow: 400000,
@@ -6826,23 +6826,6 @@ export const MODELS = {
             contextWindow: 1050000,
             maxTokens: 128000,
         },
-        "hy3-preview-free": {
-            id: "hy3-preview-free",
-            name: "Hy3 preview Free",
-            api: "openai-completions",
-            provider: "opencode",
-            baseUrl: "https://opencode.ai/zen/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 256000,
-            maxTokens: 64000,
-        },
         "kimi-k2.5": {
             id: "kimi-k2.5",
             name: "Kimi K2.5",
@@ -7068,55 +7051,21 @@ export const MODELS = {
         },
         "kimi-k2.6": {
             id: "kimi-k2.6",
-            name: "Kimi K2.6 (3x limits)",
+            name: "Kimi K2.6",
             api: "openai-completions",
             provider: "opencode-go",
             baseUrl: "https://opencode.ai/zen/go/v1",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.32,
-                output: 1.34,
-                cacheRead: 0.054,
+                input: 0.95,
+                output: 4,
+                cacheRead: 0.16,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
             maxTokens: 65536,
         },
-        "mimo-v2-omni": {
-            id: "mimo-v2-omni",
-            name: "MiMo V2 Omni",
-            api: "openai-completions",
-            provider: "opencode-go",
-            baseUrl: "https://opencode.ai/zen/go/v1",
-            reasoning: true,
-            input: ["text", "image"],
-            cost: {
-                input: 0.4,
-                output: 2,
-                cacheRead: 0.08,
-                cacheWrite: 0,
-            },
-            contextWindow: 262144,
-            maxTokens: 128000,
-        },
-        "mimo-v2-pro": {
-            id: "mimo-v2-pro",
-            name: "MiMo V2 Pro",
-            api: "openai-completions",
-            provider: "opencode-go",
-            baseUrl: "https://opencode.ai/zen/go/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 1,
-                output: 3,
-                cacheRead: 0.2,
-                cacheWrite: 0,
-            },
-            contextWindow: 1048576,
-            maxTokens: 128000,
-        },
         "mimo-v2.5": {
             id: "mimo-v2.5",
             name: "MiMo V2.5",
@@ -7255,23 +7204,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 131072,
         },
-        "allenai/olmo-3.1-32b-instruct": {
-            id: "allenai/olmo-3.1-32b-instruct",
-            name: "AllenAI: Olmo 3.1 32B Instruct",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.19999999999999998,
-                output: 0.6,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 65536,
-            maxTokens: 16384,
-        },
         "amazon/nova-2-lite-v1": {
             id: "amazon/nova-2-lite-v1",
             name: "Amazon: Nova 2 Lite",
@@ -7406,7 +7338,7 @@ export const MODELS = {
                 cacheWrite: 3.75,
             },
             contextWindow: 200000,
-            maxTokens: 128000,
+            maxTokens: 64000,
         },
         "anthropic/claude-3.7-sonnet:thinking": {
             id: "anthropic/claude-3.7-sonnet:thinking",
@@ -7680,6 +7612,23 @@ export const MODELS = {
             contextWindow: 2000000,
             maxTokens: 30000,
         },
+        "baidu/cobuddy:free": {
+            id: "baidu/cobuddy:free",
+            name: "Baidu Qianfan: CoBuddy (free)",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text"],
+            cost: {
+                input: 0,
+                output: 0,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 65536,
+        },
         "baidu/ernie-4.5-21b-a3b": {
             id: "baidu/ernie-4.5-21b-a3b",
             name: "Baidu: ERNIE 4.5 21B A3B",
@@ -7910,8 +7859,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.21,
-                output: 0.7899999999999999,
+                input: 0.27,
+                output: 0.95,
                 cacheRead: 0.13,
                 cacheWrite: 0,
             },
@@ -8156,6 +8105,23 @@ export const MODELS = {
             contextWindow: 1048576,
             maxTokens: 65536,
         },
+        "google/gemini-3.1-flash-lite": {
+            id: "google/gemini-3.1-flash-lite",
+            name: "Google: Gemini 3.1 Flash Lite",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.25,
+                output: 1.5,
+                cacheRead: 0.024999999999999998,
+                cacheWrite: 0.08333333333333334,
+            },
+            contextWindow: 1048576,
+            maxTokens: 65536,
+        },
         "google/gemini-3.1-flash-lite-preview": {
             id: "google/gemini-3.1-flash-lite-preview",
             name: "Google: Gemini 3.1 Flash Lite Preview",
@@ -8343,18 +8309,18 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 50000,
         },
-        "inclusionai/ling-2.6-1t:free": {
-            id: "inclusionai/ling-2.6-1t:free",
-            name: "inclusionAI: Ling-2.6-1T (free)",
+        "inclusionai/ling-2.6-1t": {
+            id: "inclusionai/ling-2.6-1t",
+            name: "inclusionAI: Ling-2.6-1T",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
+                input: 0.3,
+                output: 2.5,
+                cacheRead: 0.06,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -8377,39 +8343,39 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 32768,
         },
-        "kwaipilot/kat-coder-pro-v2": {
-            id: "kwaipilot/kat-coder-pro-v2",
-            name: "Kwaipilot: KAT-Coder-Pro V2",
+        "inclusionai/ring-2.6-1t:free": {
+            id: "inclusionai/ring-2.6-1t:free",
+            name: "inclusionAI: Ring-2.6-1T (free)",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.3,
-                output: 1.2,
-                cacheRead: 0.06,
+                input: 0,
+                output: 0,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
-            maxTokens: 80000,
+            contextWindow: 262144,
+            maxTokens: 65536,
         },
-        "meta-llama/llama-3-8b-instruct": {
-            id: "meta-llama/llama-3-8b-instruct",
-            name: "Meta: Llama 3 8B Instruct",
+        "kwaipilot/kat-coder-pro-v2": {
+            id: "kwaipilot/kat-coder-pro-v2",
+            name: "Kwaipilot: KAT-Coder-Pro V2",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.03,
-                output: 0.04,
-                cacheRead: 0,
+                input: 0.3,
+                output: 1.2,
+                cacheRead: 0.06,
                 cacheWrite: 0,
             },
-            contextWindow: 8192,
-            maxTokens: 16384,
+            contextWindow: 256000,
+            maxTokens: 80000,
         },
         "meta-llama/llama-3.1-70b-instruct": {
             id: "meta-llama/llama-3.1-70b-instruct",
@@ -8558,11 +8524,11 @@ export const MODELS = {
             cost: {
                 input: 0.15,
                 output: 1.15,
-                cacheRead: 0.03,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 196608,
-            maxTokens: 131072,
+            maxTokens: 196608,
         },
         "minimax/minimax-m2.5:free": {
             id: "minimax/minimax-m2.5:free",
@@ -8590,13 +8556,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.3,
+                input: 0.29900000000000004,
                 output: 1.2,
-                cacheRead: 0.059,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 196608,
-            maxTokens: 4096,
+            maxTokens: 131072,
         },
         "mistralai/codestral-2508": {
             id: "mistralai/codestral-2508",
@@ -8802,6 +8768,23 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 4096,
         },
+        "mistralai/mistral-medium-3-5": {
+            id: "mistralai/mistral-medium-3-5",
+            name: "Mistral: Mistral Medium 3.5",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 1.5,
+                output: 7.5,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 262144,
+            maxTokens: 4096,
+        },
         "mistralai/mistral-medium-3.1": {
             id: "mistralai/mistral-medium-3.1",
             name: "Mistral: Mistral Medium 3.1",
@@ -8904,23 +8887,6 @@ export const MODELS = {
             contextWindow: 65536,
             maxTokens: 4096,
         },
-        "mistralai/mixtral-8x7b-instruct": {
-            id: "mistralai/mixtral-8x7b-instruct",
-            name: "Mistral: Mixtral 8x7B Instruct",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.54,
-                output: 0.54,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 32768,
-            maxTokens: 16384,
-        },
         "mistralai/pixtral-large-2411": {
             id: "mistralai/pixtral-large-2411",
             name: "Mistral: Pixtral Large 2411",
@@ -9032,13 +8998,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.74,
-                output: 3.49,
-                cacheRead: 0.14,
+                input: 0.75,
+                output: 3.5,
+                cacheRead: 0.15,
                 cacheWrite: 0,
             },
-            contextWindow: 262142,
-            maxTokens: 262142,
+            contextWindow: 262144,
+            maxTokens: 16384,
         },
         "nex-agi/deepseek-v3.1-nex-n1": {
             id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -9057,23 +9023,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 163840,
         },
-        "nvidia/llama-3.1-nemotron-70b-instruct": {
-            id: "nvidia/llama-3.1-nemotron-70b-instruct",
-            name: "NVIDIA: Llama 3.1 Nemotron 70B Instruct",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 1.2,
-                output: 1.2,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 16384,
-        },
         "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
             id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
             name: "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5",
@@ -9941,6 +9890,23 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 16384,
         },
+        "openai/gpt-chat-latest": {
+            id: "openai/gpt-chat-latest",
+            name: "OpenAI: GPT Chat Latest",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: false,
+            input: ["text", "image"],
+            cost: {
+                input: 5,
+                output: 30,
+                cacheRead: 0.5,
+                cacheWrite: 0,
+            },
+            contextWindow: 400000,
+            maxTokens: 128000,
+        },
         "openai/gpt-oss-120b": {
             id: "openai/gpt-oss-120b",
             name: "OpenAI: gpt-oss-120b",
@@ -10494,13 +10460,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.08,
-                output: 0.28,
+                input: 0.09,
+                output: 0.44999999999999996,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 40960,
-            maxTokens: 16384,
+            maxTokens: 20000,
         },
         "qwen/qwen3-30b-a3b-instruct-2507": {
             id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -10546,12 +10512,12 @@ export const MODELS = {
             input: ["text"],
             cost: {
                 input: 0.08,
-                output: 0.24,
-                cacheRead: 0.04,
+                output: 0.28,
+                cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 40960,
-            maxTokens: 40960,
+            maxTokens: 16384,
         },
         "qwen/qwen3-8b": {
             id: "qwen/qwen3-8b",
@@ -10630,7 +10596,7 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.12,
+                input: 0.11,
                 output: 0.7999999999999999,
                 cacheRead: 0.07,
                 cacheWrite: 0,
@@ -10919,13 +10885,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.1625,
-                output: 1.3,
-                cacheRead: 0,
+                input: 0.14,
+                output: 1,
+                cacheRead: 0.049999999999999996,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 65536,
+            maxTokens: 81920,
         },
         "qwen/qwen3.5-397b-a17b": {
             id: "qwen/qwen3.5-397b-a17b",
@@ -10953,13 +10919,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.09999999999999999,
+                input: 0.04,
                 output: 0.15,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 4096,
+            maxTokens: 81920,
         },
         "qwen/qwen3.5-flash-02-23": {
             id: "qwen/qwen3.5-flash-02-23",
@@ -11021,13 +10987,30 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.325,
-                output: 3.25,
+                input: 0.32,
+                output: 3.1999999999999997,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 256000,
-            maxTokens: 65536,
+            contextWindow: 262144,
+            maxTokens: 81920,
+        },
+        "qwen/qwen3.6-35b-a3b": {
+            id: "qwen/qwen3.6-35b-a3b",
+            name: "Qwen: Qwen3.6 35B A3B",
+            api: "openai-completions",
+            provider: "openrouter",
+            baseUrl: "https://openrouter.ai/api/v1",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.15,
+                output: 1,
+                cacheRead: 0.049999999999999996,
+                cacheWrite: 0,
+            },
+            contextWindow: 262144,
+            maxTokens: 262144,
         },
         "qwen/qwen3.6-flash": {
             id: "qwen/qwen3.6-flash",
@@ -11165,18 +11148,18 @@ export const MODELS = {
             contextWindow: 262144,
             maxTokens: 65536,
         },
-        "tencent/hy3-preview:free": {
-            id: "tencent/hy3-preview:free",
-            name: "Tencent: Hy3 preview (free)",
+        "tencent/hy3-preview": {
+            id: "tencent/hy3-preview",
+            name: "Tencent: Hy3 preview",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
+                input: 0.06599999999999999,
+                output: 0.26,
+                cacheRead: 0.029,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -11216,23 +11199,6 @@ export const MODELS = {
             contextWindow: 32768,
             maxTokens: 32768,
         },
-        "tngtech/deepseek-r1t2-chimera": {
-            id: "tngtech/deepseek-r1t2-chimera",
-            name: "TNG: DeepSeek R1T2 Chimera",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.3,
-                output: 1.1,
-                cacheRead: 0.15,
-                cacheWrite: 0,
-            },
-            contextWindow: 163840,
-            maxTokens: 163840,
-        },
         "upstage/solar-pro-3": {
             id: "upstage/solar-pro-3",
             name: "Upstage: Solar Pro 3",
@@ -11429,9 +11395,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.09,
-                output: 0.29,
-                cacheRead: 0.045,
+                input: 0.09999999999999999,
+                output: 0.3,
+                cacheRead: 0.01,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -11503,7 +11469,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
-            maxTokens: 131072,
+            maxTokens: 16384,
         },
         "z-ai/glm-4-32b": {
             id: "z-ai/glm-4-32b",
@@ -11633,13 +11599,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.38,
-                output: 1.74,
-                cacheRead: 0,
+                input: 0.39999999999999997,
+                output: 1.75,
+                cacheRead: 0.08,
                 cacheWrite: 0,
             },
             contextWindow: 202752,
-            maxTokens: 4096,
+            maxTokens: 131072,
         },
         "z-ai/glm-4.7-flash": {
             id: "z-ai/glm-4.7-flash",
@@ -11668,12 +11634,12 @@ export const MODELS = {
             input: ["text"],
             cost: {
                 input: 0.6,
-                output: 2.08,
+                output: 1.92,
                 cacheRead: 0.12,
                 cacheWrite: 0,
             },
             contextWindow: 202752,
-            maxTokens: 16384,
+            maxTokens: 4096,
         },
         "z-ai/glm-5-turbo": {
             id: "z-ai/glm-5-turbo",
@@ -11820,13 +11786,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.74,
-                output: 3.49,
-                cacheRead: 0.14,
+                input: 0.75,
+                output: 3.5,
+                cacheRead: 0.15,
                 cacheWrite: 0,
             },
-            contextWindow: 262142,
-            maxTokens: 262142,
+            contextWindow: 262144,
+            maxTokens: 16384,
         },
         "~openai/gpt-latest": {
             id: "~openai/gpt-latest",
@@ -12697,6 +12663,23 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 64000,
         },
+        "google/gemini-3.1-flash-lite": {
+            id: "google/gemini-3.1-flash-lite",
+            name: "Gemini 3.1 Flash Lite",
+            api: "anthropic-messages",
+            provider: "vercel-ai-gateway",
+            baseUrl: "https://ai-gateway.vercel.sh",
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 0.25,
+                output: 1.5,
+                cacheRead: 0.03,
+                cacheWrite: 0,
+            },
+            contextWindow: 1000000,
+            maxTokens: 65000,
+        },
         "google/gemini-3.1-flash-lite-preview": {
             id: "google/gemini-3.1-flash-lite-preview",
             name: "Gemini 3.1 Flash Lite Preview",
@@ -13258,23 +13241,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 131072,
         },
-        "moonshotai/kimi-k2-0905": {
-            id: "moonshotai/kimi-k2-0905",
-            name: "Kimi K2 0905",
-            api: "anthropic-messages",
-            provider: "vercel-ai-gateway",
-            baseUrl: "https://ai-gateway.vercel.sh",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.6,
-                output: 2.5,
-                cacheRead: 0.3,
-                cacheWrite: 0,
-            },
-            contextWindow: 256000,
-            maxTokens: 128000,
-        },
         "moonshotai/kimi-k2-thinking": {
             id: "moonshotai/kimi-k2-thinking",
             name: "Kimi K2 Thinking",
@@ -14219,8 +14185,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 6,
+                input: 1.25,
+                output: 2.5,
                 cacheRead: 0.19999999999999998,
                 cacheWrite: 0,
             },
@@ -14236,8 +14202,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 6,
+                input: 1.25,
+                output: 2.5,
                 cacheRead: 0.19999999999999998,
                 cacheWrite: 0,
             },
@@ -14253,8 +14219,8 @@ export const MODELS = {
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 6,
+                input: 1.25,
+                output: 2.5,
                 cacheRead: 0.19999999999999998,
                 cacheWrite: 0,
             },
@@ -14270,8 +14236,8 @@ export const MODELS = {
             reasoning: false,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 6,
+                input: 1.25,
+                output: 2.5,
                 cacheRead: 0.19999999999999998,
                 cacheWrite: 0,
             },
@@ -14287,8 +14253,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 6,
+                input: 1.25,
+                output: 2.5,
                 cacheRead: 0.19999999999999998,
                 cacheWrite: 0,
             },
@@ -14304,8 +14270,8 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 2,
-                output: 6,
+                input: 1.25,
+                output: 2.5,
                 cacheRead: 0.19999999999999998,
                 cacheWrite: 0,
             },