npm - @caupulican/pi-ai - Versions diffs - 0.80.20 → 0.80.22 - Mend

@caupulican/pi-ai 0.80.20 → 0.80.22

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/dist/models.generated.d.ts +92 -369
package/dist/models.generated.d.ts.map +1 -1
package/dist/models.generated.js +157 -415
package/dist/models.generated.js.map +1 -1
package/package.json +1 -1

package/dist/models.generated.js CHANGED Viewed

@@ -2854,30 +2854,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.25,
-                output: 0.69,
+                input: 0.35,
+                output: 0.75,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 32768,
-        },
-        "llama3.1-8b": {
-            id: "llama3.1-8b",
-            name: "Llama 3.1 8B",
-            api: "openai-completions",
-            provider: "cerebras",
-            baseUrl: "https://api.cerebras.ai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.1,
-                output: 0.1,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 32000,
-            maxTokens: 8000,
+            maxTokens: 40960,
         },
         "zai-glm-4.7": {
             id: "zai-glm-4.7",
@@ -2885,7 +2868,7 @@ export const MODELS = {
             api: "openai-completions",
             provider: "cerebras",
             baseUrl: "https://api.cerebras.ai/v1",
-            reasoning: false,
+            reasoning: true,
             input: ["text"],
             cost: {
                 input: 2.25,
@@ -2894,7 +2877,7 @@ export const MODELS = {
                 cacheWrite: 0,
             },
             contextWindow: 131072,
-            maxTokens: 40000,
+            maxTokens: 40960,
         },
     },
     "cloudflare-ai-gateway": {
@@ -4023,6 +4006,25 @@ export const MODELS = {
         },
     },
     "github-copilot": {
+        "claude-fable-5": {
+            id: "claude-fable-5",
+            name: "Claude Fable 5",
+            api: "openai-completions",
+            provider: "github-copilot",
+            baseUrl: "https://api.individual.githubcopilot.com",
+            headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
+            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
+            reasoning: true,
+            input: ["text", "image"],
+            cost: {
+                input: 10,
+                output: 50,
+                cacheRead: 1,
+                cacheWrite: 12.5,
+            },
+            contextWindow: 1000000,
+            maxTokens: 128000,
+        },
         "claude-haiku-4.5": {
             id: "claude-haiku-4.5",
             name: "Claude Haiku 4.5 (latest)",
@@ -4955,77 +4957,9 @@ export const MODELS = {
         },
     },
     "groq": {
-        "deepseek-r1-distill-llama-70b": {
-            id: "deepseek-r1-distill-llama-70b",
-            name: "DeepSeek R1 Distill Llama 70B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.75,
-                output: 0.99,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
-        "gemma2-9b-it": {
-            id: "gemma2-9b-it",
-            name: "Gemma 2 9B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.2,
-                output: 0.2,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 8192,
-        },
-        "groq/compound": {
-            id: "groq/compound",
-            name: "Compound",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
-        "groq/compound-mini": {
-            id: "groq/compound-mini",
-            name: "Compound Mini",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
         "llama-3.1-8b-instant": {
             id: "llama-3.1-8b-instant",
-            name: "Llama 3.1 8B Instant",
+            name: "Llama 3.1 8B",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
@@ -5042,7 +4976,7 @@ export const MODELS = {
         },
         "llama-3.3-70b-versatile": {
             id: "llama-3.3-70b-versatile",
-            name: "Llama 3.3 70B Versatile",
+            name: "Llama 3.3 70B",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
@@ -5057,60 +4991,9 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 32768,
         },
-        "llama3-70b-8192": {
-            id: "llama3-70b-8192",
-            name: "Llama 3 70B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.59,
-                output: 0.79,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 8192,
-        },
-        "llama3-8b-8192": {
-            id: "llama3-8b-8192",
-            name: "Llama 3 8B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.05,
-                output: 0.08,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 8192,
-            maxTokens: 8192,
-        },
-        "meta-llama/llama-4-maverick-17b-128e-instruct": {
-            id: "meta-llama/llama-4-maverick-17b-128e-instruct",
-            name: "Llama 4 Maverick 17B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text", "image"],
-            cost: {
-                input: 0.2,
-                output: 0.6,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 8192,
-        },
         "meta-llama/llama-4-scout-17b-16e-instruct": {
             id: "meta-llama/llama-4-scout-17b-16e-instruct",
-            name: "Llama 4 Scout 17B",
+            name: "Llama 4 Scout 17B 16E",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
@@ -5125,57 +5008,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 8192,
         },
-        "mistral-saba-24b": {
-            id: "mistral-saba-24b",
-            name: "Mistral Saba 24B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 0.79,
-                output: 0.79,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 32768,
-            maxTokens: 32768,
-        },
-        "moonshotai/kimi-k2-instruct": {
-            id: "moonshotai/kimi-k2-instruct",
-            name: "Kimi K2 Instruct",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 1,
-                output: 3,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 16384,
-        },
-        "moonshotai/kimi-k2-instruct-0905": {
-            id: "moonshotai/kimi-k2-instruct-0905",
-            name: "Kimi K2 Instruct 0905",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 1,
-                output: 3,
-                cacheRead: 0.5,
-                cacheWrite: 0,
-            },
-            contextWindow: 262144,
-            maxTokens: 16384,
-        },
         "openai/gpt-oss-120b": {
             id: "openai/gpt-oss-120b",
             name: "GPT OSS 120B",
@@ -5227,26 +5059,9 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 65536,
         },
-        "qwen-qwq-32b": {
-            id: "qwen-qwq-32b",
-            name: "Qwen QwQ 32B",
-            api: "openai-completions",
-            provider: "groq",
-            baseUrl: "https://api.groq.com/openai/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.29,
-                output: 0.39,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 16384,
-        },
         "qwen/qwen3-32b": {
             id: "qwen/qwen3-32b",
-            name: "Qwen3 32B",
+            name: "Qwen3-32B",
             api: "openai-completions",
             provider: "groq",
             baseUrl: "https://api.groq.com/openai/v1",
@@ -7617,7 +7432,7 @@ export const MODELS = {
             cost: {
                 input: 0.14,
                 output: 0.28,
-                cacheRead: 0.03,
+                cacheRead: 0.028,
                 cacheWrite: 0,
             },
             contextWindow: 1000000,
@@ -7642,6 +7457,25 @@ export const MODELS = {
             contextWindow: 200000,
             maxTokens: 128000,
         },
+        "deepseek-v4-pro": {
+            id: "deepseek-v4-pro",
+            name: "DeepSeek V4 Pro",
+            api: "openai-completions",
+            provider: "opencode",
+            baseUrl: "https://opencode.ai/zen/v1",
+            compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
+            reasoning: true,
+            thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
+            input: ["text"],
+            cost: {
+                input: 1.74,
+                output: 3.84,
+                cacheRead: 0.145,
+                cacheWrite: 0,
+            },
+            contextWindow: 1000000,
+            maxTokens: 384000,
+        },
         "gemini-3-flash": {
             id: "gemini-3-flash",
             name: "Gemini 3 Flash",
@@ -8371,16 +8205,16 @@ export const MODELS = {
         },
         "minimax-m3": {
             id: "minimax-m3",
-            name: "MiniMax M3",
+            name: "MiniMax M3 (3x usage)",
             api: "anthropic-messages",
             provider: "opencode-go",
             baseUrl: "https://opencode.ai/zen/go",
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.3,
-                output: 1.2,
-                cacheRead: 0.06,
+                input: 0.1,
+                output: 0.4,
+                cacheRead: 0.02,
                 cacheWrite: 0,
             },
             contextWindow: 512000,
@@ -9021,7 +8855,7 @@ export const MODELS = {
                 cacheRead: 0.135,
                 cacheWrite: 0,
             },
-            contextWindow: 163840,
+            contextWindow: 131072,
             maxTokens: 16384,
         },
         "deepseek/deepseek-chat-v3.1": {
@@ -9137,13 +8971,13 @@ export const MODELS = {
             thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
             input: ["text"],
             cost: {
-                input: 0.0983,
-                output: 0.1966,
-                cacheRead: 0.019700000000000002,
+                input: 0.098,
+                output: 0.196,
+                cacheRead: 0.02,
                 cacheWrite: 0,
             },
             contextWindow: 1048576,
-            maxTokens: 131072,
+            maxTokens: 4096,
         },
         "deepseek/deepseek-v4-pro": {
             id: "deepseek/deepseek-v4-pro",
@@ -9463,12 +9297,12 @@ export const MODELS = {
             input: ["text", "image"],
             cost: {
                 input: 0.12,
-                output: 0.36,
+                output: 0.35,
                 cacheRead: 0.09,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 8192,
+            maxTokens: 262144,
         },
         "google/gemma-4-31b-it:free": {
             id: "google/gemma-4-31b-it:free",
@@ -9769,9 +9603,9 @@ export const MODELS = {
             reasoning: true,
             input: ["text"],
             cost: {
-                input: 0.27,
-                output: 1.08,
-                cacheRead: 0.054,
+                input: 0.25,
+                output: 1,
+                cacheRead: 0.049999999999999996,
                 cacheWrite: 0,
             },
             contextWindow: 204800,
@@ -10161,27 +9995,26 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.6799999999999999,
-                output: 3.41,
-                cacheRead: 0.33999999999999997,
+                input: 0.67,
+                output: 3.39,
+                cacheRead: 0.14,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262142,
+            maxTokens: 262144,
         },
-        "moonshotai/kimi-k2.6:free": {
-            id: "moonshotai/kimi-k2.6:free",
-            name: "MoonshotAI: Kimi K2.6 (free)",
+        "moonshotai/kimi-k2.7-code": {
+            id: "moonshotai/kimi-k2.7-code",
+            name: "MoonshotAI: Kimi K2.7 Code",
             api: "openai-completions",
             provider: "openrouter",
             baseUrl: "https://openrouter.ai/api/v1",
-            compat: { "supportsDeveloperRole": false },
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0,
-                output: 0,
-                cacheRead: 0,
+                input: 0.95,
+                output: 4,
+                cacheRead: 0.19,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
@@ -10357,23 +10190,6 @@ export const MODELS = {
             contextWindow: 128000,
             maxTokens: 128000,
         },
-        "nvidia/nemotron-nano-9b-v2": {
-            id: "nvidia/nemotron-nano-9b-v2",
-            name: "NVIDIA: Nemotron Nano 9B V2",
-            api: "openai-completions",
-            provider: "openrouter",
-            baseUrl: "https://openrouter.ai/api/v1",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 0.04,
-                output: 0.16,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 16384,
-        },
         "nvidia/nemotron-nano-9b-v2:free": {
             id: "nvidia/nemotron-nano-9b-v2:free",
             name: "NVIDIA: Nemotron Nano 9B V2 (free)",
@@ -12095,13 +11911,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.28900000000000003,
-                output: 2.4,
+                input: 0.28700000000000003,
+                output: 3.1,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 131072,
+            maxTokens: 262140,
         },
         "qwen/qwen3.6-35b-a3b": {
             id: "qwen/qwen3.6-35b-a3b",
@@ -12112,13 +11928,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.14,
+                input: 0.15,
                 output: 1,
-                cacheRead: 0,
+                cacheRead: 0.049999999999999996,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262140,
+            maxTokens: 262144,
         },
         "qwen/qwen3.6-flash": {
             id: "qwen/qwen3.6-flash",
@@ -12197,10 +12013,10 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.39999999999999997,
-                output: 1.5999999999999999,
-                cacheRead: 0.08,
-                cacheWrite: 0.5,
+                input: 0.32,
+                output: 1.28,
+                cacheRead: 0.064,
+                cacheWrite: 0.39999999999999997,
             },
             contextWindow: 1000000,
             maxTokens: 65536,
@@ -12741,13 +12557,13 @@ export const MODELS = {
             reasoning: true,
             input: ["text", "image"],
             cost: {
-                input: 0.6799999999999999,
-                output: 3.41,
-                cacheRead: 0.33999999999999997,
+                input: 0.67,
+                output: 3.39,
+                cacheRead: 0.14,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262142,
+            maxTokens: 262144,
         },
         "~openai/gpt-latest": {
             id: "~openai/gpt-latest",
@@ -12785,25 +12601,6 @@ export const MODELS = {
         },
     },
     "together": {
-        "MiniMaxAI/MiniMax-M2.5": {
-            id: "MiniMaxAI/MiniMax-M2.5",
-            name: "MiniMax-M2.5",
-            api: "openai-completions",
-            provider: "together",
-            baseUrl: "https://api.together.ai/v1",
-            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
-            reasoning: true,
-            thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
-            input: ["text"],
-            cost: {
-                input: 0.3,
-                output: 1.2,
-                cacheRead: 0.06,
-                cacheWrite: 0,
-            },
-            contextWindow: 204800,
-            maxTokens: 131072,
-        },
         "MiniMaxAI/MiniMax-M2.7": {
             id: "MiniMaxAI/MiniMax-M2.7",
             name: "MiniMax-M2.7",
@@ -12823,28 +12620,27 @@ export const MODELS = {
             contextWindow: 202752,
             maxTokens: 131072,
         },
-        "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
-            id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
-            name: "Qwen3 235B A22B Instruct 2507 FP8",
+        "Qwen/Qwen2.5-7B-Instruct-Turbo": {
+            id: "Qwen/Qwen2.5-7B-Instruct-Turbo",
+            name: "Qwen 2.5 7B Instruct Turbo",
             api: "openai-completions",
             provider: "together",
             baseUrl: "https://api.together.ai/v1",
-            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
-            reasoning: true,
-            thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
+            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
+            reasoning: false,
             input: ["text"],
             cost: {
-                input: 0.2,
-                output: 0.6,
+                input: 0.3,
+                output: 0.3,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
-            contextWindow: 262144,
-            maxTokens: 262144,
+            contextWindow: 32768,
+            maxTokens: 32768,
         },
-        "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8": {
-            id: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
-            name: "Qwen3 Coder 480B A35B Instruct",
+        "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
+            id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
+            name: "Qwen3 235B A22B Instruct 2507 FP8",
             api: "openai-completions",
             provider: "together",
             baseUrl: "https://api.together.ai/v1",
@@ -12852,36 +12648,36 @@ export const MODELS = {
             reasoning: false,
             input: ["text"],
             cost: {
-                input: 2,
-                output: 2,
+                input: 0.2,
+                output: 0.6,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
             maxTokens: 262144,
         },
-        "Qwen/Qwen3-Coder-Next-FP8": {
-            id: "Qwen/Qwen3-Coder-Next-FP8",
-            name: "Qwen3 Coder Next FP8",
+        "Qwen/Qwen3.5-397B-A17B": {
+            id: "Qwen/Qwen3.5-397B-A17B",
+            name: "Qwen3.5 397B A17B",
             api: "openai-completions",
             provider: "together",
             baseUrl: "https://api.together.ai/v1",
             compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
             reasoning: true,
             thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
-            input: ["text"],
+            input: ["text", "image"],
             cost: {
-                input: 0.5,
-                output: 1.2,
+                input: 0.6,
+                output: 3.6,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 262144,
+            maxTokens: 130000,
         },
-        "Qwen/Qwen3.5-397B-A17B": {
-            id: "Qwen/Qwen3.5-397B-A17B",
-            name: "Qwen3.5 397B A17B",
+        "Qwen/Qwen3.5-9B": {
+            id: "Qwen/Qwen3.5-9B",
+            name: "Qwen3.5 9B",
             api: "openai-completions",
             provider: "together",
             baseUrl: "https://api.together.ai/v1",
@@ -12890,13 +12686,13 @@ export const MODELS = {
             thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
             input: ["text", "image"],
             cost: {
-                input: 0.6,
-                output: 3.6,
+                input: 0.17,
+                output: 0.25,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
             contextWindow: 262144,
-            maxTokens: 130000,
+            maxTokens: 65536,
         },
         "Qwen/Qwen3.6-Plus": {
             id: "Qwen/Qwen3.6-Plus",
@@ -12923,9 +12719,8 @@ export const MODELS = {
             api: "openai-completions",
             provider: "together",
             baseUrl: "https://api.together.ai/v1",
-            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
-            reasoning: true,
-            thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
+            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
+            reasoning: false,
             input: ["text"],
             cost: {
                 input: 2.5,
@@ -12936,44 +12731,6 @@ export const MODELS = {
             contextWindow: 1000000,
             maxTokens: 500000,
         },
-        "deepseek-ai/DeepSeek-V3": {
-            id: "deepseek-ai/DeepSeek-V3",
-            name: "DeepSeek-V3",
-            api: "openai-completions",
-            provider: "together",
-            baseUrl: "https://api.together.ai/v1",
-            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
-            reasoning: true,
-            thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
-            input: ["text"],
-            cost: {
-                input: 1.25,
-                output: 1.25,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 131072,
-        },
-        "deepseek-ai/DeepSeek-V3-1": {
-            id: "deepseek-ai/DeepSeek-V3-1",
-            name: "DeepSeek V3.1",
-            api: "openai-completions",
-            provider: "together",
-            baseUrl: "https://api.together.ai/v1",
-            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
-            reasoning: true,
-            thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
-            input: ["text"],
-            cost: {
-                input: 0.6,
-                output: 1.7,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 131072,
-            maxTokens: 131072,
-        },
         "deepseek-ai/DeepSeek-V4-Pro": {
             id: "deepseek-ai/DeepSeek-V4-Pro",
             name: "DeepSeek V4 Pro",
@@ -12985,8 +12742,8 @@ export const MODELS = {
             thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": null },
             input: ["text"],
             cost: {
-                input: 2.1,
-                output: 4.4,
+                input: 1.74,
+                output: 3.48,
                 cacheRead: 0.2,
                 cacheWrite: 0,
             },
@@ -13022,8 +12779,8 @@ export const MODELS = {
             thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
             input: ["text", "image"],
             cost: {
-                input: 0.2,
-                output: 0.5,
+                input: 0.39,
+                output: 0.97,
                 cacheRead: 0,
                 cacheWrite: 0,
             },
@@ -13048,25 +12805,6 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 131072,
         },
-        "moonshotai/Kimi-K2.5": {
-            id: "moonshotai/Kimi-K2.5",
-            name: "Kimi K2.5",
-            api: "openai-completions",
-            provider: "together",
-            baseUrl: "https://api.together.ai/v1",
-            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
-            reasoning: true,
-            thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
-            input: ["text", "image"],
-            cost: {
-                input: 0.5,
-                output: 2.8,
-                cacheRead: 0,
-                cacheWrite: 0,
-            },
-            contextWindow: 262144,
-            maxTokens: 262144,
-        },
         "moonshotai/Kimi-K2.6": {
             id: "moonshotai/Kimi-K2.6",
             name: "Kimi K2.6",
@@ -13124,6 +12862,44 @@ export const MODELS = {
             contextWindow: 131072,
             maxTokens: 131072,
         },
+        "openai/gpt-oss-20b": {
+            id: "openai/gpt-oss-20b",
+            name: "GPT OSS 20B",
+            api: "openai-completions",
+            provider: "together",
+            baseUrl: "https://api.together.ai/v1",
+            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "openai" },
+            reasoning: true,
+            thinkingLevelMap: { "off": null, "minimal": null },
+            input: ["text"],
+            cost: {
+                input: 0.05,
+                output: 0.2,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 131072,
+            maxTokens: 131072,
+        },
+        "zai-org/GLM-5": {
+            id: "zai-org/GLM-5",
+            name: "GLM-5",
+            api: "openai-completions",
+            provider: "together",
+            baseUrl: "https://api.together.ai/v1",
+            compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
+            reasoning: true,
+            thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
+            input: ["text"],
+            cost: {
+                input: 1,
+                output: 3.2,
+                cacheRead: 0,
+                cacheWrite: 0,
+            },
+            contextWindow: 202752,
+            maxTokens: 131072,
+        },
         "zai-org/GLM-5.1": {
             id: "zai-org/GLM-5.1",
             name: "GLM-5.1",
@@ -14699,40 +14475,6 @@ export const MODELS = {
             contextWindow: 262114,
             maxTokens: 262114,
         },
-        "moonshotai/kimi-k2-thinking-turbo": {
-            id: "moonshotai/kimi-k2-thinking-turbo",
-            name: "Kimi K2 Thinking Turbo",
-            api: "anthropic-messages",
-            provider: "vercel-ai-gateway",
-            baseUrl: "https://ai-gateway.vercel.sh",
-            reasoning: true,
-            input: ["text"],
-            cost: {
-                input: 1.15,
-                output: 8,
-                cacheRead: 0.15,
-                cacheWrite: 0,
-            },
-            contextWindow: 262114,
-            maxTokens: 262114,
-        },
-        "moonshotai/kimi-k2-turbo": {
-            id: "moonshotai/kimi-k2-turbo",
-            name: "Kimi K2 Turbo",
-            api: "anthropic-messages",
-            provider: "vercel-ai-gateway",
-            baseUrl: "https://ai-gateway.vercel.sh",
-            reasoning: false,
-            input: ["text"],
-            cost: {
-                input: 1.15,
-                output: 8,
-                cacheRead: 0.15,
-                cacheWrite: 0,
-            },
-            contextWindow: 256000,
-            maxTokens: 16384,
-        },
         "moonshotai/kimi-k2.5": {
             id: "moonshotai/kimi-k2.5",
             name: "Kimi K2.5",