@earendil-works/pi-ai 0.79.1 → 0.79.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/models.generated.d.ts +273 -501
- package/dist/models.generated.d.ts.map +1 -1
- package/dist/models.generated.js +519 -740
- package/dist/models.generated.js.map +1 -1
- package/dist/providers/amazon-bedrock.d.ts.map +1 -1
- package/dist/providers/amazon-bedrock.js +11 -2
- package/dist/providers/amazon-bedrock.js.map +1 -1
- package/dist/providers/anthropic.d.ts.map +1 -1
- package/dist/providers/anthropic.js +18 -11
- package/dist/providers/anthropic.js.map +1 -1
- package/dist/providers/openai-codex-responses.d.ts.map +1 -1
- package/dist/providers/openai-codex-responses.js +3 -1
- package/dist/providers/openai-codex-responses.js.map +1 -1
- package/dist/utils/overflow.d.ts +1 -1
- package/dist/utils/overflow.d.ts.map +1 -1
- package/dist/utils/overflow.js +3 -2
- package/dist/utils/overflow.js.map +1 -1
- package/package.json +1 -1
package/dist/models.generated.js
CHANGED
|
@@ -354,7 +354,7 @@ export const MODELS = {
|
|
|
354
354
|
provider: "amazon-bedrock",
|
|
355
355
|
baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
|
|
356
356
|
reasoning: true,
|
|
357
|
-
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
357
|
+
thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
|
|
358
358
|
input: ["text", "image"],
|
|
359
359
|
cost: {
|
|
360
360
|
input: 11,
|
|
@@ -494,7 +494,7 @@ export const MODELS = {
|
|
|
494
494
|
provider: "amazon-bedrock",
|
|
495
495
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
496
496
|
reasoning: true,
|
|
497
|
-
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
497
|
+
thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
|
|
498
498
|
input: ["text", "image"],
|
|
499
499
|
cost: {
|
|
500
500
|
input: 10,
|
|
@@ -1386,7 +1386,7 @@ export const MODELS = {
|
|
|
1386
1386
|
provider: "amazon-bedrock",
|
|
1387
1387
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
1388
1388
|
reasoning: true,
|
|
1389
|
-
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
1389
|
+
thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
|
|
1390
1390
|
input: ["text", "image"],
|
|
1391
1391
|
cost: {
|
|
1392
1392
|
input: 10,
|
|
@@ -1875,7 +1875,7 @@ export const MODELS = {
|
|
|
1875
1875
|
baseUrl: "https://api.anthropic.com",
|
|
1876
1876
|
compat: { "forceAdaptiveThinking": true },
|
|
1877
1877
|
reasoning: true,
|
|
1878
|
-
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
1878
|
+
thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
|
|
1879
1879
|
input: ["text", "image"],
|
|
1880
1880
|
cost: {
|
|
1881
1881
|
input: 10,
|
|
@@ -2916,30 +2916,13 @@ export const MODELS = {
|
|
|
2916
2916
|
reasoning: true,
|
|
2917
2917
|
input: ["text"],
|
|
2918
2918
|
cost: {
|
|
2919
|
-
input: 0.
|
|
2920
|
-
output: 0.
|
|
2919
|
+
input: 0.35,
|
|
2920
|
+
output: 0.75,
|
|
2921
2921
|
cacheRead: 0,
|
|
2922
2922
|
cacheWrite: 0,
|
|
2923
2923
|
},
|
|
2924
2924
|
contextWindow: 131072,
|
|
2925
|
-
maxTokens:
|
|
2926
|
-
},
|
|
2927
|
-
"llama3.1-8b": {
|
|
2928
|
-
id: "llama3.1-8b",
|
|
2929
|
-
name: "Llama 3.1 8B",
|
|
2930
|
-
api: "openai-completions",
|
|
2931
|
-
provider: "cerebras",
|
|
2932
|
-
baseUrl: "https://api.cerebras.ai/v1",
|
|
2933
|
-
reasoning: false,
|
|
2934
|
-
input: ["text"],
|
|
2935
|
-
cost: {
|
|
2936
|
-
input: 0.1,
|
|
2937
|
-
output: 0.1,
|
|
2938
|
-
cacheRead: 0,
|
|
2939
|
-
cacheWrite: 0,
|
|
2940
|
-
},
|
|
2941
|
-
contextWindow: 32000,
|
|
2942
|
-
maxTokens: 8000,
|
|
2925
|
+
maxTokens: 40960,
|
|
2943
2926
|
},
|
|
2944
2927
|
"zai-glm-4.7": {
|
|
2945
2928
|
id: "zai-glm-4.7",
|
|
@@ -2947,7 +2930,7 @@ export const MODELS = {
|
|
|
2947
2930
|
api: "openai-completions",
|
|
2948
2931
|
provider: "cerebras",
|
|
2949
2932
|
baseUrl: "https://api.cerebras.ai/v1",
|
|
2950
|
-
reasoning:
|
|
2933
|
+
reasoning: true,
|
|
2951
2934
|
input: ["text"],
|
|
2952
2935
|
cost: {
|
|
2953
2936
|
input: 2.25,
|
|
@@ -2956,7 +2939,7 @@ export const MODELS = {
|
|
|
2956
2939
|
cacheWrite: 0,
|
|
2957
2940
|
},
|
|
2958
2941
|
contextWindow: 131072,
|
|
2959
|
-
maxTokens:
|
|
2942
|
+
maxTokens: 40960,
|
|
2960
2943
|
},
|
|
2961
2944
|
},
|
|
2962
2945
|
"cloudflare-ai-gateway": {
|
|
@@ -3070,7 +3053,7 @@ export const MODELS = {
|
|
|
3070
3053
|
baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
|
|
3071
3054
|
compat: { "forceAdaptiveThinking": true },
|
|
3072
3055
|
reasoning: true,
|
|
3073
|
-
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
3056
|
+
thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
|
|
3074
3057
|
input: ["text", "image"],
|
|
3075
3058
|
cost: {
|
|
3076
3059
|
input: 10,
|
|
@@ -3719,6 +3702,24 @@ export const MODELS = {
|
|
|
3719
3702
|
contextWindow: 262144,
|
|
3720
3703
|
maxTokens: 256000,
|
|
3721
3704
|
},
|
|
3705
|
+
"@cf/moonshotai/kimi-k2.7-code": {
|
|
3706
|
+
id: "@cf/moonshotai/kimi-k2.7-code",
|
|
3707
|
+
name: "Kimi K2.7 Code",
|
|
3708
|
+
api: "openai-completions",
|
|
3709
|
+
provider: "cloudflare-workers-ai",
|
|
3710
|
+
baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
|
|
3711
|
+
compat: { "sendSessionAffinityHeaders": true },
|
|
3712
|
+
reasoning: true,
|
|
3713
|
+
input: ["text", "image"],
|
|
3714
|
+
cost: {
|
|
3715
|
+
input: 0.95,
|
|
3716
|
+
output: 4,
|
|
3717
|
+
cacheRead: 0.19,
|
|
3718
|
+
cacheWrite: 0,
|
|
3719
|
+
},
|
|
3720
|
+
contextWindow: 262144,
|
|
3721
|
+
maxTokens: 262144,
|
|
3722
|
+
},
|
|
3722
3723
|
"@cf/nvidia/nemotron-3-120b-a12b": {
|
|
3723
3724
|
id: "@cf/nvidia/nemotron-3-120b-a12b",
|
|
3724
3725
|
name: "Nemotron 3 Super 120B",
|
|
@@ -4087,6 +4088,25 @@ export const MODELS = {
|
|
|
4087
4088
|
},
|
|
4088
4089
|
},
|
|
4089
4090
|
"github-copilot": {
|
|
4091
|
+
"claude-fable-5": {
|
|
4092
|
+
id: "claude-fable-5",
|
|
4093
|
+
name: "Claude Fable 5",
|
|
4094
|
+
api: "openai-completions",
|
|
4095
|
+
provider: "github-copilot",
|
|
4096
|
+
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4097
|
+
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4098
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
|
|
4099
|
+
reasoning: true,
|
|
4100
|
+
input: ["text", "image"],
|
|
4101
|
+
cost: {
|
|
4102
|
+
input: 10,
|
|
4103
|
+
output: 50,
|
|
4104
|
+
cacheRead: 1,
|
|
4105
|
+
cacheWrite: 12.5,
|
|
4106
|
+
},
|
|
4107
|
+
contextWindow: 1000000,
|
|
4108
|
+
maxTokens: 128000,
|
|
4109
|
+
},
|
|
4090
4110
|
"claude-haiku-4.5": {
|
|
4091
4111
|
id: "claude-haiku-4.5",
|
|
4092
4112
|
name: "Claude Haiku 4.5 (latest)",
|
|
@@ -5019,77 +5039,9 @@ export const MODELS = {
|
|
|
5019
5039
|
},
|
|
5020
5040
|
},
|
|
5021
5041
|
"groq": {
|
|
5022
|
-
"deepseek-r1-distill-llama-70b": {
|
|
5023
|
-
id: "deepseek-r1-distill-llama-70b",
|
|
5024
|
-
name: "DeepSeek R1 Distill Llama 70B",
|
|
5025
|
-
api: "openai-completions",
|
|
5026
|
-
provider: "groq",
|
|
5027
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5028
|
-
reasoning: true,
|
|
5029
|
-
input: ["text"],
|
|
5030
|
-
cost: {
|
|
5031
|
-
input: 0.75,
|
|
5032
|
-
output: 0.99,
|
|
5033
|
-
cacheRead: 0,
|
|
5034
|
-
cacheWrite: 0,
|
|
5035
|
-
},
|
|
5036
|
-
contextWindow: 131072,
|
|
5037
|
-
maxTokens: 8192,
|
|
5038
|
-
},
|
|
5039
|
-
"gemma2-9b-it": {
|
|
5040
|
-
id: "gemma2-9b-it",
|
|
5041
|
-
name: "Gemma 2 9B",
|
|
5042
|
-
api: "openai-completions",
|
|
5043
|
-
provider: "groq",
|
|
5044
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5045
|
-
reasoning: false,
|
|
5046
|
-
input: ["text"],
|
|
5047
|
-
cost: {
|
|
5048
|
-
input: 0.2,
|
|
5049
|
-
output: 0.2,
|
|
5050
|
-
cacheRead: 0,
|
|
5051
|
-
cacheWrite: 0,
|
|
5052
|
-
},
|
|
5053
|
-
contextWindow: 8192,
|
|
5054
|
-
maxTokens: 8192,
|
|
5055
|
-
},
|
|
5056
|
-
"groq/compound": {
|
|
5057
|
-
id: "groq/compound",
|
|
5058
|
-
name: "Compound",
|
|
5059
|
-
api: "openai-completions",
|
|
5060
|
-
provider: "groq",
|
|
5061
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5062
|
-
reasoning: true,
|
|
5063
|
-
input: ["text"],
|
|
5064
|
-
cost: {
|
|
5065
|
-
input: 0,
|
|
5066
|
-
output: 0,
|
|
5067
|
-
cacheRead: 0,
|
|
5068
|
-
cacheWrite: 0,
|
|
5069
|
-
},
|
|
5070
|
-
contextWindow: 131072,
|
|
5071
|
-
maxTokens: 8192,
|
|
5072
|
-
},
|
|
5073
|
-
"groq/compound-mini": {
|
|
5074
|
-
id: "groq/compound-mini",
|
|
5075
|
-
name: "Compound Mini",
|
|
5076
|
-
api: "openai-completions",
|
|
5077
|
-
provider: "groq",
|
|
5078
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5079
|
-
reasoning: true,
|
|
5080
|
-
input: ["text"],
|
|
5081
|
-
cost: {
|
|
5082
|
-
input: 0,
|
|
5083
|
-
output: 0,
|
|
5084
|
-
cacheRead: 0,
|
|
5085
|
-
cacheWrite: 0,
|
|
5086
|
-
},
|
|
5087
|
-
contextWindow: 131072,
|
|
5088
|
-
maxTokens: 8192,
|
|
5089
|
-
},
|
|
5090
5042
|
"llama-3.1-8b-instant": {
|
|
5091
5043
|
id: "llama-3.1-8b-instant",
|
|
5092
|
-
name: "Llama 3.1 8B
|
|
5044
|
+
name: "Llama 3.1 8B",
|
|
5093
5045
|
api: "openai-completions",
|
|
5094
5046
|
provider: "groq",
|
|
5095
5047
|
baseUrl: "https://api.groq.com/openai/v1",
|
|
@@ -5106,7 +5058,7 @@ export const MODELS = {
|
|
|
5106
5058
|
},
|
|
5107
5059
|
"llama-3.3-70b-versatile": {
|
|
5108
5060
|
id: "llama-3.3-70b-versatile",
|
|
5109
|
-
name: "Llama 3.3 70B
|
|
5061
|
+
name: "Llama 3.3 70B",
|
|
5110
5062
|
api: "openai-completions",
|
|
5111
5063
|
provider: "groq",
|
|
5112
5064
|
baseUrl: "https://api.groq.com/openai/v1",
|
|
@@ -5121,60 +5073,9 @@ export const MODELS = {
|
|
|
5121
5073
|
contextWindow: 131072,
|
|
5122
5074
|
maxTokens: 32768,
|
|
5123
5075
|
},
|
|
5124
|
-
"llama3-70b-8192": {
|
|
5125
|
-
id: "llama3-70b-8192",
|
|
5126
|
-
name: "Llama 3 70B",
|
|
5127
|
-
api: "openai-completions",
|
|
5128
|
-
provider: "groq",
|
|
5129
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5130
|
-
reasoning: false,
|
|
5131
|
-
input: ["text"],
|
|
5132
|
-
cost: {
|
|
5133
|
-
input: 0.59,
|
|
5134
|
-
output: 0.79,
|
|
5135
|
-
cacheRead: 0,
|
|
5136
|
-
cacheWrite: 0,
|
|
5137
|
-
},
|
|
5138
|
-
contextWindow: 8192,
|
|
5139
|
-
maxTokens: 8192,
|
|
5140
|
-
},
|
|
5141
|
-
"llama3-8b-8192": {
|
|
5142
|
-
id: "llama3-8b-8192",
|
|
5143
|
-
name: "Llama 3 8B",
|
|
5144
|
-
api: "openai-completions",
|
|
5145
|
-
provider: "groq",
|
|
5146
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5147
|
-
reasoning: false,
|
|
5148
|
-
input: ["text"],
|
|
5149
|
-
cost: {
|
|
5150
|
-
input: 0.05,
|
|
5151
|
-
output: 0.08,
|
|
5152
|
-
cacheRead: 0,
|
|
5153
|
-
cacheWrite: 0,
|
|
5154
|
-
},
|
|
5155
|
-
contextWindow: 8192,
|
|
5156
|
-
maxTokens: 8192,
|
|
5157
|
-
},
|
|
5158
|
-
"meta-llama/llama-4-maverick-17b-128e-instruct": {
|
|
5159
|
-
id: "meta-llama/llama-4-maverick-17b-128e-instruct",
|
|
5160
|
-
name: "Llama 4 Maverick 17B",
|
|
5161
|
-
api: "openai-completions",
|
|
5162
|
-
provider: "groq",
|
|
5163
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5164
|
-
reasoning: false,
|
|
5165
|
-
input: ["text", "image"],
|
|
5166
|
-
cost: {
|
|
5167
|
-
input: 0.2,
|
|
5168
|
-
output: 0.6,
|
|
5169
|
-
cacheRead: 0,
|
|
5170
|
-
cacheWrite: 0,
|
|
5171
|
-
},
|
|
5172
|
-
contextWindow: 131072,
|
|
5173
|
-
maxTokens: 8192,
|
|
5174
|
-
},
|
|
5175
5076
|
"meta-llama/llama-4-scout-17b-16e-instruct": {
|
|
5176
5077
|
id: "meta-llama/llama-4-scout-17b-16e-instruct",
|
|
5177
|
-
name: "Llama 4 Scout 17B",
|
|
5078
|
+
name: "Llama 4 Scout 17B 16E",
|
|
5178
5079
|
api: "openai-completions",
|
|
5179
5080
|
provider: "groq",
|
|
5180
5081
|
baseUrl: "https://api.groq.com/openai/v1",
|
|
@@ -5189,57 +5090,6 @@ export const MODELS = {
|
|
|
5189
5090
|
contextWindow: 131072,
|
|
5190
5091
|
maxTokens: 8192,
|
|
5191
5092
|
},
|
|
5192
|
-
"mistral-saba-24b": {
|
|
5193
|
-
id: "mistral-saba-24b",
|
|
5194
|
-
name: "Mistral Saba 24B",
|
|
5195
|
-
api: "openai-completions",
|
|
5196
|
-
provider: "groq",
|
|
5197
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5198
|
-
reasoning: false,
|
|
5199
|
-
input: ["text"],
|
|
5200
|
-
cost: {
|
|
5201
|
-
input: 0.79,
|
|
5202
|
-
output: 0.79,
|
|
5203
|
-
cacheRead: 0,
|
|
5204
|
-
cacheWrite: 0,
|
|
5205
|
-
},
|
|
5206
|
-
contextWindow: 32768,
|
|
5207
|
-
maxTokens: 32768,
|
|
5208
|
-
},
|
|
5209
|
-
"moonshotai/kimi-k2-instruct": {
|
|
5210
|
-
id: "moonshotai/kimi-k2-instruct",
|
|
5211
|
-
name: "Kimi K2 Instruct",
|
|
5212
|
-
api: "openai-completions",
|
|
5213
|
-
provider: "groq",
|
|
5214
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5215
|
-
reasoning: false,
|
|
5216
|
-
input: ["text"],
|
|
5217
|
-
cost: {
|
|
5218
|
-
input: 1,
|
|
5219
|
-
output: 3,
|
|
5220
|
-
cacheRead: 0,
|
|
5221
|
-
cacheWrite: 0,
|
|
5222
|
-
},
|
|
5223
|
-
contextWindow: 131072,
|
|
5224
|
-
maxTokens: 16384,
|
|
5225
|
-
},
|
|
5226
|
-
"moonshotai/kimi-k2-instruct-0905": {
|
|
5227
|
-
id: "moonshotai/kimi-k2-instruct-0905",
|
|
5228
|
-
name: "Kimi K2 Instruct 0905",
|
|
5229
|
-
api: "openai-completions",
|
|
5230
|
-
provider: "groq",
|
|
5231
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5232
|
-
reasoning: false,
|
|
5233
|
-
input: ["text"],
|
|
5234
|
-
cost: {
|
|
5235
|
-
input: 1,
|
|
5236
|
-
output: 3,
|
|
5237
|
-
cacheRead: 0.5,
|
|
5238
|
-
cacheWrite: 0,
|
|
5239
|
-
},
|
|
5240
|
-
contextWindow: 262144,
|
|
5241
|
-
maxTokens: 16384,
|
|
5242
|
-
},
|
|
5243
5093
|
"openai/gpt-oss-120b": {
|
|
5244
5094
|
id: "openai/gpt-oss-120b",
|
|
5245
5095
|
name: "GPT OSS 120B",
|
|
@@ -5291,26 +5141,9 @@ export const MODELS = {
|
|
|
5291
5141
|
contextWindow: 131072,
|
|
5292
5142
|
maxTokens: 65536,
|
|
5293
5143
|
},
|
|
5294
|
-
"qwen-qwq-32b": {
|
|
5295
|
-
id: "qwen-qwq-32b",
|
|
5296
|
-
name: "Qwen QwQ 32B",
|
|
5297
|
-
api: "openai-completions",
|
|
5298
|
-
provider: "groq",
|
|
5299
|
-
baseUrl: "https://api.groq.com/openai/v1",
|
|
5300
|
-
reasoning: true,
|
|
5301
|
-
input: ["text"],
|
|
5302
|
-
cost: {
|
|
5303
|
-
input: 0.29,
|
|
5304
|
-
output: 0.39,
|
|
5305
|
-
cacheRead: 0,
|
|
5306
|
-
cacheWrite: 0,
|
|
5307
|
-
},
|
|
5308
|
-
contextWindow: 131072,
|
|
5309
|
-
maxTokens: 16384,
|
|
5310
|
-
},
|
|
5311
5144
|
"qwen/qwen3-32b": {
|
|
5312
5145
|
id: "qwen/qwen3-32b",
|
|
5313
|
-
name: "Qwen3
|
|
5146
|
+
name: "Qwen3-32B",
|
|
5314
5147
|
api: "openai-completions",
|
|
5315
5148
|
provider: "groq",
|
|
5316
5149
|
baseUrl: "https://api.groq.com/openai/v1",
|
|
@@ -5726,6 +5559,24 @@ export const MODELS = {
|
|
|
5726
5559
|
},
|
|
5727
5560
|
},
|
|
5728
5561
|
"kimi-coding": {
|
|
5562
|
+
"k2p7": {
|
|
5563
|
+
id: "k2p7",
|
|
5564
|
+
name: "Kimi K2.7 Code",
|
|
5565
|
+
api: "anthropic-messages",
|
|
5566
|
+
provider: "kimi-coding",
|
|
5567
|
+
baseUrl: "https://api.kimi.com/coding",
|
|
5568
|
+
headers: { "User-Agent": "KimiCLI/1.5" },
|
|
5569
|
+
reasoning: true,
|
|
5570
|
+
input: ["text", "image"],
|
|
5571
|
+
cost: {
|
|
5572
|
+
input: 0,
|
|
5573
|
+
output: 0,
|
|
5574
|
+
cacheRead: 0,
|
|
5575
|
+
cacheWrite: 0,
|
|
5576
|
+
},
|
|
5577
|
+
contextWindow: 262144,
|
|
5578
|
+
maxTokens: 32768,
|
|
5579
|
+
},
|
|
5729
5580
|
"kimi-for-coding": {
|
|
5730
5581
|
id: "kimi-for-coding",
|
|
5731
5582
|
name: "Kimi For Coding",
|
|
@@ -6508,6 +6359,24 @@ export const MODELS = {
|
|
|
6508
6359
|
contextWindow: 262144,
|
|
6509
6360
|
maxTokens: 262144,
|
|
6510
6361
|
},
|
|
6362
|
+
"kimi-k2.7-code": {
|
|
6363
|
+
id: "kimi-k2.7-code",
|
|
6364
|
+
name: "Kimi K2.7 Code",
|
|
6365
|
+
api: "openai-completions",
|
|
6366
|
+
provider: "moonshotai",
|
|
6367
|
+
baseUrl: "https://api.moonshot.ai/v1",
|
|
6368
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
|
|
6369
|
+
reasoning: true,
|
|
6370
|
+
input: ["text", "image"],
|
|
6371
|
+
cost: {
|
|
6372
|
+
input: 0.95,
|
|
6373
|
+
output: 4,
|
|
6374
|
+
cacheRead: 0.19,
|
|
6375
|
+
cacheWrite: 0,
|
|
6376
|
+
},
|
|
6377
|
+
contextWindow: 262144,
|
|
6378
|
+
maxTokens: 262144,
|
|
6379
|
+
},
|
|
6511
6380
|
},
|
|
6512
6381
|
"moonshotai-cn": {
|
|
6513
6382
|
"kimi-k2-0711-preview": {
|
|
@@ -6760,8 +6629,8 @@ export const MODELS = {
|
|
|
6760
6629
|
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6761
6630
|
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6762
6631
|
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6763
|
-
reasoning:
|
|
6764
|
-
input: ["text"],
|
|
6632
|
+
reasoning: true,
|
|
6633
|
+
input: ["text", "image"],
|
|
6765
6634
|
cost: {
|
|
6766
6635
|
input: 0,
|
|
6767
6636
|
output: 0,
|
|
@@ -6790,44 +6659,6 @@ export const MODELS = {
|
|
|
6790
6659
|
contextWindow: 262144,
|
|
6791
6660
|
maxTokens: 262144,
|
|
6792
6661
|
},
|
|
6793
|
-
"nvidia/llama-3.3-nemotron-super-49b-v1": {
|
|
6794
|
-
id: "nvidia/llama-3.3-nemotron-super-49b-v1",
|
|
6795
|
-
name: "Llama 3.3 Nemotron Super 49B v1",
|
|
6796
|
-
api: "openai-completions",
|
|
6797
|
-
provider: "nvidia",
|
|
6798
|
-
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6799
|
-
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6800
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6801
|
-
reasoning: true,
|
|
6802
|
-
input: ["text"],
|
|
6803
|
-
cost: {
|
|
6804
|
-
input: 0,
|
|
6805
|
-
output: 0,
|
|
6806
|
-
cacheRead: 0,
|
|
6807
|
-
cacheWrite: 0,
|
|
6808
|
-
},
|
|
6809
|
-
contextWindow: 131072,
|
|
6810
|
-
maxTokens: 131072,
|
|
6811
|
-
},
|
|
6812
|
-
"nvidia/llama-3.3-nemotron-super-49b-v1.5": {
|
|
6813
|
-
id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
|
|
6814
|
-
name: "Llama 3.3 Nemotron Super 49B v1.5",
|
|
6815
|
-
api: "openai-completions",
|
|
6816
|
-
provider: "nvidia",
|
|
6817
|
-
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6818
|
-
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6819
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6820
|
-
reasoning: true,
|
|
6821
|
-
input: ["text"],
|
|
6822
|
-
cost: {
|
|
6823
|
-
input: 0,
|
|
6824
|
-
output: 0,
|
|
6825
|
-
cacheRead: 0,
|
|
6826
|
-
cacheWrite: 0,
|
|
6827
|
-
},
|
|
6828
|
-
contextWindow: 131072,
|
|
6829
|
-
maxTokens: 131072,
|
|
6830
|
-
},
|
|
6831
6662
|
"nvidia/nemotron-3-nano-30b-a3b": {
|
|
6832
6663
|
id: "nvidia/nemotron-3-nano-30b-a3b",
|
|
6833
6664
|
name: "nemotron-3-nano-30b-a3b",
|
|
@@ -6923,9 +6754,9 @@ export const MODELS = {
|
|
|
6923
6754
|
contextWindow: 131072,
|
|
6924
6755
|
maxTokens: 131072,
|
|
6925
6756
|
},
|
|
6926
|
-
"openai/gpt-oss-
|
|
6927
|
-
id: "openai/gpt-oss-
|
|
6928
|
-
name: "GPT
|
|
6757
|
+
"openai/gpt-oss-120b": {
|
|
6758
|
+
id: "openai/gpt-oss-120b",
|
|
6759
|
+
name: "GPT-OSS-120B",
|
|
6929
6760
|
api: "openai-completions",
|
|
6930
6761
|
provider: "nvidia",
|
|
6931
6762
|
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
@@ -6939,18 +6770,18 @@ export const MODELS = {
|
|
|
6939
6770
|
cacheRead: 0,
|
|
6940
6771
|
cacheWrite: 0,
|
|
6941
6772
|
},
|
|
6942
|
-
contextWindow:
|
|
6943
|
-
maxTokens:
|
|
6773
|
+
contextWindow: 128000,
|
|
6774
|
+
maxTokens: 8192,
|
|
6944
6775
|
},
|
|
6945
|
-
"
|
|
6946
|
-
id: "
|
|
6947
|
-
name: "
|
|
6776
|
+
"openai/gpt-oss-20b": {
|
|
6777
|
+
id: "openai/gpt-oss-20b",
|
|
6778
|
+
name: "GPT OSS 20B",
|
|
6948
6779
|
api: "openai-completions",
|
|
6949
6780
|
provider: "nvidia",
|
|
6950
6781
|
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6951
6782
|
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6952
6783
|
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6953
|
-
reasoning:
|
|
6784
|
+
reasoning: true,
|
|
6954
6785
|
input: ["text"],
|
|
6955
6786
|
cost: {
|
|
6956
6787
|
input: 0,
|
|
@@ -6958,8 +6789,8 @@ export const MODELS = {
|
|
|
6958
6789
|
cacheRead: 0,
|
|
6959
6790
|
cacheWrite: 0,
|
|
6960
6791
|
},
|
|
6961
|
-
contextWindow:
|
|
6962
|
-
maxTokens:
|
|
6792
|
+
contextWindow: 131072,
|
|
6793
|
+
maxTokens: 32768,
|
|
6963
6794
|
},
|
|
6964
6795
|
"qwen/qwen3.5-122b-a10b": {
|
|
6965
6796
|
id: "qwen/qwen3.5-122b-a10b",
|
|
@@ -7548,7 +7379,7 @@ export const MODELS = {
|
|
|
7548
7379
|
cacheRead: 0.25,
|
|
7549
7380
|
cacheWrite: 0,
|
|
7550
7381
|
},
|
|
7551
|
-
contextWindow:
|
|
7382
|
+
contextWindow: 1050000,
|
|
7552
7383
|
maxTokens: 128000,
|
|
7553
7384
|
},
|
|
7554
7385
|
"gpt-5.4-mini": {
|
|
@@ -7620,7 +7451,7 @@ export const MODELS = {
|
|
|
7620
7451
|
cacheRead: 0.5,
|
|
7621
7452
|
cacheWrite: 0,
|
|
7622
7453
|
},
|
|
7623
|
-
contextWindow:
|
|
7454
|
+
contextWindow: 1050000,
|
|
7624
7455
|
maxTokens: 128000,
|
|
7625
7456
|
},
|
|
7626
7457
|
"gpt-5.5-pro": {
|
|
@@ -7812,7 +7643,7 @@ export const MODELS = {
|
|
|
7812
7643
|
cacheRead: 0.25,
|
|
7813
7644
|
cacheWrite: 0,
|
|
7814
7645
|
},
|
|
7815
|
-
contextWindow:
|
|
7646
|
+
contextWindow: 1000000,
|
|
7816
7647
|
maxTokens: 128000,
|
|
7817
7648
|
},
|
|
7818
7649
|
"gpt-5.4-mini": {
|
|
@@ -7830,7 +7661,7 @@ export const MODELS = {
|
|
|
7830
7661
|
cacheRead: 0.075,
|
|
7831
7662
|
cacheWrite: 0,
|
|
7832
7663
|
},
|
|
7833
|
-
contextWindow:
|
|
7664
|
+
contextWindow: 400000,
|
|
7834
7665
|
maxTokens: 128000,
|
|
7835
7666
|
},
|
|
7836
7667
|
"gpt-5.5": {
|
|
@@ -7848,7 +7679,7 @@ export const MODELS = {
|
|
|
7848
7679
|
cacheRead: 0.5,
|
|
7849
7680
|
cacheWrite: 0,
|
|
7850
7681
|
},
|
|
7851
|
-
contextWindow:
|
|
7682
|
+
contextWindow: 400000,
|
|
7852
7683
|
maxTokens: 128000,
|
|
7853
7684
|
},
|
|
7854
7685
|
},
|
|
@@ -7879,7 +7710,7 @@ export const MODELS = {
|
|
|
7879
7710
|
baseUrl: "https://opencode.ai/zen",
|
|
7880
7711
|
compat: { "forceAdaptiveThinking": true },
|
|
7881
7712
|
reasoning: true,
|
|
7882
|
-
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
7713
|
+
thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
|
|
7883
7714
|
input: ["text", "image"],
|
|
7884
7715
|
cost: {
|
|
7885
7716
|
input: 10,
|
|
@@ -8063,7 +7894,7 @@ export const MODELS = {
|
|
|
8063
7894
|
cost: {
|
|
8064
7895
|
input: 0.14,
|
|
8065
7896
|
output: 0.28,
|
|
8066
|
-
cacheRead: 0.
|
|
7897
|
+
cacheRead: 0.028,
|
|
8067
7898
|
cacheWrite: 0,
|
|
8068
7899
|
},
|
|
8069
7900
|
contextWindow: 1000000,
|
|
@@ -8088,6 +7919,25 @@ export const MODELS = {
|
|
|
8088
7919
|
contextWindow: 200000,
|
|
8089
7920
|
maxTokens: 128000,
|
|
8090
7921
|
},
|
|
7922
|
+
"deepseek-v4-pro": {
|
|
7923
|
+
id: "deepseek-v4-pro",
|
|
7924
|
+
name: "DeepSeek V4 Pro",
|
|
7925
|
+
api: "openai-completions",
|
|
7926
|
+
provider: "opencode",
|
|
7927
|
+
baseUrl: "https://opencode.ai/zen/v1",
|
|
7928
|
+
compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
|
|
7929
|
+
reasoning: true,
|
|
7930
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
|
|
7931
|
+
input: ["text"],
|
|
7932
|
+
cost: {
|
|
7933
|
+
input: 1.74,
|
|
7934
|
+
output: 3.84,
|
|
7935
|
+
cacheRead: 0.145,
|
|
7936
|
+
cacheWrite: 0,
|
|
7937
|
+
},
|
|
7938
|
+
contextWindow: 1000000,
|
|
7939
|
+
maxTokens: 384000,
|
|
7940
|
+
},
|
|
8091
7941
|
"gemini-3-flash": {
|
|
8092
7942
|
id: "gemini-3-flash",
|
|
8093
7943
|
name: "Gemini 3 Flash",
|
|
@@ -8721,42 +8571,42 @@ export const MODELS = {
|
|
|
8721
8571
|
contextWindow: 202752,
|
|
8722
8572
|
maxTokens: 32768,
|
|
8723
8573
|
},
|
|
8724
|
-
"kimi-k2.
|
|
8725
|
-
id: "kimi-k2.
|
|
8726
|
-
name: "Kimi K2.
|
|
8574
|
+
"kimi-k2.6": {
|
|
8575
|
+
id: "kimi-k2.6",
|
|
8576
|
+
name: "Kimi K2.6",
|
|
8727
8577
|
api: "openai-completions",
|
|
8728
8578
|
provider: "opencode-go",
|
|
8729
8579
|
baseUrl: "https://opencode.ai/zen/go/v1",
|
|
8730
|
-
compat: { "maxTokensField": "max_tokens" },
|
|
8580
|
+
compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
|
|
8731
8581
|
reasoning: true,
|
|
8582
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
8732
8583
|
input: ["text", "image"],
|
|
8733
8584
|
cost: {
|
|
8734
|
-
input: 0.
|
|
8735
|
-
output:
|
|
8736
|
-
cacheRead: 0.
|
|
8585
|
+
input: 0.95,
|
|
8586
|
+
output: 4,
|
|
8587
|
+
cacheRead: 0.16,
|
|
8737
8588
|
cacheWrite: 0,
|
|
8738
8589
|
},
|
|
8739
8590
|
contextWindow: 262144,
|
|
8740
8591
|
maxTokens: 65536,
|
|
8741
8592
|
},
|
|
8742
|
-
"kimi-k2.
|
|
8743
|
-
id: "kimi-k2.
|
|
8744
|
-
name: "Kimi K2.
|
|
8593
|
+
"kimi-k2.7-code": {
|
|
8594
|
+
id: "kimi-k2.7-code",
|
|
8595
|
+
name: "Kimi K2.7 Code",
|
|
8745
8596
|
api: "openai-completions",
|
|
8746
8597
|
provider: "opencode-go",
|
|
8747
8598
|
baseUrl: "https://opencode.ai/zen/go/v1",
|
|
8748
|
-
compat: { "
|
|
8599
|
+
compat: { "maxTokensField": "max_tokens" },
|
|
8749
8600
|
reasoning: true,
|
|
8750
|
-
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
8751
8601
|
input: ["text", "image"],
|
|
8752
8602
|
cost: {
|
|
8753
8603
|
input: 0.95,
|
|
8754
8604
|
output: 4,
|
|
8755
|
-
cacheRead: 0.
|
|
8605
|
+
cacheRead: 0.19,
|
|
8756
8606
|
cacheWrite: 0,
|
|
8757
8607
|
},
|
|
8758
8608
|
contextWindow: 262144,
|
|
8759
|
-
maxTokens:
|
|
8609
|
+
maxTokens: 262144,
|
|
8760
8610
|
},
|
|
8761
8611
|
"mimo-v2.5": {
|
|
8762
8612
|
id: "mimo-v2.5",
|
|
@@ -8794,23 +8644,6 @@ export const MODELS = {
|
|
|
8794
8644
|
contextWindow: 1048576,
|
|
8795
8645
|
maxTokens: 128000,
|
|
8796
8646
|
},
|
|
8797
|
-
"minimax-m2.5": {
|
|
8798
|
-
id: "minimax-m2.5",
|
|
8799
|
-
name: "MiniMax M2.5",
|
|
8800
|
-
api: "anthropic-messages",
|
|
8801
|
-
provider: "opencode-go",
|
|
8802
|
-
baseUrl: "https://opencode.ai/zen/go",
|
|
8803
|
-
reasoning: true,
|
|
8804
|
-
input: ["text"],
|
|
8805
|
-
cost: {
|
|
8806
|
-
input: 0.3,
|
|
8807
|
-
output: 1.2,
|
|
8808
|
-
cacheRead: 0.03,
|
|
8809
|
-
cacheWrite: 0,
|
|
8810
|
-
},
|
|
8811
|
-
contextWindow: 204800,
|
|
8812
|
-
maxTokens: 65536,
|
|
8813
|
-
},
|
|
8814
8647
|
"minimax-m2.7": {
|
|
8815
8648
|
id: "minimax-m2.7",
|
|
8816
8649
|
name: "MiniMax M2.7",
|
|
@@ -8831,16 +8664,16 @@ export const MODELS = {
|
|
|
8831
8664
|
},
|
|
8832
8665
|
"minimax-m3": {
|
|
8833
8666
|
id: "minimax-m3",
|
|
8834
|
-
name: "MiniMax M3",
|
|
8667
|
+
name: "MiniMax M3 (3x usage)",
|
|
8835
8668
|
api: "anthropic-messages",
|
|
8836
8669
|
provider: "opencode-go",
|
|
8837
8670
|
baseUrl: "https://opencode.ai/zen/go",
|
|
8838
8671
|
reasoning: true,
|
|
8839
8672
|
input: ["text", "image"],
|
|
8840
8673
|
cost: {
|
|
8841
|
-
input: 0.
|
|
8842
|
-
output:
|
|
8843
|
-
cacheRead: 0.
|
|
8674
|
+
input: 0.1,
|
|
8675
|
+
output: 0.4,
|
|
8676
|
+
cacheRead: 0.02,
|
|
8844
8677
|
cacheWrite: 0,
|
|
8845
8678
|
},
|
|
8846
8679
|
contextWindow: 512000,
|
|
@@ -8994,8 +8827,8 @@ export const MODELS = {
|
|
|
8994
8827
|
reasoning: false,
|
|
8995
8828
|
input: ["text", "image"],
|
|
8996
8829
|
cost: {
|
|
8997
|
-
input: 0.
|
|
8998
|
-
output: 3.
|
|
8830
|
+
input: 0.8,
|
|
8831
|
+
output: 3.2,
|
|
8999
8832
|
cacheRead: 0,
|
|
9000
8833
|
cacheWrite: 0,
|
|
9001
8834
|
},
|
|
@@ -9028,7 +8861,7 @@ export const MODELS = {
|
|
|
9028
8861
|
reasoning: false,
|
|
9029
8862
|
input: ["text", "image"],
|
|
9030
8863
|
cost: {
|
|
9031
|
-
input: 0.
|
|
8864
|
+
input: 0.8,
|
|
9032
8865
|
output: 4,
|
|
9033
8866
|
cacheRead: 0.08,
|
|
9034
8867
|
cacheWrite: 1,
|
|
@@ -9064,7 +8897,7 @@ export const MODELS = {
|
|
|
9064
8897
|
cost: {
|
|
9065
8898
|
input: 1,
|
|
9066
8899
|
output: 5,
|
|
9067
|
-
cacheRead: 0.
|
|
8900
|
+
cacheRead: 0.1,
|
|
9068
8901
|
cacheWrite: 1.25,
|
|
9069
8902
|
},
|
|
9070
8903
|
contextWindow: 200000,
|
|
@@ -9408,8 +9241,8 @@ export const MODELS = {
|
|
|
9408
9241
|
reasoning: true,
|
|
9409
9242
|
input: ["text", "image"],
|
|
9410
9243
|
cost: {
|
|
9411
|
-
input: 0.
|
|
9412
|
-
output: 0.
|
|
9244
|
+
input: 0.1,
|
|
9245
|
+
output: 0.4,
|
|
9413
9246
|
cacheRead: 0,
|
|
9414
9247
|
cacheWrite: 0,
|
|
9415
9248
|
},
|
|
@@ -9459,8 +9292,8 @@ export const MODELS = {
|
|
|
9459
9292
|
reasoning: false,
|
|
9460
9293
|
input: ["text"],
|
|
9461
9294
|
cost: {
|
|
9462
|
-
input: 0.
|
|
9463
|
-
output: 0.
|
|
9295
|
+
input: 0.2002,
|
|
9296
|
+
output: 0.8001,
|
|
9464
9297
|
cacheRead: 0,
|
|
9465
9298
|
cacheWrite: 0,
|
|
9466
9299
|
},
|
|
@@ -9476,7 +9309,7 @@ export const MODELS = {
|
|
|
9476
9309
|
reasoning: false,
|
|
9477
9310
|
input: ["text"],
|
|
9478
9311
|
cost: {
|
|
9479
|
-
input: 0.
|
|
9312
|
+
input: 0.2,
|
|
9480
9313
|
output: 0.77,
|
|
9481
9314
|
cacheRead: 0.135,
|
|
9482
9315
|
cacheWrite: 0,
|
|
@@ -9494,7 +9327,7 @@ export const MODELS = {
|
|
|
9494
9327
|
input: ["text"],
|
|
9495
9328
|
cost: {
|
|
9496
9329
|
input: 0.21,
|
|
9497
|
-
output: 0.
|
|
9330
|
+
output: 0.79,
|
|
9498
9331
|
cacheRead: 0.13,
|
|
9499
9332
|
cacheWrite: 0,
|
|
9500
9333
|
},
|
|
@@ -9528,7 +9361,7 @@ export const MODELS = {
|
|
|
9528
9361
|
input: ["text"],
|
|
9529
9362
|
cost: {
|
|
9530
9363
|
input: 0.5,
|
|
9531
|
-
output: 2.
|
|
9364
|
+
output: 2.15,
|
|
9532
9365
|
cacheRead: 0.35,
|
|
9533
9366
|
cacheWrite: 0,
|
|
9534
9367
|
},
|
|
@@ -9597,13 +9430,13 @@ export const MODELS = {
|
|
|
9597
9430
|
thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
|
|
9598
9431
|
input: ["text"],
|
|
9599
9432
|
cost: {
|
|
9600
|
-
input: 0.
|
|
9601
|
-
output: 0.
|
|
9602
|
-
cacheRead: 0.
|
|
9433
|
+
input: 0.098,
|
|
9434
|
+
output: 0.196,
|
|
9435
|
+
cacheRead: 0.02,
|
|
9603
9436
|
cacheWrite: 0,
|
|
9604
9437
|
},
|
|
9605
9438
|
contextWindow: 1048576,
|
|
9606
|
-
maxTokens:
|
|
9439
|
+
maxTokens: 4096,
|
|
9607
9440
|
},
|
|
9608
9441
|
"deepseek/deepseek-v4-pro": {
|
|
9609
9442
|
id: "deepseek/deepseek-v4-pro",
|
|
@@ -9653,7 +9486,7 @@ export const MODELS = {
|
|
|
9653
9486
|
input: 0.3,
|
|
9654
9487
|
output: 2.5,
|
|
9655
9488
|
cacheRead: 0.03,
|
|
9656
|
-
cacheWrite: 0.
|
|
9489
|
+
cacheWrite: 0.083333,
|
|
9657
9490
|
},
|
|
9658
9491
|
contextWindow: 1048576,
|
|
9659
9492
|
maxTokens: 65535,
|
|
@@ -9667,10 +9500,10 @@ export const MODELS = {
|
|
|
9667
9500
|
reasoning: true,
|
|
9668
9501
|
input: ["text", "image"],
|
|
9669
9502
|
cost: {
|
|
9670
|
-
input: 0.
|
|
9671
|
-
output: 0.
|
|
9503
|
+
input: 0.1,
|
|
9504
|
+
output: 0.4,
|
|
9672
9505
|
cacheRead: 0.01,
|
|
9673
|
-
cacheWrite: 0.
|
|
9506
|
+
cacheWrite: 0.083333,
|
|
9674
9507
|
},
|
|
9675
9508
|
contextWindow: 1048576,
|
|
9676
9509
|
maxTokens: 65535,
|
|
@@ -9684,10 +9517,10 @@ export const MODELS = {
|
|
|
9684
9517
|
reasoning: true,
|
|
9685
9518
|
input: ["text", "image"],
|
|
9686
9519
|
cost: {
|
|
9687
|
-
input: 0.
|
|
9688
|
-
output: 0.
|
|
9520
|
+
input: 0.1,
|
|
9521
|
+
output: 0.4,
|
|
9689
9522
|
cacheRead: 0.01,
|
|
9690
|
-
cacheWrite: 0.
|
|
9523
|
+
cacheWrite: 0.083333,
|
|
9691
9524
|
},
|
|
9692
9525
|
contextWindow: 1048576,
|
|
9693
9526
|
maxTokens: 65535,
|
|
@@ -9754,8 +9587,8 @@ export const MODELS = {
|
|
|
9754
9587
|
cost: {
|
|
9755
9588
|
input: 0.5,
|
|
9756
9589
|
output: 3,
|
|
9757
|
-
cacheRead: 0.
|
|
9758
|
-
cacheWrite: 0.
|
|
9590
|
+
cacheRead: 0.05,
|
|
9591
|
+
cacheWrite: 0.083333,
|
|
9759
9592
|
},
|
|
9760
9593
|
contextWindow: 1048576,
|
|
9761
9594
|
maxTokens: 65536,
|
|
@@ -9771,8 +9604,8 @@ export const MODELS = {
|
|
|
9771
9604
|
cost: {
|
|
9772
9605
|
input: 0.25,
|
|
9773
9606
|
output: 1.5,
|
|
9774
|
-
cacheRead: 0.
|
|
9775
|
-
cacheWrite: 0.
|
|
9607
|
+
cacheRead: 0.025,
|
|
9608
|
+
cacheWrite: 0.083333,
|
|
9776
9609
|
},
|
|
9777
9610
|
contextWindow: 1048576,
|
|
9778
9611
|
maxTokens: 65536,
|
|
@@ -9788,8 +9621,8 @@ export const MODELS = {
|
|
|
9788
9621
|
cost: {
|
|
9789
9622
|
input: 0.25,
|
|
9790
9623
|
output: 1.5,
|
|
9791
|
-
cacheRead: 0.
|
|
9792
|
-
cacheWrite: 0.
|
|
9624
|
+
cacheRead: 0.025,
|
|
9625
|
+
cacheWrite: 0.083333,
|
|
9793
9626
|
},
|
|
9794
9627
|
contextWindow: 1048576,
|
|
9795
9628
|
maxTokens: 65536,
|
|
@@ -9805,7 +9638,7 @@ export const MODELS = {
|
|
|
9805
9638
|
cost: {
|
|
9806
9639
|
input: 2,
|
|
9807
9640
|
output: 12,
|
|
9808
|
-
cacheRead: 0.
|
|
9641
|
+
cacheRead: 0.2,
|
|
9809
9642
|
cacheWrite: 0.375,
|
|
9810
9643
|
},
|
|
9811
9644
|
contextWindow: 1048576,
|
|
@@ -9822,7 +9655,7 @@ export const MODELS = {
|
|
|
9822
9655
|
cost: {
|
|
9823
9656
|
input: 2,
|
|
9824
9657
|
output: 12,
|
|
9825
|
-
cacheRead: 0.
|
|
9658
|
+
cacheRead: 0.2,
|
|
9826
9659
|
cacheWrite: 0.375,
|
|
9827
9660
|
},
|
|
9828
9661
|
contextWindow: 1048756,
|
|
@@ -9840,7 +9673,7 @@ export const MODELS = {
|
|
|
9840
9673
|
input: 1.5,
|
|
9841
9674
|
output: 9,
|
|
9842
9675
|
cacheRead: 0.15,
|
|
9843
|
-
cacheWrite: 0.
|
|
9676
|
+
cacheWrite: 0.083333,
|
|
9844
9677
|
},
|
|
9845
9678
|
contextWindow: 1048576,
|
|
9846
9679
|
maxTokens: 65536,
|
|
@@ -9854,7 +9687,7 @@ export const MODELS = {
|
|
|
9854
9687
|
reasoning: false,
|
|
9855
9688
|
input: ["text", "image"],
|
|
9856
9689
|
cost: {
|
|
9857
|
-
input: 0.
|
|
9690
|
+
input: 0.05,
|
|
9858
9691
|
output: 0.15,
|
|
9859
9692
|
cacheRead: 0,
|
|
9860
9693
|
cacheWrite: 0,
|
|
@@ -9923,12 +9756,12 @@ export const MODELS = {
|
|
|
9923
9756
|
input: ["text", "image"],
|
|
9924
9757
|
cost: {
|
|
9925
9758
|
input: 0.12,
|
|
9926
|
-
output: 0.
|
|
9759
|
+
output: 0.35,
|
|
9927
9760
|
cacheRead: 0.09,
|
|
9928
9761
|
cacheWrite: 0,
|
|
9929
9762
|
},
|
|
9930
9763
|
contextWindow: 262144,
|
|
9931
|
-
maxTokens:
|
|
9764
|
+
maxTokens: 262144,
|
|
9932
9765
|
},
|
|
9933
9766
|
"google/gemma-4-31b-it:free": {
|
|
9934
9767
|
id: "google/gemma-4-31b-it:free",
|
|
@@ -9956,9 +9789,9 @@ export const MODELS = {
|
|
|
9956
9789
|
reasoning: false,
|
|
9957
9790
|
input: ["text"],
|
|
9958
9791
|
cost: {
|
|
9959
|
-
input: 0.
|
|
9960
|
-
output: 0.
|
|
9961
|
-
cacheRead: 0.
|
|
9792
|
+
input: 0.05,
|
|
9793
|
+
output: 0.1,
|
|
9794
|
+
cacheRead: 0.05,
|
|
9962
9795
|
cacheWrite: 0,
|
|
9963
9796
|
},
|
|
9964
9797
|
contextWindow: 131072,
|
|
@@ -9976,7 +9809,7 @@ export const MODELS = {
|
|
|
9976
9809
|
cost: {
|
|
9977
9810
|
input: 0.25,
|
|
9978
9811
|
output: 0.75,
|
|
9979
|
-
cacheRead: 0.
|
|
9812
|
+
cacheRead: 0.025,
|
|
9980
9813
|
cacheWrite: 0,
|
|
9981
9814
|
},
|
|
9982
9815
|
contextWindow: 128000,
|
|
@@ -10059,8 +9892,8 @@ export const MODELS = {
|
|
|
10059
9892
|
reasoning: false,
|
|
10060
9893
|
input: ["text"],
|
|
10061
9894
|
cost: {
|
|
10062
|
-
input: 0.
|
|
10063
|
-
output: 0.
|
|
9895
|
+
input: 0.4,
|
|
9896
|
+
output: 0.4,
|
|
10064
9897
|
cacheRead: 0,
|
|
10065
9898
|
cacheWrite: 0,
|
|
10066
9899
|
},
|
|
@@ -10093,7 +9926,7 @@ export const MODELS = {
|
|
|
10093
9926
|
reasoning: false,
|
|
10094
9927
|
input: ["text"],
|
|
10095
9928
|
cost: {
|
|
10096
|
-
input: 0.
|
|
9929
|
+
input: 0.1,
|
|
10097
9930
|
output: 0.32,
|
|
10098
9931
|
cacheRead: 0,
|
|
10099
9932
|
cacheWrite: 0,
|
|
@@ -10144,7 +9977,7 @@ export const MODELS = {
|
|
|
10144
9977
|
reasoning: false,
|
|
10145
9978
|
input: ["text", "image"],
|
|
10146
9979
|
cost: {
|
|
10147
|
-
input: 0.
|
|
9980
|
+
input: 0.1,
|
|
10148
9981
|
output: 0.3,
|
|
10149
9982
|
cacheRead: 0,
|
|
10150
9983
|
cacheWrite: 0,
|
|
@@ -10161,7 +9994,7 @@ export const MODELS = {
|
|
|
10161
9994
|
reasoning: true,
|
|
10162
9995
|
input: ["text"],
|
|
10163
9996
|
cost: {
|
|
10164
|
-
input: 0.
|
|
9997
|
+
input: 0.4,
|
|
10165
9998
|
output: 2.2,
|
|
10166
9999
|
cacheRead: 0,
|
|
10167
10000
|
cacheWrite: 0,
|
|
@@ -10213,8 +10046,8 @@ export const MODELS = {
|
|
|
10213
10046
|
input: ["text"],
|
|
10214
10047
|
cost: {
|
|
10215
10048
|
input: 0.15,
|
|
10216
|
-
output: 0.
|
|
10217
|
-
cacheRead: 0.
|
|
10049
|
+
output: 0.9,
|
|
10050
|
+
cacheRead: 0.05,
|
|
10218
10051
|
cacheWrite: 0,
|
|
10219
10052
|
},
|
|
10220
10053
|
contextWindow: 204800,
|
|
@@ -10229,9 +10062,9 @@ export const MODELS = {
|
|
|
10229
10062
|
reasoning: true,
|
|
10230
10063
|
input: ["text"],
|
|
10231
10064
|
cost: {
|
|
10232
|
-
input: 0.
|
|
10233
|
-
output: 1
|
|
10234
|
-
cacheRead: 0.
|
|
10065
|
+
input: 0.25,
|
|
10066
|
+
output: 1,
|
|
10067
|
+
cacheRead: 0.05,
|
|
10235
10068
|
cacheWrite: 0,
|
|
10236
10069
|
},
|
|
10237
10070
|
contextWindow: 204800,
|
|
@@ -10264,7 +10097,7 @@ export const MODELS = {
|
|
|
10264
10097
|
input: ["text"],
|
|
10265
10098
|
cost: {
|
|
10266
10099
|
input: 0.3,
|
|
10267
|
-
output: 0.
|
|
10100
|
+
output: 0.9,
|
|
10268
10101
|
cacheRead: 0.03,
|
|
10269
10102
|
cacheWrite: 0,
|
|
10270
10103
|
},
|
|
@@ -10280,7 +10113,7 @@ export const MODELS = {
|
|
|
10280
10113
|
reasoning: false,
|
|
10281
10114
|
input: ["text"],
|
|
10282
10115
|
cost: {
|
|
10283
|
-
input: 0.
|
|
10116
|
+
input: 0.4,
|
|
10284
10117
|
output: 2,
|
|
10285
10118
|
cacheRead: 0.04,
|
|
10286
10119
|
cacheWrite: 0,
|
|
@@ -10297,8 +10130,8 @@ export const MODELS = {
|
|
|
10297
10130
|
reasoning: false,
|
|
10298
10131
|
input: ["text", "image"],
|
|
10299
10132
|
cost: {
|
|
10300
|
-
input: 0.
|
|
10301
|
-
output: 0.
|
|
10133
|
+
input: 0.2,
|
|
10134
|
+
output: 0.2,
|
|
10302
10135
|
cacheRead: 0.02,
|
|
10303
10136
|
cacheWrite: 0,
|
|
10304
10137
|
},
|
|
@@ -10314,8 +10147,8 @@ export const MODELS = {
|
|
|
10314
10147
|
reasoning: false,
|
|
10315
10148
|
input: ["text", "image"],
|
|
10316
10149
|
cost: {
|
|
10317
|
-
input: 0.
|
|
10318
|
-
output: 0.
|
|
10150
|
+
input: 0.1,
|
|
10151
|
+
output: 0.1,
|
|
10319
10152
|
cacheRead: 0.01,
|
|
10320
10153
|
cacheWrite: 0,
|
|
10321
10154
|
},
|
|
@@ -10350,7 +10183,7 @@ export const MODELS = {
|
|
|
10350
10183
|
cost: {
|
|
10351
10184
|
input: 2,
|
|
10352
10185
|
output: 6,
|
|
10353
|
-
cacheRead: 0.
|
|
10186
|
+
cacheRead: 0.2,
|
|
10354
10187
|
cacheWrite: 0,
|
|
10355
10188
|
},
|
|
10356
10189
|
contextWindow: 128000,
|
|
@@ -10367,7 +10200,7 @@ export const MODELS = {
|
|
|
10367
10200
|
cost: {
|
|
10368
10201
|
input: 2,
|
|
10369
10202
|
output: 6,
|
|
10370
|
-
cacheRead: 0.
|
|
10203
|
+
cacheRead: 0.2,
|
|
10371
10204
|
cacheWrite: 0,
|
|
10372
10205
|
},
|
|
10373
10206
|
contextWindow: 131072,
|
|
@@ -10384,7 +10217,7 @@ export const MODELS = {
|
|
|
10384
10217
|
cost: {
|
|
10385
10218
|
input: 0.5,
|
|
10386
10219
|
output: 1.5,
|
|
10387
|
-
cacheRead: 0.
|
|
10220
|
+
cacheRead: 0.05,
|
|
10388
10221
|
cacheWrite: 0,
|
|
10389
10222
|
},
|
|
10390
10223
|
contextWindow: 262144,
|
|
@@ -10399,7 +10232,7 @@ export const MODELS = {
|
|
|
10399
10232
|
reasoning: false,
|
|
10400
10233
|
input: ["text", "image"],
|
|
10401
10234
|
cost: {
|
|
10402
|
-
input: 0.
|
|
10235
|
+
input: 0.4,
|
|
10403
10236
|
output: 2,
|
|
10404
10237
|
cacheRead: 0.04,
|
|
10405
10238
|
cacheWrite: 0,
|
|
@@ -10433,7 +10266,7 @@ export const MODELS = {
|
|
|
10433
10266
|
reasoning: false,
|
|
10434
10267
|
input: ["text", "image"],
|
|
10435
10268
|
cost: {
|
|
10436
|
-
input: 0.
|
|
10269
|
+
input: 0.4,
|
|
10437
10270
|
output: 2,
|
|
10438
10271
|
cacheRead: 0.04,
|
|
10439
10272
|
cacheWrite: 0,
|
|
@@ -10467,7 +10300,7 @@ export const MODELS = {
|
|
|
10467
10300
|
reasoning: false,
|
|
10468
10301
|
input: ["text"],
|
|
10469
10302
|
cost: {
|
|
10470
|
-
input: 0.
|
|
10303
|
+
input: 0.2,
|
|
10471
10304
|
output: 0.6,
|
|
10472
10305
|
cacheRead: 0.02,
|
|
10473
10306
|
cacheWrite: 0,
|
|
@@ -10502,7 +10335,7 @@ export const MODELS = {
|
|
|
10502
10335
|
input: ["text", "image"],
|
|
10503
10336
|
cost: {
|
|
10504
10337
|
input: 0.075,
|
|
10505
|
-
output: 0.
|
|
10338
|
+
output: 0.2,
|
|
10506
10339
|
cacheRead: 0,
|
|
10507
10340
|
cacheWrite: 0,
|
|
10508
10341
|
},
|
|
@@ -10520,7 +10353,7 @@ export const MODELS = {
|
|
|
10520
10353
|
cost: {
|
|
10521
10354
|
input: 2,
|
|
10522
10355
|
output: 6,
|
|
10523
|
-
cacheRead: 0.
|
|
10356
|
+
cacheRead: 0.2,
|
|
10524
10357
|
cacheWrite: 0,
|
|
10525
10358
|
},
|
|
10526
10359
|
contextWindow: 65536,
|
|
@@ -10535,7 +10368,7 @@ export const MODELS = {
|
|
|
10535
10368
|
reasoning: false,
|
|
10536
10369
|
input: ["text"],
|
|
10537
10370
|
cost: {
|
|
10538
|
-
input: 0.
|
|
10371
|
+
input: 0.1,
|
|
10539
10372
|
output: 0.3,
|
|
10540
10373
|
cacheRead: 0.01,
|
|
10541
10374
|
cacheWrite: 0,
|
|
@@ -10552,7 +10385,7 @@ export const MODELS = {
|
|
|
10552
10385
|
reasoning: false,
|
|
10553
10386
|
input: ["text"],
|
|
10554
10387
|
cost: {
|
|
10555
|
-
input: 0.
|
|
10388
|
+
input: 0.57,
|
|
10556
10389
|
output: 2.3,
|
|
10557
10390
|
cacheRead: 0,
|
|
10558
10391
|
cacheWrite: 0,
|
|
@@ -10621,27 +10454,26 @@ export const MODELS = {
|
|
|
10621
10454
|
reasoning: true,
|
|
10622
10455
|
input: ["text", "image"],
|
|
10623
10456
|
cost: {
|
|
10624
|
-
input: 0.
|
|
10457
|
+
input: 0.68,
|
|
10625
10458
|
output: 3.41,
|
|
10626
|
-
cacheRead: 0.
|
|
10459
|
+
cacheRead: 0.34,
|
|
10627
10460
|
cacheWrite: 0,
|
|
10628
10461
|
},
|
|
10629
10462
|
contextWindow: 262144,
|
|
10630
10463
|
maxTokens: 262142,
|
|
10631
10464
|
},
|
|
10632
|
-
"moonshotai/kimi-k2.
|
|
10633
|
-
id: "moonshotai/kimi-k2.
|
|
10634
|
-
name: "MoonshotAI: Kimi K2.
|
|
10465
|
+
"moonshotai/kimi-k2.7-code": {
|
|
10466
|
+
id: "moonshotai/kimi-k2.7-code",
|
|
10467
|
+
name: "MoonshotAI: Kimi K2.7 Code",
|
|
10635
10468
|
api: "openai-completions",
|
|
10636
10469
|
provider: "openrouter",
|
|
10637
10470
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
10638
|
-
compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
|
|
10639
10471
|
reasoning: true,
|
|
10640
10472
|
input: ["text", "image"],
|
|
10641
10473
|
cost: {
|
|
10642
|
-
input: 0,
|
|
10643
|
-
output:
|
|
10644
|
-
cacheRead: 0,
|
|
10474
|
+
input: 0.95,
|
|
10475
|
+
output: 4,
|
|
10476
|
+
cacheRead: 0.19,
|
|
10645
10477
|
cacheWrite: 0,
|
|
10646
10478
|
},
|
|
10647
10479
|
contextWindow: 262144,
|
|
@@ -10673,8 +10505,8 @@ export const MODELS = {
|
|
|
10673
10505
|
reasoning: true,
|
|
10674
10506
|
input: ["text"],
|
|
10675
10507
|
cost: {
|
|
10676
|
-
input: 0.
|
|
10677
|
-
output: 0.
|
|
10508
|
+
input: 0.4,
|
|
10509
|
+
output: 0.4,
|
|
10678
10510
|
cacheRead: 0,
|
|
10679
10511
|
cacheWrite: 0,
|
|
10680
10512
|
},
|
|
@@ -10690,8 +10522,8 @@ export const MODELS = {
|
|
|
10690
10522
|
reasoning: true,
|
|
10691
10523
|
input: ["text"],
|
|
10692
10524
|
cost: {
|
|
10693
|
-
input: 0.
|
|
10694
|
-
output: 0.
|
|
10525
|
+
input: 0.05,
|
|
10526
|
+
output: 0.2,
|
|
10695
10527
|
cacheRead: 0,
|
|
10696
10528
|
cacheWrite: 0,
|
|
10697
10529
|
},
|
|
@@ -10742,7 +10574,7 @@ export const MODELS = {
|
|
|
10742
10574
|
input: ["text"],
|
|
10743
10575
|
cost: {
|
|
10744
10576
|
input: 0.09,
|
|
10745
|
-
output: 0.
|
|
10577
|
+
output: 0.45,
|
|
10746
10578
|
cacheRead: 0,
|
|
10747
10579
|
cacheWrite: 0,
|
|
10748
10580
|
},
|
|
@@ -10817,23 +10649,6 @@ export const MODELS = {
|
|
|
10817
10649
|
contextWindow: 128000,
|
|
10818
10650
|
maxTokens: 128000,
|
|
10819
10651
|
},
|
|
10820
|
-
"nvidia/nemotron-nano-9b-v2": {
|
|
10821
|
-
id: "nvidia/nemotron-nano-9b-v2",
|
|
10822
|
-
name: "NVIDIA: Nemotron Nano 9B V2",
|
|
10823
|
-
api: "openai-completions",
|
|
10824
|
-
provider: "openrouter",
|
|
10825
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
10826
|
-
reasoning: true,
|
|
10827
|
-
input: ["text"],
|
|
10828
|
-
cost: {
|
|
10829
|
-
input: 0.04,
|
|
10830
|
-
output: 0.16,
|
|
10831
|
-
cacheRead: 0,
|
|
10832
|
-
cacheWrite: 0,
|
|
10833
|
-
},
|
|
10834
|
-
contextWindow: 131072,
|
|
10835
|
-
maxTokens: 16384,
|
|
10836
|
-
},
|
|
10837
10652
|
"nvidia/nemotron-nano-9b-v2:free": {
|
|
10838
10653
|
id: "nvidia/nemotron-nano-9b-v2:free",
|
|
10839
10654
|
name: "NVIDIA: Nemotron Nano 9B V2 (free)",
|
|
@@ -10979,9 +10794,9 @@ export const MODELS = {
|
|
|
10979
10794
|
reasoning: false,
|
|
10980
10795
|
input: ["text", "image"],
|
|
10981
10796
|
cost: {
|
|
10982
|
-
input: 0.
|
|
10983
|
-
output: 1.
|
|
10984
|
-
cacheRead: 0.
|
|
10797
|
+
input: 0.4,
|
|
10798
|
+
output: 1.6,
|
|
10799
|
+
cacheRead: 0.1,
|
|
10985
10800
|
cacheWrite: 0,
|
|
10986
10801
|
},
|
|
10987
10802
|
contextWindow: 1047576,
|
|
@@ -10996,9 +10811,9 @@ export const MODELS = {
|
|
|
10996
10811
|
reasoning: false,
|
|
10997
10812
|
input: ["text", "image"],
|
|
10998
10813
|
cost: {
|
|
10999
|
-
input: 0.
|
|
11000
|
-
output: 0.
|
|
11001
|
-
cacheRead: 0.
|
|
10814
|
+
input: 0.1,
|
|
10815
|
+
output: 0.4,
|
|
10816
|
+
cacheRead: 0.025,
|
|
11002
10817
|
cacheWrite: 0,
|
|
11003
10818
|
},
|
|
11004
10819
|
contextWindow: 1047576,
|
|
@@ -11151,7 +10966,7 @@ export const MODELS = {
|
|
|
11151
10966
|
cost: {
|
|
11152
10967
|
input: 0.25,
|
|
11153
10968
|
output: 2,
|
|
11154
|
-
cacheRead: 0.
|
|
10969
|
+
cacheRead: 0.025,
|
|
11155
10970
|
cacheWrite: 0,
|
|
11156
10971
|
},
|
|
11157
10972
|
contextWindow: 400000,
|
|
@@ -11166,8 +10981,8 @@ export const MODELS = {
|
|
|
11166
10981
|
reasoning: true,
|
|
11167
10982
|
input: ["text", "image"],
|
|
11168
10983
|
cost: {
|
|
11169
|
-
input: 0.
|
|
11170
|
-
output: 0.
|
|
10984
|
+
input: 0.05,
|
|
10985
|
+
output: 0.4,
|
|
11171
10986
|
cacheRead: 0.01,
|
|
11172
10987
|
cacheWrite: 0,
|
|
11173
10988
|
},
|
|
@@ -11270,7 +11085,7 @@ export const MODELS = {
|
|
|
11270
11085
|
cost: {
|
|
11271
11086
|
input: 0.25,
|
|
11272
11087
|
output: 2,
|
|
11273
|
-
cacheRead: 0.
|
|
11088
|
+
cacheRead: 0.025,
|
|
11274
11089
|
cacheWrite: 0,
|
|
11275
11090
|
},
|
|
11276
11091
|
contextWindow: 400000,
|
|
@@ -11430,7 +11245,7 @@ export const MODELS = {
|
|
|
11430
11245
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
11431
11246
|
input: ["text", "image"],
|
|
11432
11247
|
cost: {
|
|
11433
|
-
input: 0.
|
|
11248
|
+
input: 0.2,
|
|
11434
11249
|
output: 1.25,
|
|
11435
11250
|
cacheRead: 0.02,
|
|
11436
11251
|
cacheWrite: 0,
|
|
@@ -11875,7 +11690,7 @@ export const MODELS = {
|
|
|
11875
11690
|
reasoning: true,
|
|
11876
11691
|
input: ["text"],
|
|
11877
11692
|
cost: {
|
|
11878
|
-
input: 0.
|
|
11693
|
+
input: 0.2,
|
|
11879
11694
|
output: 1.1,
|
|
11880
11695
|
cacheRead: 0,
|
|
11881
11696
|
cacheWrite: 0,
|
|
@@ -11893,7 +11708,7 @@ export const MODELS = {
|
|
|
11893
11708
|
input: ["text"],
|
|
11894
11709
|
cost: {
|
|
11895
11710
|
input: 0.36,
|
|
11896
|
-
output: 0.
|
|
11711
|
+
output: 0.4,
|
|
11897
11712
|
cacheRead: 0,
|
|
11898
11713
|
cacheWrite: 0,
|
|
11899
11714
|
},
|
|
@@ -11911,7 +11726,7 @@ export const MODELS = {
|
|
|
11911
11726
|
cost: {
|
|
11912
11727
|
input: 0.26,
|
|
11913
11728
|
output: 0.78,
|
|
11914
|
-
cacheRead: 0.
|
|
11729
|
+
cacheRead: 0.052,
|
|
11915
11730
|
cacheWrite: 0.325,
|
|
11916
11731
|
},
|
|
11917
11732
|
contextWindow: 1000000,
|
|
@@ -11960,7 +11775,7 @@ export const MODELS = {
|
|
|
11960
11775
|
reasoning: true,
|
|
11961
11776
|
input: ["text"],
|
|
11962
11777
|
cost: {
|
|
11963
|
-
input: 0.
|
|
11778
|
+
input: 0.1,
|
|
11964
11779
|
output: 0.24,
|
|
11965
11780
|
cacheRead: 0,
|
|
11966
11781
|
cacheWrite: 0,
|
|
@@ -11977,8 +11792,8 @@ export const MODELS = {
|
|
|
11977
11792
|
reasoning: true,
|
|
11978
11793
|
input: ["text"],
|
|
11979
11794
|
cost: {
|
|
11980
|
-
input: 0.
|
|
11981
|
-
output: 1.
|
|
11795
|
+
input: 0.455,
|
|
11796
|
+
output: 1.82,
|
|
11982
11797
|
cacheRead: 0,
|
|
11983
11798
|
cacheWrite: 0,
|
|
11984
11799
|
},
|
|
@@ -11995,7 +11810,7 @@ export const MODELS = {
|
|
|
11995
11810
|
input: ["text"],
|
|
11996
11811
|
cost: {
|
|
11997
11812
|
input: 0.09,
|
|
11998
|
-
output: 0.
|
|
11813
|
+
output: 0.1,
|
|
11999
11814
|
cacheRead: 0,
|
|
12000
11815
|
cacheWrite: 0,
|
|
12001
11816
|
},
|
|
@@ -12011,9 +11826,9 @@ export const MODELS = {
|
|
|
12011
11826
|
reasoning: true,
|
|
12012
11827
|
input: ["text"],
|
|
12013
11828
|
cost: {
|
|
12014
|
-
input: 0.
|
|
12015
|
-
output: 0.
|
|
12016
|
-
cacheRead: 0.
|
|
11829
|
+
input: 0.1,
|
|
11830
|
+
output: 0.1,
|
|
11831
|
+
cacheRead: 0.1,
|
|
12017
11832
|
cacheWrite: 0,
|
|
12018
11833
|
},
|
|
12019
11834
|
contextWindow: 262144,
|
|
@@ -12063,7 +11878,7 @@ export const MODELS = {
|
|
|
12063
11878
|
input: ["text"],
|
|
12064
11879
|
cost: {
|
|
12065
11880
|
input: 0.08,
|
|
12066
|
-
output: 0.
|
|
11881
|
+
output: 0.4,
|
|
12067
11882
|
cacheRead: 0.08,
|
|
12068
11883
|
cacheWrite: 0,
|
|
12069
11884
|
},
|
|
@@ -12096,9 +11911,9 @@ export const MODELS = {
|
|
|
12096
11911
|
reasoning: true,
|
|
12097
11912
|
input: ["text"],
|
|
12098
11913
|
cost: {
|
|
12099
|
-
input: 0.
|
|
12100
|
-
output: 0.
|
|
12101
|
-
cacheRead: 0.
|
|
11914
|
+
input: 0.05,
|
|
11915
|
+
output: 0.4,
|
|
11916
|
+
cacheRead: 0.05,
|
|
12102
11917
|
cacheWrite: 0,
|
|
12103
11918
|
},
|
|
12104
11919
|
contextWindow: 131072,
|
|
@@ -12114,7 +11929,7 @@ export const MODELS = {
|
|
|
12114
11929
|
input: ["text"],
|
|
12115
11930
|
cost: {
|
|
12116
11931
|
input: 0.22,
|
|
12117
|
-
output: 1.
|
|
11932
|
+
output: 1.8,
|
|
12118
11933
|
cacheRead: 0,
|
|
12119
11934
|
cacheWrite: 0,
|
|
12120
11935
|
},
|
|
@@ -12165,7 +11980,7 @@ export const MODELS = {
|
|
|
12165
11980
|
input: ["text"],
|
|
12166
11981
|
cost: {
|
|
12167
11982
|
input: 0.11,
|
|
12168
|
-
output: 0.
|
|
11983
|
+
output: 0.8,
|
|
12169
11984
|
cacheRead: 0.07,
|
|
12170
11985
|
cacheWrite: 0,
|
|
12171
11986
|
},
|
|
@@ -12300,7 +12115,7 @@ export const MODELS = {
|
|
|
12300
12115
|
reasoning: false,
|
|
12301
12116
|
input: ["text", "image"],
|
|
12302
12117
|
cost: {
|
|
12303
|
-
input: 0.
|
|
12118
|
+
input: 0.2,
|
|
12304
12119
|
output: 0.88,
|
|
12305
12120
|
cacheRead: 0.11,
|
|
12306
12121
|
cacheWrite: 0,
|
|
@@ -12368,8 +12183,8 @@ export const MODELS = {
|
|
|
12368
12183
|
reasoning: false,
|
|
12369
12184
|
input: ["text", "image"],
|
|
12370
12185
|
cost: {
|
|
12371
|
-
input: 0.
|
|
12372
|
-
output: 0.
|
|
12186
|
+
input: 0.104,
|
|
12187
|
+
output: 0.416,
|
|
12373
12188
|
cacheRead: 0,
|
|
12374
12189
|
cacheWrite: 0,
|
|
12375
12190
|
},
|
|
@@ -12455,7 +12270,7 @@ export const MODELS = {
|
|
|
12455
12270
|
cost: {
|
|
12456
12271
|
input: 0.14,
|
|
12457
12272
|
output: 1,
|
|
12458
|
-
cacheRead: 0.
|
|
12273
|
+
cacheRead: 0.05,
|
|
12459
12274
|
cacheWrite: 0,
|
|
12460
12275
|
},
|
|
12461
12276
|
contextWindow: 262144,
|
|
@@ -12487,7 +12302,7 @@ export const MODELS = {
|
|
|
12487
12302
|
reasoning: true,
|
|
12488
12303
|
input: ["text", "image"],
|
|
12489
12304
|
cost: {
|
|
12490
|
-
input: 0.
|
|
12305
|
+
input: 0.1,
|
|
12491
12306
|
output: 0.15,
|
|
12492
12307
|
cacheRead: 0,
|
|
12493
12308
|
cacheWrite: 0,
|
|
@@ -12539,7 +12354,7 @@ export const MODELS = {
|
|
|
12539
12354
|
input: ["text", "image"],
|
|
12540
12355
|
cost: {
|
|
12541
12356
|
input: 0.3,
|
|
12542
|
-
output: 1.
|
|
12357
|
+
output: 1.8,
|
|
12543
12358
|
cacheRead: 0,
|
|
12544
12359
|
cacheWrite: 0.375,
|
|
12545
12360
|
},
|
|
@@ -12555,13 +12370,13 @@ export const MODELS = {
|
|
|
12555
12370
|
reasoning: true,
|
|
12556
12371
|
input: ["text", "image"],
|
|
12557
12372
|
cost: {
|
|
12558
|
-
input: 0.
|
|
12559
|
-
output:
|
|
12373
|
+
input: 0.2885,
|
|
12374
|
+
output: 3.17,
|
|
12560
12375
|
cacheRead: 0,
|
|
12561
12376
|
cacheWrite: 0,
|
|
12562
12377
|
},
|
|
12563
12378
|
contextWindow: 262144,
|
|
12564
|
-
maxTokens:
|
|
12379
|
+
maxTokens: 262140,
|
|
12565
12380
|
},
|
|
12566
12381
|
"qwen/qwen3.6-35b-a3b": {
|
|
12567
12382
|
id: "qwen/qwen3.6-35b-a3b",
|
|
@@ -12572,13 +12387,13 @@ export const MODELS = {
|
|
|
12572
12387
|
reasoning: true,
|
|
12573
12388
|
input: ["text", "image"],
|
|
12574
12389
|
cost: {
|
|
12575
|
-
input: 0.
|
|
12390
|
+
input: 0.15,
|
|
12576
12391
|
output: 1,
|
|
12577
|
-
cacheRead: 0,
|
|
12392
|
+
cacheRead: 0.05,
|
|
12578
12393
|
cacheWrite: 0,
|
|
12579
12394
|
},
|
|
12580
12395
|
contextWindow: 262144,
|
|
12581
|
-
maxTokens:
|
|
12396
|
+
maxTokens: 262144,
|
|
12582
12397
|
},
|
|
12583
12398
|
"qwen/qwen3.6-flash": {
|
|
12584
12399
|
id: "qwen/qwen3.6-flash",
|
|
@@ -12657,10 +12472,10 @@ export const MODELS = {
|
|
|
12657
12472
|
reasoning: true,
|
|
12658
12473
|
input: ["text", "image"],
|
|
12659
12474
|
cost: {
|
|
12660
|
-
input: 0.
|
|
12661
|
-
output: 1.
|
|
12662
|
-
cacheRead: 0.
|
|
12663
|
-
cacheWrite: 0.
|
|
12475
|
+
input: 0.32,
|
|
12476
|
+
output: 1.28,
|
|
12477
|
+
cacheRead: 0.064,
|
|
12478
|
+
cacheWrite: 0.4,
|
|
12664
12479
|
},
|
|
12665
12480
|
contextWindow: 1000000,
|
|
12666
12481
|
maxTokens: 65536,
|
|
@@ -12674,8 +12489,8 @@ export const MODELS = {
|
|
|
12674
12489
|
reasoning: false,
|
|
12675
12490
|
input: ["text", "image"],
|
|
12676
12491
|
cost: {
|
|
12677
|
-
input: 0.
|
|
12678
|
-
output: 0.
|
|
12492
|
+
input: 0.1,
|
|
12493
|
+
output: 0.1,
|
|
12679
12494
|
cacheRead: 0,
|
|
12680
12495
|
cacheWrite: 0,
|
|
12681
12496
|
},
|
|
@@ -12742,7 +12557,7 @@ export const MODELS = {
|
|
|
12742
12557
|
reasoning: true,
|
|
12743
12558
|
input: ["text", "image"],
|
|
12744
12559
|
cost: {
|
|
12745
|
-
input: 0.
|
|
12560
|
+
input: 0.2,
|
|
12746
12561
|
output: 1.15,
|
|
12747
12562
|
cacheRead: 0.04,
|
|
12748
12563
|
cacheWrite: 0,
|
|
@@ -12761,7 +12576,7 @@ export const MODELS = {
|
|
|
12761
12576
|
cost: {
|
|
12762
12577
|
input: 0.063,
|
|
12763
12578
|
output: 0.21,
|
|
12764
|
-
cacheRead: 0.
|
|
12579
|
+
cacheRead: 0.021,
|
|
12765
12580
|
cacheWrite: 0,
|
|
12766
12581
|
},
|
|
12767
12582
|
contextWindow: 262144,
|
|
@@ -12776,7 +12591,7 @@ export const MODELS = {
|
|
|
12776
12591
|
reasoning: false,
|
|
12777
12592
|
input: ["text"],
|
|
12778
12593
|
cost: {
|
|
12779
|
-
input: 0.
|
|
12594
|
+
input: 0.17,
|
|
12780
12595
|
output: 0.43,
|
|
12781
12596
|
cacheRead: 0,
|
|
12782
12597
|
cacheWrite: 0,
|
|
@@ -12793,8 +12608,8 @@ export const MODELS = {
|
|
|
12793
12608
|
reasoning: false,
|
|
12794
12609
|
input: ["text"],
|
|
12795
12610
|
cost: {
|
|
12796
|
-
input: 0.
|
|
12797
|
-
output: 0.
|
|
12611
|
+
input: 0.4,
|
|
12612
|
+
output: 0.4,
|
|
12798
12613
|
cacheRead: 0,
|
|
12799
12614
|
cacheWrite: 0,
|
|
12800
12615
|
},
|
|
@@ -12829,7 +12644,7 @@ export const MODELS = {
|
|
|
12829
12644
|
cost: {
|
|
12830
12645
|
input: 1.25,
|
|
12831
12646
|
output: 2.5,
|
|
12832
|
-
cacheRead: 0.
|
|
12647
|
+
cacheRead: 0.2,
|
|
12833
12648
|
cacheWrite: 0,
|
|
12834
12649
|
},
|
|
12835
12650
|
contextWindow: 2000000,
|
|
@@ -12846,7 +12661,7 @@ export const MODELS = {
|
|
|
12846
12661
|
cost: {
|
|
12847
12662
|
input: 1.25,
|
|
12848
12663
|
output: 2.5,
|
|
12849
|
-
cacheRead: 0.
|
|
12664
|
+
cacheRead: 0.2,
|
|
12850
12665
|
cacheWrite: 0,
|
|
12851
12666
|
},
|
|
12852
12667
|
contextWindow: 1000000,
|
|
@@ -12863,7 +12678,7 @@ export const MODELS = {
|
|
|
12863
12678
|
cost: {
|
|
12864
12679
|
input: 1,
|
|
12865
12680
|
output: 2,
|
|
12866
|
-
cacheRead: 0.
|
|
12681
|
+
cacheRead: 0.2,
|
|
12867
12682
|
cacheWrite: 0,
|
|
12868
12683
|
},
|
|
12869
12684
|
contextWindow: 256000,
|
|
@@ -12878,7 +12693,7 @@ export const MODELS = {
|
|
|
12878
12693
|
reasoning: true,
|
|
12879
12694
|
input: ["text"],
|
|
12880
12695
|
cost: {
|
|
12881
|
-
input: 0.
|
|
12696
|
+
input: 0.1,
|
|
12882
12697
|
output: 0.3,
|
|
12883
12698
|
cacheRead: 0.01,
|
|
12884
12699
|
cacheWrite: 0,
|
|
@@ -12920,23 +12735,6 @@ export const MODELS = {
|
|
|
12920
12735
|
contextWindow: 1048576,
|
|
12921
12736
|
maxTokens: 131072,
|
|
12922
12737
|
},
|
|
12923
|
-
"z-ai/glm-4-32b": {
|
|
12924
|
-
id: "z-ai/glm-4-32b",
|
|
12925
|
-
name: "Z.ai: GLM 4 32B ",
|
|
12926
|
-
api: "openai-completions",
|
|
12927
|
-
provider: "openrouter",
|
|
12928
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12929
|
-
reasoning: false,
|
|
12930
|
-
input: ["text"],
|
|
12931
|
-
cost: {
|
|
12932
|
-
input: 0.09999999999999999,
|
|
12933
|
-
output: 0.09999999999999999,
|
|
12934
|
-
cacheRead: 0,
|
|
12935
|
-
cacheWrite: 0,
|
|
12936
|
-
},
|
|
12937
|
-
contextWindow: 128000,
|
|
12938
|
-
maxTokens: 4096,
|
|
12939
|
-
},
|
|
12940
12738
|
"z-ai/glm-4.5": {
|
|
12941
12739
|
id: "z-ai/glm-4.5",
|
|
12942
12740
|
name: "Z.ai: GLM 4.5",
|
|
@@ -12971,23 +12769,6 @@ export const MODELS = {
|
|
|
12971
12769
|
contextWindow: 131072,
|
|
12972
12770
|
maxTokens: 131070,
|
|
12973
12771
|
},
|
|
12974
|
-
"z-ai/glm-4.5-air:free": {
|
|
12975
|
-
id: "z-ai/glm-4.5-air:free",
|
|
12976
|
-
name: "Z.ai: GLM 4.5 Air (free)",
|
|
12977
|
-
api: "openai-completions",
|
|
12978
|
-
provider: "openrouter",
|
|
12979
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12980
|
-
reasoning: true,
|
|
12981
|
-
input: ["text"],
|
|
12982
|
-
cost: {
|
|
12983
|
-
input: 0,
|
|
12984
|
-
output: 0,
|
|
12985
|
-
cacheRead: 0,
|
|
12986
|
-
cacheWrite: 0,
|
|
12987
|
-
},
|
|
12988
|
-
contextWindow: 131072,
|
|
12989
|
-
maxTokens: 96000,
|
|
12990
|
-
},
|
|
12991
12772
|
"z-ai/glm-4.5v": {
|
|
12992
12773
|
id: "z-ai/glm-4.5v",
|
|
12993
12774
|
name: "Z.ai: GLM 4.5V",
|
|
@@ -12998,7 +12779,7 @@ export const MODELS = {
|
|
|
12998
12779
|
input: ["text", "image"],
|
|
12999
12780
|
cost: {
|
|
13000
12781
|
input: 0.6,
|
|
13001
|
-
output: 1.
|
|
12782
|
+
output: 1.8,
|
|
13002
12783
|
cacheRead: 0.11,
|
|
13003
12784
|
cacheWrite: 0,
|
|
13004
12785
|
},
|
|
@@ -13032,12 +12813,12 @@ export const MODELS = {
|
|
|
13032
12813
|
input: ["text", "image"],
|
|
13033
12814
|
cost: {
|
|
13034
12815
|
input: 0.3,
|
|
13035
|
-
output: 0.
|
|
13036
|
-
cacheRead: 0.
|
|
12816
|
+
output: 0.9,
|
|
12817
|
+
cacheRead: 0.055,
|
|
13037
12818
|
cacheWrite: 0,
|
|
13038
12819
|
},
|
|
13039
12820
|
contextWindow: 131072,
|
|
13040
|
-
maxTokens:
|
|
12821
|
+
maxTokens: 32768,
|
|
13041
12822
|
},
|
|
13042
12823
|
"z-ai/glm-4.7": {
|
|
13043
12824
|
id: "z-ai/glm-4.7",
|
|
@@ -13048,7 +12829,7 @@ export const MODELS = {
|
|
|
13048
12829
|
reasoning: true,
|
|
13049
12830
|
input: ["text"],
|
|
13050
12831
|
cost: {
|
|
13051
|
-
input: 0.
|
|
12832
|
+
input: 0.4,
|
|
13052
12833
|
output: 1.75,
|
|
13053
12834
|
cacheRead: 0.08,
|
|
13054
12835
|
cacheWrite: 0,
|
|
@@ -13066,7 +12847,7 @@ export const MODELS = {
|
|
|
13066
12847
|
input: ["text"],
|
|
13067
12848
|
cost: {
|
|
13068
12849
|
input: 0.06,
|
|
13069
|
-
output: 0.
|
|
12850
|
+
output: 0.4,
|
|
13070
12851
|
cacheRead: 0.01,
|
|
13071
12852
|
cacheWrite: 0,
|
|
13072
12853
|
},
|
|
@@ -13104,7 +12885,7 @@ export const MODELS = {
|
|
|
13104
12885
|
cacheRead: 0.24,
|
|
13105
12886
|
cacheWrite: 0,
|
|
13106
12887
|
},
|
|
13107
|
-
contextWindow:
|
|
12888
|
+
contextWindow: 262144,
|
|
13108
12889
|
maxTokens: 131072,
|
|
13109
12890
|
},
|
|
13110
12891
|
"z-ai/glm-5.1": {
|
|
@@ -13124,23 +12905,6 @@ export const MODELS = {
|
|
|
13124
12905
|
contextWindow: 202752,
|
|
13125
12906
|
maxTokens: 4096,
|
|
13126
12907
|
},
|
|
13127
|
-
"z-ai/glm-5v-turbo": {
|
|
13128
|
-
id: "z-ai/glm-5v-turbo",
|
|
13129
|
-
name: "Z.ai: GLM 5V Turbo",
|
|
13130
|
-
api: "openai-completions",
|
|
13131
|
-
provider: "openrouter",
|
|
13132
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
13133
|
-
reasoning: true,
|
|
13134
|
-
input: ["text", "image"],
|
|
13135
|
-
cost: {
|
|
13136
|
-
input: 1.2,
|
|
13137
|
-
output: 4,
|
|
13138
|
-
cacheRead: 0.24,
|
|
13139
|
-
cacheWrite: 0,
|
|
13140
|
-
},
|
|
13141
|
-
contextWindow: 202752,
|
|
13142
|
-
maxTokens: 131072,
|
|
13143
|
-
},
|
|
13144
12908
|
"~anthropic/claude-fable-latest": {
|
|
13145
12909
|
id: "~anthropic/claude-fable-latest",
|
|
13146
12910
|
name: "Anthropic: Claude Fable Latest",
|
|
@@ -13169,7 +12933,7 @@ export const MODELS = {
|
|
|
13169
12933
|
cost: {
|
|
13170
12934
|
input: 1,
|
|
13171
12935
|
output: 5,
|
|
13172
|
-
cacheRead: 0.
|
|
12936
|
+
cacheRead: 0.1,
|
|
13173
12937
|
cacheWrite: 1.25,
|
|
13174
12938
|
},
|
|
13175
12939
|
contextWindow: 200000,
|
|
@@ -13221,7 +12985,7 @@ export const MODELS = {
|
|
|
13221
12985
|
input: 1.5,
|
|
13222
12986
|
output: 9,
|
|
13223
12987
|
cacheRead: 0.15,
|
|
13224
|
-
cacheWrite: 0.
|
|
12988
|
+
cacheWrite: 0.083333,
|
|
13225
12989
|
},
|
|
13226
12990
|
contextWindow: 1048576,
|
|
13227
12991
|
maxTokens: 65536,
|
|
@@ -13237,7 +13001,7 @@ export const MODELS = {
|
|
|
13237
13001
|
cost: {
|
|
13238
13002
|
input: 2,
|
|
13239
13003
|
output: 12,
|
|
13240
|
-
cacheRead: 0.
|
|
13004
|
+
cacheRead: 0.2,
|
|
13241
13005
|
cacheWrite: 0.375,
|
|
13242
13006
|
},
|
|
13243
13007
|
contextWindow: 1048576,
|
|
@@ -13252,9 +13016,9 @@ export const MODELS = {
|
|
|
13252
13016
|
reasoning: true,
|
|
13253
13017
|
input: ["text", "image"],
|
|
13254
13018
|
cost: {
|
|
13255
|
-
input: 0.
|
|
13019
|
+
input: 0.68,
|
|
13256
13020
|
output: 3.41,
|
|
13257
|
-
cacheRead: 0.
|
|
13021
|
+
cacheRead: 0.34,
|
|
13258
13022
|
cacheWrite: 0,
|
|
13259
13023
|
},
|
|
13260
13024
|
contextWindow: 262144,
|
|
@@ -13296,25 +13060,6 @@ export const MODELS = {
|
|
|
13296
13060
|
},
|
|
13297
13061
|
},
|
|
13298
13062
|
"together": {
|
|
13299
|
-
"MiniMaxAI/MiniMax-M2.5": {
|
|
13300
|
-
id: "MiniMaxAI/MiniMax-M2.5",
|
|
13301
|
-
name: "MiniMax-M2.5",
|
|
13302
|
-
api: "openai-completions",
|
|
13303
|
-
provider: "together",
|
|
13304
|
-
baseUrl: "https://api.together.ai/v1",
|
|
13305
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
13306
|
-
reasoning: true,
|
|
13307
|
-
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13308
|
-
input: ["text"],
|
|
13309
|
-
cost: {
|
|
13310
|
-
input: 0.3,
|
|
13311
|
-
output: 1.2,
|
|
13312
|
-
cacheRead: 0.06,
|
|
13313
|
-
cacheWrite: 0,
|
|
13314
|
-
},
|
|
13315
|
-
contextWindow: 204800,
|
|
13316
|
-
maxTokens: 131072,
|
|
13317
|
-
},
|
|
13318
13063
|
"MiniMaxAI/MiniMax-M2.7": {
|
|
13319
13064
|
id: "MiniMaxAI/MiniMax-M2.7",
|
|
13320
13065
|
name: "MiniMax-M2.7",
|
|
@@ -13334,28 +13079,27 @@ export const MODELS = {
|
|
|
13334
13079
|
contextWindow: 202752,
|
|
13335
13080
|
maxTokens: 131072,
|
|
13336
13081
|
},
|
|
13337
|
-
"Qwen/
|
|
13338
|
-
id: "Qwen/
|
|
13339
|
-
name: "
|
|
13082
|
+
"Qwen/Qwen2.5-7B-Instruct-Turbo": {
|
|
13083
|
+
id: "Qwen/Qwen2.5-7B-Instruct-Turbo",
|
|
13084
|
+
name: "Qwen 2.5 7B Instruct Turbo",
|
|
13340
13085
|
api: "openai-completions",
|
|
13341
13086
|
provider: "together",
|
|
13342
13087
|
baseUrl: "https://api.together.ai/v1",
|
|
13343
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false
|
|
13344
|
-
reasoning:
|
|
13345
|
-
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13088
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
13089
|
+
reasoning: false,
|
|
13346
13090
|
input: ["text"],
|
|
13347
13091
|
cost: {
|
|
13348
|
-
input: 0.
|
|
13349
|
-
output: 0.
|
|
13092
|
+
input: 0.3,
|
|
13093
|
+
output: 0.3,
|
|
13350
13094
|
cacheRead: 0,
|
|
13351
13095
|
cacheWrite: 0,
|
|
13352
13096
|
},
|
|
13353
|
-
contextWindow:
|
|
13354
|
-
maxTokens:
|
|
13097
|
+
contextWindow: 32768,
|
|
13098
|
+
maxTokens: 32768,
|
|
13355
13099
|
},
|
|
13356
|
-
"Qwen/Qwen3-
|
|
13357
|
-
id: "Qwen/Qwen3-
|
|
13358
|
-
name: "Qwen3
|
|
13100
|
+
"Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
|
|
13101
|
+
id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
|
|
13102
|
+
name: "Qwen3 235B A22B Instruct 2507 FP8",
|
|
13359
13103
|
api: "openai-completions",
|
|
13360
13104
|
provider: "together",
|
|
13361
13105
|
baseUrl: "https://api.together.ai/v1",
|
|
@@ -13363,36 +13107,36 @@ export const MODELS = {
|
|
|
13363
13107
|
reasoning: false,
|
|
13364
13108
|
input: ["text"],
|
|
13365
13109
|
cost: {
|
|
13366
|
-
input: 2,
|
|
13367
|
-
output:
|
|
13110
|
+
input: 0.2,
|
|
13111
|
+
output: 0.6,
|
|
13368
13112
|
cacheRead: 0,
|
|
13369
13113
|
cacheWrite: 0,
|
|
13370
13114
|
},
|
|
13371
13115
|
contextWindow: 262144,
|
|
13372
13116
|
maxTokens: 262144,
|
|
13373
13117
|
},
|
|
13374
|
-
"Qwen/Qwen3-
|
|
13375
|
-
id: "Qwen/Qwen3-
|
|
13376
|
-
name: "Qwen3
|
|
13118
|
+
"Qwen/Qwen3.5-397B-A17B": {
|
|
13119
|
+
id: "Qwen/Qwen3.5-397B-A17B",
|
|
13120
|
+
name: "Qwen3.5 397B A17B",
|
|
13377
13121
|
api: "openai-completions",
|
|
13378
13122
|
provider: "together",
|
|
13379
13123
|
baseUrl: "https://api.together.ai/v1",
|
|
13380
13124
|
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
13381
13125
|
reasoning: true,
|
|
13382
13126
|
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13383
|
-
input: ["text"],
|
|
13127
|
+
input: ["text", "image"],
|
|
13384
13128
|
cost: {
|
|
13385
|
-
input: 0.
|
|
13386
|
-
output:
|
|
13129
|
+
input: 0.6,
|
|
13130
|
+
output: 3.6,
|
|
13387
13131
|
cacheRead: 0,
|
|
13388
13132
|
cacheWrite: 0,
|
|
13389
13133
|
},
|
|
13390
13134
|
contextWindow: 262144,
|
|
13391
|
-
maxTokens:
|
|
13135
|
+
maxTokens: 130000,
|
|
13392
13136
|
},
|
|
13393
|
-
"Qwen/Qwen3.5-
|
|
13394
|
-
id: "Qwen/Qwen3.5-
|
|
13395
|
-
name: "Qwen3.5
|
|
13137
|
+
"Qwen/Qwen3.5-9B": {
|
|
13138
|
+
id: "Qwen/Qwen3.5-9B",
|
|
13139
|
+
name: "Qwen3.5 9B",
|
|
13396
13140
|
api: "openai-completions",
|
|
13397
13141
|
provider: "together",
|
|
13398
13142
|
baseUrl: "https://api.together.ai/v1",
|
|
@@ -13401,13 +13145,13 @@ export const MODELS = {
|
|
|
13401
13145
|
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13402
13146
|
input: ["text", "image"],
|
|
13403
13147
|
cost: {
|
|
13404
|
-
input: 0.
|
|
13405
|
-
output:
|
|
13148
|
+
input: 0.17,
|
|
13149
|
+
output: 0.25,
|
|
13406
13150
|
cacheRead: 0,
|
|
13407
13151
|
cacheWrite: 0,
|
|
13408
13152
|
},
|
|
13409
13153
|
contextWindow: 262144,
|
|
13410
|
-
maxTokens:
|
|
13154
|
+
maxTokens: 65536,
|
|
13411
13155
|
},
|
|
13412
13156
|
"Qwen/Qwen3.6-Plus": {
|
|
13413
13157
|
id: "Qwen/Qwen3.6-Plus",
|
|
@@ -13434,9 +13178,8 @@ export const MODELS = {
|
|
|
13434
13178
|
api: "openai-completions",
|
|
13435
13179
|
provider: "together",
|
|
13436
13180
|
baseUrl: "https://api.together.ai/v1",
|
|
13437
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false
|
|
13438
|
-
reasoning:
|
|
13439
|
-
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13181
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
13182
|
+
reasoning: false,
|
|
13440
13183
|
input: ["text"],
|
|
13441
13184
|
cost: {
|
|
13442
13185
|
input: 2.5,
|
|
@@ -13447,44 +13190,6 @@ export const MODELS = {
|
|
|
13447
13190
|
contextWindow: 1000000,
|
|
13448
13191
|
maxTokens: 500000,
|
|
13449
13192
|
},
|
|
13450
|
-
"deepseek-ai/DeepSeek-V3": {
|
|
13451
|
-
id: "deepseek-ai/DeepSeek-V3",
|
|
13452
|
-
name: "DeepSeek-V3",
|
|
13453
|
-
api: "openai-completions",
|
|
13454
|
-
provider: "together",
|
|
13455
|
-
baseUrl: "https://api.together.ai/v1",
|
|
13456
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
13457
|
-
reasoning: true,
|
|
13458
|
-
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13459
|
-
input: ["text"],
|
|
13460
|
-
cost: {
|
|
13461
|
-
input: 1.25,
|
|
13462
|
-
output: 1.25,
|
|
13463
|
-
cacheRead: 0,
|
|
13464
|
-
cacheWrite: 0,
|
|
13465
|
-
},
|
|
13466
|
-
contextWindow: 131072,
|
|
13467
|
-
maxTokens: 131072,
|
|
13468
|
-
},
|
|
13469
|
-
"deepseek-ai/DeepSeek-V3-1": {
|
|
13470
|
-
id: "deepseek-ai/DeepSeek-V3-1",
|
|
13471
|
-
name: "DeepSeek V3.1",
|
|
13472
|
-
api: "openai-completions",
|
|
13473
|
-
provider: "together",
|
|
13474
|
-
baseUrl: "https://api.together.ai/v1",
|
|
13475
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
13476
|
-
reasoning: true,
|
|
13477
|
-
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13478
|
-
input: ["text"],
|
|
13479
|
-
cost: {
|
|
13480
|
-
input: 0.6,
|
|
13481
|
-
output: 1.7,
|
|
13482
|
-
cacheRead: 0,
|
|
13483
|
-
cacheWrite: 0,
|
|
13484
|
-
},
|
|
13485
|
-
contextWindow: 131072,
|
|
13486
|
-
maxTokens: 131072,
|
|
13487
|
-
},
|
|
13488
13193
|
"deepseek-ai/DeepSeek-V4-Pro": {
|
|
13489
13194
|
id: "deepseek-ai/DeepSeek-V4-Pro",
|
|
13490
13195
|
name: "DeepSeek V4 Pro",
|
|
@@ -13496,8 +13201,8 @@ export const MODELS = {
|
|
|
13496
13201
|
thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": null },
|
|
13497
13202
|
input: ["text"],
|
|
13498
13203
|
cost: {
|
|
13499
|
-
input:
|
|
13500
|
-
output:
|
|
13204
|
+
input: 1.74,
|
|
13205
|
+
output: 3.48,
|
|
13501
13206
|
cacheRead: 0.2,
|
|
13502
13207
|
cacheWrite: 0,
|
|
13503
13208
|
},
|
|
@@ -13533,8 +13238,8 @@ export const MODELS = {
|
|
|
13533
13238
|
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13534
13239
|
input: ["text", "image"],
|
|
13535
13240
|
cost: {
|
|
13536
|
-
input: 0.
|
|
13537
|
-
output: 0.
|
|
13241
|
+
input: 0.39,
|
|
13242
|
+
output: 0.97,
|
|
13538
13243
|
cacheRead: 0,
|
|
13539
13244
|
cacheWrite: 0,
|
|
13540
13245
|
},
|
|
@@ -13559,25 +13264,6 @@ export const MODELS = {
|
|
|
13559
13264
|
contextWindow: 131072,
|
|
13560
13265
|
maxTokens: 131072,
|
|
13561
13266
|
},
|
|
13562
|
-
"moonshotai/Kimi-K2.5": {
|
|
13563
|
-
id: "moonshotai/Kimi-K2.5",
|
|
13564
|
-
name: "Kimi K2.5",
|
|
13565
|
-
api: "openai-completions",
|
|
13566
|
-
provider: "together",
|
|
13567
|
-
baseUrl: "https://api.together.ai/v1",
|
|
13568
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
13569
|
-
reasoning: true,
|
|
13570
|
-
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13571
|
-
input: ["text", "image"],
|
|
13572
|
-
cost: {
|
|
13573
|
-
input: 0.5,
|
|
13574
|
-
output: 2.8,
|
|
13575
|
-
cacheRead: 0,
|
|
13576
|
-
cacheWrite: 0,
|
|
13577
|
-
},
|
|
13578
|
-
contextWindow: 262144,
|
|
13579
|
-
maxTokens: 262144,
|
|
13580
|
-
},
|
|
13581
13267
|
"moonshotai/Kimi-K2.6": {
|
|
13582
13268
|
id: "moonshotai/Kimi-K2.6",
|
|
13583
13269
|
name: "Kimi K2.6",
|
|
@@ -13635,6 +13321,44 @@ export const MODELS = {
|
|
|
13635
13321
|
contextWindow: 131072,
|
|
13636
13322
|
maxTokens: 131072,
|
|
13637
13323
|
},
|
|
13324
|
+
"openai/gpt-oss-20b": {
|
|
13325
|
+
id: "openai/gpt-oss-20b",
|
|
13326
|
+
name: "GPT OSS 20B",
|
|
13327
|
+
api: "openai-completions",
|
|
13328
|
+
provider: "together",
|
|
13329
|
+
baseUrl: "https://api.together.ai/v1",
|
|
13330
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "openai" },
|
|
13331
|
+
reasoning: true,
|
|
13332
|
+
thinkingLevelMap: { "off": null, "minimal": null },
|
|
13333
|
+
input: ["text"],
|
|
13334
|
+
cost: {
|
|
13335
|
+
input: 0.05,
|
|
13336
|
+
output: 0.2,
|
|
13337
|
+
cacheRead: 0,
|
|
13338
|
+
cacheWrite: 0,
|
|
13339
|
+
},
|
|
13340
|
+
contextWindow: 131072,
|
|
13341
|
+
maxTokens: 131072,
|
|
13342
|
+
},
|
|
13343
|
+
"zai-org/GLM-5": {
|
|
13344
|
+
id: "zai-org/GLM-5",
|
|
13345
|
+
name: "GLM-5",
|
|
13346
|
+
api: "openai-completions",
|
|
13347
|
+
provider: "together",
|
|
13348
|
+
baseUrl: "https://api.together.ai/v1",
|
|
13349
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
13350
|
+
reasoning: true,
|
|
13351
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13352
|
+
input: ["text"],
|
|
13353
|
+
cost: {
|
|
13354
|
+
input: 1,
|
|
13355
|
+
output: 3.2,
|
|
13356
|
+
cacheRead: 0,
|
|
13357
|
+
cacheWrite: 0,
|
|
13358
|
+
},
|
|
13359
|
+
contextWindow: 202752,
|
|
13360
|
+
maxTokens: 131072,
|
|
13361
|
+
},
|
|
13638
13362
|
"zai-org/GLM-5.1": {
|
|
13639
13363
|
id: "zai-org/GLM-5.1",
|
|
13640
13364
|
name: "GLM-5.1",
|
|
@@ -13750,7 +13474,7 @@ export const MODELS = {
|
|
|
13750
13474
|
reasoning: true,
|
|
13751
13475
|
input: ["text", "image"],
|
|
13752
13476
|
cost: {
|
|
13753
|
-
input: 0.
|
|
13477
|
+
input: 0.4,
|
|
13754
13478
|
output: 4,
|
|
13755
13479
|
cacheRead: 0,
|
|
13756
13480
|
cacheWrite: 0,
|
|
@@ -13820,7 +13544,7 @@ export const MODELS = {
|
|
|
13820
13544
|
cost: {
|
|
13821
13545
|
input: 1,
|
|
13822
13546
|
output: 5,
|
|
13823
|
-
cacheRead: 0.
|
|
13547
|
+
cacheRead: 0.2,
|
|
13824
13548
|
cacheWrite: 0,
|
|
13825
13549
|
},
|
|
13826
13550
|
contextWindow: 1000000,
|
|
@@ -13920,7 +13644,7 @@ export const MODELS = {
|
|
|
13920
13644
|
reasoning: true,
|
|
13921
13645
|
input: ["text", "image"],
|
|
13922
13646
|
cost: {
|
|
13923
|
-
input: 0.
|
|
13647
|
+
input: 0.4,
|
|
13924
13648
|
output: 4,
|
|
13925
13649
|
cacheRead: 0,
|
|
13926
13650
|
cacheWrite: 0,
|
|
@@ -13937,8 +13661,8 @@ export const MODELS = {
|
|
|
13937
13661
|
reasoning: true,
|
|
13938
13662
|
input: ["text", "image"],
|
|
13939
13663
|
cost: {
|
|
13940
|
-
input: 0.
|
|
13941
|
-
output: 0.
|
|
13664
|
+
input: 0.1,
|
|
13665
|
+
output: 0.4,
|
|
13942
13666
|
cacheRead: 0.001,
|
|
13943
13667
|
cacheWrite: 0.125,
|
|
13944
13668
|
},
|
|
@@ -13954,7 +13678,7 @@ export const MODELS = {
|
|
|
13954
13678
|
reasoning: true,
|
|
13955
13679
|
input: ["text", "image"],
|
|
13956
13680
|
cost: {
|
|
13957
|
-
input: 0.
|
|
13681
|
+
input: 0.4,
|
|
13958
13682
|
output: 2.4,
|
|
13959
13683
|
cacheRead: 0.04,
|
|
13960
13684
|
cacheWrite: 0.5,
|
|
@@ -13972,7 +13696,7 @@ export const MODELS = {
|
|
|
13972
13696
|
input: ["text", "image"],
|
|
13973
13697
|
cost: {
|
|
13974
13698
|
input: 0.6,
|
|
13975
|
-
output: 3.
|
|
13699
|
+
output: 3.6,
|
|
13976
13700
|
cacheRead: 0,
|
|
13977
13701
|
cacheWrite: 0,
|
|
13978
13702
|
},
|
|
@@ -13990,7 +13714,7 @@ export const MODELS = {
|
|
|
13990
13714
|
cost: {
|
|
13991
13715
|
input: 0.5,
|
|
13992
13716
|
output: 3,
|
|
13993
|
-
cacheRead: 0.
|
|
13717
|
+
cacheRead: 0.1,
|
|
13994
13718
|
cacheWrite: 0.625,
|
|
13995
13719
|
},
|
|
13996
13720
|
contextWindow: 1000000,
|
|
@@ -14022,8 +13746,8 @@ export const MODELS = {
|
|
|
14022
13746
|
reasoning: true,
|
|
14023
13747
|
input: ["text", "image"],
|
|
14024
13748
|
cost: {
|
|
14025
|
-
input: 0.
|
|
14026
|
-
output: 1.
|
|
13749
|
+
input: 0.4,
|
|
13750
|
+
output: 1.6,
|
|
14027
13751
|
cacheRead: 0.08,
|
|
14028
13752
|
cacheWrite: 0.5,
|
|
14029
13753
|
},
|
|
@@ -14056,7 +13780,7 @@ export const MODELS = {
|
|
|
14056
13780
|
reasoning: false,
|
|
14057
13781
|
input: ["text", "image"],
|
|
14058
13782
|
cost: {
|
|
14059
|
-
input: 0.
|
|
13783
|
+
input: 0.8,
|
|
14060
13784
|
output: 4,
|
|
14061
13785
|
cacheRead: 0.08,
|
|
14062
13786
|
cacheWrite: 1,
|
|
@@ -14072,7 +13796,7 @@ export const MODELS = {
|
|
|
14072
13796
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
14073
13797
|
compat: { "forceAdaptiveThinking": true },
|
|
14074
13798
|
reasoning: true,
|
|
14075
|
-
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
13799
|
+
thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
|
|
14076
13800
|
input: ["text", "image"],
|
|
14077
13801
|
cost: {
|
|
14078
13802
|
input: 10,
|
|
@@ -14094,7 +13818,7 @@ export const MODELS = {
|
|
|
14094
13818
|
cost: {
|
|
14095
13819
|
input: 1,
|
|
14096
13820
|
output: 5,
|
|
14097
|
-
cacheRead: 0.
|
|
13821
|
+
cacheRead: 0.1,
|
|
14098
13822
|
cacheWrite: 1.25,
|
|
14099
13823
|
},
|
|
14100
13824
|
contextWindow: 200000,
|
|
@@ -14287,7 +14011,7 @@ export const MODELS = {
|
|
|
14287
14011
|
input: ["text"],
|
|
14288
14012
|
cost: {
|
|
14289
14013
|
input: 0.25,
|
|
14290
|
-
output: 0.
|
|
14014
|
+
output: 0.9,
|
|
14291
14015
|
cacheRead: 0,
|
|
14292
14016
|
cacheWrite: 0,
|
|
14293
14017
|
},
|
|
@@ -14305,7 +14029,7 @@ export const MODELS = {
|
|
|
14305
14029
|
cost: {
|
|
14306
14030
|
input: 0.25,
|
|
14307
14031
|
output: 2,
|
|
14308
|
-
cacheRead: 0.
|
|
14032
|
+
cacheRead: 0.05,
|
|
14309
14033
|
cacheWrite: 0,
|
|
14310
14034
|
},
|
|
14311
14035
|
contextWindow: 256000,
|
|
@@ -14490,8 +14214,8 @@ export const MODELS = {
|
|
|
14490
14214
|
reasoning: true,
|
|
14491
14215
|
input: ["text", "image"],
|
|
14492
14216
|
cost: {
|
|
14493
|
-
input: 0.
|
|
14494
|
-
output: 0.
|
|
14217
|
+
input: 0.1,
|
|
14218
|
+
output: 0.4,
|
|
14495
14219
|
cacheRead: 0.01,
|
|
14496
14220
|
cacheWrite: 0,
|
|
14497
14221
|
},
|
|
@@ -14526,7 +14250,7 @@ export const MODELS = {
|
|
|
14526
14250
|
cost: {
|
|
14527
14251
|
input: 0.5,
|
|
14528
14252
|
output: 3,
|
|
14529
|
-
cacheRead: 0.
|
|
14253
|
+
cacheRead: 0.05,
|
|
14530
14254
|
cacheWrite: 0,
|
|
14531
14255
|
},
|
|
14532
14256
|
contextWindow: 1000000,
|
|
@@ -14543,7 +14267,7 @@ export const MODELS = {
|
|
|
14543
14267
|
cost: {
|
|
14544
14268
|
input: 2,
|
|
14545
14269
|
output: 12,
|
|
14546
|
-
cacheRead: 0.
|
|
14270
|
+
cacheRead: 0.2,
|
|
14547
14271
|
cacheWrite: 0,
|
|
14548
14272
|
},
|
|
14549
14273
|
contextWindow: 1000000,
|
|
@@ -14594,7 +14318,7 @@ export const MODELS = {
|
|
|
14594
14318
|
cost: {
|
|
14595
14319
|
input: 2,
|
|
14596
14320
|
output: 12,
|
|
14597
|
-
cacheRead: 0.
|
|
14321
|
+
cacheRead: 0.2,
|
|
14598
14322
|
cacheWrite: 0,
|
|
14599
14323
|
},
|
|
14600
14324
|
contextWindow: 1000000,
|
|
@@ -14644,7 +14368,7 @@ export const MODELS = {
|
|
|
14644
14368
|
input: ["text", "image"],
|
|
14645
14369
|
cost: {
|
|
14646
14370
|
input: 0.14,
|
|
14647
|
-
output: 0.
|
|
14371
|
+
output: 0.4,
|
|
14648
14372
|
cacheRead: 0,
|
|
14649
14373
|
cacheWrite: 0,
|
|
14650
14374
|
},
|
|
@@ -14662,7 +14386,7 @@ export const MODELS = {
|
|
|
14662
14386
|
cost: {
|
|
14663
14387
|
input: 0.25,
|
|
14664
14388
|
output: 0.75,
|
|
14665
|
-
cacheRead: 0.
|
|
14389
|
+
cacheRead: 0.025,
|
|
14666
14390
|
cacheWrite: 0,
|
|
14667
14391
|
},
|
|
14668
14392
|
contextWindow: 128000,
|
|
@@ -14814,7 +14538,7 @@ export const MODELS = {
|
|
|
14814
14538
|
input: ["text", "image"],
|
|
14815
14539
|
cost: {
|
|
14816
14540
|
input: 0.24,
|
|
14817
|
-
output: 0.
|
|
14541
|
+
output: 0.97,
|
|
14818
14542
|
cacheRead: 0,
|
|
14819
14543
|
cacheWrite: 0,
|
|
14820
14544
|
},
|
|
@@ -14830,7 +14554,7 @@ export const MODELS = {
|
|
|
14830
14554
|
reasoning: false,
|
|
14831
14555
|
input: ["text", "image"],
|
|
14832
14556
|
cost: {
|
|
14833
|
-
input: 0.
|
|
14557
|
+
input: 0.17,
|
|
14834
14558
|
output: 0.66,
|
|
14835
14559
|
cacheRead: 0,
|
|
14836
14560
|
cacheWrite: 0,
|
|
@@ -14984,7 +14708,7 @@ export const MODELS = {
|
|
|
14984
14708
|
input: ["text"],
|
|
14985
14709
|
cost: {
|
|
14986
14710
|
input: 0.3,
|
|
14987
|
-
output: 0.
|
|
14711
|
+
output: 0.9,
|
|
14988
14712
|
cacheRead: 0,
|
|
14989
14713
|
cacheWrite: 0,
|
|
14990
14714
|
},
|
|
@@ -15000,7 +14724,7 @@ export const MODELS = {
|
|
|
15000
14724
|
reasoning: false,
|
|
15001
14725
|
input: ["text"],
|
|
15002
14726
|
cost: {
|
|
15003
|
-
input: 0.
|
|
14727
|
+
input: 0.4,
|
|
15004
14728
|
output: 2,
|
|
15005
14729
|
cacheRead: 0,
|
|
15006
14730
|
cacheWrite: 0,
|
|
@@ -15017,7 +14741,7 @@ export const MODELS = {
|
|
|
15017
14741
|
reasoning: false,
|
|
15018
14742
|
input: ["text"],
|
|
15019
14743
|
cost: {
|
|
15020
|
-
input: 0.
|
|
14744
|
+
input: 0.1,
|
|
15021
14745
|
output: 0.3,
|
|
15022
14746
|
cacheRead: 0,
|
|
15023
14747
|
cacheWrite: 0,
|
|
@@ -15034,7 +14758,7 @@ export const MODELS = {
|
|
|
15034
14758
|
reasoning: false,
|
|
15035
14759
|
input: ["text"],
|
|
15036
14760
|
cost: {
|
|
15037
|
-
input: 0.
|
|
14761
|
+
input: 0.1,
|
|
15038
14762
|
output: 0.3,
|
|
15039
14763
|
cacheRead: 0,
|
|
15040
14764
|
cacheWrite: 0,
|
|
@@ -15051,8 +14775,8 @@ export const MODELS = {
|
|
|
15051
14775
|
reasoning: false,
|
|
15052
14776
|
input: ["text"],
|
|
15053
14777
|
cost: {
|
|
15054
|
-
input: 0.
|
|
15055
|
-
output: 0.
|
|
14778
|
+
input: 0.1,
|
|
14779
|
+
output: 0.1,
|
|
15056
14780
|
cacheRead: 0,
|
|
15057
14781
|
cacheWrite: 0,
|
|
15058
14782
|
},
|
|
@@ -15085,7 +14809,7 @@ export const MODELS = {
|
|
|
15085
14809
|
reasoning: false,
|
|
15086
14810
|
input: ["text", "image"],
|
|
15087
14811
|
cost: {
|
|
15088
|
-
input: 0.
|
|
14812
|
+
input: 0.4,
|
|
15089
14813
|
output: 2,
|
|
15090
14814
|
cacheRead: 0,
|
|
15091
14815
|
cacheWrite: 0,
|
|
@@ -15136,7 +14860,7 @@ export const MODELS = {
|
|
|
15136
14860
|
reasoning: false,
|
|
15137
14861
|
input: ["text", "image"],
|
|
15138
14862
|
cost: {
|
|
15139
|
-
input: 0.
|
|
14863
|
+
input: 0.1,
|
|
15140
14864
|
output: 0.3,
|
|
15141
14865
|
cacheRead: 0,
|
|
15142
14866
|
cacheWrite: 0,
|
|
@@ -15187,7 +14911,7 @@ export const MODELS = {
|
|
|
15187
14911
|
reasoning: false,
|
|
15188
14912
|
input: ["text"],
|
|
15189
14913
|
cost: {
|
|
15190
|
-
input: 0.
|
|
14914
|
+
input: 0.57,
|
|
15191
14915
|
output: 2.3,
|
|
15192
14916
|
cacheRead: 0,
|
|
15193
14917
|
cacheWrite: 0,
|
|
@@ -15212,40 +14936,6 @@ export const MODELS = {
|
|
|
15212
14936
|
contextWindow: 262114,
|
|
15213
14937
|
maxTokens: 262114,
|
|
15214
14938
|
},
|
|
15215
|
-
"moonshotai/kimi-k2-thinking-turbo": {
|
|
15216
|
-
id: "moonshotai/kimi-k2-thinking-turbo",
|
|
15217
|
-
name: "Kimi K2 Thinking Turbo",
|
|
15218
|
-
api: "anthropic-messages",
|
|
15219
|
-
provider: "vercel-ai-gateway",
|
|
15220
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15221
|
-
reasoning: true,
|
|
15222
|
-
input: ["text"],
|
|
15223
|
-
cost: {
|
|
15224
|
-
input: 1.15,
|
|
15225
|
-
output: 8,
|
|
15226
|
-
cacheRead: 0.15,
|
|
15227
|
-
cacheWrite: 0,
|
|
15228
|
-
},
|
|
15229
|
-
contextWindow: 262114,
|
|
15230
|
-
maxTokens: 262114,
|
|
15231
|
-
},
|
|
15232
|
-
"moonshotai/kimi-k2-turbo": {
|
|
15233
|
-
id: "moonshotai/kimi-k2-turbo",
|
|
15234
|
-
name: "Kimi K2 Turbo",
|
|
15235
|
-
api: "anthropic-messages",
|
|
15236
|
-
provider: "vercel-ai-gateway",
|
|
15237
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15238
|
-
reasoning: false,
|
|
15239
|
-
input: ["text"],
|
|
15240
|
-
cost: {
|
|
15241
|
-
input: 1.15,
|
|
15242
|
-
output: 8,
|
|
15243
|
-
cacheRead: 0.15,
|
|
15244
|
-
cacheWrite: 0,
|
|
15245
|
-
},
|
|
15246
|
-
contextWindow: 256000,
|
|
15247
|
-
maxTokens: 16384,
|
|
15248
|
-
},
|
|
15249
14939
|
"moonshotai/kimi-k2.5": {
|
|
15250
14940
|
id: "moonshotai/kimi-k2.5",
|
|
15251
14941
|
name: "Kimi K2.5",
|
|
@@ -15257,7 +14947,7 @@ export const MODELS = {
|
|
|
15257
14947
|
cost: {
|
|
15258
14948
|
input: 0.6,
|
|
15259
14949
|
output: 3,
|
|
15260
|
-
cacheRead: 0.
|
|
14950
|
+
cacheRead: 0.1,
|
|
15261
14951
|
cacheWrite: 0,
|
|
15262
14952
|
},
|
|
15263
14953
|
contextWindow: 262114,
|
|
@@ -15280,6 +14970,23 @@ export const MODELS = {
|
|
|
15280
14970
|
contextWindow: 262000,
|
|
15281
14971
|
maxTokens: 262000,
|
|
15282
14972
|
},
|
|
14973
|
+
"moonshotai/kimi-k2.7-code": {
|
|
14974
|
+
id: "moonshotai/kimi-k2.7-code",
|
|
14975
|
+
name: "Kimi K2.7 Code",
|
|
14976
|
+
api: "anthropic-messages",
|
|
14977
|
+
provider: "vercel-ai-gateway",
|
|
14978
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
14979
|
+
reasoning: true,
|
|
14980
|
+
input: ["text", "image"],
|
|
14981
|
+
cost: {
|
|
14982
|
+
input: 0.95,
|
|
14983
|
+
output: 4,
|
|
14984
|
+
cacheRead: 0.19,
|
|
14985
|
+
cacheWrite: 0,
|
|
14986
|
+
},
|
|
14987
|
+
contextWindow: 256000,
|
|
14988
|
+
maxTokens: 32768,
|
|
14989
|
+
},
|
|
15283
14990
|
"nvidia/nemotron-3-super-120b-a12b": {
|
|
15284
14991
|
id: "nvidia/nemotron-3-super-120b-a12b",
|
|
15285
14992
|
name: "NVIDIA Nemotron 3 Super 120B A12B",
|
|
@@ -15323,7 +15030,7 @@ export const MODELS = {
|
|
|
15323
15030
|
reasoning: true,
|
|
15324
15031
|
input: ["text", "image"],
|
|
15325
15032
|
cost: {
|
|
15326
|
-
input: 0.
|
|
15033
|
+
input: 0.2,
|
|
15327
15034
|
output: 0.6,
|
|
15328
15035
|
cacheRead: 0,
|
|
15329
15036
|
cacheWrite: 0,
|
|
@@ -15341,7 +15048,7 @@ export const MODELS = {
|
|
|
15341
15048
|
input: ["text"],
|
|
15342
15049
|
cost: {
|
|
15343
15050
|
input: 0.06,
|
|
15344
|
-
output: 0.
|
|
15051
|
+
output: 0.23,
|
|
15345
15052
|
cacheRead: 0,
|
|
15346
15053
|
cacheWrite: 0,
|
|
15347
15054
|
},
|
|
@@ -15391,9 +15098,9 @@ export const MODELS = {
|
|
|
15391
15098
|
reasoning: false,
|
|
15392
15099
|
input: ["text", "image"],
|
|
15393
15100
|
cost: {
|
|
15394
|
-
input: 0.
|
|
15395
|
-
output: 1.
|
|
15396
|
-
cacheRead: 0.
|
|
15101
|
+
input: 0.4,
|
|
15102
|
+
output: 1.6,
|
|
15103
|
+
cacheRead: 0.1,
|
|
15397
15104
|
cacheWrite: 0,
|
|
15398
15105
|
},
|
|
15399
15106
|
contextWindow: 1047576,
|
|
@@ -15408,9 +15115,9 @@ export const MODELS = {
|
|
|
15408
15115
|
reasoning: false,
|
|
15409
15116
|
input: ["text", "image"],
|
|
15410
15117
|
cost: {
|
|
15411
|
-
input: 0.
|
|
15412
|
-
output: 0.
|
|
15413
|
-
cacheRead: 0.
|
|
15118
|
+
input: 0.1,
|
|
15119
|
+
output: 0.4,
|
|
15120
|
+
cacheRead: 0.025,
|
|
15414
15121
|
cacheWrite: 0,
|
|
15415
15122
|
},
|
|
15416
15123
|
contextWindow: 1047576,
|
|
@@ -15512,7 +15219,7 @@ export const MODELS = {
|
|
|
15512
15219
|
cost: {
|
|
15513
15220
|
input: 0.25,
|
|
15514
15221
|
output: 2,
|
|
15515
|
-
cacheRead: 0.
|
|
15222
|
+
cacheRead: 0.025,
|
|
15516
15223
|
cacheWrite: 0,
|
|
15517
15224
|
},
|
|
15518
15225
|
contextWindow: 400000,
|
|
@@ -15527,8 +15234,8 @@ export const MODELS = {
|
|
|
15527
15234
|
reasoning: true,
|
|
15528
15235
|
input: ["text", "image"],
|
|
15529
15236
|
cost: {
|
|
15530
|
-
input: 0.
|
|
15531
|
-
output: 0.
|
|
15237
|
+
input: 0.05,
|
|
15238
|
+
output: 0.4,
|
|
15532
15239
|
cacheRead: 0.005,
|
|
15533
15240
|
cacheWrite: 0,
|
|
15534
15241
|
},
|
|
@@ -15597,7 +15304,7 @@ export const MODELS = {
|
|
|
15597
15304
|
cost: {
|
|
15598
15305
|
input: 0.25,
|
|
15599
15306
|
output: 2,
|
|
15600
|
-
cacheRead: 0.
|
|
15307
|
+
cacheRead: 0.025,
|
|
15601
15308
|
cacheWrite: 0,
|
|
15602
15309
|
},
|
|
15603
15310
|
contextWindow: 400000,
|
|
@@ -15791,7 +15498,7 @@ export const MODELS = {
|
|
|
15791
15498
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
15792
15499
|
input: ["text", "image"],
|
|
15793
15500
|
cost: {
|
|
15794
|
-
input: 0.
|
|
15501
|
+
input: 0.2,
|
|
15795
15502
|
output: 1.25,
|
|
15796
15503
|
cacheRead: 0.02,
|
|
15797
15504
|
cacheWrite: 0,
|
|
@@ -15879,8 +15586,8 @@ export const MODELS = {
|
|
|
15879
15586
|
reasoning: true,
|
|
15880
15587
|
input: ["text"],
|
|
15881
15588
|
cost: {
|
|
15882
|
-
input: 0.
|
|
15883
|
-
output: 0.
|
|
15589
|
+
input: 0.05,
|
|
15590
|
+
output: 0.2,
|
|
15884
15591
|
cacheRead: 0,
|
|
15885
15592
|
cacheWrite: 0,
|
|
15886
15593
|
},
|
|
@@ -16066,7 +15773,7 @@ export const MODELS = {
|
|
|
16066
15773
|
reasoning: true,
|
|
16067
15774
|
input: ["text", "image"],
|
|
16068
15775
|
cost: {
|
|
16069
|
-
input: 0.
|
|
15776
|
+
input: 0.2,
|
|
16070
15777
|
output: 1.15,
|
|
16071
15778
|
cacheRead: 0.04,
|
|
16072
15779
|
cacheWrite: 0,
|
|
@@ -16083,9 +15790,9 @@ export const MODELS = {
|
|
|
16083
15790
|
reasoning: false,
|
|
16084
15791
|
input: ["text", "image"],
|
|
16085
15792
|
cost: {
|
|
16086
|
-
input: 0.
|
|
15793
|
+
input: 0.2,
|
|
16087
15794
|
output: 0.5,
|
|
16088
|
-
cacheRead: 0.
|
|
15795
|
+
cacheRead: 0.05,
|
|
16089
15796
|
cacheWrite: 0,
|
|
16090
15797
|
},
|
|
16091
15798
|
contextWindow: 1000000,
|
|
@@ -16100,9 +15807,9 @@ export const MODELS = {
|
|
|
16100
15807
|
reasoning: true,
|
|
16101
15808
|
input: ["text", "image"],
|
|
16102
15809
|
cost: {
|
|
16103
|
-
input: 0.
|
|
15810
|
+
input: 0.2,
|
|
16104
15811
|
output: 0.5,
|
|
16105
|
-
cacheRead: 0.
|
|
15812
|
+
cacheRead: 0.05,
|
|
16106
15813
|
cacheWrite: 0,
|
|
16107
15814
|
},
|
|
16108
15815
|
contextWindow: 1000000,
|
|
@@ -16119,7 +15826,7 @@ export const MODELS = {
|
|
|
16119
15826
|
cost: {
|
|
16120
15827
|
input: 1.25,
|
|
16121
15828
|
output: 2.5,
|
|
16122
|
-
cacheRead: 0.
|
|
15829
|
+
cacheRead: 0.2,
|
|
16123
15830
|
cacheWrite: 0,
|
|
16124
15831
|
},
|
|
16125
15832
|
contextWindow: 2000000,
|
|
@@ -16136,7 +15843,7 @@ export const MODELS = {
|
|
|
16136
15843
|
cost: {
|
|
16137
15844
|
input: 1.25,
|
|
16138
15845
|
output: 2.5,
|
|
16139
|
-
cacheRead: 0.
|
|
15846
|
+
cacheRead: 0.2,
|
|
16140
15847
|
cacheWrite: 0,
|
|
16141
15848
|
},
|
|
16142
15849
|
contextWindow: 2000000,
|
|
@@ -16153,7 +15860,7 @@ export const MODELS = {
|
|
|
16153
15860
|
cost: {
|
|
16154
15861
|
input: 1.25,
|
|
16155
15862
|
output: 2.5,
|
|
16156
|
-
cacheRead: 0.
|
|
15863
|
+
cacheRead: 0.2,
|
|
16157
15864
|
cacheWrite: 0,
|
|
16158
15865
|
},
|
|
16159
15866
|
contextWindow: 2000000,
|
|
@@ -16170,7 +15877,7 @@ export const MODELS = {
|
|
|
16170
15877
|
cost: {
|
|
16171
15878
|
input: 1.25,
|
|
16172
15879
|
output: 2.5,
|
|
16173
|
-
cacheRead: 0.
|
|
15880
|
+
cacheRead: 0.2,
|
|
16174
15881
|
cacheWrite: 0,
|
|
16175
15882
|
},
|
|
16176
15883
|
contextWindow: 2000000,
|
|
@@ -16187,7 +15894,7 @@ export const MODELS = {
|
|
|
16187
15894
|
cost: {
|
|
16188
15895
|
input: 1.25,
|
|
16189
15896
|
output: 2.5,
|
|
16190
|
-
cacheRead: 0.
|
|
15897
|
+
cacheRead: 0.2,
|
|
16191
15898
|
cacheWrite: 0,
|
|
16192
15899
|
},
|
|
16193
15900
|
contextWindow: 2000000,
|
|
@@ -16204,7 +15911,7 @@ export const MODELS = {
|
|
|
16204
15911
|
cost: {
|
|
16205
15912
|
input: 1.25,
|
|
16206
15913
|
output: 2.5,
|
|
16207
|
-
cacheRead: 0.
|
|
15914
|
+
cacheRead: 0.2,
|
|
16208
15915
|
cacheWrite: 0,
|
|
16209
15916
|
},
|
|
16210
15917
|
contextWindow: 2000000,
|
|
@@ -16221,7 +15928,7 @@ export const MODELS = {
|
|
|
16221
15928
|
cost: {
|
|
16222
15929
|
input: 1.25,
|
|
16223
15930
|
output: 2.5,
|
|
16224
|
-
cacheRead: 0.
|
|
15931
|
+
cacheRead: 0.2,
|
|
16225
15932
|
cacheWrite: 0,
|
|
16226
15933
|
},
|
|
16227
15934
|
contextWindow: 1000000,
|
|
@@ -16238,7 +15945,7 @@ export const MODELS = {
|
|
|
16238
15945
|
cost: {
|
|
16239
15946
|
input: 1,
|
|
16240
15947
|
output: 2,
|
|
16241
|
-
cacheRead: 0.
|
|
15948
|
+
cacheRead: 0.2,
|
|
16242
15949
|
cacheWrite: 0,
|
|
16243
15950
|
},
|
|
16244
15951
|
contextWindow: 256000,
|
|
@@ -16253,7 +15960,7 @@ export const MODELS = {
|
|
|
16253
15960
|
reasoning: true,
|
|
16254
15961
|
input: ["text"],
|
|
16255
15962
|
cost: {
|
|
16256
|
-
input: 0.
|
|
15963
|
+
input: 0.1,
|
|
16257
15964
|
output: 0.3,
|
|
16258
15965
|
cacheRead: 0.01,
|
|
16259
15966
|
cacheWrite: 0,
|
|
@@ -16272,7 +15979,7 @@ export const MODELS = {
|
|
|
16272
15979
|
cost: {
|
|
16273
15980
|
input: 1,
|
|
16274
15981
|
output: 3,
|
|
16275
|
-
cacheRead: 0.
|
|
15982
|
+
cacheRead: 0.2,
|
|
16276
15983
|
cacheWrite: 0,
|
|
16277
15984
|
},
|
|
16278
15985
|
contextWindow: 1000000,
|
|
@@ -16338,7 +16045,7 @@ export const MODELS = {
|
|
|
16338
16045
|
reasoning: true,
|
|
16339
16046
|
input: ["text"],
|
|
16340
16047
|
cost: {
|
|
16341
|
-
input: 0.
|
|
16048
|
+
input: 0.2,
|
|
16342
16049
|
output: 1.1,
|
|
16343
16050
|
cacheRead: 0.03,
|
|
16344
16051
|
cacheWrite: 0,
|
|
@@ -16356,7 +16063,7 @@ export const MODELS = {
|
|
|
16356
16063
|
input: ["text", "image"],
|
|
16357
16064
|
cost: {
|
|
16358
16065
|
input: 0.6,
|
|
16359
|
-
output: 1.
|
|
16066
|
+
output: 1.8,
|
|
16360
16067
|
cacheRead: 0.11,
|
|
16361
16068
|
cacheWrite: 0,
|
|
16362
16069
|
},
|
|
@@ -16390,8 +16097,8 @@ export const MODELS = {
|
|
|
16390
16097
|
input: ["text", "image"],
|
|
16391
16098
|
cost: {
|
|
16392
16099
|
input: 0.3,
|
|
16393
|
-
output: 0.
|
|
16394
|
-
cacheRead: 0.
|
|
16100
|
+
output: 0.9,
|
|
16101
|
+
cacheRead: 0.05,
|
|
16395
16102
|
cacheWrite: 0,
|
|
16396
16103
|
},
|
|
16397
16104
|
contextWindow: 128000,
|
|
@@ -16441,7 +16148,7 @@ export const MODELS = {
|
|
|
16441
16148
|
input: ["text"],
|
|
16442
16149
|
cost: {
|
|
16443
16150
|
input: 0.07,
|
|
16444
|
-
output: 0.
|
|
16151
|
+
output: 0.4,
|
|
16445
16152
|
cacheRead: 0,
|
|
16446
16153
|
cacheWrite: 0,
|
|
16447
16154
|
},
|
|
@@ -16458,7 +16165,7 @@ export const MODELS = {
|
|
|
16458
16165
|
input: ["text"],
|
|
16459
16166
|
cost: {
|
|
16460
16167
|
input: 0.06,
|
|
16461
|
-
output: 0.
|
|
16168
|
+
output: 0.4,
|
|
16462
16169
|
cacheRead: 0.01,
|
|
16463
16170
|
cacheWrite: 0,
|
|
16464
16171
|
},
|
|
@@ -16475,8 +16182,8 @@ export const MODELS = {
|
|
|
16475
16182
|
input: ["text"],
|
|
16476
16183
|
cost: {
|
|
16477
16184
|
input: 1,
|
|
16478
|
-
output: 3.
|
|
16479
|
-
cacheRead: 0.
|
|
16185
|
+
output: 3.2,
|
|
16186
|
+
cacheRead: 0.2,
|
|
16480
16187
|
cacheWrite: 0,
|
|
16481
16188
|
},
|
|
16482
16189
|
contextWindow: 202800,
|
|
@@ -16746,6 +16453,24 @@ export const MODELS = {
|
|
|
16746
16453
|
contextWindow: 1048576,
|
|
16747
16454
|
maxTokens: 131072,
|
|
16748
16455
|
},
|
|
16456
|
+
"mimo-v2.5-pro-ultraspeed": {
|
|
16457
|
+
id: "mimo-v2.5-pro-ultraspeed",
|
|
16458
|
+
name: "MiMo-V2.5-Pro-UltraSpeed",
|
|
16459
|
+
api: "openai-completions",
|
|
16460
|
+
provider: "xiaomi",
|
|
16461
|
+
baseUrl: "https://api.xiaomimimo.com/v1",
|
|
16462
|
+
compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
|
|
16463
|
+
reasoning: true,
|
|
16464
|
+
input: ["text"],
|
|
16465
|
+
cost: {
|
|
16466
|
+
input: 1.305,
|
|
16467
|
+
output: 2.61,
|
|
16468
|
+
cacheRead: 0.0108,
|
|
16469
|
+
cacheWrite: 0,
|
|
16470
|
+
},
|
|
16471
|
+
contextWindow: 1048576,
|
|
16472
|
+
maxTokens: 131072,
|
|
16473
|
+
},
|
|
16749
16474
|
},
|
|
16750
16475
|
"xiaomi-token-plan-ams": {
|
|
16751
16476
|
"mimo-v2-omni": {
|
|
@@ -16820,6 +16545,24 @@ export const MODELS = {
|
|
|
16820
16545
|
contextWindow: 1048576,
|
|
16821
16546
|
maxTokens: 131072,
|
|
16822
16547
|
},
|
|
16548
|
+
"mimo-v2.5-pro-ultraspeed": {
|
|
16549
|
+
id: "mimo-v2.5-pro-ultraspeed",
|
|
16550
|
+
name: "MiMo-V2.5-Pro-UltraSpeed",
|
|
16551
|
+
api: "openai-completions",
|
|
16552
|
+
provider: "xiaomi-token-plan-ams",
|
|
16553
|
+
baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
|
|
16554
|
+
compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
|
|
16555
|
+
reasoning: true,
|
|
16556
|
+
input: ["text"],
|
|
16557
|
+
cost: {
|
|
16558
|
+
input: 1.305,
|
|
16559
|
+
output: 2.61,
|
|
16560
|
+
cacheRead: 0.0108,
|
|
16561
|
+
cacheWrite: 0,
|
|
16562
|
+
},
|
|
16563
|
+
contextWindow: 1048576,
|
|
16564
|
+
maxTokens: 131072,
|
|
16565
|
+
},
|
|
16823
16566
|
},
|
|
16824
16567
|
"xiaomi-token-plan-cn": {
|
|
16825
16568
|
"mimo-v2-omni": {
|
|
@@ -16894,6 +16637,24 @@ export const MODELS = {
|
|
|
16894
16637
|
contextWindow: 1048576,
|
|
16895
16638
|
maxTokens: 131072,
|
|
16896
16639
|
},
|
|
16640
|
+
"mimo-v2.5-pro-ultraspeed": {
|
|
16641
|
+
id: "mimo-v2.5-pro-ultraspeed",
|
|
16642
|
+
name: "MiMo-V2.5-Pro-UltraSpeed",
|
|
16643
|
+
api: "openai-completions",
|
|
16644
|
+
provider: "xiaomi-token-plan-cn",
|
|
16645
|
+
baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
|
|
16646
|
+
compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
|
|
16647
|
+
reasoning: true,
|
|
16648
|
+
input: ["text"],
|
|
16649
|
+
cost: {
|
|
16650
|
+
input: 1.305,
|
|
16651
|
+
output: 2.61,
|
|
16652
|
+
cacheRead: 0.0108,
|
|
16653
|
+
cacheWrite: 0,
|
|
16654
|
+
},
|
|
16655
|
+
contextWindow: 1048576,
|
|
16656
|
+
maxTokens: 131072,
|
|
16657
|
+
},
|
|
16897
16658
|
},
|
|
16898
16659
|
"xiaomi-token-plan-sgp": {
|
|
16899
16660
|
"mimo-v2-omni": {
|
|
@@ -16968,6 +16729,24 @@ export const MODELS = {
|
|
|
16968
16729
|
contextWindow: 1048576,
|
|
16969
16730
|
maxTokens: 131072,
|
|
16970
16731
|
},
|
|
16732
|
+
"mimo-v2.5-pro-ultraspeed": {
|
|
16733
|
+
id: "mimo-v2.5-pro-ultraspeed",
|
|
16734
|
+
name: "MiMo-V2.5-Pro-UltraSpeed",
|
|
16735
|
+
api: "openai-completions",
|
|
16736
|
+
provider: "xiaomi-token-plan-sgp",
|
|
16737
|
+
baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
|
|
16738
|
+
compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
|
|
16739
|
+
reasoning: true,
|
|
16740
|
+
input: ["text"],
|
|
16741
|
+
cost: {
|
|
16742
|
+
input: 1.305,
|
|
16743
|
+
output: 2.61,
|
|
16744
|
+
cacheRead: 0.0108,
|
|
16745
|
+
cacheWrite: 0,
|
|
16746
|
+
},
|
|
16747
|
+
contextWindow: 1048576,
|
|
16748
|
+
maxTokens: 131072,
|
|
16749
|
+
},
|
|
16971
16750
|
},
|
|
16972
16751
|
"zai": {
|
|
16973
16752
|
"glm-4.5-air": {
|