@earendil-works/pi-ai 0.74.0 → 0.74.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +76 -6
- package/dist/env-api-keys.d.ts.map +1 -1
- package/dist/env-api-keys.js +2 -1
- package/dist/env-api-keys.js.map +1 -1
- package/dist/image-models.d.ts +10 -0
- package/dist/image-models.d.ts.map +1 -0
- package/dist/image-models.generated.d.ts +440 -0
- package/dist/image-models.generated.d.ts.map +1 -0
- package/dist/image-models.generated.js +442 -0
- package/dist/image-models.generated.js.map +1 -0
- package/dist/image-models.js +23 -0
- package/dist/image-models.js.map +1 -0
- package/dist/images-api-registry.d.ts +14 -0
- package/dist/images-api-registry.d.ts.map +1 -0
- package/dist/images-api-registry.js +22 -0
- package/dist/images-api-registry.js.map +1 -0
- package/dist/images.d.ts +4 -0
- package/dist/images.d.ts.map +1 -0
- package/dist/images.js +14 -0
- package/dist/images.js.map +1 -0
- package/dist/index.d.ts +4 -0
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +4 -0
- package/dist/index.js.map +1 -1
- package/dist/models.generated.d.ts +2148 -2396
- package/dist/models.generated.d.ts.map +1 -1
- package/dist/models.generated.js +1124 -1649
- package/dist/models.generated.js.map +1 -1
- package/dist/providers/amazon-bedrock.d.ts.map +1 -1
- package/dist/providers/amazon-bedrock.js +7 -16
- package/dist/providers/amazon-bedrock.js.map +1 -1
- package/dist/providers/anthropic.d.ts.map +1 -1
- package/dist/providers/anthropic.js +15 -6
- package/dist/providers/anthropic.js.map +1 -1
- package/dist/providers/images/openrouter.d.ts +3 -0
- package/dist/providers/images/openrouter.d.ts.map +1 -0
- package/dist/providers/images/openrouter.js +129 -0
- package/dist/providers/images/openrouter.js.map +1 -0
- package/dist/providers/images/register-builtins.d.ts +4 -0
- package/dist/providers/images/register-builtins.d.ts.map +1 -0
- package/dist/providers/images/register-builtins.js +34 -0
- package/dist/providers/images/register-builtins.js.map +1 -0
- package/dist/providers/openai-codex-responses.d.ts.map +1 -1
- package/dist/providers/openai-codex-responses.js +49 -3
- package/dist/providers/openai-codex-responses.js.map +1 -1
- package/dist/providers/openai-completions.d.ts.map +1 -1
- package/dist/providers/openai-completions.js +32 -14
- package/dist/providers/openai-completions.js.map +1 -1
- package/dist/providers/simple-options.d.ts.map +1 -1
- package/dist/providers/simple-options.js +1 -1
- package/dist/providers/simple-options.js.map +1 -1
- package/dist/types.d.ts +86 -3
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js.map +1 -1
- package/dist/utils/node-http-proxy.d.ts +10 -0
- package/dist/utils/node-http-proxy.d.ts.map +1 -0
- package/dist/utils/node-http-proxy.js +97 -0
- package/dist/utils/node-http-proxy.js.map +1 -0
- package/dist/utils/overflow.d.ts +2 -1
- package/dist/utils/overflow.d.ts.map +1 -1
- package/dist/utils/overflow.js +6 -1
- package/dist/utils/overflow.js.map +1 -1
- package/package.json +6 -7
package/dist/models.generated.js
CHANGED
|
@@ -53,23 +53,6 @@ export const MODELS = {
|
|
|
53
53
|
contextWindow: 128000,
|
|
54
54
|
maxTokens: 8192,
|
|
55
55
|
},
|
|
56
|
-
"amazon.nova-premier-v1:0": {
|
|
57
|
-
id: "amazon.nova-premier-v1:0",
|
|
58
|
-
name: "Nova Premier",
|
|
59
|
-
api: "bedrock-converse-stream",
|
|
60
|
-
provider: "amazon-bedrock",
|
|
61
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
62
|
-
reasoning: true,
|
|
63
|
-
input: ["text", "image"],
|
|
64
|
-
cost: {
|
|
65
|
-
input: 2.5,
|
|
66
|
-
output: 12.5,
|
|
67
|
-
cacheRead: 0,
|
|
68
|
-
cacheWrite: 0,
|
|
69
|
-
},
|
|
70
|
-
contextWindow: 1000000,
|
|
71
|
-
maxTokens: 16384,
|
|
72
|
-
},
|
|
73
56
|
"amazon.nova-pro-v1:0": {
|
|
74
57
|
id: "amazon.nova-pro-v1:0",
|
|
75
58
|
name: "Nova Pro",
|
|
@@ -87,91 +70,6 @@ export const MODELS = {
|
|
|
87
70
|
contextWindow: 300000,
|
|
88
71
|
maxTokens: 8192,
|
|
89
72
|
},
|
|
90
|
-
"anthropic.claude-3-5-haiku-20241022-v1:0": {
|
|
91
|
-
id: "anthropic.claude-3-5-haiku-20241022-v1:0",
|
|
92
|
-
name: "Claude Haiku 3.5",
|
|
93
|
-
api: "bedrock-converse-stream",
|
|
94
|
-
provider: "amazon-bedrock",
|
|
95
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
96
|
-
reasoning: false,
|
|
97
|
-
input: ["text", "image"],
|
|
98
|
-
cost: {
|
|
99
|
-
input: 0.8,
|
|
100
|
-
output: 4,
|
|
101
|
-
cacheRead: 0.08,
|
|
102
|
-
cacheWrite: 1,
|
|
103
|
-
},
|
|
104
|
-
contextWindow: 200000,
|
|
105
|
-
maxTokens: 8192,
|
|
106
|
-
},
|
|
107
|
-
"anthropic.claude-3-5-sonnet-20240620-v1:0": {
|
|
108
|
-
id: "anthropic.claude-3-5-sonnet-20240620-v1:0",
|
|
109
|
-
name: "Claude Sonnet 3.5",
|
|
110
|
-
api: "bedrock-converse-stream",
|
|
111
|
-
provider: "amazon-bedrock",
|
|
112
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
113
|
-
reasoning: false,
|
|
114
|
-
input: ["text", "image"],
|
|
115
|
-
cost: {
|
|
116
|
-
input: 3,
|
|
117
|
-
output: 15,
|
|
118
|
-
cacheRead: 0.3,
|
|
119
|
-
cacheWrite: 3.75,
|
|
120
|
-
},
|
|
121
|
-
contextWindow: 200000,
|
|
122
|
-
maxTokens: 8192,
|
|
123
|
-
},
|
|
124
|
-
"anthropic.claude-3-5-sonnet-20241022-v2:0": {
|
|
125
|
-
id: "anthropic.claude-3-5-sonnet-20241022-v2:0",
|
|
126
|
-
name: "Claude Sonnet 3.5 v2",
|
|
127
|
-
api: "bedrock-converse-stream",
|
|
128
|
-
provider: "amazon-bedrock",
|
|
129
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
130
|
-
reasoning: false,
|
|
131
|
-
input: ["text", "image"],
|
|
132
|
-
cost: {
|
|
133
|
-
input: 3,
|
|
134
|
-
output: 15,
|
|
135
|
-
cacheRead: 0.3,
|
|
136
|
-
cacheWrite: 3.75,
|
|
137
|
-
},
|
|
138
|
-
contextWindow: 200000,
|
|
139
|
-
maxTokens: 8192,
|
|
140
|
-
},
|
|
141
|
-
"anthropic.claude-3-7-sonnet-20250219-v1:0": {
|
|
142
|
-
id: "anthropic.claude-3-7-sonnet-20250219-v1:0",
|
|
143
|
-
name: "Claude Sonnet 3.7",
|
|
144
|
-
api: "bedrock-converse-stream",
|
|
145
|
-
provider: "amazon-bedrock",
|
|
146
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
147
|
-
reasoning: false,
|
|
148
|
-
input: ["text", "image"],
|
|
149
|
-
cost: {
|
|
150
|
-
input: 3,
|
|
151
|
-
output: 15,
|
|
152
|
-
cacheRead: 0.3,
|
|
153
|
-
cacheWrite: 3.75,
|
|
154
|
-
},
|
|
155
|
-
contextWindow: 200000,
|
|
156
|
-
maxTokens: 8192,
|
|
157
|
-
},
|
|
158
|
-
"anthropic.claude-3-haiku-20240307-v1:0": {
|
|
159
|
-
id: "anthropic.claude-3-haiku-20240307-v1:0",
|
|
160
|
-
name: "Claude Haiku 3",
|
|
161
|
-
api: "bedrock-converse-stream",
|
|
162
|
-
provider: "amazon-bedrock",
|
|
163
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
164
|
-
reasoning: false,
|
|
165
|
-
input: ["text", "image"],
|
|
166
|
-
cost: {
|
|
167
|
-
input: 0.25,
|
|
168
|
-
output: 1.25,
|
|
169
|
-
cacheRead: 0,
|
|
170
|
-
cacheWrite: 0,
|
|
171
|
-
},
|
|
172
|
-
contextWindow: 200000,
|
|
173
|
-
maxTokens: 4096,
|
|
174
|
-
},
|
|
175
73
|
"anthropic.claude-haiku-4-5-20251001-v1:0": {
|
|
176
74
|
id: "anthropic.claude-haiku-4-5-20251001-v1:0",
|
|
177
75
|
name: "Claude Haiku 4.5",
|
|
@@ -206,23 +104,6 @@ export const MODELS = {
|
|
|
206
104
|
contextWindow: 200000,
|
|
207
105
|
maxTokens: 32000,
|
|
208
106
|
},
|
|
209
|
-
"anthropic.claude-opus-4-20250514-v1:0": {
|
|
210
|
-
id: "anthropic.claude-opus-4-20250514-v1:0",
|
|
211
|
-
name: "Claude Opus 4",
|
|
212
|
-
api: "bedrock-converse-stream",
|
|
213
|
-
provider: "amazon-bedrock",
|
|
214
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
215
|
-
reasoning: true,
|
|
216
|
-
input: ["text", "image"],
|
|
217
|
-
cost: {
|
|
218
|
-
input: 15,
|
|
219
|
-
output: 75,
|
|
220
|
-
cacheRead: 1.5,
|
|
221
|
-
cacheWrite: 18.75,
|
|
222
|
-
},
|
|
223
|
-
contextWindow: 200000,
|
|
224
|
-
maxTokens: 32000,
|
|
225
|
-
},
|
|
226
107
|
"anthropic.claude-opus-4-5-20251101-v1:0": {
|
|
227
108
|
id: "anthropic.claude-opus-4-5-20251101-v1:0",
|
|
228
109
|
name: "Claude Opus 4.5",
|
|
@@ -276,9 +157,9 @@ export const MODELS = {
|
|
|
276
157
|
contextWindow: 1000000,
|
|
277
158
|
maxTokens: 128000,
|
|
278
159
|
},
|
|
279
|
-
"anthropic.claude-sonnet-4-
|
|
280
|
-
id: "anthropic.claude-sonnet-4-
|
|
281
|
-
name: "Claude Sonnet 4",
|
|
160
|
+
"anthropic.claude-sonnet-4-5-20250929-v1:0": {
|
|
161
|
+
id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
|
|
162
|
+
name: "Claude Sonnet 4.5",
|
|
282
163
|
api: "bedrock-converse-stream",
|
|
283
164
|
provider: "amazon-bedrock",
|
|
284
165
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
@@ -293,9 +174,9 @@ export const MODELS = {
|
|
|
293
174
|
contextWindow: 200000,
|
|
294
175
|
maxTokens: 64000,
|
|
295
176
|
},
|
|
296
|
-
"anthropic.claude-sonnet-4-
|
|
297
|
-
id: "anthropic.claude-sonnet-4-
|
|
298
|
-
name: "Claude Sonnet 4.
|
|
177
|
+
"anthropic.claude-sonnet-4-6": {
|
|
178
|
+
id: "anthropic.claude-sonnet-4-6",
|
|
179
|
+
name: "Claude Sonnet 4.6",
|
|
299
180
|
api: "bedrock-converse-stream",
|
|
300
181
|
provider: "amazon-bedrock",
|
|
301
182
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
@@ -307,24 +188,24 @@ export const MODELS = {
|
|
|
307
188
|
cacheRead: 0.3,
|
|
308
189
|
cacheWrite: 3.75,
|
|
309
190
|
},
|
|
310
|
-
contextWindow:
|
|
191
|
+
contextWindow: 1000000,
|
|
311
192
|
maxTokens: 64000,
|
|
312
193
|
},
|
|
313
|
-
"anthropic.claude-
|
|
314
|
-
id: "anthropic.claude-
|
|
315
|
-
name: "Claude
|
|
194
|
+
"au.anthropic.claude-haiku-4-5-20251001-v1:0": {
|
|
195
|
+
id: "au.anthropic.claude-haiku-4-5-20251001-v1:0",
|
|
196
|
+
name: "Claude Haiku 4.5 (AU)",
|
|
316
197
|
api: "bedrock-converse-stream",
|
|
317
198
|
provider: "amazon-bedrock",
|
|
318
199
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
319
200
|
reasoning: true,
|
|
320
201
|
input: ["text", "image"],
|
|
321
202
|
cost: {
|
|
322
|
-
input:
|
|
323
|
-
output:
|
|
324
|
-
cacheRead: 0.
|
|
325
|
-
cacheWrite:
|
|
203
|
+
input: 1,
|
|
204
|
+
output: 5,
|
|
205
|
+
cacheRead: 0.1,
|
|
206
|
+
cacheWrite: 1.25,
|
|
326
207
|
},
|
|
327
|
-
contextWindow:
|
|
208
|
+
contextWindow: 200000,
|
|
328
209
|
maxTokens: 64000,
|
|
329
210
|
},
|
|
330
211
|
"au.anthropic.claude-opus-4-6-v1": {
|
|
@@ -345,6 +226,23 @@ export const MODELS = {
|
|
|
345
226
|
contextWindow: 1000000,
|
|
346
227
|
maxTokens: 128000,
|
|
347
228
|
},
|
|
229
|
+
"au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
|
|
230
|
+
id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
|
|
231
|
+
name: "Claude Sonnet 4.5 (AU)",
|
|
232
|
+
api: "bedrock-converse-stream",
|
|
233
|
+
provider: "amazon-bedrock",
|
|
234
|
+
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
235
|
+
reasoning: true,
|
|
236
|
+
input: ["text", "image"],
|
|
237
|
+
cost: {
|
|
238
|
+
input: 3,
|
|
239
|
+
output: 15,
|
|
240
|
+
cacheRead: 0.3,
|
|
241
|
+
cacheWrite: 3.75,
|
|
242
|
+
},
|
|
243
|
+
contextWindow: 200000,
|
|
244
|
+
maxTokens: 64000,
|
|
245
|
+
},
|
|
348
246
|
"au.anthropic.claude-sonnet-4-6": {
|
|
349
247
|
id: "au.anthropic.claude-sonnet-4-6",
|
|
350
248
|
name: "AU Anthropic Claude Sonnet 4.6",
|
|
@@ -483,23 +381,6 @@ export const MODELS = {
|
|
|
483
381
|
contextWindow: 1000000,
|
|
484
382
|
maxTokens: 128000,
|
|
485
383
|
},
|
|
486
|
-
"eu.anthropic.claude-sonnet-4-20250514-v1:0": {
|
|
487
|
-
id: "eu.anthropic.claude-sonnet-4-20250514-v1:0",
|
|
488
|
-
name: "Claude Sonnet 4 (EU)",
|
|
489
|
-
api: "bedrock-converse-stream",
|
|
490
|
-
provider: "amazon-bedrock",
|
|
491
|
-
baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
|
|
492
|
-
reasoning: true,
|
|
493
|
-
input: ["text", "image"],
|
|
494
|
-
cost: {
|
|
495
|
-
input: 3,
|
|
496
|
-
output: 15,
|
|
497
|
-
cacheRead: 0.3,
|
|
498
|
-
cacheWrite: 3.75,
|
|
499
|
-
},
|
|
500
|
-
contextWindow: 200000,
|
|
501
|
-
maxTokens: 64000,
|
|
502
|
-
},
|
|
503
384
|
"eu.anthropic.claude-sonnet-4-5-20250929-v1:0": {
|
|
504
385
|
id: "eu.anthropic.claude-sonnet-4-5-20250929-v1:0",
|
|
505
386
|
name: "Claude Sonnet 4.5 (EU)",
|
|
@@ -604,23 +485,6 @@ export const MODELS = {
|
|
|
604
485
|
contextWindow: 1000000,
|
|
605
486
|
maxTokens: 128000,
|
|
606
487
|
},
|
|
607
|
-
"global.anthropic.claude-sonnet-4-20250514-v1:0": {
|
|
608
|
-
id: "global.anthropic.claude-sonnet-4-20250514-v1:0",
|
|
609
|
-
name: "Claude Sonnet 4 (Global)",
|
|
610
|
-
api: "bedrock-converse-stream",
|
|
611
|
-
provider: "amazon-bedrock",
|
|
612
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
613
|
-
reasoning: true,
|
|
614
|
-
input: ["text", "image"],
|
|
615
|
-
cost: {
|
|
616
|
-
input: 3,
|
|
617
|
-
output: 15,
|
|
618
|
-
cacheRead: 0.3,
|
|
619
|
-
cacheWrite: 3.75,
|
|
620
|
-
},
|
|
621
|
-
contextWindow: 200000,
|
|
622
|
-
maxTokens: 64000,
|
|
623
|
-
},
|
|
624
488
|
"global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
|
|
625
489
|
id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
|
|
626
490
|
name: "Claude Sonnet 4.5 (Global)",
|
|
@@ -689,22 +553,57 @@ export const MODELS = {
|
|
|
689
553
|
contextWindow: 128000,
|
|
690
554
|
maxTokens: 4096,
|
|
691
555
|
},
|
|
692
|
-
"
|
|
693
|
-
id: "
|
|
694
|
-
name: "
|
|
556
|
+
"jp.anthropic.claude-opus-4-7": {
|
|
557
|
+
id: "jp.anthropic.claude-opus-4-7",
|
|
558
|
+
name: "Claude Opus 4.7 (JP)",
|
|
695
559
|
api: "bedrock-converse-stream",
|
|
696
560
|
provider: "amazon-bedrock",
|
|
697
561
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
698
|
-
reasoning:
|
|
699
|
-
|
|
562
|
+
reasoning: true,
|
|
563
|
+
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
564
|
+
input: ["text", "image"],
|
|
700
565
|
cost: {
|
|
701
|
-
input:
|
|
702
|
-
output:
|
|
703
|
-
cacheRead: 0,
|
|
704
|
-
cacheWrite:
|
|
566
|
+
input: 5,
|
|
567
|
+
output: 25,
|
|
568
|
+
cacheRead: 0.5,
|
|
569
|
+
cacheWrite: 6.25,
|
|
705
570
|
},
|
|
706
|
-
contextWindow:
|
|
707
|
-
maxTokens:
|
|
571
|
+
contextWindow: 1000000,
|
|
572
|
+
maxTokens: 128000,
|
|
573
|
+
},
|
|
574
|
+
"jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
|
|
575
|
+
id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
|
|
576
|
+
name: "Claude Sonnet 4.5 (JP)",
|
|
577
|
+
api: "bedrock-converse-stream",
|
|
578
|
+
provider: "amazon-bedrock",
|
|
579
|
+
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
580
|
+
reasoning: true,
|
|
581
|
+
input: ["text", "image"],
|
|
582
|
+
cost: {
|
|
583
|
+
input: 3,
|
|
584
|
+
output: 15,
|
|
585
|
+
cacheRead: 0.3,
|
|
586
|
+
cacheWrite: 3.75,
|
|
587
|
+
},
|
|
588
|
+
contextWindow: 200000,
|
|
589
|
+
maxTokens: 64000,
|
|
590
|
+
},
|
|
591
|
+
"jp.anthropic.claude-sonnet-4-6": {
|
|
592
|
+
id: "jp.anthropic.claude-sonnet-4-6",
|
|
593
|
+
name: "Claude Sonnet 4.6 (JP)",
|
|
594
|
+
api: "bedrock-converse-stream",
|
|
595
|
+
provider: "amazon-bedrock",
|
|
596
|
+
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
597
|
+
reasoning: true,
|
|
598
|
+
input: ["text", "image"],
|
|
599
|
+
cost: {
|
|
600
|
+
input: 3,
|
|
601
|
+
output: 15,
|
|
602
|
+
cacheRead: 0.3,
|
|
603
|
+
cacheWrite: 3.75,
|
|
604
|
+
},
|
|
605
|
+
contextWindow: 1000000,
|
|
606
|
+
maxTokens: 64000,
|
|
708
607
|
},
|
|
709
608
|
"meta.llama3-1-70b-instruct-v1:0": {
|
|
710
609
|
id: "meta.llama3-1-70b-instruct-v1:0",
|
|
@@ -740,128 +639,60 @@ export const MODELS = {
|
|
|
740
639
|
contextWindow: 128000,
|
|
741
640
|
maxTokens: 4096,
|
|
742
641
|
},
|
|
743
|
-
"meta.llama3-
|
|
744
|
-
id: "meta.llama3-
|
|
745
|
-
name: "Llama 3.
|
|
642
|
+
"meta.llama3-3-70b-instruct-v1:0": {
|
|
643
|
+
id: "meta.llama3-3-70b-instruct-v1:0",
|
|
644
|
+
name: "Llama 3.3 70B Instruct",
|
|
746
645
|
api: "bedrock-converse-stream",
|
|
747
646
|
provider: "amazon-bedrock",
|
|
748
647
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
749
648
|
reasoning: false,
|
|
750
|
-
input: ["text"
|
|
649
|
+
input: ["text"],
|
|
751
650
|
cost: {
|
|
752
|
-
input: 0.
|
|
753
|
-
output: 0.
|
|
651
|
+
input: 0.72,
|
|
652
|
+
output: 0.72,
|
|
754
653
|
cacheRead: 0,
|
|
755
654
|
cacheWrite: 0,
|
|
756
655
|
},
|
|
757
656
|
contextWindow: 128000,
|
|
758
657
|
maxTokens: 4096,
|
|
759
658
|
},
|
|
760
|
-
"meta.
|
|
761
|
-
id: "meta.
|
|
762
|
-
name: "Llama
|
|
659
|
+
"meta.llama4-maverick-17b-instruct-v1:0": {
|
|
660
|
+
id: "meta.llama4-maverick-17b-instruct-v1:0",
|
|
661
|
+
name: "Llama 4 Maverick 17B Instruct",
|
|
763
662
|
api: "bedrock-converse-stream",
|
|
764
663
|
provider: "amazon-bedrock",
|
|
765
664
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
766
665
|
reasoning: false,
|
|
767
|
-
input: ["text"],
|
|
666
|
+
input: ["text", "image"],
|
|
768
667
|
cost: {
|
|
769
|
-
input: 0.
|
|
770
|
-
output: 0.
|
|
668
|
+
input: 0.24,
|
|
669
|
+
output: 0.97,
|
|
771
670
|
cacheRead: 0,
|
|
772
671
|
cacheWrite: 0,
|
|
773
672
|
},
|
|
774
|
-
contextWindow:
|
|
775
|
-
maxTokens:
|
|
673
|
+
contextWindow: 1000000,
|
|
674
|
+
maxTokens: 16384,
|
|
776
675
|
},
|
|
777
|
-
"meta.
|
|
778
|
-
id: "meta.
|
|
779
|
-
name: "Llama
|
|
676
|
+
"meta.llama4-scout-17b-instruct-v1:0": {
|
|
677
|
+
id: "meta.llama4-scout-17b-instruct-v1:0",
|
|
678
|
+
name: "Llama 4 Scout 17B Instruct",
|
|
780
679
|
api: "bedrock-converse-stream",
|
|
781
680
|
provider: "amazon-bedrock",
|
|
782
681
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
783
682
|
reasoning: false,
|
|
784
|
-
input: ["text"],
|
|
683
|
+
input: ["text", "image"],
|
|
785
684
|
cost: {
|
|
786
|
-
input: 0.
|
|
787
|
-
output: 0.
|
|
685
|
+
input: 0.17,
|
|
686
|
+
output: 0.66,
|
|
788
687
|
cacheRead: 0,
|
|
789
688
|
cacheWrite: 0,
|
|
790
689
|
},
|
|
791
|
-
contextWindow:
|
|
792
|
-
maxTokens:
|
|
690
|
+
contextWindow: 3500000,
|
|
691
|
+
maxTokens: 16384,
|
|
793
692
|
},
|
|
794
|
-
"
|
|
795
|
-
id: "
|
|
796
|
-
name: "
|
|
797
|
-
api: "bedrock-converse-stream",
|
|
798
|
-
provider: "amazon-bedrock",
|
|
799
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
800
|
-
reasoning: false,
|
|
801
|
-
input: ["text", "image"],
|
|
802
|
-
cost: {
|
|
803
|
-
input: 0.72,
|
|
804
|
-
output: 0.72,
|
|
805
|
-
cacheRead: 0,
|
|
806
|
-
cacheWrite: 0,
|
|
807
|
-
},
|
|
808
|
-
contextWindow: 128000,
|
|
809
|
-
maxTokens: 4096,
|
|
810
|
-
},
|
|
811
|
-
"meta.llama3-3-70b-instruct-v1:0": {
|
|
812
|
-
id: "meta.llama3-3-70b-instruct-v1:0",
|
|
813
|
-
name: "Llama 3.3 70B Instruct",
|
|
814
|
-
api: "bedrock-converse-stream",
|
|
815
|
-
provider: "amazon-bedrock",
|
|
816
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
817
|
-
reasoning: false,
|
|
818
|
-
input: ["text"],
|
|
819
|
-
cost: {
|
|
820
|
-
input: 0.72,
|
|
821
|
-
output: 0.72,
|
|
822
|
-
cacheRead: 0,
|
|
823
|
-
cacheWrite: 0,
|
|
824
|
-
},
|
|
825
|
-
contextWindow: 128000,
|
|
826
|
-
maxTokens: 4096,
|
|
827
|
-
},
|
|
828
|
-
"meta.llama4-maverick-17b-instruct-v1:0": {
|
|
829
|
-
id: "meta.llama4-maverick-17b-instruct-v1:0",
|
|
830
|
-
name: "Llama 4 Maverick 17B Instruct",
|
|
831
|
-
api: "bedrock-converse-stream",
|
|
832
|
-
provider: "amazon-bedrock",
|
|
833
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
834
|
-
reasoning: false,
|
|
835
|
-
input: ["text", "image"],
|
|
836
|
-
cost: {
|
|
837
|
-
input: 0.24,
|
|
838
|
-
output: 0.97,
|
|
839
|
-
cacheRead: 0,
|
|
840
|
-
cacheWrite: 0,
|
|
841
|
-
},
|
|
842
|
-
contextWindow: 1000000,
|
|
843
|
-
maxTokens: 16384,
|
|
844
|
-
},
|
|
845
|
-
"meta.llama4-scout-17b-instruct-v1:0": {
|
|
846
|
-
id: "meta.llama4-scout-17b-instruct-v1:0",
|
|
847
|
-
name: "Llama 4 Scout 17B Instruct",
|
|
848
|
-
api: "bedrock-converse-stream",
|
|
849
|
-
provider: "amazon-bedrock",
|
|
850
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
851
|
-
reasoning: false,
|
|
852
|
-
input: ["text", "image"],
|
|
853
|
-
cost: {
|
|
854
|
-
input: 0.17,
|
|
855
|
-
output: 0.66,
|
|
856
|
-
cacheRead: 0,
|
|
857
|
-
cacheWrite: 0,
|
|
858
|
-
},
|
|
859
|
-
contextWindow: 3500000,
|
|
860
|
-
maxTokens: 16384,
|
|
861
|
-
},
|
|
862
|
-
"minimax.minimax-m2": {
|
|
863
|
-
id: "minimax.minimax-m2",
|
|
864
|
-
name: "MiniMax M2",
|
|
693
|
+
"minimax.minimax-m2": {
|
|
694
|
+
id: "minimax.minimax-m2",
|
|
695
|
+
name: "MiniMax M2",
|
|
865
696
|
api: "bedrock-converse-stream",
|
|
866
697
|
provider: "amazon-bedrock",
|
|
867
698
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
@@ -1077,8 +908,8 @@ export const MODELS = {
|
|
|
1077
908
|
cacheRead: 0,
|
|
1078
909
|
cacheWrite: 0,
|
|
1079
910
|
},
|
|
1080
|
-
contextWindow:
|
|
1081
|
-
maxTokens:
|
|
911
|
+
contextWindow: 262143,
|
|
912
|
+
maxTokens: 16000,
|
|
1082
913
|
},
|
|
1083
914
|
"moonshotai.kimi-k2.5": {
|
|
1084
915
|
id: "moonshotai.kimi-k2.5",
|
|
@@ -1094,8 +925,8 @@ export const MODELS = {
|
|
|
1094
925
|
cacheRead: 0,
|
|
1095
926
|
cacheWrite: 0,
|
|
1096
927
|
},
|
|
1097
|
-
contextWindow:
|
|
1098
|
-
maxTokens:
|
|
928
|
+
contextWindow: 262143,
|
|
929
|
+
maxTokens: 16000,
|
|
1099
930
|
},
|
|
1100
931
|
"nvidia.nemotron-nano-12b-v2": {
|
|
1101
932
|
id: "nvidia.nemotron-nano-12b-v2",
|
|
@@ -1180,7 +1011,7 @@ export const MODELS = {
|
|
|
1180
1011
|
cacheWrite: 0,
|
|
1181
1012
|
},
|
|
1182
1013
|
contextWindow: 128000,
|
|
1183
|
-
maxTokens:
|
|
1014
|
+
maxTokens: 16384,
|
|
1184
1015
|
},
|
|
1185
1016
|
"openai.gpt-oss-20b-1:0": {
|
|
1186
1017
|
id: "openai.gpt-oss-20b-1:0",
|
|
@@ -1197,7 +1028,7 @@ export const MODELS = {
|
|
|
1197
1028
|
cacheWrite: 0,
|
|
1198
1029
|
},
|
|
1199
1030
|
contextWindow: 128000,
|
|
1200
|
-
maxTokens:
|
|
1031
|
+
maxTokens: 16384,
|
|
1201
1032
|
},
|
|
1202
1033
|
"openai.gpt-oss-safeguard-120b": {
|
|
1203
1034
|
id: "openai.gpt-oss-safeguard-120b",
|
|
@@ -1214,7 +1045,7 @@ export const MODELS = {
|
|
|
1214
1045
|
cacheWrite: 0,
|
|
1215
1046
|
},
|
|
1216
1047
|
contextWindow: 128000,
|
|
1217
|
-
maxTokens:
|
|
1048
|
+
maxTokens: 16384,
|
|
1218
1049
|
},
|
|
1219
1050
|
"openai.gpt-oss-safeguard-20b": {
|
|
1220
1051
|
id: "openai.gpt-oss-safeguard-20b",
|
|
@@ -1231,7 +1062,7 @@ export const MODELS = {
|
|
|
1231
1062
|
cacheWrite: 0,
|
|
1232
1063
|
},
|
|
1233
1064
|
contextWindow: 128000,
|
|
1234
|
-
maxTokens:
|
|
1065
|
+
maxTokens: 16384,
|
|
1235
1066
|
},
|
|
1236
1067
|
"qwen.qwen3-235b-a22b-2507-v1:0": {
|
|
1237
1068
|
id: "qwen.qwen3-235b-a22b-2507-v1:0",
|
|
@@ -1386,23 +1217,6 @@ export const MODELS = {
|
|
|
1386
1217
|
contextWindow: 200000,
|
|
1387
1218
|
maxTokens: 32000,
|
|
1388
1219
|
},
|
|
1389
|
-
"us.anthropic.claude-opus-4-20250514-v1:0": {
|
|
1390
|
-
id: "us.anthropic.claude-opus-4-20250514-v1:0",
|
|
1391
|
-
name: "Claude Opus 4 (US)",
|
|
1392
|
-
api: "bedrock-converse-stream",
|
|
1393
|
-
provider: "amazon-bedrock",
|
|
1394
|
-
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
1395
|
-
reasoning: true,
|
|
1396
|
-
input: ["text", "image"],
|
|
1397
|
-
cost: {
|
|
1398
|
-
input: 15,
|
|
1399
|
-
output: 75,
|
|
1400
|
-
cacheRead: 1.5,
|
|
1401
|
-
cacheWrite: 18.75,
|
|
1402
|
-
},
|
|
1403
|
-
contextWindow: 200000,
|
|
1404
|
-
maxTokens: 32000,
|
|
1405
|
-
},
|
|
1406
1220
|
"us.anthropic.claude-opus-4-5-20251101-v1:0": {
|
|
1407
1221
|
id: "us.anthropic.claude-opus-4-5-20251101-v1:0",
|
|
1408
1222
|
name: "Claude Opus 4.5 (US)",
|
|
@@ -1456,9 +1270,9 @@ export const MODELS = {
|
|
|
1456
1270
|
contextWindow: 1000000,
|
|
1457
1271
|
maxTokens: 128000,
|
|
1458
1272
|
},
|
|
1459
|
-
"us.anthropic.claude-sonnet-4-
|
|
1460
|
-
id: "us.anthropic.claude-sonnet-4-
|
|
1461
|
-
name: "Claude Sonnet 4 (US)",
|
|
1273
|
+
"us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
|
|
1274
|
+
id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
|
|
1275
|
+
name: "Claude Sonnet 4.5 (US)",
|
|
1462
1276
|
api: "bedrock-converse-stream",
|
|
1463
1277
|
provider: "amazon-bedrock",
|
|
1464
1278
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
@@ -1473,9 +1287,9 @@ export const MODELS = {
|
|
|
1473
1287
|
contextWindow: 200000,
|
|
1474
1288
|
maxTokens: 64000,
|
|
1475
1289
|
},
|
|
1476
|
-
"us.anthropic.claude-sonnet-4-
|
|
1477
|
-
id: "us.anthropic.claude-sonnet-4-
|
|
1478
|
-
name: "Claude Sonnet 4.
|
|
1290
|
+
"us.anthropic.claude-sonnet-4-6": {
|
|
1291
|
+
id: "us.anthropic.claude-sonnet-4-6",
|
|
1292
|
+
name: "Claude Sonnet 4.6 (US)",
|
|
1479
1293
|
api: "bedrock-converse-stream",
|
|
1480
1294
|
provider: "amazon-bedrock",
|
|
1481
1295
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
@@ -1487,25 +1301,59 @@ export const MODELS = {
|
|
|
1487
1301
|
cacheRead: 0.3,
|
|
1488
1302
|
cacheWrite: 3.75,
|
|
1489
1303
|
},
|
|
1490
|
-
contextWindow:
|
|
1304
|
+
contextWindow: 1000000,
|
|
1491
1305
|
maxTokens: 64000,
|
|
1492
1306
|
},
|
|
1493
|
-
"us.
|
|
1494
|
-
id: "us.
|
|
1495
|
-
name: "
|
|
1307
|
+
"us.deepseek.r1-v1:0": {
|
|
1308
|
+
id: "us.deepseek.r1-v1:0",
|
|
1309
|
+
name: "DeepSeek-R1 (US)",
|
|
1496
1310
|
api: "bedrock-converse-stream",
|
|
1497
1311
|
provider: "amazon-bedrock",
|
|
1498
1312
|
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
1499
1313
|
reasoning: true,
|
|
1314
|
+
input: ["text"],
|
|
1315
|
+
cost: {
|
|
1316
|
+
input: 1.35,
|
|
1317
|
+
output: 5.4,
|
|
1318
|
+
cacheRead: 0,
|
|
1319
|
+
cacheWrite: 0,
|
|
1320
|
+
},
|
|
1321
|
+
contextWindow: 128000,
|
|
1322
|
+
maxTokens: 32768,
|
|
1323
|
+
},
|
|
1324
|
+
"us.meta.llama4-maverick-17b-instruct-v1:0": {
|
|
1325
|
+
id: "us.meta.llama4-maverick-17b-instruct-v1:0",
|
|
1326
|
+
name: "Llama 4 Maverick 17B Instruct (US)",
|
|
1327
|
+
api: "bedrock-converse-stream",
|
|
1328
|
+
provider: "amazon-bedrock",
|
|
1329
|
+
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
1330
|
+
reasoning: false,
|
|
1500
1331
|
input: ["text", "image"],
|
|
1501
1332
|
cost: {
|
|
1502
|
-
input:
|
|
1503
|
-
output:
|
|
1504
|
-
cacheRead: 0
|
|
1505
|
-
cacheWrite:
|
|
1333
|
+
input: 0.24,
|
|
1334
|
+
output: 0.97,
|
|
1335
|
+
cacheRead: 0,
|
|
1336
|
+
cacheWrite: 0,
|
|
1506
1337
|
},
|
|
1507
1338
|
contextWindow: 1000000,
|
|
1508
|
-
maxTokens:
|
|
1339
|
+
maxTokens: 16384,
|
|
1340
|
+
},
|
|
1341
|
+
"us.meta.llama4-scout-17b-instruct-v1:0": {
|
|
1342
|
+
id: "us.meta.llama4-scout-17b-instruct-v1:0",
|
|
1343
|
+
name: "Llama 4 Scout 17B Instruct (US)",
|
|
1344
|
+
api: "bedrock-converse-stream",
|
|
1345
|
+
provider: "amazon-bedrock",
|
|
1346
|
+
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
1347
|
+
reasoning: false,
|
|
1348
|
+
input: ["text", "image"],
|
|
1349
|
+
cost: {
|
|
1350
|
+
input: 0.17,
|
|
1351
|
+
output: 0.66,
|
|
1352
|
+
cacheRead: 0,
|
|
1353
|
+
cacheWrite: 0,
|
|
1354
|
+
},
|
|
1355
|
+
contextWindow: 3500000,
|
|
1356
|
+
maxTokens: 16384,
|
|
1509
1357
|
},
|
|
1510
1358
|
"writer.palmyra-x4-v1:0": {
|
|
1511
1359
|
id: "writer.palmyra-x4-v1:0",
|
|
@@ -3427,6 +3275,42 @@ export const MODELS = {
|
|
|
3427
3275
|
contextWindow: 256000,
|
|
3428
3276
|
maxTokens: 16384,
|
|
3429
3277
|
},
|
|
3278
|
+
"@cf/ibm-granite/granite-4.0-h-micro": {
|
|
3279
|
+
id: "@cf/ibm-granite/granite-4.0-h-micro",
|
|
3280
|
+
name: "Granite 4.0 H Micro",
|
|
3281
|
+
api: "openai-completions",
|
|
3282
|
+
provider: "cloudflare-workers-ai",
|
|
3283
|
+
baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
|
|
3284
|
+
compat: { "sendSessionAffinityHeaders": true },
|
|
3285
|
+
reasoning: false,
|
|
3286
|
+
input: ["text"],
|
|
3287
|
+
cost: {
|
|
3288
|
+
input: 0.017,
|
|
3289
|
+
output: 0.112,
|
|
3290
|
+
cacheRead: 0,
|
|
3291
|
+
cacheWrite: 0,
|
|
3292
|
+
},
|
|
3293
|
+
contextWindow: 131000,
|
|
3294
|
+
maxTokens: 131000,
|
|
3295
|
+
},
|
|
3296
|
+
"@cf/meta/llama-3.3-70b-instruct-fp8-fast": {
|
|
3297
|
+
id: "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
|
|
3298
|
+
name: "Llama 3.3 70B Instruct fp8 Fast",
|
|
3299
|
+
api: "openai-completions",
|
|
3300
|
+
provider: "cloudflare-workers-ai",
|
|
3301
|
+
baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
|
|
3302
|
+
compat: { "sendSessionAffinityHeaders": true },
|
|
3303
|
+
reasoning: false,
|
|
3304
|
+
input: ["text"],
|
|
3305
|
+
cost: {
|
|
3306
|
+
input: 0.293,
|
|
3307
|
+
output: 2.253,
|
|
3308
|
+
cacheRead: 0,
|
|
3309
|
+
cacheWrite: 0,
|
|
3310
|
+
},
|
|
3311
|
+
contextWindow: 24000,
|
|
3312
|
+
maxTokens: 24000,
|
|
3313
|
+
},
|
|
3430
3314
|
"@cf/meta/llama-4-scout-17b-16e-instruct": {
|
|
3431
3315
|
id: "@cf/meta/llama-4-scout-17b-16e-instruct",
|
|
3432
3316
|
name: "Llama 4 Scout 17B 16E Instruct",
|
|
@@ -3442,9 +3326,27 @@ export const MODELS = {
|
|
|
3442
3326
|
cacheRead: 0,
|
|
3443
3327
|
cacheWrite: 0,
|
|
3444
3328
|
},
|
|
3445
|
-
contextWindow:
|
|
3329
|
+
contextWindow: 131000,
|
|
3446
3330
|
maxTokens: 16384,
|
|
3447
3331
|
},
|
|
3332
|
+
"@cf/mistralai/mistral-small-3.1-24b-instruct": {
|
|
3333
|
+
id: "@cf/mistralai/mistral-small-3.1-24b-instruct",
|
|
3334
|
+
name: "Mistral Small 3.1 24B Instruct",
|
|
3335
|
+
api: "openai-completions",
|
|
3336
|
+
provider: "cloudflare-workers-ai",
|
|
3337
|
+
baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
|
|
3338
|
+
compat: { "sendSessionAffinityHeaders": true },
|
|
3339
|
+
reasoning: false,
|
|
3340
|
+
input: ["text"],
|
|
3341
|
+
cost: {
|
|
3342
|
+
input: 0.351,
|
|
3343
|
+
output: 0.555,
|
|
3344
|
+
cacheRead: 0,
|
|
3345
|
+
cacheWrite: 0,
|
|
3346
|
+
},
|
|
3347
|
+
contextWindow: 128000,
|
|
3348
|
+
maxTokens: 128000,
|
|
3349
|
+
},
|
|
3448
3350
|
"@cf/moonshotai/kimi-k2.5": {
|
|
3449
3351
|
id: "@cf/moonshotai/kimi-k2.5",
|
|
3450
3352
|
name: "Kimi K2.5",
|
|
@@ -3478,7 +3380,7 @@ export const MODELS = {
|
|
|
3478
3380
|
cacheRead: 0.16,
|
|
3479
3381
|
cacheWrite: 0,
|
|
3480
3382
|
},
|
|
3481
|
-
contextWindow:
|
|
3383
|
+
contextWindow: 262144,
|
|
3482
3384
|
maxTokens: 256000,
|
|
3483
3385
|
},
|
|
3484
3386
|
"@cf/nvidia/nemotron-3-120b-a12b": {
|
|
@@ -3535,6 +3437,24 @@ export const MODELS = {
|
|
|
3535
3437
|
contextWindow: 128000,
|
|
3536
3438
|
maxTokens: 16384,
|
|
3537
3439
|
},
|
|
3440
|
+
"@cf/qwen/qwen3-30b-a3b-fp8": {
|
|
3441
|
+
id: "@cf/qwen/qwen3-30b-a3b-fp8",
|
|
3442
|
+
name: "Qwen3 30B A3b fp8",
|
|
3443
|
+
api: "openai-completions",
|
|
3444
|
+
provider: "cloudflare-workers-ai",
|
|
3445
|
+
baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
|
|
3446
|
+
compat: { "sendSessionAffinityHeaders": true },
|
|
3447
|
+
reasoning: true,
|
|
3448
|
+
input: ["text"],
|
|
3449
|
+
cost: {
|
|
3450
|
+
input: 0.0509,
|
|
3451
|
+
output: 0.335,
|
|
3452
|
+
cacheRead: 0,
|
|
3453
|
+
cacheWrite: 0,
|
|
3454
|
+
},
|
|
3455
|
+
contextWindow: 32768,
|
|
3456
|
+
maxTokens: 32768,
|
|
3457
|
+
},
|
|
3538
3458
|
"@cf/zai-org/glm-4.7-flash": {
|
|
3539
3459
|
id: "@cf/zai-org/glm-4.7-flash",
|
|
3540
3460
|
name: "GLM-4.7-Flash",
|
|
@@ -3545,7 +3465,7 @@ export const MODELS = {
|
|
|
3545
3465
|
reasoning: true,
|
|
3546
3466
|
input: ["text"],
|
|
3547
3467
|
cost: {
|
|
3548
|
-
input: 0.
|
|
3468
|
+
input: 0.0605,
|
|
3549
3469
|
output: 0.4,
|
|
3550
3470
|
cacheRead: 0,
|
|
3551
3471
|
cacheWrite: 0,
|
|
@@ -3601,6 +3521,7 @@ export const MODELS = {
|
|
|
3601
3521
|
api: "anthropic-messages",
|
|
3602
3522
|
provider: "fireworks",
|
|
3603
3523
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3524
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3604
3525
|
reasoning: true,
|
|
3605
3526
|
input: ["text"],
|
|
3606
3527
|
cost: {
|
|
@@ -3618,6 +3539,7 @@ export const MODELS = {
|
|
|
3618
3539
|
api: "anthropic-messages",
|
|
3619
3540
|
provider: "fireworks",
|
|
3620
3541
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3542
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3621
3543
|
reasoning: true,
|
|
3622
3544
|
input: ["text"],
|
|
3623
3545
|
cost: {
|
|
@@ -3629,12 +3551,31 @@ export const MODELS = {
|
|
|
3629
3551
|
contextWindow: 160000,
|
|
3630
3552
|
maxTokens: 160000,
|
|
3631
3553
|
},
|
|
3554
|
+
"accounts/fireworks/models/deepseek-v4-flash": {
|
|
3555
|
+
id: "accounts/fireworks/models/deepseek-v4-flash",
|
|
3556
|
+
name: "DeepSeek V4 Flash",
|
|
3557
|
+
api: "anthropic-messages",
|
|
3558
|
+
provider: "fireworks",
|
|
3559
|
+
baseUrl: "https://api.fireworks.ai/inference",
|
|
3560
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3561
|
+
reasoning: true,
|
|
3562
|
+
input: ["text"],
|
|
3563
|
+
cost: {
|
|
3564
|
+
input: 0.14,
|
|
3565
|
+
output: 0.28,
|
|
3566
|
+
cacheRead: 0.03,
|
|
3567
|
+
cacheWrite: 0,
|
|
3568
|
+
},
|
|
3569
|
+
contextWindow: 1000000,
|
|
3570
|
+
maxTokens: 384000,
|
|
3571
|
+
},
|
|
3632
3572
|
"accounts/fireworks/models/deepseek-v4-pro": {
|
|
3633
3573
|
id: "accounts/fireworks/models/deepseek-v4-pro",
|
|
3634
3574
|
name: "DeepSeek V4 Pro",
|
|
3635
3575
|
api: "anthropic-messages",
|
|
3636
3576
|
provider: "fireworks",
|
|
3637
3577
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3578
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3638
3579
|
reasoning: true,
|
|
3639
3580
|
input: ["text"],
|
|
3640
3581
|
cost: {
|
|
@@ -3652,6 +3593,7 @@ export const MODELS = {
|
|
|
3652
3593
|
api: "anthropic-messages",
|
|
3653
3594
|
provider: "fireworks",
|
|
3654
3595
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3596
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3655
3597
|
reasoning: true,
|
|
3656
3598
|
input: ["text"],
|
|
3657
3599
|
cost: {
|
|
@@ -3669,6 +3611,7 @@ export const MODELS = {
|
|
|
3669
3611
|
api: "anthropic-messages",
|
|
3670
3612
|
provider: "fireworks",
|
|
3671
3613
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3614
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3672
3615
|
reasoning: true,
|
|
3673
3616
|
input: ["text"],
|
|
3674
3617
|
cost: {
|
|
@@ -3686,6 +3629,7 @@ export const MODELS = {
|
|
|
3686
3629
|
api: "anthropic-messages",
|
|
3687
3630
|
provider: "fireworks",
|
|
3688
3631
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3632
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3689
3633
|
reasoning: true,
|
|
3690
3634
|
input: ["text"],
|
|
3691
3635
|
cost: {
|
|
@@ -3703,6 +3647,7 @@ export const MODELS = {
|
|
|
3703
3647
|
api: "anthropic-messages",
|
|
3704
3648
|
provider: "fireworks",
|
|
3705
3649
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3650
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3706
3651
|
reasoning: true,
|
|
3707
3652
|
input: ["text"],
|
|
3708
3653
|
cost: {
|
|
@@ -3720,6 +3665,7 @@ export const MODELS = {
|
|
|
3720
3665
|
api: "anthropic-messages",
|
|
3721
3666
|
provider: "fireworks",
|
|
3722
3667
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3668
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3723
3669
|
reasoning: true,
|
|
3724
3670
|
input: ["text"],
|
|
3725
3671
|
cost: {
|
|
@@ -3737,6 +3683,7 @@ export const MODELS = {
|
|
|
3737
3683
|
api: "anthropic-messages",
|
|
3738
3684
|
provider: "fireworks",
|
|
3739
3685
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3686
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3740
3687
|
reasoning: true,
|
|
3741
3688
|
input: ["text"],
|
|
3742
3689
|
cost: {
|
|
@@ -3754,6 +3701,7 @@ export const MODELS = {
|
|
|
3754
3701
|
api: "anthropic-messages",
|
|
3755
3702
|
provider: "fireworks",
|
|
3756
3703
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3704
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3757
3705
|
reasoning: true,
|
|
3758
3706
|
input: ["text"],
|
|
3759
3707
|
cost: {
|
|
@@ -3771,6 +3719,7 @@ export const MODELS = {
|
|
|
3771
3719
|
api: "anthropic-messages",
|
|
3772
3720
|
provider: "fireworks",
|
|
3773
3721
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3722
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3774
3723
|
reasoning: false,
|
|
3775
3724
|
input: ["text"],
|
|
3776
3725
|
cost: {
|
|
@@ -3788,6 +3737,7 @@ export const MODELS = {
|
|
|
3788
3737
|
api: "anthropic-messages",
|
|
3789
3738
|
provider: "fireworks",
|
|
3790
3739
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3740
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3791
3741
|
reasoning: true,
|
|
3792
3742
|
input: ["text"],
|
|
3793
3743
|
cost: {
|
|
@@ -3805,6 +3755,7 @@ export const MODELS = {
|
|
|
3805
3755
|
api: "anthropic-messages",
|
|
3806
3756
|
provider: "fireworks",
|
|
3807
3757
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3758
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3808
3759
|
reasoning: true,
|
|
3809
3760
|
input: ["text", "image"],
|
|
3810
3761
|
cost: {
|
|
@@ -3822,6 +3773,7 @@ export const MODELS = {
|
|
|
3822
3773
|
api: "anthropic-messages",
|
|
3823
3774
|
provider: "fireworks",
|
|
3824
3775
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3776
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3825
3777
|
reasoning: true,
|
|
3826
3778
|
input: ["text", "image"],
|
|
3827
3779
|
cost: {
|
|
@@ -3839,6 +3791,7 @@ export const MODELS = {
|
|
|
3839
3791
|
api: "anthropic-messages",
|
|
3840
3792
|
provider: "fireworks",
|
|
3841
3793
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3794
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3842
3795
|
reasoning: true,
|
|
3843
3796
|
input: ["text"],
|
|
3844
3797
|
cost: {
|
|
@@ -3856,6 +3809,7 @@ export const MODELS = {
|
|
|
3856
3809
|
api: "anthropic-messages",
|
|
3857
3810
|
provider: "fireworks",
|
|
3858
3811
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3812
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3859
3813
|
reasoning: true,
|
|
3860
3814
|
input: ["text"],
|
|
3861
3815
|
cost: {
|
|
@@ -3873,6 +3827,7 @@ export const MODELS = {
|
|
|
3873
3827
|
api: "anthropic-messages",
|
|
3874
3828
|
provider: "fireworks",
|
|
3875
3829
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3830
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3876
3831
|
reasoning: true,
|
|
3877
3832
|
input: ["text"],
|
|
3878
3833
|
cost: {
|
|
@@ -3890,6 +3845,7 @@ export const MODELS = {
|
|
|
3890
3845
|
api: "anthropic-messages",
|
|
3891
3846
|
provider: "fireworks",
|
|
3892
3847
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3848
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3893
3849
|
reasoning: true,
|
|
3894
3850
|
input: ["text", "image"],
|
|
3895
3851
|
cost: {
|
|
@@ -3907,6 +3863,7 @@ export const MODELS = {
|
|
|
3907
3863
|
api: "anthropic-messages",
|
|
3908
3864
|
provider: "fireworks",
|
|
3909
3865
|
baseUrl: "https://api.fireworks.ai/inference",
|
|
3866
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3910
3867
|
reasoning: true,
|
|
3911
3868
|
input: ["text", "image"],
|
|
3912
3869
|
cost: {
|
|
@@ -3995,25 +3952,6 @@ export const MODELS = {
|
|
|
3995
3952
|
contextWindow: 144000,
|
|
3996
3953
|
maxTokens: 64000,
|
|
3997
3954
|
},
|
|
3998
|
-
"claude-sonnet-4": {
|
|
3999
|
-
id: "claude-sonnet-4",
|
|
4000
|
-
name: "Claude Sonnet 4",
|
|
4001
|
-
api: "anthropic-messages",
|
|
4002
|
-
provider: "github-copilot",
|
|
4003
|
-
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4004
|
-
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4005
|
-
compat: { "supportsEagerToolInputStreaming": false },
|
|
4006
|
-
reasoning: true,
|
|
4007
|
-
input: ["text", "image"],
|
|
4008
|
-
cost: {
|
|
4009
|
-
input: 0,
|
|
4010
|
-
output: 0,
|
|
4011
|
-
cacheRead: 0,
|
|
4012
|
-
cacheWrite: 0,
|
|
4013
|
-
},
|
|
4014
|
-
contextWindow: 216000,
|
|
4015
|
-
maxTokens: 16000,
|
|
4016
|
-
},
|
|
4017
3955
|
"claude-sonnet-4.5": {
|
|
4018
3956
|
id: "claude-sonnet-4.5",
|
|
4019
3957
|
name: "Claude Sonnet 4.5",
|
|
@@ -4089,25 +4027,6 @@ export const MODELS = {
|
|
|
4089
4027
|
contextWindow: 128000,
|
|
4090
4028
|
maxTokens: 64000,
|
|
4091
4029
|
},
|
|
4092
|
-
"gemini-3-pro-preview": {
|
|
4093
|
-
id: "gemini-3-pro-preview",
|
|
4094
|
-
name: "Gemini 3 Pro Preview",
|
|
4095
|
-
api: "openai-completions",
|
|
4096
|
-
provider: "github-copilot",
|
|
4097
|
-
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4098
|
-
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4099
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
|
|
4100
|
-
reasoning: true,
|
|
4101
|
-
input: ["text", "image"],
|
|
4102
|
-
cost: {
|
|
4103
|
-
input: 0,
|
|
4104
|
-
output: 0,
|
|
4105
|
-
cacheRead: 0,
|
|
4106
|
-
cacheWrite: 0,
|
|
4107
|
-
},
|
|
4108
|
-
contextWindow: 128000,
|
|
4109
|
-
maxTokens: 64000,
|
|
4110
|
-
},
|
|
4111
4030
|
"gemini-3.1-pro-preview": {
|
|
4112
4031
|
id: "gemini-3.1-pro-preview",
|
|
4113
4032
|
name: "Gemini 3.1 Pro Preview",
|
|
@@ -4165,25 +4084,6 @@ export const MODELS = {
|
|
|
4165
4084
|
contextWindow: 128000,
|
|
4166
4085
|
maxTokens: 4096,
|
|
4167
4086
|
},
|
|
4168
|
-
"gpt-5": {
|
|
4169
|
-
id: "gpt-5",
|
|
4170
|
-
name: "GPT-5",
|
|
4171
|
-
api: "openai-responses",
|
|
4172
|
-
provider: "github-copilot",
|
|
4173
|
-
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4174
|
-
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4175
|
-
reasoning: true,
|
|
4176
|
-
thinkingLevelMap: { "off": null },
|
|
4177
|
-
input: ["text", "image"],
|
|
4178
|
-
cost: {
|
|
4179
|
-
input: 0,
|
|
4180
|
-
output: 0,
|
|
4181
|
-
cacheRead: 0,
|
|
4182
|
-
cacheWrite: 0,
|
|
4183
|
-
},
|
|
4184
|
-
contextWindow: 128000,
|
|
4185
|
-
maxTokens: 128000,
|
|
4186
|
-
},
|
|
4187
4087
|
"gpt-5-mini": {
|
|
4188
4088
|
id: "gpt-5-mini",
|
|
4189
4089
|
name: "GPT-5-mini",
|
|
@@ -4203,82 +4103,6 @@ export const MODELS = {
|
|
|
4203
4103
|
contextWindow: 264000,
|
|
4204
4104
|
maxTokens: 64000,
|
|
4205
4105
|
},
|
|
4206
|
-
"gpt-5.1": {
|
|
4207
|
-
id: "gpt-5.1",
|
|
4208
|
-
name: "GPT-5.1",
|
|
4209
|
-
api: "openai-responses",
|
|
4210
|
-
provider: "github-copilot",
|
|
4211
|
-
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4212
|
-
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4213
|
-
reasoning: true,
|
|
4214
|
-
thinkingLevelMap: { "off": null },
|
|
4215
|
-
input: ["text", "image"],
|
|
4216
|
-
cost: {
|
|
4217
|
-
input: 0,
|
|
4218
|
-
output: 0,
|
|
4219
|
-
cacheRead: 0,
|
|
4220
|
-
cacheWrite: 0,
|
|
4221
|
-
},
|
|
4222
|
-
contextWindow: 264000,
|
|
4223
|
-
maxTokens: 64000,
|
|
4224
|
-
},
|
|
4225
|
-
"gpt-5.1-codex": {
|
|
4226
|
-
id: "gpt-5.1-codex",
|
|
4227
|
-
name: "GPT-5.1-Codex",
|
|
4228
|
-
api: "openai-responses",
|
|
4229
|
-
provider: "github-copilot",
|
|
4230
|
-
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4231
|
-
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4232
|
-
reasoning: true,
|
|
4233
|
-
thinkingLevelMap: { "off": null },
|
|
4234
|
-
input: ["text", "image"],
|
|
4235
|
-
cost: {
|
|
4236
|
-
input: 0,
|
|
4237
|
-
output: 0,
|
|
4238
|
-
cacheRead: 0,
|
|
4239
|
-
cacheWrite: 0,
|
|
4240
|
-
},
|
|
4241
|
-
contextWindow: 400000,
|
|
4242
|
-
maxTokens: 128000,
|
|
4243
|
-
},
|
|
4244
|
-
"gpt-5.1-codex-max": {
|
|
4245
|
-
id: "gpt-5.1-codex-max",
|
|
4246
|
-
name: "GPT-5.1-Codex-max",
|
|
4247
|
-
api: "openai-responses",
|
|
4248
|
-
provider: "github-copilot",
|
|
4249
|
-
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4250
|
-
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4251
|
-
reasoning: true,
|
|
4252
|
-
thinkingLevelMap: { "off": null },
|
|
4253
|
-
input: ["text", "image"],
|
|
4254
|
-
cost: {
|
|
4255
|
-
input: 0,
|
|
4256
|
-
output: 0,
|
|
4257
|
-
cacheRead: 0,
|
|
4258
|
-
cacheWrite: 0,
|
|
4259
|
-
},
|
|
4260
|
-
contextWindow: 400000,
|
|
4261
|
-
maxTokens: 128000,
|
|
4262
|
-
},
|
|
4263
|
-
"gpt-5.1-codex-mini": {
|
|
4264
|
-
id: "gpt-5.1-codex-mini",
|
|
4265
|
-
name: "GPT-5.1-Codex-mini",
|
|
4266
|
-
api: "openai-responses",
|
|
4267
|
-
provider: "github-copilot",
|
|
4268
|
-
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4269
|
-
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4270
|
-
reasoning: true,
|
|
4271
|
-
thinkingLevelMap: { "off": null },
|
|
4272
|
-
input: ["text", "image"],
|
|
4273
|
-
cost: {
|
|
4274
|
-
input: 0,
|
|
4275
|
-
output: 0,
|
|
4276
|
-
cacheRead: 0,
|
|
4277
|
-
cacheWrite: 0,
|
|
4278
|
-
},
|
|
4279
|
-
contextWindow: 400000,
|
|
4280
|
-
maxTokens: 128000,
|
|
4281
|
-
},
|
|
4282
4106
|
"gpt-5.2": {
|
|
4283
4107
|
id: "gpt-5.2",
|
|
4284
4108
|
name: "GPT-5.2",
|
|
@@ -4414,57 +4238,6 @@ export const MODELS = {
|
|
|
4414
4238
|
},
|
|
4415
4239
|
},
|
|
4416
4240
|
"google": {
|
|
4417
|
-
"gemini-1.5-flash": {
|
|
4418
|
-
id: "gemini-1.5-flash",
|
|
4419
|
-
name: "Gemini 1.5 Flash",
|
|
4420
|
-
api: "google-generative-ai",
|
|
4421
|
-
provider: "google",
|
|
4422
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4423
|
-
reasoning: false,
|
|
4424
|
-
input: ["text", "image"],
|
|
4425
|
-
cost: {
|
|
4426
|
-
input: 0.075,
|
|
4427
|
-
output: 0.3,
|
|
4428
|
-
cacheRead: 0.01875,
|
|
4429
|
-
cacheWrite: 0,
|
|
4430
|
-
},
|
|
4431
|
-
contextWindow: 1000000,
|
|
4432
|
-
maxTokens: 8192,
|
|
4433
|
-
},
|
|
4434
|
-
"gemini-1.5-flash-8b": {
|
|
4435
|
-
id: "gemini-1.5-flash-8b",
|
|
4436
|
-
name: "Gemini 1.5 Flash-8B",
|
|
4437
|
-
api: "google-generative-ai",
|
|
4438
|
-
provider: "google",
|
|
4439
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4440
|
-
reasoning: false,
|
|
4441
|
-
input: ["text", "image"],
|
|
4442
|
-
cost: {
|
|
4443
|
-
input: 0.0375,
|
|
4444
|
-
output: 0.15,
|
|
4445
|
-
cacheRead: 0.01,
|
|
4446
|
-
cacheWrite: 0,
|
|
4447
|
-
},
|
|
4448
|
-
contextWindow: 1000000,
|
|
4449
|
-
maxTokens: 8192,
|
|
4450
|
-
},
|
|
4451
|
-
"gemini-1.5-pro": {
|
|
4452
|
-
id: "gemini-1.5-pro",
|
|
4453
|
-
name: "Gemini 1.5 Pro",
|
|
4454
|
-
api: "google-generative-ai",
|
|
4455
|
-
provider: "google",
|
|
4456
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4457
|
-
reasoning: false,
|
|
4458
|
-
input: ["text", "image"],
|
|
4459
|
-
cost: {
|
|
4460
|
-
input: 1.25,
|
|
4461
|
-
output: 5,
|
|
4462
|
-
cacheRead: 0.3125,
|
|
4463
|
-
cacheWrite: 0,
|
|
4464
|
-
},
|
|
4465
|
-
contextWindow: 1000000,
|
|
4466
|
-
maxTokens: 8192,
|
|
4467
|
-
},
|
|
4468
4241
|
"gemini-2.0-flash": {
|
|
4469
4242
|
id: "gemini-2.0-flash",
|
|
4470
4243
|
name: "Gemini 2.0 Flash",
|
|
@@ -4484,7 +4257,7 @@ export const MODELS = {
|
|
|
4484
4257
|
},
|
|
4485
4258
|
"gemini-2.0-flash-lite": {
|
|
4486
4259
|
id: "gemini-2.0-flash-lite",
|
|
4487
|
-
name: "Gemini 2.0 Flash
|
|
4260
|
+
name: "Gemini 2.0 Flash-Lite",
|
|
4488
4261
|
api: "google-generative-ai",
|
|
4489
4262
|
provider: "google",
|
|
4490
4263
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
@@ -4518,7 +4291,7 @@ export const MODELS = {
|
|
|
4518
4291
|
},
|
|
4519
4292
|
"gemini-2.5-flash-lite": {
|
|
4520
4293
|
id: "gemini-2.5-flash-lite",
|
|
4521
|
-
name: "Gemini 2.5 Flash
|
|
4294
|
+
name: "Gemini 2.5 Flash-Lite",
|
|
4522
4295
|
api: "google-generative-ai",
|
|
4523
4296
|
provider: "google",
|
|
4524
4297
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
@@ -4527,331 +4300,197 @@ export const MODELS = {
|
|
|
4527
4300
|
cost: {
|
|
4528
4301
|
input: 0.1,
|
|
4529
4302
|
output: 0.4,
|
|
4530
|
-
cacheRead: 0.
|
|
4303
|
+
cacheRead: 0.01,
|
|
4531
4304
|
cacheWrite: 0,
|
|
4532
4305
|
},
|
|
4533
4306
|
contextWindow: 1048576,
|
|
4534
4307
|
maxTokens: 65536,
|
|
4535
4308
|
},
|
|
4536
|
-
"gemini-2.5-
|
|
4537
|
-
id: "gemini-2.5-
|
|
4538
|
-
name: "Gemini 2.5
|
|
4309
|
+
"gemini-2.5-pro": {
|
|
4310
|
+
id: "gemini-2.5-pro",
|
|
4311
|
+
name: "Gemini 2.5 Pro",
|
|
4539
4312
|
api: "google-generative-ai",
|
|
4540
4313
|
provider: "google",
|
|
4541
4314
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4542
4315
|
reasoning: true,
|
|
4543
4316
|
input: ["text", "image"],
|
|
4544
4317
|
cost: {
|
|
4545
|
-
input:
|
|
4546
|
-
output:
|
|
4547
|
-
cacheRead: 0.
|
|
4318
|
+
input: 1.25,
|
|
4319
|
+
output: 10,
|
|
4320
|
+
cacheRead: 0.125,
|
|
4548
4321
|
cacheWrite: 0,
|
|
4549
4322
|
},
|
|
4550
4323
|
contextWindow: 1048576,
|
|
4551
4324
|
maxTokens: 65536,
|
|
4552
4325
|
},
|
|
4553
|
-
"gemini-
|
|
4554
|
-
id: "gemini-
|
|
4555
|
-
name: "Gemini
|
|
4326
|
+
"gemini-3-flash-preview": {
|
|
4327
|
+
id: "gemini-3-flash-preview",
|
|
4328
|
+
name: "Gemini 3 Flash Preview",
|
|
4556
4329
|
api: "google-generative-ai",
|
|
4557
4330
|
provider: "google",
|
|
4558
4331
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4559
4332
|
reasoning: true,
|
|
4333
|
+
thinkingLevelMap: { "off": null },
|
|
4560
4334
|
input: ["text", "image"],
|
|
4561
4335
|
cost: {
|
|
4562
|
-
input: 0.
|
|
4563
|
-
output:
|
|
4564
|
-
cacheRead: 0.
|
|
4336
|
+
input: 0.5,
|
|
4337
|
+
output: 3,
|
|
4338
|
+
cacheRead: 0.05,
|
|
4565
4339
|
cacheWrite: 0,
|
|
4566
4340
|
},
|
|
4567
4341
|
contextWindow: 1048576,
|
|
4568
4342
|
maxTokens: 65536,
|
|
4569
4343
|
},
|
|
4570
|
-
"gemini-
|
|
4571
|
-
id: "gemini-
|
|
4572
|
-
name: "Gemini
|
|
4344
|
+
"gemini-3-pro-preview": {
|
|
4345
|
+
id: "gemini-3-pro-preview",
|
|
4346
|
+
name: "Gemini 3 Pro Preview",
|
|
4573
4347
|
api: "google-generative-ai",
|
|
4574
4348
|
provider: "google",
|
|
4575
4349
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4576
4350
|
reasoning: true,
|
|
4351
|
+
thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
|
|
4577
4352
|
input: ["text", "image"],
|
|
4578
4353
|
cost: {
|
|
4579
|
-
input:
|
|
4580
|
-
output:
|
|
4581
|
-
cacheRead: 0.
|
|
4354
|
+
input: 2,
|
|
4355
|
+
output: 12,
|
|
4356
|
+
cacheRead: 0.2,
|
|
4582
4357
|
cacheWrite: 0,
|
|
4583
4358
|
},
|
|
4584
4359
|
contextWindow: 1048576,
|
|
4585
4360
|
maxTokens: 65536,
|
|
4586
4361
|
},
|
|
4587
|
-
"gemini-
|
|
4588
|
-
id: "gemini-
|
|
4589
|
-
name: "Gemini
|
|
4362
|
+
"gemini-3.1-flash-lite": {
|
|
4363
|
+
id: "gemini-3.1-flash-lite",
|
|
4364
|
+
name: "Gemini 3.1 Flash Lite",
|
|
4590
4365
|
api: "google-generative-ai",
|
|
4591
4366
|
provider: "google",
|
|
4592
4367
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4593
4368
|
reasoning: true,
|
|
4369
|
+
thinkingLevelMap: { "off": null },
|
|
4594
4370
|
input: ["text", "image"],
|
|
4595
4371
|
cost: {
|
|
4596
|
-
input: 0.
|
|
4597
|
-
output:
|
|
4598
|
-
cacheRead: 0.
|
|
4372
|
+
input: 0.25,
|
|
4373
|
+
output: 1.5,
|
|
4374
|
+
cacheRead: 0.025,
|
|
4599
4375
|
cacheWrite: 0,
|
|
4600
4376
|
},
|
|
4601
4377
|
contextWindow: 1048576,
|
|
4602
4378
|
maxTokens: 65536,
|
|
4603
4379
|
},
|
|
4604
|
-
"gemini-
|
|
4605
|
-
id: "gemini-
|
|
4606
|
-
name: "Gemini
|
|
4380
|
+
"gemini-3.1-flash-lite-preview": {
|
|
4381
|
+
id: "gemini-3.1-flash-lite-preview",
|
|
4382
|
+
name: "Gemini 3.1 Flash Lite Preview",
|
|
4607
4383
|
api: "google-generative-ai",
|
|
4608
4384
|
provider: "google",
|
|
4609
4385
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4610
4386
|
reasoning: true,
|
|
4387
|
+
thinkingLevelMap: { "off": null },
|
|
4611
4388
|
input: ["text", "image"],
|
|
4612
4389
|
cost: {
|
|
4613
|
-
input: 0.
|
|
4614
|
-
output:
|
|
4615
|
-
cacheRead: 0.
|
|
4390
|
+
input: 0.25,
|
|
4391
|
+
output: 1.5,
|
|
4392
|
+
cacheRead: 0.025,
|
|
4616
4393
|
cacheWrite: 0,
|
|
4617
4394
|
},
|
|
4618
4395
|
contextWindow: 1048576,
|
|
4619
4396
|
maxTokens: 65536,
|
|
4620
4397
|
},
|
|
4621
|
-
"gemini-
|
|
4622
|
-
id: "gemini-
|
|
4623
|
-
name: "Gemini
|
|
4398
|
+
"gemini-3.1-pro-preview": {
|
|
4399
|
+
id: "gemini-3.1-pro-preview",
|
|
4400
|
+
name: "Gemini 3.1 Pro Preview",
|
|
4624
4401
|
api: "google-generative-ai",
|
|
4625
4402
|
provider: "google",
|
|
4626
4403
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4627
4404
|
reasoning: true,
|
|
4405
|
+
thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
|
|
4628
4406
|
input: ["text", "image"],
|
|
4629
4407
|
cost: {
|
|
4630
|
-
input:
|
|
4631
|
-
output:
|
|
4632
|
-
cacheRead: 0.
|
|
4408
|
+
input: 2,
|
|
4409
|
+
output: 12,
|
|
4410
|
+
cacheRead: 0.2,
|
|
4633
4411
|
cacheWrite: 0,
|
|
4634
4412
|
},
|
|
4635
4413
|
contextWindow: 1048576,
|
|
4636
4414
|
maxTokens: 65536,
|
|
4637
4415
|
},
|
|
4638
|
-
"gemini-
|
|
4639
|
-
id: "gemini-
|
|
4640
|
-
name: "Gemini
|
|
4416
|
+
"gemini-3.1-pro-preview-customtools": {
|
|
4417
|
+
id: "gemini-3.1-pro-preview-customtools",
|
|
4418
|
+
name: "Gemini 3.1 Pro Preview Custom Tools",
|
|
4641
4419
|
api: "google-generative-ai",
|
|
4642
4420
|
provider: "google",
|
|
4643
4421
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4644
4422
|
reasoning: true,
|
|
4423
|
+
thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
|
|
4645
4424
|
input: ["text", "image"],
|
|
4646
4425
|
cost: {
|
|
4647
|
-
input:
|
|
4648
|
-
output:
|
|
4649
|
-
cacheRead: 0.
|
|
4426
|
+
input: 2,
|
|
4427
|
+
output: 12,
|
|
4428
|
+
cacheRead: 0.2,
|
|
4650
4429
|
cacheWrite: 0,
|
|
4651
4430
|
},
|
|
4652
4431
|
contextWindow: 1048576,
|
|
4653
4432
|
maxTokens: 65536,
|
|
4654
4433
|
},
|
|
4655
|
-
"gemini-
|
|
4656
|
-
id: "gemini-
|
|
4657
|
-
name: "Gemini
|
|
4434
|
+
"gemini-3.5-flash": {
|
|
4435
|
+
id: "gemini-3.5-flash",
|
|
4436
|
+
name: "Gemini 3.5 Flash",
|
|
4658
4437
|
api: "google-generative-ai",
|
|
4659
4438
|
provider: "google",
|
|
4660
4439
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4661
4440
|
reasoning: true,
|
|
4441
|
+
thinkingLevelMap: { "off": null },
|
|
4662
4442
|
input: ["text", "image"],
|
|
4663
4443
|
cost: {
|
|
4664
|
-
input: 1.
|
|
4665
|
-
output:
|
|
4666
|
-
cacheRead: 0.
|
|
4444
|
+
input: 1.5,
|
|
4445
|
+
output: 9,
|
|
4446
|
+
cacheRead: 0.15,
|
|
4667
4447
|
cacheWrite: 0,
|
|
4668
4448
|
},
|
|
4669
4449
|
contextWindow: 1048576,
|
|
4670
4450
|
maxTokens: 65536,
|
|
4671
4451
|
},
|
|
4672
|
-
"gemini-
|
|
4673
|
-
id: "gemini-
|
|
4674
|
-
name: "Gemini
|
|
4452
|
+
"gemini-flash-latest": {
|
|
4453
|
+
id: "gemini-flash-latest",
|
|
4454
|
+
name: "Gemini Flash Latest",
|
|
4675
4455
|
api: "google-generative-ai",
|
|
4676
4456
|
provider: "google",
|
|
4677
4457
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4678
4458
|
reasoning: true,
|
|
4679
|
-
thinkingLevelMap: { "off": null },
|
|
4680
4459
|
input: ["text", "image"],
|
|
4681
4460
|
cost: {
|
|
4682
|
-
input: 0.
|
|
4683
|
-
output:
|
|
4684
|
-
cacheRead: 0.
|
|
4461
|
+
input: 0.3,
|
|
4462
|
+
output: 2.5,
|
|
4463
|
+
cacheRead: 0.075,
|
|
4685
4464
|
cacheWrite: 0,
|
|
4686
4465
|
},
|
|
4687
4466
|
contextWindow: 1048576,
|
|
4688
4467
|
maxTokens: 65536,
|
|
4689
4468
|
},
|
|
4690
|
-
"gemini-
|
|
4691
|
-
id: "gemini-
|
|
4692
|
-
name: "Gemini
|
|
4469
|
+
"gemini-flash-lite-latest": {
|
|
4470
|
+
id: "gemini-flash-lite-latest",
|
|
4471
|
+
name: "Gemini Flash-Lite Latest",
|
|
4693
4472
|
api: "google-generative-ai",
|
|
4694
4473
|
provider: "google",
|
|
4695
4474
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4696
4475
|
reasoning: true,
|
|
4697
|
-
thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
|
|
4698
4476
|
input: ["text", "image"],
|
|
4699
4477
|
cost: {
|
|
4700
|
-
input:
|
|
4701
|
-
output:
|
|
4702
|
-
cacheRead: 0.
|
|
4478
|
+
input: 0.1,
|
|
4479
|
+
output: 0.4,
|
|
4480
|
+
cacheRead: 0.025,
|
|
4703
4481
|
cacheWrite: 0,
|
|
4704
4482
|
},
|
|
4705
|
-
contextWindow:
|
|
4706
|
-
maxTokens:
|
|
4483
|
+
contextWindow: 1048576,
|
|
4484
|
+
maxTokens: 65536,
|
|
4707
4485
|
},
|
|
4708
|
-
"
|
|
4709
|
-
id: "
|
|
4710
|
-
name: "
|
|
4486
|
+
"gemma-4-26b-a4b-it": {
|
|
4487
|
+
id: "gemma-4-26b-a4b-it",
|
|
4488
|
+
name: "Gemma 4 26B A4B IT",
|
|
4711
4489
|
api: "google-generative-ai",
|
|
4712
4490
|
provider: "google",
|
|
4713
4491
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4714
4492
|
reasoning: true,
|
|
4715
|
-
thinkingLevelMap: { "off": null },
|
|
4716
|
-
input: ["text", "image"],
|
|
4717
|
-
cost: {
|
|
4718
|
-
input: 0.25,
|
|
4719
|
-
output: 1.5,
|
|
4720
|
-
cacheRead: 0.025,
|
|
4721
|
-
cacheWrite: 1,
|
|
4722
|
-
},
|
|
4723
|
-
contextWindow: 1048576,
|
|
4724
|
-
maxTokens: 65536,
|
|
4725
|
-
},
|
|
4726
|
-
"gemini-3.1-pro-preview": {
|
|
4727
|
-
id: "gemini-3.1-pro-preview",
|
|
4728
|
-
name: "Gemini 3.1 Pro Preview",
|
|
4729
|
-
api: "google-generative-ai",
|
|
4730
|
-
provider: "google",
|
|
4731
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4732
|
-
reasoning: true,
|
|
4733
|
-
thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
|
|
4734
|
-
input: ["text", "image"],
|
|
4735
|
-
cost: {
|
|
4736
|
-
input: 2,
|
|
4737
|
-
output: 12,
|
|
4738
|
-
cacheRead: 0.2,
|
|
4739
|
-
cacheWrite: 0,
|
|
4740
|
-
},
|
|
4741
|
-
contextWindow: 1048576,
|
|
4742
|
-
maxTokens: 65536,
|
|
4743
|
-
},
|
|
4744
|
-
"gemini-3.1-pro-preview-customtools": {
|
|
4745
|
-
id: "gemini-3.1-pro-preview-customtools",
|
|
4746
|
-
name: "Gemini 3.1 Pro Preview Custom Tools",
|
|
4747
|
-
api: "google-generative-ai",
|
|
4748
|
-
provider: "google",
|
|
4749
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4750
|
-
reasoning: true,
|
|
4751
|
-
thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
|
|
4752
|
-
input: ["text", "image"],
|
|
4753
|
-
cost: {
|
|
4754
|
-
input: 2,
|
|
4755
|
-
output: 12,
|
|
4756
|
-
cacheRead: 0.2,
|
|
4757
|
-
cacheWrite: 0,
|
|
4758
|
-
},
|
|
4759
|
-
contextWindow: 1048576,
|
|
4760
|
-
maxTokens: 65536,
|
|
4761
|
-
},
|
|
4762
|
-
"gemini-flash-latest": {
|
|
4763
|
-
id: "gemini-flash-latest",
|
|
4764
|
-
name: "Gemini Flash Latest",
|
|
4765
|
-
api: "google-generative-ai",
|
|
4766
|
-
provider: "google",
|
|
4767
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4768
|
-
reasoning: true,
|
|
4769
|
-
input: ["text", "image"],
|
|
4770
|
-
cost: {
|
|
4771
|
-
input: 0.3,
|
|
4772
|
-
output: 2.5,
|
|
4773
|
-
cacheRead: 0.075,
|
|
4774
|
-
cacheWrite: 0,
|
|
4775
|
-
},
|
|
4776
|
-
contextWindow: 1048576,
|
|
4777
|
-
maxTokens: 65536,
|
|
4778
|
-
},
|
|
4779
|
-
"gemini-flash-lite-latest": {
|
|
4780
|
-
id: "gemini-flash-lite-latest",
|
|
4781
|
-
name: "Gemini Flash-Lite Latest",
|
|
4782
|
-
api: "google-generative-ai",
|
|
4783
|
-
provider: "google",
|
|
4784
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4785
|
-
reasoning: true,
|
|
4786
|
-
input: ["text", "image"],
|
|
4787
|
-
cost: {
|
|
4788
|
-
input: 0.1,
|
|
4789
|
-
output: 0.4,
|
|
4790
|
-
cacheRead: 0.025,
|
|
4791
|
-
cacheWrite: 0,
|
|
4792
|
-
},
|
|
4793
|
-
contextWindow: 1048576,
|
|
4794
|
-
maxTokens: 65536,
|
|
4795
|
-
},
|
|
4796
|
-
"gemini-live-2.5-flash": {
|
|
4797
|
-
id: "gemini-live-2.5-flash",
|
|
4798
|
-
name: "Gemini Live 2.5 Flash",
|
|
4799
|
-
api: "google-generative-ai",
|
|
4800
|
-
provider: "google",
|
|
4801
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4802
|
-
reasoning: true,
|
|
4803
|
-
input: ["text", "image"],
|
|
4804
|
-
cost: {
|
|
4805
|
-
input: 0.5,
|
|
4806
|
-
output: 2,
|
|
4807
|
-
cacheRead: 0,
|
|
4808
|
-
cacheWrite: 0,
|
|
4809
|
-
},
|
|
4810
|
-
contextWindow: 128000,
|
|
4811
|
-
maxTokens: 8000,
|
|
4812
|
-
},
|
|
4813
|
-
"gemini-live-2.5-flash-preview-native-audio": {
|
|
4814
|
-
id: "gemini-live-2.5-flash-preview-native-audio",
|
|
4815
|
-
name: "Gemini Live 2.5 Flash Preview Native Audio",
|
|
4816
|
-
api: "google-generative-ai",
|
|
4817
|
-
provider: "google",
|
|
4818
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4819
|
-
reasoning: true,
|
|
4820
|
-
input: ["text"],
|
|
4821
|
-
cost: {
|
|
4822
|
-
input: 0.5,
|
|
4823
|
-
output: 2,
|
|
4824
|
-
cacheRead: 0,
|
|
4825
|
-
cacheWrite: 0,
|
|
4826
|
-
},
|
|
4827
|
-
contextWindow: 131072,
|
|
4828
|
-
maxTokens: 65536,
|
|
4829
|
-
},
|
|
4830
|
-
"gemma-3-27b-it": {
|
|
4831
|
-
id: "gemma-3-27b-it",
|
|
4832
|
-
name: "Gemma 3 27B",
|
|
4833
|
-
api: "google-generative-ai",
|
|
4834
|
-
provider: "google",
|
|
4835
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4836
|
-
reasoning: false,
|
|
4837
|
-
input: ["text", "image"],
|
|
4838
|
-
cost: {
|
|
4839
|
-
input: 0,
|
|
4840
|
-
output: 0,
|
|
4841
|
-
cacheRead: 0,
|
|
4842
|
-
cacheWrite: 0,
|
|
4843
|
-
},
|
|
4844
|
-
contextWindow: 131072,
|
|
4845
|
-
maxTokens: 8192,
|
|
4846
|
-
},
|
|
4847
|
-
"gemma-4-26b-a4b-it": {
|
|
4848
|
-
id: "gemma-4-26b-a4b-it",
|
|
4849
|
-
name: "Gemma 4 26B",
|
|
4850
|
-
api: "google-generative-ai",
|
|
4851
|
-
provider: "google",
|
|
4852
|
-
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
4853
|
-
reasoning: true,
|
|
4854
|
-
thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
|
|
4493
|
+
thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
|
|
4855
4494
|
input: ["text", "image"],
|
|
4856
4495
|
cost: {
|
|
4857
4496
|
input: 0,
|
|
@@ -4859,12 +4498,12 @@ export const MODELS = {
|
|
|
4859
4498
|
cacheRead: 0,
|
|
4860
4499
|
cacheWrite: 0,
|
|
4861
4500
|
},
|
|
4862
|
-
contextWindow:
|
|
4863
|
-
maxTokens:
|
|
4501
|
+
contextWindow: 262144,
|
|
4502
|
+
maxTokens: 32768,
|
|
4864
4503
|
},
|
|
4865
4504
|
"gemma-4-31b-it": {
|
|
4866
4505
|
id: "gemma-4-31b-it",
|
|
4867
|
-
name: "Gemma 4 31B",
|
|
4506
|
+
name: "Gemma 4 31B IT",
|
|
4868
4507
|
api: "google-generative-ai",
|
|
4869
4508
|
provider: "google",
|
|
4870
4509
|
baseUrl: "https://generativelanguage.googleapis.com/v1beta",
|
|
@@ -4877,8 +4516,8 @@ export const MODELS = {
|
|
|
4877
4516
|
cacheRead: 0,
|
|
4878
4517
|
cacheWrite: 0,
|
|
4879
4518
|
},
|
|
4880
|
-
contextWindow:
|
|
4881
|
-
maxTokens:
|
|
4519
|
+
contextWindow: 262144,
|
|
4520
|
+
maxTokens: 32768,
|
|
4882
4521
|
},
|
|
4883
4522
|
},
|
|
4884
4523
|
"google-vertex": {
|
|
@@ -6945,7 +6584,7 @@ export const MODELS = {
|
|
|
6945
6584
|
provider: "openai",
|
|
6946
6585
|
baseUrl: "https://api.openai.com/v1",
|
|
6947
6586
|
reasoning: true,
|
|
6948
|
-
thinkingLevelMap: { "off":
|
|
6587
|
+
thinkingLevelMap: { "off": "none" },
|
|
6949
6588
|
input: ["text", "image"],
|
|
6950
6589
|
cost: {
|
|
6951
6590
|
input: 1.25,
|
|
@@ -7035,7 +6674,7 @@ export const MODELS = {
|
|
|
7035
6674
|
provider: "openai",
|
|
7036
6675
|
baseUrl: "https://api.openai.com/v1",
|
|
7037
6676
|
reasoning: true,
|
|
7038
|
-
thinkingLevelMap: { "off":
|
|
6677
|
+
thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
|
|
7039
6678
|
input: ["text", "image"],
|
|
7040
6679
|
cost: {
|
|
7041
6680
|
input: 1.75,
|
|
@@ -7125,7 +6764,7 @@ export const MODELS = {
|
|
|
7125
6764
|
provider: "openai",
|
|
7126
6765
|
baseUrl: "https://api.openai.com/v1",
|
|
7127
6766
|
reasoning: true,
|
|
7128
|
-
thinkingLevelMap: { "off":
|
|
6767
|
+
thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
|
|
7129
6768
|
input: ["text", "image"],
|
|
7130
6769
|
cost: {
|
|
7131
6770
|
input: 1.75,
|
|
@@ -7161,7 +6800,7 @@ export const MODELS = {
|
|
|
7161
6800
|
provider: "openai",
|
|
7162
6801
|
baseUrl: "https://api.openai.com/v1",
|
|
7163
6802
|
reasoning: true,
|
|
7164
|
-
thinkingLevelMap: { "off":
|
|
6803
|
+
thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
|
|
7165
6804
|
input: ["text", "image"],
|
|
7166
6805
|
cost: {
|
|
7167
6806
|
input: 2.5,
|
|
@@ -7179,7 +6818,7 @@ export const MODELS = {
|
|
|
7179
6818
|
provider: "openai",
|
|
7180
6819
|
baseUrl: "https://api.openai.com/v1",
|
|
7181
6820
|
reasoning: true,
|
|
7182
|
-
thinkingLevelMap: { "off":
|
|
6821
|
+
thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
|
|
7183
6822
|
input: ["text", "image"],
|
|
7184
6823
|
cost: {
|
|
7185
6824
|
input: 0.75,
|
|
@@ -7197,7 +6836,7 @@ export const MODELS = {
|
|
|
7197
6836
|
provider: "openai",
|
|
7198
6837
|
baseUrl: "https://api.openai.com/v1",
|
|
7199
6838
|
reasoning: true,
|
|
7200
|
-
thinkingLevelMap: { "off":
|
|
6839
|
+
thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
|
|
7201
6840
|
input: ["text", "image"],
|
|
7202
6841
|
cost: {
|
|
7203
6842
|
input: 0.2,
|
|
@@ -7233,7 +6872,7 @@ export const MODELS = {
|
|
|
7233
6872
|
provider: "openai",
|
|
7234
6873
|
baseUrl: "https://api.openai.com/v1",
|
|
7235
6874
|
reasoning: true,
|
|
7236
|
-
thinkingLevelMap: { "off":
|
|
6875
|
+
thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
|
|
7237
6876
|
input: ["text", "image"],
|
|
7238
6877
|
cost: {
|
|
7239
6878
|
input: 5,
|
|
@@ -7735,6 +7374,25 @@ export const MODELS = {
|
|
|
7735
7374
|
contextWindow: 1000000,
|
|
7736
7375
|
maxTokens: 64000,
|
|
7737
7376
|
},
|
|
7377
|
+
"deepseek-v4-flash-free": {
|
|
7378
|
+
id: "deepseek-v4-flash-free",
|
|
7379
|
+
name: "DeepSeek V4 Flash Free",
|
|
7380
|
+
api: "openai-completions",
|
|
7381
|
+
provider: "opencode",
|
|
7382
|
+
baseUrl: "https://opencode.ai/zen/v1",
|
|
7383
|
+
compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
|
|
7384
|
+
reasoning: true,
|
|
7385
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
|
|
7386
|
+
input: ["text"],
|
|
7387
|
+
cost: {
|
|
7388
|
+
input: 0,
|
|
7389
|
+
output: 0,
|
|
7390
|
+
cacheRead: 0,
|
|
7391
|
+
cacheWrite: 0,
|
|
7392
|
+
},
|
|
7393
|
+
contextWindow: 200000,
|
|
7394
|
+
maxTokens: 128000,
|
|
7395
|
+
},
|
|
7738
7396
|
"gemini-3-flash": {
|
|
7739
7397
|
id: "gemini-3-flash",
|
|
7740
7398
|
name: "Gemini 3 Flash",
|
|
@@ -7771,6 +7429,24 @@ export const MODELS = {
|
|
|
7771
7429
|
contextWindow: 1048576,
|
|
7772
7430
|
maxTokens: 65536,
|
|
7773
7431
|
},
|
|
7432
|
+
"gemini-3.5-flash": {
|
|
7433
|
+
id: "gemini-3.5-flash",
|
|
7434
|
+
name: "Gemini 3.5 Flash",
|
|
7435
|
+
api: "google-generative-ai",
|
|
7436
|
+
provider: "opencode",
|
|
7437
|
+
baseUrl: "https://opencode.ai/zen/v1",
|
|
7438
|
+
reasoning: true,
|
|
7439
|
+
thinkingLevelMap: { "off": null },
|
|
7440
|
+
input: ["text", "image"],
|
|
7441
|
+
cost: {
|
|
7442
|
+
input: 1.5,
|
|
7443
|
+
output: 9,
|
|
7444
|
+
cacheRead: 0.15,
|
|
7445
|
+
cacheWrite: 0,
|
|
7446
|
+
},
|
|
7447
|
+
contextWindow: 1048576,
|
|
7448
|
+
maxTokens: 65536,
|
|
7449
|
+
},
|
|
7774
7450
|
"glm-5": {
|
|
7775
7451
|
id: "glm-5",
|
|
7776
7452
|
name: "GLM-5",
|
|
@@ -8093,22 +7769,22 @@ export const MODELS = {
|
|
|
8093
7769
|
contextWindow: 1050000,
|
|
8094
7770
|
maxTokens: 128000,
|
|
8095
7771
|
},
|
|
8096
|
-
"
|
|
8097
|
-
id: "
|
|
8098
|
-
name: "
|
|
7772
|
+
"grok-build-0.1": {
|
|
7773
|
+
id: "grok-build-0.1",
|
|
7774
|
+
name: "Grok Build 0.1",
|
|
8099
7775
|
api: "openai-completions",
|
|
8100
7776
|
provider: "opencode",
|
|
8101
7777
|
baseUrl: "https://opencode.ai/zen/v1",
|
|
8102
7778
|
reasoning: true,
|
|
8103
|
-
input: ["text"],
|
|
7779
|
+
input: ["text", "image"],
|
|
8104
7780
|
cost: {
|
|
8105
|
-
input:
|
|
8106
|
-
output:
|
|
8107
|
-
cacheRead: 0,
|
|
7781
|
+
input: 1,
|
|
7782
|
+
output: 2,
|
|
7783
|
+
cacheRead: 0.2,
|
|
8108
7784
|
cacheWrite: 0,
|
|
8109
7785
|
},
|
|
8110
7786
|
contextWindow: 256000,
|
|
8111
|
-
maxTokens:
|
|
7787
|
+
maxTokens: 256000,
|
|
8112
7788
|
},
|
|
8113
7789
|
"kimi-k2.5": {
|
|
8114
7790
|
id: "kimi-k2.5",
|
|
@@ -8161,23 +7837,6 @@ export const MODELS = {
|
|
|
8161
7837
|
contextWindow: 204800,
|
|
8162
7838
|
maxTokens: 131072,
|
|
8163
7839
|
},
|
|
8164
|
-
"minimax-m2.5-free": {
|
|
8165
|
-
id: "minimax-m2.5-free",
|
|
8166
|
-
name: "MiniMax M2.5 Free",
|
|
8167
|
-
api: "anthropic-messages",
|
|
8168
|
-
provider: "opencode",
|
|
8169
|
-
baseUrl: "https://opencode.ai/zen",
|
|
8170
|
-
reasoning: true,
|
|
8171
|
-
input: ["text"],
|
|
8172
|
-
cost: {
|
|
8173
|
-
input: 0,
|
|
8174
|
-
output: 0,
|
|
8175
|
-
cacheRead: 0,
|
|
8176
|
-
cacheWrite: 0,
|
|
8177
|
-
},
|
|
8178
|
-
contextWindow: 204800,
|
|
8179
|
-
maxTokens: 131072,
|
|
8180
|
-
},
|
|
8181
7840
|
"minimax-m2.7": {
|
|
8182
7841
|
id: "minimax-m2.7",
|
|
8183
7842
|
name: "MiniMax M2.7",
|
|
@@ -8246,6 +7905,23 @@ export const MODELS = {
|
|
|
8246
7905
|
contextWindow: 262144,
|
|
8247
7906
|
maxTokens: 65536,
|
|
8248
7907
|
},
|
|
7908
|
+
"qwen3.6-plus-free": {
|
|
7909
|
+
id: "qwen3.6-plus-free",
|
|
7910
|
+
name: "Qwen3.6 Plus Free",
|
|
7911
|
+
api: "anthropic-messages",
|
|
7912
|
+
provider: "opencode",
|
|
7913
|
+
baseUrl: "https://opencode.ai/zen",
|
|
7914
|
+
reasoning: true,
|
|
7915
|
+
input: ["text", "image"],
|
|
7916
|
+
cost: {
|
|
7917
|
+
input: 0,
|
|
7918
|
+
output: 0,
|
|
7919
|
+
cacheRead: 0,
|
|
7920
|
+
cacheWrite: 0,
|
|
7921
|
+
},
|
|
7922
|
+
contextWindow: 262144,
|
|
7923
|
+
maxTokens: 65536,
|
|
7924
|
+
},
|
|
8249
7925
|
},
|
|
8250
7926
|
"opencode-go": {
|
|
8251
7927
|
"deepseek-v4-flash": {
|
|
@@ -8391,9 +8067,9 @@ export const MODELS = {
|
|
|
8391
8067
|
"minimax-m2.5": {
|
|
8392
8068
|
id: "minimax-m2.5",
|
|
8393
8069
|
name: "MiniMax M2.5",
|
|
8394
|
-
api: "
|
|
8070
|
+
api: "anthropic-messages",
|
|
8395
8071
|
provider: "opencode-go",
|
|
8396
|
-
baseUrl: "https://opencode.ai/zen/go
|
|
8072
|
+
baseUrl: "https://opencode.ai/zen/go",
|
|
8397
8073
|
reasoning: true,
|
|
8398
8074
|
input: ["text"],
|
|
8399
8075
|
cost: {
|
|
@@ -8613,40 +8289,6 @@ export const MODELS = {
|
|
|
8613
8289
|
contextWindow: 200000,
|
|
8614
8290
|
maxTokens: 8192,
|
|
8615
8291
|
},
|
|
8616
|
-
"anthropic/claude-3.7-sonnet": {
|
|
8617
|
-
id: "anthropic/claude-3.7-sonnet",
|
|
8618
|
-
name: "Anthropic: Claude 3.7 Sonnet",
|
|
8619
|
-
api: "openai-completions",
|
|
8620
|
-
provider: "openrouter",
|
|
8621
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
8622
|
-
reasoning: true,
|
|
8623
|
-
input: ["text", "image"],
|
|
8624
|
-
cost: {
|
|
8625
|
-
input: 3,
|
|
8626
|
-
output: 15,
|
|
8627
|
-
cacheRead: 0.3,
|
|
8628
|
-
cacheWrite: 3.75,
|
|
8629
|
-
},
|
|
8630
|
-
contextWindow: 200000,
|
|
8631
|
-
maxTokens: 64000,
|
|
8632
|
-
},
|
|
8633
|
-
"anthropic/claude-3.7-sonnet:thinking": {
|
|
8634
|
-
id: "anthropic/claude-3.7-sonnet:thinking",
|
|
8635
|
-
name: "Anthropic: Claude 3.7 Sonnet (thinking)",
|
|
8636
|
-
api: "openai-completions",
|
|
8637
|
-
provider: "openrouter",
|
|
8638
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
8639
|
-
reasoning: true,
|
|
8640
|
-
input: ["text", "image"],
|
|
8641
|
-
cost: {
|
|
8642
|
-
input: 3,
|
|
8643
|
-
output: 15,
|
|
8644
|
-
cacheRead: 0.3,
|
|
8645
|
-
cacheWrite: 3.75,
|
|
8646
|
-
},
|
|
8647
|
-
contextWindow: 200000,
|
|
8648
|
-
maxTokens: 64000,
|
|
8649
|
-
},
|
|
8650
8292
|
"anthropic/claude-haiku-4.5": {
|
|
8651
8293
|
id: "anthropic/claude-haiku-4.5",
|
|
8652
8294
|
name: "Anthropic: Claude Haiku 4.5",
|
|
@@ -8769,19 +8411,37 @@ export const MODELS = {
|
|
|
8769
8411
|
contextWindow: 1000000,
|
|
8770
8412
|
maxTokens: 128000,
|
|
8771
8413
|
},
|
|
8772
|
-
"anthropic/claude-
|
|
8773
|
-
id: "anthropic/claude-
|
|
8774
|
-
name: "Anthropic: Claude
|
|
8414
|
+
"anthropic/claude-opus-4.7-fast": {
|
|
8415
|
+
id: "anthropic/claude-opus-4.7-fast",
|
|
8416
|
+
name: "Anthropic: Claude Opus 4.7 (Fast)",
|
|
8775
8417
|
api: "openai-completions",
|
|
8776
8418
|
provider: "openrouter",
|
|
8777
8419
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
8778
8420
|
reasoning: true,
|
|
8421
|
+
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
8779
8422
|
input: ["text", "image"],
|
|
8780
8423
|
cost: {
|
|
8781
|
-
input:
|
|
8782
|
-
output:
|
|
8783
|
-
cacheRead:
|
|
8784
|
-
cacheWrite:
|
|
8424
|
+
input: 30,
|
|
8425
|
+
output: 150,
|
|
8426
|
+
cacheRead: 3,
|
|
8427
|
+
cacheWrite: 37.5,
|
|
8428
|
+
},
|
|
8429
|
+
contextWindow: 1000000,
|
|
8430
|
+
maxTokens: 128000,
|
|
8431
|
+
},
|
|
8432
|
+
"anthropic/claude-sonnet-4": {
|
|
8433
|
+
id: "anthropic/claude-sonnet-4",
|
|
8434
|
+
name: "Anthropic: Claude Sonnet 4",
|
|
8435
|
+
api: "openai-completions",
|
|
8436
|
+
provider: "openrouter",
|
|
8437
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
8438
|
+
reasoning: true,
|
|
8439
|
+
input: ["text", "image"],
|
|
8440
|
+
cost: {
|
|
8441
|
+
input: 3,
|
|
8442
|
+
output: 15,
|
|
8443
|
+
cacheRead: 0.3,
|
|
8444
|
+
cacheWrite: 3.75,
|
|
8785
8445
|
},
|
|
8786
8446
|
contextWindow: 1000000,
|
|
8787
8447
|
maxTokens: 64000,
|
|
@@ -8820,39 +8480,39 @@ export const MODELS = {
|
|
|
8820
8480
|
contextWindow: 1000000,
|
|
8821
8481
|
maxTokens: 128000,
|
|
8822
8482
|
},
|
|
8823
|
-
"arcee-ai/trinity-large-
|
|
8824
|
-
id: "arcee-ai/trinity-large-
|
|
8825
|
-
name: "Arcee AI: Trinity Large
|
|
8483
|
+
"arcee-ai/trinity-large-thinking": {
|
|
8484
|
+
id: "arcee-ai/trinity-large-thinking",
|
|
8485
|
+
name: "Arcee AI: Trinity Large Thinking",
|
|
8826
8486
|
api: "openai-completions",
|
|
8827
8487
|
provider: "openrouter",
|
|
8828
8488
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
8829
|
-
reasoning:
|
|
8489
|
+
reasoning: true,
|
|
8830
8490
|
input: ["text"],
|
|
8831
8491
|
cost: {
|
|
8832
|
-
input: 0.
|
|
8833
|
-
output: 0.
|
|
8834
|
-
cacheRead: 0,
|
|
8492
|
+
input: 0.22,
|
|
8493
|
+
output: 0.85,
|
|
8494
|
+
cacheRead: 0.06,
|
|
8835
8495
|
cacheWrite: 0,
|
|
8836
8496
|
},
|
|
8837
|
-
contextWindow:
|
|
8838
|
-
maxTokens:
|
|
8497
|
+
contextWindow: 262144,
|
|
8498
|
+
maxTokens: 262144,
|
|
8839
8499
|
},
|
|
8840
|
-
"arcee-ai/trinity-large-thinking": {
|
|
8841
|
-
id: "arcee-ai/trinity-large-thinking",
|
|
8842
|
-
name: "Arcee AI: Trinity Large Thinking",
|
|
8500
|
+
"arcee-ai/trinity-large-thinking:free": {
|
|
8501
|
+
id: "arcee-ai/trinity-large-thinking:free",
|
|
8502
|
+
name: "Arcee AI: Trinity Large Thinking (free)",
|
|
8843
8503
|
api: "openai-completions",
|
|
8844
8504
|
provider: "openrouter",
|
|
8845
8505
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
8846
8506
|
reasoning: true,
|
|
8847
8507
|
input: ["text"],
|
|
8848
8508
|
cost: {
|
|
8849
|
-
input: 0
|
|
8850
|
-
output: 0
|
|
8851
|
-
cacheRead: 0
|
|
8509
|
+
input: 0,
|
|
8510
|
+
output: 0,
|
|
8511
|
+
cacheRead: 0,
|
|
8852
8512
|
cacheWrite: 0,
|
|
8853
8513
|
},
|
|
8854
8514
|
contextWindow: 262144,
|
|
8855
|
-
maxTokens:
|
|
8515
|
+
maxTokens: 80000,
|
|
8856
8516
|
},
|
|
8857
8517
|
"arcee-ai/trinity-mini": {
|
|
8858
8518
|
id: "arcee-ai/trinity-mini",
|
|
@@ -8936,7 +8596,7 @@ export const MODELS = {
|
|
|
8936
8596
|
cacheRead: 0,
|
|
8937
8597
|
cacheWrite: 0,
|
|
8938
8598
|
},
|
|
8939
|
-
contextWindow:
|
|
8599
|
+
contextWindow: 131072,
|
|
8940
8600
|
maxTokens: 8000,
|
|
8941
8601
|
},
|
|
8942
8602
|
"baidu/ernie-4.5-vl-28b-a3b": {
|
|
@@ -8953,7 +8613,7 @@ export const MODELS = {
|
|
|
8953
8613
|
cacheRead: 0,
|
|
8954
8614
|
cacheWrite: 0,
|
|
8955
8615
|
},
|
|
8956
|
-
contextWindow:
|
|
8616
|
+
contextWindow: 131072,
|
|
8957
8617
|
maxTokens: 8000,
|
|
8958
8618
|
},
|
|
8959
8619
|
"bytedance-seed/seed-1.6": {
|
|
@@ -9101,13 +8761,13 @@ export const MODELS = {
|
|
|
9101
8761
|
reasoning: true,
|
|
9102
8762
|
input: ["text"],
|
|
9103
8763
|
cost: {
|
|
9104
|
-
input: 0.
|
|
9105
|
-
output: 0.
|
|
9106
|
-
cacheRead: 0,
|
|
8764
|
+
input: 0.21,
|
|
8765
|
+
output: 0.7899999999999999,
|
|
8766
|
+
cacheRead: 0.13,
|
|
9107
8767
|
cacheWrite: 0,
|
|
9108
8768
|
},
|
|
9109
|
-
contextWindow:
|
|
9110
|
-
maxTokens:
|
|
8769
|
+
contextWindow: 163840,
|
|
8770
|
+
maxTokens: 32768,
|
|
9111
8771
|
},
|
|
9112
8772
|
"deepseek/deepseek-r1": {
|
|
9113
8773
|
id: "deepseek/deepseek-r1",
|
|
@@ -9123,7 +8783,7 @@ export const MODELS = {
|
|
|
9123
8783
|
cacheRead: 0,
|
|
9124
8784
|
cacheWrite: 0,
|
|
9125
8785
|
},
|
|
9126
|
-
contextWindow:
|
|
8786
|
+
contextWindow: 163840,
|
|
9127
8787
|
maxTokens: 16000,
|
|
9128
8788
|
},
|
|
9129
8789
|
"deepseek/deepseek-r1-0528": {
|
|
@@ -9205,9 +8865,28 @@ export const MODELS = {
|
|
|
9205
8865
|
thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
|
|
9206
8866
|
input: ["text"],
|
|
9207
8867
|
cost: {
|
|
9208
|
-
input: 0.
|
|
9209
|
-
output: 0.
|
|
9210
|
-
cacheRead: 0.
|
|
8868
|
+
input: 0.112,
|
|
8869
|
+
output: 0.224,
|
|
8870
|
+
cacheRead: 0.022,
|
|
8871
|
+
cacheWrite: 0,
|
|
8872
|
+
},
|
|
8873
|
+
contextWindow: 1048576,
|
|
8874
|
+
maxTokens: 4096,
|
|
8875
|
+
},
|
|
8876
|
+
"deepseek/deepseek-v4-flash:free": {
|
|
8877
|
+
id: "deepseek/deepseek-v4-flash:free",
|
|
8878
|
+
name: "DeepSeek: DeepSeek V4 Flash (free)",
|
|
8879
|
+
api: "openai-completions",
|
|
8880
|
+
provider: "openrouter",
|
|
8881
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
8882
|
+
compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
|
|
8883
|
+
reasoning: true,
|
|
8884
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
|
|
8885
|
+
input: ["text"],
|
|
8886
|
+
cost: {
|
|
8887
|
+
input: 0,
|
|
8888
|
+
output: 0,
|
|
8889
|
+
cacheRead: 0,
|
|
9211
8890
|
cacheWrite: 0,
|
|
9212
8891
|
},
|
|
9213
8892
|
contextWindow: 1048576,
|
|
@@ -9263,7 +8942,7 @@ export const MODELS = {
|
|
|
9263
8942
|
cacheRead: 0.024999999999999998,
|
|
9264
8943
|
cacheWrite: 0.08333333333333334,
|
|
9265
8944
|
},
|
|
9266
|
-
contextWindow:
|
|
8945
|
+
contextWindow: 1000000,
|
|
9267
8946
|
maxTokens: 8192,
|
|
9268
8947
|
},
|
|
9269
8948
|
"google/gemini-2.0-flash-lite-001": {
|
|
@@ -9402,6 +9081,23 @@ export const MODELS = {
|
|
|
9402
9081
|
contextWindow: 1048576,
|
|
9403
9082
|
maxTokens: 65536,
|
|
9404
9083
|
},
|
|
9084
|
+
"google/gemini-3.1-flash-lite": {
|
|
9085
|
+
id: "google/gemini-3.1-flash-lite",
|
|
9086
|
+
name: "Google: Gemini 3.1 Flash Lite",
|
|
9087
|
+
api: "openai-completions",
|
|
9088
|
+
provider: "openrouter",
|
|
9089
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
9090
|
+
reasoning: true,
|
|
9091
|
+
input: ["text", "image"],
|
|
9092
|
+
cost: {
|
|
9093
|
+
input: 0.25,
|
|
9094
|
+
output: 1.5,
|
|
9095
|
+
cacheRead: 0.024999999999999998,
|
|
9096
|
+
cacheWrite: 0.08333333333333334,
|
|
9097
|
+
},
|
|
9098
|
+
contextWindow: 1048576,
|
|
9099
|
+
maxTokens: 65536,
|
|
9100
|
+
},
|
|
9405
9101
|
"google/gemini-3.1-flash-lite-preview": {
|
|
9406
9102
|
id: "google/gemini-3.1-flash-lite-preview",
|
|
9407
9103
|
name: "Google: Gemini 3.1 Flash Lite Preview",
|
|
@@ -9450,6 +9146,23 @@ export const MODELS = {
|
|
|
9450
9146
|
cacheRead: 0.19999999999999998,
|
|
9451
9147
|
cacheWrite: 0.375,
|
|
9452
9148
|
},
|
|
9149
|
+
contextWindow: 1048756,
|
|
9150
|
+
maxTokens: 65536,
|
|
9151
|
+
},
|
|
9152
|
+
"google/gemini-3.5-flash": {
|
|
9153
|
+
id: "google/gemini-3.5-flash",
|
|
9154
|
+
name: "Google: Gemini 3.5 Flash",
|
|
9155
|
+
api: "openai-completions",
|
|
9156
|
+
provider: "openrouter",
|
|
9157
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
9158
|
+
reasoning: true,
|
|
9159
|
+
input: ["text", "image"],
|
|
9160
|
+
cost: {
|
|
9161
|
+
input: 1.5,
|
|
9162
|
+
output: 9,
|
|
9163
|
+
cacheRead: 0.15,
|
|
9164
|
+
cacheWrite: 0.08333333333333334,
|
|
9165
|
+
},
|
|
9453
9166
|
contextWindow: 1048576,
|
|
9454
9167
|
maxTokens: 65536,
|
|
9455
9168
|
},
|
|
@@ -9530,8 +9243,8 @@ export const MODELS = {
|
|
|
9530
9243
|
reasoning: true,
|
|
9531
9244
|
input: ["text", "image"],
|
|
9532
9245
|
cost: {
|
|
9533
|
-
input: 0.
|
|
9534
|
-
output: 0.
|
|
9246
|
+
input: 0.12,
|
|
9247
|
+
output: 0.37,
|
|
9535
9248
|
cacheRead: 0,
|
|
9536
9249
|
cacheWrite: 0,
|
|
9537
9250
|
},
|
|
@@ -9579,6 +9292,7 @@ export const MODELS = {
|
|
|
9579
9292
|
provider: "openrouter",
|
|
9580
9293
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
9581
9294
|
reasoning: true,
|
|
9295
|
+
thinkingLevelMap: { "off": null },
|
|
9582
9296
|
input: ["text"],
|
|
9583
9297
|
cost: {
|
|
9584
9298
|
input: 0.25,
|
|
@@ -9598,9 +9312,9 @@ export const MODELS = {
|
|
|
9598
9312
|
reasoning: false,
|
|
9599
9313
|
input: ["text"],
|
|
9600
9314
|
cost: {
|
|
9601
|
-
input: 0.
|
|
9602
|
-
output:
|
|
9603
|
-
cacheRead: 0.
|
|
9315
|
+
input: 0.075,
|
|
9316
|
+
output: 0.625,
|
|
9317
|
+
cacheRead: 0.015,
|
|
9604
9318
|
cacheWrite: 0,
|
|
9605
9319
|
},
|
|
9606
9320
|
contextWindow: 262144,
|
|
@@ -9615,14 +9329,31 @@ export const MODELS = {
|
|
|
9615
9329
|
reasoning: false,
|
|
9616
9330
|
input: ["text"],
|
|
9617
9331
|
cost: {
|
|
9618
|
-
input: 0.
|
|
9619
|
-
output: 0.
|
|
9620
|
-
cacheRead: 0.
|
|
9332
|
+
input: 0.01,
|
|
9333
|
+
output: 0.03,
|
|
9334
|
+
cacheRead: 0.002,
|
|
9621
9335
|
cacheWrite: 0,
|
|
9622
9336
|
},
|
|
9623
9337
|
contextWindow: 262144,
|
|
9624
9338
|
maxTokens: 32768,
|
|
9625
9339
|
},
|
|
9340
|
+
"inclusionai/ring-2.6-1t": {
|
|
9341
|
+
id: "inclusionai/ring-2.6-1t",
|
|
9342
|
+
name: "inclusionAI: Ring-2.6-1T",
|
|
9343
|
+
api: "openai-completions",
|
|
9344
|
+
provider: "openrouter",
|
|
9345
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
9346
|
+
reasoning: true,
|
|
9347
|
+
input: ["text"],
|
|
9348
|
+
cost: {
|
|
9349
|
+
input: 0.075,
|
|
9350
|
+
output: 0.625,
|
|
9351
|
+
cacheRead: 0.015,
|
|
9352
|
+
cacheWrite: 0,
|
|
9353
|
+
},
|
|
9354
|
+
contextWindow: 262144,
|
|
9355
|
+
maxTokens: 65536,
|
|
9356
|
+
},
|
|
9626
9357
|
"kwaipilot/kat-coder-pro-v2": {
|
|
9627
9358
|
id: "kwaipilot/kat-coder-pro-v2",
|
|
9628
9359
|
name: "Kwaipilot: KAT-Coder-Pro V2",
|
|
@@ -9671,7 +9402,7 @@ export const MODELS = {
|
|
|
9671
9402
|
cacheRead: 0,
|
|
9672
9403
|
cacheWrite: 0,
|
|
9673
9404
|
},
|
|
9674
|
-
contextWindow:
|
|
9405
|
+
contextWindow: 131072,
|
|
9675
9406
|
maxTokens: 16384,
|
|
9676
9407
|
},
|
|
9677
9408
|
"meta-llama/llama-3.3-70b-instruct": {
|
|
@@ -9705,7 +9436,7 @@ export const MODELS = {
|
|
|
9705
9436
|
cacheRead: 0,
|
|
9706
9437
|
cacheWrite: 0,
|
|
9707
9438
|
},
|
|
9708
|
-
contextWindow:
|
|
9439
|
+
contextWindow: 131072,
|
|
9709
9440
|
maxTokens: 4096,
|
|
9710
9441
|
},
|
|
9711
9442
|
"meta-llama/llama-4-scout": {
|
|
@@ -9722,7 +9453,7 @@ export const MODELS = {
|
|
|
9722
9453
|
cacheRead: 0,
|
|
9723
9454
|
cacheWrite: 0,
|
|
9724
9455
|
},
|
|
9725
|
-
contextWindow:
|
|
9456
|
+
contextWindow: 10000000,
|
|
9726
9457
|
maxTokens: 16384,
|
|
9727
9458
|
},
|
|
9728
9459
|
"minimax/minimax-m1": {
|
|
@@ -9756,7 +9487,7 @@ export const MODELS = {
|
|
|
9756
9487
|
cacheRead: 0.03,
|
|
9757
9488
|
cacheWrite: 0,
|
|
9758
9489
|
},
|
|
9759
|
-
contextWindow:
|
|
9490
|
+
contextWindow: 204800,
|
|
9760
9491
|
maxTokens: 196608,
|
|
9761
9492
|
},
|
|
9762
9493
|
"minimax/minimax-m2.1": {
|
|
@@ -9773,7 +9504,7 @@ export const MODELS = {
|
|
|
9773
9504
|
cacheRead: 0.03,
|
|
9774
9505
|
cacheWrite: 0,
|
|
9775
9506
|
},
|
|
9776
|
-
contextWindow:
|
|
9507
|
+
contextWindow: 204800,
|
|
9777
9508
|
maxTokens: 196608,
|
|
9778
9509
|
},
|
|
9779
9510
|
"minimax/minimax-m2.5": {
|
|
@@ -9787,11 +9518,11 @@ export const MODELS = {
|
|
|
9787
9518
|
cost: {
|
|
9788
9519
|
input: 0.15,
|
|
9789
9520
|
output: 1.15,
|
|
9790
|
-
cacheRead: 0
|
|
9521
|
+
cacheRead: 0,
|
|
9791
9522
|
cacheWrite: 0,
|
|
9792
9523
|
},
|
|
9793
|
-
contextWindow:
|
|
9794
|
-
maxTokens:
|
|
9524
|
+
contextWindow: 204800,
|
|
9525
|
+
maxTokens: 196608,
|
|
9795
9526
|
},
|
|
9796
9527
|
"minimax/minimax-m2.5:free": {
|
|
9797
9528
|
id: "minimax/minimax-m2.5:free",
|
|
@@ -9807,7 +9538,7 @@ export const MODELS = {
|
|
|
9807
9538
|
cacheRead: 0,
|
|
9808
9539
|
cacheWrite: 0,
|
|
9809
9540
|
},
|
|
9810
|
-
contextWindow:
|
|
9541
|
+
contextWindow: 204800,
|
|
9811
9542
|
maxTokens: 8192,
|
|
9812
9543
|
},
|
|
9813
9544
|
"minimax/minimax-m2.7": {
|
|
@@ -9819,13 +9550,13 @@ export const MODELS = {
|
|
|
9819
9550
|
reasoning: true,
|
|
9820
9551
|
input: ["text"],
|
|
9821
9552
|
cost: {
|
|
9822
|
-
input: 0.
|
|
9553
|
+
input: 0.27899999999999997,
|
|
9823
9554
|
output: 1.2,
|
|
9824
|
-
cacheRead: 0
|
|
9555
|
+
cacheRead: 0,
|
|
9825
9556
|
cacheWrite: 0,
|
|
9826
9557
|
},
|
|
9827
|
-
contextWindow:
|
|
9828
|
-
maxTokens:
|
|
9558
|
+
contextWindow: 204800,
|
|
9559
|
+
maxTokens: 131072,
|
|
9829
9560
|
},
|
|
9830
9561
|
"mistralai/codestral-2508": {
|
|
9831
9562
|
id: "mistralai/codestral-2508",
|
|
@@ -10150,23 +9881,6 @@ export const MODELS = {
|
|
|
10150
9881
|
contextWindow: 65536,
|
|
10151
9882
|
maxTokens: 4096,
|
|
10152
9883
|
},
|
|
10153
|
-
"mistralai/mixtral-8x7b-instruct": {
|
|
10154
|
-
id: "mistralai/mixtral-8x7b-instruct",
|
|
10155
|
-
name: "Mistral: Mixtral 8x7B Instruct",
|
|
10156
|
-
api: "openai-completions",
|
|
10157
|
-
provider: "openrouter",
|
|
10158
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
10159
|
-
reasoning: false,
|
|
10160
|
-
input: ["text"],
|
|
10161
|
-
cost: {
|
|
10162
|
-
input: 0.54,
|
|
10163
|
-
output: 0.54,
|
|
10164
|
-
cacheRead: 0,
|
|
10165
|
-
cacheWrite: 0,
|
|
10166
|
-
},
|
|
10167
|
-
contextWindow: 32768,
|
|
10168
|
-
maxTokens: 16384,
|
|
10169
|
-
},
|
|
10170
9884
|
"mistralai/pixtral-large-2411": {
|
|
10171
9885
|
id: "mistralai/pixtral-large-2411",
|
|
10172
9886
|
name: "Mistral: Pixtral Large 2411",
|
|
@@ -10227,8 +9941,8 @@ export const MODELS = {
|
|
|
10227
9941
|
reasoning: false,
|
|
10228
9942
|
input: ["text"],
|
|
10229
9943
|
cost: {
|
|
10230
|
-
input: 0.
|
|
10231
|
-
output: 2,
|
|
9944
|
+
input: 0.6,
|
|
9945
|
+
output: 2.5,
|
|
10232
9946
|
cacheRead: 0,
|
|
10233
9947
|
cacheWrite: 0,
|
|
10234
9948
|
},
|
|
@@ -10246,7 +9960,7 @@ export const MODELS = {
|
|
|
10246
9960
|
cost: {
|
|
10247
9961
|
input: 0.6,
|
|
10248
9962
|
output: 2.5,
|
|
10249
|
-
cacheRead: 0
|
|
9963
|
+
cacheRead: 0,
|
|
10250
9964
|
cacheWrite: 0,
|
|
10251
9965
|
},
|
|
10252
9966
|
contextWindow: 262144,
|
|
@@ -10278,13 +9992,13 @@ export const MODELS = {
|
|
|
10278
9992
|
reasoning: true,
|
|
10279
9993
|
input: ["text", "image"],
|
|
10280
9994
|
cost: {
|
|
10281
|
-
input: 0.
|
|
10282
|
-
output: 3.
|
|
10283
|
-
cacheRead: 0.
|
|
9995
|
+
input: 0.73,
|
|
9996
|
+
output: 3.49,
|
|
9997
|
+
cacheRead: 0.25,
|
|
10284
9998
|
cacheWrite: 0,
|
|
10285
9999
|
},
|
|
10286
10000
|
contextWindow: 262144,
|
|
10287
|
-
maxTokens:
|
|
10001
|
+
maxTokens: 262142,
|
|
10288
10002
|
},
|
|
10289
10003
|
"nex-agi/deepseek-v3.1-nex-n1": {
|
|
10290
10004
|
id: "nex-agi/deepseek-v3.1-nex-n1",
|
|
@@ -10303,23 +10017,6 @@ export const MODELS = {
|
|
|
10303
10017
|
contextWindow: 131072,
|
|
10304
10018
|
maxTokens: 163840,
|
|
10305
10019
|
},
|
|
10306
|
-
"nvidia/llama-3.1-nemotron-70b-instruct": {
|
|
10307
|
-
id: "nvidia/llama-3.1-nemotron-70b-instruct",
|
|
10308
|
-
name: "NVIDIA: Llama 3.1 Nemotron 70B Instruct",
|
|
10309
|
-
api: "openai-completions",
|
|
10310
|
-
provider: "openrouter",
|
|
10311
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
10312
|
-
reasoning: false,
|
|
10313
|
-
input: ["text"],
|
|
10314
|
-
cost: {
|
|
10315
|
-
input: 1.2,
|
|
10316
|
-
output: 1.2,
|
|
10317
|
-
cacheRead: 0,
|
|
10318
|
-
cacheWrite: 0,
|
|
10319
|
-
},
|
|
10320
|
-
contextWindow: 131072,
|
|
10321
|
-
maxTokens: 16384,
|
|
10322
|
-
},
|
|
10323
10020
|
"nvidia/llama-3.3-nemotron-super-49b-v1.5": {
|
|
10324
10021
|
id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
|
|
10325
10022
|
name: "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5",
|
|
@@ -10402,7 +10099,7 @@ export const MODELS = {
|
|
|
10402
10099
|
cacheRead: 0,
|
|
10403
10100
|
cacheWrite: 0,
|
|
10404
10101
|
},
|
|
10405
|
-
contextWindow:
|
|
10102
|
+
contextWindow: 1000000,
|
|
10406
10103
|
maxTokens: 4096,
|
|
10407
10104
|
},
|
|
10408
10105
|
"nvidia/nemotron-3-super-120b-a12b:free": {
|
|
@@ -10419,7 +10116,7 @@ export const MODELS = {
|
|
|
10419
10116
|
cacheRead: 0,
|
|
10420
10117
|
cacheWrite: 0,
|
|
10421
10118
|
},
|
|
10422
|
-
contextWindow:
|
|
10119
|
+
contextWindow: 1000000,
|
|
10423
10120
|
maxTokens: 262144,
|
|
10424
10121
|
},
|
|
10425
10122
|
"nvidia/nemotron-nano-12b-v2-vl:free": {
|
|
@@ -11570,7 +11267,7 @@ export const MODELS = {
|
|
|
11570
11267
|
cacheRead: 0,
|
|
11571
11268
|
cacheWrite: 0,
|
|
11572
11269
|
},
|
|
11573
|
-
contextWindow:
|
|
11270
|
+
contextWindow: 131072,
|
|
11574
11271
|
maxTokens: 16384,
|
|
11575
11272
|
},
|
|
11576
11273
|
"qwen/qwen-2.5-7b-instruct": {
|
|
@@ -11587,26 +11284,9 @@ export const MODELS = {
|
|
|
11587
11284
|
cacheRead: 0,
|
|
11588
11285
|
cacheWrite: 0,
|
|
11589
11286
|
},
|
|
11590
|
-
contextWindow:
|
|
11287
|
+
contextWindow: 131072,
|
|
11591
11288
|
maxTokens: 32768,
|
|
11592
11289
|
},
|
|
11593
|
-
"qwen/qwen-max": {
|
|
11594
|
-
id: "qwen/qwen-max",
|
|
11595
|
-
name: "Qwen: Qwen-Max ",
|
|
11596
|
-
api: "openai-completions",
|
|
11597
|
-
provider: "openrouter",
|
|
11598
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
11599
|
-
reasoning: false,
|
|
11600
|
-
input: ["text"],
|
|
11601
|
-
cost: {
|
|
11602
|
-
input: 1.04,
|
|
11603
|
-
output: 4.16,
|
|
11604
|
-
cacheRead: 0.20800000000000002,
|
|
11605
|
-
cacheWrite: 0,
|
|
11606
|
-
},
|
|
11607
|
-
contextWindow: 32768,
|
|
11608
|
-
maxTokens: 8192,
|
|
11609
|
-
},
|
|
11610
11290
|
"qwen/qwen-plus": {
|
|
11611
11291
|
id: "qwen/qwen-plus",
|
|
11612
11292
|
name: "Qwen: Qwen-Plus",
|
|
@@ -11658,40 +11338,6 @@ export const MODELS = {
|
|
|
11658
11338
|
contextWindow: 1000000,
|
|
11659
11339
|
maxTokens: 32768,
|
|
11660
11340
|
},
|
|
11661
|
-
"qwen/qwen-turbo": {
|
|
11662
|
-
id: "qwen/qwen-turbo",
|
|
11663
|
-
name: "Qwen: Qwen-Turbo",
|
|
11664
|
-
api: "openai-completions",
|
|
11665
|
-
provider: "openrouter",
|
|
11666
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
11667
|
-
reasoning: false,
|
|
11668
|
-
input: ["text"],
|
|
11669
|
-
cost: {
|
|
11670
|
-
input: 0.0325,
|
|
11671
|
-
output: 0.13,
|
|
11672
|
-
cacheRead: 0.006500000000000001,
|
|
11673
|
-
cacheWrite: 0,
|
|
11674
|
-
},
|
|
11675
|
-
contextWindow: 131072,
|
|
11676
|
-
maxTokens: 8192,
|
|
11677
|
-
},
|
|
11678
|
-
"qwen/qwen-vl-max": {
|
|
11679
|
-
id: "qwen/qwen-vl-max",
|
|
11680
|
-
name: "Qwen: Qwen VL Max",
|
|
11681
|
-
api: "openai-completions",
|
|
11682
|
-
provider: "openrouter",
|
|
11683
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
11684
|
-
reasoning: false,
|
|
11685
|
-
input: ["text", "image"],
|
|
11686
|
-
cost: {
|
|
11687
|
-
input: 0.52,
|
|
11688
|
-
output: 2.08,
|
|
11689
|
-
cacheRead: 0,
|
|
11690
|
-
cacheWrite: 0,
|
|
11691
|
-
},
|
|
11692
|
-
contextWindow: 131072,
|
|
11693
|
-
maxTokens: 32768,
|
|
11694
|
-
},
|
|
11695
11341
|
"qwen/qwen3-14b": {
|
|
11696
11342
|
id: "qwen/qwen3-14b",
|
|
11697
11343
|
name: "Qwen: Qwen3 14B",
|
|
@@ -11701,12 +11347,12 @@ export const MODELS = {
|
|
|
11701
11347
|
reasoning: true,
|
|
11702
11348
|
input: ["text"],
|
|
11703
11349
|
cost: {
|
|
11704
|
-
input: 0.
|
|
11350
|
+
input: 0.09999999999999999,
|
|
11705
11351
|
output: 0.24,
|
|
11706
11352
|
cacheRead: 0,
|
|
11707
11353
|
cacheWrite: 0,
|
|
11708
11354
|
},
|
|
11709
|
-
contextWindow:
|
|
11355
|
+
contextWindow: 131702,
|
|
11710
11356
|
maxTokens: 40960,
|
|
11711
11357
|
},
|
|
11712
11358
|
"qwen/qwen3-235b-a22b": {
|
|
@@ -11757,7 +11403,7 @@ export const MODELS = {
|
|
|
11757
11403
|
cacheRead: 0,
|
|
11758
11404
|
cacheWrite: 0,
|
|
11759
11405
|
},
|
|
11760
|
-
contextWindow:
|
|
11406
|
+
contextWindow: 262144,
|
|
11761
11407
|
maxTokens: 4096,
|
|
11762
11408
|
},
|
|
11763
11409
|
"qwen/qwen3-30b-a3b": {
|
|
@@ -11774,7 +11420,7 @@ export const MODELS = {
|
|
|
11774
11420
|
cacheRead: 0,
|
|
11775
11421
|
cacheWrite: 0,
|
|
11776
11422
|
},
|
|
11777
|
-
contextWindow:
|
|
11423
|
+
contextWindow: 131072,
|
|
11778
11424
|
maxTokens: 20000,
|
|
11779
11425
|
},
|
|
11780
11426
|
"qwen/qwen3-30b-a3b-instruct-2507": {
|
|
@@ -11821,12 +11467,12 @@ export const MODELS = {
|
|
|
11821
11467
|
input: ["text"],
|
|
11822
11468
|
cost: {
|
|
11823
11469
|
input: 0.08,
|
|
11824
|
-
output: 0.
|
|
11825
|
-
cacheRead: 0
|
|
11470
|
+
output: 0.28,
|
|
11471
|
+
cacheRead: 0,
|
|
11826
11472
|
cacheWrite: 0,
|
|
11827
11473
|
},
|
|
11828
|
-
contextWindow:
|
|
11829
|
-
maxTokens:
|
|
11474
|
+
contextWindow: 131072,
|
|
11475
|
+
maxTokens: 16384,
|
|
11830
11476
|
},
|
|
11831
11477
|
"qwen/qwen3-8b": {
|
|
11832
11478
|
id: "qwen/qwen3-8b",
|
|
@@ -11842,7 +11488,7 @@ export const MODELS = {
|
|
|
11842
11488
|
cacheRead: 0.049999999999999996,
|
|
11843
11489
|
cacheWrite: 0,
|
|
11844
11490
|
},
|
|
11845
|
-
contextWindow:
|
|
11491
|
+
contextWindow: 131072,
|
|
11846
11492
|
maxTokens: 8192,
|
|
11847
11493
|
},
|
|
11848
11494
|
"qwen/qwen3-coder": {
|
|
@@ -11859,7 +11505,7 @@ export const MODELS = {
|
|
|
11859
11505
|
cacheRead: 0,
|
|
11860
11506
|
cacheWrite: 0,
|
|
11861
11507
|
},
|
|
11862
|
-
contextWindow:
|
|
11508
|
+
contextWindow: 1048576,
|
|
11863
11509
|
maxTokens: 65536,
|
|
11864
11510
|
},
|
|
11865
11511
|
"qwen/qwen3-coder-30b-a3b-instruct": {
|
|
@@ -11944,7 +11590,7 @@ export const MODELS = {
|
|
|
11944
11590
|
cacheRead: 0,
|
|
11945
11591
|
cacheWrite: 0,
|
|
11946
11592
|
},
|
|
11947
|
-
contextWindow:
|
|
11593
|
+
contextWindow: 1048576,
|
|
11948
11594
|
maxTokens: 262000,
|
|
11949
11595
|
},
|
|
11950
11596
|
"qwen/qwen3-max": {
|
|
@@ -12029,7 +11675,7 @@ export const MODELS = {
|
|
|
12029
11675
|
cacheRead: 0,
|
|
12030
11676
|
cacheWrite: 0,
|
|
12031
11677
|
},
|
|
12032
|
-
contextWindow:
|
|
11678
|
+
contextWindow: 262144,
|
|
12033
11679
|
maxTokens: 32768,
|
|
12034
11680
|
},
|
|
12035
11681
|
"qwen/qwen3-vl-235b-a22b-instruct": {
|
|
@@ -12080,7 +11726,7 @@ export const MODELS = {
|
|
|
12080
11726
|
cacheRead: 0,
|
|
12081
11727
|
cacheWrite: 0,
|
|
12082
11728
|
},
|
|
12083
|
-
contextWindow:
|
|
11729
|
+
contextWindow: 262144,
|
|
12084
11730
|
maxTokens: 32768,
|
|
12085
11731
|
},
|
|
12086
11732
|
"qwen/qwen3-vl-30b-a3b-thinking": {
|
|
@@ -12114,7 +11760,7 @@ export const MODELS = {
|
|
|
12114
11760
|
cacheRead: 0,
|
|
12115
11761
|
cacheWrite: 0,
|
|
12116
11762
|
},
|
|
12117
|
-
contextWindow:
|
|
11763
|
+
contextWindow: 262144,
|
|
12118
11764
|
maxTokens: 32768,
|
|
12119
11765
|
},
|
|
12120
11766
|
"qwen/qwen3-vl-8b-instruct": {
|
|
@@ -12131,7 +11777,7 @@ export const MODELS = {
|
|
|
12131
11777
|
cacheRead: 0,
|
|
12132
11778
|
cacheWrite: 0,
|
|
12133
11779
|
},
|
|
12134
|
-
contextWindow:
|
|
11780
|
+
contextWindow: 256000,
|
|
12135
11781
|
maxTokens: 32768,
|
|
12136
11782
|
},
|
|
12137
11783
|
"qwen/qwen3-vl-8b-thinking": {
|
|
@@ -12148,7 +11794,7 @@ export const MODELS = {
|
|
|
12148
11794
|
cacheRead: 0,
|
|
12149
11795
|
cacheWrite: 0,
|
|
12150
11796
|
},
|
|
12151
|
-
contextWindow:
|
|
11797
|
+
contextWindow: 256000,
|
|
12152
11798
|
maxTokens: 32768,
|
|
12153
11799
|
},
|
|
12154
11800
|
"qwen/qwen3.5-122b-a10b": {
|
|
@@ -12194,13 +11840,13 @@ export const MODELS = {
|
|
|
12194
11840
|
reasoning: true,
|
|
12195
11841
|
input: ["text", "image"],
|
|
12196
11842
|
cost: {
|
|
12197
|
-
input: 0.
|
|
11843
|
+
input: 0.13899999999999998,
|
|
12198
11844
|
output: 1,
|
|
12199
|
-
cacheRead: 0
|
|
11845
|
+
cacheRead: 0,
|
|
12200
11846
|
cacheWrite: 0,
|
|
12201
11847
|
},
|
|
12202
11848
|
contextWindow: 262144,
|
|
12203
|
-
maxTokens:
|
|
11849
|
+
maxTokens: 4096,
|
|
12204
11850
|
},
|
|
12205
11851
|
"qwen/qwen3.5-397b-a17b": {
|
|
12206
11852
|
id: "qwen/qwen3.5-397b-a17b",
|
|
@@ -12213,7 +11859,7 @@ export const MODELS = {
|
|
|
12213
11859
|
cost: {
|
|
12214
11860
|
input: 0.39,
|
|
12215
11861
|
output: 2.34,
|
|
12216
|
-
cacheRead: 0
|
|
11862
|
+
cacheRead: 0,
|
|
12217
11863
|
cacheWrite: 0,
|
|
12218
11864
|
},
|
|
12219
11865
|
contextWindow: 262144,
|
|
@@ -12279,8 +11925,8 @@ export const MODELS = {
|
|
|
12279
11925
|
reasoning: true,
|
|
12280
11926
|
input: ["text", "image"],
|
|
12281
11927
|
cost: {
|
|
12282
|
-
input: 0.
|
|
12283
|
-
output:
|
|
11928
|
+
input: 0.3,
|
|
11929
|
+
output: 1.7999999999999998,
|
|
12284
11930
|
cacheRead: 0,
|
|
12285
11931
|
cacheWrite: 0,
|
|
12286
11932
|
},
|
|
@@ -12296,13 +11942,13 @@ export const MODELS = {
|
|
|
12296
11942
|
reasoning: true,
|
|
12297
11943
|
input: ["text", "image"],
|
|
12298
11944
|
cost: {
|
|
12299
|
-
input: 0.
|
|
11945
|
+
input: 0.317,
|
|
12300
11946
|
output: 3.1999999999999997,
|
|
12301
11947
|
cacheRead: 0,
|
|
12302
11948
|
cacheWrite: 0,
|
|
12303
11949
|
},
|
|
12304
11950
|
contextWindow: 262144,
|
|
12305
|
-
maxTokens:
|
|
11951
|
+
maxTokens: 262140,
|
|
12306
11952
|
},
|
|
12307
11953
|
"qwen/qwen3.6-35b-a3b": {
|
|
12308
11954
|
id: "qwen/qwen3.6-35b-a3b",
|
|
@@ -12330,10 +11976,10 @@ export const MODELS = {
|
|
|
12330
11976
|
reasoning: true,
|
|
12331
11977
|
input: ["text", "image"],
|
|
12332
11978
|
cost: {
|
|
12333
|
-
input: 0.
|
|
12334
|
-
output: 1.
|
|
11979
|
+
input: 0.1875,
|
|
11980
|
+
output: 1.125,
|
|
12335
11981
|
cacheRead: 0,
|
|
12336
|
-
cacheWrite: 0.
|
|
11982
|
+
cacheWrite: 0.234375,
|
|
12337
11983
|
},
|
|
12338
11984
|
contextWindow: 1000000,
|
|
12339
11985
|
maxTokens: 65536,
|
|
@@ -12372,6 +12018,23 @@ export const MODELS = {
|
|
|
12372
12018
|
contextWindow: 1000000,
|
|
12373
12019
|
maxTokens: 65536,
|
|
12374
12020
|
},
|
|
12021
|
+
"qwen/qwen3.7-max": {
|
|
12022
|
+
id: "qwen/qwen3.7-max",
|
|
12023
|
+
name: "Qwen: Qwen3.7 Max",
|
|
12024
|
+
api: "openai-completions",
|
|
12025
|
+
provider: "openrouter",
|
|
12026
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
12027
|
+
reasoning: true,
|
|
12028
|
+
input: ["text"],
|
|
12029
|
+
cost: {
|
|
12030
|
+
input: 2.5,
|
|
12031
|
+
output: 7.5,
|
|
12032
|
+
cacheRead: 0,
|
|
12033
|
+
cacheWrite: 3.125,
|
|
12034
|
+
},
|
|
12035
|
+
contextWindow: 1000000,
|
|
12036
|
+
maxTokens: 65536,
|
|
12037
|
+
},
|
|
12375
12038
|
"rekaai/reka-edge": {
|
|
12376
12039
|
id: "rekaai/reka-edge",
|
|
12377
12040
|
name: "Reka Edge",
|
|
@@ -12449,26 +12112,26 @@ export const MODELS = {
|
|
|
12449
12112
|
reasoning: true,
|
|
12450
12113
|
input: ["text"],
|
|
12451
12114
|
cost: {
|
|
12452
|
-
input: 0.
|
|
12115
|
+
input: 0.09,
|
|
12453
12116
|
output: 0.3,
|
|
12454
|
-
cacheRead: 0,
|
|
12117
|
+
cacheRead: 0.02,
|
|
12455
12118
|
cacheWrite: 0,
|
|
12456
12119
|
},
|
|
12457
12120
|
contextWindow: 262144,
|
|
12458
|
-
maxTokens:
|
|
12121
|
+
maxTokens: 16384,
|
|
12459
12122
|
},
|
|
12460
|
-
"tencent/hy3-preview
|
|
12461
|
-
id: "tencent/hy3-preview
|
|
12462
|
-
name: "Tencent: Hy3 preview
|
|
12123
|
+
"tencent/hy3-preview": {
|
|
12124
|
+
id: "tencent/hy3-preview",
|
|
12125
|
+
name: "Tencent: Hy3 preview",
|
|
12463
12126
|
api: "openai-completions",
|
|
12464
12127
|
provider: "openrouter",
|
|
12465
12128
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
12466
12129
|
reasoning: true,
|
|
12467
12130
|
input: ["text"],
|
|
12468
12131
|
cost: {
|
|
12469
|
-
input: 0,
|
|
12470
|
-
output: 0,
|
|
12471
|
-
cacheRead: 0,
|
|
12132
|
+
input: 0.06599999999999999,
|
|
12133
|
+
output: 0.26,
|
|
12134
|
+
cacheRead: 0.029,
|
|
12472
12135
|
cacheWrite: 0,
|
|
12473
12136
|
},
|
|
12474
12137
|
contextWindow: 262144,
|
|
@@ -12508,23 +12171,6 @@ export const MODELS = {
|
|
|
12508
12171
|
contextWindow: 32768,
|
|
12509
12172
|
maxTokens: 32768,
|
|
12510
12173
|
},
|
|
12511
|
-
"tngtech/deepseek-r1t2-chimera": {
|
|
12512
|
-
id: "tngtech/deepseek-r1t2-chimera",
|
|
12513
|
-
name: "TNG: DeepSeek R1T2 Chimera",
|
|
12514
|
-
api: "openai-completions",
|
|
12515
|
-
provider: "openrouter",
|
|
12516
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12517
|
-
reasoning: true,
|
|
12518
|
-
input: ["text"],
|
|
12519
|
-
cost: {
|
|
12520
|
-
input: 0.3,
|
|
12521
|
-
output: 1.1,
|
|
12522
|
-
cacheRead: 0.15,
|
|
12523
|
-
cacheWrite: 0,
|
|
12524
|
-
},
|
|
12525
|
-
contextWindow: 163840,
|
|
12526
|
-
maxTokens: 163840,
|
|
12527
|
-
},
|
|
12528
12174
|
"upstage/solar-pro-3": {
|
|
12529
12175
|
id: "upstage/solar-pro-3",
|
|
12530
12176
|
name: "Upstage: Solar Pro 3",
|
|
@@ -12542,125 +12188,6 @@ export const MODELS = {
|
|
|
12542
12188
|
contextWindow: 128000,
|
|
12543
12189
|
maxTokens: 4096,
|
|
12544
12190
|
},
|
|
12545
|
-
"x-ai/grok-3": {
|
|
12546
|
-
id: "x-ai/grok-3",
|
|
12547
|
-
name: "xAI: Grok 3",
|
|
12548
|
-
api: "openai-completions",
|
|
12549
|
-
provider: "openrouter",
|
|
12550
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12551
|
-
reasoning: false,
|
|
12552
|
-
input: ["text"],
|
|
12553
|
-
cost: {
|
|
12554
|
-
input: 3,
|
|
12555
|
-
output: 15,
|
|
12556
|
-
cacheRead: 0.75,
|
|
12557
|
-
cacheWrite: 0,
|
|
12558
|
-
},
|
|
12559
|
-
contextWindow: 131072,
|
|
12560
|
-
maxTokens: 4096,
|
|
12561
|
-
},
|
|
12562
|
-
"x-ai/grok-3-beta": {
|
|
12563
|
-
id: "x-ai/grok-3-beta",
|
|
12564
|
-
name: "xAI: Grok 3 Beta",
|
|
12565
|
-
api: "openai-completions",
|
|
12566
|
-
provider: "openrouter",
|
|
12567
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12568
|
-
reasoning: false,
|
|
12569
|
-
input: ["text"],
|
|
12570
|
-
cost: {
|
|
12571
|
-
input: 3,
|
|
12572
|
-
output: 15,
|
|
12573
|
-
cacheRead: 0.75,
|
|
12574
|
-
cacheWrite: 0,
|
|
12575
|
-
},
|
|
12576
|
-
contextWindow: 131072,
|
|
12577
|
-
maxTokens: 4096,
|
|
12578
|
-
},
|
|
12579
|
-
"x-ai/grok-3-mini": {
|
|
12580
|
-
id: "x-ai/grok-3-mini",
|
|
12581
|
-
name: "xAI: Grok 3 Mini",
|
|
12582
|
-
api: "openai-completions",
|
|
12583
|
-
provider: "openrouter",
|
|
12584
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12585
|
-
reasoning: true,
|
|
12586
|
-
input: ["text"],
|
|
12587
|
-
cost: {
|
|
12588
|
-
input: 0.3,
|
|
12589
|
-
output: 0.5,
|
|
12590
|
-
cacheRead: 0.075,
|
|
12591
|
-
cacheWrite: 0,
|
|
12592
|
-
},
|
|
12593
|
-
contextWindow: 131072,
|
|
12594
|
-
maxTokens: 4096,
|
|
12595
|
-
},
|
|
12596
|
-
"x-ai/grok-3-mini-beta": {
|
|
12597
|
-
id: "x-ai/grok-3-mini-beta",
|
|
12598
|
-
name: "xAI: Grok 3 Mini Beta",
|
|
12599
|
-
api: "openai-completions",
|
|
12600
|
-
provider: "openrouter",
|
|
12601
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12602
|
-
reasoning: true,
|
|
12603
|
-
input: ["text"],
|
|
12604
|
-
cost: {
|
|
12605
|
-
input: 0.3,
|
|
12606
|
-
output: 0.5,
|
|
12607
|
-
cacheRead: 0.075,
|
|
12608
|
-
cacheWrite: 0,
|
|
12609
|
-
},
|
|
12610
|
-
contextWindow: 131072,
|
|
12611
|
-
maxTokens: 4096,
|
|
12612
|
-
},
|
|
12613
|
-
"x-ai/grok-4": {
|
|
12614
|
-
id: "x-ai/grok-4",
|
|
12615
|
-
name: "xAI: Grok 4",
|
|
12616
|
-
api: "openai-completions",
|
|
12617
|
-
provider: "openrouter",
|
|
12618
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12619
|
-
reasoning: true,
|
|
12620
|
-
input: ["text", "image"],
|
|
12621
|
-
cost: {
|
|
12622
|
-
input: 3,
|
|
12623
|
-
output: 15,
|
|
12624
|
-
cacheRead: 0.75,
|
|
12625
|
-
cacheWrite: 0,
|
|
12626
|
-
},
|
|
12627
|
-
contextWindow: 256000,
|
|
12628
|
-
maxTokens: 4096,
|
|
12629
|
-
},
|
|
12630
|
-
"x-ai/grok-4-fast": {
|
|
12631
|
-
id: "x-ai/grok-4-fast",
|
|
12632
|
-
name: "xAI: Grok 4 Fast",
|
|
12633
|
-
api: "openai-completions",
|
|
12634
|
-
provider: "openrouter",
|
|
12635
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12636
|
-
reasoning: true,
|
|
12637
|
-
input: ["text", "image"],
|
|
12638
|
-
cost: {
|
|
12639
|
-
input: 0.19999999999999998,
|
|
12640
|
-
output: 0.5,
|
|
12641
|
-
cacheRead: 0.049999999999999996,
|
|
12642
|
-
cacheWrite: 0,
|
|
12643
|
-
},
|
|
12644
|
-
contextWindow: 2000000,
|
|
12645
|
-
maxTokens: 30000,
|
|
12646
|
-
},
|
|
12647
|
-
"x-ai/grok-4.1-fast": {
|
|
12648
|
-
id: "x-ai/grok-4.1-fast",
|
|
12649
|
-
name: "xAI: Grok 4.1 Fast",
|
|
12650
|
-
api: "openai-completions",
|
|
12651
|
-
provider: "openrouter",
|
|
12652
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12653
|
-
reasoning: true,
|
|
12654
|
-
input: ["text", "image"],
|
|
12655
|
-
cost: {
|
|
12656
|
-
input: 0.19999999999999998,
|
|
12657
|
-
output: 0.5,
|
|
12658
|
-
cacheRead: 0.049999999999999996,
|
|
12659
|
-
cacheWrite: 0,
|
|
12660
|
-
},
|
|
12661
|
-
contextWindow: 2000000,
|
|
12662
|
-
maxTokens: 30000,
|
|
12663
|
-
},
|
|
12664
12191
|
"x-ai/grok-4.20": {
|
|
12665
12192
|
id: "x-ai/grok-4.20",
|
|
12666
12193
|
name: "xAI: Grok 4.20",
|
|
@@ -12695,22 +12222,22 @@ export const MODELS = {
|
|
|
12695
12222
|
contextWindow: 1000000,
|
|
12696
12223
|
maxTokens: 4096,
|
|
12697
12224
|
},
|
|
12698
|
-
"x-ai/grok-
|
|
12699
|
-
id: "x-ai/grok-
|
|
12700
|
-
name: "xAI: Grok
|
|
12225
|
+
"x-ai/grok-build-0.1": {
|
|
12226
|
+
id: "x-ai/grok-build-0.1",
|
|
12227
|
+
name: "xAI: Grok Build 0.1",
|
|
12701
12228
|
api: "openai-completions",
|
|
12702
12229
|
provider: "openrouter",
|
|
12703
12230
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
12704
12231
|
reasoning: true,
|
|
12705
|
-
input: ["text"],
|
|
12232
|
+
input: ["text", "image"],
|
|
12706
12233
|
cost: {
|
|
12707
|
-
input:
|
|
12708
|
-
output:
|
|
12709
|
-
cacheRead: 0.
|
|
12234
|
+
input: 1,
|
|
12235
|
+
output: 2,
|
|
12236
|
+
cacheRead: 0.19999999999999998,
|
|
12710
12237
|
cacheWrite: 0,
|
|
12711
12238
|
},
|
|
12712
12239
|
contextWindow: 256000,
|
|
12713
|
-
maxTokens:
|
|
12240
|
+
maxTokens: 4096,
|
|
12714
12241
|
},
|
|
12715
12242
|
"xiaomi/mimo-v2-flash": {
|
|
12716
12243
|
id: "xiaomi/mimo-v2-flash",
|
|
@@ -12721,9 +12248,9 @@ export const MODELS = {
|
|
|
12721
12248
|
reasoning: true,
|
|
12722
12249
|
input: ["text"],
|
|
12723
12250
|
cost: {
|
|
12724
|
-
input: 0.
|
|
12725
|
-
output: 0.
|
|
12726
|
-
cacheRead: 0.
|
|
12251
|
+
input: 0.09999999999999999,
|
|
12252
|
+
output: 0.3,
|
|
12253
|
+
cacheRead: 0.01,
|
|
12727
12254
|
cacheWrite: 0,
|
|
12728
12255
|
},
|
|
12729
12256
|
contextWindow: 262144,
|
|
@@ -12795,7 +12322,7 @@ export const MODELS = {
|
|
|
12795
12322
|
cacheWrite: 0,
|
|
12796
12323
|
},
|
|
12797
12324
|
contextWindow: 1048576,
|
|
12798
|
-
maxTokens:
|
|
12325
|
+
maxTokens: 16384,
|
|
12799
12326
|
},
|
|
12800
12327
|
"z-ai/glm-4-32b": {
|
|
12801
12328
|
id: "z-ai/glm-4-32b",
|
|
@@ -12891,13 +12418,13 @@ export const MODELS = {
|
|
|
12891
12418
|
reasoning: true,
|
|
12892
12419
|
input: ["text"],
|
|
12893
12420
|
cost: {
|
|
12894
|
-
input: 0.
|
|
12895
|
-
output: 1.
|
|
12896
|
-
cacheRead: 0,
|
|
12421
|
+
input: 0.43,
|
|
12422
|
+
output: 1.74,
|
|
12423
|
+
cacheRead: 0.08,
|
|
12897
12424
|
cacheWrite: 0,
|
|
12898
12425
|
},
|
|
12899
|
-
contextWindow:
|
|
12900
|
-
maxTokens:
|
|
12426
|
+
contextWindow: 202752,
|
|
12427
|
+
maxTokens: 131072,
|
|
12901
12428
|
},
|
|
12902
12429
|
"z-ai/glm-4.6v": {
|
|
12903
12430
|
id: "z-ai/glm-4.6v",
|
|
@@ -12925,13 +12452,13 @@ export const MODELS = {
|
|
|
12925
12452
|
reasoning: true,
|
|
12926
12453
|
input: ["text"],
|
|
12927
12454
|
cost: {
|
|
12928
|
-
input: 0.
|
|
12929
|
-
output: 1.
|
|
12930
|
-
cacheRead: 0,
|
|
12455
|
+
input: 0.39999999999999997,
|
|
12456
|
+
output: 1.75,
|
|
12457
|
+
cacheRead: 0.08,
|
|
12931
12458
|
cacheWrite: 0,
|
|
12932
12459
|
},
|
|
12933
12460
|
contextWindow: 202752,
|
|
12934
|
-
maxTokens:
|
|
12461
|
+
maxTokens: 131072,
|
|
12935
12462
|
},
|
|
12936
12463
|
"z-ai/glm-4.7-flash": {
|
|
12937
12464
|
id: "z-ai/glm-4.7-flash",
|
|
@@ -12993,13 +12520,13 @@ export const MODELS = {
|
|
|
12993
12520
|
reasoning: true,
|
|
12994
12521
|
input: ["text"],
|
|
12995
12522
|
cost: {
|
|
12996
|
-
input:
|
|
12997
|
-
output: 3.
|
|
12998
|
-
cacheRead: 0.
|
|
12523
|
+
input: 0.98,
|
|
12524
|
+
output: 3.08,
|
|
12525
|
+
cacheRead: 0.182,
|
|
12999
12526
|
cacheWrite: 0,
|
|
13000
12527
|
},
|
|
13001
12528
|
contextWindow: 202752,
|
|
13002
|
-
maxTokens:
|
|
12529
|
+
maxTokens: 4096,
|
|
13003
12530
|
},
|
|
13004
12531
|
"z-ai/glm-5v-turbo": {
|
|
13005
12532
|
id: "z-ai/glm-5v-turbo",
|
|
@@ -13078,9 +12605,9 @@ export const MODELS = {
|
|
|
13078
12605
|
reasoning: true,
|
|
13079
12606
|
input: ["text", "image"],
|
|
13080
12607
|
cost: {
|
|
13081
|
-
input:
|
|
13082
|
-
output:
|
|
13083
|
-
cacheRead: 0.
|
|
12608
|
+
input: 1.5,
|
|
12609
|
+
output: 9,
|
|
12610
|
+
cacheRead: 0.15,
|
|
13084
12611
|
cacheWrite: 0.08333333333333334,
|
|
13085
12612
|
},
|
|
13086
12613
|
contextWindow: 1048576,
|
|
@@ -13112,13 +12639,13 @@ export const MODELS = {
|
|
|
13112
12639
|
reasoning: true,
|
|
13113
12640
|
input: ["text", "image"],
|
|
13114
12641
|
cost: {
|
|
13115
|
-
input: 0.
|
|
13116
|
-
output: 3.
|
|
13117
|
-
cacheRead: 0.
|
|
12642
|
+
input: 0.73,
|
|
12643
|
+
output: 3.49,
|
|
12644
|
+
cacheRead: 0.25,
|
|
13118
12645
|
cacheWrite: 0,
|
|
13119
12646
|
},
|
|
13120
12647
|
contextWindow: 262144,
|
|
13121
|
-
maxTokens:
|
|
12648
|
+
maxTokens: 262142,
|
|
13122
12649
|
},
|
|
13123
12650
|
"~openai/gpt-latest": {
|
|
13124
12651
|
id: "~openai/gpt-latest",
|
|
@@ -13155,62 +12682,384 @@ export const MODELS = {
|
|
|
13155
12682
|
maxTokens: 128000,
|
|
13156
12683
|
},
|
|
13157
12684
|
},
|
|
13158
|
-
"
|
|
13159
|
-
"
|
|
13160
|
-
id: "
|
|
13161
|
-
name: "
|
|
13162
|
-
api: "
|
|
13163
|
-
provider: "
|
|
13164
|
-
baseUrl: "https://
|
|
12685
|
+
"together": {
|
|
12686
|
+
"MiniMaxAI/MiniMax-M2.5": {
|
|
12687
|
+
id: "MiniMaxAI/MiniMax-M2.5",
|
|
12688
|
+
name: "MiniMax-M2.5",
|
|
12689
|
+
api: "openai-completions",
|
|
12690
|
+
provider: "together",
|
|
12691
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12692
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
13165
12693
|
reasoning: true,
|
|
12694
|
+
thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
|
|
13166
12695
|
input: ["text"],
|
|
13167
12696
|
cost: {
|
|
13168
|
-
input: 0.
|
|
13169
|
-
output:
|
|
13170
|
-
cacheRead: 0,
|
|
12697
|
+
input: 0.3,
|
|
12698
|
+
output: 1.2,
|
|
12699
|
+
cacheRead: 0.06,
|
|
13171
12700
|
cacheWrite: 0,
|
|
13172
12701
|
},
|
|
13173
|
-
contextWindow:
|
|
13174
|
-
maxTokens:
|
|
12702
|
+
contextWindow: 204800,
|
|
12703
|
+
maxTokens: 131072,
|
|
13175
12704
|
},
|
|
13176
|
-
"
|
|
13177
|
-
id: "
|
|
13178
|
-
name: "
|
|
13179
|
-
api: "
|
|
13180
|
-
provider: "
|
|
13181
|
-
baseUrl: "https://
|
|
13182
|
-
|
|
12705
|
+
"MiniMaxAI/MiniMax-M2.7": {
|
|
12706
|
+
id: "MiniMaxAI/MiniMax-M2.7",
|
|
12707
|
+
name: "MiniMax-M2.7",
|
|
12708
|
+
api: "openai-completions",
|
|
12709
|
+
provider: "together",
|
|
12710
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12711
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
12712
|
+
reasoning: true,
|
|
12713
|
+
thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
|
|
13183
12714
|
input: ["text"],
|
|
13184
12715
|
cost: {
|
|
13185
|
-
input: 0.
|
|
12716
|
+
input: 0.3,
|
|
13186
12717
|
output: 1.2,
|
|
13187
|
-
cacheRead: 0.
|
|
12718
|
+
cacheRead: 0.06,
|
|
13188
12719
|
cacheWrite: 0,
|
|
13189
12720
|
},
|
|
13190
|
-
contextWindow:
|
|
13191
|
-
maxTokens:
|
|
12721
|
+
contextWindow: 202752,
|
|
12722
|
+
maxTokens: 131072,
|
|
13192
12723
|
},
|
|
13193
|
-
"
|
|
13194
|
-
id: "
|
|
13195
|
-
name: "Qwen3
|
|
13196
|
-
api: "
|
|
13197
|
-
provider: "
|
|
13198
|
-
baseUrl: "https://
|
|
12724
|
+
"Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
|
|
12725
|
+
id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
|
|
12726
|
+
name: "Qwen3 235B A22B Instruct 2507 FP8",
|
|
12727
|
+
api: "openai-completions",
|
|
12728
|
+
provider: "together",
|
|
12729
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12730
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
13199
12731
|
reasoning: true,
|
|
12732
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13200
12733
|
input: ["text"],
|
|
13201
12734
|
cost: {
|
|
13202
|
-
input: 0.
|
|
13203
|
-
output: 0.
|
|
12735
|
+
input: 0.2,
|
|
12736
|
+
output: 0.6,
|
|
13204
12737
|
cacheRead: 0,
|
|
13205
12738
|
cacheWrite: 0,
|
|
13206
12739
|
},
|
|
13207
|
-
contextWindow:
|
|
13208
|
-
maxTokens:
|
|
12740
|
+
contextWindow: 262144,
|
|
12741
|
+
maxTokens: 262144,
|
|
13209
12742
|
},
|
|
13210
|
-
"
|
|
13211
|
-
id: "
|
|
13212
|
-
name: "
|
|
13213
|
-
api: "
|
|
12743
|
+
"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8": {
|
|
12744
|
+
id: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
|
|
12745
|
+
name: "Qwen3 Coder 480B A35B Instruct",
|
|
12746
|
+
api: "openai-completions",
|
|
12747
|
+
provider: "together",
|
|
12748
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12749
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
12750
|
+
reasoning: false,
|
|
12751
|
+
input: ["text"],
|
|
12752
|
+
cost: {
|
|
12753
|
+
input: 2,
|
|
12754
|
+
output: 2,
|
|
12755
|
+
cacheRead: 0,
|
|
12756
|
+
cacheWrite: 0,
|
|
12757
|
+
},
|
|
12758
|
+
contextWindow: 262144,
|
|
12759
|
+
maxTokens: 262144,
|
|
12760
|
+
},
|
|
12761
|
+
"Qwen/Qwen3-Coder-Next-FP8": {
|
|
12762
|
+
id: "Qwen/Qwen3-Coder-Next-FP8",
|
|
12763
|
+
name: "Qwen3 Coder Next FP8",
|
|
12764
|
+
api: "openai-completions",
|
|
12765
|
+
provider: "together",
|
|
12766
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12767
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12768
|
+
reasoning: true,
|
|
12769
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
12770
|
+
input: ["text"],
|
|
12771
|
+
cost: {
|
|
12772
|
+
input: 0.5,
|
|
12773
|
+
output: 1.2,
|
|
12774
|
+
cacheRead: 0,
|
|
12775
|
+
cacheWrite: 0,
|
|
12776
|
+
},
|
|
12777
|
+
contextWindow: 262144,
|
|
12778
|
+
maxTokens: 262144,
|
|
12779
|
+
},
|
|
12780
|
+
"Qwen/Qwen3.5-397B-A17B": {
|
|
12781
|
+
id: "Qwen/Qwen3.5-397B-A17B",
|
|
12782
|
+
name: "Qwen3.5 397B A17B",
|
|
12783
|
+
api: "openai-completions",
|
|
12784
|
+
provider: "together",
|
|
12785
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12786
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12787
|
+
reasoning: true,
|
|
12788
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
12789
|
+
input: ["text", "image"],
|
|
12790
|
+
cost: {
|
|
12791
|
+
input: 0.6,
|
|
12792
|
+
output: 3.6,
|
|
12793
|
+
cacheRead: 0,
|
|
12794
|
+
cacheWrite: 0,
|
|
12795
|
+
},
|
|
12796
|
+
contextWindow: 262144,
|
|
12797
|
+
maxTokens: 130000,
|
|
12798
|
+
},
|
|
12799
|
+
"Qwen/Qwen3.6-Plus": {
|
|
12800
|
+
id: "Qwen/Qwen3.6-Plus",
|
|
12801
|
+
name: "Qwen3.6 Plus",
|
|
12802
|
+
api: "openai-completions",
|
|
12803
|
+
provider: "together",
|
|
12804
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12805
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12806
|
+
reasoning: true,
|
|
12807
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
12808
|
+
input: ["text"],
|
|
12809
|
+
cost: {
|
|
12810
|
+
input: 0.5,
|
|
12811
|
+
output: 3,
|
|
12812
|
+
cacheRead: 0,
|
|
12813
|
+
cacheWrite: 0,
|
|
12814
|
+
},
|
|
12815
|
+
contextWindow: 1000000,
|
|
12816
|
+
maxTokens: 500000,
|
|
12817
|
+
},
|
|
12818
|
+
"deepseek-ai/DeepSeek-V3": {
|
|
12819
|
+
id: "deepseek-ai/DeepSeek-V3",
|
|
12820
|
+
name: "DeepSeek V3",
|
|
12821
|
+
api: "openai-completions",
|
|
12822
|
+
provider: "together",
|
|
12823
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12824
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12825
|
+
reasoning: true,
|
|
12826
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
12827
|
+
input: ["text"],
|
|
12828
|
+
cost: {
|
|
12829
|
+
input: 1.25,
|
|
12830
|
+
output: 1.25,
|
|
12831
|
+
cacheRead: 0,
|
|
12832
|
+
cacheWrite: 0,
|
|
12833
|
+
},
|
|
12834
|
+
contextWindow: 131072,
|
|
12835
|
+
maxTokens: 131072,
|
|
12836
|
+
},
|
|
12837
|
+
"deepseek-ai/DeepSeek-V3-1": {
|
|
12838
|
+
id: "deepseek-ai/DeepSeek-V3-1",
|
|
12839
|
+
name: "DeepSeek V3.1",
|
|
12840
|
+
api: "openai-completions",
|
|
12841
|
+
provider: "together",
|
|
12842
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12843
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12844
|
+
reasoning: true,
|
|
12845
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
12846
|
+
input: ["text"],
|
|
12847
|
+
cost: {
|
|
12848
|
+
input: 0.6,
|
|
12849
|
+
output: 1.7,
|
|
12850
|
+
cacheRead: 0,
|
|
12851
|
+
cacheWrite: 0,
|
|
12852
|
+
},
|
|
12853
|
+
contextWindow: 131072,
|
|
12854
|
+
maxTokens: 131072,
|
|
12855
|
+
},
|
|
12856
|
+
"deepseek-ai/DeepSeek-V4-Pro": {
|
|
12857
|
+
id: "deepseek-ai/DeepSeek-V4-Pro",
|
|
12858
|
+
name: "DeepSeek V4 Pro",
|
|
12859
|
+
api: "openai-completions",
|
|
12860
|
+
provider: "together",
|
|
12861
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12862
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12863
|
+
reasoning: true,
|
|
12864
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": null },
|
|
12865
|
+
input: ["text"],
|
|
12866
|
+
cost: {
|
|
12867
|
+
input: 2.1,
|
|
12868
|
+
output: 4.4,
|
|
12869
|
+
cacheRead: 0.2,
|
|
12870
|
+
cacheWrite: 0,
|
|
12871
|
+
},
|
|
12872
|
+
contextWindow: 512000,
|
|
12873
|
+
maxTokens: 384000,
|
|
12874
|
+
},
|
|
12875
|
+
"essentialai/Rnj-1-Instruct": {
|
|
12876
|
+
id: "essentialai/Rnj-1-Instruct",
|
|
12877
|
+
name: "Rnj-1 Instruct",
|
|
12878
|
+
api: "openai-completions",
|
|
12879
|
+
provider: "together",
|
|
12880
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12881
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
12882
|
+
reasoning: false,
|
|
12883
|
+
input: ["text"],
|
|
12884
|
+
cost: {
|
|
12885
|
+
input: 0.15,
|
|
12886
|
+
output: 0.15,
|
|
12887
|
+
cacheRead: 0,
|
|
12888
|
+
cacheWrite: 0,
|
|
12889
|
+
},
|
|
12890
|
+
contextWindow: 32768,
|
|
12891
|
+
maxTokens: 32768,
|
|
12892
|
+
},
|
|
12893
|
+
"google/gemma-4-31B-it": {
|
|
12894
|
+
id: "google/gemma-4-31B-it",
|
|
12895
|
+
name: "Gemma 4 31B Instruct",
|
|
12896
|
+
api: "openai-completions",
|
|
12897
|
+
provider: "together",
|
|
12898
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12899
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12900
|
+
reasoning: true,
|
|
12901
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
12902
|
+
input: ["text", "image"],
|
|
12903
|
+
cost: {
|
|
12904
|
+
input: 0.2,
|
|
12905
|
+
output: 0.5,
|
|
12906
|
+
cacheRead: 0,
|
|
12907
|
+
cacheWrite: 0,
|
|
12908
|
+
},
|
|
12909
|
+
contextWindow: 262144,
|
|
12910
|
+
maxTokens: 131072,
|
|
12911
|
+
},
|
|
12912
|
+
"meta-llama/Llama-3.3-70B-Instruct-Turbo": {
|
|
12913
|
+
id: "meta-llama/Llama-3.3-70B-Instruct-Turbo",
|
|
12914
|
+
name: "Llama 3.3 70B",
|
|
12915
|
+
api: "openai-completions",
|
|
12916
|
+
provider: "together",
|
|
12917
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12918
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
12919
|
+
reasoning: false,
|
|
12920
|
+
input: ["text"],
|
|
12921
|
+
cost: {
|
|
12922
|
+
input: 0.88,
|
|
12923
|
+
output: 0.88,
|
|
12924
|
+
cacheRead: 0,
|
|
12925
|
+
cacheWrite: 0,
|
|
12926
|
+
},
|
|
12927
|
+
contextWindow: 131072,
|
|
12928
|
+
maxTokens: 131072,
|
|
12929
|
+
},
|
|
12930
|
+
"moonshotai/Kimi-K2.5": {
|
|
12931
|
+
id: "moonshotai/Kimi-K2.5",
|
|
12932
|
+
name: "Kimi K2.5",
|
|
12933
|
+
api: "openai-completions",
|
|
12934
|
+
provider: "together",
|
|
12935
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12936
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12937
|
+
reasoning: true,
|
|
12938
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
12939
|
+
input: ["text", "image"],
|
|
12940
|
+
cost: {
|
|
12941
|
+
input: 0.5,
|
|
12942
|
+
output: 2.8,
|
|
12943
|
+
cacheRead: 0,
|
|
12944
|
+
cacheWrite: 0,
|
|
12945
|
+
},
|
|
12946
|
+
contextWindow: 262144,
|
|
12947
|
+
maxTokens: 262144,
|
|
12948
|
+
},
|
|
12949
|
+
"moonshotai/Kimi-K2.6": {
|
|
12950
|
+
id: "moonshotai/Kimi-K2.6",
|
|
12951
|
+
name: "Kimi K2.6",
|
|
12952
|
+
api: "openai-completions",
|
|
12953
|
+
provider: "together",
|
|
12954
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12955
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12956
|
+
reasoning: true,
|
|
12957
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
12958
|
+
input: ["text", "image"],
|
|
12959
|
+
cost: {
|
|
12960
|
+
input: 1.2,
|
|
12961
|
+
output: 4.5,
|
|
12962
|
+
cacheRead: 0.2,
|
|
12963
|
+
cacheWrite: 0,
|
|
12964
|
+
},
|
|
12965
|
+
contextWindow: 262144,
|
|
12966
|
+
maxTokens: 131000,
|
|
12967
|
+
},
|
|
12968
|
+
"openai/gpt-oss-120b": {
|
|
12969
|
+
id: "openai/gpt-oss-120b",
|
|
12970
|
+
name: "GPT OSS 120B",
|
|
12971
|
+
api: "openai-completions",
|
|
12972
|
+
provider: "together",
|
|
12973
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12974
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "openai" },
|
|
12975
|
+
reasoning: true,
|
|
12976
|
+
thinkingLevelMap: { "off": null, "minimal": null },
|
|
12977
|
+
input: ["text"],
|
|
12978
|
+
cost: {
|
|
12979
|
+
input: 0.15,
|
|
12980
|
+
output: 0.6,
|
|
12981
|
+
cacheRead: 0,
|
|
12982
|
+
cacheWrite: 0,
|
|
12983
|
+
},
|
|
12984
|
+
contextWindow: 131072,
|
|
12985
|
+
maxTokens: 131072,
|
|
12986
|
+
},
|
|
12987
|
+
"zai-org/GLM-5.1": {
|
|
12988
|
+
id: "zai-org/GLM-5.1",
|
|
12989
|
+
name: "GLM-5.1",
|
|
12990
|
+
api: "openai-completions",
|
|
12991
|
+
provider: "together",
|
|
12992
|
+
baseUrl: "https://api.together.ai/v1",
|
|
12993
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
12994
|
+
reasoning: true,
|
|
12995
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
12996
|
+
input: ["text"],
|
|
12997
|
+
cost: {
|
|
12998
|
+
input: 1.4,
|
|
12999
|
+
output: 4.4,
|
|
13000
|
+
cacheRead: 0,
|
|
13001
|
+
cacheWrite: 0,
|
|
13002
|
+
},
|
|
13003
|
+
contextWindow: 202752,
|
|
13004
|
+
maxTokens: 131072,
|
|
13005
|
+
},
|
|
13006
|
+
},
|
|
13007
|
+
"vercel-ai-gateway": {
|
|
13008
|
+
"alibaba/qwen-3-14b": {
|
|
13009
|
+
id: "alibaba/qwen-3-14b",
|
|
13010
|
+
name: "Qwen3-14B",
|
|
13011
|
+
api: "anthropic-messages",
|
|
13012
|
+
provider: "vercel-ai-gateway",
|
|
13013
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13014
|
+
reasoning: true,
|
|
13015
|
+
input: ["text"],
|
|
13016
|
+
cost: {
|
|
13017
|
+
input: 0.12,
|
|
13018
|
+
output: 0.24,
|
|
13019
|
+
cacheRead: 0,
|
|
13020
|
+
cacheWrite: 0,
|
|
13021
|
+
},
|
|
13022
|
+
contextWindow: 40960,
|
|
13023
|
+
maxTokens: 16384,
|
|
13024
|
+
},
|
|
13025
|
+
"alibaba/qwen-3-235b": {
|
|
13026
|
+
id: "alibaba/qwen-3-235b",
|
|
13027
|
+
name: "Qwen3 235B A22b Instruct 2507",
|
|
13028
|
+
api: "anthropic-messages",
|
|
13029
|
+
provider: "vercel-ai-gateway",
|
|
13030
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13031
|
+
reasoning: false,
|
|
13032
|
+
input: ["text"],
|
|
13033
|
+
cost: {
|
|
13034
|
+
input: 0.6,
|
|
13035
|
+
output: 1.2,
|
|
13036
|
+
cacheRead: 0.6,
|
|
13037
|
+
cacheWrite: 0,
|
|
13038
|
+
},
|
|
13039
|
+
contextWindow: 131000,
|
|
13040
|
+
maxTokens: 40000,
|
|
13041
|
+
},
|
|
13042
|
+
"alibaba/qwen-3-30b": {
|
|
13043
|
+
id: "alibaba/qwen-3-30b",
|
|
13044
|
+
name: "Qwen3-30B-A3B",
|
|
13045
|
+
api: "anthropic-messages",
|
|
13046
|
+
provider: "vercel-ai-gateway",
|
|
13047
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13048
|
+
reasoning: true,
|
|
13049
|
+
input: ["text"],
|
|
13050
|
+
cost: {
|
|
13051
|
+
input: 0.08,
|
|
13052
|
+
output: 0.29,
|
|
13053
|
+
cacheRead: 0,
|
|
13054
|
+
cacheWrite: 0,
|
|
13055
|
+
},
|
|
13056
|
+
contextWindow: 40960,
|
|
13057
|
+
maxTokens: 16384,
|
|
13058
|
+
},
|
|
13059
|
+
"alibaba/qwen-3-32b": {
|
|
13060
|
+
id: "alibaba/qwen-3-32b",
|
|
13061
|
+
name: "Qwen 3 32B",
|
|
13062
|
+
api: "anthropic-messages",
|
|
13214
13063
|
provider: "vercel-ai-gateway",
|
|
13215
13064
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13216
13065
|
reasoning: true,
|
|
@@ -13462,6 +13311,23 @@ export const MODELS = {
|
|
|
13462
13311
|
contextWindow: 1000000,
|
|
13463
13312
|
maxTokens: 64000,
|
|
13464
13313
|
},
|
|
13314
|
+
"alibaba/qwen3.7-max": {
|
|
13315
|
+
id: "alibaba/qwen3.7-max",
|
|
13316
|
+
name: "Qwen 3.7 Max",
|
|
13317
|
+
api: "anthropic-messages",
|
|
13318
|
+
provider: "vercel-ai-gateway",
|
|
13319
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13320
|
+
reasoning: true,
|
|
13321
|
+
input: ["text", "image"],
|
|
13322
|
+
cost: {
|
|
13323
|
+
input: 2.5,
|
|
13324
|
+
output: 7.5,
|
|
13325
|
+
cacheRead: 0.5,
|
|
13326
|
+
cacheWrite: 3.125,
|
|
13327
|
+
},
|
|
13328
|
+
contextWindow: 991000,
|
|
13329
|
+
maxTokens: 64000,
|
|
13330
|
+
},
|
|
13465
13331
|
"anthropic/claude-3-haiku": {
|
|
13466
13332
|
id: "anthropic/claude-3-haiku",
|
|
13467
13333
|
name: "Claude 3 Haiku",
|
|
@@ -13496,26 +13362,9 @@ export const MODELS = {
|
|
|
13496
13362
|
contextWindow: 200000,
|
|
13497
13363
|
maxTokens: 8192,
|
|
13498
13364
|
},
|
|
13499
|
-
"anthropic/claude-
|
|
13500
|
-
id: "anthropic/claude-
|
|
13501
|
-
name: "Claude
|
|
13502
|
-
api: "anthropic-messages",
|
|
13503
|
-
provider: "vercel-ai-gateway",
|
|
13504
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13505
|
-
reasoning: true,
|
|
13506
|
-
input: ["text", "image"],
|
|
13507
|
-
cost: {
|
|
13508
|
-
input: 3,
|
|
13509
|
-
output: 15,
|
|
13510
|
-
cacheRead: 0.3,
|
|
13511
|
-
cacheWrite: 3.75,
|
|
13512
|
-
},
|
|
13513
|
-
contextWindow: 200000,
|
|
13514
|
-
maxTokens: 8192,
|
|
13515
|
-
},
|
|
13516
|
-
"anthropic/claude-haiku-4.5": {
|
|
13517
|
-
id: "anthropic/claude-haiku-4.5",
|
|
13518
|
-
name: "Claude Haiku 4.5",
|
|
13365
|
+
"anthropic/claude-haiku-4.5": {
|
|
13366
|
+
id: "anthropic/claude-haiku-4.5",
|
|
13367
|
+
name: "Claude Haiku 4.5",
|
|
13519
13368
|
api: "anthropic-messages",
|
|
13520
13369
|
provider: "vercel-ai-gateway",
|
|
13521
13370
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
@@ -13991,6 +13840,23 @@ export const MODELS = {
|
|
|
13991
13840
|
contextWindow: 1000000,
|
|
13992
13841
|
maxTokens: 64000,
|
|
13993
13842
|
},
|
|
13843
|
+
"google/gemini-3.1-flash-lite": {
|
|
13844
|
+
id: "google/gemini-3.1-flash-lite",
|
|
13845
|
+
name: "Gemini 3.1 Flash Lite",
|
|
13846
|
+
api: "anthropic-messages",
|
|
13847
|
+
provider: "vercel-ai-gateway",
|
|
13848
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13849
|
+
reasoning: true,
|
|
13850
|
+
input: ["text", "image"],
|
|
13851
|
+
cost: {
|
|
13852
|
+
input: 0.25,
|
|
13853
|
+
output: 1.5,
|
|
13854
|
+
cacheRead: 0.03,
|
|
13855
|
+
cacheWrite: 0,
|
|
13856
|
+
},
|
|
13857
|
+
contextWindow: 1000000,
|
|
13858
|
+
maxTokens: 65000,
|
|
13859
|
+
},
|
|
13994
13860
|
"google/gemini-3.1-flash-lite-preview": {
|
|
13995
13861
|
id: "google/gemini-3.1-flash-lite-preview",
|
|
13996
13862
|
name: "Gemini 3.1 Flash Lite Preview",
|
|
@@ -14025,6 +13891,23 @@ export const MODELS = {
|
|
|
14025
13891
|
contextWindow: 1000000,
|
|
14026
13892
|
maxTokens: 64000,
|
|
14027
13893
|
},
|
|
13894
|
+
"google/gemini-3.5-flash": {
|
|
13895
|
+
id: "google/gemini-3.5-flash",
|
|
13896
|
+
name: "Gemini 3.5 Flash",
|
|
13897
|
+
api: "anthropic-messages",
|
|
13898
|
+
provider: "vercel-ai-gateway",
|
|
13899
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13900
|
+
reasoning: true,
|
|
13901
|
+
input: ["text", "image"],
|
|
13902
|
+
cost: {
|
|
13903
|
+
input: 1.5,
|
|
13904
|
+
output: 9,
|
|
13905
|
+
cacheRead: 0.15,
|
|
13906
|
+
cacheWrite: 0,
|
|
13907
|
+
},
|
|
13908
|
+
contextWindow: 1000000,
|
|
13909
|
+
maxTokens: 64000,
|
|
13910
|
+
},
|
|
14028
13911
|
"google/gemma-4-26b-a4b-it": {
|
|
14029
13912
|
id: "google/gemma-4-26b-a4b-it",
|
|
14030
13913
|
name: "Gemma 4 26B A4B IT",
|
|
@@ -14484,6 +14367,23 @@ export const MODELS = {
|
|
|
14484
14367
|
contextWindow: 128000,
|
|
14485
14368
|
maxTokens: 64000,
|
|
14486
14369
|
},
|
|
14370
|
+
"mistral/mistral-medium-3.5": {
|
|
14371
|
+
id: "mistral/mistral-medium-3.5",
|
|
14372
|
+
name: "Mistral Medium Latest",
|
|
14373
|
+
api: "anthropic-messages",
|
|
14374
|
+
provider: "vercel-ai-gateway",
|
|
14375
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
14376
|
+
reasoning: true,
|
|
14377
|
+
input: ["text"],
|
|
14378
|
+
cost: {
|
|
14379
|
+
input: 1.5,
|
|
14380
|
+
output: 7.5,
|
|
14381
|
+
cacheRead: 0,
|
|
14382
|
+
cacheWrite: 0,
|
|
14383
|
+
},
|
|
14384
|
+
contextWindow: 256000,
|
|
14385
|
+
maxTokens: 256000,
|
|
14386
|
+
},
|
|
14487
14387
|
"mistral/mistral-small": {
|
|
14488
14388
|
id: "mistral/mistral-small",
|
|
14489
14389
|
name: "Mistral Small",
|
|
@@ -15178,7 +15078,7 @@ export const MODELS = {
|
|
|
15178
15078
|
},
|
|
15179
15079
|
"openai/gpt-oss-20b": {
|
|
15180
15080
|
id: "openai/gpt-oss-20b",
|
|
15181
|
-
name: "GPT OSS
|
|
15081
|
+
name: "GPT OSS 20B",
|
|
15182
15082
|
api: "anthropic-messages",
|
|
15183
15083
|
provider: "vercel-ai-gateway",
|
|
15184
15084
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
@@ -15346,125 +15246,6 @@ export const MODELS = {
|
|
|
15346
15246
|
contextWindow: 200000,
|
|
15347
15247
|
maxTokens: 8000,
|
|
15348
15248
|
},
|
|
15349
|
-
"xai/grok-3": {
|
|
15350
|
-
id: "xai/grok-3",
|
|
15351
|
-
name: "Grok 3 Beta",
|
|
15352
|
-
api: "anthropic-messages",
|
|
15353
|
-
provider: "vercel-ai-gateway",
|
|
15354
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15355
|
-
reasoning: false,
|
|
15356
|
-
input: ["text"],
|
|
15357
|
-
cost: {
|
|
15358
|
-
input: 3,
|
|
15359
|
-
output: 15,
|
|
15360
|
-
cacheRead: 0.75,
|
|
15361
|
-
cacheWrite: 0,
|
|
15362
|
-
},
|
|
15363
|
-
contextWindow: 131072,
|
|
15364
|
-
maxTokens: 131072,
|
|
15365
|
-
},
|
|
15366
|
-
"xai/grok-3-fast": {
|
|
15367
|
-
id: "xai/grok-3-fast",
|
|
15368
|
-
name: "Grok 3 Fast Beta",
|
|
15369
|
-
api: "anthropic-messages",
|
|
15370
|
-
provider: "vercel-ai-gateway",
|
|
15371
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15372
|
-
reasoning: false,
|
|
15373
|
-
input: ["text"],
|
|
15374
|
-
cost: {
|
|
15375
|
-
input: 5,
|
|
15376
|
-
output: 25,
|
|
15377
|
-
cacheRead: 1.25,
|
|
15378
|
-
cacheWrite: 0,
|
|
15379
|
-
},
|
|
15380
|
-
contextWindow: 131072,
|
|
15381
|
-
maxTokens: 131072,
|
|
15382
|
-
},
|
|
15383
|
-
"xai/grok-3-mini": {
|
|
15384
|
-
id: "xai/grok-3-mini",
|
|
15385
|
-
name: "Grok 3 Mini Beta",
|
|
15386
|
-
api: "anthropic-messages",
|
|
15387
|
-
provider: "vercel-ai-gateway",
|
|
15388
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15389
|
-
reasoning: false,
|
|
15390
|
-
input: ["text"],
|
|
15391
|
-
cost: {
|
|
15392
|
-
input: 0.3,
|
|
15393
|
-
output: 0.5,
|
|
15394
|
-
cacheRead: 0.075,
|
|
15395
|
-
cacheWrite: 0,
|
|
15396
|
-
},
|
|
15397
|
-
contextWindow: 131072,
|
|
15398
|
-
maxTokens: 131072,
|
|
15399
|
-
},
|
|
15400
|
-
"xai/grok-3-mini-fast": {
|
|
15401
|
-
id: "xai/grok-3-mini-fast",
|
|
15402
|
-
name: "Grok 3 Mini Fast Beta",
|
|
15403
|
-
api: "anthropic-messages",
|
|
15404
|
-
provider: "vercel-ai-gateway",
|
|
15405
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15406
|
-
reasoning: false,
|
|
15407
|
-
input: ["text"],
|
|
15408
|
-
cost: {
|
|
15409
|
-
input: 0.6,
|
|
15410
|
-
output: 4,
|
|
15411
|
-
cacheRead: 0,
|
|
15412
|
-
cacheWrite: 0,
|
|
15413
|
-
},
|
|
15414
|
-
contextWindow: 131072,
|
|
15415
|
-
maxTokens: 131072,
|
|
15416
|
-
},
|
|
15417
|
-
"xai/grok-4": {
|
|
15418
|
-
id: "xai/grok-4",
|
|
15419
|
-
name: "Grok 4",
|
|
15420
|
-
api: "anthropic-messages",
|
|
15421
|
-
provider: "vercel-ai-gateway",
|
|
15422
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15423
|
-
reasoning: true,
|
|
15424
|
-
input: ["text", "image"],
|
|
15425
|
-
cost: {
|
|
15426
|
-
input: 3,
|
|
15427
|
-
output: 15,
|
|
15428
|
-
cacheRead: 0.75,
|
|
15429
|
-
cacheWrite: 0,
|
|
15430
|
-
},
|
|
15431
|
-
contextWindow: 256000,
|
|
15432
|
-
maxTokens: 256000,
|
|
15433
|
-
},
|
|
15434
|
-
"xai/grok-4-fast-non-reasoning": {
|
|
15435
|
-
id: "xai/grok-4-fast-non-reasoning",
|
|
15436
|
-
name: "Grok 4 Fast Non-Reasoning",
|
|
15437
|
-
api: "anthropic-messages",
|
|
15438
|
-
provider: "vercel-ai-gateway",
|
|
15439
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15440
|
-
reasoning: false,
|
|
15441
|
-
input: ["text", "image"],
|
|
15442
|
-
cost: {
|
|
15443
|
-
input: 0.19999999999999998,
|
|
15444
|
-
output: 0.5,
|
|
15445
|
-
cacheRead: 0.049999999999999996,
|
|
15446
|
-
cacheWrite: 0,
|
|
15447
|
-
},
|
|
15448
|
-
contextWindow: 2000000,
|
|
15449
|
-
maxTokens: 256000,
|
|
15450
|
-
},
|
|
15451
|
-
"xai/grok-4-fast-reasoning": {
|
|
15452
|
-
id: "xai/grok-4-fast-reasoning",
|
|
15453
|
-
name: "Grok 4 Fast Reasoning",
|
|
15454
|
-
api: "anthropic-messages",
|
|
15455
|
-
provider: "vercel-ai-gateway",
|
|
15456
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15457
|
-
reasoning: true,
|
|
15458
|
-
input: ["text", "image"],
|
|
15459
|
-
cost: {
|
|
15460
|
-
input: 0.19999999999999998,
|
|
15461
|
-
output: 0.5,
|
|
15462
|
-
cacheRead: 0.049999999999999996,
|
|
15463
|
-
cacheWrite: 0,
|
|
15464
|
-
},
|
|
15465
|
-
contextWindow: 2000000,
|
|
15466
|
-
maxTokens: 256000,
|
|
15467
|
-
},
|
|
15468
15249
|
"xai/grok-4.1-fast-non-reasoning": {
|
|
15469
15250
|
id: "xai/grok-4.1-fast-non-reasoning",
|
|
15470
15251
|
name: "Grok 4.1 Fast Non-Reasoning",
|
|
@@ -15479,8 +15260,8 @@ export const MODELS = {
|
|
|
15479
15260
|
cacheRead: 0.049999999999999996,
|
|
15480
15261
|
cacheWrite: 0,
|
|
15481
15262
|
},
|
|
15482
|
-
contextWindow:
|
|
15483
|
-
maxTokens:
|
|
15263
|
+
contextWindow: 1000000,
|
|
15264
|
+
maxTokens: 1000000,
|
|
15484
15265
|
},
|
|
15485
15266
|
"xai/grok-4.1-fast-reasoning": {
|
|
15486
15267
|
id: "xai/grok-4.1-fast-reasoning",
|
|
@@ -15496,8 +15277,8 @@ export const MODELS = {
|
|
|
15496
15277
|
cacheRead: 0.049999999999999996,
|
|
15497
15278
|
cacheWrite: 0,
|
|
15498
15279
|
},
|
|
15499
|
-
contextWindow:
|
|
15500
|
-
maxTokens:
|
|
15280
|
+
contextWindow: 1000000,
|
|
15281
|
+
maxTokens: 1000000,
|
|
15501
15282
|
},
|
|
15502
15283
|
"xai/grok-4.20-multi-agent": {
|
|
15503
15284
|
id: "xai/grok-4.20-multi-agent",
|
|
@@ -15618,18 +15399,18 @@ export const MODELS = {
|
|
|
15618
15399
|
contextWindow: 1000000,
|
|
15619
15400
|
maxTokens: 1000000,
|
|
15620
15401
|
},
|
|
15621
|
-
"xai/grok-
|
|
15622
|
-
id: "xai/grok-
|
|
15623
|
-
name: "Grok
|
|
15402
|
+
"xai/grok-build-0.1": {
|
|
15403
|
+
id: "xai/grok-build-0.1",
|
|
15404
|
+
name: "Grok Build 0.1",
|
|
15624
15405
|
api: "anthropic-messages",
|
|
15625
15406
|
provider: "vercel-ai-gateway",
|
|
15626
15407
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15627
15408
|
reasoning: true,
|
|
15628
|
-
input: ["text"],
|
|
15409
|
+
input: ["text", "image"],
|
|
15629
15410
|
cost: {
|
|
15630
|
-
input:
|
|
15631
|
-
output:
|
|
15632
|
-
cacheRead: 0.
|
|
15411
|
+
input: 1,
|
|
15412
|
+
output: 2,
|
|
15413
|
+
cacheRead: 0.19999999999999998,
|
|
15633
15414
|
cacheWrite: 0,
|
|
15634
15415
|
},
|
|
15635
15416
|
contextWindow: 256000,
|
|
@@ -15926,108 +15707,6 @@ export const MODELS = {
|
|
|
15926
15707
|
},
|
|
15927
15708
|
},
|
|
15928
15709
|
"xai": {
|
|
15929
|
-
"grok-2": {
|
|
15930
|
-
id: "grok-2",
|
|
15931
|
-
name: "Grok 2",
|
|
15932
|
-
api: "openai-completions",
|
|
15933
|
-
provider: "xai",
|
|
15934
|
-
baseUrl: "https://api.x.ai/v1",
|
|
15935
|
-
reasoning: false,
|
|
15936
|
-
input: ["text"],
|
|
15937
|
-
cost: {
|
|
15938
|
-
input: 2,
|
|
15939
|
-
output: 10,
|
|
15940
|
-
cacheRead: 2,
|
|
15941
|
-
cacheWrite: 0,
|
|
15942
|
-
},
|
|
15943
|
-
contextWindow: 131072,
|
|
15944
|
-
maxTokens: 8192,
|
|
15945
|
-
},
|
|
15946
|
-
"grok-2-1212": {
|
|
15947
|
-
id: "grok-2-1212",
|
|
15948
|
-
name: "Grok 2 (1212)",
|
|
15949
|
-
api: "openai-completions",
|
|
15950
|
-
provider: "xai",
|
|
15951
|
-
baseUrl: "https://api.x.ai/v1",
|
|
15952
|
-
reasoning: false,
|
|
15953
|
-
input: ["text"],
|
|
15954
|
-
cost: {
|
|
15955
|
-
input: 2,
|
|
15956
|
-
output: 10,
|
|
15957
|
-
cacheRead: 2,
|
|
15958
|
-
cacheWrite: 0,
|
|
15959
|
-
},
|
|
15960
|
-
contextWindow: 131072,
|
|
15961
|
-
maxTokens: 8192,
|
|
15962
|
-
},
|
|
15963
|
-
"grok-2-latest": {
|
|
15964
|
-
id: "grok-2-latest",
|
|
15965
|
-
name: "Grok 2 Latest",
|
|
15966
|
-
api: "openai-completions",
|
|
15967
|
-
provider: "xai",
|
|
15968
|
-
baseUrl: "https://api.x.ai/v1",
|
|
15969
|
-
reasoning: false,
|
|
15970
|
-
input: ["text"],
|
|
15971
|
-
cost: {
|
|
15972
|
-
input: 2,
|
|
15973
|
-
output: 10,
|
|
15974
|
-
cacheRead: 2,
|
|
15975
|
-
cacheWrite: 0,
|
|
15976
|
-
},
|
|
15977
|
-
contextWindow: 131072,
|
|
15978
|
-
maxTokens: 8192,
|
|
15979
|
-
},
|
|
15980
|
-
"grok-2-vision": {
|
|
15981
|
-
id: "grok-2-vision",
|
|
15982
|
-
name: "Grok 2 Vision",
|
|
15983
|
-
api: "openai-completions",
|
|
15984
|
-
provider: "xai",
|
|
15985
|
-
baseUrl: "https://api.x.ai/v1",
|
|
15986
|
-
reasoning: false,
|
|
15987
|
-
input: ["text", "image"],
|
|
15988
|
-
cost: {
|
|
15989
|
-
input: 2,
|
|
15990
|
-
output: 10,
|
|
15991
|
-
cacheRead: 2,
|
|
15992
|
-
cacheWrite: 0,
|
|
15993
|
-
},
|
|
15994
|
-
contextWindow: 8192,
|
|
15995
|
-
maxTokens: 4096,
|
|
15996
|
-
},
|
|
15997
|
-
"grok-2-vision-1212": {
|
|
15998
|
-
id: "grok-2-vision-1212",
|
|
15999
|
-
name: "Grok 2 Vision (1212)",
|
|
16000
|
-
api: "openai-completions",
|
|
16001
|
-
provider: "xai",
|
|
16002
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16003
|
-
reasoning: false,
|
|
16004
|
-
input: ["text", "image"],
|
|
16005
|
-
cost: {
|
|
16006
|
-
input: 2,
|
|
16007
|
-
output: 10,
|
|
16008
|
-
cacheRead: 2,
|
|
16009
|
-
cacheWrite: 0,
|
|
16010
|
-
},
|
|
16011
|
-
contextWindow: 8192,
|
|
16012
|
-
maxTokens: 4096,
|
|
16013
|
-
},
|
|
16014
|
-
"grok-2-vision-latest": {
|
|
16015
|
-
id: "grok-2-vision-latest",
|
|
16016
|
-
name: "Grok 2 Vision Latest",
|
|
16017
|
-
api: "openai-completions",
|
|
16018
|
-
provider: "xai",
|
|
16019
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16020
|
-
reasoning: false,
|
|
16021
|
-
input: ["text", "image"],
|
|
16022
|
-
cost: {
|
|
16023
|
-
input: 2,
|
|
16024
|
-
output: 10,
|
|
16025
|
-
cacheRead: 2,
|
|
16026
|
-
cacheWrite: 0,
|
|
16027
|
-
},
|
|
16028
|
-
contextWindow: 8192,
|
|
16029
|
-
maxTokens: 4096,
|
|
16030
|
-
},
|
|
16031
15710
|
"grok-3": {
|
|
16032
15711
|
id: "grok-3",
|
|
16033
15712
|
name: "Grok 3",
|
|
@@ -16062,193 +15741,6 @@ export const MODELS = {
|
|
|
16062
15741
|
contextWindow: 131072,
|
|
16063
15742
|
maxTokens: 8192,
|
|
16064
15743
|
},
|
|
16065
|
-
"grok-3-fast-latest": {
|
|
16066
|
-
id: "grok-3-fast-latest",
|
|
16067
|
-
name: "Grok 3 Fast Latest",
|
|
16068
|
-
api: "openai-completions",
|
|
16069
|
-
provider: "xai",
|
|
16070
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16071
|
-
reasoning: false,
|
|
16072
|
-
input: ["text"],
|
|
16073
|
-
cost: {
|
|
16074
|
-
input: 5,
|
|
16075
|
-
output: 25,
|
|
16076
|
-
cacheRead: 1.25,
|
|
16077
|
-
cacheWrite: 0,
|
|
16078
|
-
},
|
|
16079
|
-
contextWindow: 131072,
|
|
16080
|
-
maxTokens: 8192,
|
|
16081
|
-
},
|
|
16082
|
-
"grok-3-latest": {
|
|
16083
|
-
id: "grok-3-latest",
|
|
16084
|
-
name: "Grok 3 Latest",
|
|
16085
|
-
api: "openai-completions",
|
|
16086
|
-
provider: "xai",
|
|
16087
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16088
|
-
reasoning: false,
|
|
16089
|
-
input: ["text"],
|
|
16090
|
-
cost: {
|
|
16091
|
-
input: 3,
|
|
16092
|
-
output: 15,
|
|
16093
|
-
cacheRead: 0.75,
|
|
16094
|
-
cacheWrite: 0,
|
|
16095
|
-
},
|
|
16096
|
-
contextWindow: 131072,
|
|
16097
|
-
maxTokens: 8192,
|
|
16098
|
-
},
|
|
16099
|
-
"grok-3-mini": {
|
|
16100
|
-
id: "grok-3-mini",
|
|
16101
|
-
name: "Grok 3 Mini",
|
|
16102
|
-
api: "openai-completions",
|
|
16103
|
-
provider: "xai",
|
|
16104
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16105
|
-
reasoning: true,
|
|
16106
|
-
input: ["text"],
|
|
16107
|
-
cost: {
|
|
16108
|
-
input: 0.3,
|
|
16109
|
-
output: 0.5,
|
|
16110
|
-
cacheRead: 0.075,
|
|
16111
|
-
cacheWrite: 0,
|
|
16112
|
-
},
|
|
16113
|
-
contextWindow: 131072,
|
|
16114
|
-
maxTokens: 8192,
|
|
16115
|
-
},
|
|
16116
|
-
"grok-3-mini-fast": {
|
|
16117
|
-
id: "grok-3-mini-fast",
|
|
16118
|
-
name: "Grok 3 Mini Fast",
|
|
16119
|
-
api: "openai-completions",
|
|
16120
|
-
provider: "xai",
|
|
16121
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16122
|
-
reasoning: true,
|
|
16123
|
-
input: ["text"],
|
|
16124
|
-
cost: {
|
|
16125
|
-
input: 0.6,
|
|
16126
|
-
output: 4,
|
|
16127
|
-
cacheRead: 0.15,
|
|
16128
|
-
cacheWrite: 0,
|
|
16129
|
-
},
|
|
16130
|
-
contextWindow: 131072,
|
|
16131
|
-
maxTokens: 8192,
|
|
16132
|
-
},
|
|
16133
|
-
"grok-3-mini-fast-latest": {
|
|
16134
|
-
id: "grok-3-mini-fast-latest",
|
|
16135
|
-
name: "Grok 3 Mini Fast Latest",
|
|
16136
|
-
api: "openai-completions",
|
|
16137
|
-
provider: "xai",
|
|
16138
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16139
|
-
reasoning: true,
|
|
16140
|
-
input: ["text"],
|
|
16141
|
-
cost: {
|
|
16142
|
-
input: 0.6,
|
|
16143
|
-
output: 4,
|
|
16144
|
-
cacheRead: 0.15,
|
|
16145
|
-
cacheWrite: 0,
|
|
16146
|
-
},
|
|
16147
|
-
contextWindow: 131072,
|
|
16148
|
-
maxTokens: 8192,
|
|
16149
|
-
},
|
|
16150
|
-
"grok-3-mini-latest": {
|
|
16151
|
-
id: "grok-3-mini-latest",
|
|
16152
|
-
name: "Grok 3 Mini Latest",
|
|
16153
|
-
api: "openai-completions",
|
|
16154
|
-
provider: "xai",
|
|
16155
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16156
|
-
reasoning: true,
|
|
16157
|
-
input: ["text"],
|
|
16158
|
-
cost: {
|
|
16159
|
-
input: 0.3,
|
|
16160
|
-
output: 0.5,
|
|
16161
|
-
cacheRead: 0.075,
|
|
16162
|
-
cacheWrite: 0,
|
|
16163
|
-
},
|
|
16164
|
-
contextWindow: 131072,
|
|
16165
|
-
maxTokens: 8192,
|
|
16166
|
-
},
|
|
16167
|
-
"grok-4": {
|
|
16168
|
-
id: "grok-4",
|
|
16169
|
-
name: "Grok 4",
|
|
16170
|
-
api: "openai-completions",
|
|
16171
|
-
provider: "xai",
|
|
16172
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16173
|
-
reasoning: true,
|
|
16174
|
-
input: ["text"],
|
|
16175
|
-
cost: {
|
|
16176
|
-
input: 3,
|
|
16177
|
-
output: 15,
|
|
16178
|
-
cacheRead: 0.75,
|
|
16179
|
-
cacheWrite: 0,
|
|
16180
|
-
},
|
|
16181
|
-
contextWindow: 256000,
|
|
16182
|
-
maxTokens: 64000,
|
|
16183
|
-
},
|
|
16184
|
-
"grok-4-1-fast": {
|
|
16185
|
-
id: "grok-4-1-fast",
|
|
16186
|
-
name: "Grok 4.1 Fast",
|
|
16187
|
-
api: "openai-completions",
|
|
16188
|
-
provider: "xai",
|
|
16189
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16190
|
-
reasoning: true,
|
|
16191
|
-
input: ["text", "image"],
|
|
16192
|
-
cost: {
|
|
16193
|
-
input: 0.2,
|
|
16194
|
-
output: 0.5,
|
|
16195
|
-
cacheRead: 0.05,
|
|
16196
|
-
cacheWrite: 0,
|
|
16197
|
-
},
|
|
16198
|
-
contextWindow: 2000000,
|
|
16199
|
-
maxTokens: 30000,
|
|
16200
|
-
},
|
|
16201
|
-
"grok-4-1-fast-non-reasoning": {
|
|
16202
|
-
id: "grok-4-1-fast-non-reasoning",
|
|
16203
|
-
name: "Grok 4.1 Fast (Non-Reasoning)",
|
|
16204
|
-
api: "openai-completions",
|
|
16205
|
-
provider: "xai",
|
|
16206
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16207
|
-
reasoning: false,
|
|
16208
|
-
input: ["text", "image"],
|
|
16209
|
-
cost: {
|
|
16210
|
-
input: 0.2,
|
|
16211
|
-
output: 0.5,
|
|
16212
|
-
cacheRead: 0.05,
|
|
16213
|
-
cacheWrite: 0,
|
|
16214
|
-
},
|
|
16215
|
-
contextWindow: 2000000,
|
|
16216
|
-
maxTokens: 30000,
|
|
16217
|
-
},
|
|
16218
|
-
"grok-4-fast": {
|
|
16219
|
-
id: "grok-4-fast",
|
|
16220
|
-
name: "Grok 4 Fast",
|
|
16221
|
-
api: "openai-completions",
|
|
16222
|
-
provider: "xai",
|
|
16223
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16224
|
-
reasoning: true,
|
|
16225
|
-
input: ["text", "image"],
|
|
16226
|
-
cost: {
|
|
16227
|
-
input: 0.2,
|
|
16228
|
-
output: 0.5,
|
|
16229
|
-
cacheRead: 0.05,
|
|
16230
|
-
cacheWrite: 0,
|
|
16231
|
-
},
|
|
16232
|
-
contextWindow: 2000000,
|
|
16233
|
-
maxTokens: 30000,
|
|
16234
|
-
},
|
|
16235
|
-
"grok-4-fast-non-reasoning": {
|
|
16236
|
-
id: "grok-4-fast-non-reasoning",
|
|
16237
|
-
name: "Grok 4 Fast (Non-Reasoning)",
|
|
16238
|
-
api: "openai-completions",
|
|
16239
|
-
provider: "xai",
|
|
16240
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16241
|
-
reasoning: false,
|
|
16242
|
-
input: ["text", "image"],
|
|
16243
|
-
cost: {
|
|
16244
|
-
input: 0.2,
|
|
16245
|
-
output: 0.5,
|
|
16246
|
-
cacheRead: 0.05,
|
|
16247
|
-
cacheWrite: 0,
|
|
16248
|
-
},
|
|
16249
|
-
contextWindow: 2000000,
|
|
16250
|
-
maxTokens: 30000,
|
|
16251
|
-
},
|
|
16252
15744
|
"grok-4.20-0309-non-reasoning": {
|
|
16253
15745
|
id: "grok-4.20-0309-non-reasoning",
|
|
16254
15746
|
name: "Grok 4.20 (Non-Reasoning)",
|
|
@@ -16258,8 +15750,8 @@ export const MODELS = {
|
|
|
16258
15750
|
reasoning: false,
|
|
16259
15751
|
input: ["text", "image"],
|
|
16260
15752
|
cost: {
|
|
16261
|
-
input:
|
|
16262
|
-
output:
|
|
15753
|
+
input: 1.25,
|
|
15754
|
+
output: 2.5,
|
|
16263
15755
|
cacheRead: 0.2,
|
|
16264
15756
|
cacheWrite: 0,
|
|
16265
15757
|
},
|
|
@@ -16275,8 +15767,8 @@ export const MODELS = {
|
|
|
16275
15767
|
reasoning: true,
|
|
16276
15768
|
input: ["text", "image"],
|
|
16277
15769
|
cost: {
|
|
16278
|
-
input:
|
|
16279
|
-
output:
|
|
15770
|
+
input: 1.25,
|
|
15771
|
+
output: 2.5,
|
|
16280
15772
|
cacheRead: 0.2,
|
|
16281
15773
|
cacheWrite: 0,
|
|
16282
15774
|
},
|
|
@@ -16300,22 +15792,22 @@ export const MODELS = {
|
|
|
16300
15792
|
contextWindow: 1000000,
|
|
16301
15793
|
maxTokens: 30000,
|
|
16302
15794
|
},
|
|
16303
|
-
"grok-
|
|
16304
|
-
id: "grok-
|
|
16305
|
-
name: "Grok
|
|
15795
|
+
"grok-build-0.1": {
|
|
15796
|
+
id: "grok-build-0.1",
|
|
15797
|
+
name: "Grok Build 0.1",
|
|
16306
15798
|
api: "openai-completions",
|
|
16307
15799
|
provider: "xai",
|
|
16308
15800
|
baseUrl: "https://api.x.ai/v1",
|
|
16309
|
-
reasoning:
|
|
16310
|
-
input: ["text"],
|
|
15801
|
+
reasoning: true,
|
|
15802
|
+
input: ["text", "image"],
|
|
16311
15803
|
cost: {
|
|
16312
|
-
input:
|
|
16313
|
-
output:
|
|
16314
|
-
cacheRead:
|
|
15804
|
+
input: 1,
|
|
15805
|
+
output: 2,
|
|
15806
|
+
cacheRead: 0.2,
|
|
16315
15807
|
cacheWrite: 0,
|
|
16316
15808
|
},
|
|
16317
|
-
contextWindow:
|
|
16318
|
-
maxTokens:
|
|
15809
|
+
contextWindow: 256000,
|
|
15810
|
+
maxTokens: 256000,
|
|
16319
15811
|
},
|
|
16320
15812
|
"grok-code-fast-1": {
|
|
16321
15813
|
id: "grok-code-fast-1",
|
|
@@ -16323,7 +15815,7 @@ export const MODELS = {
|
|
|
16323
15815
|
api: "openai-completions",
|
|
16324
15816
|
provider: "xai",
|
|
16325
15817
|
baseUrl: "https://api.x.ai/v1",
|
|
16326
|
-
reasoning:
|
|
15818
|
+
reasoning: false,
|
|
16327
15819
|
input: ["text"],
|
|
16328
15820
|
cost: {
|
|
16329
15821
|
input: 0.2,
|
|
@@ -16331,25 +15823,8 @@ export const MODELS = {
|
|
|
16331
15823
|
cacheRead: 0.02,
|
|
16332
15824
|
cacheWrite: 0,
|
|
16333
15825
|
},
|
|
16334
|
-
contextWindow:
|
|
16335
|
-
maxTokens:
|
|
16336
|
-
},
|
|
16337
|
-
"grok-vision-beta": {
|
|
16338
|
-
id: "grok-vision-beta",
|
|
16339
|
-
name: "Grok Vision Beta",
|
|
16340
|
-
api: "openai-completions",
|
|
16341
|
-
provider: "xai",
|
|
16342
|
-
baseUrl: "https://api.x.ai/v1",
|
|
16343
|
-
reasoning: false,
|
|
16344
|
-
input: ["text", "image"],
|
|
16345
|
-
cost: {
|
|
16346
|
-
input: 5,
|
|
16347
|
-
output: 15,
|
|
16348
|
-
cacheRead: 5,
|
|
16349
|
-
cacheWrite: 0,
|
|
16350
|
-
},
|
|
16351
|
-
contextWindow: 8192,
|
|
16352
|
-
maxTokens: 4096,
|
|
15826
|
+
contextWindow: 32768,
|
|
15827
|
+
maxTokens: 8192,
|
|
16353
15828
|
},
|
|
16354
15829
|
},
|
|
16355
15830
|
"xiaomi": {
|