@eminent337/aery-ai 0.1.142 → 0.1.145

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (41) hide show
  1. package/dist/image-models.generated.d.ts +165 -0
  2. package/dist/image-models.generated.d.ts.map +1 -1
  3. package/dist/image-models.generated.js +251 -86
  4. package/dist/image-models.generated.js.map +1 -1
  5. package/dist/models.generated.d.ts +1061 -1689
  6. package/dist/models.generated.d.ts.map +1 -1
  7. package/dist/models.generated.js +748 -1442
  8. package/dist/models.generated.js.map +1 -1
  9. package/dist/providers/anthropic.d.ts.map +1 -1
  10. package/dist/providers/anthropic.js +1 -1
  11. package/dist/providers/anthropic.js.map +1 -1
  12. package/dist/providers/google-gemini-cli.d.ts +74 -0
  13. package/dist/providers/google-gemini-cli.d.ts.map +1 -0
  14. package/dist/providers/google-gemini-cli.js +779 -0
  15. package/dist/providers/google-gemini-cli.js.map +1 -0
  16. package/dist/providers/google-shared.d.ts +1 -1
  17. package/dist/providers/google-shared.d.ts.map +1 -1
  18. package/dist/providers/google-shared.js.map +1 -1
  19. package/dist/providers/openai-completions.d.ts.map +1 -1
  20. package/dist/providers/openai-completions.js +1 -1
  21. package/dist/providers/openai-completions.js.map +1 -1
  22. package/dist/providers/register-builtins.d.ts +3 -0
  23. package/dist/providers/register-builtins.d.ts.map +1 -1
  24. package/dist/providers/register-builtins.js +21 -0
  25. package/dist/providers/register-builtins.js.map +1 -1
  26. package/dist/types.d.ts +1 -1
  27. package/dist/types.d.ts.map +1 -1
  28. package/dist/types.js.map +1 -1
  29. package/dist/utils/oauth/google-antigravity.d.ts +26 -0
  30. package/dist/utils/oauth/google-antigravity.d.ts.map +1 -0
  31. package/dist/utils/oauth/google-antigravity.js +377 -0
  32. package/dist/utils/oauth/google-antigravity.js.map +1 -0
  33. package/dist/utils/oauth/google-gemini-cli.d.ts +26 -0
  34. package/dist/utils/oauth/google-gemini-cli.d.ts.map +1 -0
  35. package/dist/utils/oauth/google-gemini-cli.js +482 -0
  36. package/dist/utils/oauth/google-gemini-cli.js.map +1 -0
  37. package/dist/utils/oauth/index.d.ts +7 -0
  38. package/dist/utils/oauth/index.d.ts.map +1 -1
  39. package/dist/utils/oauth/index.js +13 -0
  40. package/dist/utils/oauth/index.js.map +1 -1
  41. package/package.json +2 -2
@@ -53,23 +53,6 @@ export const MODELS = {
53
53
  contextWindow: 128000,
54
54
  maxTokens: 8192,
55
55
  },
56
- "amazon.nova-premier-v1:0": {
57
- id: "amazon.nova-premier-v1:0",
58
- name: "Nova Premier",
59
- api: "bedrock-converse-stream",
60
- provider: "amazon-bedrock",
61
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
62
- reasoning: true,
63
- input: ["text", "image"],
64
- cost: {
65
- input: 2.5,
66
- output: 12.5,
67
- cacheRead: 0,
68
- cacheWrite: 0,
69
- },
70
- contextWindow: 1000000,
71
- maxTokens: 16384,
72
- },
73
56
  "amazon.nova-pro-v1:0": {
74
57
  id: "amazon.nova-pro-v1:0",
75
58
  name: "Nova Pro",
@@ -87,91 +70,6 @@ export const MODELS = {
87
70
  contextWindow: 300000,
88
71
  maxTokens: 8192,
89
72
  },
90
- "anthropic.claude-3-5-haiku-20241022-v1:0": {
91
- id: "anthropic.claude-3-5-haiku-20241022-v1:0",
92
- name: "Claude Haiku 3.5",
93
- api: "bedrock-converse-stream",
94
- provider: "amazon-bedrock",
95
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
96
- reasoning: false,
97
- input: ["text", "image"],
98
- cost: {
99
- input: 0.8,
100
- output: 4,
101
- cacheRead: 0.08,
102
- cacheWrite: 1,
103
- },
104
- contextWindow: 200000,
105
- maxTokens: 8192,
106
- },
107
- "anthropic.claude-3-5-sonnet-20240620-v1:0": {
108
- id: "anthropic.claude-3-5-sonnet-20240620-v1:0",
109
- name: "Claude Sonnet 3.5",
110
- api: "bedrock-converse-stream",
111
- provider: "amazon-bedrock",
112
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
113
- reasoning: false,
114
- input: ["text", "image"],
115
- cost: {
116
- input: 3,
117
- output: 15,
118
- cacheRead: 0.3,
119
- cacheWrite: 3.75,
120
- },
121
- contextWindow: 200000,
122
- maxTokens: 8192,
123
- },
124
- "anthropic.claude-3-5-sonnet-20241022-v2:0": {
125
- id: "anthropic.claude-3-5-sonnet-20241022-v2:0",
126
- name: "Claude Sonnet 3.5 v2",
127
- api: "bedrock-converse-stream",
128
- provider: "amazon-bedrock",
129
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
130
- reasoning: false,
131
- input: ["text", "image"],
132
- cost: {
133
- input: 3,
134
- output: 15,
135
- cacheRead: 0.3,
136
- cacheWrite: 3.75,
137
- },
138
- contextWindow: 200000,
139
- maxTokens: 8192,
140
- },
141
- "anthropic.claude-3-7-sonnet-20250219-v1:0": {
142
- id: "anthropic.claude-3-7-sonnet-20250219-v1:0",
143
- name: "Claude Sonnet 3.7",
144
- api: "bedrock-converse-stream",
145
- provider: "amazon-bedrock",
146
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
147
- reasoning: false,
148
- input: ["text", "image"],
149
- cost: {
150
- input: 3,
151
- output: 15,
152
- cacheRead: 0.3,
153
- cacheWrite: 3.75,
154
- },
155
- contextWindow: 200000,
156
- maxTokens: 8192,
157
- },
158
- "anthropic.claude-3-haiku-20240307-v1:0": {
159
- id: "anthropic.claude-3-haiku-20240307-v1:0",
160
- name: "Claude Haiku 3",
161
- api: "bedrock-converse-stream",
162
- provider: "amazon-bedrock",
163
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
164
- reasoning: false,
165
- input: ["text", "image"],
166
- cost: {
167
- input: 0.25,
168
- output: 1.25,
169
- cacheRead: 0,
170
- cacheWrite: 0,
171
- },
172
- contextWindow: 200000,
173
- maxTokens: 4096,
174
- },
175
73
  "anthropic.claude-haiku-4-5-20251001-v1:0": {
176
74
  id: "anthropic.claude-haiku-4-5-20251001-v1:0",
177
75
  name: "Claude Haiku 4.5",
@@ -206,23 +104,6 @@ export const MODELS = {
206
104
  contextWindow: 200000,
207
105
  maxTokens: 32000,
208
106
  },
209
- "anthropic.claude-opus-4-20250514-v1:0": {
210
- id: "anthropic.claude-opus-4-20250514-v1:0",
211
- name: "Claude Opus 4",
212
- api: "bedrock-converse-stream",
213
- provider: "amazon-bedrock",
214
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
215
- reasoning: true,
216
- input: ["text", "image"],
217
- cost: {
218
- input: 15,
219
- output: 75,
220
- cacheRead: 1.5,
221
- cacheWrite: 18.75,
222
- },
223
- contextWindow: 200000,
224
- maxTokens: 32000,
225
- },
226
107
  "anthropic.claude-opus-4-5-20251101-v1:0": {
227
108
  id: "anthropic.claude-opus-4-5-20251101-v1:0",
228
109
  name: "Claude Opus 4.5",
@@ -276,9 +157,9 @@ export const MODELS = {
276
157
  contextWindow: 1000000,
277
158
  maxTokens: 128000,
278
159
  },
279
- "anthropic.claude-sonnet-4-20250514-v1:0": {
280
- id: "anthropic.claude-sonnet-4-20250514-v1:0",
281
- name: "Claude Sonnet 4",
160
+ "anthropic.claude-sonnet-4-5-20250929-v1:0": {
161
+ id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
162
+ name: "Claude Sonnet 4.5",
282
163
  api: "bedrock-converse-stream",
283
164
  provider: "amazon-bedrock",
284
165
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -293,9 +174,9 @@ export const MODELS = {
293
174
  contextWindow: 200000,
294
175
  maxTokens: 64000,
295
176
  },
296
- "anthropic.claude-sonnet-4-5-20250929-v1:0": {
297
- id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
298
- name: "Claude Sonnet 4.5",
177
+ "anthropic.claude-sonnet-4-6": {
178
+ id: "anthropic.claude-sonnet-4-6",
179
+ name: "Claude Sonnet 4.6",
299
180
  api: "bedrock-converse-stream",
300
181
  provider: "amazon-bedrock",
301
182
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -307,24 +188,24 @@ export const MODELS = {
307
188
  cacheRead: 0.3,
308
189
  cacheWrite: 3.75,
309
190
  },
310
- contextWindow: 200000,
191
+ contextWindow: 1000000,
311
192
  maxTokens: 64000,
312
193
  },
313
- "anthropic.claude-sonnet-4-6": {
314
- id: "anthropic.claude-sonnet-4-6",
315
- name: "Claude Sonnet 4.6",
194
+ "au.anthropic.claude-haiku-4-5-20251001-v1:0": {
195
+ id: "au.anthropic.claude-haiku-4-5-20251001-v1:0",
196
+ name: "Claude Haiku 4.5 (AU)",
316
197
  api: "bedrock-converse-stream",
317
198
  provider: "amazon-bedrock",
318
199
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
319
200
  reasoning: true,
320
201
  input: ["text", "image"],
321
202
  cost: {
322
- input: 3,
323
- output: 15,
324
- cacheRead: 0.3,
325
- cacheWrite: 3.75,
203
+ input: 1,
204
+ output: 5,
205
+ cacheRead: 0.1,
206
+ cacheWrite: 1.25,
326
207
  },
327
- contextWindow: 1000000,
208
+ contextWindow: 200000,
328
209
  maxTokens: 64000,
329
210
  },
330
211
  "au.anthropic.claude-opus-4-6-v1": {
@@ -345,6 +226,23 @@ export const MODELS = {
345
226
  contextWindow: 1000000,
346
227
  maxTokens: 128000,
347
228
  },
229
+ "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
230
+ id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
231
+ name: "Claude Sonnet 4.5 (AU)",
232
+ api: "bedrock-converse-stream",
233
+ provider: "amazon-bedrock",
234
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
235
+ reasoning: true,
236
+ input: ["text", "image"],
237
+ cost: {
238
+ input: 3,
239
+ output: 15,
240
+ cacheRead: 0.3,
241
+ cacheWrite: 3.75,
242
+ },
243
+ contextWindow: 200000,
244
+ maxTokens: 64000,
245
+ },
348
246
  "au.anthropic.claude-sonnet-4-6": {
349
247
  id: "au.anthropic.claude-sonnet-4-6",
350
248
  name: "AU Anthropic Claude Sonnet 4.6",
@@ -483,23 +381,6 @@ export const MODELS = {
483
381
  contextWindow: 1000000,
484
382
  maxTokens: 128000,
485
383
  },
486
- "eu.anthropic.claude-sonnet-4-20250514-v1:0": {
487
- id: "eu.anthropic.claude-sonnet-4-20250514-v1:0",
488
- name: "Claude Sonnet 4 (EU)",
489
- api: "bedrock-converse-stream",
490
- provider: "amazon-bedrock",
491
- baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
492
- reasoning: true,
493
- input: ["text", "image"],
494
- cost: {
495
- input: 3,
496
- output: 15,
497
- cacheRead: 0.3,
498
- cacheWrite: 3.75,
499
- },
500
- contextWindow: 200000,
501
- maxTokens: 64000,
502
- },
503
384
  "eu.anthropic.claude-sonnet-4-5-20250929-v1:0": {
504
385
  id: "eu.anthropic.claude-sonnet-4-5-20250929-v1:0",
505
386
  name: "Claude Sonnet 4.5 (EU)",
@@ -604,23 +485,6 @@ export const MODELS = {
604
485
  contextWindow: 1000000,
605
486
  maxTokens: 128000,
606
487
  },
607
- "global.anthropic.claude-sonnet-4-20250514-v1:0": {
608
- id: "global.anthropic.claude-sonnet-4-20250514-v1:0",
609
- name: "Claude Sonnet 4 (Global)",
610
- api: "bedrock-converse-stream",
611
- provider: "amazon-bedrock",
612
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
613
- reasoning: true,
614
- input: ["text", "image"],
615
- cost: {
616
- input: 3,
617
- output: 15,
618
- cacheRead: 0.3,
619
- cacheWrite: 3.75,
620
- },
621
- contextWindow: 200000,
622
- maxTokens: 64000,
623
- },
624
488
  "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
625
489
  id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
626
490
  name: "Claude Sonnet 4.5 (Global)",
@@ -689,119 +553,86 @@ export const MODELS = {
689
553
  contextWindow: 128000,
690
554
  maxTokens: 4096,
691
555
  },
692
- "meta.llama3-1-405b-instruct-v1:0": {
693
- id: "meta.llama3-1-405b-instruct-v1:0",
694
- name: "Llama 3.1 405B Instruct",
556
+ "jp.anthropic.claude-opus-4-7": {
557
+ id: "jp.anthropic.claude-opus-4-7",
558
+ name: "Claude Opus 4.7 (JP)",
695
559
  api: "bedrock-converse-stream",
696
560
  provider: "amazon-bedrock",
697
561
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
698
- reasoning: false,
699
- input: ["text"],
700
- cost: {
701
- input: 2.4,
702
- output: 2.4,
703
- cacheRead: 0,
704
- cacheWrite: 0,
705
- },
706
- contextWindow: 128000,
707
- maxTokens: 4096,
708
- },
709
- "meta.llama3-1-70b-instruct-v1:0": {
710
- id: "meta.llama3-1-70b-instruct-v1:0",
711
- name: "Llama 3.1 70B Instruct",
712
- api: "bedrock-converse-stream",
713
- provider: "amazon-bedrock",
714
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
715
- reasoning: false,
716
- input: ["text"],
562
+ reasoning: true,
563
+ thinkingLevelMap: { "xhigh": "xhigh" },
564
+ input: ["text", "image"],
717
565
  cost: {
718
- input: 0.72,
719
- output: 0.72,
720
- cacheRead: 0,
721
- cacheWrite: 0,
566
+ input: 5,
567
+ output: 25,
568
+ cacheRead: 0.5,
569
+ cacheWrite: 6.25,
722
570
  },
723
- contextWindow: 128000,
724
- maxTokens: 4096,
571
+ contextWindow: 1000000,
572
+ maxTokens: 128000,
725
573
  },
726
- "meta.llama3-1-8b-instruct-v1:0": {
727
- id: "meta.llama3-1-8b-instruct-v1:0",
728
- name: "Llama 3.1 8B Instruct",
574
+ "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
575
+ id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
576
+ name: "Claude Sonnet 4.5 (JP)",
729
577
  api: "bedrock-converse-stream",
730
578
  provider: "amazon-bedrock",
731
579
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
732
- reasoning: false,
733
- input: ["text"],
580
+ reasoning: true,
581
+ input: ["text", "image"],
734
582
  cost: {
735
- input: 0.22,
736
- output: 0.22,
737
- cacheRead: 0,
738
- cacheWrite: 0,
583
+ input: 3,
584
+ output: 15,
585
+ cacheRead: 0.3,
586
+ cacheWrite: 3.75,
739
587
  },
740
- contextWindow: 128000,
741
- maxTokens: 4096,
588
+ contextWindow: 200000,
589
+ maxTokens: 64000,
742
590
  },
743
- "meta.llama3-2-11b-instruct-v1:0": {
744
- id: "meta.llama3-2-11b-instruct-v1:0",
745
- name: "Llama 3.2 11B Instruct",
591
+ "jp.anthropic.claude-sonnet-4-6": {
592
+ id: "jp.anthropic.claude-sonnet-4-6",
593
+ name: "Claude Sonnet 4.6 (JP)",
746
594
  api: "bedrock-converse-stream",
747
595
  provider: "amazon-bedrock",
748
596
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
749
- reasoning: false,
597
+ reasoning: true,
750
598
  input: ["text", "image"],
751
599
  cost: {
752
- input: 0.16,
753
- output: 0.16,
754
- cacheRead: 0,
755
- cacheWrite: 0,
600
+ input: 3,
601
+ output: 15,
602
+ cacheRead: 0.3,
603
+ cacheWrite: 3.75,
756
604
  },
757
- contextWindow: 128000,
758
- maxTokens: 4096,
605
+ contextWindow: 1000000,
606
+ maxTokens: 64000,
759
607
  },
760
- "meta.llama3-2-1b-instruct-v1:0": {
761
- id: "meta.llama3-2-1b-instruct-v1:0",
762
- name: "Llama 3.2 1B Instruct",
608
+ "meta.llama3-1-70b-instruct-v1:0": {
609
+ id: "meta.llama3-1-70b-instruct-v1:0",
610
+ name: "Llama 3.1 70B Instruct",
763
611
  api: "bedrock-converse-stream",
764
612
  provider: "amazon-bedrock",
765
613
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
766
614
  reasoning: false,
767
615
  input: ["text"],
768
616
  cost: {
769
- input: 0.1,
770
- output: 0.1,
617
+ input: 0.72,
618
+ output: 0.72,
771
619
  cacheRead: 0,
772
620
  cacheWrite: 0,
773
621
  },
774
- contextWindow: 131000,
622
+ contextWindow: 128000,
775
623
  maxTokens: 4096,
776
624
  },
777
- "meta.llama3-2-3b-instruct-v1:0": {
778
- id: "meta.llama3-2-3b-instruct-v1:0",
779
- name: "Llama 3.2 3B Instruct",
625
+ "meta.llama3-1-8b-instruct-v1:0": {
626
+ id: "meta.llama3-1-8b-instruct-v1:0",
627
+ name: "Llama 3.1 8B Instruct",
780
628
  api: "bedrock-converse-stream",
781
629
  provider: "amazon-bedrock",
782
630
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
783
631
  reasoning: false,
784
632
  input: ["text"],
785
633
  cost: {
786
- input: 0.15,
787
- output: 0.15,
788
- cacheRead: 0,
789
- cacheWrite: 0,
790
- },
791
- contextWindow: 131000,
792
- maxTokens: 4096,
793
- },
794
- "meta.llama3-2-90b-instruct-v1:0": {
795
- id: "meta.llama3-2-90b-instruct-v1:0",
796
- name: "Llama 3.2 90B Instruct",
797
- api: "bedrock-converse-stream",
798
- provider: "amazon-bedrock",
799
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
800
- reasoning: false,
801
- input: ["text", "image"],
802
- cost: {
803
- input: 0.72,
804
- output: 0.72,
634
+ input: 0.22,
635
+ output: 0.22,
805
636
  cacheRead: 0,
806
637
  cacheWrite: 0,
807
638
  },
@@ -1180,7 +1011,7 @@ export const MODELS = {
1180
1011
  cacheWrite: 0,
1181
1012
  },
1182
1013
  contextWindow: 128000,
1183
- maxTokens: 4096,
1014
+ maxTokens: 16384,
1184
1015
  },
1185
1016
  "openai.gpt-oss-20b-1:0": {
1186
1017
  id: "openai.gpt-oss-20b-1:0",
@@ -1197,7 +1028,7 @@ export const MODELS = {
1197
1028
  cacheWrite: 0,
1198
1029
  },
1199
1030
  contextWindow: 128000,
1200
- maxTokens: 4096,
1031
+ maxTokens: 16384,
1201
1032
  },
1202
1033
  "openai.gpt-oss-safeguard-120b": {
1203
1034
  id: "openai.gpt-oss-safeguard-120b",
@@ -1214,7 +1045,7 @@ export const MODELS = {
1214
1045
  cacheWrite: 0,
1215
1046
  },
1216
1047
  contextWindow: 128000,
1217
- maxTokens: 4096,
1048
+ maxTokens: 16384,
1218
1049
  },
1219
1050
  "openai.gpt-oss-safeguard-20b": {
1220
1051
  id: "openai.gpt-oss-safeguard-20b",
@@ -1231,7 +1062,7 @@ export const MODELS = {
1231
1062
  cacheWrite: 0,
1232
1063
  },
1233
1064
  contextWindow: 128000,
1234
- maxTokens: 4096,
1065
+ maxTokens: 16384,
1235
1066
  },
1236
1067
  "qwen.qwen3-235b-a22b-2507-v1:0": {
1237
1068
  id: "qwen.qwen3-235b-a22b-2507-v1:0",
@@ -1386,23 +1217,6 @@ export const MODELS = {
1386
1217
  contextWindow: 200000,
1387
1218
  maxTokens: 32000,
1388
1219
  },
1389
- "us.anthropic.claude-opus-4-20250514-v1:0": {
1390
- id: "us.anthropic.claude-opus-4-20250514-v1:0",
1391
- name: "Claude Opus 4 (US)",
1392
- api: "bedrock-converse-stream",
1393
- provider: "amazon-bedrock",
1394
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1395
- reasoning: true,
1396
- input: ["text", "image"],
1397
- cost: {
1398
- input: 15,
1399
- output: 75,
1400
- cacheRead: 1.5,
1401
- cacheWrite: 18.75,
1402
- },
1403
- contextWindow: 200000,
1404
- maxTokens: 32000,
1405
- },
1406
1220
  "us.anthropic.claude-opus-4-5-20251101-v1:0": {
1407
1221
  id: "us.anthropic.claude-opus-4-5-20251101-v1:0",
1408
1222
  name: "Claude Opus 4.5 (US)",
@@ -1456,9 +1270,9 @@ export const MODELS = {
1456
1270
  contextWindow: 1000000,
1457
1271
  maxTokens: 128000,
1458
1272
  },
1459
- "us.anthropic.claude-sonnet-4-20250514-v1:0": {
1460
- id: "us.anthropic.claude-sonnet-4-20250514-v1:0",
1461
- name: "Claude Sonnet 4 (US)",
1273
+ "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1274
+ id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1275
+ name: "Claude Sonnet 4.5 (US)",
1462
1276
  api: "bedrock-converse-stream",
1463
1277
  provider: "amazon-bedrock",
1464
1278
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -1473,9 +1287,9 @@ export const MODELS = {
1473
1287
  contextWindow: 200000,
1474
1288
  maxTokens: 64000,
1475
1289
  },
1476
- "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1477
- id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1478
- name: "Claude Sonnet 4.5 (US)",
1290
+ "us.anthropic.claude-sonnet-4-6": {
1291
+ id: "us.anthropic.claude-sonnet-4-6",
1292
+ name: "Claude Sonnet 4.6 (US)",
1479
1293
  api: "bedrock-converse-stream",
1480
1294
  provider: "amazon-bedrock",
1481
1295
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -1487,25 +1301,59 @@ export const MODELS = {
1487
1301
  cacheRead: 0.3,
1488
1302
  cacheWrite: 3.75,
1489
1303
  },
1490
- contextWindow: 200000,
1304
+ contextWindow: 1000000,
1491
1305
  maxTokens: 64000,
1492
1306
  },
1493
- "us.anthropic.claude-sonnet-4-6": {
1494
- id: "us.anthropic.claude-sonnet-4-6",
1495
- name: "Claude Sonnet 4.6 (US)",
1307
+ "us.deepseek.r1-v1:0": {
1308
+ id: "us.deepseek.r1-v1:0",
1309
+ name: "DeepSeek-R1 (US)",
1496
1310
  api: "bedrock-converse-stream",
1497
1311
  provider: "amazon-bedrock",
1498
1312
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1499
1313
  reasoning: true,
1314
+ input: ["text"],
1315
+ cost: {
1316
+ input: 1.35,
1317
+ output: 5.4,
1318
+ cacheRead: 0,
1319
+ cacheWrite: 0,
1320
+ },
1321
+ contextWindow: 128000,
1322
+ maxTokens: 32768,
1323
+ },
1324
+ "us.meta.llama4-maverick-17b-instruct-v1:0": {
1325
+ id: "us.meta.llama4-maverick-17b-instruct-v1:0",
1326
+ name: "Llama 4 Maverick 17B Instruct (US)",
1327
+ api: "bedrock-converse-stream",
1328
+ provider: "amazon-bedrock",
1329
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1330
+ reasoning: false,
1500
1331
  input: ["text", "image"],
1501
1332
  cost: {
1502
- input: 3,
1503
- output: 15,
1504
- cacheRead: 0.3,
1505
- cacheWrite: 3.75,
1333
+ input: 0.24,
1334
+ output: 0.97,
1335
+ cacheRead: 0,
1336
+ cacheWrite: 0,
1506
1337
  },
1507
1338
  contextWindow: 1000000,
1508
- maxTokens: 64000,
1339
+ maxTokens: 16384,
1340
+ },
1341
+ "us.meta.llama4-scout-17b-instruct-v1:0": {
1342
+ id: "us.meta.llama4-scout-17b-instruct-v1:0",
1343
+ name: "Llama 4 Scout 17B Instruct (US)",
1344
+ api: "bedrock-converse-stream",
1345
+ provider: "amazon-bedrock",
1346
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1347
+ reasoning: false,
1348
+ input: ["text", "image"],
1349
+ cost: {
1350
+ input: 0.17,
1351
+ output: 0.66,
1352
+ cacheRead: 0,
1353
+ cacheWrite: 0,
1354
+ },
1355
+ contextWindow: 3500000,
1356
+ maxTokens: 16384,
1509
1357
  },
1510
1358
  "writer.palmyra-x4-v1:0": {
1511
1359
  id: "writer.palmyra-x4-v1:0",
@@ -3601,6 +3449,7 @@ export const MODELS = {
3601
3449
  api: "anthropic-messages",
3602
3450
  provider: "fireworks",
3603
3451
  baseUrl: "https://api.fireworks.ai/inference",
3452
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3604
3453
  reasoning: true,
3605
3454
  input: ["text"],
3606
3455
  cost: {
@@ -3611,12 +3460,6 @@ export const MODELS = {
3611
3460
  },
3612
3461
  contextWindow: 163840,
3613
3462
  maxTokens: 163840,
3614
- compat: {
3615
- sendSessionAffinityHeaders: true,
3616
- supportsEagerToolInputStreaming: false,
3617
- supportsCacheControlOnTools: false,
3618
- supportsLongCacheRetention: false,
3619
- },
3620
3463
  },
3621
3464
  "accounts/fireworks/models/deepseek-v3p2": {
3622
3465
  id: "accounts/fireworks/models/deepseek-v3p2",
@@ -3624,6 +3467,7 @@ export const MODELS = {
3624
3467
  api: "anthropic-messages",
3625
3468
  provider: "fireworks",
3626
3469
  baseUrl: "https://api.fireworks.ai/inference",
3470
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3627
3471
  reasoning: true,
3628
3472
  input: ["text"],
3629
3473
  cost: {
@@ -3634,12 +3478,6 @@ export const MODELS = {
3634
3478
  },
3635
3479
  contextWindow: 160000,
3636
3480
  maxTokens: 160000,
3637
- compat: {
3638
- sendSessionAffinityHeaders: true,
3639
- supportsEagerToolInputStreaming: false,
3640
- supportsCacheControlOnTools: false,
3641
- supportsLongCacheRetention: false,
3642
- },
3643
3481
  },
3644
3482
  "accounts/fireworks/models/deepseek-v4-pro": {
3645
3483
  id: "accounts/fireworks/models/deepseek-v4-pro",
@@ -3647,6 +3485,7 @@ export const MODELS = {
3647
3485
  api: "anthropic-messages",
3648
3486
  provider: "fireworks",
3649
3487
  baseUrl: "https://api.fireworks.ai/inference",
3488
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3650
3489
  reasoning: true,
3651
3490
  input: ["text"],
3652
3491
  cost: {
@@ -3657,12 +3496,6 @@ export const MODELS = {
3657
3496
  },
3658
3497
  contextWindow: 1000000,
3659
3498
  maxTokens: 384000,
3660
- compat: {
3661
- sendSessionAffinityHeaders: true,
3662
- supportsEagerToolInputStreaming: false,
3663
- supportsCacheControlOnTools: false,
3664
- supportsLongCacheRetention: false,
3665
- },
3666
3499
  },
3667
3500
  "accounts/fireworks/models/glm-4p5": {
3668
3501
  id: "accounts/fireworks/models/glm-4p5",
@@ -3670,6 +3503,7 @@ export const MODELS = {
3670
3503
  api: "anthropic-messages",
3671
3504
  provider: "fireworks",
3672
3505
  baseUrl: "https://api.fireworks.ai/inference",
3506
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3673
3507
  reasoning: true,
3674
3508
  input: ["text"],
3675
3509
  cost: {
@@ -3680,12 +3514,6 @@ export const MODELS = {
3680
3514
  },
3681
3515
  contextWindow: 131072,
3682
3516
  maxTokens: 131072,
3683
- compat: {
3684
- sendSessionAffinityHeaders: true,
3685
- supportsEagerToolInputStreaming: false,
3686
- supportsCacheControlOnTools: false,
3687
- supportsLongCacheRetention: false,
3688
- },
3689
3517
  },
3690
3518
  "accounts/fireworks/models/glm-4p5-air": {
3691
3519
  id: "accounts/fireworks/models/glm-4p5-air",
@@ -3693,6 +3521,7 @@ export const MODELS = {
3693
3521
  api: "anthropic-messages",
3694
3522
  provider: "fireworks",
3695
3523
  baseUrl: "https://api.fireworks.ai/inference",
3524
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3696
3525
  reasoning: true,
3697
3526
  input: ["text"],
3698
3527
  cost: {
@@ -3703,12 +3532,6 @@ export const MODELS = {
3703
3532
  },
3704
3533
  contextWindow: 131072,
3705
3534
  maxTokens: 131072,
3706
- compat: {
3707
- sendSessionAffinityHeaders: true,
3708
- supportsEagerToolInputStreaming: false,
3709
- supportsCacheControlOnTools: false,
3710
- supportsLongCacheRetention: false,
3711
- },
3712
3535
  },
3713
3536
  "accounts/fireworks/models/glm-4p7": {
3714
3537
  id: "accounts/fireworks/models/glm-4p7",
@@ -3716,6 +3539,7 @@ export const MODELS = {
3716
3539
  api: "anthropic-messages",
3717
3540
  provider: "fireworks",
3718
3541
  baseUrl: "https://api.fireworks.ai/inference",
3542
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3719
3543
  reasoning: true,
3720
3544
  input: ["text"],
3721
3545
  cost: {
@@ -3726,12 +3550,6 @@ export const MODELS = {
3726
3550
  },
3727
3551
  contextWindow: 198000,
3728
3552
  maxTokens: 198000,
3729
- compat: {
3730
- sendSessionAffinityHeaders: true,
3731
- supportsEagerToolInputStreaming: false,
3732
- supportsCacheControlOnTools: false,
3733
- supportsLongCacheRetention: false,
3734
- },
3735
3553
  },
3736
3554
  "accounts/fireworks/models/glm-5": {
3737
3555
  id: "accounts/fireworks/models/glm-5",
@@ -3739,6 +3557,7 @@ export const MODELS = {
3739
3557
  api: "anthropic-messages",
3740
3558
  provider: "fireworks",
3741
3559
  baseUrl: "https://api.fireworks.ai/inference",
3560
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3742
3561
  reasoning: true,
3743
3562
  input: ["text"],
3744
3563
  cost: {
@@ -3749,12 +3568,6 @@ export const MODELS = {
3749
3568
  },
3750
3569
  contextWindow: 202752,
3751
3570
  maxTokens: 131072,
3752
- compat: {
3753
- sendSessionAffinityHeaders: true,
3754
- supportsEagerToolInputStreaming: false,
3755
- supportsCacheControlOnTools: false,
3756
- supportsLongCacheRetention: false,
3757
- },
3758
3571
  },
3759
3572
  "accounts/fireworks/models/glm-5p1": {
3760
3573
  id: "accounts/fireworks/models/glm-5p1",
@@ -3762,6 +3575,7 @@ export const MODELS = {
3762
3575
  api: "anthropic-messages",
3763
3576
  provider: "fireworks",
3764
3577
  baseUrl: "https://api.fireworks.ai/inference",
3578
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3765
3579
  reasoning: true,
3766
3580
  input: ["text"],
3767
3581
  cost: {
@@ -3772,12 +3586,6 @@ export const MODELS = {
3772
3586
  },
3773
3587
  contextWindow: 202800,
3774
3588
  maxTokens: 131072,
3775
- compat: {
3776
- sendSessionAffinityHeaders: true,
3777
- supportsEagerToolInputStreaming: false,
3778
- supportsCacheControlOnTools: false,
3779
- supportsLongCacheRetention: false,
3780
- },
3781
3589
  },
3782
3590
  "accounts/fireworks/models/gpt-oss-120b": {
3783
3591
  id: "accounts/fireworks/models/gpt-oss-120b",
@@ -3785,6 +3593,7 @@ export const MODELS = {
3785
3593
  api: "anthropic-messages",
3786
3594
  provider: "fireworks",
3787
3595
  baseUrl: "https://api.fireworks.ai/inference",
3596
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3788
3597
  reasoning: true,
3789
3598
  input: ["text"],
3790
3599
  cost: {
@@ -3795,12 +3604,6 @@ export const MODELS = {
3795
3604
  },
3796
3605
  contextWindow: 131072,
3797
3606
  maxTokens: 32768,
3798
- compat: {
3799
- sendSessionAffinityHeaders: true,
3800
- supportsEagerToolInputStreaming: false,
3801
- supportsCacheControlOnTools: false,
3802
- supportsLongCacheRetention: false,
3803
- },
3804
3607
  },
3805
3608
  "accounts/fireworks/models/gpt-oss-20b": {
3806
3609
  id: "accounts/fireworks/models/gpt-oss-20b",
@@ -3808,6 +3611,7 @@ export const MODELS = {
3808
3611
  api: "anthropic-messages",
3809
3612
  provider: "fireworks",
3810
3613
  baseUrl: "https://api.fireworks.ai/inference",
3614
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3811
3615
  reasoning: true,
3812
3616
  input: ["text"],
3813
3617
  cost: {
@@ -3818,12 +3622,6 @@ export const MODELS = {
3818
3622
  },
3819
3623
  contextWindow: 131072,
3820
3624
  maxTokens: 32768,
3821
- compat: {
3822
- sendSessionAffinityHeaders: true,
3823
- supportsEagerToolInputStreaming: false,
3824
- supportsCacheControlOnTools: false,
3825
- supportsLongCacheRetention: false,
3826
- },
3827
3625
  },
3828
3626
  "accounts/fireworks/models/kimi-k2-instruct": {
3829
3627
  id: "accounts/fireworks/models/kimi-k2-instruct",
@@ -3831,6 +3629,7 @@ export const MODELS = {
3831
3629
  api: "anthropic-messages",
3832
3630
  provider: "fireworks",
3833
3631
  baseUrl: "https://api.fireworks.ai/inference",
3632
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3834
3633
  reasoning: false,
3835
3634
  input: ["text"],
3836
3635
  cost: {
@@ -3841,12 +3640,6 @@ export const MODELS = {
3841
3640
  },
3842
3641
  contextWindow: 128000,
3843
3642
  maxTokens: 16384,
3844
- compat: {
3845
- sendSessionAffinityHeaders: true,
3846
- supportsEagerToolInputStreaming: false,
3847
- supportsCacheControlOnTools: false,
3848
- supportsLongCacheRetention: false,
3849
- },
3850
3643
  },
3851
3644
  "accounts/fireworks/models/kimi-k2-thinking": {
3852
3645
  id: "accounts/fireworks/models/kimi-k2-thinking",
@@ -3854,6 +3647,7 @@ export const MODELS = {
3854
3647
  api: "anthropic-messages",
3855
3648
  provider: "fireworks",
3856
3649
  baseUrl: "https://api.fireworks.ai/inference",
3650
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3857
3651
  reasoning: true,
3858
3652
  input: ["text"],
3859
3653
  cost: {
@@ -3864,12 +3658,6 @@ export const MODELS = {
3864
3658
  },
3865
3659
  contextWindow: 256000,
3866
3660
  maxTokens: 256000,
3867
- compat: {
3868
- sendSessionAffinityHeaders: true,
3869
- supportsEagerToolInputStreaming: false,
3870
- supportsCacheControlOnTools: false,
3871
- supportsLongCacheRetention: false,
3872
- },
3873
3661
  },
3874
3662
  "accounts/fireworks/models/kimi-k2p5": {
3875
3663
  id: "accounts/fireworks/models/kimi-k2p5",
@@ -3877,6 +3665,7 @@ export const MODELS = {
3877
3665
  api: "anthropic-messages",
3878
3666
  provider: "fireworks",
3879
3667
  baseUrl: "https://api.fireworks.ai/inference",
3668
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3880
3669
  reasoning: true,
3881
3670
  input: ["text", "image"],
3882
3671
  cost: {
@@ -3887,12 +3676,6 @@ export const MODELS = {
3887
3676
  },
3888
3677
  contextWindow: 256000,
3889
3678
  maxTokens: 256000,
3890
- compat: {
3891
- sendSessionAffinityHeaders: true,
3892
- supportsEagerToolInputStreaming: false,
3893
- supportsCacheControlOnTools: false,
3894
- supportsLongCacheRetention: false,
3895
- },
3896
3679
  },
3897
3680
  "accounts/fireworks/models/kimi-k2p6": {
3898
3681
  id: "accounts/fireworks/models/kimi-k2p6",
@@ -3900,6 +3683,7 @@ export const MODELS = {
3900
3683
  api: "anthropic-messages",
3901
3684
  provider: "fireworks",
3902
3685
  baseUrl: "https://api.fireworks.ai/inference",
3686
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3903
3687
  reasoning: true,
3904
3688
  input: ["text", "image"],
3905
3689
  cost: {
@@ -3910,12 +3694,6 @@ export const MODELS = {
3910
3694
  },
3911
3695
  contextWindow: 262000,
3912
3696
  maxTokens: 262000,
3913
- compat: {
3914
- sendSessionAffinityHeaders: true,
3915
- supportsEagerToolInputStreaming: false,
3916
- supportsCacheControlOnTools: false,
3917
- supportsLongCacheRetention: false,
3918
- },
3919
3697
  },
3920
3698
  "accounts/fireworks/models/minimax-m2p1": {
3921
3699
  id: "accounts/fireworks/models/minimax-m2p1",
@@ -3923,6 +3701,7 @@ export const MODELS = {
3923
3701
  api: "anthropic-messages",
3924
3702
  provider: "fireworks",
3925
3703
  baseUrl: "https://api.fireworks.ai/inference",
3704
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3926
3705
  reasoning: true,
3927
3706
  input: ["text"],
3928
3707
  cost: {
@@ -3933,12 +3712,6 @@ export const MODELS = {
3933
3712
  },
3934
3713
  contextWindow: 200000,
3935
3714
  maxTokens: 200000,
3936
- compat: {
3937
- sendSessionAffinityHeaders: true,
3938
- supportsEagerToolInputStreaming: false,
3939
- supportsCacheControlOnTools: false,
3940
- supportsLongCacheRetention: false,
3941
- },
3942
3715
  },
3943
3716
  "accounts/fireworks/models/minimax-m2p5": {
3944
3717
  id: "accounts/fireworks/models/minimax-m2p5",
@@ -3946,6 +3719,7 @@ export const MODELS = {
3946
3719
  api: "anthropic-messages",
3947
3720
  provider: "fireworks",
3948
3721
  baseUrl: "https://api.fireworks.ai/inference",
3722
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3949
3723
  reasoning: true,
3950
3724
  input: ["text"],
3951
3725
  cost: {
@@ -3956,12 +3730,6 @@ export const MODELS = {
3956
3730
  },
3957
3731
  contextWindow: 196608,
3958
3732
  maxTokens: 196608,
3959
- compat: {
3960
- sendSessionAffinityHeaders: true,
3961
- supportsEagerToolInputStreaming: false,
3962
- supportsCacheControlOnTools: false,
3963
- supportsLongCacheRetention: false,
3964
- },
3965
3733
  },
3966
3734
  "accounts/fireworks/models/minimax-m2p7": {
3967
3735
  id: "accounts/fireworks/models/minimax-m2p7",
@@ -3969,6 +3737,7 @@ export const MODELS = {
3969
3737
  api: "anthropic-messages",
3970
3738
  provider: "fireworks",
3971
3739
  baseUrl: "https://api.fireworks.ai/inference",
3740
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3972
3741
  reasoning: true,
3973
3742
  input: ["text"],
3974
3743
  cost: {
@@ -3979,12 +3748,6 @@ export const MODELS = {
3979
3748
  },
3980
3749
  contextWindow: 196608,
3981
3750
  maxTokens: 196608,
3982
- compat: {
3983
- sendSessionAffinityHeaders: true,
3984
- supportsEagerToolInputStreaming: false,
3985
- supportsCacheControlOnTools: false,
3986
- supportsLongCacheRetention: false,
3987
- },
3988
3751
  },
3989
3752
  "accounts/fireworks/models/qwen3p6-plus": {
3990
3753
  id: "accounts/fireworks/models/qwen3p6-plus",
@@ -3992,6 +3755,7 @@ export const MODELS = {
3992
3755
  api: "anthropic-messages",
3993
3756
  provider: "fireworks",
3994
3757
  baseUrl: "https://api.fireworks.ai/inference",
3758
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3995
3759
  reasoning: true,
3996
3760
  input: ["text", "image"],
3997
3761
  cost: {
@@ -4002,12 +3766,6 @@ export const MODELS = {
4002
3766
  },
4003
3767
  contextWindow: 128000,
4004
3768
  maxTokens: 8192,
4005
- compat: {
4006
- sendSessionAffinityHeaders: true,
4007
- supportsEagerToolInputStreaming: false,
4008
- supportsCacheControlOnTools: false,
4009
- supportsLongCacheRetention: false,
4010
- },
4011
3769
  },
4012
3770
  "accounts/fireworks/routers/kimi-k2p5-turbo": {
4013
3771
  id: "accounts/fireworks/routers/kimi-k2p5-turbo",
@@ -4015,6 +3773,7 @@ export const MODELS = {
4015
3773
  api: "anthropic-messages",
4016
3774
  provider: "fireworks",
4017
3775
  baseUrl: "https://api.fireworks.ai/inference",
3776
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
4018
3777
  reasoning: true,
4019
3778
  input: ["text", "image"],
4020
3779
  cost: {
@@ -4025,12 +3784,6 @@ export const MODELS = {
4025
3784
  },
4026
3785
  contextWindow: 256000,
4027
3786
  maxTokens: 256000,
4028
- compat: {
4029
- sendSessionAffinityHeaders: true,
4030
- supportsEagerToolInputStreaming: false,
4031
- supportsCacheControlOnTools: false,
4032
- supportsLongCacheRetention: false,
4033
- },
4034
3787
  },
4035
3788
  },
4036
3789
  "github-copilot": {
@@ -4109,25 +3862,6 @@ export const MODELS = {
4109
3862
  contextWindow: 144000,
4110
3863
  maxTokens: 64000,
4111
3864
  },
4112
- "claude-sonnet-4": {
4113
- id: "claude-sonnet-4",
4114
- name: "Claude Sonnet 4",
4115
- api: "anthropic-messages",
4116
- provider: "github-copilot",
4117
- baseUrl: "https://api.individual.githubcopilot.com",
4118
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4119
- compat: { "supportsEagerToolInputStreaming": false },
4120
- reasoning: true,
4121
- input: ["text", "image"],
4122
- cost: {
4123
- input: 0,
4124
- output: 0,
4125
- cacheRead: 0,
4126
- cacheWrite: 0,
4127
- },
4128
- contextWindow: 216000,
4129
- maxTokens: 16000,
4130
- },
4131
3865
  "claude-sonnet-4.5": {
4132
3866
  id: "claude-sonnet-4.5",
4133
3867
  name: "Claude Sonnet 4.5",
@@ -4173,121 +3907,7 @@ export const MODELS = {
4173
3907
  baseUrl: "https://api.individual.githubcopilot.com",
4174
3908
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4175
3909
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4176
- reasoning: false,
4177
- input: ["text", "image"],
4178
- cost: {
4179
- input: 0,
4180
- output: 0,
4181
- cacheRead: 0,
4182
- cacheWrite: 0,
4183
- },
4184
- contextWindow: 128000,
4185
- maxTokens: 64000,
4186
- },
4187
- "gemini-3-flash-preview": {
4188
- id: "gemini-3-flash-preview",
4189
- name: "Gemini 3 Flash",
4190
- api: "openai-completions",
4191
- provider: "github-copilot",
4192
- baseUrl: "https://api.individual.githubcopilot.com",
4193
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4194
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4195
- reasoning: true,
4196
- input: ["text", "image"],
4197
- cost: {
4198
- input: 0,
4199
- output: 0,
4200
- cacheRead: 0,
4201
- cacheWrite: 0,
4202
- },
4203
- contextWindow: 128000,
4204
- maxTokens: 64000,
4205
- },
4206
- "gemini-3-pro-preview": {
4207
- id: "gemini-3-pro-preview",
4208
- name: "Gemini 3 Pro Preview",
4209
- api: "openai-completions",
4210
- provider: "github-copilot",
4211
- baseUrl: "https://api.individual.githubcopilot.com",
4212
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4213
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4214
- reasoning: true,
4215
- input: ["text", "image"],
4216
- cost: {
4217
- input: 0,
4218
- output: 0,
4219
- cacheRead: 0,
4220
- cacheWrite: 0,
4221
- },
4222
- contextWindow: 128000,
4223
- maxTokens: 64000,
4224
- },
4225
- "gemini-3.1-pro-preview": {
4226
- id: "gemini-3.1-pro-preview",
4227
- name: "Gemini 3.1 Pro Preview",
4228
- api: "openai-completions",
4229
- provider: "github-copilot",
4230
- baseUrl: "https://api.individual.githubcopilot.com",
4231
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4232
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4233
- reasoning: true,
4234
- input: ["text", "image"],
4235
- cost: {
4236
- input: 0,
4237
- output: 0,
4238
- cacheRead: 0,
4239
- cacheWrite: 0,
4240
- },
4241
- contextWindow: 128000,
4242
- maxTokens: 64000,
4243
- },
4244
- "gpt-4.1": {
4245
- id: "gpt-4.1",
4246
- name: "GPT-4.1",
4247
- api: "openai-completions",
4248
- provider: "github-copilot",
4249
- baseUrl: "https://api.individual.githubcopilot.com",
4250
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4251
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4252
- reasoning: false,
4253
- input: ["text", "image"],
4254
- cost: {
4255
- input: 0,
4256
- output: 0,
4257
- cacheRead: 0,
4258
- cacheWrite: 0,
4259
- },
4260
- contextWindow: 128000,
4261
- maxTokens: 16384,
4262
- },
4263
- "gpt-4o": {
4264
- id: "gpt-4o",
4265
- name: "GPT-4o",
4266
- api: "openai-completions",
4267
- provider: "github-copilot",
4268
- baseUrl: "https://api.individual.githubcopilot.com",
4269
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4270
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4271
- reasoning: false,
4272
- input: ["text", "image"],
4273
- cost: {
4274
- input: 0,
4275
- output: 0,
4276
- cacheRead: 0,
4277
- cacheWrite: 0,
4278
- },
4279
- contextWindow: 128000,
4280
- maxTokens: 4096,
4281
- },
4282
- "gpt-5": {
4283
- id: "gpt-5",
4284
- name: "GPT-5",
4285
- api: "openai-responses",
4286
- provider: "github-copilot",
4287
- baseUrl: "https://api.individual.githubcopilot.com",
4288
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4289
- reasoning: true,
4290
- thinkingLevelMap: { "off": null },
3910
+ reasoning: false,
4291
3911
  input: ["text", "image"],
4292
3912
  cost: {
4293
3913
  input: 0,
@@ -4296,17 +3916,17 @@ export const MODELS = {
4296
3916
  cacheWrite: 0,
4297
3917
  },
4298
3918
  contextWindow: 128000,
4299
- maxTokens: 128000,
3919
+ maxTokens: 64000,
4300
3920
  },
4301
- "gpt-5-mini": {
4302
- id: "gpt-5-mini",
4303
- name: "GPT-5-mini",
4304
- api: "openai-responses",
3921
+ "gemini-3-flash-preview": {
3922
+ id: "gemini-3-flash-preview",
3923
+ name: "Gemini 3 Flash",
3924
+ api: "openai-completions",
4305
3925
  provider: "github-copilot",
4306
3926
  baseUrl: "https://api.individual.githubcopilot.com",
4307
3927
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3928
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4308
3929
  reasoning: true,
4309
- thinkingLevelMap: { "off": null },
4310
3930
  input: ["text", "image"],
4311
3931
  cost: {
4312
3932
  input: 0,
@@ -4314,18 +3934,18 @@ export const MODELS = {
4314
3934
  cacheRead: 0,
4315
3935
  cacheWrite: 0,
4316
3936
  },
4317
- contextWindow: 264000,
3937
+ contextWindow: 128000,
4318
3938
  maxTokens: 64000,
4319
3939
  },
4320
- "gpt-5.1": {
4321
- id: "gpt-5.1",
4322
- name: "GPT-5.1",
4323
- api: "openai-responses",
3940
+ "gemini-3.1-pro-preview": {
3941
+ id: "gemini-3.1-pro-preview",
3942
+ name: "Gemini 3.1 Pro Preview",
3943
+ api: "openai-completions",
4324
3944
  provider: "github-copilot",
4325
3945
  baseUrl: "https://api.individual.githubcopilot.com",
4326
3946
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3947
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4327
3948
  reasoning: true,
4328
- thinkingLevelMap: { "off": null },
4329
3949
  input: ["text", "image"],
4330
3950
  cost: {
4331
3951
  input: 0,
@@ -4333,18 +3953,18 @@ export const MODELS = {
4333
3953
  cacheRead: 0,
4334
3954
  cacheWrite: 0,
4335
3955
  },
4336
- contextWindow: 264000,
3956
+ contextWindow: 128000,
4337
3957
  maxTokens: 64000,
4338
3958
  },
4339
- "gpt-5.1-codex": {
4340
- id: "gpt-5.1-codex",
4341
- name: "GPT-5.1-Codex",
4342
- api: "openai-responses",
3959
+ "gpt-4.1": {
3960
+ id: "gpt-4.1",
3961
+ name: "GPT-4.1",
3962
+ api: "openai-completions",
4343
3963
  provider: "github-copilot",
4344
3964
  baseUrl: "https://api.individual.githubcopilot.com",
4345
3965
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4346
- reasoning: true,
4347
- thinkingLevelMap: { "off": null },
3966
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3967
+ reasoning: false,
4348
3968
  input: ["text", "image"],
4349
3969
  cost: {
4350
3970
  input: 0,
@@ -4352,18 +3972,18 @@ export const MODELS = {
4352
3972
  cacheRead: 0,
4353
3973
  cacheWrite: 0,
4354
3974
  },
4355
- contextWindow: 400000,
4356
- maxTokens: 128000,
3975
+ contextWindow: 128000,
3976
+ maxTokens: 16384,
4357
3977
  },
4358
- "gpt-5.1-codex-max": {
4359
- id: "gpt-5.1-codex-max",
4360
- name: "GPT-5.1-Codex-max",
4361
- api: "openai-responses",
3978
+ "gpt-4o": {
3979
+ id: "gpt-4o",
3980
+ name: "GPT-4o",
3981
+ api: "openai-completions",
4362
3982
  provider: "github-copilot",
4363
3983
  baseUrl: "https://api.individual.githubcopilot.com",
4364
3984
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4365
- reasoning: true,
4366
- thinkingLevelMap: { "off": null },
3985
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3986
+ reasoning: false,
4367
3987
  input: ["text", "image"],
4368
3988
  cost: {
4369
3989
  input: 0,
@@ -4371,12 +3991,12 @@ export const MODELS = {
4371
3991
  cacheRead: 0,
4372
3992
  cacheWrite: 0,
4373
3993
  },
4374
- contextWindow: 400000,
4375
- maxTokens: 128000,
3994
+ contextWindow: 128000,
3995
+ maxTokens: 4096,
4376
3996
  },
4377
- "gpt-5.1-codex-mini": {
4378
- id: "gpt-5.1-codex-mini",
4379
- name: "GPT-5.1-Codex-mini",
3997
+ "gpt-5-mini": {
3998
+ id: "gpt-5-mini",
3999
+ name: "GPT-5-mini",
4380
4000
  api: "openai-responses",
4381
4001
  provider: "github-copilot",
4382
4002
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4390,8 +4010,8 @@ export const MODELS = {
4390
4010
  cacheRead: 0,
4391
4011
  cacheWrite: 0,
4392
4012
  },
4393
- contextWindow: 400000,
4394
- maxTokens: 128000,
4013
+ contextWindow: 264000,
4014
+ maxTokens: 64000,
4395
4015
  },
4396
4016
  "gpt-5.2": {
4397
4017
  id: "gpt-5.2",
@@ -4641,7 +4261,7 @@ export const MODELS = {
4641
4261
  cost: {
4642
4262
  input: 0.1,
4643
4263
  output: 0.4,
4644
- cacheRead: 0.025,
4264
+ cacheRead: 0.01,
4645
4265
  cacheWrite: 0,
4646
4266
  },
4647
4267
  contextWindow: 1048576,
@@ -4832,7 +4452,7 @@ export const MODELS = {
4832
4452
  input: 0.25,
4833
4453
  output: 1.5,
4834
4454
  cacheRead: 0.025,
4835
- cacheWrite: 1,
4455
+ cacheWrite: 0,
4836
4456
  },
4837
4457
  contextWindow: 1048576,
4838
4458
  maxTokens: 65536,
@@ -4850,7 +4470,7 @@ export const MODELS = {
4850
4470
  input: 0.25,
4851
4471
  output: 1.5,
4852
4472
  cacheRead: 0.025,
4853
- cacheWrite: 1,
4473
+ cacheWrite: 0,
4854
4474
  },
4855
4475
  contextWindow: 1048576,
4856
4476
  maxTokens: 65536,
@@ -4922,95 +4542,303 @@ export const MODELS = {
4922
4542
  cacheRead: 0.025,
4923
4543
  cacheWrite: 0,
4924
4544
  },
4925
- contextWindow: 1048576,
4926
- maxTokens: 65536,
4545
+ contextWindow: 1048576,
4546
+ maxTokens: 65536,
4547
+ },
4548
+ "gemini-live-2.5-flash": {
4549
+ id: "gemini-live-2.5-flash",
4550
+ name: "Gemini Live 2.5 Flash",
4551
+ api: "google-generative-ai",
4552
+ provider: "google",
4553
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4554
+ reasoning: true,
4555
+ input: ["text", "image"],
4556
+ cost: {
4557
+ input: 0.5,
4558
+ output: 2,
4559
+ cacheRead: 0,
4560
+ cacheWrite: 0,
4561
+ },
4562
+ contextWindow: 128000,
4563
+ maxTokens: 8000,
4564
+ },
4565
+ "gemini-live-2.5-flash-preview-native-audio": {
4566
+ id: "gemini-live-2.5-flash-preview-native-audio",
4567
+ name: "Gemini Live 2.5 Flash Preview Native Audio",
4568
+ api: "google-generative-ai",
4569
+ provider: "google",
4570
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4571
+ reasoning: true,
4572
+ input: ["text"],
4573
+ cost: {
4574
+ input: 0.5,
4575
+ output: 2,
4576
+ cacheRead: 0,
4577
+ cacheWrite: 0,
4578
+ },
4579
+ contextWindow: 131072,
4580
+ maxTokens: 65536,
4581
+ },
4582
+ "gemma-3-27b-it": {
4583
+ id: "gemma-3-27b-it",
4584
+ name: "Gemma 3 27B",
4585
+ api: "google-generative-ai",
4586
+ provider: "google",
4587
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4588
+ reasoning: false,
4589
+ input: ["text", "image"],
4590
+ cost: {
4591
+ input: 0,
4592
+ output: 0,
4593
+ cacheRead: 0,
4594
+ cacheWrite: 0,
4595
+ },
4596
+ contextWindow: 131072,
4597
+ maxTokens: 8192,
4598
+ },
4599
+ "gemma-4-26b-a4b-it": {
4600
+ id: "gemma-4-26b-a4b-it",
4601
+ name: "Gemma 4 26B",
4602
+ api: "google-generative-ai",
4603
+ provider: "google",
4604
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4605
+ reasoning: true,
4606
+ thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4607
+ input: ["text", "image"],
4608
+ cost: {
4609
+ input: 0,
4610
+ output: 0,
4611
+ cacheRead: 0,
4612
+ cacheWrite: 0,
4613
+ },
4614
+ contextWindow: 256000,
4615
+ maxTokens: 8192,
4616
+ },
4617
+ "gemma-4-31b-it": {
4618
+ id: "gemma-4-31b-it",
4619
+ name: "Gemma 4 31B",
4620
+ api: "google-generative-ai",
4621
+ provider: "google",
4622
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4623
+ reasoning: true,
4624
+ thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4625
+ input: ["text", "image"],
4626
+ cost: {
4627
+ input: 0,
4628
+ output: 0,
4629
+ cacheRead: 0,
4630
+ cacheWrite: 0,
4631
+ },
4632
+ contextWindow: 256000,
4633
+ maxTokens: 8192,
4634
+ },
4635
+ },
4636
+ "google-antigravity": {
4637
+ "claude-opus-4": {
4638
+ id: "claude-opus-4",
4639
+ name: "Claude Opus 4",
4640
+ api: "google-gemini-cli",
4641
+ provider: "google-antigravity",
4642
+ baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4643
+ reasoning: true,
4644
+ input: ["text", "image"],
4645
+ cost: {
4646
+ input: 0,
4647
+ output: 0,
4648
+ cacheRead: 0,
4649
+ cacheWrite: 0,
4650
+ },
4651
+ contextWindow: 200000,
4652
+ maxTokens: 32000,
4653
+ },
4654
+ "claude-sonnet-4": {
4655
+ id: "claude-sonnet-4",
4656
+ name: "Claude Sonnet 4",
4657
+ api: "google-gemini-cli",
4658
+ provider: "google-antigravity",
4659
+ baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4660
+ reasoning: true,
4661
+ input: ["text", "image"],
4662
+ cost: {
4663
+ input: 0,
4664
+ output: 0,
4665
+ cacheRead: 0,
4666
+ cacheWrite: 0,
4667
+ },
4668
+ contextWindow: 200000,
4669
+ maxTokens: 16384,
4670
+ },
4671
+ "gemini-3-flash": {
4672
+ id: "gemini-3-flash",
4673
+ name: "Gemini 3 Flash",
4674
+ api: "google-gemini-cli",
4675
+ provider: "google-antigravity",
4676
+ baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4677
+ reasoning: true,
4678
+ input: ["text", "image"],
4679
+ cost: {
4680
+ input: 0,
4681
+ output: 0,
4682
+ cacheRead: 0,
4683
+ cacheWrite: 0,
4684
+ },
4685
+ contextWindow: 1048576,
4686
+ maxTokens: 65536,
4687
+ },
4688
+ "gemini-3-pro-preview": {
4689
+ id: "gemini-3-pro-preview",
4690
+ name: "Gemini 3 Pro Preview",
4691
+ api: "google-gemini-cli",
4692
+ provider: "google-antigravity",
4693
+ baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4694
+ reasoning: true,
4695
+ input: ["text", "image"],
4696
+ cost: {
4697
+ input: 0,
4698
+ output: 0,
4699
+ cacheRead: 0,
4700
+ cacheWrite: 0,
4701
+ },
4702
+ contextWindow: 1048576,
4703
+ maxTokens: 65536,
4704
+ },
4705
+ "gpt-oss-120b": {
4706
+ id: "gpt-oss-120b",
4707
+ name: "GPT OSS 120B",
4708
+ api: "google-gemini-cli",
4709
+ provider: "google-antigravity",
4710
+ baseUrl: "https://daily-cloudcode-pa.sandbox.googleapis.com",
4711
+ reasoning: true,
4712
+ input: ["text"],
4713
+ cost: {
4714
+ input: 0,
4715
+ output: 0,
4716
+ cacheRead: 0,
4717
+ cacheWrite: 0,
4718
+ },
4719
+ contextWindow: 131072,
4720
+ maxTokens: 16384,
4721
+ },
4722
+ },
4723
+ "google-gemini-cli": {
4724
+ "claude-opus-4": {
4725
+ id: "claude-opus-4",
4726
+ name: "Claude Opus 4",
4727
+ api: "google-gemini-cli",
4728
+ provider: "google-gemini-cli",
4729
+ baseUrl: "https://cloudcode-pa.googleapis.com",
4730
+ reasoning: true,
4731
+ input: ["text", "image"],
4732
+ cost: {
4733
+ input: 15,
4734
+ output: 75,
4735
+ cacheRead: 1.5,
4736
+ cacheWrite: 18.75,
4737
+ },
4738
+ contextWindow: 200000,
4739
+ maxTokens: 32000,
4740
+ },
4741
+ "claude-sonnet-4": {
4742
+ id: "claude-sonnet-4",
4743
+ name: "Claude Sonnet 4",
4744
+ api: "google-gemini-cli",
4745
+ provider: "google-gemini-cli",
4746
+ baseUrl: "https://cloudcode-pa.googleapis.com",
4747
+ reasoning: true,
4748
+ input: ["text", "image"],
4749
+ cost: {
4750
+ input: 3,
4751
+ output: 15,
4752
+ cacheRead: 0.3,
4753
+ cacheWrite: 3.75,
4754
+ },
4755
+ contextWindow: 200000,
4756
+ maxTokens: 16384,
4927
4757
  },
4928
- "gemini-live-2.5-flash": {
4929
- id: "gemini-live-2.5-flash",
4930
- name: "Gemini Live 2.5 Flash",
4931
- api: "google-generative-ai",
4932
- provider: "google",
4933
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4934
- reasoning: true,
4758
+ "gemini-2.0-flash": {
4759
+ id: "gemini-2.0-flash",
4760
+ name: "Gemini 2.0 Flash",
4761
+ api: "google-gemini-cli",
4762
+ provider: "google-gemini-cli",
4763
+ baseUrl: "https://cloudcode-pa.googleapis.com",
4764
+ reasoning: false,
4935
4765
  input: ["text", "image"],
4936
4766
  cost: {
4937
- input: 0.5,
4938
- output: 2,
4767
+ input: 0.075,
4768
+ output: 0.3,
4939
4769
  cacheRead: 0,
4940
4770
  cacheWrite: 0,
4941
4771
  },
4942
- contextWindow: 128000,
4943
- maxTokens: 8000,
4772
+ contextWindow: 1048576,
4773
+ maxTokens: 8192,
4944
4774
  },
4945
- "gemini-live-2.5-flash-preview-native-audio": {
4946
- id: "gemini-live-2.5-flash-preview-native-audio",
4947
- name: "Gemini Live 2.5 Flash Preview Native Audio",
4948
- api: "google-generative-ai",
4949
- provider: "google",
4950
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4775
+ "gemini-2.5-flash": {
4776
+ id: "gemini-2.5-flash",
4777
+ name: "Gemini 2.5 Flash",
4778
+ api: "google-gemini-cli",
4779
+ provider: "google-gemini-cli",
4780
+ baseUrl: "https://cloudcode-pa.googleapis.com",
4951
4781
  reasoning: true,
4952
- input: ["text"],
4782
+ input: ["text", "image"],
4953
4783
  cost: {
4954
- input: 0.5,
4955
- output: 2,
4956
- cacheRead: 0,
4784
+ input: 0.15,
4785
+ output: 0.6,
4786
+ cacheRead: 0.0375,
4957
4787
  cacheWrite: 0,
4958
4788
  },
4959
- contextWindow: 131072,
4789
+ contextWindow: 1048576,
4960
4790
  maxTokens: 65536,
4961
4791
  },
4962
- "gemma-3-27b-it": {
4963
- id: "gemma-3-27b-it",
4964
- name: "Gemma 3 27B",
4965
- api: "google-generative-ai",
4966
- provider: "google",
4967
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4968
- reasoning: false,
4792
+ "gemini-2.5-pro": {
4793
+ id: "gemini-2.5-pro",
4794
+ name: "Gemini 2.5 Pro",
4795
+ api: "google-gemini-cli",
4796
+ provider: "google-gemini-cli",
4797
+ baseUrl: "https://cloudcode-pa.googleapis.com",
4798
+ reasoning: true,
4969
4799
  input: ["text", "image"],
4970
4800
  cost: {
4971
- input: 0,
4972
- output: 0,
4973
- cacheRead: 0,
4801
+ input: 1.25,
4802
+ output: 10,
4803
+ cacheRead: 0.3125,
4974
4804
  cacheWrite: 0,
4975
4805
  },
4976
- contextWindow: 131072,
4977
- maxTokens: 8192,
4806
+ contextWindow: 1048576,
4807
+ maxTokens: 65536,
4978
4808
  },
4979
- "gemma-4-26b-a4b-it": {
4980
- id: "gemma-4-26b-a4b-it",
4981
- name: "Gemma 4 26B",
4982
- api: "google-generative-ai",
4983
- provider: "google",
4984
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4809
+ "gemini-3-flash-preview": {
4810
+ id: "gemini-3-flash-preview",
4811
+ name: "Gemini 3 Flash Preview",
4812
+ api: "google-gemini-cli",
4813
+ provider: "google-gemini-cli",
4814
+ baseUrl: "https://cloudcode-pa.googleapis.com",
4985
4815
  reasoning: true,
4986
- thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4987
4816
  input: ["text", "image"],
4988
4817
  cost: {
4989
- input: 0,
4990
- output: 0,
4991
- cacheRead: 0,
4818
+ input: 0.15,
4819
+ output: 0.6,
4820
+ cacheRead: 0.0375,
4992
4821
  cacheWrite: 0,
4993
4822
  },
4994
- contextWindow: 256000,
4995
- maxTokens: 8192,
4823
+ contextWindow: 1048576,
4824
+ maxTokens: 65536,
4996
4825
  },
4997
- "gemma-4-31b-it": {
4998
- id: "gemma-4-31b-it",
4999
- name: "Gemma 4 31B",
5000
- api: "google-generative-ai",
5001
- provider: "google",
5002
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4826
+ "gemini-3-pro-preview": {
4827
+ id: "gemini-3-pro-preview",
4828
+ name: "Gemini 3 Pro Preview",
4829
+ api: "google-gemini-cli",
4830
+ provider: "google-gemini-cli",
4831
+ baseUrl: "https://cloudcode-pa.googleapis.com",
5003
4832
  reasoning: true,
5004
- thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
5005
4833
  input: ["text", "image"],
5006
4834
  cost: {
5007
- input: 0,
5008
- output: 0,
5009
- cacheRead: 0,
4835
+ input: 1.25,
4836
+ output: 10,
4837
+ cacheRead: 0.3125,
5010
4838
  cacheWrite: 0,
5011
4839
  },
5012
- contextWindow: 256000,
5013
- maxTokens: 8192,
4840
+ contextWindow: 1048576,
4841
+ maxTokens: 65536,
5014
4842
  },
5015
4843
  },
5016
4844
  "google-vertex": {
@@ -7867,6 +7695,25 @@ export const MODELS = {
7867
7695
  contextWindow: 1000000,
7868
7696
  maxTokens: 64000,
7869
7697
  },
7698
+ "deepseek-v4-flash-free": {
7699
+ id: "deepseek-v4-flash-free",
7700
+ name: "DeepSeek V4 Flash Free",
7701
+ api: "openai-completions",
7702
+ provider: "opencode",
7703
+ baseUrl: "https://opencode.ai/zen/v1",
7704
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7705
+ reasoning: true,
7706
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7707
+ input: ["text"],
7708
+ cost: {
7709
+ input: 0,
7710
+ output: 0,
7711
+ cacheRead: 0,
7712
+ cacheWrite: 0,
7713
+ },
7714
+ contextWindow: 200000,
7715
+ maxTokens: 128000,
7716
+ },
7870
7717
  "gemini-3-flash": {
7871
7718
  id: "gemini-3-flash",
7872
7719
  name: "Gemini 3 Flash",
@@ -8225,23 +8072,6 @@ export const MODELS = {
8225
8072
  contextWindow: 1050000,
8226
8073
  maxTokens: 128000,
8227
8074
  },
8228
- "hy3-preview-free": {
8229
- id: "hy3-preview-free",
8230
- name: "Hy3 preview Free",
8231
- api: "openai-completions",
8232
- provider: "opencode",
8233
- baseUrl: "https://opencode.ai/zen/v1",
8234
- reasoning: true,
8235
- input: ["text"],
8236
- cost: {
8237
- input: 0,
8238
- output: 0,
8239
- cacheRead: 0,
8240
- cacheWrite: 0,
8241
- },
8242
- contextWindow: 256000,
8243
- maxTokens: 64000,
8244
- },
8245
8075
  "kimi-k2.5": {
8246
8076
  id: "kimi-k2.5",
8247
8077
  name: "Kimi K2.5",
@@ -8378,6 +8208,23 @@ export const MODELS = {
8378
8208
  contextWindow: 262144,
8379
8209
  maxTokens: 65536,
8380
8210
  },
8211
+ "qwen3.6-plus-free": {
8212
+ id: "qwen3.6-plus-free",
8213
+ name: "Qwen3.6 Plus Free",
8214
+ api: "anthropic-messages",
8215
+ provider: "opencode",
8216
+ baseUrl: "https://opencode.ai/zen",
8217
+ reasoning: true,
8218
+ input: ["text", "image"],
8219
+ cost: {
8220
+ input: 0,
8221
+ output: 0,
8222
+ cacheRead: 0,
8223
+ cacheWrite: 0,
8224
+ },
8225
+ contextWindow: 262144,
8226
+ maxTokens: 65536,
8227
+ },
8381
8228
  },
8382
8229
  "opencode-go": {
8383
8230
  "deepseek-v4-flash": {
@@ -8523,9 +8370,9 @@ export const MODELS = {
8523
8370
  "minimax-m2.5": {
8524
8371
  id: "minimax-m2.5",
8525
8372
  name: "MiniMax M2.5",
8526
- api: "openai-completions",
8373
+ api: "anthropic-messages",
8527
8374
  provider: "opencode-go",
8528
- baseUrl: "https://opencode.ai/zen/go/v1",
8375
+ baseUrl: "https://opencode.ai/zen/go",
8529
8376
  reasoning: true,
8530
8377
  input: ["text"],
8531
8378
  cost: {
@@ -8745,40 +8592,6 @@ export const MODELS = {
8745
8592
  contextWindow: 200000,
8746
8593
  maxTokens: 8192,
8747
8594
  },
8748
- "anthropic/claude-3.7-sonnet": {
8749
- id: "anthropic/claude-3.7-sonnet",
8750
- name: "Anthropic: Claude 3.7 Sonnet",
8751
- api: "openai-completions",
8752
- provider: "openrouter",
8753
- baseUrl: "https://openrouter.ai/api/v1",
8754
- reasoning: true,
8755
- input: ["text", "image"],
8756
- cost: {
8757
- input: 3,
8758
- output: 15,
8759
- cacheRead: 0.3,
8760
- cacheWrite: 3.75,
8761
- },
8762
- contextWindow: 200000,
8763
- maxTokens: 64000,
8764
- },
8765
- "anthropic/claude-3.7-sonnet:thinking": {
8766
- id: "anthropic/claude-3.7-sonnet:thinking",
8767
- name: "Anthropic: Claude 3.7 Sonnet (thinking)",
8768
- api: "openai-completions",
8769
- provider: "openrouter",
8770
- baseUrl: "https://openrouter.ai/api/v1",
8771
- reasoning: true,
8772
- input: ["text", "image"],
8773
- cost: {
8774
- input: 3,
8775
- output: 15,
8776
- cacheRead: 0.3,
8777
- cacheWrite: 3.75,
8778
- },
8779
- contextWindow: 200000,
8780
- maxTokens: 64000,
8781
- },
8782
8595
  "anthropic/claude-haiku-4.5": {
8783
8596
  id: "anthropic/claude-haiku-4.5",
8784
8597
  name: "Anthropic: Claude Haiku 4.5",
@@ -8901,6 +8714,24 @@ export const MODELS = {
8901
8714
  contextWindow: 1000000,
8902
8715
  maxTokens: 128000,
8903
8716
  },
8717
+ "anthropic/claude-opus-4.7-fast": {
8718
+ id: "anthropic/claude-opus-4.7-fast",
8719
+ name: "Anthropic: Claude Opus 4.7 (Fast)",
8720
+ api: "openai-completions",
8721
+ provider: "openrouter",
8722
+ baseUrl: "https://openrouter.ai/api/v1",
8723
+ reasoning: true,
8724
+ thinkingLevelMap: { "xhigh": "xhigh" },
8725
+ input: ["text", "image"],
8726
+ cost: {
8727
+ input: 30,
8728
+ output: 150,
8729
+ cacheRead: 3,
8730
+ cacheWrite: 37.5,
8731
+ },
8732
+ contextWindow: 1000000,
8733
+ maxTokens: 128000,
8734
+ },
8904
8735
  "anthropic/claude-sonnet-4": {
8905
8736
  id: "anthropic/claude-sonnet-4",
8906
8737
  name: "Anthropic: Claude Sonnet 4",
@@ -8986,6 +8817,23 @@ export const MODELS = {
8986
8817
  contextWindow: 262144,
8987
8818
  maxTokens: 262144,
8988
8819
  },
8820
+ "arcee-ai/trinity-large-thinking:free": {
8821
+ id: "arcee-ai/trinity-large-thinking:free",
8822
+ name: "Arcee AI: Trinity Large Thinking (free)",
8823
+ api: "openai-completions",
8824
+ provider: "openrouter",
8825
+ baseUrl: "https://openrouter.ai/api/v1",
8826
+ reasoning: true,
8827
+ input: ["text"],
8828
+ cost: {
8829
+ input: 0,
8830
+ output: 0,
8831
+ cacheRead: 0,
8832
+ cacheWrite: 0,
8833
+ },
8834
+ contextWindow: 262144,
8835
+ maxTokens: 80000,
8836
+ },
8989
8837
  "arcee-ai/trinity-mini": {
8990
8838
  id: "arcee-ai/trinity-mini",
8991
8839
  name: "Arcee AI: Trinity Mini",
@@ -9068,7 +8916,7 @@ export const MODELS = {
9068
8916
  cacheRead: 0,
9069
8917
  cacheWrite: 0,
9070
8918
  },
9071
- contextWindow: 120000,
8919
+ contextWindow: 131072,
9072
8920
  maxTokens: 8000,
9073
8921
  },
9074
8922
  "baidu/ernie-4.5-vl-28b-a3b": {
@@ -9085,7 +8933,7 @@ export const MODELS = {
9085
8933
  cacheRead: 0,
9086
8934
  cacheWrite: 0,
9087
8935
  },
9088
- contextWindow: 30000,
8936
+ contextWindow: 131072,
9089
8937
  maxTokens: 8000,
9090
8938
  },
9091
8939
  "bytedance-seed/seed-1.6": {
@@ -9233,13 +9081,13 @@ export const MODELS = {
9233
9081
  reasoning: true,
9234
9082
  input: ["text"],
9235
9083
  cost: {
9236
- input: 0.15,
9237
- output: 0.75,
9238
- cacheRead: 0,
9084
+ input: 0.21,
9085
+ output: 0.7899999999999999,
9086
+ cacheRead: 0.13,
9239
9087
  cacheWrite: 0,
9240
9088
  },
9241
- contextWindow: 32768,
9242
- maxTokens: 7168,
9089
+ contextWindow: 163840,
9090
+ maxTokens: 32768,
9243
9091
  },
9244
9092
  "deepseek/deepseek-r1": {
9245
9093
  id: "deepseek/deepseek-r1",
@@ -9255,7 +9103,7 @@ export const MODELS = {
9255
9103
  cacheRead: 0,
9256
9104
  cacheWrite: 0,
9257
9105
  },
9258
- contextWindow: 64000,
9106
+ contextWindow: 163840,
9259
9107
  maxTokens: 16000,
9260
9108
  },
9261
9109
  "deepseek/deepseek-r1-0528": {
@@ -9337,9 +9185,28 @@ export const MODELS = {
9337
9185
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
9338
9186
  input: ["text"],
9339
9187
  cost: {
9340
- input: 0.14,
9341
- output: 0.28,
9342
- cacheRead: 0.0028,
9188
+ input: 0.112,
9189
+ output: 0.224,
9190
+ cacheRead: 0.022,
9191
+ cacheWrite: 0,
9192
+ },
9193
+ contextWindow: 1048576,
9194
+ maxTokens: 4096,
9195
+ },
9196
+ "deepseek/deepseek-v4-flash:free": {
9197
+ id: "deepseek/deepseek-v4-flash:free",
9198
+ name: "DeepSeek: DeepSeek V4 Flash (free)",
9199
+ api: "openai-completions",
9200
+ provider: "openrouter",
9201
+ baseUrl: "https://openrouter.ai/api/v1",
9202
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
9203
+ reasoning: true,
9204
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
9205
+ input: ["text"],
9206
+ cost: {
9207
+ input: 0,
9208
+ output: 0,
9209
+ cacheRead: 0,
9343
9210
  cacheWrite: 0,
9344
9211
  },
9345
9212
  contextWindow: 1048576,
@@ -9599,7 +9466,7 @@ export const MODELS = {
9599
9466
  cacheRead: 0.19999999999999998,
9600
9467
  cacheWrite: 0.375,
9601
9468
  },
9602
- contextWindow: 1048576,
9469
+ contextWindow: 1048756,
9603
9470
  maxTokens: 65536,
9604
9471
  },
9605
9472
  "google/gemma-3-12b-it": {
@@ -9679,8 +9546,8 @@ export const MODELS = {
9679
9546
  reasoning: true,
9680
9547
  input: ["text", "image"],
9681
9548
  cost: {
9682
- input: 0.13,
9683
- output: 0.38,
9549
+ input: 0.12,
9550
+ output: 0.37,
9684
9551
  cacheRead: 0,
9685
9552
  cacheWrite: 0,
9686
9553
  },
@@ -9765,13 +9632,30 @@ export const MODELS = {
9765
9632
  reasoning: false,
9766
9633
  input: ["text"],
9767
9634
  cost: {
9768
- input: 0.08,
9769
- output: 0.24,
9770
- cacheRead: 0.016,
9635
+ input: 0.01,
9636
+ output: 0.03,
9637
+ cacheRead: 0.002,
9638
+ cacheWrite: 0,
9639
+ },
9640
+ contextWindow: 262144,
9641
+ maxTokens: 32768,
9642
+ },
9643
+ "inclusionai/ring-2.6-1t": {
9644
+ id: "inclusionai/ring-2.6-1t",
9645
+ name: "inclusionAI: Ring-2.6-1T",
9646
+ api: "openai-completions",
9647
+ provider: "openrouter",
9648
+ baseUrl: "https://openrouter.ai/api/v1",
9649
+ reasoning: true,
9650
+ input: ["text"],
9651
+ cost: {
9652
+ input: 0.075,
9653
+ output: 0.625,
9654
+ cacheRead: 0.015,
9771
9655
  cacheWrite: 0,
9772
9656
  },
9773
9657
  contextWindow: 262144,
9774
- maxTokens: 32768,
9658
+ maxTokens: 65536,
9775
9659
  },
9776
9660
  "kwaipilot/kat-coder-pro-v2": {
9777
9661
  id: "kwaipilot/kat-coder-pro-v2",
@@ -9821,7 +9705,7 @@ export const MODELS = {
9821
9705
  cacheRead: 0,
9822
9706
  cacheWrite: 0,
9823
9707
  },
9824
- contextWindow: 16384,
9708
+ contextWindow: 131072,
9825
9709
  maxTokens: 16384,
9826
9710
  },
9827
9711
  "meta-llama/llama-3.3-70b-instruct": {
@@ -9855,7 +9739,7 @@ export const MODELS = {
9855
9739
  cacheRead: 0,
9856
9740
  cacheWrite: 0,
9857
9741
  },
9858
- contextWindow: 65536,
9742
+ contextWindow: 131072,
9859
9743
  maxTokens: 4096,
9860
9744
  },
9861
9745
  "meta-llama/llama-4-scout": {
@@ -9872,7 +9756,7 @@ export const MODELS = {
9872
9756
  cacheRead: 0,
9873
9757
  cacheWrite: 0,
9874
9758
  },
9875
- contextWindow: 327680,
9759
+ contextWindow: 10000000,
9876
9760
  maxTokens: 16384,
9877
9761
  },
9878
9762
  "minimax/minimax-m1": {
@@ -9906,7 +9790,7 @@ export const MODELS = {
9906
9790
  cacheRead: 0.03,
9907
9791
  cacheWrite: 0,
9908
9792
  },
9909
- contextWindow: 196608,
9793
+ contextWindow: 204800,
9910
9794
  maxTokens: 196608,
9911
9795
  },
9912
9796
  "minimax/minimax-m2.1": {
@@ -9923,7 +9807,7 @@ export const MODELS = {
9923
9807
  cacheRead: 0.03,
9924
9808
  cacheWrite: 0,
9925
9809
  },
9926
- contextWindow: 196608,
9810
+ contextWindow: 204800,
9927
9811
  maxTokens: 196608,
9928
9812
  },
9929
9813
  "minimax/minimax-m2.5": {
@@ -9937,11 +9821,11 @@ export const MODELS = {
9937
9821
  cost: {
9938
9822
  input: 0.15,
9939
9823
  output: 1.15,
9940
- cacheRead: 0.03,
9824
+ cacheRead: 0,
9941
9825
  cacheWrite: 0,
9942
9826
  },
9943
- contextWindow: 196608,
9944
- maxTokens: 131072,
9827
+ contextWindow: 204800,
9828
+ maxTokens: 196608,
9945
9829
  },
9946
9830
  "minimax/minimax-m2.5:free": {
9947
9831
  id: "minimax/minimax-m2.5:free",
@@ -9957,7 +9841,7 @@ export const MODELS = {
9957
9841
  cacheRead: 0,
9958
9842
  cacheWrite: 0,
9959
9843
  },
9960
- contextWindow: 196608,
9844
+ contextWindow: 204800,
9961
9845
  maxTokens: 8192,
9962
9846
  },
9963
9847
  "minimax/minimax-m2.7": {
@@ -9969,13 +9853,13 @@ export const MODELS = {
9969
9853
  reasoning: true,
9970
9854
  input: ["text"],
9971
9855
  cost: {
9972
- input: 0.3,
9856
+ input: 0.27899999999999997,
9973
9857
  output: 1.2,
9974
- cacheRead: 0.059,
9858
+ cacheRead: 0,
9975
9859
  cacheWrite: 0,
9976
9860
  },
9977
- contextWindow: 196608,
9978
- maxTokens: 4096,
9861
+ contextWindow: 204800,
9862
+ maxTokens: 131072,
9979
9863
  },
9980
9864
  "mistralai/codestral-2508": {
9981
9865
  id: "mistralai/codestral-2508",
@@ -10360,8 +10244,8 @@ export const MODELS = {
10360
10244
  reasoning: false,
10361
10245
  input: ["text"],
10362
10246
  cost: {
10363
- input: 0.39999999999999997,
10364
- output: 2,
10247
+ input: 0.6,
10248
+ output: 2.5,
10365
10249
  cacheRead: 0,
10366
10250
  cacheWrite: 0,
10367
10251
  },
@@ -10379,7 +10263,7 @@ export const MODELS = {
10379
10263
  cost: {
10380
10264
  input: 0.6,
10381
10265
  output: 2.5,
10382
- cacheRead: 0.15,
10266
+ cacheRead: 0,
10383
10267
  cacheWrite: 0,
10384
10268
  },
10385
10269
  contextWindow: 262144,
@@ -10411,13 +10295,13 @@ export const MODELS = {
10411
10295
  reasoning: true,
10412
10296
  input: ["text", "image"],
10413
10297
  cost: {
10414
- input: 0.75,
10415
- output: 3.5,
10416
- cacheRead: 0.15,
10298
+ input: 0.73,
10299
+ output: 3.49,
10300
+ cacheRead: 0.25,
10417
10301
  cacheWrite: 0,
10418
10302
  },
10419
10303
  contextWindow: 262144,
10420
- maxTokens: 16384,
10304
+ maxTokens: 262142,
10421
10305
  },
10422
10306
  "nex-agi/deepseek-v3.1-nex-n1": {
10423
10307
  id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -10518,7 +10402,7 @@ export const MODELS = {
10518
10402
  cacheRead: 0,
10519
10403
  cacheWrite: 0,
10520
10404
  },
10521
- contextWindow: 262144,
10405
+ contextWindow: 1000000,
10522
10406
  maxTokens: 4096,
10523
10407
  },
10524
10408
  "nvidia/nemotron-3-super-120b-a12b:free": {
@@ -10535,7 +10419,7 @@ export const MODELS = {
10535
10419
  cacheRead: 0,
10536
10420
  cacheWrite: 0,
10537
10421
  },
10538
- contextWindow: 262144,
10422
+ contextWindow: 1000000,
10539
10423
  maxTokens: 262144,
10540
10424
  },
10541
10425
  "nvidia/nemotron-nano-12b-v2-vl:free": {
@@ -11686,7 +11570,7 @@ export const MODELS = {
11686
11570
  cacheRead: 0,
11687
11571
  cacheWrite: 0,
11688
11572
  },
11689
- contextWindow: 32768,
11573
+ contextWindow: 131072,
11690
11574
  maxTokens: 16384,
11691
11575
  },
11692
11576
  "qwen/qwen-2.5-7b-instruct": {
@@ -11703,26 +11587,9 @@ export const MODELS = {
11703
11587
  cacheRead: 0,
11704
11588
  cacheWrite: 0,
11705
11589
  },
11706
- contextWindow: 32768,
11590
+ contextWindow: 131072,
11707
11591
  maxTokens: 32768,
11708
11592
  },
11709
- "qwen/qwen-max": {
11710
- id: "qwen/qwen-max",
11711
- name: "Qwen: Qwen-Max ",
11712
- api: "openai-completions",
11713
- provider: "openrouter",
11714
- baseUrl: "https://openrouter.ai/api/v1",
11715
- reasoning: false,
11716
- input: ["text"],
11717
- cost: {
11718
- input: 1.04,
11719
- output: 4.16,
11720
- cacheRead: 0.20800000000000002,
11721
- cacheWrite: 0,
11722
- },
11723
- contextWindow: 32768,
11724
- maxTokens: 8192,
11725
- },
11726
11593
  "qwen/qwen-plus": {
11727
11594
  id: "qwen/qwen-plus",
11728
11595
  name: "Qwen: Qwen-Plus",
@@ -11774,40 +11641,6 @@ export const MODELS = {
11774
11641
  contextWindow: 1000000,
11775
11642
  maxTokens: 32768,
11776
11643
  },
11777
- "qwen/qwen-turbo": {
11778
- id: "qwen/qwen-turbo",
11779
- name: "Qwen: Qwen-Turbo",
11780
- api: "openai-completions",
11781
- provider: "openrouter",
11782
- baseUrl: "https://openrouter.ai/api/v1",
11783
- reasoning: false,
11784
- input: ["text"],
11785
- cost: {
11786
- input: 0.0325,
11787
- output: 0.13,
11788
- cacheRead: 0.006500000000000001,
11789
- cacheWrite: 0,
11790
- },
11791
- contextWindow: 131072,
11792
- maxTokens: 8192,
11793
- },
11794
- "qwen/qwen-vl-max": {
11795
- id: "qwen/qwen-vl-max",
11796
- name: "Qwen: Qwen VL Max",
11797
- api: "openai-completions",
11798
- provider: "openrouter",
11799
- baseUrl: "https://openrouter.ai/api/v1",
11800
- reasoning: false,
11801
- input: ["text", "image"],
11802
- cost: {
11803
- input: 0.52,
11804
- output: 2.08,
11805
- cacheRead: 0,
11806
- cacheWrite: 0,
11807
- },
11808
- contextWindow: 131072,
11809
- maxTokens: 32768,
11810
- },
11811
11644
  "qwen/qwen3-14b": {
11812
11645
  id: "qwen/qwen3-14b",
11813
11646
  name: "Qwen: Qwen3 14B",
@@ -11817,12 +11650,12 @@ export const MODELS = {
11817
11650
  reasoning: true,
11818
11651
  input: ["text"],
11819
11652
  cost: {
11820
- input: 0.06,
11653
+ input: 0.09999999999999999,
11821
11654
  output: 0.24,
11822
11655
  cacheRead: 0,
11823
11656
  cacheWrite: 0,
11824
11657
  },
11825
- contextWindow: 40960,
11658
+ contextWindow: 131702,
11826
11659
  maxTokens: 40960,
11827
11660
  },
11828
11661
  "qwen/qwen3-235b-a22b": {
@@ -11873,7 +11706,7 @@ export const MODELS = {
11873
11706
  cacheRead: 0,
11874
11707
  cacheWrite: 0,
11875
11708
  },
11876
- contextWindow: 131072,
11709
+ contextWindow: 262144,
11877
11710
  maxTokens: 4096,
11878
11711
  },
11879
11712
  "qwen/qwen3-30b-a3b": {
@@ -11890,7 +11723,7 @@ export const MODELS = {
11890
11723
  cacheRead: 0,
11891
11724
  cacheWrite: 0,
11892
11725
  },
11893
- contextWindow: 40960,
11726
+ contextWindow: 131072,
11894
11727
  maxTokens: 20000,
11895
11728
  },
11896
11729
  "qwen/qwen3-30b-a3b-instruct-2507": {
@@ -11937,12 +11770,12 @@ export const MODELS = {
11937
11770
  input: ["text"],
11938
11771
  cost: {
11939
11772
  input: 0.08,
11940
- output: 0.24,
11941
- cacheRead: 0.04,
11773
+ output: 0.28,
11774
+ cacheRead: 0,
11942
11775
  cacheWrite: 0,
11943
11776
  },
11944
- contextWindow: 40960,
11945
- maxTokens: 40960,
11777
+ contextWindow: 131072,
11778
+ maxTokens: 16384,
11946
11779
  },
11947
11780
  "qwen/qwen3-8b": {
11948
11781
  id: "qwen/qwen3-8b",
@@ -11958,7 +11791,7 @@ export const MODELS = {
11958
11791
  cacheRead: 0.049999999999999996,
11959
11792
  cacheWrite: 0,
11960
11793
  },
11961
- contextWindow: 40960,
11794
+ contextWindow: 131072,
11962
11795
  maxTokens: 8192,
11963
11796
  },
11964
11797
  "qwen/qwen3-coder": {
@@ -11975,7 +11808,7 @@ export const MODELS = {
11975
11808
  cacheRead: 0,
11976
11809
  cacheWrite: 0,
11977
11810
  },
11978
- contextWindow: 262144,
11811
+ contextWindow: 1048576,
11979
11812
  maxTokens: 65536,
11980
11813
  },
11981
11814
  "qwen/qwen3-coder-30b-a3b-instruct": {
@@ -12060,7 +11893,7 @@ export const MODELS = {
12060
11893
  cacheRead: 0,
12061
11894
  cacheWrite: 0,
12062
11895
  },
12063
- contextWindow: 262000,
11896
+ contextWindow: 1048576,
12064
11897
  maxTokens: 262000,
12065
11898
  },
12066
11899
  "qwen/qwen3-max": {
@@ -12145,7 +11978,7 @@ export const MODELS = {
12145
11978
  cacheRead: 0,
12146
11979
  cacheWrite: 0,
12147
11980
  },
12148
- contextWindow: 131072,
11981
+ contextWindow: 262144,
12149
11982
  maxTokens: 32768,
12150
11983
  },
12151
11984
  "qwen/qwen3-vl-235b-a22b-instruct": {
@@ -12196,7 +12029,7 @@ export const MODELS = {
12196
12029
  cacheRead: 0,
12197
12030
  cacheWrite: 0,
12198
12031
  },
12199
- contextWindow: 131072,
12032
+ contextWindow: 262144,
12200
12033
  maxTokens: 32768,
12201
12034
  },
12202
12035
  "qwen/qwen3-vl-30b-a3b-thinking": {
@@ -12230,7 +12063,7 @@ export const MODELS = {
12230
12063
  cacheRead: 0,
12231
12064
  cacheWrite: 0,
12232
12065
  },
12233
- contextWindow: 131072,
12066
+ contextWindow: 262144,
12234
12067
  maxTokens: 32768,
12235
12068
  },
12236
12069
  "qwen/qwen3-vl-8b-instruct": {
@@ -12247,7 +12080,7 @@ export const MODELS = {
12247
12080
  cacheRead: 0,
12248
12081
  cacheWrite: 0,
12249
12082
  },
12250
- contextWindow: 131072,
12083
+ contextWindow: 256000,
12251
12084
  maxTokens: 32768,
12252
12085
  },
12253
12086
  "qwen/qwen3-vl-8b-thinking": {
@@ -12264,7 +12097,7 @@ export const MODELS = {
12264
12097
  cacheRead: 0,
12265
12098
  cacheWrite: 0,
12266
12099
  },
12267
- contextWindow: 131072,
12100
+ contextWindow: 256000,
12268
12101
  maxTokens: 32768,
12269
12102
  },
12270
12103
  "qwen/qwen3.5-122b-a10b": {
@@ -12395,8 +12228,8 @@ export const MODELS = {
12395
12228
  reasoning: true,
12396
12229
  input: ["text", "image"],
12397
12230
  cost: {
12398
- input: 0.39999999999999997,
12399
- output: 2.4,
12231
+ input: 0.3,
12232
+ output: 1.7999999999999998,
12400
12233
  cacheRead: 0,
12401
12234
  cacheWrite: 0,
12402
12235
  },
@@ -12446,10 +12279,10 @@ export const MODELS = {
12446
12279
  reasoning: true,
12447
12280
  input: ["text", "image"],
12448
12281
  cost: {
12449
- input: 0.25,
12450
- output: 1.5,
12282
+ input: 0.1875,
12283
+ output: 1.125,
12451
12284
  cacheRead: 0,
12452
- cacheWrite: 0.3125,
12285
+ cacheWrite: 0.234375,
12453
12286
  },
12454
12287
  contextWindow: 1000000,
12455
12288
  maxTokens: 65536,
@@ -12512,270 +12345,134 @@ export const MODELS = {
12512
12345
  provider: "openrouter",
12513
12346
  baseUrl: "https://openrouter.ai/api/v1",
12514
12347
  reasoning: false,
12515
- input: ["text"],
12516
- cost: {
12517
- input: 1,
12518
- output: 3,
12519
- cacheRead: 0,
12520
- cacheWrite: 0,
12521
- },
12522
- contextWindow: 256000,
12523
- maxTokens: 128000,
12524
- },
12525
- "sao10k/l3-euryale-70b": {
12526
- id: "sao10k/l3-euryale-70b",
12527
- name: "Sao10k: Llama 3 Euryale 70B v2.1",
12528
- api: "openai-completions",
12529
- provider: "openrouter",
12530
- baseUrl: "https://openrouter.ai/api/v1",
12531
- reasoning: false,
12532
- input: ["text"],
12533
- cost: {
12534
- input: 1.48,
12535
- output: 1.48,
12536
- cacheRead: 0,
12537
- cacheWrite: 0,
12538
- },
12539
- contextWindow: 8192,
12540
- maxTokens: 8192,
12541
- },
12542
- "sao10k/l3.1-euryale-70b": {
12543
- id: "sao10k/l3.1-euryale-70b",
12544
- name: "Sao10K: Llama 3.1 Euryale 70B v2.2",
12545
- api: "openai-completions",
12546
- provider: "openrouter",
12547
- baseUrl: "https://openrouter.ai/api/v1",
12548
- reasoning: false,
12549
- input: ["text"],
12550
- cost: {
12551
- input: 0.85,
12552
- output: 0.85,
12553
- cacheRead: 0,
12554
- cacheWrite: 0,
12555
- },
12556
- contextWindow: 131072,
12557
- maxTokens: 16384,
12558
- },
12559
- "stepfun/step-3.5-flash": {
12560
- id: "stepfun/step-3.5-flash",
12561
- name: "StepFun: Step 3.5 Flash",
12562
- api: "openai-completions",
12563
- provider: "openrouter",
12564
- baseUrl: "https://openrouter.ai/api/v1",
12565
- reasoning: true,
12566
- input: ["text"],
12567
- cost: {
12568
- input: 0.09999999999999999,
12569
- output: 0.3,
12570
- cacheRead: 0,
12571
- cacheWrite: 0,
12572
- },
12573
- contextWindow: 262144,
12574
- maxTokens: 65536,
12575
- },
12576
- "tencent/hy3-preview:free": {
12577
- id: "tencent/hy3-preview:free",
12578
- name: "Tencent: Hy3 preview (free)",
12579
- api: "openai-completions",
12580
- provider: "openrouter",
12581
- baseUrl: "https://openrouter.ai/api/v1",
12582
- reasoning: true,
12583
- input: ["text"],
12584
- cost: {
12585
- input: 0,
12586
- output: 0,
12587
- cacheRead: 0,
12588
- cacheWrite: 0,
12589
- },
12590
- contextWindow: 262144,
12591
- maxTokens: 262144,
12592
- },
12593
- "thedrummer/rocinante-12b": {
12594
- id: "thedrummer/rocinante-12b",
12595
- name: "TheDrummer: Rocinante 12B",
12596
- api: "openai-completions",
12597
- provider: "openrouter",
12598
- baseUrl: "https://openrouter.ai/api/v1",
12599
- reasoning: false,
12600
- input: ["text"],
12601
- cost: {
12602
- input: 0.16999999999999998,
12603
- output: 0.43,
12604
- cacheRead: 0,
12605
- cacheWrite: 0,
12606
- },
12607
- contextWindow: 32768,
12608
- maxTokens: 32768,
12609
- },
12610
- "thedrummer/unslopnemo-12b": {
12611
- id: "thedrummer/unslopnemo-12b",
12612
- name: "TheDrummer: UnslopNemo 12B",
12613
- api: "openai-completions",
12614
- provider: "openrouter",
12615
- baseUrl: "https://openrouter.ai/api/v1",
12616
- reasoning: false,
12617
- input: ["text"],
12618
- cost: {
12619
- input: 0.39999999999999997,
12620
- output: 0.39999999999999997,
12621
- cacheRead: 0,
12622
- cacheWrite: 0,
12623
- },
12624
- contextWindow: 32768,
12625
- maxTokens: 32768,
12626
- },
12627
- "tngtech/deepseek-r1t2-chimera": {
12628
- id: "tngtech/deepseek-r1t2-chimera",
12629
- name: "TNG: DeepSeek R1T2 Chimera",
12630
- api: "openai-completions",
12631
- provider: "openrouter",
12632
- baseUrl: "https://openrouter.ai/api/v1",
12633
- reasoning: true,
12634
- input: ["text"],
12635
- cost: {
12636
- input: 0.3,
12637
- output: 1.1,
12638
- cacheRead: 0.15,
12639
- cacheWrite: 0,
12640
- },
12641
- contextWindow: 163840,
12642
- maxTokens: 163840,
12643
- },
12644
- "upstage/solar-pro-3": {
12645
- id: "upstage/solar-pro-3",
12646
- name: "Upstage: Solar Pro 3",
12647
- api: "openai-completions",
12648
- provider: "openrouter",
12649
- baseUrl: "https://openrouter.ai/api/v1",
12650
- reasoning: true,
12651
- input: ["text"],
12652
- cost: {
12653
- input: 0.15,
12654
- output: 0.6,
12655
- cacheRead: 0.015,
12348
+ input: ["text"],
12349
+ cost: {
12350
+ input: 1,
12351
+ output: 3,
12352
+ cacheRead: 0,
12656
12353
  cacheWrite: 0,
12657
12354
  },
12658
- contextWindow: 128000,
12659
- maxTokens: 4096,
12355
+ contextWindow: 256000,
12356
+ maxTokens: 128000,
12660
12357
  },
12661
- "x-ai/grok-3": {
12662
- id: "x-ai/grok-3",
12663
- name: "xAI: Grok 3",
12358
+ "sao10k/l3-euryale-70b": {
12359
+ id: "sao10k/l3-euryale-70b",
12360
+ name: "Sao10k: Llama 3 Euryale 70B v2.1",
12664
12361
  api: "openai-completions",
12665
12362
  provider: "openrouter",
12666
12363
  baseUrl: "https://openrouter.ai/api/v1",
12667
12364
  reasoning: false,
12668
12365
  input: ["text"],
12669
12366
  cost: {
12670
- input: 3,
12671
- output: 15,
12672
- cacheRead: 0.75,
12367
+ input: 1.48,
12368
+ output: 1.48,
12369
+ cacheRead: 0,
12673
12370
  cacheWrite: 0,
12674
12371
  },
12675
- contextWindow: 131072,
12676
- maxTokens: 4096,
12372
+ contextWindow: 8192,
12373
+ maxTokens: 8192,
12677
12374
  },
12678
- "x-ai/grok-3-beta": {
12679
- id: "x-ai/grok-3-beta",
12680
- name: "xAI: Grok 3 Beta",
12375
+ "sao10k/l3.1-euryale-70b": {
12376
+ id: "sao10k/l3.1-euryale-70b",
12377
+ name: "Sao10K: Llama 3.1 Euryale 70B v2.2",
12681
12378
  api: "openai-completions",
12682
12379
  provider: "openrouter",
12683
12380
  baseUrl: "https://openrouter.ai/api/v1",
12684
12381
  reasoning: false,
12685
12382
  input: ["text"],
12686
12383
  cost: {
12687
- input: 3,
12688
- output: 15,
12689
- cacheRead: 0.75,
12384
+ input: 0.85,
12385
+ output: 0.85,
12386
+ cacheRead: 0,
12690
12387
  cacheWrite: 0,
12691
12388
  },
12692
12389
  contextWindow: 131072,
12693
- maxTokens: 4096,
12390
+ maxTokens: 16384,
12694
12391
  },
12695
- "x-ai/grok-3-mini": {
12696
- id: "x-ai/grok-3-mini",
12697
- name: "xAI: Grok 3 Mini",
12392
+ "stepfun/step-3.5-flash": {
12393
+ id: "stepfun/step-3.5-flash",
12394
+ name: "StepFun: Step 3.5 Flash",
12698
12395
  api: "openai-completions",
12699
12396
  provider: "openrouter",
12700
12397
  baseUrl: "https://openrouter.ai/api/v1",
12701
12398
  reasoning: true,
12702
12399
  input: ["text"],
12703
12400
  cost: {
12704
- input: 0.3,
12705
- output: 0.5,
12706
- cacheRead: 0.075,
12401
+ input: 0.09999999999999999,
12402
+ output: 0.3,
12403
+ cacheRead: 0,
12707
12404
  cacheWrite: 0,
12708
12405
  },
12709
- contextWindow: 131072,
12710
- maxTokens: 4096,
12406
+ contextWindow: 262144,
12407
+ maxTokens: 65536,
12711
12408
  },
12712
- "x-ai/grok-3-mini-beta": {
12713
- id: "x-ai/grok-3-mini-beta",
12714
- name: "xAI: Grok 3 Mini Beta",
12409
+ "tencent/hy3-preview": {
12410
+ id: "tencent/hy3-preview",
12411
+ name: "Tencent: Hy3 preview",
12715
12412
  api: "openai-completions",
12716
12413
  provider: "openrouter",
12717
12414
  baseUrl: "https://openrouter.ai/api/v1",
12718
12415
  reasoning: true,
12719
12416
  input: ["text"],
12720
12417
  cost: {
12721
- input: 0.3,
12722
- output: 0.5,
12723
- cacheRead: 0.075,
12418
+ input: 0.06599999999999999,
12419
+ output: 0.26,
12420
+ cacheRead: 0.029,
12724
12421
  cacheWrite: 0,
12725
12422
  },
12726
- contextWindow: 131072,
12727
- maxTokens: 4096,
12423
+ contextWindow: 262144,
12424
+ maxTokens: 262144,
12728
12425
  },
12729
- "x-ai/grok-4": {
12730
- id: "x-ai/grok-4",
12731
- name: "xAI: Grok 4",
12426
+ "thedrummer/rocinante-12b": {
12427
+ id: "thedrummer/rocinante-12b",
12428
+ name: "TheDrummer: Rocinante 12B",
12732
12429
  api: "openai-completions",
12733
12430
  provider: "openrouter",
12734
12431
  baseUrl: "https://openrouter.ai/api/v1",
12735
- reasoning: true,
12736
- input: ["text", "image"],
12432
+ reasoning: false,
12433
+ input: ["text"],
12737
12434
  cost: {
12738
- input: 3,
12739
- output: 15,
12740
- cacheRead: 0.75,
12435
+ input: 0.16999999999999998,
12436
+ output: 0.43,
12437
+ cacheRead: 0,
12741
12438
  cacheWrite: 0,
12742
12439
  },
12743
- contextWindow: 256000,
12744
- maxTokens: 4096,
12440
+ contextWindow: 32768,
12441
+ maxTokens: 32768,
12745
12442
  },
12746
- "x-ai/grok-4-fast": {
12747
- id: "x-ai/grok-4-fast",
12748
- name: "xAI: Grok 4 Fast",
12443
+ "thedrummer/unslopnemo-12b": {
12444
+ id: "thedrummer/unslopnemo-12b",
12445
+ name: "TheDrummer: UnslopNemo 12B",
12749
12446
  api: "openai-completions",
12750
12447
  provider: "openrouter",
12751
12448
  baseUrl: "https://openrouter.ai/api/v1",
12752
- reasoning: true,
12753
- input: ["text", "image"],
12449
+ reasoning: false,
12450
+ input: ["text"],
12754
12451
  cost: {
12755
- input: 0.19999999999999998,
12756
- output: 0.5,
12757
- cacheRead: 0.049999999999999996,
12452
+ input: 0.39999999999999997,
12453
+ output: 0.39999999999999997,
12454
+ cacheRead: 0,
12758
12455
  cacheWrite: 0,
12759
12456
  },
12760
- contextWindow: 2000000,
12761
- maxTokens: 30000,
12457
+ contextWindow: 32768,
12458
+ maxTokens: 32768,
12762
12459
  },
12763
- "x-ai/grok-4.1-fast": {
12764
- id: "x-ai/grok-4.1-fast",
12765
- name: "xAI: Grok 4.1 Fast",
12460
+ "upstage/solar-pro-3": {
12461
+ id: "upstage/solar-pro-3",
12462
+ name: "Upstage: Solar Pro 3",
12766
12463
  api: "openai-completions",
12767
12464
  provider: "openrouter",
12768
12465
  baseUrl: "https://openrouter.ai/api/v1",
12769
12466
  reasoning: true,
12770
- input: ["text", "image"],
12467
+ input: ["text"],
12771
12468
  cost: {
12772
- input: 0.19999999999999998,
12773
- output: 0.5,
12774
- cacheRead: 0.049999999999999996,
12469
+ input: 0.15,
12470
+ output: 0.6,
12471
+ cacheRead: 0.015,
12775
12472
  cacheWrite: 0,
12776
12473
  },
12777
- contextWindow: 2000000,
12778
- maxTokens: 30000,
12474
+ contextWindow: 128000,
12475
+ maxTokens: 4096,
12779
12476
  },
12780
12477
  "x-ai/grok-4.20": {
12781
12478
  id: "x-ai/grok-4.20",
@@ -12811,23 +12508,6 @@ export const MODELS = {
12811
12508
  contextWindow: 1000000,
12812
12509
  maxTokens: 4096,
12813
12510
  },
12814
- "x-ai/grok-code-fast-1": {
12815
- id: "x-ai/grok-code-fast-1",
12816
- name: "xAI: Grok Code Fast 1",
12817
- api: "openai-completions",
12818
- provider: "openrouter",
12819
- baseUrl: "https://openrouter.ai/api/v1",
12820
- reasoning: true,
12821
- input: ["text"],
12822
- cost: {
12823
- input: 0.19999999999999998,
12824
- output: 1.5,
12825
- cacheRead: 0.02,
12826
- cacheWrite: 0,
12827
- },
12828
- contextWindow: 256000,
12829
- maxTokens: 10000,
12830
- },
12831
12511
  "xiaomi/mimo-v2-flash": {
12832
12512
  id: "xiaomi/mimo-v2-flash",
12833
12513
  name: "Xiaomi: MiMo-V2-Flash",
@@ -12837,9 +12517,9 @@ export const MODELS = {
12837
12517
  reasoning: true,
12838
12518
  input: ["text"],
12839
12519
  cost: {
12840
- input: 0.09,
12841
- output: 0.29,
12842
- cacheRead: 0.045,
12520
+ input: 0.09999999999999999,
12521
+ output: 0.3,
12522
+ cacheRead: 0.01,
12843
12523
  cacheWrite: 0,
12844
12524
  },
12845
12525
  contextWindow: 262144,
@@ -12911,7 +12591,7 @@ export const MODELS = {
12911
12591
  cacheWrite: 0,
12912
12592
  },
12913
12593
  contextWindow: 1048576,
12914
- maxTokens: 131072,
12594
+ maxTokens: 16384,
12915
12595
  },
12916
12596
  "z-ai/glm-4-32b": {
12917
12597
  id: "z-ai/glm-4-32b",
@@ -13007,13 +12687,13 @@ export const MODELS = {
13007
12687
  reasoning: true,
13008
12688
  input: ["text"],
13009
12689
  cost: {
13010
- input: 0.39,
13011
- output: 1.9,
13012
- cacheRead: 0,
12690
+ input: 0.43,
12691
+ output: 1.74,
12692
+ cacheRead: 0.08,
13013
12693
  cacheWrite: 0,
13014
12694
  },
13015
- contextWindow: 204800,
13016
- maxTokens: 204800,
12695
+ contextWindow: 202752,
12696
+ maxTokens: 131072,
13017
12697
  },
13018
12698
  "z-ai/glm-4.6v": {
13019
12699
  id: "z-ai/glm-4.6v",
@@ -13109,13 +12789,13 @@ export const MODELS = {
13109
12789
  reasoning: true,
13110
12790
  input: ["text"],
13111
12791
  cost: {
13112
- input: 1.0499999999999998,
13113
- output: 3.5,
13114
- cacheRead: 0.5249999999999999,
12792
+ input: 0.98,
12793
+ output: 3.08,
12794
+ cacheRead: 0.182,
13115
12795
  cacheWrite: 0,
13116
12796
  },
13117
12797
  contextWindow: 202752,
13118
- maxTokens: 65535,
12798
+ maxTokens: 4096,
13119
12799
  },
13120
12800
  "z-ai/glm-5v-turbo": {
13121
12801
  id: "z-ai/glm-5v-turbo",
@@ -13228,13 +12908,13 @@ export const MODELS = {
13228
12908
  reasoning: true,
13229
12909
  input: ["text", "image"],
13230
12910
  cost: {
13231
- input: 0.75,
13232
- output: 3.5,
13233
- cacheRead: 0.15,
12911
+ input: 0.73,
12912
+ output: 3.49,
12913
+ cacheRead: 0.25,
13234
12914
  cacheWrite: 0,
13235
12915
  },
13236
12916
  contextWindow: 262144,
13237
- maxTokens: 16384,
12917
+ maxTokens: 262142,
13238
12918
  },
13239
12919
  "~openai/gpt-latest": {
13240
12920
  id: "~openai/gpt-latest",
@@ -13934,23 +13614,6 @@ export const MODELS = {
13934
13614
  contextWindow: 200000,
13935
13615
  maxTokens: 8192,
13936
13616
  },
13937
- "anthropic/claude-3.7-sonnet": {
13938
- id: "anthropic/claude-3.7-sonnet",
13939
- name: "Claude 3.7 Sonnet",
13940
- api: "anthropic-messages",
13941
- provider: "vercel-ai-gateway",
13942
- baseUrl: "https://ai-gateway.vercel.sh",
13943
- reasoning: true,
13944
- input: ["text", "image"],
13945
- cost: {
13946
- input: 3,
13947
- output: 15,
13948
- cacheRead: 0.3,
13949
- cacheWrite: 3.75,
13950
- },
13951
- contextWindow: 200000,
13952
- maxTokens: 8192,
13953
- },
13954
13617
  "anthropic/claude-haiku-4.5": {
13955
13618
  id: "anthropic/claude-haiku-4.5",
13956
13619
  name: "Claude Haiku 4.5",
@@ -15633,7 +15296,7 @@ export const MODELS = {
15633
15296
  },
15634
15297
  "openai/gpt-oss-20b": {
15635
15298
  id: "openai/gpt-oss-20b",
15636
- name: "GPT OSS 120B",
15299
+ name: "GPT OSS 20B",
15637
15300
  api: "anthropic-messages",
15638
15301
  provider: "vercel-ai-gateway",
15639
15302
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -15740,185 +15403,66 @@ export const MODELS = {
15740
15403
  provider: "vercel-ai-gateway",
15741
15404
  baseUrl: "https://ai-gateway.vercel.sh",
15742
15405
  reasoning: true,
15743
- input: ["text", "image"],
15744
- cost: {
15745
- input: 20,
15746
- output: 80,
15747
- cacheRead: 0,
15748
- cacheWrite: 0,
15749
- },
15750
- contextWindow: 200000,
15751
- maxTokens: 100000,
15752
- },
15753
- "openai/o4-mini": {
15754
- id: "openai/o4-mini",
15755
- name: "o4-mini",
15756
- api: "anthropic-messages",
15757
- provider: "vercel-ai-gateway",
15758
- baseUrl: "https://ai-gateway.vercel.sh",
15759
- reasoning: true,
15760
- input: ["text", "image"],
15761
- cost: {
15762
- input: 1.1,
15763
- output: 4.4,
15764
- cacheRead: 0.275,
15765
- cacheWrite: 0,
15766
- },
15767
- contextWindow: 200000,
15768
- maxTokens: 100000,
15769
- },
15770
- "perplexity/sonar": {
15771
- id: "perplexity/sonar",
15772
- name: "Sonar",
15773
- api: "anthropic-messages",
15774
- provider: "vercel-ai-gateway",
15775
- baseUrl: "https://ai-gateway.vercel.sh",
15776
- reasoning: false,
15777
- input: ["text", "image"],
15778
- cost: {
15779
- input: 0,
15780
- output: 0,
15781
- cacheRead: 0,
15782
- cacheWrite: 0,
15783
- },
15784
- contextWindow: 127000,
15785
- maxTokens: 8000,
15786
- },
15787
- "perplexity/sonar-pro": {
15788
- id: "perplexity/sonar-pro",
15789
- name: "Sonar Pro",
15790
- api: "anthropic-messages",
15791
- provider: "vercel-ai-gateway",
15792
- baseUrl: "https://ai-gateway.vercel.sh",
15793
- reasoning: false,
15794
- input: ["text", "image"],
15795
- cost: {
15796
- input: 0,
15797
- output: 0,
15798
- cacheRead: 0,
15799
- cacheWrite: 0,
15800
- },
15801
- contextWindow: 200000,
15802
- maxTokens: 8000,
15803
- },
15804
- "xai/grok-3": {
15805
- id: "xai/grok-3",
15806
- name: "Grok 3 Beta",
15807
- api: "anthropic-messages",
15808
- provider: "vercel-ai-gateway",
15809
- baseUrl: "https://ai-gateway.vercel.sh",
15810
- reasoning: false,
15811
- input: ["text"],
15812
- cost: {
15813
- input: 3,
15814
- output: 15,
15815
- cacheRead: 0.75,
15816
- cacheWrite: 0,
15817
- },
15818
- contextWindow: 131072,
15819
- maxTokens: 131072,
15820
- },
15821
- "xai/grok-3-fast": {
15822
- id: "xai/grok-3-fast",
15823
- name: "Grok 3 Fast Beta",
15824
- api: "anthropic-messages",
15825
- provider: "vercel-ai-gateway",
15826
- baseUrl: "https://ai-gateway.vercel.sh",
15827
- reasoning: false,
15828
- input: ["text"],
15829
- cost: {
15830
- input: 5,
15831
- output: 25,
15832
- cacheRead: 1.25,
15833
- cacheWrite: 0,
15834
- },
15835
- contextWindow: 131072,
15836
- maxTokens: 131072,
15837
- },
15838
- "xai/grok-3-mini": {
15839
- id: "xai/grok-3-mini",
15840
- name: "Grok 3 Mini Beta",
15841
- api: "anthropic-messages",
15842
- provider: "vercel-ai-gateway",
15843
- baseUrl: "https://ai-gateway.vercel.sh",
15844
- reasoning: false,
15845
- input: ["text"],
15846
- cost: {
15847
- input: 0.3,
15848
- output: 0.5,
15849
- cacheRead: 0.075,
15850
- cacheWrite: 0,
15851
- },
15852
- contextWindow: 131072,
15853
- maxTokens: 131072,
15854
- },
15855
- "xai/grok-3-mini-fast": {
15856
- id: "xai/grok-3-mini-fast",
15857
- name: "Grok 3 Mini Fast Beta",
15858
- api: "anthropic-messages",
15859
- provider: "vercel-ai-gateway",
15860
- baseUrl: "https://ai-gateway.vercel.sh",
15861
- reasoning: false,
15862
- input: ["text"],
15406
+ input: ["text", "image"],
15863
15407
  cost: {
15864
- input: 0.6,
15865
- output: 4,
15408
+ input: 20,
15409
+ output: 80,
15866
15410
  cacheRead: 0,
15867
15411
  cacheWrite: 0,
15868
15412
  },
15869
- contextWindow: 131072,
15870
- maxTokens: 131072,
15413
+ contextWindow: 200000,
15414
+ maxTokens: 100000,
15871
15415
  },
15872
- "xai/grok-4": {
15873
- id: "xai/grok-4",
15874
- name: "Grok 4",
15416
+ "openai/o4-mini": {
15417
+ id: "openai/o4-mini",
15418
+ name: "o4-mini",
15875
15419
  api: "anthropic-messages",
15876
15420
  provider: "vercel-ai-gateway",
15877
15421
  baseUrl: "https://ai-gateway.vercel.sh",
15878
15422
  reasoning: true,
15879
15423
  input: ["text", "image"],
15880
15424
  cost: {
15881
- input: 3,
15882
- output: 15,
15883
- cacheRead: 0.75,
15425
+ input: 1.1,
15426
+ output: 4.4,
15427
+ cacheRead: 0.275,
15884
15428
  cacheWrite: 0,
15885
15429
  },
15886
- contextWindow: 256000,
15887
- maxTokens: 256000,
15430
+ contextWindow: 200000,
15431
+ maxTokens: 100000,
15888
15432
  },
15889
- "xai/grok-4-fast-non-reasoning": {
15890
- id: "xai/grok-4-fast-non-reasoning",
15891
- name: "Grok 4 Fast Non-Reasoning",
15433
+ "perplexity/sonar": {
15434
+ id: "perplexity/sonar",
15435
+ name: "Sonar",
15892
15436
  api: "anthropic-messages",
15893
15437
  provider: "vercel-ai-gateway",
15894
15438
  baseUrl: "https://ai-gateway.vercel.sh",
15895
15439
  reasoning: false,
15896
15440
  input: ["text", "image"],
15897
15441
  cost: {
15898
- input: 0.19999999999999998,
15899
- output: 0.5,
15900
- cacheRead: 0.049999999999999996,
15442
+ input: 0,
15443
+ output: 0,
15444
+ cacheRead: 0,
15901
15445
  cacheWrite: 0,
15902
15446
  },
15903
- contextWindow: 2000000,
15904
- maxTokens: 256000,
15447
+ contextWindow: 127000,
15448
+ maxTokens: 8000,
15905
15449
  },
15906
- "xai/grok-4-fast-reasoning": {
15907
- id: "xai/grok-4-fast-reasoning",
15908
- name: "Grok 4 Fast Reasoning",
15450
+ "perplexity/sonar-pro": {
15451
+ id: "perplexity/sonar-pro",
15452
+ name: "Sonar Pro",
15909
15453
  api: "anthropic-messages",
15910
15454
  provider: "vercel-ai-gateway",
15911
15455
  baseUrl: "https://ai-gateway.vercel.sh",
15912
- reasoning: true,
15456
+ reasoning: false,
15913
15457
  input: ["text", "image"],
15914
15458
  cost: {
15915
- input: 0.19999999999999998,
15916
- output: 0.5,
15917
- cacheRead: 0.049999999999999996,
15459
+ input: 0,
15460
+ output: 0,
15461
+ cacheRead: 0,
15918
15462
  cacheWrite: 0,
15919
15463
  },
15920
- contextWindow: 2000000,
15921
- maxTokens: 256000,
15464
+ contextWindow: 200000,
15465
+ maxTokens: 8000,
15922
15466
  },
15923
15467
  "xai/grok-4.1-fast-non-reasoning": {
15924
15468
  id: "xai/grok-4.1-fast-non-reasoning",
@@ -15934,8 +15478,8 @@ export const MODELS = {
15934
15478
  cacheRead: 0.049999999999999996,
15935
15479
  cacheWrite: 0,
15936
15480
  },
15937
- contextWindow: 2000000,
15938
- maxTokens: 30000,
15481
+ contextWindow: 1000000,
15482
+ maxTokens: 1000000,
15939
15483
  },
15940
15484
  "xai/grok-4.1-fast-reasoning": {
15941
15485
  id: "xai/grok-4.1-fast-reasoning",
@@ -15951,8 +15495,8 @@ export const MODELS = {
15951
15495
  cacheRead: 0.049999999999999996,
15952
15496
  cacheWrite: 0,
15953
15497
  },
15954
- contextWindow: 2000000,
15955
- maxTokens: 30000,
15498
+ contextWindow: 1000000,
15499
+ maxTokens: 1000000,
15956
15500
  },
15957
15501
  "xai/grok-4.20-multi-agent": {
15958
15502
  id: "xai/grok-4.20-multi-agent",
@@ -16073,23 +15617,6 @@ export const MODELS = {
16073
15617
  contextWindow: 1000000,
16074
15618
  maxTokens: 1000000,
16075
15619
  },
16076
- "xai/grok-code-fast-1": {
16077
- id: "xai/grok-code-fast-1",
16078
- name: "Grok Code Fast 1",
16079
- api: "anthropic-messages",
16080
- provider: "vercel-ai-gateway",
16081
- baseUrl: "https://ai-gateway.vercel.sh",
16082
- reasoning: true,
16083
- input: ["text"],
16084
- cost: {
16085
- input: 0.19999999999999998,
16086
- output: 1.5,
16087
- cacheRead: 0.02,
16088
- cacheWrite: 0,
16089
- },
16090
- contextWindow: 256000,
16091
- maxTokens: 256000,
16092
- },
16093
15620
  "xiaomi/mimo-v2-flash": {
16094
15621
  id: "xiaomi/mimo-v2-flash",
16095
15622
  name: "MiMo V2 Flash",
@@ -16483,227 +16010,6 @@ export const MODELS = {
16483
16010
  contextWindow: 8192,
16484
16011
  maxTokens: 4096,
16485
16012
  },
16486
- "grok-3": {
16487
- id: "grok-3",
16488
- name: "Grok 3",
16489
- api: "openai-completions",
16490
- provider: "xai",
16491
- baseUrl: "https://api.x.ai/v1",
16492
- reasoning: false,
16493
- input: ["text"],
16494
- cost: {
16495
- input: 3,
16496
- output: 15,
16497
- cacheRead: 0.75,
16498
- cacheWrite: 0,
16499
- },
16500
- contextWindow: 131072,
16501
- maxTokens: 8192,
16502
- },
16503
- "grok-3-fast": {
16504
- id: "grok-3-fast",
16505
- name: "Grok 3 Fast",
16506
- api: "openai-completions",
16507
- provider: "xai",
16508
- baseUrl: "https://api.x.ai/v1",
16509
- reasoning: false,
16510
- input: ["text"],
16511
- cost: {
16512
- input: 5,
16513
- output: 25,
16514
- cacheRead: 1.25,
16515
- cacheWrite: 0,
16516
- },
16517
- contextWindow: 131072,
16518
- maxTokens: 8192,
16519
- },
16520
- "grok-3-fast-latest": {
16521
- id: "grok-3-fast-latest",
16522
- name: "Grok 3 Fast Latest",
16523
- api: "openai-completions",
16524
- provider: "xai",
16525
- baseUrl: "https://api.x.ai/v1",
16526
- reasoning: false,
16527
- input: ["text"],
16528
- cost: {
16529
- input: 5,
16530
- output: 25,
16531
- cacheRead: 1.25,
16532
- cacheWrite: 0,
16533
- },
16534
- contextWindow: 131072,
16535
- maxTokens: 8192,
16536
- },
16537
- "grok-3-latest": {
16538
- id: "grok-3-latest",
16539
- name: "Grok 3 Latest",
16540
- api: "openai-completions",
16541
- provider: "xai",
16542
- baseUrl: "https://api.x.ai/v1",
16543
- reasoning: false,
16544
- input: ["text"],
16545
- cost: {
16546
- input: 3,
16547
- output: 15,
16548
- cacheRead: 0.75,
16549
- cacheWrite: 0,
16550
- },
16551
- contextWindow: 131072,
16552
- maxTokens: 8192,
16553
- },
16554
- "grok-3-mini": {
16555
- id: "grok-3-mini",
16556
- name: "Grok 3 Mini",
16557
- api: "openai-completions",
16558
- provider: "xai",
16559
- baseUrl: "https://api.x.ai/v1",
16560
- reasoning: true,
16561
- input: ["text"],
16562
- cost: {
16563
- input: 0.3,
16564
- output: 0.5,
16565
- cacheRead: 0.075,
16566
- cacheWrite: 0,
16567
- },
16568
- contextWindow: 131072,
16569
- maxTokens: 8192,
16570
- },
16571
- "grok-3-mini-fast": {
16572
- id: "grok-3-mini-fast",
16573
- name: "Grok 3 Mini Fast",
16574
- api: "openai-completions",
16575
- provider: "xai",
16576
- baseUrl: "https://api.x.ai/v1",
16577
- reasoning: true,
16578
- input: ["text"],
16579
- cost: {
16580
- input: 0.6,
16581
- output: 4,
16582
- cacheRead: 0.15,
16583
- cacheWrite: 0,
16584
- },
16585
- contextWindow: 131072,
16586
- maxTokens: 8192,
16587
- },
16588
- "grok-3-mini-fast-latest": {
16589
- id: "grok-3-mini-fast-latest",
16590
- name: "Grok 3 Mini Fast Latest",
16591
- api: "openai-completions",
16592
- provider: "xai",
16593
- baseUrl: "https://api.x.ai/v1",
16594
- reasoning: true,
16595
- input: ["text"],
16596
- cost: {
16597
- input: 0.6,
16598
- output: 4,
16599
- cacheRead: 0.15,
16600
- cacheWrite: 0,
16601
- },
16602
- contextWindow: 131072,
16603
- maxTokens: 8192,
16604
- },
16605
- "grok-3-mini-latest": {
16606
- id: "grok-3-mini-latest",
16607
- name: "Grok 3 Mini Latest",
16608
- api: "openai-completions",
16609
- provider: "xai",
16610
- baseUrl: "https://api.x.ai/v1",
16611
- reasoning: true,
16612
- input: ["text"],
16613
- cost: {
16614
- input: 0.3,
16615
- output: 0.5,
16616
- cacheRead: 0.075,
16617
- cacheWrite: 0,
16618
- },
16619
- contextWindow: 131072,
16620
- maxTokens: 8192,
16621
- },
16622
- "grok-4": {
16623
- id: "grok-4",
16624
- name: "Grok 4",
16625
- api: "openai-completions",
16626
- provider: "xai",
16627
- baseUrl: "https://api.x.ai/v1",
16628
- reasoning: true,
16629
- input: ["text"],
16630
- cost: {
16631
- input: 3,
16632
- output: 15,
16633
- cacheRead: 0.75,
16634
- cacheWrite: 0,
16635
- },
16636
- contextWindow: 256000,
16637
- maxTokens: 64000,
16638
- },
16639
- "grok-4-1-fast": {
16640
- id: "grok-4-1-fast",
16641
- name: "Grok 4.1 Fast",
16642
- api: "openai-completions",
16643
- provider: "xai",
16644
- baseUrl: "https://api.x.ai/v1",
16645
- reasoning: true,
16646
- input: ["text", "image"],
16647
- cost: {
16648
- input: 0.2,
16649
- output: 0.5,
16650
- cacheRead: 0.05,
16651
- cacheWrite: 0,
16652
- },
16653
- contextWindow: 2000000,
16654
- maxTokens: 30000,
16655
- },
16656
- "grok-4-1-fast-non-reasoning": {
16657
- id: "grok-4-1-fast-non-reasoning",
16658
- name: "Grok 4.1 Fast (Non-Reasoning)",
16659
- api: "openai-completions",
16660
- provider: "xai",
16661
- baseUrl: "https://api.x.ai/v1",
16662
- reasoning: false,
16663
- input: ["text", "image"],
16664
- cost: {
16665
- input: 0.2,
16666
- output: 0.5,
16667
- cacheRead: 0.05,
16668
- cacheWrite: 0,
16669
- },
16670
- contextWindow: 2000000,
16671
- maxTokens: 30000,
16672
- },
16673
- "grok-4-fast": {
16674
- id: "grok-4-fast",
16675
- name: "Grok 4 Fast",
16676
- api: "openai-completions",
16677
- provider: "xai",
16678
- baseUrl: "https://api.x.ai/v1",
16679
- reasoning: true,
16680
- input: ["text", "image"],
16681
- cost: {
16682
- input: 0.2,
16683
- output: 0.5,
16684
- cacheRead: 0.05,
16685
- cacheWrite: 0,
16686
- },
16687
- contextWindow: 2000000,
16688
- maxTokens: 30000,
16689
- },
16690
- "grok-4-fast-non-reasoning": {
16691
- id: "grok-4-fast-non-reasoning",
16692
- name: "Grok 4 Fast (Non-Reasoning)",
16693
- api: "openai-completions",
16694
- provider: "xai",
16695
- baseUrl: "https://api.x.ai/v1",
16696
- reasoning: false,
16697
- input: ["text", "image"],
16698
- cost: {
16699
- input: 0.2,
16700
- output: 0.5,
16701
- cacheRead: 0.05,
16702
- cacheWrite: 0,
16703
- },
16704
- contextWindow: 2000000,
16705
- maxTokens: 30000,
16706
- },
16707
16013
  "grok-4.20-0309-non-reasoning": {
16708
16014
  id: "grok-4.20-0309-non-reasoning",
16709
16015
  name: "Grok 4.20 (Non-Reasoning)",
@@ -16778,7 +16084,7 @@ export const MODELS = {
16778
16084
  api: "openai-completions",
16779
16085
  provider: "xai",
16780
16086
  baseUrl: "https://api.x.ai/v1",
16781
- reasoning: true,
16087
+ reasoning: false,
16782
16088
  input: ["text"],
16783
16089
  cost: {
16784
16090
  input: 0.2,
@@ -16786,8 +16092,8 @@ export const MODELS = {
16786
16092
  cacheRead: 0.02,
16787
16093
  cacheWrite: 0,
16788
16094
  },
16789
- contextWindow: 256000,
16790
- maxTokens: 10000,
16095
+ contextWindow: 32768,
16096
+ maxTokens: 8192,
16791
16097
  },
16792
16098
  "grok-vision-beta": {
16793
16099
  id: "grok-vision-beta",