@earendil-works/pi-ai 0.74.0 → 0.74.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (63) hide show
  1. package/README.md +76 -6
  2. package/dist/env-api-keys.d.ts.map +1 -1
  3. package/dist/env-api-keys.js +2 -1
  4. package/dist/env-api-keys.js.map +1 -1
  5. package/dist/image-models.d.ts +10 -0
  6. package/dist/image-models.d.ts.map +1 -0
  7. package/dist/image-models.generated.d.ts +440 -0
  8. package/dist/image-models.generated.d.ts.map +1 -0
  9. package/dist/image-models.generated.js +442 -0
  10. package/dist/image-models.generated.js.map +1 -0
  11. package/dist/image-models.js +23 -0
  12. package/dist/image-models.js.map +1 -0
  13. package/dist/images-api-registry.d.ts +14 -0
  14. package/dist/images-api-registry.d.ts.map +1 -0
  15. package/dist/images-api-registry.js +22 -0
  16. package/dist/images-api-registry.js.map +1 -0
  17. package/dist/images.d.ts +4 -0
  18. package/dist/images.d.ts.map +1 -0
  19. package/dist/images.js +14 -0
  20. package/dist/images.js.map +1 -0
  21. package/dist/index.d.ts +4 -0
  22. package/dist/index.d.ts.map +1 -1
  23. package/dist/index.js +4 -0
  24. package/dist/index.js.map +1 -1
  25. package/dist/models.generated.d.ts +2148 -2396
  26. package/dist/models.generated.d.ts.map +1 -1
  27. package/dist/models.generated.js +1124 -1649
  28. package/dist/models.generated.js.map +1 -1
  29. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  30. package/dist/providers/amazon-bedrock.js +7 -16
  31. package/dist/providers/amazon-bedrock.js.map +1 -1
  32. package/dist/providers/anthropic.d.ts.map +1 -1
  33. package/dist/providers/anthropic.js +15 -6
  34. package/dist/providers/anthropic.js.map +1 -1
  35. package/dist/providers/images/openrouter.d.ts +3 -0
  36. package/dist/providers/images/openrouter.d.ts.map +1 -0
  37. package/dist/providers/images/openrouter.js +129 -0
  38. package/dist/providers/images/openrouter.js.map +1 -0
  39. package/dist/providers/images/register-builtins.d.ts +4 -0
  40. package/dist/providers/images/register-builtins.d.ts.map +1 -0
  41. package/dist/providers/images/register-builtins.js +34 -0
  42. package/dist/providers/images/register-builtins.js.map +1 -0
  43. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  44. package/dist/providers/openai-codex-responses.js +49 -3
  45. package/dist/providers/openai-codex-responses.js.map +1 -1
  46. package/dist/providers/openai-completions.d.ts.map +1 -1
  47. package/dist/providers/openai-completions.js +32 -14
  48. package/dist/providers/openai-completions.js.map +1 -1
  49. package/dist/providers/simple-options.d.ts.map +1 -1
  50. package/dist/providers/simple-options.js +1 -1
  51. package/dist/providers/simple-options.js.map +1 -1
  52. package/dist/types.d.ts +86 -3
  53. package/dist/types.d.ts.map +1 -1
  54. package/dist/types.js.map +1 -1
  55. package/dist/utils/node-http-proxy.d.ts +10 -0
  56. package/dist/utils/node-http-proxy.d.ts.map +1 -0
  57. package/dist/utils/node-http-proxy.js +97 -0
  58. package/dist/utils/node-http-proxy.js.map +1 -0
  59. package/dist/utils/overflow.d.ts +2 -1
  60. package/dist/utils/overflow.d.ts.map +1 -1
  61. package/dist/utils/overflow.js +6 -1
  62. package/dist/utils/overflow.js.map +1 -1
  63. package/package.json +6 -7
@@ -53,23 +53,6 @@ export const MODELS = {
53
53
  contextWindow: 128000,
54
54
  maxTokens: 8192,
55
55
  },
56
- "amazon.nova-premier-v1:0": {
57
- id: "amazon.nova-premier-v1:0",
58
- name: "Nova Premier",
59
- api: "bedrock-converse-stream",
60
- provider: "amazon-bedrock",
61
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
62
- reasoning: true,
63
- input: ["text", "image"],
64
- cost: {
65
- input: 2.5,
66
- output: 12.5,
67
- cacheRead: 0,
68
- cacheWrite: 0,
69
- },
70
- contextWindow: 1000000,
71
- maxTokens: 16384,
72
- },
73
56
  "amazon.nova-pro-v1:0": {
74
57
  id: "amazon.nova-pro-v1:0",
75
58
  name: "Nova Pro",
@@ -87,91 +70,6 @@ export const MODELS = {
87
70
  contextWindow: 300000,
88
71
  maxTokens: 8192,
89
72
  },
90
- "anthropic.claude-3-5-haiku-20241022-v1:0": {
91
- id: "anthropic.claude-3-5-haiku-20241022-v1:0",
92
- name: "Claude Haiku 3.5",
93
- api: "bedrock-converse-stream",
94
- provider: "amazon-bedrock",
95
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
96
- reasoning: false,
97
- input: ["text", "image"],
98
- cost: {
99
- input: 0.8,
100
- output: 4,
101
- cacheRead: 0.08,
102
- cacheWrite: 1,
103
- },
104
- contextWindow: 200000,
105
- maxTokens: 8192,
106
- },
107
- "anthropic.claude-3-5-sonnet-20240620-v1:0": {
108
- id: "anthropic.claude-3-5-sonnet-20240620-v1:0",
109
- name: "Claude Sonnet 3.5",
110
- api: "bedrock-converse-stream",
111
- provider: "amazon-bedrock",
112
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
113
- reasoning: false,
114
- input: ["text", "image"],
115
- cost: {
116
- input: 3,
117
- output: 15,
118
- cacheRead: 0.3,
119
- cacheWrite: 3.75,
120
- },
121
- contextWindow: 200000,
122
- maxTokens: 8192,
123
- },
124
- "anthropic.claude-3-5-sonnet-20241022-v2:0": {
125
- id: "anthropic.claude-3-5-sonnet-20241022-v2:0",
126
- name: "Claude Sonnet 3.5 v2",
127
- api: "bedrock-converse-stream",
128
- provider: "amazon-bedrock",
129
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
130
- reasoning: false,
131
- input: ["text", "image"],
132
- cost: {
133
- input: 3,
134
- output: 15,
135
- cacheRead: 0.3,
136
- cacheWrite: 3.75,
137
- },
138
- contextWindow: 200000,
139
- maxTokens: 8192,
140
- },
141
- "anthropic.claude-3-7-sonnet-20250219-v1:0": {
142
- id: "anthropic.claude-3-7-sonnet-20250219-v1:0",
143
- name: "Claude Sonnet 3.7",
144
- api: "bedrock-converse-stream",
145
- provider: "amazon-bedrock",
146
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
147
- reasoning: false,
148
- input: ["text", "image"],
149
- cost: {
150
- input: 3,
151
- output: 15,
152
- cacheRead: 0.3,
153
- cacheWrite: 3.75,
154
- },
155
- contextWindow: 200000,
156
- maxTokens: 8192,
157
- },
158
- "anthropic.claude-3-haiku-20240307-v1:0": {
159
- id: "anthropic.claude-3-haiku-20240307-v1:0",
160
- name: "Claude Haiku 3",
161
- api: "bedrock-converse-stream",
162
- provider: "amazon-bedrock",
163
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
164
- reasoning: false,
165
- input: ["text", "image"],
166
- cost: {
167
- input: 0.25,
168
- output: 1.25,
169
- cacheRead: 0,
170
- cacheWrite: 0,
171
- },
172
- contextWindow: 200000,
173
- maxTokens: 4096,
174
- },
175
73
  "anthropic.claude-haiku-4-5-20251001-v1:0": {
176
74
  id: "anthropic.claude-haiku-4-5-20251001-v1:0",
177
75
  name: "Claude Haiku 4.5",
@@ -206,23 +104,6 @@ export const MODELS = {
206
104
  contextWindow: 200000,
207
105
  maxTokens: 32000,
208
106
  },
209
- "anthropic.claude-opus-4-20250514-v1:0": {
210
- id: "anthropic.claude-opus-4-20250514-v1:0",
211
- name: "Claude Opus 4",
212
- api: "bedrock-converse-stream",
213
- provider: "amazon-bedrock",
214
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
215
- reasoning: true,
216
- input: ["text", "image"],
217
- cost: {
218
- input: 15,
219
- output: 75,
220
- cacheRead: 1.5,
221
- cacheWrite: 18.75,
222
- },
223
- contextWindow: 200000,
224
- maxTokens: 32000,
225
- },
226
107
  "anthropic.claude-opus-4-5-20251101-v1:0": {
227
108
  id: "anthropic.claude-opus-4-5-20251101-v1:0",
228
109
  name: "Claude Opus 4.5",
@@ -276,9 +157,9 @@ export const MODELS = {
276
157
  contextWindow: 1000000,
277
158
  maxTokens: 128000,
278
159
  },
279
- "anthropic.claude-sonnet-4-20250514-v1:0": {
280
- id: "anthropic.claude-sonnet-4-20250514-v1:0",
281
- name: "Claude Sonnet 4",
160
+ "anthropic.claude-sonnet-4-5-20250929-v1:0": {
161
+ id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
162
+ name: "Claude Sonnet 4.5",
282
163
  api: "bedrock-converse-stream",
283
164
  provider: "amazon-bedrock",
284
165
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -293,9 +174,9 @@ export const MODELS = {
293
174
  contextWindow: 200000,
294
175
  maxTokens: 64000,
295
176
  },
296
- "anthropic.claude-sonnet-4-5-20250929-v1:0": {
297
- id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
298
- name: "Claude Sonnet 4.5",
177
+ "anthropic.claude-sonnet-4-6": {
178
+ id: "anthropic.claude-sonnet-4-6",
179
+ name: "Claude Sonnet 4.6",
299
180
  api: "bedrock-converse-stream",
300
181
  provider: "amazon-bedrock",
301
182
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -307,24 +188,24 @@ export const MODELS = {
307
188
  cacheRead: 0.3,
308
189
  cacheWrite: 3.75,
309
190
  },
310
- contextWindow: 200000,
191
+ contextWindow: 1000000,
311
192
  maxTokens: 64000,
312
193
  },
313
- "anthropic.claude-sonnet-4-6": {
314
- id: "anthropic.claude-sonnet-4-6",
315
- name: "Claude Sonnet 4.6",
194
+ "au.anthropic.claude-haiku-4-5-20251001-v1:0": {
195
+ id: "au.anthropic.claude-haiku-4-5-20251001-v1:0",
196
+ name: "Claude Haiku 4.5 (AU)",
316
197
  api: "bedrock-converse-stream",
317
198
  provider: "amazon-bedrock",
318
199
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
319
200
  reasoning: true,
320
201
  input: ["text", "image"],
321
202
  cost: {
322
- input: 3,
323
- output: 15,
324
- cacheRead: 0.3,
325
- cacheWrite: 3.75,
203
+ input: 1,
204
+ output: 5,
205
+ cacheRead: 0.1,
206
+ cacheWrite: 1.25,
326
207
  },
327
- contextWindow: 1000000,
208
+ contextWindow: 200000,
328
209
  maxTokens: 64000,
329
210
  },
330
211
  "au.anthropic.claude-opus-4-6-v1": {
@@ -345,6 +226,23 @@ export const MODELS = {
345
226
  contextWindow: 1000000,
346
227
  maxTokens: 128000,
347
228
  },
229
+ "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
230
+ id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
231
+ name: "Claude Sonnet 4.5 (AU)",
232
+ api: "bedrock-converse-stream",
233
+ provider: "amazon-bedrock",
234
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
235
+ reasoning: true,
236
+ input: ["text", "image"],
237
+ cost: {
238
+ input: 3,
239
+ output: 15,
240
+ cacheRead: 0.3,
241
+ cacheWrite: 3.75,
242
+ },
243
+ contextWindow: 200000,
244
+ maxTokens: 64000,
245
+ },
348
246
  "au.anthropic.claude-sonnet-4-6": {
349
247
  id: "au.anthropic.claude-sonnet-4-6",
350
248
  name: "AU Anthropic Claude Sonnet 4.6",
@@ -483,23 +381,6 @@ export const MODELS = {
483
381
  contextWindow: 1000000,
484
382
  maxTokens: 128000,
485
383
  },
486
- "eu.anthropic.claude-sonnet-4-20250514-v1:0": {
487
- id: "eu.anthropic.claude-sonnet-4-20250514-v1:0",
488
- name: "Claude Sonnet 4 (EU)",
489
- api: "bedrock-converse-stream",
490
- provider: "amazon-bedrock",
491
- baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
492
- reasoning: true,
493
- input: ["text", "image"],
494
- cost: {
495
- input: 3,
496
- output: 15,
497
- cacheRead: 0.3,
498
- cacheWrite: 3.75,
499
- },
500
- contextWindow: 200000,
501
- maxTokens: 64000,
502
- },
503
384
  "eu.anthropic.claude-sonnet-4-5-20250929-v1:0": {
504
385
  id: "eu.anthropic.claude-sonnet-4-5-20250929-v1:0",
505
386
  name: "Claude Sonnet 4.5 (EU)",
@@ -604,23 +485,6 @@ export const MODELS = {
604
485
  contextWindow: 1000000,
605
486
  maxTokens: 128000,
606
487
  },
607
- "global.anthropic.claude-sonnet-4-20250514-v1:0": {
608
- id: "global.anthropic.claude-sonnet-4-20250514-v1:0",
609
- name: "Claude Sonnet 4 (Global)",
610
- api: "bedrock-converse-stream",
611
- provider: "amazon-bedrock",
612
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
613
- reasoning: true,
614
- input: ["text", "image"],
615
- cost: {
616
- input: 3,
617
- output: 15,
618
- cacheRead: 0.3,
619
- cacheWrite: 3.75,
620
- },
621
- contextWindow: 200000,
622
- maxTokens: 64000,
623
- },
624
488
  "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
625
489
  id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
626
490
  name: "Claude Sonnet 4.5 (Global)",
@@ -689,22 +553,57 @@ export const MODELS = {
689
553
  contextWindow: 128000,
690
554
  maxTokens: 4096,
691
555
  },
692
- "meta.llama3-1-405b-instruct-v1:0": {
693
- id: "meta.llama3-1-405b-instruct-v1:0",
694
- name: "Llama 3.1 405B Instruct",
556
+ "jp.anthropic.claude-opus-4-7": {
557
+ id: "jp.anthropic.claude-opus-4-7",
558
+ name: "Claude Opus 4.7 (JP)",
695
559
  api: "bedrock-converse-stream",
696
560
  provider: "amazon-bedrock",
697
561
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
698
- reasoning: false,
699
- input: ["text"],
562
+ reasoning: true,
563
+ thinkingLevelMap: { "xhigh": "xhigh" },
564
+ input: ["text", "image"],
700
565
  cost: {
701
- input: 2.4,
702
- output: 2.4,
703
- cacheRead: 0,
704
- cacheWrite: 0,
566
+ input: 5,
567
+ output: 25,
568
+ cacheRead: 0.5,
569
+ cacheWrite: 6.25,
705
570
  },
706
- contextWindow: 128000,
707
- maxTokens: 4096,
571
+ contextWindow: 1000000,
572
+ maxTokens: 128000,
573
+ },
574
+ "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
575
+ id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
576
+ name: "Claude Sonnet 4.5 (JP)",
577
+ api: "bedrock-converse-stream",
578
+ provider: "amazon-bedrock",
579
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
580
+ reasoning: true,
581
+ input: ["text", "image"],
582
+ cost: {
583
+ input: 3,
584
+ output: 15,
585
+ cacheRead: 0.3,
586
+ cacheWrite: 3.75,
587
+ },
588
+ contextWindow: 200000,
589
+ maxTokens: 64000,
590
+ },
591
+ "jp.anthropic.claude-sonnet-4-6": {
592
+ id: "jp.anthropic.claude-sonnet-4-6",
593
+ name: "Claude Sonnet 4.6 (JP)",
594
+ api: "bedrock-converse-stream",
595
+ provider: "amazon-bedrock",
596
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
597
+ reasoning: true,
598
+ input: ["text", "image"],
599
+ cost: {
600
+ input: 3,
601
+ output: 15,
602
+ cacheRead: 0.3,
603
+ cacheWrite: 3.75,
604
+ },
605
+ contextWindow: 1000000,
606
+ maxTokens: 64000,
708
607
  },
709
608
  "meta.llama3-1-70b-instruct-v1:0": {
710
609
  id: "meta.llama3-1-70b-instruct-v1:0",
@@ -740,128 +639,60 @@ export const MODELS = {
740
639
  contextWindow: 128000,
741
640
  maxTokens: 4096,
742
641
  },
743
- "meta.llama3-2-11b-instruct-v1:0": {
744
- id: "meta.llama3-2-11b-instruct-v1:0",
745
- name: "Llama 3.2 11B Instruct",
642
+ "meta.llama3-3-70b-instruct-v1:0": {
643
+ id: "meta.llama3-3-70b-instruct-v1:0",
644
+ name: "Llama 3.3 70B Instruct",
746
645
  api: "bedrock-converse-stream",
747
646
  provider: "amazon-bedrock",
748
647
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
749
648
  reasoning: false,
750
- input: ["text", "image"],
649
+ input: ["text"],
751
650
  cost: {
752
- input: 0.16,
753
- output: 0.16,
651
+ input: 0.72,
652
+ output: 0.72,
754
653
  cacheRead: 0,
755
654
  cacheWrite: 0,
756
655
  },
757
656
  contextWindow: 128000,
758
657
  maxTokens: 4096,
759
658
  },
760
- "meta.llama3-2-1b-instruct-v1:0": {
761
- id: "meta.llama3-2-1b-instruct-v1:0",
762
- name: "Llama 3.2 1B Instruct",
659
+ "meta.llama4-maverick-17b-instruct-v1:0": {
660
+ id: "meta.llama4-maverick-17b-instruct-v1:0",
661
+ name: "Llama 4 Maverick 17B Instruct",
763
662
  api: "bedrock-converse-stream",
764
663
  provider: "amazon-bedrock",
765
664
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
766
665
  reasoning: false,
767
- input: ["text"],
666
+ input: ["text", "image"],
768
667
  cost: {
769
- input: 0.1,
770
- output: 0.1,
668
+ input: 0.24,
669
+ output: 0.97,
771
670
  cacheRead: 0,
772
671
  cacheWrite: 0,
773
672
  },
774
- contextWindow: 131000,
775
- maxTokens: 4096,
673
+ contextWindow: 1000000,
674
+ maxTokens: 16384,
776
675
  },
777
- "meta.llama3-2-3b-instruct-v1:0": {
778
- id: "meta.llama3-2-3b-instruct-v1:0",
779
- name: "Llama 3.2 3B Instruct",
676
+ "meta.llama4-scout-17b-instruct-v1:0": {
677
+ id: "meta.llama4-scout-17b-instruct-v1:0",
678
+ name: "Llama 4 Scout 17B Instruct",
780
679
  api: "bedrock-converse-stream",
781
680
  provider: "amazon-bedrock",
782
681
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
783
682
  reasoning: false,
784
- input: ["text"],
683
+ input: ["text", "image"],
785
684
  cost: {
786
- input: 0.15,
787
- output: 0.15,
685
+ input: 0.17,
686
+ output: 0.66,
788
687
  cacheRead: 0,
789
688
  cacheWrite: 0,
790
689
  },
791
- contextWindow: 131000,
792
- maxTokens: 4096,
690
+ contextWindow: 3500000,
691
+ maxTokens: 16384,
793
692
  },
794
- "meta.llama3-2-90b-instruct-v1:0": {
795
- id: "meta.llama3-2-90b-instruct-v1:0",
796
- name: "Llama 3.2 90B Instruct",
797
- api: "bedrock-converse-stream",
798
- provider: "amazon-bedrock",
799
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
800
- reasoning: false,
801
- input: ["text", "image"],
802
- cost: {
803
- input: 0.72,
804
- output: 0.72,
805
- cacheRead: 0,
806
- cacheWrite: 0,
807
- },
808
- contextWindow: 128000,
809
- maxTokens: 4096,
810
- },
811
- "meta.llama3-3-70b-instruct-v1:0": {
812
- id: "meta.llama3-3-70b-instruct-v1:0",
813
- name: "Llama 3.3 70B Instruct",
814
- api: "bedrock-converse-stream",
815
- provider: "amazon-bedrock",
816
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
817
- reasoning: false,
818
- input: ["text"],
819
- cost: {
820
- input: 0.72,
821
- output: 0.72,
822
- cacheRead: 0,
823
- cacheWrite: 0,
824
- },
825
- contextWindow: 128000,
826
- maxTokens: 4096,
827
- },
828
- "meta.llama4-maverick-17b-instruct-v1:0": {
829
- id: "meta.llama4-maverick-17b-instruct-v1:0",
830
- name: "Llama 4 Maverick 17B Instruct",
831
- api: "bedrock-converse-stream",
832
- provider: "amazon-bedrock",
833
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
834
- reasoning: false,
835
- input: ["text", "image"],
836
- cost: {
837
- input: 0.24,
838
- output: 0.97,
839
- cacheRead: 0,
840
- cacheWrite: 0,
841
- },
842
- contextWindow: 1000000,
843
- maxTokens: 16384,
844
- },
845
- "meta.llama4-scout-17b-instruct-v1:0": {
846
- id: "meta.llama4-scout-17b-instruct-v1:0",
847
- name: "Llama 4 Scout 17B Instruct",
848
- api: "bedrock-converse-stream",
849
- provider: "amazon-bedrock",
850
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
851
- reasoning: false,
852
- input: ["text", "image"],
853
- cost: {
854
- input: 0.17,
855
- output: 0.66,
856
- cacheRead: 0,
857
- cacheWrite: 0,
858
- },
859
- contextWindow: 3500000,
860
- maxTokens: 16384,
861
- },
862
- "minimax.minimax-m2": {
863
- id: "minimax.minimax-m2",
864
- name: "MiniMax M2",
693
+ "minimax.minimax-m2": {
694
+ id: "minimax.minimax-m2",
695
+ name: "MiniMax M2",
865
696
  api: "bedrock-converse-stream",
866
697
  provider: "amazon-bedrock",
867
698
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -1077,8 +908,8 @@ export const MODELS = {
1077
908
  cacheRead: 0,
1078
909
  cacheWrite: 0,
1079
910
  },
1080
- contextWindow: 256000,
1081
- maxTokens: 256000,
911
+ contextWindow: 262143,
912
+ maxTokens: 16000,
1082
913
  },
1083
914
  "moonshotai.kimi-k2.5": {
1084
915
  id: "moonshotai.kimi-k2.5",
@@ -1094,8 +925,8 @@ export const MODELS = {
1094
925
  cacheRead: 0,
1095
926
  cacheWrite: 0,
1096
927
  },
1097
- contextWindow: 256000,
1098
- maxTokens: 256000,
928
+ contextWindow: 262143,
929
+ maxTokens: 16000,
1099
930
  },
1100
931
  "nvidia.nemotron-nano-12b-v2": {
1101
932
  id: "nvidia.nemotron-nano-12b-v2",
@@ -1180,7 +1011,7 @@ export const MODELS = {
1180
1011
  cacheWrite: 0,
1181
1012
  },
1182
1013
  contextWindow: 128000,
1183
- maxTokens: 4096,
1014
+ maxTokens: 16384,
1184
1015
  },
1185
1016
  "openai.gpt-oss-20b-1:0": {
1186
1017
  id: "openai.gpt-oss-20b-1:0",
@@ -1197,7 +1028,7 @@ export const MODELS = {
1197
1028
  cacheWrite: 0,
1198
1029
  },
1199
1030
  contextWindow: 128000,
1200
- maxTokens: 4096,
1031
+ maxTokens: 16384,
1201
1032
  },
1202
1033
  "openai.gpt-oss-safeguard-120b": {
1203
1034
  id: "openai.gpt-oss-safeguard-120b",
@@ -1214,7 +1045,7 @@ export const MODELS = {
1214
1045
  cacheWrite: 0,
1215
1046
  },
1216
1047
  contextWindow: 128000,
1217
- maxTokens: 4096,
1048
+ maxTokens: 16384,
1218
1049
  },
1219
1050
  "openai.gpt-oss-safeguard-20b": {
1220
1051
  id: "openai.gpt-oss-safeguard-20b",
@@ -1231,7 +1062,7 @@ export const MODELS = {
1231
1062
  cacheWrite: 0,
1232
1063
  },
1233
1064
  contextWindow: 128000,
1234
- maxTokens: 4096,
1065
+ maxTokens: 16384,
1235
1066
  },
1236
1067
  "qwen.qwen3-235b-a22b-2507-v1:0": {
1237
1068
  id: "qwen.qwen3-235b-a22b-2507-v1:0",
@@ -1386,23 +1217,6 @@ export const MODELS = {
1386
1217
  contextWindow: 200000,
1387
1218
  maxTokens: 32000,
1388
1219
  },
1389
- "us.anthropic.claude-opus-4-20250514-v1:0": {
1390
- id: "us.anthropic.claude-opus-4-20250514-v1:0",
1391
- name: "Claude Opus 4 (US)",
1392
- api: "bedrock-converse-stream",
1393
- provider: "amazon-bedrock",
1394
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1395
- reasoning: true,
1396
- input: ["text", "image"],
1397
- cost: {
1398
- input: 15,
1399
- output: 75,
1400
- cacheRead: 1.5,
1401
- cacheWrite: 18.75,
1402
- },
1403
- contextWindow: 200000,
1404
- maxTokens: 32000,
1405
- },
1406
1220
  "us.anthropic.claude-opus-4-5-20251101-v1:0": {
1407
1221
  id: "us.anthropic.claude-opus-4-5-20251101-v1:0",
1408
1222
  name: "Claude Opus 4.5 (US)",
@@ -1456,9 +1270,9 @@ export const MODELS = {
1456
1270
  contextWindow: 1000000,
1457
1271
  maxTokens: 128000,
1458
1272
  },
1459
- "us.anthropic.claude-sonnet-4-20250514-v1:0": {
1460
- id: "us.anthropic.claude-sonnet-4-20250514-v1:0",
1461
- name: "Claude Sonnet 4 (US)",
1273
+ "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1274
+ id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1275
+ name: "Claude Sonnet 4.5 (US)",
1462
1276
  api: "bedrock-converse-stream",
1463
1277
  provider: "amazon-bedrock",
1464
1278
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -1473,9 +1287,9 @@ export const MODELS = {
1473
1287
  contextWindow: 200000,
1474
1288
  maxTokens: 64000,
1475
1289
  },
1476
- "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1477
- id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1478
- name: "Claude Sonnet 4.5 (US)",
1290
+ "us.anthropic.claude-sonnet-4-6": {
1291
+ id: "us.anthropic.claude-sonnet-4-6",
1292
+ name: "Claude Sonnet 4.6 (US)",
1479
1293
  api: "bedrock-converse-stream",
1480
1294
  provider: "amazon-bedrock",
1481
1295
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -1487,25 +1301,59 @@ export const MODELS = {
1487
1301
  cacheRead: 0.3,
1488
1302
  cacheWrite: 3.75,
1489
1303
  },
1490
- contextWindow: 200000,
1304
+ contextWindow: 1000000,
1491
1305
  maxTokens: 64000,
1492
1306
  },
1493
- "us.anthropic.claude-sonnet-4-6": {
1494
- id: "us.anthropic.claude-sonnet-4-6",
1495
- name: "Claude Sonnet 4.6 (US)",
1307
+ "us.deepseek.r1-v1:0": {
1308
+ id: "us.deepseek.r1-v1:0",
1309
+ name: "DeepSeek-R1 (US)",
1496
1310
  api: "bedrock-converse-stream",
1497
1311
  provider: "amazon-bedrock",
1498
1312
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1499
1313
  reasoning: true,
1314
+ input: ["text"],
1315
+ cost: {
1316
+ input: 1.35,
1317
+ output: 5.4,
1318
+ cacheRead: 0,
1319
+ cacheWrite: 0,
1320
+ },
1321
+ contextWindow: 128000,
1322
+ maxTokens: 32768,
1323
+ },
1324
+ "us.meta.llama4-maverick-17b-instruct-v1:0": {
1325
+ id: "us.meta.llama4-maverick-17b-instruct-v1:0",
1326
+ name: "Llama 4 Maverick 17B Instruct (US)",
1327
+ api: "bedrock-converse-stream",
1328
+ provider: "amazon-bedrock",
1329
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1330
+ reasoning: false,
1500
1331
  input: ["text", "image"],
1501
1332
  cost: {
1502
- input: 3,
1503
- output: 15,
1504
- cacheRead: 0.3,
1505
- cacheWrite: 3.75,
1333
+ input: 0.24,
1334
+ output: 0.97,
1335
+ cacheRead: 0,
1336
+ cacheWrite: 0,
1506
1337
  },
1507
1338
  contextWindow: 1000000,
1508
- maxTokens: 64000,
1339
+ maxTokens: 16384,
1340
+ },
1341
+ "us.meta.llama4-scout-17b-instruct-v1:0": {
1342
+ id: "us.meta.llama4-scout-17b-instruct-v1:0",
1343
+ name: "Llama 4 Scout 17B Instruct (US)",
1344
+ api: "bedrock-converse-stream",
1345
+ provider: "amazon-bedrock",
1346
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1347
+ reasoning: false,
1348
+ input: ["text", "image"],
1349
+ cost: {
1350
+ input: 0.17,
1351
+ output: 0.66,
1352
+ cacheRead: 0,
1353
+ cacheWrite: 0,
1354
+ },
1355
+ contextWindow: 3500000,
1356
+ maxTokens: 16384,
1509
1357
  },
1510
1358
  "writer.palmyra-x4-v1:0": {
1511
1359
  id: "writer.palmyra-x4-v1:0",
@@ -3427,6 +3275,42 @@ export const MODELS = {
3427
3275
  contextWindow: 256000,
3428
3276
  maxTokens: 16384,
3429
3277
  },
3278
+ "@cf/ibm-granite/granite-4.0-h-micro": {
3279
+ id: "@cf/ibm-granite/granite-4.0-h-micro",
3280
+ name: "Granite 4.0 H Micro",
3281
+ api: "openai-completions",
3282
+ provider: "cloudflare-workers-ai",
3283
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3284
+ compat: { "sendSessionAffinityHeaders": true },
3285
+ reasoning: false,
3286
+ input: ["text"],
3287
+ cost: {
3288
+ input: 0.017,
3289
+ output: 0.112,
3290
+ cacheRead: 0,
3291
+ cacheWrite: 0,
3292
+ },
3293
+ contextWindow: 131000,
3294
+ maxTokens: 131000,
3295
+ },
3296
+ "@cf/meta/llama-3.3-70b-instruct-fp8-fast": {
3297
+ id: "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
3298
+ name: "Llama 3.3 70B Instruct fp8 Fast",
3299
+ api: "openai-completions",
3300
+ provider: "cloudflare-workers-ai",
3301
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3302
+ compat: { "sendSessionAffinityHeaders": true },
3303
+ reasoning: false,
3304
+ input: ["text"],
3305
+ cost: {
3306
+ input: 0.293,
3307
+ output: 2.253,
3308
+ cacheRead: 0,
3309
+ cacheWrite: 0,
3310
+ },
3311
+ contextWindow: 24000,
3312
+ maxTokens: 24000,
3313
+ },
3430
3314
  "@cf/meta/llama-4-scout-17b-16e-instruct": {
3431
3315
  id: "@cf/meta/llama-4-scout-17b-16e-instruct",
3432
3316
  name: "Llama 4 Scout 17B 16E Instruct",
@@ -3442,9 +3326,27 @@ export const MODELS = {
3442
3326
  cacheRead: 0,
3443
3327
  cacheWrite: 0,
3444
3328
  },
3445
- contextWindow: 128000,
3329
+ contextWindow: 131000,
3446
3330
  maxTokens: 16384,
3447
3331
  },
3332
+ "@cf/mistralai/mistral-small-3.1-24b-instruct": {
3333
+ id: "@cf/mistralai/mistral-small-3.1-24b-instruct",
3334
+ name: "Mistral Small 3.1 24B Instruct",
3335
+ api: "openai-completions",
3336
+ provider: "cloudflare-workers-ai",
3337
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3338
+ compat: { "sendSessionAffinityHeaders": true },
3339
+ reasoning: false,
3340
+ input: ["text"],
3341
+ cost: {
3342
+ input: 0.351,
3343
+ output: 0.555,
3344
+ cacheRead: 0,
3345
+ cacheWrite: 0,
3346
+ },
3347
+ contextWindow: 128000,
3348
+ maxTokens: 128000,
3349
+ },
3448
3350
  "@cf/moonshotai/kimi-k2.5": {
3449
3351
  id: "@cf/moonshotai/kimi-k2.5",
3450
3352
  name: "Kimi K2.5",
@@ -3478,7 +3380,7 @@ export const MODELS = {
3478
3380
  cacheRead: 0.16,
3479
3381
  cacheWrite: 0,
3480
3382
  },
3481
- contextWindow: 256000,
3383
+ contextWindow: 262144,
3482
3384
  maxTokens: 256000,
3483
3385
  },
3484
3386
  "@cf/nvidia/nemotron-3-120b-a12b": {
@@ -3535,6 +3437,24 @@ export const MODELS = {
3535
3437
  contextWindow: 128000,
3536
3438
  maxTokens: 16384,
3537
3439
  },
3440
+ "@cf/qwen/qwen3-30b-a3b-fp8": {
3441
+ id: "@cf/qwen/qwen3-30b-a3b-fp8",
3442
+ name: "Qwen3 30B A3b fp8",
3443
+ api: "openai-completions",
3444
+ provider: "cloudflare-workers-ai",
3445
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3446
+ compat: { "sendSessionAffinityHeaders": true },
3447
+ reasoning: true,
3448
+ input: ["text"],
3449
+ cost: {
3450
+ input: 0.0509,
3451
+ output: 0.335,
3452
+ cacheRead: 0,
3453
+ cacheWrite: 0,
3454
+ },
3455
+ contextWindow: 32768,
3456
+ maxTokens: 32768,
3457
+ },
3538
3458
  "@cf/zai-org/glm-4.7-flash": {
3539
3459
  id: "@cf/zai-org/glm-4.7-flash",
3540
3460
  name: "GLM-4.7-Flash",
@@ -3545,7 +3465,7 @@ export const MODELS = {
3545
3465
  reasoning: true,
3546
3466
  input: ["text"],
3547
3467
  cost: {
3548
- input: 0.06,
3468
+ input: 0.0605,
3549
3469
  output: 0.4,
3550
3470
  cacheRead: 0,
3551
3471
  cacheWrite: 0,
@@ -3601,6 +3521,7 @@ export const MODELS = {
3601
3521
  api: "anthropic-messages",
3602
3522
  provider: "fireworks",
3603
3523
  baseUrl: "https://api.fireworks.ai/inference",
3524
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3604
3525
  reasoning: true,
3605
3526
  input: ["text"],
3606
3527
  cost: {
@@ -3618,6 +3539,7 @@ export const MODELS = {
3618
3539
  api: "anthropic-messages",
3619
3540
  provider: "fireworks",
3620
3541
  baseUrl: "https://api.fireworks.ai/inference",
3542
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3621
3543
  reasoning: true,
3622
3544
  input: ["text"],
3623
3545
  cost: {
@@ -3629,12 +3551,31 @@ export const MODELS = {
3629
3551
  contextWindow: 160000,
3630
3552
  maxTokens: 160000,
3631
3553
  },
3554
+ "accounts/fireworks/models/deepseek-v4-flash": {
3555
+ id: "accounts/fireworks/models/deepseek-v4-flash",
3556
+ name: "DeepSeek V4 Flash",
3557
+ api: "anthropic-messages",
3558
+ provider: "fireworks",
3559
+ baseUrl: "https://api.fireworks.ai/inference",
3560
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3561
+ reasoning: true,
3562
+ input: ["text"],
3563
+ cost: {
3564
+ input: 0.14,
3565
+ output: 0.28,
3566
+ cacheRead: 0.03,
3567
+ cacheWrite: 0,
3568
+ },
3569
+ contextWindow: 1000000,
3570
+ maxTokens: 384000,
3571
+ },
3632
3572
  "accounts/fireworks/models/deepseek-v4-pro": {
3633
3573
  id: "accounts/fireworks/models/deepseek-v4-pro",
3634
3574
  name: "DeepSeek V4 Pro",
3635
3575
  api: "anthropic-messages",
3636
3576
  provider: "fireworks",
3637
3577
  baseUrl: "https://api.fireworks.ai/inference",
3578
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3638
3579
  reasoning: true,
3639
3580
  input: ["text"],
3640
3581
  cost: {
@@ -3652,6 +3593,7 @@ export const MODELS = {
3652
3593
  api: "anthropic-messages",
3653
3594
  provider: "fireworks",
3654
3595
  baseUrl: "https://api.fireworks.ai/inference",
3596
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3655
3597
  reasoning: true,
3656
3598
  input: ["text"],
3657
3599
  cost: {
@@ -3669,6 +3611,7 @@ export const MODELS = {
3669
3611
  api: "anthropic-messages",
3670
3612
  provider: "fireworks",
3671
3613
  baseUrl: "https://api.fireworks.ai/inference",
3614
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3672
3615
  reasoning: true,
3673
3616
  input: ["text"],
3674
3617
  cost: {
@@ -3686,6 +3629,7 @@ export const MODELS = {
3686
3629
  api: "anthropic-messages",
3687
3630
  provider: "fireworks",
3688
3631
  baseUrl: "https://api.fireworks.ai/inference",
3632
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3689
3633
  reasoning: true,
3690
3634
  input: ["text"],
3691
3635
  cost: {
@@ -3703,6 +3647,7 @@ export const MODELS = {
3703
3647
  api: "anthropic-messages",
3704
3648
  provider: "fireworks",
3705
3649
  baseUrl: "https://api.fireworks.ai/inference",
3650
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3706
3651
  reasoning: true,
3707
3652
  input: ["text"],
3708
3653
  cost: {
@@ -3720,6 +3665,7 @@ export const MODELS = {
3720
3665
  api: "anthropic-messages",
3721
3666
  provider: "fireworks",
3722
3667
  baseUrl: "https://api.fireworks.ai/inference",
3668
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3723
3669
  reasoning: true,
3724
3670
  input: ["text"],
3725
3671
  cost: {
@@ -3737,6 +3683,7 @@ export const MODELS = {
3737
3683
  api: "anthropic-messages",
3738
3684
  provider: "fireworks",
3739
3685
  baseUrl: "https://api.fireworks.ai/inference",
3686
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3740
3687
  reasoning: true,
3741
3688
  input: ["text"],
3742
3689
  cost: {
@@ -3754,6 +3701,7 @@ export const MODELS = {
3754
3701
  api: "anthropic-messages",
3755
3702
  provider: "fireworks",
3756
3703
  baseUrl: "https://api.fireworks.ai/inference",
3704
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3757
3705
  reasoning: true,
3758
3706
  input: ["text"],
3759
3707
  cost: {
@@ -3771,6 +3719,7 @@ export const MODELS = {
3771
3719
  api: "anthropic-messages",
3772
3720
  provider: "fireworks",
3773
3721
  baseUrl: "https://api.fireworks.ai/inference",
3722
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3774
3723
  reasoning: false,
3775
3724
  input: ["text"],
3776
3725
  cost: {
@@ -3788,6 +3737,7 @@ export const MODELS = {
3788
3737
  api: "anthropic-messages",
3789
3738
  provider: "fireworks",
3790
3739
  baseUrl: "https://api.fireworks.ai/inference",
3740
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3791
3741
  reasoning: true,
3792
3742
  input: ["text"],
3793
3743
  cost: {
@@ -3805,6 +3755,7 @@ export const MODELS = {
3805
3755
  api: "anthropic-messages",
3806
3756
  provider: "fireworks",
3807
3757
  baseUrl: "https://api.fireworks.ai/inference",
3758
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3808
3759
  reasoning: true,
3809
3760
  input: ["text", "image"],
3810
3761
  cost: {
@@ -3822,6 +3773,7 @@ export const MODELS = {
3822
3773
  api: "anthropic-messages",
3823
3774
  provider: "fireworks",
3824
3775
  baseUrl: "https://api.fireworks.ai/inference",
3776
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3825
3777
  reasoning: true,
3826
3778
  input: ["text", "image"],
3827
3779
  cost: {
@@ -3839,6 +3791,7 @@ export const MODELS = {
3839
3791
  api: "anthropic-messages",
3840
3792
  provider: "fireworks",
3841
3793
  baseUrl: "https://api.fireworks.ai/inference",
3794
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3842
3795
  reasoning: true,
3843
3796
  input: ["text"],
3844
3797
  cost: {
@@ -3856,6 +3809,7 @@ export const MODELS = {
3856
3809
  api: "anthropic-messages",
3857
3810
  provider: "fireworks",
3858
3811
  baseUrl: "https://api.fireworks.ai/inference",
3812
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3859
3813
  reasoning: true,
3860
3814
  input: ["text"],
3861
3815
  cost: {
@@ -3873,6 +3827,7 @@ export const MODELS = {
3873
3827
  api: "anthropic-messages",
3874
3828
  provider: "fireworks",
3875
3829
  baseUrl: "https://api.fireworks.ai/inference",
3830
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3876
3831
  reasoning: true,
3877
3832
  input: ["text"],
3878
3833
  cost: {
@@ -3890,6 +3845,7 @@ export const MODELS = {
3890
3845
  api: "anthropic-messages",
3891
3846
  provider: "fireworks",
3892
3847
  baseUrl: "https://api.fireworks.ai/inference",
3848
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3893
3849
  reasoning: true,
3894
3850
  input: ["text", "image"],
3895
3851
  cost: {
@@ -3907,6 +3863,7 @@ export const MODELS = {
3907
3863
  api: "anthropic-messages",
3908
3864
  provider: "fireworks",
3909
3865
  baseUrl: "https://api.fireworks.ai/inference",
3866
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3910
3867
  reasoning: true,
3911
3868
  input: ["text", "image"],
3912
3869
  cost: {
@@ -3995,25 +3952,6 @@ export const MODELS = {
3995
3952
  contextWindow: 144000,
3996
3953
  maxTokens: 64000,
3997
3954
  },
3998
- "claude-sonnet-4": {
3999
- id: "claude-sonnet-4",
4000
- name: "Claude Sonnet 4",
4001
- api: "anthropic-messages",
4002
- provider: "github-copilot",
4003
- baseUrl: "https://api.individual.githubcopilot.com",
4004
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4005
- compat: { "supportsEagerToolInputStreaming": false },
4006
- reasoning: true,
4007
- input: ["text", "image"],
4008
- cost: {
4009
- input: 0,
4010
- output: 0,
4011
- cacheRead: 0,
4012
- cacheWrite: 0,
4013
- },
4014
- contextWindow: 216000,
4015
- maxTokens: 16000,
4016
- },
4017
3955
  "claude-sonnet-4.5": {
4018
3956
  id: "claude-sonnet-4.5",
4019
3957
  name: "Claude Sonnet 4.5",
@@ -4089,25 +4027,6 @@ export const MODELS = {
4089
4027
  contextWindow: 128000,
4090
4028
  maxTokens: 64000,
4091
4029
  },
4092
- "gemini-3-pro-preview": {
4093
- id: "gemini-3-pro-preview",
4094
- name: "Gemini 3 Pro Preview",
4095
- api: "openai-completions",
4096
- provider: "github-copilot",
4097
- baseUrl: "https://api.individual.githubcopilot.com",
4098
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4099
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4100
- reasoning: true,
4101
- input: ["text", "image"],
4102
- cost: {
4103
- input: 0,
4104
- output: 0,
4105
- cacheRead: 0,
4106
- cacheWrite: 0,
4107
- },
4108
- contextWindow: 128000,
4109
- maxTokens: 64000,
4110
- },
4111
4030
  "gemini-3.1-pro-preview": {
4112
4031
  id: "gemini-3.1-pro-preview",
4113
4032
  name: "Gemini 3.1 Pro Preview",
@@ -4165,25 +4084,6 @@ export const MODELS = {
4165
4084
  contextWindow: 128000,
4166
4085
  maxTokens: 4096,
4167
4086
  },
4168
- "gpt-5": {
4169
- id: "gpt-5",
4170
- name: "GPT-5",
4171
- api: "openai-responses",
4172
- provider: "github-copilot",
4173
- baseUrl: "https://api.individual.githubcopilot.com",
4174
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4175
- reasoning: true,
4176
- thinkingLevelMap: { "off": null },
4177
- input: ["text", "image"],
4178
- cost: {
4179
- input: 0,
4180
- output: 0,
4181
- cacheRead: 0,
4182
- cacheWrite: 0,
4183
- },
4184
- contextWindow: 128000,
4185
- maxTokens: 128000,
4186
- },
4187
4087
  "gpt-5-mini": {
4188
4088
  id: "gpt-5-mini",
4189
4089
  name: "GPT-5-mini",
@@ -4203,82 +4103,6 @@ export const MODELS = {
4203
4103
  contextWindow: 264000,
4204
4104
  maxTokens: 64000,
4205
4105
  },
4206
- "gpt-5.1": {
4207
- id: "gpt-5.1",
4208
- name: "GPT-5.1",
4209
- api: "openai-responses",
4210
- provider: "github-copilot",
4211
- baseUrl: "https://api.individual.githubcopilot.com",
4212
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4213
- reasoning: true,
4214
- thinkingLevelMap: { "off": null },
4215
- input: ["text", "image"],
4216
- cost: {
4217
- input: 0,
4218
- output: 0,
4219
- cacheRead: 0,
4220
- cacheWrite: 0,
4221
- },
4222
- contextWindow: 264000,
4223
- maxTokens: 64000,
4224
- },
4225
- "gpt-5.1-codex": {
4226
- id: "gpt-5.1-codex",
4227
- name: "GPT-5.1-Codex",
4228
- api: "openai-responses",
4229
- provider: "github-copilot",
4230
- baseUrl: "https://api.individual.githubcopilot.com",
4231
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4232
- reasoning: true,
4233
- thinkingLevelMap: { "off": null },
4234
- input: ["text", "image"],
4235
- cost: {
4236
- input: 0,
4237
- output: 0,
4238
- cacheRead: 0,
4239
- cacheWrite: 0,
4240
- },
4241
- contextWindow: 400000,
4242
- maxTokens: 128000,
4243
- },
4244
- "gpt-5.1-codex-max": {
4245
- id: "gpt-5.1-codex-max",
4246
- name: "GPT-5.1-Codex-max",
4247
- api: "openai-responses",
4248
- provider: "github-copilot",
4249
- baseUrl: "https://api.individual.githubcopilot.com",
4250
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4251
- reasoning: true,
4252
- thinkingLevelMap: { "off": null },
4253
- input: ["text", "image"],
4254
- cost: {
4255
- input: 0,
4256
- output: 0,
4257
- cacheRead: 0,
4258
- cacheWrite: 0,
4259
- },
4260
- contextWindow: 400000,
4261
- maxTokens: 128000,
4262
- },
4263
- "gpt-5.1-codex-mini": {
4264
- id: "gpt-5.1-codex-mini",
4265
- name: "GPT-5.1-Codex-mini",
4266
- api: "openai-responses",
4267
- provider: "github-copilot",
4268
- baseUrl: "https://api.individual.githubcopilot.com",
4269
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4270
- reasoning: true,
4271
- thinkingLevelMap: { "off": null },
4272
- input: ["text", "image"],
4273
- cost: {
4274
- input: 0,
4275
- output: 0,
4276
- cacheRead: 0,
4277
- cacheWrite: 0,
4278
- },
4279
- contextWindow: 400000,
4280
- maxTokens: 128000,
4281
- },
4282
4106
  "gpt-5.2": {
4283
4107
  id: "gpt-5.2",
4284
4108
  name: "GPT-5.2",
@@ -4414,57 +4238,6 @@ export const MODELS = {
4414
4238
  },
4415
4239
  },
4416
4240
  "google": {
4417
- "gemini-1.5-flash": {
4418
- id: "gemini-1.5-flash",
4419
- name: "Gemini 1.5 Flash",
4420
- api: "google-generative-ai",
4421
- provider: "google",
4422
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4423
- reasoning: false,
4424
- input: ["text", "image"],
4425
- cost: {
4426
- input: 0.075,
4427
- output: 0.3,
4428
- cacheRead: 0.01875,
4429
- cacheWrite: 0,
4430
- },
4431
- contextWindow: 1000000,
4432
- maxTokens: 8192,
4433
- },
4434
- "gemini-1.5-flash-8b": {
4435
- id: "gemini-1.5-flash-8b",
4436
- name: "Gemini 1.5 Flash-8B",
4437
- api: "google-generative-ai",
4438
- provider: "google",
4439
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4440
- reasoning: false,
4441
- input: ["text", "image"],
4442
- cost: {
4443
- input: 0.0375,
4444
- output: 0.15,
4445
- cacheRead: 0.01,
4446
- cacheWrite: 0,
4447
- },
4448
- contextWindow: 1000000,
4449
- maxTokens: 8192,
4450
- },
4451
- "gemini-1.5-pro": {
4452
- id: "gemini-1.5-pro",
4453
- name: "Gemini 1.5 Pro",
4454
- api: "google-generative-ai",
4455
- provider: "google",
4456
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4457
- reasoning: false,
4458
- input: ["text", "image"],
4459
- cost: {
4460
- input: 1.25,
4461
- output: 5,
4462
- cacheRead: 0.3125,
4463
- cacheWrite: 0,
4464
- },
4465
- contextWindow: 1000000,
4466
- maxTokens: 8192,
4467
- },
4468
4241
  "gemini-2.0-flash": {
4469
4242
  id: "gemini-2.0-flash",
4470
4243
  name: "Gemini 2.0 Flash",
@@ -4484,7 +4257,7 @@ export const MODELS = {
4484
4257
  },
4485
4258
  "gemini-2.0-flash-lite": {
4486
4259
  id: "gemini-2.0-flash-lite",
4487
- name: "Gemini 2.0 Flash Lite",
4260
+ name: "Gemini 2.0 Flash-Lite",
4488
4261
  api: "google-generative-ai",
4489
4262
  provider: "google",
4490
4263
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4518,7 +4291,7 @@ export const MODELS = {
4518
4291
  },
4519
4292
  "gemini-2.5-flash-lite": {
4520
4293
  id: "gemini-2.5-flash-lite",
4521
- name: "Gemini 2.5 Flash Lite",
4294
+ name: "Gemini 2.5 Flash-Lite",
4522
4295
  api: "google-generative-ai",
4523
4296
  provider: "google",
4524
4297
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4527,331 +4300,197 @@ export const MODELS = {
4527
4300
  cost: {
4528
4301
  input: 0.1,
4529
4302
  output: 0.4,
4530
- cacheRead: 0.025,
4303
+ cacheRead: 0.01,
4531
4304
  cacheWrite: 0,
4532
4305
  },
4533
4306
  contextWindow: 1048576,
4534
4307
  maxTokens: 65536,
4535
4308
  },
4536
- "gemini-2.5-flash-lite-preview-06-17": {
4537
- id: "gemini-2.5-flash-lite-preview-06-17",
4538
- name: "Gemini 2.5 Flash Lite Preview 06-17",
4309
+ "gemini-2.5-pro": {
4310
+ id: "gemini-2.5-pro",
4311
+ name: "Gemini 2.5 Pro",
4539
4312
  api: "google-generative-ai",
4540
4313
  provider: "google",
4541
4314
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4542
4315
  reasoning: true,
4543
4316
  input: ["text", "image"],
4544
4317
  cost: {
4545
- input: 0.1,
4546
- output: 0.4,
4547
- cacheRead: 0.025,
4318
+ input: 1.25,
4319
+ output: 10,
4320
+ cacheRead: 0.125,
4548
4321
  cacheWrite: 0,
4549
4322
  },
4550
4323
  contextWindow: 1048576,
4551
4324
  maxTokens: 65536,
4552
4325
  },
4553
- "gemini-2.5-flash-lite-preview-09-2025": {
4554
- id: "gemini-2.5-flash-lite-preview-09-2025",
4555
- name: "Gemini 2.5 Flash Lite Preview 09-25",
4326
+ "gemini-3-flash-preview": {
4327
+ id: "gemini-3-flash-preview",
4328
+ name: "Gemini 3 Flash Preview",
4556
4329
  api: "google-generative-ai",
4557
4330
  provider: "google",
4558
4331
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4559
4332
  reasoning: true,
4333
+ thinkingLevelMap: { "off": null },
4560
4334
  input: ["text", "image"],
4561
4335
  cost: {
4562
- input: 0.1,
4563
- output: 0.4,
4564
- cacheRead: 0.025,
4336
+ input: 0.5,
4337
+ output: 3,
4338
+ cacheRead: 0.05,
4565
4339
  cacheWrite: 0,
4566
4340
  },
4567
4341
  contextWindow: 1048576,
4568
4342
  maxTokens: 65536,
4569
4343
  },
4570
- "gemini-2.5-flash-preview-04-17": {
4571
- id: "gemini-2.5-flash-preview-04-17",
4572
- name: "Gemini 2.5 Flash Preview 04-17",
4344
+ "gemini-3-pro-preview": {
4345
+ id: "gemini-3-pro-preview",
4346
+ name: "Gemini 3 Pro Preview",
4573
4347
  api: "google-generative-ai",
4574
4348
  provider: "google",
4575
4349
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4576
4350
  reasoning: true,
4351
+ thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4577
4352
  input: ["text", "image"],
4578
4353
  cost: {
4579
- input: 0.15,
4580
- output: 0.6,
4581
- cacheRead: 0.0375,
4354
+ input: 2,
4355
+ output: 12,
4356
+ cacheRead: 0.2,
4582
4357
  cacheWrite: 0,
4583
4358
  },
4584
4359
  contextWindow: 1048576,
4585
4360
  maxTokens: 65536,
4586
4361
  },
4587
- "gemini-2.5-flash-preview-05-20": {
4588
- id: "gemini-2.5-flash-preview-05-20",
4589
- name: "Gemini 2.5 Flash Preview 05-20",
4362
+ "gemini-3.1-flash-lite": {
4363
+ id: "gemini-3.1-flash-lite",
4364
+ name: "Gemini 3.1 Flash Lite",
4590
4365
  api: "google-generative-ai",
4591
4366
  provider: "google",
4592
4367
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4593
4368
  reasoning: true,
4369
+ thinkingLevelMap: { "off": null },
4594
4370
  input: ["text", "image"],
4595
4371
  cost: {
4596
- input: 0.15,
4597
- output: 0.6,
4598
- cacheRead: 0.0375,
4372
+ input: 0.25,
4373
+ output: 1.5,
4374
+ cacheRead: 0.025,
4599
4375
  cacheWrite: 0,
4600
4376
  },
4601
4377
  contextWindow: 1048576,
4602
4378
  maxTokens: 65536,
4603
4379
  },
4604
- "gemini-2.5-flash-preview-09-2025": {
4605
- id: "gemini-2.5-flash-preview-09-2025",
4606
- name: "Gemini 2.5 Flash Preview 09-25",
4380
+ "gemini-3.1-flash-lite-preview": {
4381
+ id: "gemini-3.1-flash-lite-preview",
4382
+ name: "Gemini 3.1 Flash Lite Preview",
4607
4383
  api: "google-generative-ai",
4608
4384
  provider: "google",
4609
4385
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4610
4386
  reasoning: true,
4387
+ thinkingLevelMap: { "off": null },
4611
4388
  input: ["text", "image"],
4612
4389
  cost: {
4613
- input: 0.3,
4614
- output: 2.5,
4615
- cacheRead: 0.075,
4390
+ input: 0.25,
4391
+ output: 1.5,
4392
+ cacheRead: 0.025,
4616
4393
  cacheWrite: 0,
4617
4394
  },
4618
4395
  contextWindow: 1048576,
4619
4396
  maxTokens: 65536,
4620
4397
  },
4621
- "gemini-2.5-pro": {
4622
- id: "gemini-2.5-pro",
4623
- name: "Gemini 2.5 Pro",
4398
+ "gemini-3.1-pro-preview": {
4399
+ id: "gemini-3.1-pro-preview",
4400
+ name: "Gemini 3.1 Pro Preview",
4624
4401
  api: "google-generative-ai",
4625
4402
  provider: "google",
4626
4403
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4627
4404
  reasoning: true,
4405
+ thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4628
4406
  input: ["text", "image"],
4629
4407
  cost: {
4630
- input: 1.25,
4631
- output: 10,
4632
- cacheRead: 0.125,
4408
+ input: 2,
4409
+ output: 12,
4410
+ cacheRead: 0.2,
4633
4411
  cacheWrite: 0,
4634
4412
  },
4635
4413
  contextWindow: 1048576,
4636
4414
  maxTokens: 65536,
4637
4415
  },
4638
- "gemini-2.5-pro-preview-05-06": {
4639
- id: "gemini-2.5-pro-preview-05-06",
4640
- name: "Gemini 2.5 Pro Preview 05-06",
4416
+ "gemini-3.1-pro-preview-customtools": {
4417
+ id: "gemini-3.1-pro-preview-customtools",
4418
+ name: "Gemini 3.1 Pro Preview Custom Tools",
4641
4419
  api: "google-generative-ai",
4642
4420
  provider: "google",
4643
4421
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4644
4422
  reasoning: true,
4423
+ thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4645
4424
  input: ["text", "image"],
4646
4425
  cost: {
4647
- input: 1.25,
4648
- output: 10,
4649
- cacheRead: 0.31,
4426
+ input: 2,
4427
+ output: 12,
4428
+ cacheRead: 0.2,
4650
4429
  cacheWrite: 0,
4651
4430
  },
4652
4431
  contextWindow: 1048576,
4653
4432
  maxTokens: 65536,
4654
4433
  },
4655
- "gemini-2.5-pro-preview-06-05": {
4656
- id: "gemini-2.5-pro-preview-06-05",
4657
- name: "Gemini 2.5 Pro Preview 06-05",
4434
+ "gemini-3.5-flash": {
4435
+ id: "gemini-3.5-flash",
4436
+ name: "Gemini 3.5 Flash",
4658
4437
  api: "google-generative-ai",
4659
4438
  provider: "google",
4660
4439
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4661
4440
  reasoning: true,
4441
+ thinkingLevelMap: { "off": null },
4662
4442
  input: ["text", "image"],
4663
4443
  cost: {
4664
- input: 1.25,
4665
- output: 10,
4666
- cacheRead: 0.31,
4444
+ input: 1.5,
4445
+ output: 9,
4446
+ cacheRead: 0.15,
4667
4447
  cacheWrite: 0,
4668
4448
  },
4669
4449
  contextWindow: 1048576,
4670
4450
  maxTokens: 65536,
4671
4451
  },
4672
- "gemini-3-flash-preview": {
4673
- id: "gemini-3-flash-preview",
4674
- name: "Gemini 3 Flash Preview",
4452
+ "gemini-flash-latest": {
4453
+ id: "gemini-flash-latest",
4454
+ name: "Gemini Flash Latest",
4675
4455
  api: "google-generative-ai",
4676
4456
  provider: "google",
4677
4457
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4678
4458
  reasoning: true,
4679
- thinkingLevelMap: { "off": null },
4680
4459
  input: ["text", "image"],
4681
4460
  cost: {
4682
- input: 0.5,
4683
- output: 3,
4684
- cacheRead: 0.05,
4461
+ input: 0.3,
4462
+ output: 2.5,
4463
+ cacheRead: 0.075,
4685
4464
  cacheWrite: 0,
4686
4465
  },
4687
4466
  contextWindow: 1048576,
4688
4467
  maxTokens: 65536,
4689
4468
  },
4690
- "gemini-3-pro-preview": {
4691
- id: "gemini-3-pro-preview",
4692
- name: "Gemini 3 Pro Preview",
4469
+ "gemini-flash-lite-latest": {
4470
+ id: "gemini-flash-lite-latest",
4471
+ name: "Gemini Flash-Lite Latest",
4693
4472
  api: "google-generative-ai",
4694
4473
  provider: "google",
4695
4474
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4696
4475
  reasoning: true,
4697
- thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4698
4476
  input: ["text", "image"],
4699
4477
  cost: {
4700
- input: 2,
4701
- output: 12,
4702
- cacheRead: 0.2,
4478
+ input: 0.1,
4479
+ output: 0.4,
4480
+ cacheRead: 0.025,
4703
4481
  cacheWrite: 0,
4704
4482
  },
4705
- contextWindow: 1000000,
4706
- maxTokens: 64000,
4483
+ contextWindow: 1048576,
4484
+ maxTokens: 65536,
4707
4485
  },
4708
- "gemini-3.1-flash-lite-preview": {
4709
- id: "gemini-3.1-flash-lite-preview",
4710
- name: "Gemini 3.1 Flash Lite Preview",
4486
+ "gemma-4-26b-a4b-it": {
4487
+ id: "gemma-4-26b-a4b-it",
4488
+ name: "Gemma 4 26B A4B IT",
4711
4489
  api: "google-generative-ai",
4712
4490
  provider: "google",
4713
4491
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4714
4492
  reasoning: true,
4715
- thinkingLevelMap: { "off": null },
4716
- input: ["text", "image"],
4717
- cost: {
4718
- input: 0.25,
4719
- output: 1.5,
4720
- cacheRead: 0.025,
4721
- cacheWrite: 1,
4722
- },
4723
- contextWindow: 1048576,
4724
- maxTokens: 65536,
4725
- },
4726
- "gemini-3.1-pro-preview": {
4727
- id: "gemini-3.1-pro-preview",
4728
- name: "Gemini 3.1 Pro Preview",
4729
- api: "google-generative-ai",
4730
- provider: "google",
4731
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4732
- reasoning: true,
4733
- thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4734
- input: ["text", "image"],
4735
- cost: {
4736
- input: 2,
4737
- output: 12,
4738
- cacheRead: 0.2,
4739
- cacheWrite: 0,
4740
- },
4741
- contextWindow: 1048576,
4742
- maxTokens: 65536,
4743
- },
4744
- "gemini-3.1-pro-preview-customtools": {
4745
- id: "gemini-3.1-pro-preview-customtools",
4746
- name: "Gemini 3.1 Pro Preview Custom Tools",
4747
- api: "google-generative-ai",
4748
- provider: "google",
4749
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4750
- reasoning: true,
4751
- thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4752
- input: ["text", "image"],
4753
- cost: {
4754
- input: 2,
4755
- output: 12,
4756
- cacheRead: 0.2,
4757
- cacheWrite: 0,
4758
- },
4759
- contextWindow: 1048576,
4760
- maxTokens: 65536,
4761
- },
4762
- "gemini-flash-latest": {
4763
- id: "gemini-flash-latest",
4764
- name: "Gemini Flash Latest",
4765
- api: "google-generative-ai",
4766
- provider: "google",
4767
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4768
- reasoning: true,
4769
- input: ["text", "image"],
4770
- cost: {
4771
- input: 0.3,
4772
- output: 2.5,
4773
- cacheRead: 0.075,
4774
- cacheWrite: 0,
4775
- },
4776
- contextWindow: 1048576,
4777
- maxTokens: 65536,
4778
- },
4779
- "gemini-flash-lite-latest": {
4780
- id: "gemini-flash-lite-latest",
4781
- name: "Gemini Flash-Lite Latest",
4782
- api: "google-generative-ai",
4783
- provider: "google",
4784
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4785
- reasoning: true,
4786
- input: ["text", "image"],
4787
- cost: {
4788
- input: 0.1,
4789
- output: 0.4,
4790
- cacheRead: 0.025,
4791
- cacheWrite: 0,
4792
- },
4793
- contextWindow: 1048576,
4794
- maxTokens: 65536,
4795
- },
4796
- "gemini-live-2.5-flash": {
4797
- id: "gemini-live-2.5-flash",
4798
- name: "Gemini Live 2.5 Flash",
4799
- api: "google-generative-ai",
4800
- provider: "google",
4801
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4802
- reasoning: true,
4803
- input: ["text", "image"],
4804
- cost: {
4805
- input: 0.5,
4806
- output: 2,
4807
- cacheRead: 0,
4808
- cacheWrite: 0,
4809
- },
4810
- contextWindow: 128000,
4811
- maxTokens: 8000,
4812
- },
4813
- "gemini-live-2.5-flash-preview-native-audio": {
4814
- id: "gemini-live-2.5-flash-preview-native-audio",
4815
- name: "Gemini Live 2.5 Flash Preview Native Audio",
4816
- api: "google-generative-ai",
4817
- provider: "google",
4818
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4819
- reasoning: true,
4820
- input: ["text"],
4821
- cost: {
4822
- input: 0.5,
4823
- output: 2,
4824
- cacheRead: 0,
4825
- cacheWrite: 0,
4826
- },
4827
- contextWindow: 131072,
4828
- maxTokens: 65536,
4829
- },
4830
- "gemma-3-27b-it": {
4831
- id: "gemma-3-27b-it",
4832
- name: "Gemma 3 27B",
4833
- api: "google-generative-ai",
4834
- provider: "google",
4835
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4836
- reasoning: false,
4837
- input: ["text", "image"],
4838
- cost: {
4839
- input: 0,
4840
- output: 0,
4841
- cacheRead: 0,
4842
- cacheWrite: 0,
4843
- },
4844
- contextWindow: 131072,
4845
- maxTokens: 8192,
4846
- },
4847
- "gemma-4-26b-a4b-it": {
4848
- id: "gemma-4-26b-a4b-it",
4849
- name: "Gemma 4 26B",
4850
- api: "google-generative-ai",
4851
- provider: "google",
4852
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4853
- reasoning: true,
4854
- thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4493
+ thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4855
4494
  input: ["text", "image"],
4856
4495
  cost: {
4857
4496
  input: 0,
@@ -4859,12 +4498,12 @@ export const MODELS = {
4859
4498
  cacheRead: 0,
4860
4499
  cacheWrite: 0,
4861
4500
  },
4862
- contextWindow: 256000,
4863
- maxTokens: 8192,
4501
+ contextWindow: 262144,
4502
+ maxTokens: 32768,
4864
4503
  },
4865
4504
  "gemma-4-31b-it": {
4866
4505
  id: "gemma-4-31b-it",
4867
- name: "Gemma 4 31B",
4506
+ name: "Gemma 4 31B IT",
4868
4507
  api: "google-generative-ai",
4869
4508
  provider: "google",
4870
4509
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4877,8 +4516,8 @@ export const MODELS = {
4877
4516
  cacheRead: 0,
4878
4517
  cacheWrite: 0,
4879
4518
  },
4880
- contextWindow: 256000,
4881
- maxTokens: 8192,
4519
+ contextWindow: 262144,
4520
+ maxTokens: 32768,
4882
4521
  },
4883
4522
  },
4884
4523
  "google-vertex": {
@@ -6945,7 +6584,7 @@ export const MODELS = {
6945
6584
  provider: "openai",
6946
6585
  baseUrl: "https://api.openai.com/v1",
6947
6586
  reasoning: true,
6948
- thinkingLevelMap: { "off": null },
6587
+ thinkingLevelMap: { "off": "none" },
6949
6588
  input: ["text", "image"],
6950
6589
  cost: {
6951
6590
  input: 1.25,
@@ -7035,7 +6674,7 @@ export const MODELS = {
7035
6674
  provider: "openai",
7036
6675
  baseUrl: "https://api.openai.com/v1",
7037
6676
  reasoning: true,
7038
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6677
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7039
6678
  input: ["text", "image"],
7040
6679
  cost: {
7041
6680
  input: 1.75,
@@ -7125,7 +6764,7 @@ export const MODELS = {
7125
6764
  provider: "openai",
7126
6765
  baseUrl: "https://api.openai.com/v1",
7127
6766
  reasoning: true,
7128
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6767
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7129
6768
  input: ["text", "image"],
7130
6769
  cost: {
7131
6770
  input: 1.75,
@@ -7161,7 +6800,7 @@ export const MODELS = {
7161
6800
  provider: "openai",
7162
6801
  baseUrl: "https://api.openai.com/v1",
7163
6802
  reasoning: true,
7164
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6803
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7165
6804
  input: ["text", "image"],
7166
6805
  cost: {
7167
6806
  input: 2.5,
@@ -7179,7 +6818,7 @@ export const MODELS = {
7179
6818
  provider: "openai",
7180
6819
  baseUrl: "https://api.openai.com/v1",
7181
6820
  reasoning: true,
7182
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6821
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7183
6822
  input: ["text", "image"],
7184
6823
  cost: {
7185
6824
  input: 0.75,
@@ -7197,7 +6836,7 @@ export const MODELS = {
7197
6836
  provider: "openai",
7198
6837
  baseUrl: "https://api.openai.com/v1",
7199
6838
  reasoning: true,
7200
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6839
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7201
6840
  input: ["text", "image"],
7202
6841
  cost: {
7203
6842
  input: 0.2,
@@ -7233,7 +6872,7 @@ export const MODELS = {
7233
6872
  provider: "openai",
7234
6873
  baseUrl: "https://api.openai.com/v1",
7235
6874
  reasoning: true,
7236
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6875
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7237
6876
  input: ["text", "image"],
7238
6877
  cost: {
7239
6878
  input: 5,
@@ -7735,6 +7374,25 @@ export const MODELS = {
7735
7374
  contextWindow: 1000000,
7736
7375
  maxTokens: 64000,
7737
7376
  },
7377
+ "deepseek-v4-flash-free": {
7378
+ id: "deepseek-v4-flash-free",
7379
+ name: "DeepSeek V4 Flash Free",
7380
+ api: "openai-completions",
7381
+ provider: "opencode",
7382
+ baseUrl: "https://opencode.ai/zen/v1",
7383
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7384
+ reasoning: true,
7385
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7386
+ input: ["text"],
7387
+ cost: {
7388
+ input: 0,
7389
+ output: 0,
7390
+ cacheRead: 0,
7391
+ cacheWrite: 0,
7392
+ },
7393
+ contextWindow: 200000,
7394
+ maxTokens: 128000,
7395
+ },
7738
7396
  "gemini-3-flash": {
7739
7397
  id: "gemini-3-flash",
7740
7398
  name: "Gemini 3 Flash",
@@ -7771,6 +7429,24 @@ export const MODELS = {
7771
7429
  contextWindow: 1048576,
7772
7430
  maxTokens: 65536,
7773
7431
  },
7432
+ "gemini-3.5-flash": {
7433
+ id: "gemini-3.5-flash",
7434
+ name: "Gemini 3.5 Flash",
7435
+ api: "google-generative-ai",
7436
+ provider: "opencode",
7437
+ baseUrl: "https://opencode.ai/zen/v1",
7438
+ reasoning: true,
7439
+ thinkingLevelMap: { "off": null },
7440
+ input: ["text", "image"],
7441
+ cost: {
7442
+ input: 1.5,
7443
+ output: 9,
7444
+ cacheRead: 0.15,
7445
+ cacheWrite: 0,
7446
+ },
7447
+ contextWindow: 1048576,
7448
+ maxTokens: 65536,
7449
+ },
7774
7450
  "glm-5": {
7775
7451
  id: "glm-5",
7776
7452
  name: "GLM-5",
@@ -8093,22 +7769,22 @@ export const MODELS = {
8093
7769
  contextWindow: 1050000,
8094
7770
  maxTokens: 128000,
8095
7771
  },
8096
- "hy3-preview-free": {
8097
- id: "hy3-preview-free",
8098
- name: "Hy3 preview Free",
7772
+ "grok-build-0.1": {
7773
+ id: "grok-build-0.1",
7774
+ name: "Grok Build 0.1",
8099
7775
  api: "openai-completions",
8100
7776
  provider: "opencode",
8101
7777
  baseUrl: "https://opencode.ai/zen/v1",
8102
7778
  reasoning: true,
8103
- input: ["text"],
7779
+ input: ["text", "image"],
8104
7780
  cost: {
8105
- input: 0,
8106
- output: 0,
8107
- cacheRead: 0,
7781
+ input: 1,
7782
+ output: 2,
7783
+ cacheRead: 0.2,
8108
7784
  cacheWrite: 0,
8109
7785
  },
8110
7786
  contextWindow: 256000,
8111
- maxTokens: 64000,
7787
+ maxTokens: 256000,
8112
7788
  },
8113
7789
  "kimi-k2.5": {
8114
7790
  id: "kimi-k2.5",
@@ -8161,23 +7837,6 @@ export const MODELS = {
8161
7837
  contextWindow: 204800,
8162
7838
  maxTokens: 131072,
8163
7839
  },
8164
- "minimax-m2.5-free": {
8165
- id: "minimax-m2.5-free",
8166
- name: "MiniMax M2.5 Free",
8167
- api: "anthropic-messages",
8168
- provider: "opencode",
8169
- baseUrl: "https://opencode.ai/zen",
8170
- reasoning: true,
8171
- input: ["text"],
8172
- cost: {
8173
- input: 0,
8174
- output: 0,
8175
- cacheRead: 0,
8176
- cacheWrite: 0,
8177
- },
8178
- contextWindow: 204800,
8179
- maxTokens: 131072,
8180
- },
8181
7840
  "minimax-m2.7": {
8182
7841
  id: "minimax-m2.7",
8183
7842
  name: "MiniMax M2.7",
@@ -8246,6 +7905,23 @@ export const MODELS = {
8246
7905
  contextWindow: 262144,
8247
7906
  maxTokens: 65536,
8248
7907
  },
7908
+ "qwen3.6-plus-free": {
7909
+ id: "qwen3.6-plus-free",
7910
+ name: "Qwen3.6 Plus Free",
7911
+ api: "anthropic-messages",
7912
+ provider: "opencode",
7913
+ baseUrl: "https://opencode.ai/zen",
7914
+ reasoning: true,
7915
+ input: ["text", "image"],
7916
+ cost: {
7917
+ input: 0,
7918
+ output: 0,
7919
+ cacheRead: 0,
7920
+ cacheWrite: 0,
7921
+ },
7922
+ contextWindow: 262144,
7923
+ maxTokens: 65536,
7924
+ },
8249
7925
  },
8250
7926
  "opencode-go": {
8251
7927
  "deepseek-v4-flash": {
@@ -8391,9 +8067,9 @@ export const MODELS = {
8391
8067
  "minimax-m2.5": {
8392
8068
  id: "minimax-m2.5",
8393
8069
  name: "MiniMax M2.5",
8394
- api: "openai-completions",
8070
+ api: "anthropic-messages",
8395
8071
  provider: "opencode-go",
8396
- baseUrl: "https://opencode.ai/zen/go/v1",
8072
+ baseUrl: "https://opencode.ai/zen/go",
8397
8073
  reasoning: true,
8398
8074
  input: ["text"],
8399
8075
  cost: {
@@ -8613,40 +8289,6 @@ export const MODELS = {
8613
8289
  contextWindow: 200000,
8614
8290
  maxTokens: 8192,
8615
8291
  },
8616
- "anthropic/claude-3.7-sonnet": {
8617
- id: "anthropic/claude-3.7-sonnet",
8618
- name: "Anthropic: Claude 3.7 Sonnet",
8619
- api: "openai-completions",
8620
- provider: "openrouter",
8621
- baseUrl: "https://openrouter.ai/api/v1",
8622
- reasoning: true,
8623
- input: ["text", "image"],
8624
- cost: {
8625
- input: 3,
8626
- output: 15,
8627
- cacheRead: 0.3,
8628
- cacheWrite: 3.75,
8629
- },
8630
- contextWindow: 200000,
8631
- maxTokens: 64000,
8632
- },
8633
- "anthropic/claude-3.7-sonnet:thinking": {
8634
- id: "anthropic/claude-3.7-sonnet:thinking",
8635
- name: "Anthropic: Claude 3.7 Sonnet (thinking)",
8636
- api: "openai-completions",
8637
- provider: "openrouter",
8638
- baseUrl: "https://openrouter.ai/api/v1",
8639
- reasoning: true,
8640
- input: ["text", "image"],
8641
- cost: {
8642
- input: 3,
8643
- output: 15,
8644
- cacheRead: 0.3,
8645
- cacheWrite: 3.75,
8646
- },
8647
- contextWindow: 200000,
8648
- maxTokens: 64000,
8649
- },
8650
8292
  "anthropic/claude-haiku-4.5": {
8651
8293
  id: "anthropic/claude-haiku-4.5",
8652
8294
  name: "Anthropic: Claude Haiku 4.5",
@@ -8769,19 +8411,37 @@ export const MODELS = {
8769
8411
  contextWindow: 1000000,
8770
8412
  maxTokens: 128000,
8771
8413
  },
8772
- "anthropic/claude-sonnet-4": {
8773
- id: "anthropic/claude-sonnet-4",
8774
- name: "Anthropic: Claude Sonnet 4",
8414
+ "anthropic/claude-opus-4.7-fast": {
8415
+ id: "anthropic/claude-opus-4.7-fast",
8416
+ name: "Anthropic: Claude Opus 4.7 (Fast)",
8775
8417
  api: "openai-completions",
8776
8418
  provider: "openrouter",
8777
8419
  baseUrl: "https://openrouter.ai/api/v1",
8778
8420
  reasoning: true,
8421
+ thinkingLevelMap: { "xhigh": "xhigh" },
8779
8422
  input: ["text", "image"],
8780
8423
  cost: {
8781
- input: 3,
8782
- output: 15,
8783
- cacheRead: 0.3,
8784
- cacheWrite: 3.75,
8424
+ input: 30,
8425
+ output: 150,
8426
+ cacheRead: 3,
8427
+ cacheWrite: 37.5,
8428
+ },
8429
+ contextWindow: 1000000,
8430
+ maxTokens: 128000,
8431
+ },
8432
+ "anthropic/claude-sonnet-4": {
8433
+ id: "anthropic/claude-sonnet-4",
8434
+ name: "Anthropic: Claude Sonnet 4",
8435
+ api: "openai-completions",
8436
+ provider: "openrouter",
8437
+ baseUrl: "https://openrouter.ai/api/v1",
8438
+ reasoning: true,
8439
+ input: ["text", "image"],
8440
+ cost: {
8441
+ input: 3,
8442
+ output: 15,
8443
+ cacheRead: 0.3,
8444
+ cacheWrite: 3.75,
8785
8445
  },
8786
8446
  contextWindow: 1000000,
8787
8447
  maxTokens: 64000,
@@ -8820,39 +8480,39 @@ export const MODELS = {
8820
8480
  contextWindow: 1000000,
8821
8481
  maxTokens: 128000,
8822
8482
  },
8823
- "arcee-ai/trinity-large-preview": {
8824
- id: "arcee-ai/trinity-large-preview",
8825
- name: "Arcee AI: Trinity Large Preview",
8483
+ "arcee-ai/trinity-large-thinking": {
8484
+ id: "arcee-ai/trinity-large-thinking",
8485
+ name: "Arcee AI: Trinity Large Thinking",
8826
8486
  api: "openai-completions",
8827
8487
  provider: "openrouter",
8828
8488
  baseUrl: "https://openrouter.ai/api/v1",
8829
- reasoning: false,
8489
+ reasoning: true,
8830
8490
  input: ["text"],
8831
8491
  cost: {
8832
- input: 0.15,
8833
- output: 0.44999999999999996,
8834
- cacheRead: 0,
8492
+ input: 0.22,
8493
+ output: 0.85,
8494
+ cacheRead: 0.06,
8835
8495
  cacheWrite: 0,
8836
8496
  },
8837
- contextWindow: 131000,
8838
- maxTokens: 4096,
8497
+ contextWindow: 262144,
8498
+ maxTokens: 262144,
8839
8499
  },
8840
- "arcee-ai/trinity-large-thinking": {
8841
- id: "arcee-ai/trinity-large-thinking",
8842
- name: "Arcee AI: Trinity Large Thinking",
8500
+ "arcee-ai/trinity-large-thinking:free": {
8501
+ id: "arcee-ai/trinity-large-thinking:free",
8502
+ name: "Arcee AI: Trinity Large Thinking (free)",
8843
8503
  api: "openai-completions",
8844
8504
  provider: "openrouter",
8845
8505
  baseUrl: "https://openrouter.ai/api/v1",
8846
8506
  reasoning: true,
8847
8507
  input: ["text"],
8848
8508
  cost: {
8849
- input: 0.22,
8850
- output: 0.85,
8851
- cacheRead: 0.06,
8509
+ input: 0,
8510
+ output: 0,
8511
+ cacheRead: 0,
8852
8512
  cacheWrite: 0,
8853
8513
  },
8854
8514
  contextWindow: 262144,
8855
- maxTokens: 262144,
8515
+ maxTokens: 80000,
8856
8516
  },
8857
8517
  "arcee-ai/trinity-mini": {
8858
8518
  id: "arcee-ai/trinity-mini",
@@ -8936,7 +8596,7 @@ export const MODELS = {
8936
8596
  cacheRead: 0,
8937
8597
  cacheWrite: 0,
8938
8598
  },
8939
- contextWindow: 120000,
8599
+ contextWindow: 131072,
8940
8600
  maxTokens: 8000,
8941
8601
  },
8942
8602
  "baidu/ernie-4.5-vl-28b-a3b": {
@@ -8953,7 +8613,7 @@ export const MODELS = {
8953
8613
  cacheRead: 0,
8954
8614
  cacheWrite: 0,
8955
8615
  },
8956
- contextWindow: 30000,
8616
+ contextWindow: 131072,
8957
8617
  maxTokens: 8000,
8958
8618
  },
8959
8619
  "bytedance-seed/seed-1.6": {
@@ -9101,13 +8761,13 @@ export const MODELS = {
9101
8761
  reasoning: true,
9102
8762
  input: ["text"],
9103
8763
  cost: {
9104
- input: 0.15,
9105
- output: 0.75,
9106
- cacheRead: 0,
8764
+ input: 0.21,
8765
+ output: 0.7899999999999999,
8766
+ cacheRead: 0.13,
9107
8767
  cacheWrite: 0,
9108
8768
  },
9109
- contextWindow: 32768,
9110
- maxTokens: 7168,
8769
+ contextWindow: 163840,
8770
+ maxTokens: 32768,
9111
8771
  },
9112
8772
  "deepseek/deepseek-r1": {
9113
8773
  id: "deepseek/deepseek-r1",
@@ -9123,7 +8783,7 @@ export const MODELS = {
9123
8783
  cacheRead: 0,
9124
8784
  cacheWrite: 0,
9125
8785
  },
9126
- contextWindow: 64000,
8786
+ contextWindow: 163840,
9127
8787
  maxTokens: 16000,
9128
8788
  },
9129
8789
  "deepseek/deepseek-r1-0528": {
@@ -9205,9 +8865,28 @@ export const MODELS = {
9205
8865
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
9206
8866
  input: ["text"],
9207
8867
  cost: {
9208
- input: 0.14,
9209
- output: 0.28,
9210
- cacheRead: 0.0028,
8868
+ input: 0.112,
8869
+ output: 0.224,
8870
+ cacheRead: 0.022,
8871
+ cacheWrite: 0,
8872
+ },
8873
+ contextWindow: 1048576,
8874
+ maxTokens: 4096,
8875
+ },
8876
+ "deepseek/deepseek-v4-flash:free": {
8877
+ id: "deepseek/deepseek-v4-flash:free",
8878
+ name: "DeepSeek: DeepSeek V4 Flash (free)",
8879
+ api: "openai-completions",
8880
+ provider: "openrouter",
8881
+ baseUrl: "https://openrouter.ai/api/v1",
8882
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8883
+ reasoning: true,
8884
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8885
+ input: ["text"],
8886
+ cost: {
8887
+ input: 0,
8888
+ output: 0,
8889
+ cacheRead: 0,
9211
8890
  cacheWrite: 0,
9212
8891
  },
9213
8892
  contextWindow: 1048576,
@@ -9263,7 +8942,7 @@ export const MODELS = {
9263
8942
  cacheRead: 0.024999999999999998,
9264
8943
  cacheWrite: 0.08333333333333334,
9265
8944
  },
9266
- contextWindow: 1048576,
8945
+ contextWindow: 1000000,
9267
8946
  maxTokens: 8192,
9268
8947
  },
9269
8948
  "google/gemini-2.0-flash-lite-001": {
@@ -9402,6 +9081,23 @@ export const MODELS = {
9402
9081
  contextWindow: 1048576,
9403
9082
  maxTokens: 65536,
9404
9083
  },
9084
+ "google/gemini-3.1-flash-lite": {
9085
+ id: "google/gemini-3.1-flash-lite",
9086
+ name: "Google: Gemini 3.1 Flash Lite",
9087
+ api: "openai-completions",
9088
+ provider: "openrouter",
9089
+ baseUrl: "https://openrouter.ai/api/v1",
9090
+ reasoning: true,
9091
+ input: ["text", "image"],
9092
+ cost: {
9093
+ input: 0.25,
9094
+ output: 1.5,
9095
+ cacheRead: 0.024999999999999998,
9096
+ cacheWrite: 0.08333333333333334,
9097
+ },
9098
+ contextWindow: 1048576,
9099
+ maxTokens: 65536,
9100
+ },
9405
9101
  "google/gemini-3.1-flash-lite-preview": {
9406
9102
  id: "google/gemini-3.1-flash-lite-preview",
9407
9103
  name: "Google: Gemini 3.1 Flash Lite Preview",
@@ -9450,6 +9146,23 @@ export const MODELS = {
9450
9146
  cacheRead: 0.19999999999999998,
9451
9147
  cacheWrite: 0.375,
9452
9148
  },
9149
+ contextWindow: 1048756,
9150
+ maxTokens: 65536,
9151
+ },
9152
+ "google/gemini-3.5-flash": {
9153
+ id: "google/gemini-3.5-flash",
9154
+ name: "Google: Gemini 3.5 Flash",
9155
+ api: "openai-completions",
9156
+ provider: "openrouter",
9157
+ baseUrl: "https://openrouter.ai/api/v1",
9158
+ reasoning: true,
9159
+ input: ["text", "image"],
9160
+ cost: {
9161
+ input: 1.5,
9162
+ output: 9,
9163
+ cacheRead: 0.15,
9164
+ cacheWrite: 0.08333333333333334,
9165
+ },
9453
9166
  contextWindow: 1048576,
9454
9167
  maxTokens: 65536,
9455
9168
  },
@@ -9530,8 +9243,8 @@ export const MODELS = {
9530
9243
  reasoning: true,
9531
9244
  input: ["text", "image"],
9532
9245
  cost: {
9533
- input: 0.13,
9534
- output: 0.38,
9246
+ input: 0.12,
9247
+ output: 0.37,
9535
9248
  cacheRead: 0,
9536
9249
  cacheWrite: 0,
9537
9250
  },
@@ -9579,6 +9292,7 @@ export const MODELS = {
9579
9292
  provider: "openrouter",
9580
9293
  baseUrl: "https://openrouter.ai/api/v1",
9581
9294
  reasoning: true,
9295
+ thinkingLevelMap: { "off": null },
9582
9296
  input: ["text"],
9583
9297
  cost: {
9584
9298
  input: 0.25,
@@ -9598,9 +9312,9 @@ export const MODELS = {
9598
9312
  reasoning: false,
9599
9313
  input: ["text"],
9600
9314
  cost: {
9601
- input: 0.3,
9602
- output: 2.5,
9603
- cacheRead: 0.06,
9315
+ input: 0.075,
9316
+ output: 0.625,
9317
+ cacheRead: 0.015,
9604
9318
  cacheWrite: 0,
9605
9319
  },
9606
9320
  contextWindow: 262144,
@@ -9615,14 +9329,31 @@ export const MODELS = {
9615
9329
  reasoning: false,
9616
9330
  input: ["text"],
9617
9331
  cost: {
9618
- input: 0.08,
9619
- output: 0.24,
9620
- cacheRead: 0.016,
9332
+ input: 0.01,
9333
+ output: 0.03,
9334
+ cacheRead: 0.002,
9621
9335
  cacheWrite: 0,
9622
9336
  },
9623
9337
  contextWindow: 262144,
9624
9338
  maxTokens: 32768,
9625
9339
  },
9340
+ "inclusionai/ring-2.6-1t": {
9341
+ id: "inclusionai/ring-2.6-1t",
9342
+ name: "inclusionAI: Ring-2.6-1T",
9343
+ api: "openai-completions",
9344
+ provider: "openrouter",
9345
+ baseUrl: "https://openrouter.ai/api/v1",
9346
+ reasoning: true,
9347
+ input: ["text"],
9348
+ cost: {
9349
+ input: 0.075,
9350
+ output: 0.625,
9351
+ cacheRead: 0.015,
9352
+ cacheWrite: 0,
9353
+ },
9354
+ contextWindow: 262144,
9355
+ maxTokens: 65536,
9356
+ },
9626
9357
  "kwaipilot/kat-coder-pro-v2": {
9627
9358
  id: "kwaipilot/kat-coder-pro-v2",
9628
9359
  name: "Kwaipilot: KAT-Coder-Pro V2",
@@ -9671,7 +9402,7 @@ export const MODELS = {
9671
9402
  cacheRead: 0,
9672
9403
  cacheWrite: 0,
9673
9404
  },
9674
- contextWindow: 16384,
9405
+ contextWindow: 131072,
9675
9406
  maxTokens: 16384,
9676
9407
  },
9677
9408
  "meta-llama/llama-3.3-70b-instruct": {
@@ -9705,7 +9436,7 @@ export const MODELS = {
9705
9436
  cacheRead: 0,
9706
9437
  cacheWrite: 0,
9707
9438
  },
9708
- contextWindow: 65536,
9439
+ contextWindow: 131072,
9709
9440
  maxTokens: 4096,
9710
9441
  },
9711
9442
  "meta-llama/llama-4-scout": {
@@ -9722,7 +9453,7 @@ export const MODELS = {
9722
9453
  cacheRead: 0,
9723
9454
  cacheWrite: 0,
9724
9455
  },
9725
- contextWindow: 327680,
9456
+ contextWindow: 10000000,
9726
9457
  maxTokens: 16384,
9727
9458
  },
9728
9459
  "minimax/minimax-m1": {
@@ -9756,7 +9487,7 @@ export const MODELS = {
9756
9487
  cacheRead: 0.03,
9757
9488
  cacheWrite: 0,
9758
9489
  },
9759
- contextWindow: 196608,
9490
+ contextWindow: 204800,
9760
9491
  maxTokens: 196608,
9761
9492
  },
9762
9493
  "minimax/minimax-m2.1": {
@@ -9773,7 +9504,7 @@ export const MODELS = {
9773
9504
  cacheRead: 0.03,
9774
9505
  cacheWrite: 0,
9775
9506
  },
9776
- contextWindow: 196608,
9507
+ contextWindow: 204800,
9777
9508
  maxTokens: 196608,
9778
9509
  },
9779
9510
  "minimax/minimax-m2.5": {
@@ -9787,11 +9518,11 @@ export const MODELS = {
9787
9518
  cost: {
9788
9519
  input: 0.15,
9789
9520
  output: 1.15,
9790
- cacheRead: 0.03,
9521
+ cacheRead: 0,
9791
9522
  cacheWrite: 0,
9792
9523
  },
9793
- contextWindow: 196608,
9794
- maxTokens: 131072,
9524
+ contextWindow: 204800,
9525
+ maxTokens: 196608,
9795
9526
  },
9796
9527
  "minimax/minimax-m2.5:free": {
9797
9528
  id: "minimax/minimax-m2.5:free",
@@ -9807,7 +9538,7 @@ export const MODELS = {
9807
9538
  cacheRead: 0,
9808
9539
  cacheWrite: 0,
9809
9540
  },
9810
- contextWindow: 196608,
9541
+ contextWindow: 204800,
9811
9542
  maxTokens: 8192,
9812
9543
  },
9813
9544
  "minimax/minimax-m2.7": {
@@ -9819,13 +9550,13 @@ export const MODELS = {
9819
9550
  reasoning: true,
9820
9551
  input: ["text"],
9821
9552
  cost: {
9822
- input: 0.3,
9553
+ input: 0.27899999999999997,
9823
9554
  output: 1.2,
9824
- cacheRead: 0.059,
9555
+ cacheRead: 0,
9825
9556
  cacheWrite: 0,
9826
9557
  },
9827
- contextWindow: 196608,
9828
- maxTokens: 4096,
9558
+ contextWindow: 204800,
9559
+ maxTokens: 131072,
9829
9560
  },
9830
9561
  "mistralai/codestral-2508": {
9831
9562
  id: "mistralai/codestral-2508",
@@ -10150,23 +9881,6 @@ export const MODELS = {
10150
9881
  contextWindow: 65536,
10151
9882
  maxTokens: 4096,
10152
9883
  },
10153
- "mistralai/mixtral-8x7b-instruct": {
10154
- id: "mistralai/mixtral-8x7b-instruct",
10155
- name: "Mistral: Mixtral 8x7B Instruct",
10156
- api: "openai-completions",
10157
- provider: "openrouter",
10158
- baseUrl: "https://openrouter.ai/api/v1",
10159
- reasoning: false,
10160
- input: ["text"],
10161
- cost: {
10162
- input: 0.54,
10163
- output: 0.54,
10164
- cacheRead: 0,
10165
- cacheWrite: 0,
10166
- },
10167
- contextWindow: 32768,
10168
- maxTokens: 16384,
10169
- },
10170
9884
  "mistralai/pixtral-large-2411": {
10171
9885
  id: "mistralai/pixtral-large-2411",
10172
9886
  name: "Mistral: Pixtral Large 2411",
@@ -10227,8 +9941,8 @@ export const MODELS = {
10227
9941
  reasoning: false,
10228
9942
  input: ["text"],
10229
9943
  cost: {
10230
- input: 0.39999999999999997,
10231
- output: 2,
9944
+ input: 0.6,
9945
+ output: 2.5,
10232
9946
  cacheRead: 0,
10233
9947
  cacheWrite: 0,
10234
9948
  },
@@ -10246,7 +9960,7 @@ export const MODELS = {
10246
9960
  cost: {
10247
9961
  input: 0.6,
10248
9962
  output: 2.5,
10249
- cacheRead: 0.15,
9963
+ cacheRead: 0,
10250
9964
  cacheWrite: 0,
10251
9965
  },
10252
9966
  contextWindow: 262144,
@@ -10278,13 +9992,13 @@ export const MODELS = {
10278
9992
  reasoning: true,
10279
9993
  input: ["text", "image"],
10280
9994
  cost: {
10281
- input: 0.75,
10282
- output: 3.5,
10283
- cacheRead: 0.15,
9995
+ input: 0.73,
9996
+ output: 3.49,
9997
+ cacheRead: 0.25,
10284
9998
  cacheWrite: 0,
10285
9999
  },
10286
10000
  contextWindow: 262144,
10287
- maxTokens: 16384,
10001
+ maxTokens: 262142,
10288
10002
  },
10289
10003
  "nex-agi/deepseek-v3.1-nex-n1": {
10290
10004
  id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -10303,23 +10017,6 @@ export const MODELS = {
10303
10017
  contextWindow: 131072,
10304
10018
  maxTokens: 163840,
10305
10019
  },
10306
- "nvidia/llama-3.1-nemotron-70b-instruct": {
10307
- id: "nvidia/llama-3.1-nemotron-70b-instruct",
10308
- name: "NVIDIA: Llama 3.1 Nemotron 70B Instruct",
10309
- api: "openai-completions",
10310
- provider: "openrouter",
10311
- baseUrl: "https://openrouter.ai/api/v1",
10312
- reasoning: false,
10313
- input: ["text"],
10314
- cost: {
10315
- input: 1.2,
10316
- output: 1.2,
10317
- cacheRead: 0,
10318
- cacheWrite: 0,
10319
- },
10320
- contextWindow: 131072,
10321
- maxTokens: 16384,
10322
- },
10323
10020
  "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
10324
10021
  id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
10325
10022
  name: "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5",
@@ -10402,7 +10099,7 @@ export const MODELS = {
10402
10099
  cacheRead: 0,
10403
10100
  cacheWrite: 0,
10404
10101
  },
10405
- contextWindow: 262144,
10102
+ contextWindow: 1000000,
10406
10103
  maxTokens: 4096,
10407
10104
  },
10408
10105
  "nvidia/nemotron-3-super-120b-a12b:free": {
@@ -10419,7 +10116,7 @@ export const MODELS = {
10419
10116
  cacheRead: 0,
10420
10117
  cacheWrite: 0,
10421
10118
  },
10422
- contextWindow: 262144,
10119
+ contextWindow: 1000000,
10423
10120
  maxTokens: 262144,
10424
10121
  },
10425
10122
  "nvidia/nemotron-nano-12b-v2-vl:free": {
@@ -11570,7 +11267,7 @@ export const MODELS = {
11570
11267
  cacheRead: 0,
11571
11268
  cacheWrite: 0,
11572
11269
  },
11573
- contextWindow: 32768,
11270
+ contextWindow: 131072,
11574
11271
  maxTokens: 16384,
11575
11272
  },
11576
11273
  "qwen/qwen-2.5-7b-instruct": {
@@ -11587,26 +11284,9 @@ export const MODELS = {
11587
11284
  cacheRead: 0,
11588
11285
  cacheWrite: 0,
11589
11286
  },
11590
- contextWindow: 32768,
11287
+ contextWindow: 131072,
11591
11288
  maxTokens: 32768,
11592
11289
  },
11593
- "qwen/qwen-max": {
11594
- id: "qwen/qwen-max",
11595
- name: "Qwen: Qwen-Max ",
11596
- api: "openai-completions",
11597
- provider: "openrouter",
11598
- baseUrl: "https://openrouter.ai/api/v1",
11599
- reasoning: false,
11600
- input: ["text"],
11601
- cost: {
11602
- input: 1.04,
11603
- output: 4.16,
11604
- cacheRead: 0.20800000000000002,
11605
- cacheWrite: 0,
11606
- },
11607
- contextWindow: 32768,
11608
- maxTokens: 8192,
11609
- },
11610
11290
  "qwen/qwen-plus": {
11611
11291
  id: "qwen/qwen-plus",
11612
11292
  name: "Qwen: Qwen-Plus",
@@ -11658,40 +11338,6 @@ export const MODELS = {
11658
11338
  contextWindow: 1000000,
11659
11339
  maxTokens: 32768,
11660
11340
  },
11661
- "qwen/qwen-turbo": {
11662
- id: "qwen/qwen-turbo",
11663
- name: "Qwen: Qwen-Turbo",
11664
- api: "openai-completions",
11665
- provider: "openrouter",
11666
- baseUrl: "https://openrouter.ai/api/v1",
11667
- reasoning: false,
11668
- input: ["text"],
11669
- cost: {
11670
- input: 0.0325,
11671
- output: 0.13,
11672
- cacheRead: 0.006500000000000001,
11673
- cacheWrite: 0,
11674
- },
11675
- contextWindow: 131072,
11676
- maxTokens: 8192,
11677
- },
11678
- "qwen/qwen-vl-max": {
11679
- id: "qwen/qwen-vl-max",
11680
- name: "Qwen: Qwen VL Max",
11681
- api: "openai-completions",
11682
- provider: "openrouter",
11683
- baseUrl: "https://openrouter.ai/api/v1",
11684
- reasoning: false,
11685
- input: ["text", "image"],
11686
- cost: {
11687
- input: 0.52,
11688
- output: 2.08,
11689
- cacheRead: 0,
11690
- cacheWrite: 0,
11691
- },
11692
- contextWindow: 131072,
11693
- maxTokens: 32768,
11694
- },
11695
11341
  "qwen/qwen3-14b": {
11696
11342
  id: "qwen/qwen3-14b",
11697
11343
  name: "Qwen: Qwen3 14B",
@@ -11701,12 +11347,12 @@ export const MODELS = {
11701
11347
  reasoning: true,
11702
11348
  input: ["text"],
11703
11349
  cost: {
11704
- input: 0.06,
11350
+ input: 0.09999999999999999,
11705
11351
  output: 0.24,
11706
11352
  cacheRead: 0,
11707
11353
  cacheWrite: 0,
11708
11354
  },
11709
- contextWindow: 40960,
11355
+ contextWindow: 131702,
11710
11356
  maxTokens: 40960,
11711
11357
  },
11712
11358
  "qwen/qwen3-235b-a22b": {
@@ -11757,7 +11403,7 @@ export const MODELS = {
11757
11403
  cacheRead: 0,
11758
11404
  cacheWrite: 0,
11759
11405
  },
11760
- contextWindow: 131072,
11406
+ contextWindow: 262144,
11761
11407
  maxTokens: 4096,
11762
11408
  },
11763
11409
  "qwen/qwen3-30b-a3b": {
@@ -11774,7 +11420,7 @@ export const MODELS = {
11774
11420
  cacheRead: 0,
11775
11421
  cacheWrite: 0,
11776
11422
  },
11777
- contextWindow: 40960,
11423
+ contextWindow: 131072,
11778
11424
  maxTokens: 20000,
11779
11425
  },
11780
11426
  "qwen/qwen3-30b-a3b-instruct-2507": {
@@ -11821,12 +11467,12 @@ export const MODELS = {
11821
11467
  input: ["text"],
11822
11468
  cost: {
11823
11469
  input: 0.08,
11824
- output: 0.24,
11825
- cacheRead: 0.04,
11470
+ output: 0.28,
11471
+ cacheRead: 0,
11826
11472
  cacheWrite: 0,
11827
11473
  },
11828
- contextWindow: 40960,
11829
- maxTokens: 40960,
11474
+ contextWindow: 131072,
11475
+ maxTokens: 16384,
11830
11476
  },
11831
11477
  "qwen/qwen3-8b": {
11832
11478
  id: "qwen/qwen3-8b",
@@ -11842,7 +11488,7 @@ export const MODELS = {
11842
11488
  cacheRead: 0.049999999999999996,
11843
11489
  cacheWrite: 0,
11844
11490
  },
11845
- contextWindow: 40960,
11491
+ contextWindow: 131072,
11846
11492
  maxTokens: 8192,
11847
11493
  },
11848
11494
  "qwen/qwen3-coder": {
@@ -11859,7 +11505,7 @@ export const MODELS = {
11859
11505
  cacheRead: 0,
11860
11506
  cacheWrite: 0,
11861
11507
  },
11862
- contextWindow: 262144,
11508
+ contextWindow: 1048576,
11863
11509
  maxTokens: 65536,
11864
11510
  },
11865
11511
  "qwen/qwen3-coder-30b-a3b-instruct": {
@@ -11944,7 +11590,7 @@ export const MODELS = {
11944
11590
  cacheRead: 0,
11945
11591
  cacheWrite: 0,
11946
11592
  },
11947
- contextWindow: 262000,
11593
+ contextWindow: 1048576,
11948
11594
  maxTokens: 262000,
11949
11595
  },
11950
11596
  "qwen/qwen3-max": {
@@ -12029,7 +11675,7 @@ export const MODELS = {
12029
11675
  cacheRead: 0,
12030
11676
  cacheWrite: 0,
12031
11677
  },
12032
- contextWindow: 131072,
11678
+ contextWindow: 262144,
12033
11679
  maxTokens: 32768,
12034
11680
  },
12035
11681
  "qwen/qwen3-vl-235b-a22b-instruct": {
@@ -12080,7 +11726,7 @@ export const MODELS = {
12080
11726
  cacheRead: 0,
12081
11727
  cacheWrite: 0,
12082
11728
  },
12083
- contextWindow: 131072,
11729
+ contextWindow: 262144,
12084
11730
  maxTokens: 32768,
12085
11731
  },
12086
11732
  "qwen/qwen3-vl-30b-a3b-thinking": {
@@ -12114,7 +11760,7 @@ export const MODELS = {
12114
11760
  cacheRead: 0,
12115
11761
  cacheWrite: 0,
12116
11762
  },
12117
- contextWindow: 131072,
11763
+ contextWindow: 262144,
12118
11764
  maxTokens: 32768,
12119
11765
  },
12120
11766
  "qwen/qwen3-vl-8b-instruct": {
@@ -12131,7 +11777,7 @@ export const MODELS = {
12131
11777
  cacheRead: 0,
12132
11778
  cacheWrite: 0,
12133
11779
  },
12134
- contextWindow: 131072,
11780
+ contextWindow: 256000,
12135
11781
  maxTokens: 32768,
12136
11782
  },
12137
11783
  "qwen/qwen3-vl-8b-thinking": {
@@ -12148,7 +11794,7 @@ export const MODELS = {
12148
11794
  cacheRead: 0,
12149
11795
  cacheWrite: 0,
12150
11796
  },
12151
- contextWindow: 131072,
11797
+ contextWindow: 256000,
12152
11798
  maxTokens: 32768,
12153
11799
  },
12154
11800
  "qwen/qwen3.5-122b-a10b": {
@@ -12194,13 +11840,13 @@ export const MODELS = {
12194
11840
  reasoning: true,
12195
11841
  input: ["text", "image"],
12196
11842
  cost: {
12197
- input: 0.14,
11843
+ input: 0.13899999999999998,
12198
11844
  output: 1,
12199
- cacheRead: 0.049999999999999996,
11845
+ cacheRead: 0,
12200
11846
  cacheWrite: 0,
12201
11847
  },
12202
11848
  contextWindow: 262144,
12203
- maxTokens: 81920,
11849
+ maxTokens: 4096,
12204
11850
  },
12205
11851
  "qwen/qwen3.5-397b-a17b": {
12206
11852
  id: "qwen/qwen3.5-397b-a17b",
@@ -12213,7 +11859,7 @@ export const MODELS = {
12213
11859
  cost: {
12214
11860
  input: 0.39,
12215
11861
  output: 2.34,
12216
- cacheRead: 0.195,
11862
+ cacheRead: 0,
12217
11863
  cacheWrite: 0,
12218
11864
  },
12219
11865
  contextWindow: 262144,
@@ -12279,8 +11925,8 @@ export const MODELS = {
12279
11925
  reasoning: true,
12280
11926
  input: ["text", "image"],
12281
11927
  cost: {
12282
- input: 0.39999999999999997,
12283
- output: 2.4,
11928
+ input: 0.3,
11929
+ output: 1.7999999999999998,
12284
11930
  cacheRead: 0,
12285
11931
  cacheWrite: 0,
12286
11932
  },
@@ -12296,13 +11942,13 @@ export const MODELS = {
12296
11942
  reasoning: true,
12297
11943
  input: ["text", "image"],
12298
11944
  cost: {
12299
- input: 0.32,
11945
+ input: 0.317,
12300
11946
  output: 3.1999999999999997,
12301
11947
  cacheRead: 0,
12302
11948
  cacheWrite: 0,
12303
11949
  },
12304
11950
  contextWindow: 262144,
12305
- maxTokens: 81920,
11951
+ maxTokens: 262140,
12306
11952
  },
12307
11953
  "qwen/qwen3.6-35b-a3b": {
12308
11954
  id: "qwen/qwen3.6-35b-a3b",
@@ -12330,10 +11976,10 @@ export const MODELS = {
12330
11976
  reasoning: true,
12331
11977
  input: ["text", "image"],
12332
11978
  cost: {
12333
- input: 0.25,
12334
- output: 1.5,
11979
+ input: 0.1875,
11980
+ output: 1.125,
12335
11981
  cacheRead: 0,
12336
- cacheWrite: 0.3125,
11982
+ cacheWrite: 0.234375,
12337
11983
  },
12338
11984
  contextWindow: 1000000,
12339
11985
  maxTokens: 65536,
@@ -12372,6 +12018,23 @@ export const MODELS = {
12372
12018
  contextWindow: 1000000,
12373
12019
  maxTokens: 65536,
12374
12020
  },
12021
+ "qwen/qwen3.7-max": {
12022
+ id: "qwen/qwen3.7-max",
12023
+ name: "Qwen: Qwen3.7 Max",
12024
+ api: "openai-completions",
12025
+ provider: "openrouter",
12026
+ baseUrl: "https://openrouter.ai/api/v1",
12027
+ reasoning: true,
12028
+ input: ["text"],
12029
+ cost: {
12030
+ input: 2.5,
12031
+ output: 7.5,
12032
+ cacheRead: 0,
12033
+ cacheWrite: 3.125,
12034
+ },
12035
+ contextWindow: 1000000,
12036
+ maxTokens: 65536,
12037
+ },
12375
12038
  "rekaai/reka-edge": {
12376
12039
  id: "rekaai/reka-edge",
12377
12040
  name: "Reka Edge",
@@ -12449,26 +12112,26 @@ export const MODELS = {
12449
12112
  reasoning: true,
12450
12113
  input: ["text"],
12451
12114
  cost: {
12452
- input: 0.09999999999999999,
12115
+ input: 0.09,
12453
12116
  output: 0.3,
12454
- cacheRead: 0,
12117
+ cacheRead: 0.02,
12455
12118
  cacheWrite: 0,
12456
12119
  },
12457
12120
  contextWindow: 262144,
12458
- maxTokens: 65536,
12121
+ maxTokens: 16384,
12459
12122
  },
12460
- "tencent/hy3-preview:free": {
12461
- id: "tencent/hy3-preview:free",
12462
- name: "Tencent: Hy3 preview (free)",
12123
+ "tencent/hy3-preview": {
12124
+ id: "tencent/hy3-preview",
12125
+ name: "Tencent: Hy3 preview",
12463
12126
  api: "openai-completions",
12464
12127
  provider: "openrouter",
12465
12128
  baseUrl: "https://openrouter.ai/api/v1",
12466
12129
  reasoning: true,
12467
12130
  input: ["text"],
12468
12131
  cost: {
12469
- input: 0,
12470
- output: 0,
12471
- cacheRead: 0,
12132
+ input: 0.06599999999999999,
12133
+ output: 0.26,
12134
+ cacheRead: 0.029,
12472
12135
  cacheWrite: 0,
12473
12136
  },
12474
12137
  contextWindow: 262144,
@@ -12508,23 +12171,6 @@ export const MODELS = {
12508
12171
  contextWindow: 32768,
12509
12172
  maxTokens: 32768,
12510
12173
  },
12511
- "tngtech/deepseek-r1t2-chimera": {
12512
- id: "tngtech/deepseek-r1t2-chimera",
12513
- name: "TNG: DeepSeek R1T2 Chimera",
12514
- api: "openai-completions",
12515
- provider: "openrouter",
12516
- baseUrl: "https://openrouter.ai/api/v1",
12517
- reasoning: true,
12518
- input: ["text"],
12519
- cost: {
12520
- input: 0.3,
12521
- output: 1.1,
12522
- cacheRead: 0.15,
12523
- cacheWrite: 0,
12524
- },
12525
- contextWindow: 163840,
12526
- maxTokens: 163840,
12527
- },
12528
12174
  "upstage/solar-pro-3": {
12529
12175
  id: "upstage/solar-pro-3",
12530
12176
  name: "Upstage: Solar Pro 3",
@@ -12542,125 +12188,6 @@ export const MODELS = {
12542
12188
  contextWindow: 128000,
12543
12189
  maxTokens: 4096,
12544
12190
  },
12545
- "x-ai/grok-3": {
12546
- id: "x-ai/grok-3",
12547
- name: "xAI: Grok 3",
12548
- api: "openai-completions",
12549
- provider: "openrouter",
12550
- baseUrl: "https://openrouter.ai/api/v1",
12551
- reasoning: false,
12552
- input: ["text"],
12553
- cost: {
12554
- input: 3,
12555
- output: 15,
12556
- cacheRead: 0.75,
12557
- cacheWrite: 0,
12558
- },
12559
- contextWindow: 131072,
12560
- maxTokens: 4096,
12561
- },
12562
- "x-ai/grok-3-beta": {
12563
- id: "x-ai/grok-3-beta",
12564
- name: "xAI: Grok 3 Beta",
12565
- api: "openai-completions",
12566
- provider: "openrouter",
12567
- baseUrl: "https://openrouter.ai/api/v1",
12568
- reasoning: false,
12569
- input: ["text"],
12570
- cost: {
12571
- input: 3,
12572
- output: 15,
12573
- cacheRead: 0.75,
12574
- cacheWrite: 0,
12575
- },
12576
- contextWindow: 131072,
12577
- maxTokens: 4096,
12578
- },
12579
- "x-ai/grok-3-mini": {
12580
- id: "x-ai/grok-3-mini",
12581
- name: "xAI: Grok 3 Mini",
12582
- api: "openai-completions",
12583
- provider: "openrouter",
12584
- baseUrl: "https://openrouter.ai/api/v1",
12585
- reasoning: true,
12586
- input: ["text"],
12587
- cost: {
12588
- input: 0.3,
12589
- output: 0.5,
12590
- cacheRead: 0.075,
12591
- cacheWrite: 0,
12592
- },
12593
- contextWindow: 131072,
12594
- maxTokens: 4096,
12595
- },
12596
- "x-ai/grok-3-mini-beta": {
12597
- id: "x-ai/grok-3-mini-beta",
12598
- name: "xAI: Grok 3 Mini Beta",
12599
- api: "openai-completions",
12600
- provider: "openrouter",
12601
- baseUrl: "https://openrouter.ai/api/v1",
12602
- reasoning: true,
12603
- input: ["text"],
12604
- cost: {
12605
- input: 0.3,
12606
- output: 0.5,
12607
- cacheRead: 0.075,
12608
- cacheWrite: 0,
12609
- },
12610
- contextWindow: 131072,
12611
- maxTokens: 4096,
12612
- },
12613
- "x-ai/grok-4": {
12614
- id: "x-ai/grok-4",
12615
- name: "xAI: Grok 4",
12616
- api: "openai-completions",
12617
- provider: "openrouter",
12618
- baseUrl: "https://openrouter.ai/api/v1",
12619
- reasoning: true,
12620
- input: ["text", "image"],
12621
- cost: {
12622
- input: 3,
12623
- output: 15,
12624
- cacheRead: 0.75,
12625
- cacheWrite: 0,
12626
- },
12627
- contextWindow: 256000,
12628
- maxTokens: 4096,
12629
- },
12630
- "x-ai/grok-4-fast": {
12631
- id: "x-ai/grok-4-fast",
12632
- name: "xAI: Grok 4 Fast",
12633
- api: "openai-completions",
12634
- provider: "openrouter",
12635
- baseUrl: "https://openrouter.ai/api/v1",
12636
- reasoning: true,
12637
- input: ["text", "image"],
12638
- cost: {
12639
- input: 0.19999999999999998,
12640
- output: 0.5,
12641
- cacheRead: 0.049999999999999996,
12642
- cacheWrite: 0,
12643
- },
12644
- contextWindow: 2000000,
12645
- maxTokens: 30000,
12646
- },
12647
- "x-ai/grok-4.1-fast": {
12648
- id: "x-ai/grok-4.1-fast",
12649
- name: "xAI: Grok 4.1 Fast",
12650
- api: "openai-completions",
12651
- provider: "openrouter",
12652
- baseUrl: "https://openrouter.ai/api/v1",
12653
- reasoning: true,
12654
- input: ["text", "image"],
12655
- cost: {
12656
- input: 0.19999999999999998,
12657
- output: 0.5,
12658
- cacheRead: 0.049999999999999996,
12659
- cacheWrite: 0,
12660
- },
12661
- contextWindow: 2000000,
12662
- maxTokens: 30000,
12663
- },
12664
12191
  "x-ai/grok-4.20": {
12665
12192
  id: "x-ai/grok-4.20",
12666
12193
  name: "xAI: Grok 4.20",
@@ -12695,22 +12222,22 @@ export const MODELS = {
12695
12222
  contextWindow: 1000000,
12696
12223
  maxTokens: 4096,
12697
12224
  },
12698
- "x-ai/grok-code-fast-1": {
12699
- id: "x-ai/grok-code-fast-1",
12700
- name: "xAI: Grok Code Fast 1",
12225
+ "x-ai/grok-build-0.1": {
12226
+ id: "x-ai/grok-build-0.1",
12227
+ name: "xAI: Grok Build 0.1",
12701
12228
  api: "openai-completions",
12702
12229
  provider: "openrouter",
12703
12230
  baseUrl: "https://openrouter.ai/api/v1",
12704
12231
  reasoning: true,
12705
- input: ["text"],
12232
+ input: ["text", "image"],
12706
12233
  cost: {
12707
- input: 0.19999999999999998,
12708
- output: 1.5,
12709
- cacheRead: 0.02,
12234
+ input: 1,
12235
+ output: 2,
12236
+ cacheRead: 0.19999999999999998,
12710
12237
  cacheWrite: 0,
12711
12238
  },
12712
12239
  contextWindow: 256000,
12713
- maxTokens: 10000,
12240
+ maxTokens: 4096,
12714
12241
  },
12715
12242
  "xiaomi/mimo-v2-flash": {
12716
12243
  id: "xiaomi/mimo-v2-flash",
@@ -12721,9 +12248,9 @@ export const MODELS = {
12721
12248
  reasoning: true,
12722
12249
  input: ["text"],
12723
12250
  cost: {
12724
- input: 0.09,
12725
- output: 0.29,
12726
- cacheRead: 0.045,
12251
+ input: 0.09999999999999999,
12252
+ output: 0.3,
12253
+ cacheRead: 0.01,
12727
12254
  cacheWrite: 0,
12728
12255
  },
12729
12256
  contextWindow: 262144,
@@ -12795,7 +12322,7 @@ export const MODELS = {
12795
12322
  cacheWrite: 0,
12796
12323
  },
12797
12324
  contextWindow: 1048576,
12798
- maxTokens: 131072,
12325
+ maxTokens: 16384,
12799
12326
  },
12800
12327
  "z-ai/glm-4-32b": {
12801
12328
  id: "z-ai/glm-4-32b",
@@ -12891,13 +12418,13 @@ export const MODELS = {
12891
12418
  reasoning: true,
12892
12419
  input: ["text"],
12893
12420
  cost: {
12894
- input: 0.39,
12895
- output: 1.9,
12896
- cacheRead: 0,
12421
+ input: 0.43,
12422
+ output: 1.74,
12423
+ cacheRead: 0.08,
12897
12424
  cacheWrite: 0,
12898
12425
  },
12899
- contextWindow: 204800,
12900
- maxTokens: 204800,
12426
+ contextWindow: 202752,
12427
+ maxTokens: 131072,
12901
12428
  },
12902
12429
  "z-ai/glm-4.6v": {
12903
12430
  id: "z-ai/glm-4.6v",
@@ -12925,13 +12452,13 @@ export const MODELS = {
12925
12452
  reasoning: true,
12926
12453
  input: ["text"],
12927
12454
  cost: {
12928
- input: 0.38,
12929
- output: 1.74,
12930
- cacheRead: 0,
12455
+ input: 0.39999999999999997,
12456
+ output: 1.75,
12457
+ cacheRead: 0.08,
12931
12458
  cacheWrite: 0,
12932
12459
  },
12933
12460
  contextWindow: 202752,
12934
- maxTokens: 4096,
12461
+ maxTokens: 131072,
12935
12462
  },
12936
12463
  "z-ai/glm-4.7-flash": {
12937
12464
  id: "z-ai/glm-4.7-flash",
@@ -12993,13 +12520,13 @@ export const MODELS = {
12993
12520
  reasoning: true,
12994
12521
  input: ["text"],
12995
12522
  cost: {
12996
- input: 1.0499999999999998,
12997
- output: 3.5,
12998
- cacheRead: 0.5249999999999999,
12523
+ input: 0.98,
12524
+ output: 3.08,
12525
+ cacheRead: 0.182,
12999
12526
  cacheWrite: 0,
13000
12527
  },
13001
12528
  contextWindow: 202752,
13002
- maxTokens: 65535,
12529
+ maxTokens: 4096,
13003
12530
  },
13004
12531
  "z-ai/glm-5v-turbo": {
13005
12532
  id: "z-ai/glm-5v-turbo",
@@ -13078,9 +12605,9 @@ export const MODELS = {
13078
12605
  reasoning: true,
13079
12606
  input: ["text", "image"],
13080
12607
  cost: {
13081
- input: 0.5,
13082
- output: 3,
13083
- cacheRead: 0.049999999999999996,
12608
+ input: 1.5,
12609
+ output: 9,
12610
+ cacheRead: 0.15,
13084
12611
  cacheWrite: 0.08333333333333334,
13085
12612
  },
13086
12613
  contextWindow: 1048576,
@@ -13112,13 +12639,13 @@ export const MODELS = {
13112
12639
  reasoning: true,
13113
12640
  input: ["text", "image"],
13114
12641
  cost: {
13115
- input: 0.75,
13116
- output: 3.5,
13117
- cacheRead: 0.15,
12642
+ input: 0.73,
12643
+ output: 3.49,
12644
+ cacheRead: 0.25,
13118
12645
  cacheWrite: 0,
13119
12646
  },
13120
12647
  contextWindow: 262144,
13121
- maxTokens: 16384,
12648
+ maxTokens: 262142,
13122
12649
  },
13123
12650
  "~openai/gpt-latest": {
13124
12651
  id: "~openai/gpt-latest",
@@ -13155,62 +12682,384 @@ export const MODELS = {
13155
12682
  maxTokens: 128000,
13156
12683
  },
13157
12684
  },
13158
- "vercel-ai-gateway": {
13159
- "alibaba/qwen-3-14b": {
13160
- id: "alibaba/qwen-3-14b",
13161
- name: "Qwen3-14B",
13162
- api: "anthropic-messages",
13163
- provider: "vercel-ai-gateway",
13164
- baseUrl: "https://ai-gateway.vercel.sh",
12685
+ "together": {
12686
+ "MiniMaxAI/MiniMax-M2.5": {
12687
+ id: "MiniMaxAI/MiniMax-M2.5",
12688
+ name: "MiniMax-M2.5",
12689
+ api: "openai-completions",
12690
+ provider: "together",
12691
+ baseUrl: "https://api.together.ai/v1",
12692
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
13165
12693
  reasoning: true,
12694
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
13166
12695
  input: ["text"],
13167
12696
  cost: {
13168
- input: 0.12,
13169
- output: 0.24,
13170
- cacheRead: 0,
12697
+ input: 0.3,
12698
+ output: 1.2,
12699
+ cacheRead: 0.06,
13171
12700
  cacheWrite: 0,
13172
12701
  },
13173
- contextWindow: 40960,
13174
- maxTokens: 16384,
12702
+ contextWindow: 204800,
12703
+ maxTokens: 131072,
13175
12704
  },
13176
- "alibaba/qwen-3-235b": {
13177
- id: "alibaba/qwen-3-235b",
13178
- name: "Qwen3 235B A22b Instruct 2507",
13179
- api: "anthropic-messages",
13180
- provider: "vercel-ai-gateway",
13181
- baseUrl: "https://ai-gateway.vercel.sh",
13182
- reasoning: false,
12705
+ "MiniMaxAI/MiniMax-M2.7": {
12706
+ id: "MiniMaxAI/MiniMax-M2.7",
12707
+ name: "MiniMax-M2.7",
12708
+ api: "openai-completions",
12709
+ provider: "together",
12710
+ baseUrl: "https://api.together.ai/v1",
12711
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
12712
+ reasoning: true,
12713
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
13183
12714
  input: ["text"],
13184
12715
  cost: {
13185
- input: 0.6,
12716
+ input: 0.3,
13186
12717
  output: 1.2,
13187
- cacheRead: 0.6,
12718
+ cacheRead: 0.06,
13188
12719
  cacheWrite: 0,
13189
12720
  },
13190
- contextWindow: 131000,
13191
- maxTokens: 40000,
12721
+ contextWindow: 202752,
12722
+ maxTokens: 131072,
13192
12723
  },
13193
- "alibaba/qwen-3-30b": {
13194
- id: "alibaba/qwen-3-30b",
13195
- name: "Qwen3-30B-A3B",
13196
- api: "anthropic-messages",
13197
- provider: "vercel-ai-gateway",
13198
- baseUrl: "https://ai-gateway.vercel.sh",
12724
+ "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
12725
+ id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
12726
+ name: "Qwen3 235B A22B Instruct 2507 FP8",
12727
+ api: "openai-completions",
12728
+ provider: "together",
12729
+ baseUrl: "https://api.together.ai/v1",
12730
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13199
12731
  reasoning: true,
12732
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13200
12733
  input: ["text"],
13201
12734
  cost: {
13202
- input: 0.08,
13203
- output: 0.29,
12735
+ input: 0.2,
12736
+ output: 0.6,
13204
12737
  cacheRead: 0,
13205
12738
  cacheWrite: 0,
13206
12739
  },
13207
- contextWindow: 40960,
13208
- maxTokens: 16384,
12740
+ contextWindow: 262144,
12741
+ maxTokens: 262144,
13209
12742
  },
13210
- "alibaba/qwen-3-32b": {
13211
- id: "alibaba/qwen-3-32b",
13212
- name: "Qwen 3 32B",
13213
- api: "anthropic-messages",
12743
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8": {
12744
+ id: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
12745
+ name: "Qwen3 Coder 480B A35B Instruct",
12746
+ api: "openai-completions",
12747
+ provider: "together",
12748
+ baseUrl: "https://api.together.ai/v1",
12749
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
12750
+ reasoning: false,
12751
+ input: ["text"],
12752
+ cost: {
12753
+ input: 2,
12754
+ output: 2,
12755
+ cacheRead: 0,
12756
+ cacheWrite: 0,
12757
+ },
12758
+ contextWindow: 262144,
12759
+ maxTokens: 262144,
12760
+ },
12761
+ "Qwen/Qwen3-Coder-Next-FP8": {
12762
+ id: "Qwen/Qwen3-Coder-Next-FP8",
12763
+ name: "Qwen3 Coder Next FP8",
12764
+ api: "openai-completions",
12765
+ provider: "together",
12766
+ baseUrl: "https://api.together.ai/v1",
12767
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12768
+ reasoning: true,
12769
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12770
+ input: ["text"],
12771
+ cost: {
12772
+ input: 0.5,
12773
+ output: 1.2,
12774
+ cacheRead: 0,
12775
+ cacheWrite: 0,
12776
+ },
12777
+ contextWindow: 262144,
12778
+ maxTokens: 262144,
12779
+ },
12780
+ "Qwen/Qwen3.5-397B-A17B": {
12781
+ id: "Qwen/Qwen3.5-397B-A17B",
12782
+ name: "Qwen3.5 397B A17B",
12783
+ api: "openai-completions",
12784
+ provider: "together",
12785
+ baseUrl: "https://api.together.ai/v1",
12786
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12787
+ reasoning: true,
12788
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12789
+ input: ["text", "image"],
12790
+ cost: {
12791
+ input: 0.6,
12792
+ output: 3.6,
12793
+ cacheRead: 0,
12794
+ cacheWrite: 0,
12795
+ },
12796
+ contextWindow: 262144,
12797
+ maxTokens: 130000,
12798
+ },
12799
+ "Qwen/Qwen3.6-Plus": {
12800
+ id: "Qwen/Qwen3.6-Plus",
12801
+ name: "Qwen3.6 Plus",
12802
+ api: "openai-completions",
12803
+ provider: "together",
12804
+ baseUrl: "https://api.together.ai/v1",
12805
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12806
+ reasoning: true,
12807
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12808
+ input: ["text"],
12809
+ cost: {
12810
+ input: 0.5,
12811
+ output: 3,
12812
+ cacheRead: 0,
12813
+ cacheWrite: 0,
12814
+ },
12815
+ contextWindow: 1000000,
12816
+ maxTokens: 500000,
12817
+ },
12818
+ "deepseek-ai/DeepSeek-V3": {
12819
+ id: "deepseek-ai/DeepSeek-V3",
12820
+ name: "DeepSeek V3",
12821
+ api: "openai-completions",
12822
+ provider: "together",
12823
+ baseUrl: "https://api.together.ai/v1",
12824
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12825
+ reasoning: true,
12826
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12827
+ input: ["text"],
12828
+ cost: {
12829
+ input: 1.25,
12830
+ output: 1.25,
12831
+ cacheRead: 0,
12832
+ cacheWrite: 0,
12833
+ },
12834
+ contextWindow: 131072,
12835
+ maxTokens: 131072,
12836
+ },
12837
+ "deepseek-ai/DeepSeek-V3-1": {
12838
+ id: "deepseek-ai/DeepSeek-V3-1",
12839
+ name: "DeepSeek V3.1",
12840
+ api: "openai-completions",
12841
+ provider: "together",
12842
+ baseUrl: "https://api.together.ai/v1",
12843
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12844
+ reasoning: true,
12845
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12846
+ input: ["text"],
12847
+ cost: {
12848
+ input: 0.6,
12849
+ output: 1.7,
12850
+ cacheRead: 0,
12851
+ cacheWrite: 0,
12852
+ },
12853
+ contextWindow: 131072,
12854
+ maxTokens: 131072,
12855
+ },
12856
+ "deepseek-ai/DeepSeek-V4-Pro": {
12857
+ id: "deepseek-ai/DeepSeek-V4-Pro",
12858
+ name: "DeepSeek V4 Pro",
12859
+ api: "openai-completions",
12860
+ provider: "together",
12861
+ baseUrl: "https://api.together.ai/v1",
12862
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12863
+ reasoning: true,
12864
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": null },
12865
+ input: ["text"],
12866
+ cost: {
12867
+ input: 2.1,
12868
+ output: 4.4,
12869
+ cacheRead: 0.2,
12870
+ cacheWrite: 0,
12871
+ },
12872
+ contextWindow: 512000,
12873
+ maxTokens: 384000,
12874
+ },
12875
+ "essentialai/Rnj-1-Instruct": {
12876
+ id: "essentialai/Rnj-1-Instruct",
12877
+ name: "Rnj-1 Instruct",
12878
+ api: "openai-completions",
12879
+ provider: "together",
12880
+ baseUrl: "https://api.together.ai/v1",
12881
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
12882
+ reasoning: false,
12883
+ input: ["text"],
12884
+ cost: {
12885
+ input: 0.15,
12886
+ output: 0.15,
12887
+ cacheRead: 0,
12888
+ cacheWrite: 0,
12889
+ },
12890
+ contextWindow: 32768,
12891
+ maxTokens: 32768,
12892
+ },
12893
+ "google/gemma-4-31B-it": {
12894
+ id: "google/gemma-4-31B-it",
12895
+ name: "Gemma 4 31B Instruct",
12896
+ api: "openai-completions",
12897
+ provider: "together",
12898
+ baseUrl: "https://api.together.ai/v1",
12899
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12900
+ reasoning: true,
12901
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12902
+ input: ["text", "image"],
12903
+ cost: {
12904
+ input: 0.2,
12905
+ output: 0.5,
12906
+ cacheRead: 0,
12907
+ cacheWrite: 0,
12908
+ },
12909
+ contextWindow: 262144,
12910
+ maxTokens: 131072,
12911
+ },
12912
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo": {
12913
+ id: "meta-llama/Llama-3.3-70B-Instruct-Turbo",
12914
+ name: "Llama 3.3 70B",
12915
+ api: "openai-completions",
12916
+ provider: "together",
12917
+ baseUrl: "https://api.together.ai/v1",
12918
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
12919
+ reasoning: false,
12920
+ input: ["text"],
12921
+ cost: {
12922
+ input: 0.88,
12923
+ output: 0.88,
12924
+ cacheRead: 0,
12925
+ cacheWrite: 0,
12926
+ },
12927
+ contextWindow: 131072,
12928
+ maxTokens: 131072,
12929
+ },
12930
+ "moonshotai/Kimi-K2.5": {
12931
+ id: "moonshotai/Kimi-K2.5",
12932
+ name: "Kimi K2.5",
12933
+ api: "openai-completions",
12934
+ provider: "together",
12935
+ baseUrl: "https://api.together.ai/v1",
12936
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12937
+ reasoning: true,
12938
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12939
+ input: ["text", "image"],
12940
+ cost: {
12941
+ input: 0.5,
12942
+ output: 2.8,
12943
+ cacheRead: 0,
12944
+ cacheWrite: 0,
12945
+ },
12946
+ contextWindow: 262144,
12947
+ maxTokens: 262144,
12948
+ },
12949
+ "moonshotai/Kimi-K2.6": {
12950
+ id: "moonshotai/Kimi-K2.6",
12951
+ name: "Kimi K2.6",
12952
+ api: "openai-completions",
12953
+ provider: "together",
12954
+ baseUrl: "https://api.together.ai/v1",
12955
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12956
+ reasoning: true,
12957
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12958
+ input: ["text", "image"],
12959
+ cost: {
12960
+ input: 1.2,
12961
+ output: 4.5,
12962
+ cacheRead: 0.2,
12963
+ cacheWrite: 0,
12964
+ },
12965
+ contextWindow: 262144,
12966
+ maxTokens: 131000,
12967
+ },
12968
+ "openai/gpt-oss-120b": {
12969
+ id: "openai/gpt-oss-120b",
12970
+ name: "GPT OSS 120B",
12971
+ api: "openai-completions",
12972
+ provider: "together",
12973
+ baseUrl: "https://api.together.ai/v1",
12974
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "openai" },
12975
+ reasoning: true,
12976
+ thinkingLevelMap: { "off": null, "minimal": null },
12977
+ input: ["text"],
12978
+ cost: {
12979
+ input: 0.15,
12980
+ output: 0.6,
12981
+ cacheRead: 0,
12982
+ cacheWrite: 0,
12983
+ },
12984
+ contextWindow: 131072,
12985
+ maxTokens: 131072,
12986
+ },
12987
+ "zai-org/GLM-5.1": {
12988
+ id: "zai-org/GLM-5.1",
12989
+ name: "GLM-5.1",
12990
+ api: "openai-completions",
12991
+ provider: "together",
12992
+ baseUrl: "https://api.together.ai/v1",
12993
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12994
+ reasoning: true,
12995
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12996
+ input: ["text"],
12997
+ cost: {
12998
+ input: 1.4,
12999
+ output: 4.4,
13000
+ cacheRead: 0,
13001
+ cacheWrite: 0,
13002
+ },
13003
+ contextWindow: 202752,
13004
+ maxTokens: 131072,
13005
+ },
13006
+ },
13007
+ "vercel-ai-gateway": {
13008
+ "alibaba/qwen-3-14b": {
13009
+ id: "alibaba/qwen-3-14b",
13010
+ name: "Qwen3-14B",
13011
+ api: "anthropic-messages",
13012
+ provider: "vercel-ai-gateway",
13013
+ baseUrl: "https://ai-gateway.vercel.sh",
13014
+ reasoning: true,
13015
+ input: ["text"],
13016
+ cost: {
13017
+ input: 0.12,
13018
+ output: 0.24,
13019
+ cacheRead: 0,
13020
+ cacheWrite: 0,
13021
+ },
13022
+ contextWindow: 40960,
13023
+ maxTokens: 16384,
13024
+ },
13025
+ "alibaba/qwen-3-235b": {
13026
+ id: "alibaba/qwen-3-235b",
13027
+ name: "Qwen3 235B A22b Instruct 2507",
13028
+ api: "anthropic-messages",
13029
+ provider: "vercel-ai-gateway",
13030
+ baseUrl: "https://ai-gateway.vercel.sh",
13031
+ reasoning: false,
13032
+ input: ["text"],
13033
+ cost: {
13034
+ input: 0.6,
13035
+ output: 1.2,
13036
+ cacheRead: 0.6,
13037
+ cacheWrite: 0,
13038
+ },
13039
+ contextWindow: 131000,
13040
+ maxTokens: 40000,
13041
+ },
13042
+ "alibaba/qwen-3-30b": {
13043
+ id: "alibaba/qwen-3-30b",
13044
+ name: "Qwen3-30B-A3B",
13045
+ api: "anthropic-messages",
13046
+ provider: "vercel-ai-gateway",
13047
+ baseUrl: "https://ai-gateway.vercel.sh",
13048
+ reasoning: true,
13049
+ input: ["text"],
13050
+ cost: {
13051
+ input: 0.08,
13052
+ output: 0.29,
13053
+ cacheRead: 0,
13054
+ cacheWrite: 0,
13055
+ },
13056
+ contextWindow: 40960,
13057
+ maxTokens: 16384,
13058
+ },
13059
+ "alibaba/qwen-3-32b": {
13060
+ id: "alibaba/qwen-3-32b",
13061
+ name: "Qwen 3 32B",
13062
+ api: "anthropic-messages",
13214
13063
  provider: "vercel-ai-gateway",
13215
13064
  baseUrl: "https://ai-gateway.vercel.sh",
13216
13065
  reasoning: true,
@@ -13462,6 +13311,23 @@ export const MODELS = {
13462
13311
  contextWindow: 1000000,
13463
13312
  maxTokens: 64000,
13464
13313
  },
13314
+ "alibaba/qwen3.7-max": {
13315
+ id: "alibaba/qwen3.7-max",
13316
+ name: "Qwen 3.7 Max",
13317
+ api: "anthropic-messages",
13318
+ provider: "vercel-ai-gateway",
13319
+ baseUrl: "https://ai-gateway.vercel.sh",
13320
+ reasoning: true,
13321
+ input: ["text", "image"],
13322
+ cost: {
13323
+ input: 2.5,
13324
+ output: 7.5,
13325
+ cacheRead: 0.5,
13326
+ cacheWrite: 3.125,
13327
+ },
13328
+ contextWindow: 991000,
13329
+ maxTokens: 64000,
13330
+ },
13465
13331
  "anthropic/claude-3-haiku": {
13466
13332
  id: "anthropic/claude-3-haiku",
13467
13333
  name: "Claude 3 Haiku",
@@ -13496,26 +13362,9 @@ export const MODELS = {
13496
13362
  contextWindow: 200000,
13497
13363
  maxTokens: 8192,
13498
13364
  },
13499
- "anthropic/claude-3.7-sonnet": {
13500
- id: "anthropic/claude-3.7-sonnet",
13501
- name: "Claude 3.7 Sonnet",
13502
- api: "anthropic-messages",
13503
- provider: "vercel-ai-gateway",
13504
- baseUrl: "https://ai-gateway.vercel.sh",
13505
- reasoning: true,
13506
- input: ["text", "image"],
13507
- cost: {
13508
- input: 3,
13509
- output: 15,
13510
- cacheRead: 0.3,
13511
- cacheWrite: 3.75,
13512
- },
13513
- contextWindow: 200000,
13514
- maxTokens: 8192,
13515
- },
13516
- "anthropic/claude-haiku-4.5": {
13517
- id: "anthropic/claude-haiku-4.5",
13518
- name: "Claude Haiku 4.5",
13365
+ "anthropic/claude-haiku-4.5": {
13366
+ id: "anthropic/claude-haiku-4.5",
13367
+ name: "Claude Haiku 4.5",
13519
13368
  api: "anthropic-messages",
13520
13369
  provider: "vercel-ai-gateway",
13521
13370
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -13991,6 +13840,23 @@ export const MODELS = {
13991
13840
  contextWindow: 1000000,
13992
13841
  maxTokens: 64000,
13993
13842
  },
13843
+ "google/gemini-3.1-flash-lite": {
13844
+ id: "google/gemini-3.1-flash-lite",
13845
+ name: "Gemini 3.1 Flash Lite",
13846
+ api: "anthropic-messages",
13847
+ provider: "vercel-ai-gateway",
13848
+ baseUrl: "https://ai-gateway.vercel.sh",
13849
+ reasoning: true,
13850
+ input: ["text", "image"],
13851
+ cost: {
13852
+ input: 0.25,
13853
+ output: 1.5,
13854
+ cacheRead: 0.03,
13855
+ cacheWrite: 0,
13856
+ },
13857
+ contextWindow: 1000000,
13858
+ maxTokens: 65000,
13859
+ },
13994
13860
  "google/gemini-3.1-flash-lite-preview": {
13995
13861
  id: "google/gemini-3.1-flash-lite-preview",
13996
13862
  name: "Gemini 3.1 Flash Lite Preview",
@@ -14025,6 +13891,23 @@ export const MODELS = {
14025
13891
  contextWindow: 1000000,
14026
13892
  maxTokens: 64000,
14027
13893
  },
13894
+ "google/gemini-3.5-flash": {
13895
+ id: "google/gemini-3.5-flash",
13896
+ name: "Gemini 3.5 Flash",
13897
+ api: "anthropic-messages",
13898
+ provider: "vercel-ai-gateway",
13899
+ baseUrl: "https://ai-gateway.vercel.sh",
13900
+ reasoning: true,
13901
+ input: ["text", "image"],
13902
+ cost: {
13903
+ input: 1.5,
13904
+ output: 9,
13905
+ cacheRead: 0.15,
13906
+ cacheWrite: 0,
13907
+ },
13908
+ contextWindow: 1000000,
13909
+ maxTokens: 64000,
13910
+ },
14028
13911
  "google/gemma-4-26b-a4b-it": {
14029
13912
  id: "google/gemma-4-26b-a4b-it",
14030
13913
  name: "Gemma 4 26B A4B IT",
@@ -14484,6 +14367,23 @@ export const MODELS = {
14484
14367
  contextWindow: 128000,
14485
14368
  maxTokens: 64000,
14486
14369
  },
14370
+ "mistral/mistral-medium-3.5": {
14371
+ id: "mistral/mistral-medium-3.5",
14372
+ name: "Mistral Medium Latest",
14373
+ api: "anthropic-messages",
14374
+ provider: "vercel-ai-gateway",
14375
+ baseUrl: "https://ai-gateway.vercel.sh",
14376
+ reasoning: true,
14377
+ input: ["text"],
14378
+ cost: {
14379
+ input: 1.5,
14380
+ output: 7.5,
14381
+ cacheRead: 0,
14382
+ cacheWrite: 0,
14383
+ },
14384
+ contextWindow: 256000,
14385
+ maxTokens: 256000,
14386
+ },
14487
14387
  "mistral/mistral-small": {
14488
14388
  id: "mistral/mistral-small",
14489
14389
  name: "Mistral Small",
@@ -15178,7 +15078,7 @@ export const MODELS = {
15178
15078
  },
15179
15079
  "openai/gpt-oss-20b": {
15180
15080
  id: "openai/gpt-oss-20b",
15181
- name: "GPT OSS 120B",
15081
+ name: "GPT OSS 20B",
15182
15082
  api: "anthropic-messages",
15183
15083
  provider: "vercel-ai-gateway",
15184
15084
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -15346,125 +15246,6 @@ export const MODELS = {
15346
15246
  contextWindow: 200000,
15347
15247
  maxTokens: 8000,
15348
15248
  },
15349
- "xai/grok-3": {
15350
- id: "xai/grok-3",
15351
- name: "Grok 3 Beta",
15352
- api: "anthropic-messages",
15353
- provider: "vercel-ai-gateway",
15354
- baseUrl: "https://ai-gateway.vercel.sh",
15355
- reasoning: false,
15356
- input: ["text"],
15357
- cost: {
15358
- input: 3,
15359
- output: 15,
15360
- cacheRead: 0.75,
15361
- cacheWrite: 0,
15362
- },
15363
- contextWindow: 131072,
15364
- maxTokens: 131072,
15365
- },
15366
- "xai/grok-3-fast": {
15367
- id: "xai/grok-3-fast",
15368
- name: "Grok 3 Fast Beta",
15369
- api: "anthropic-messages",
15370
- provider: "vercel-ai-gateway",
15371
- baseUrl: "https://ai-gateway.vercel.sh",
15372
- reasoning: false,
15373
- input: ["text"],
15374
- cost: {
15375
- input: 5,
15376
- output: 25,
15377
- cacheRead: 1.25,
15378
- cacheWrite: 0,
15379
- },
15380
- contextWindow: 131072,
15381
- maxTokens: 131072,
15382
- },
15383
- "xai/grok-3-mini": {
15384
- id: "xai/grok-3-mini",
15385
- name: "Grok 3 Mini Beta",
15386
- api: "anthropic-messages",
15387
- provider: "vercel-ai-gateway",
15388
- baseUrl: "https://ai-gateway.vercel.sh",
15389
- reasoning: false,
15390
- input: ["text"],
15391
- cost: {
15392
- input: 0.3,
15393
- output: 0.5,
15394
- cacheRead: 0.075,
15395
- cacheWrite: 0,
15396
- },
15397
- contextWindow: 131072,
15398
- maxTokens: 131072,
15399
- },
15400
- "xai/grok-3-mini-fast": {
15401
- id: "xai/grok-3-mini-fast",
15402
- name: "Grok 3 Mini Fast Beta",
15403
- api: "anthropic-messages",
15404
- provider: "vercel-ai-gateway",
15405
- baseUrl: "https://ai-gateway.vercel.sh",
15406
- reasoning: false,
15407
- input: ["text"],
15408
- cost: {
15409
- input: 0.6,
15410
- output: 4,
15411
- cacheRead: 0,
15412
- cacheWrite: 0,
15413
- },
15414
- contextWindow: 131072,
15415
- maxTokens: 131072,
15416
- },
15417
- "xai/grok-4": {
15418
- id: "xai/grok-4",
15419
- name: "Grok 4",
15420
- api: "anthropic-messages",
15421
- provider: "vercel-ai-gateway",
15422
- baseUrl: "https://ai-gateway.vercel.sh",
15423
- reasoning: true,
15424
- input: ["text", "image"],
15425
- cost: {
15426
- input: 3,
15427
- output: 15,
15428
- cacheRead: 0.75,
15429
- cacheWrite: 0,
15430
- },
15431
- contextWindow: 256000,
15432
- maxTokens: 256000,
15433
- },
15434
- "xai/grok-4-fast-non-reasoning": {
15435
- id: "xai/grok-4-fast-non-reasoning",
15436
- name: "Grok 4 Fast Non-Reasoning",
15437
- api: "anthropic-messages",
15438
- provider: "vercel-ai-gateway",
15439
- baseUrl: "https://ai-gateway.vercel.sh",
15440
- reasoning: false,
15441
- input: ["text", "image"],
15442
- cost: {
15443
- input: 0.19999999999999998,
15444
- output: 0.5,
15445
- cacheRead: 0.049999999999999996,
15446
- cacheWrite: 0,
15447
- },
15448
- contextWindow: 2000000,
15449
- maxTokens: 256000,
15450
- },
15451
- "xai/grok-4-fast-reasoning": {
15452
- id: "xai/grok-4-fast-reasoning",
15453
- name: "Grok 4 Fast Reasoning",
15454
- api: "anthropic-messages",
15455
- provider: "vercel-ai-gateway",
15456
- baseUrl: "https://ai-gateway.vercel.sh",
15457
- reasoning: true,
15458
- input: ["text", "image"],
15459
- cost: {
15460
- input: 0.19999999999999998,
15461
- output: 0.5,
15462
- cacheRead: 0.049999999999999996,
15463
- cacheWrite: 0,
15464
- },
15465
- contextWindow: 2000000,
15466
- maxTokens: 256000,
15467
- },
15468
15249
  "xai/grok-4.1-fast-non-reasoning": {
15469
15250
  id: "xai/grok-4.1-fast-non-reasoning",
15470
15251
  name: "Grok 4.1 Fast Non-Reasoning",
@@ -15479,8 +15260,8 @@ export const MODELS = {
15479
15260
  cacheRead: 0.049999999999999996,
15480
15261
  cacheWrite: 0,
15481
15262
  },
15482
- contextWindow: 2000000,
15483
- maxTokens: 30000,
15263
+ contextWindow: 1000000,
15264
+ maxTokens: 1000000,
15484
15265
  },
15485
15266
  "xai/grok-4.1-fast-reasoning": {
15486
15267
  id: "xai/grok-4.1-fast-reasoning",
@@ -15496,8 +15277,8 @@ export const MODELS = {
15496
15277
  cacheRead: 0.049999999999999996,
15497
15278
  cacheWrite: 0,
15498
15279
  },
15499
- contextWindow: 2000000,
15500
- maxTokens: 30000,
15280
+ contextWindow: 1000000,
15281
+ maxTokens: 1000000,
15501
15282
  },
15502
15283
  "xai/grok-4.20-multi-agent": {
15503
15284
  id: "xai/grok-4.20-multi-agent",
@@ -15618,18 +15399,18 @@ export const MODELS = {
15618
15399
  contextWindow: 1000000,
15619
15400
  maxTokens: 1000000,
15620
15401
  },
15621
- "xai/grok-code-fast-1": {
15622
- id: "xai/grok-code-fast-1",
15623
- name: "Grok Code Fast 1",
15402
+ "xai/grok-build-0.1": {
15403
+ id: "xai/grok-build-0.1",
15404
+ name: "Grok Build 0.1",
15624
15405
  api: "anthropic-messages",
15625
15406
  provider: "vercel-ai-gateway",
15626
15407
  baseUrl: "https://ai-gateway.vercel.sh",
15627
15408
  reasoning: true,
15628
- input: ["text"],
15409
+ input: ["text", "image"],
15629
15410
  cost: {
15630
- input: 0.19999999999999998,
15631
- output: 1.5,
15632
- cacheRead: 0.02,
15411
+ input: 1,
15412
+ output: 2,
15413
+ cacheRead: 0.19999999999999998,
15633
15414
  cacheWrite: 0,
15634
15415
  },
15635
15416
  contextWindow: 256000,
@@ -15926,108 +15707,6 @@ export const MODELS = {
15926
15707
  },
15927
15708
  },
15928
15709
  "xai": {
15929
- "grok-2": {
15930
- id: "grok-2",
15931
- name: "Grok 2",
15932
- api: "openai-completions",
15933
- provider: "xai",
15934
- baseUrl: "https://api.x.ai/v1",
15935
- reasoning: false,
15936
- input: ["text"],
15937
- cost: {
15938
- input: 2,
15939
- output: 10,
15940
- cacheRead: 2,
15941
- cacheWrite: 0,
15942
- },
15943
- contextWindow: 131072,
15944
- maxTokens: 8192,
15945
- },
15946
- "grok-2-1212": {
15947
- id: "grok-2-1212",
15948
- name: "Grok 2 (1212)",
15949
- api: "openai-completions",
15950
- provider: "xai",
15951
- baseUrl: "https://api.x.ai/v1",
15952
- reasoning: false,
15953
- input: ["text"],
15954
- cost: {
15955
- input: 2,
15956
- output: 10,
15957
- cacheRead: 2,
15958
- cacheWrite: 0,
15959
- },
15960
- contextWindow: 131072,
15961
- maxTokens: 8192,
15962
- },
15963
- "grok-2-latest": {
15964
- id: "grok-2-latest",
15965
- name: "Grok 2 Latest",
15966
- api: "openai-completions",
15967
- provider: "xai",
15968
- baseUrl: "https://api.x.ai/v1",
15969
- reasoning: false,
15970
- input: ["text"],
15971
- cost: {
15972
- input: 2,
15973
- output: 10,
15974
- cacheRead: 2,
15975
- cacheWrite: 0,
15976
- },
15977
- contextWindow: 131072,
15978
- maxTokens: 8192,
15979
- },
15980
- "grok-2-vision": {
15981
- id: "grok-2-vision",
15982
- name: "Grok 2 Vision",
15983
- api: "openai-completions",
15984
- provider: "xai",
15985
- baseUrl: "https://api.x.ai/v1",
15986
- reasoning: false,
15987
- input: ["text", "image"],
15988
- cost: {
15989
- input: 2,
15990
- output: 10,
15991
- cacheRead: 2,
15992
- cacheWrite: 0,
15993
- },
15994
- contextWindow: 8192,
15995
- maxTokens: 4096,
15996
- },
15997
- "grok-2-vision-1212": {
15998
- id: "grok-2-vision-1212",
15999
- name: "Grok 2 Vision (1212)",
16000
- api: "openai-completions",
16001
- provider: "xai",
16002
- baseUrl: "https://api.x.ai/v1",
16003
- reasoning: false,
16004
- input: ["text", "image"],
16005
- cost: {
16006
- input: 2,
16007
- output: 10,
16008
- cacheRead: 2,
16009
- cacheWrite: 0,
16010
- },
16011
- contextWindow: 8192,
16012
- maxTokens: 4096,
16013
- },
16014
- "grok-2-vision-latest": {
16015
- id: "grok-2-vision-latest",
16016
- name: "Grok 2 Vision Latest",
16017
- api: "openai-completions",
16018
- provider: "xai",
16019
- baseUrl: "https://api.x.ai/v1",
16020
- reasoning: false,
16021
- input: ["text", "image"],
16022
- cost: {
16023
- input: 2,
16024
- output: 10,
16025
- cacheRead: 2,
16026
- cacheWrite: 0,
16027
- },
16028
- contextWindow: 8192,
16029
- maxTokens: 4096,
16030
- },
16031
15710
  "grok-3": {
16032
15711
  id: "grok-3",
16033
15712
  name: "Grok 3",
@@ -16062,193 +15741,6 @@ export const MODELS = {
16062
15741
  contextWindow: 131072,
16063
15742
  maxTokens: 8192,
16064
15743
  },
16065
- "grok-3-fast-latest": {
16066
- id: "grok-3-fast-latest",
16067
- name: "Grok 3 Fast Latest",
16068
- api: "openai-completions",
16069
- provider: "xai",
16070
- baseUrl: "https://api.x.ai/v1",
16071
- reasoning: false,
16072
- input: ["text"],
16073
- cost: {
16074
- input: 5,
16075
- output: 25,
16076
- cacheRead: 1.25,
16077
- cacheWrite: 0,
16078
- },
16079
- contextWindow: 131072,
16080
- maxTokens: 8192,
16081
- },
16082
- "grok-3-latest": {
16083
- id: "grok-3-latest",
16084
- name: "Grok 3 Latest",
16085
- api: "openai-completions",
16086
- provider: "xai",
16087
- baseUrl: "https://api.x.ai/v1",
16088
- reasoning: false,
16089
- input: ["text"],
16090
- cost: {
16091
- input: 3,
16092
- output: 15,
16093
- cacheRead: 0.75,
16094
- cacheWrite: 0,
16095
- },
16096
- contextWindow: 131072,
16097
- maxTokens: 8192,
16098
- },
16099
- "grok-3-mini": {
16100
- id: "grok-3-mini",
16101
- name: "Grok 3 Mini",
16102
- api: "openai-completions",
16103
- provider: "xai",
16104
- baseUrl: "https://api.x.ai/v1",
16105
- reasoning: true,
16106
- input: ["text"],
16107
- cost: {
16108
- input: 0.3,
16109
- output: 0.5,
16110
- cacheRead: 0.075,
16111
- cacheWrite: 0,
16112
- },
16113
- contextWindow: 131072,
16114
- maxTokens: 8192,
16115
- },
16116
- "grok-3-mini-fast": {
16117
- id: "grok-3-mini-fast",
16118
- name: "Grok 3 Mini Fast",
16119
- api: "openai-completions",
16120
- provider: "xai",
16121
- baseUrl: "https://api.x.ai/v1",
16122
- reasoning: true,
16123
- input: ["text"],
16124
- cost: {
16125
- input: 0.6,
16126
- output: 4,
16127
- cacheRead: 0.15,
16128
- cacheWrite: 0,
16129
- },
16130
- contextWindow: 131072,
16131
- maxTokens: 8192,
16132
- },
16133
- "grok-3-mini-fast-latest": {
16134
- id: "grok-3-mini-fast-latest",
16135
- name: "Grok 3 Mini Fast Latest",
16136
- api: "openai-completions",
16137
- provider: "xai",
16138
- baseUrl: "https://api.x.ai/v1",
16139
- reasoning: true,
16140
- input: ["text"],
16141
- cost: {
16142
- input: 0.6,
16143
- output: 4,
16144
- cacheRead: 0.15,
16145
- cacheWrite: 0,
16146
- },
16147
- contextWindow: 131072,
16148
- maxTokens: 8192,
16149
- },
16150
- "grok-3-mini-latest": {
16151
- id: "grok-3-mini-latest",
16152
- name: "Grok 3 Mini Latest",
16153
- api: "openai-completions",
16154
- provider: "xai",
16155
- baseUrl: "https://api.x.ai/v1",
16156
- reasoning: true,
16157
- input: ["text"],
16158
- cost: {
16159
- input: 0.3,
16160
- output: 0.5,
16161
- cacheRead: 0.075,
16162
- cacheWrite: 0,
16163
- },
16164
- contextWindow: 131072,
16165
- maxTokens: 8192,
16166
- },
16167
- "grok-4": {
16168
- id: "grok-4",
16169
- name: "Grok 4",
16170
- api: "openai-completions",
16171
- provider: "xai",
16172
- baseUrl: "https://api.x.ai/v1",
16173
- reasoning: true,
16174
- input: ["text"],
16175
- cost: {
16176
- input: 3,
16177
- output: 15,
16178
- cacheRead: 0.75,
16179
- cacheWrite: 0,
16180
- },
16181
- contextWindow: 256000,
16182
- maxTokens: 64000,
16183
- },
16184
- "grok-4-1-fast": {
16185
- id: "grok-4-1-fast",
16186
- name: "Grok 4.1 Fast",
16187
- api: "openai-completions",
16188
- provider: "xai",
16189
- baseUrl: "https://api.x.ai/v1",
16190
- reasoning: true,
16191
- input: ["text", "image"],
16192
- cost: {
16193
- input: 0.2,
16194
- output: 0.5,
16195
- cacheRead: 0.05,
16196
- cacheWrite: 0,
16197
- },
16198
- contextWindow: 2000000,
16199
- maxTokens: 30000,
16200
- },
16201
- "grok-4-1-fast-non-reasoning": {
16202
- id: "grok-4-1-fast-non-reasoning",
16203
- name: "Grok 4.1 Fast (Non-Reasoning)",
16204
- api: "openai-completions",
16205
- provider: "xai",
16206
- baseUrl: "https://api.x.ai/v1",
16207
- reasoning: false,
16208
- input: ["text", "image"],
16209
- cost: {
16210
- input: 0.2,
16211
- output: 0.5,
16212
- cacheRead: 0.05,
16213
- cacheWrite: 0,
16214
- },
16215
- contextWindow: 2000000,
16216
- maxTokens: 30000,
16217
- },
16218
- "grok-4-fast": {
16219
- id: "grok-4-fast",
16220
- name: "Grok 4 Fast",
16221
- api: "openai-completions",
16222
- provider: "xai",
16223
- baseUrl: "https://api.x.ai/v1",
16224
- reasoning: true,
16225
- input: ["text", "image"],
16226
- cost: {
16227
- input: 0.2,
16228
- output: 0.5,
16229
- cacheRead: 0.05,
16230
- cacheWrite: 0,
16231
- },
16232
- contextWindow: 2000000,
16233
- maxTokens: 30000,
16234
- },
16235
- "grok-4-fast-non-reasoning": {
16236
- id: "grok-4-fast-non-reasoning",
16237
- name: "Grok 4 Fast (Non-Reasoning)",
16238
- api: "openai-completions",
16239
- provider: "xai",
16240
- baseUrl: "https://api.x.ai/v1",
16241
- reasoning: false,
16242
- input: ["text", "image"],
16243
- cost: {
16244
- input: 0.2,
16245
- output: 0.5,
16246
- cacheRead: 0.05,
16247
- cacheWrite: 0,
16248
- },
16249
- contextWindow: 2000000,
16250
- maxTokens: 30000,
16251
- },
16252
15744
  "grok-4.20-0309-non-reasoning": {
16253
15745
  id: "grok-4.20-0309-non-reasoning",
16254
15746
  name: "Grok 4.20 (Non-Reasoning)",
@@ -16258,8 +15750,8 @@ export const MODELS = {
16258
15750
  reasoning: false,
16259
15751
  input: ["text", "image"],
16260
15752
  cost: {
16261
- input: 2,
16262
- output: 6,
15753
+ input: 1.25,
15754
+ output: 2.5,
16263
15755
  cacheRead: 0.2,
16264
15756
  cacheWrite: 0,
16265
15757
  },
@@ -16275,8 +15767,8 @@ export const MODELS = {
16275
15767
  reasoning: true,
16276
15768
  input: ["text", "image"],
16277
15769
  cost: {
16278
- input: 2,
16279
- output: 6,
15770
+ input: 1.25,
15771
+ output: 2.5,
16280
15772
  cacheRead: 0.2,
16281
15773
  cacheWrite: 0,
16282
15774
  },
@@ -16300,22 +15792,22 @@ export const MODELS = {
16300
15792
  contextWindow: 1000000,
16301
15793
  maxTokens: 30000,
16302
15794
  },
16303
- "grok-beta": {
16304
- id: "grok-beta",
16305
- name: "Grok Beta",
15795
+ "grok-build-0.1": {
15796
+ id: "grok-build-0.1",
15797
+ name: "Grok Build 0.1",
16306
15798
  api: "openai-completions",
16307
15799
  provider: "xai",
16308
15800
  baseUrl: "https://api.x.ai/v1",
16309
- reasoning: false,
16310
- input: ["text"],
15801
+ reasoning: true,
15802
+ input: ["text", "image"],
16311
15803
  cost: {
16312
- input: 5,
16313
- output: 15,
16314
- cacheRead: 5,
15804
+ input: 1,
15805
+ output: 2,
15806
+ cacheRead: 0.2,
16315
15807
  cacheWrite: 0,
16316
15808
  },
16317
- contextWindow: 131072,
16318
- maxTokens: 4096,
15809
+ contextWindow: 256000,
15810
+ maxTokens: 256000,
16319
15811
  },
16320
15812
  "grok-code-fast-1": {
16321
15813
  id: "grok-code-fast-1",
@@ -16323,7 +15815,7 @@ export const MODELS = {
16323
15815
  api: "openai-completions",
16324
15816
  provider: "xai",
16325
15817
  baseUrl: "https://api.x.ai/v1",
16326
- reasoning: true,
15818
+ reasoning: false,
16327
15819
  input: ["text"],
16328
15820
  cost: {
16329
15821
  input: 0.2,
@@ -16331,25 +15823,8 @@ export const MODELS = {
16331
15823
  cacheRead: 0.02,
16332
15824
  cacheWrite: 0,
16333
15825
  },
16334
- contextWindow: 256000,
16335
- maxTokens: 10000,
16336
- },
16337
- "grok-vision-beta": {
16338
- id: "grok-vision-beta",
16339
- name: "Grok Vision Beta",
16340
- api: "openai-completions",
16341
- provider: "xai",
16342
- baseUrl: "https://api.x.ai/v1",
16343
- reasoning: false,
16344
- input: ["text", "image"],
16345
- cost: {
16346
- input: 5,
16347
- output: 15,
16348
- cacheRead: 5,
16349
- cacheWrite: 0,
16350
- },
16351
- contextWindow: 8192,
16352
- maxTokens: 4096,
15826
+ contextWindow: 32768,
15827
+ maxTokens: 8192,
16353
15828
  },
16354
15829
  },
16355
15830
  "xiaomi": {