@earendil-works/pi-ai 0.74.0 → 0.75.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (63) hide show
  1. package/README.md +76 -6
  2. package/dist/env-api-keys.d.ts.map +1 -1
  3. package/dist/env-api-keys.js +2 -1
  4. package/dist/env-api-keys.js.map +1 -1
  5. package/dist/image-models.d.ts +10 -0
  6. package/dist/image-models.d.ts.map +1 -0
  7. package/dist/image-models.generated.d.ts +425 -0
  8. package/dist/image-models.generated.d.ts.map +1 -0
  9. package/dist/image-models.generated.js +427 -0
  10. package/dist/image-models.generated.js.map +1 -0
  11. package/dist/image-models.js +23 -0
  12. package/dist/image-models.js.map +1 -0
  13. package/dist/images-api-registry.d.ts +14 -0
  14. package/dist/images-api-registry.d.ts.map +1 -0
  15. package/dist/images-api-registry.js +22 -0
  16. package/dist/images-api-registry.js.map +1 -0
  17. package/dist/images.d.ts +4 -0
  18. package/dist/images.d.ts.map +1 -0
  19. package/dist/images.js +14 -0
  20. package/dist/images.js.map +1 -0
  21. package/dist/index.d.ts +4 -0
  22. package/dist/index.d.ts.map +1 -1
  23. package/dist/index.js +4 -0
  24. package/dist/index.js.map +1 -1
  25. package/dist/models.generated.d.ts +1029 -1190
  26. package/dist/models.generated.d.ts.map +1 -1
  27. package/dist/models.generated.js +970 -1399
  28. package/dist/models.generated.js.map +1 -1
  29. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  30. package/dist/providers/amazon-bedrock.js +7 -16
  31. package/dist/providers/amazon-bedrock.js.map +1 -1
  32. package/dist/providers/anthropic.d.ts.map +1 -1
  33. package/dist/providers/anthropic.js +15 -6
  34. package/dist/providers/anthropic.js.map +1 -1
  35. package/dist/providers/images/openrouter.d.ts +3 -0
  36. package/dist/providers/images/openrouter.d.ts.map +1 -0
  37. package/dist/providers/images/openrouter.js +129 -0
  38. package/dist/providers/images/openrouter.js.map +1 -0
  39. package/dist/providers/images/register-builtins.d.ts +4 -0
  40. package/dist/providers/images/register-builtins.d.ts.map +1 -0
  41. package/dist/providers/images/register-builtins.js +34 -0
  42. package/dist/providers/images/register-builtins.js.map +1 -0
  43. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  44. package/dist/providers/openai-codex-responses.js +49 -3
  45. package/dist/providers/openai-codex-responses.js.map +1 -1
  46. package/dist/providers/openai-completions.d.ts.map +1 -1
  47. package/dist/providers/openai-completions.js +32 -14
  48. package/dist/providers/openai-completions.js.map +1 -1
  49. package/dist/providers/simple-options.d.ts.map +1 -1
  50. package/dist/providers/simple-options.js +8 -1
  51. package/dist/providers/simple-options.js.map +1 -1
  52. package/dist/types.d.ts +86 -3
  53. package/dist/types.d.ts.map +1 -1
  54. package/dist/types.js.map +1 -1
  55. package/dist/utils/node-http-proxy.d.ts +10 -0
  56. package/dist/utils/node-http-proxy.d.ts.map +1 -0
  57. package/dist/utils/node-http-proxy.js +97 -0
  58. package/dist/utils/node-http-proxy.js.map +1 -0
  59. package/dist/utils/overflow.d.ts +2 -1
  60. package/dist/utils/overflow.d.ts.map +1 -1
  61. package/dist/utils/overflow.js +6 -1
  62. package/dist/utils/overflow.js.map +1 -1
  63. package/package.json +7 -8
@@ -53,23 +53,6 @@ export const MODELS = {
53
53
  contextWindow: 128000,
54
54
  maxTokens: 8192,
55
55
  },
56
- "amazon.nova-premier-v1:0": {
57
- id: "amazon.nova-premier-v1:0",
58
- name: "Nova Premier",
59
- api: "bedrock-converse-stream",
60
- provider: "amazon-bedrock",
61
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
62
- reasoning: true,
63
- input: ["text", "image"],
64
- cost: {
65
- input: 2.5,
66
- output: 12.5,
67
- cacheRead: 0,
68
- cacheWrite: 0,
69
- },
70
- contextWindow: 1000000,
71
- maxTokens: 16384,
72
- },
73
56
  "amazon.nova-pro-v1:0": {
74
57
  id: "amazon.nova-pro-v1:0",
75
58
  name: "Nova Pro",
@@ -87,91 +70,6 @@ export const MODELS = {
87
70
  contextWindow: 300000,
88
71
  maxTokens: 8192,
89
72
  },
90
- "anthropic.claude-3-5-haiku-20241022-v1:0": {
91
- id: "anthropic.claude-3-5-haiku-20241022-v1:0",
92
- name: "Claude Haiku 3.5",
93
- api: "bedrock-converse-stream",
94
- provider: "amazon-bedrock",
95
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
96
- reasoning: false,
97
- input: ["text", "image"],
98
- cost: {
99
- input: 0.8,
100
- output: 4,
101
- cacheRead: 0.08,
102
- cacheWrite: 1,
103
- },
104
- contextWindow: 200000,
105
- maxTokens: 8192,
106
- },
107
- "anthropic.claude-3-5-sonnet-20240620-v1:0": {
108
- id: "anthropic.claude-3-5-sonnet-20240620-v1:0",
109
- name: "Claude Sonnet 3.5",
110
- api: "bedrock-converse-stream",
111
- provider: "amazon-bedrock",
112
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
113
- reasoning: false,
114
- input: ["text", "image"],
115
- cost: {
116
- input: 3,
117
- output: 15,
118
- cacheRead: 0.3,
119
- cacheWrite: 3.75,
120
- },
121
- contextWindow: 200000,
122
- maxTokens: 8192,
123
- },
124
- "anthropic.claude-3-5-sonnet-20241022-v2:0": {
125
- id: "anthropic.claude-3-5-sonnet-20241022-v2:0",
126
- name: "Claude Sonnet 3.5 v2",
127
- api: "bedrock-converse-stream",
128
- provider: "amazon-bedrock",
129
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
130
- reasoning: false,
131
- input: ["text", "image"],
132
- cost: {
133
- input: 3,
134
- output: 15,
135
- cacheRead: 0.3,
136
- cacheWrite: 3.75,
137
- },
138
- contextWindow: 200000,
139
- maxTokens: 8192,
140
- },
141
- "anthropic.claude-3-7-sonnet-20250219-v1:0": {
142
- id: "anthropic.claude-3-7-sonnet-20250219-v1:0",
143
- name: "Claude Sonnet 3.7",
144
- api: "bedrock-converse-stream",
145
- provider: "amazon-bedrock",
146
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
147
- reasoning: false,
148
- input: ["text", "image"],
149
- cost: {
150
- input: 3,
151
- output: 15,
152
- cacheRead: 0.3,
153
- cacheWrite: 3.75,
154
- },
155
- contextWindow: 200000,
156
- maxTokens: 8192,
157
- },
158
- "anthropic.claude-3-haiku-20240307-v1:0": {
159
- id: "anthropic.claude-3-haiku-20240307-v1:0",
160
- name: "Claude Haiku 3",
161
- api: "bedrock-converse-stream",
162
- provider: "amazon-bedrock",
163
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
164
- reasoning: false,
165
- input: ["text", "image"],
166
- cost: {
167
- input: 0.25,
168
- output: 1.25,
169
- cacheRead: 0,
170
- cacheWrite: 0,
171
- },
172
- contextWindow: 200000,
173
- maxTokens: 4096,
174
- },
175
73
  "anthropic.claude-haiku-4-5-20251001-v1:0": {
176
74
  id: "anthropic.claude-haiku-4-5-20251001-v1:0",
177
75
  name: "Claude Haiku 4.5",
@@ -206,23 +104,6 @@ export const MODELS = {
206
104
  contextWindow: 200000,
207
105
  maxTokens: 32000,
208
106
  },
209
- "anthropic.claude-opus-4-20250514-v1:0": {
210
- id: "anthropic.claude-opus-4-20250514-v1:0",
211
- name: "Claude Opus 4",
212
- api: "bedrock-converse-stream",
213
- provider: "amazon-bedrock",
214
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
215
- reasoning: true,
216
- input: ["text", "image"],
217
- cost: {
218
- input: 15,
219
- output: 75,
220
- cacheRead: 1.5,
221
- cacheWrite: 18.75,
222
- },
223
- contextWindow: 200000,
224
- maxTokens: 32000,
225
- },
226
107
  "anthropic.claude-opus-4-5-20251101-v1:0": {
227
108
  id: "anthropic.claude-opus-4-5-20251101-v1:0",
228
109
  name: "Claude Opus 4.5",
@@ -276,9 +157,9 @@ export const MODELS = {
276
157
  contextWindow: 1000000,
277
158
  maxTokens: 128000,
278
159
  },
279
- "anthropic.claude-sonnet-4-20250514-v1:0": {
280
- id: "anthropic.claude-sonnet-4-20250514-v1:0",
281
- name: "Claude Sonnet 4",
160
+ "anthropic.claude-sonnet-4-5-20250929-v1:0": {
161
+ id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
162
+ name: "Claude Sonnet 4.5",
282
163
  api: "bedrock-converse-stream",
283
164
  provider: "amazon-bedrock",
284
165
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -293,9 +174,9 @@ export const MODELS = {
293
174
  contextWindow: 200000,
294
175
  maxTokens: 64000,
295
176
  },
296
- "anthropic.claude-sonnet-4-5-20250929-v1:0": {
297
- id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
298
- name: "Claude Sonnet 4.5",
177
+ "anthropic.claude-sonnet-4-6": {
178
+ id: "anthropic.claude-sonnet-4-6",
179
+ name: "Claude Sonnet 4.6",
299
180
  api: "bedrock-converse-stream",
300
181
  provider: "amazon-bedrock",
301
182
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -307,24 +188,24 @@ export const MODELS = {
307
188
  cacheRead: 0.3,
308
189
  cacheWrite: 3.75,
309
190
  },
310
- contextWindow: 200000,
191
+ contextWindow: 1000000,
311
192
  maxTokens: 64000,
312
193
  },
313
- "anthropic.claude-sonnet-4-6": {
314
- id: "anthropic.claude-sonnet-4-6",
315
- name: "Claude Sonnet 4.6",
194
+ "au.anthropic.claude-haiku-4-5-20251001-v1:0": {
195
+ id: "au.anthropic.claude-haiku-4-5-20251001-v1:0",
196
+ name: "Claude Haiku 4.5 (AU)",
316
197
  api: "bedrock-converse-stream",
317
198
  provider: "amazon-bedrock",
318
199
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
319
200
  reasoning: true,
320
201
  input: ["text", "image"],
321
202
  cost: {
322
- input: 3,
323
- output: 15,
324
- cacheRead: 0.3,
325
- cacheWrite: 3.75,
203
+ input: 1,
204
+ output: 5,
205
+ cacheRead: 0.1,
206
+ cacheWrite: 1.25,
326
207
  },
327
- contextWindow: 1000000,
208
+ contextWindow: 200000,
328
209
  maxTokens: 64000,
329
210
  },
330
211
  "au.anthropic.claude-opus-4-6-v1": {
@@ -345,6 +226,23 @@ export const MODELS = {
345
226
  contextWindow: 1000000,
346
227
  maxTokens: 128000,
347
228
  },
229
+ "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
230
+ id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
231
+ name: "Claude Sonnet 4.5 (AU)",
232
+ api: "bedrock-converse-stream",
233
+ provider: "amazon-bedrock",
234
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
235
+ reasoning: true,
236
+ input: ["text", "image"],
237
+ cost: {
238
+ input: 3,
239
+ output: 15,
240
+ cacheRead: 0.3,
241
+ cacheWrite: 3.75,
242
+ },
243
+ contextWindow: 200000,
244
+ maxTokens: 64000,
245
+ },
348
246
  "au.anthropic.claude-sonnet-4-6": {
349
247
  id: "au.anthropic.claude-sonnet-4-6",
350
248
  name: "AU Anthropic Claude Sonnet 4.6",
@@ -483,23 +381,6 @@ export const MODELS = {
483
381
  contextWindow: 1000000,
484
382
  maxTokens: 128000,
485
383
  },
486
- "eu.anthropic.claude-sonnet-4-20250514-v1:0": {
487
- id: "eu.anthropic.claude-sonnet-4-20250514-v1:0",
488
- name: "Claude Sonnet 4 (EU)",
489
- api: "bedrock-converse-stream",
490
- provider: "amazon-bedrock",
491
- baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
492
- reasoning: true,
493
- input: ["text", "image"],
494
- cost: {
495
- input: 3,
496
- output: 15,
497
- cacheRead: 0.3,
498
- cacheWrite: 3.75,
499
- },
500
- contextWindow: 200000,
501
- maxTokens: 64000,
502
- },
503
384
  "eu.anthropic.claude-sonnet-4-5-20250929-v1:0": {
504
385
  id: "eu.anthropic.claude-sonnet-4-5-20250929-v1:0",
505
386
  name: "Claude Sonnet 4.5 (EU)",
@@ -604,23 +485,6 @@ export const MODELS = {
604
485
  contextWindow: 1000000,
605
486
  maxTokens: 128000,
606
487
  },
607
- "global.anthropic.claude-sonnet-4-20250514-v1:0": {
608
- id: "global.anthropic.claude-sonnet-4-20250514-v1:0",
609
- name: "Claude Sonnet 4 (Global)",
610
- api: "bedrock-converse-stream",
611
- provider: "amazon-bedrock",
612
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
613
- reasoning: true,
614
- input: ["text", "image"],
615
- cost: {
616
- input: 3,
617
- output: 15,
618
- cacheRead: 0.3,
619
- cacheWrite: 3.75,
620
- },
621
- contextWindow: 200000,
622
- maxTokens: 64000,
623
- },
624
488
  "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
625
489
  id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
626
490
  name: "Claude Sonnet 4.5 (Global)",
@@ -689,22 +553,57 @@ export const MODELS = {
689
553
  contextWindow: 128000,
690
554
  maxTokens: 4096,
691
555
  },
692
- "meta.llama3-1-405b-instruct-v1:0": {
693
- id: "meta.llama3-1-405b-instruct-v1:0",
694
- name: "Llama 3.1 405B Instruct",
556
+ "jp.anthropic.claude-opus-4-7": {
557
+ id: "jp.anthropic.claude-opus-4-7",
558
+ name: "Claude Opus 4.7 (JP)",
695
559
  api: "bedrock-converse-stream",
696
560
  provider: "amazon-bedrock",
697
561
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
698
- reasoning: false,
699
- input: ["text"],
562
+ reasoning: true,
563
+ thinkingLevelMap: { "xhigh": "xhigh" },
564
+ input: ["text", "image"],
700
565
  cost: {
701
- input: 2.4,
702
- output: 2.4,
703
- cacheRead: 0,
704
- cacheWrite: 0,
566
+ input: 5,
567
+ output: 25,
568
+ cacheRead: 0.5,
569
+ cacheWrite: 6.25,
705
570
  },
706
- contextWindow: 128000,
707
- maxTokens: 4096,
571
+ contextWindow: 1000000,
572
+ maxTokens: 128000,
573
+ },
574
+ "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
575
+ id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
576
+ name: "Claude Sonnet 4.5 (JP)",
577
+ api: "bedrock-converse-stream",
578
+ provider: "amazon-bedrock",
579
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
580
+ reasoning: true,
581
+ input: ["text", "image"],
582
+ cost: {
583
+ input: 3,
584
+ output: 15,
585
+ cacheRead: 0.3,
586
+ cacheWrite: 3.75,
587
+ },
588
+ contextWindow: 200000,
589
+ maxTokens: 64000,
590
+ },
591
+ "jp.anthropic.claude-sonnet-4-6": {
592
+ id: "jp.anthropic.claude-sonnet-4-6",
593
+ name: "Claude Sonnet 4.6 (JP)",
594
+ api: "bedrock-converse-stream",
595
+ provider: "amazon-bedrock",
596
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
597
+ reasoning: true,
598
+ input: ["text", "image"],
599
+ cost: {
600
+ input: 3,
601
+ output: 15,
602
+ cacheRead: 0.3,
603
+ cacheWrite: 3.75,
604
+ },
605
+ contextWindow: 1000000,
606
+ maxTokens: 64000,
708
607
  },
709
608
  "meta.llama3-1-70b-instruct-v1:0": {
710
609
  id: "meta.llama3-1-70b-instruct-v1:0",
@@ -740,128 +639,60 @@ export const MODELS = {
740
639
  contextWindow: 128000,
741
640
  maxTokens: 4096,
742
641
  },
743
- "meta.llama3-2-11b-instruct-v1:0": {
744
- id: "meta.llama3-2-11b-instruct-v1:0",
745
- name: "Llama 3.2 11B Instruct",
642
+ "meta.llama3-3-70b-instruct-v1:0": {
643
+ id: "meta.llama3-3-70b-instruct-v1:0",
644
+ name: "Llama 3.3 70B Instruct",
746
645
  api: "bedrock-converse-stream",
747
646
  provider: "amazon-bedrock",
748
647
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
749
648
  reasoning: false,
750
- input: ["text", "image"],
649
+ input: ["text"],
751
650
  cost: {
752
- input: 0.16,
753
- output: 0.16,
651
+ input: 0.72,
652
+ output: 0.72,
754
653
  cacheRead: 0,
755
654
  cacheWrite: 0,
756
655
  },
757
656
  contextWindow: 128000,
758
657
  maxTokens: 4096,
759
658
  },
760
- "meta.llama3-2-1b-instruct-v1:0": {
761
- id: "meta.llama3-2-1b-instruct-v1:0",
762
- name: "Llama 3.2 1B Instruct",
659
+ "meta.llama4-maverick-17b-instruct-v1:0": {
660
+ id: "meta.llama4-maverick-17b-instruct-v1:0",
661
+ name: "Llama 4 Maverick 17B Instruct",
763
662
  api: "bedrock-converse-stream",
764
663
  provider: "amazon-bedrock",
765
664
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
766
665
  reasoning: false,
767
- input: ["text"],
666
+ input: ["text", "image"],
768
667
  cost: {
769
- input: 0.1,
770
- output: 0.1,
668
+ input: 0.24,
669
+ output: 0.97,
771
670
  cacheRead: 0,
772
671
  cacheWrite: 0,
773
672
  },
774
- contextWindow: 131000,
775
- maxTokens: 4096,
673
+ contextWindow: 1000000,
674
+ maxTokens: 16384,
776
675
  },
777
- "meta.llama3-2-3b-instruct-v1:0": {
778
- id: "meta.llama3-2-3b-instruct-v1:0",
779
- name: "Llama 3.2 3B Instruct",
676
+ "meta.llama4-scout-17b-instruct-v1:0": {
677
+ id: "meta.llama4-scout-17b-instruct-v1:0",
678
+ name: "Llama 4 Scout 17B Instruct",
780
679
  api: "bedrock-converse-stream",
781
680
  provider: "amazon-bedrock",
782
681
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
783
682
  reasoning: false,
784
- input: ["text"],
683
+ input: ["text", "image"],
785
684
  cost: {
786
- input: 0.15,
787
- output: 0.15,
685
+ input: 0.17,
686
+ output: 0.66,
788
687
  cacheRead: 0,
789
688
  cacheWrite: 0,
790
689
  },
791
- contextWindow: 131000,
792
- maxTokens: 4096,
690
+ contextWindow: 3500000,
691
+ maxTokens: 16384,
793
692
  },
794
- "meta.llama3-2-90b-instruct-v1:0": {
795
- id: "meta.llama3-2-90b-instruct-v1:0",
796
- name: "Llama 3.2 90B Instruct",
797
- api: "bedrock-converse-stream",
798
- provider: "amazon-bedrock",
799
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
800
- reasoning: false,
801
- input: ["text", "image"],
802
- cost: {
803
- input: 0.72,
804
- output: 0.72,
805
- cacheRead: 0,
806
- cacheWrite: 0,
807
- },
808
- contextWindow: 128000,
809
- maxTokens: 4096,
810
- },
811
- "meta.llama3-3-70b-instruct-v1:0": {
812
- id: "meta.llama3-3-70b-instruct-v1:0",
813
- name: "Llama 3.3 70B Instruct",
814
- api: "bedrock-converse-stream",
815
- provider: "amazon-bedrock",
816
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
817
- reasoning: false,
818
- input: ["text"],
819
- cost: {
820
- input: 0.72,
821
- output: 0.72,
822
- cacheRead: 0,
823
- cacheWrite: 0,
824
- },
825
- contextWindow: 128000,
826
- maxTokens: 4096,
827
- },
828
- "meta.llama4-maverick-17b-instruct-v1:0": {
829
- id: "meta.llama4-maverick-17b-instruct-v1:0",
830
- name: "Llama 4 Maverick 17B Instruct",
831
- api: "bedrock-converse-stream",
832
- provider: "amazon-bedrock",
833
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
834
- reasoning: false,
835
- input: ["text", "image"],
836
- cost: {
837
- input: 0.24,
838
- output: 0.97,
839
- cacheRead: 0,
840
- cacheWrite: 0,
841
- },
842
- contextWindow: 1000000,
843
- maxTokens: 16384,
844
- },
845
- "meta.llama4-scout-17b-instruct-v1:0": {
846
- id: "meta.llama4-scout-17b-instruct-v1:0",
847
- name: "Llama 4 Scout 17B Instruct",
848
- api: "bedrock-converse-stream",
849
- provider: "amazon-bedrock",
850
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
851
- reasoning: false,
852
- input: ["text", "image"],
853
- cost: {
854
- input: 0.17,
855
- output: 0.66,
856
- cacheRead: 0,
857
- cacheWrite: 0,
858
- },
859
- contextWindow: 3500000,
860
- maxTokens: 16384,
861
- },
862
- "minimax.minimax-m2": {
863
- id: "minimax.minimax-m2",
864
- name: "MiniMax M2",
693
+ "minimax.minimax-m2": {
694
+ id: "minimax.minimax-m2",
695
+ name: "MiniMax M2",
865
696
  api: "bedrock-converse-stream",
866
697
  provider: "amazon-bedrock",
867
698
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -1180,7 +1011,7 @@ export const MODELS = {
1180
1011
  cacheWrite: 0,
1181
1012
  },
1182
1013
  contextWindow: 128000,
1183
- maxTokens: 4096,
1014
+ maxTokens: 16384,
1184
1015
  },
1185
1016
  "openai.gpt-oss-20b-1:0": {
1186
1017
  id: "openai.gpt-oss-20b-1:0",
@@ -1197,7 +1028,7 @@ export const MODELS = {
1197
1028
  cacheWrite: 0,
1198
1029
  },
1199
1030
  contextWindow: 128000,
1200
- maxTokens: 4096,
1031
+ maxTokens: 16384,
1201
1032
  },
1202
1033
  "openai.gpt-oss-safeguard-120b": {
1203
1034
  id: "openai.gpt-oss-safeguard-120b",
@@ -1214,7 +1045,7 @@ export const MODELS = {
1214
1045
  cacheWrite: 0,
1215
1046
  },
1216
1047
  contextWindow: 128000,
1217
- maxTokens: 4096,
1048
+ maxTokens: 16384,
1218
1049
  },
1219
1050
  "openai.gpt-oss-safeguard-20b": {
1220
1051
  id: "openai.gpt-oss-safeguard-20b",
@@ -1231,7 +1062,7 @@ export const MODELS = {
1231
1062
  cacheWrite: 0,
1232
1063
  },
1233
1064
  contextWindow: 128000,
1234
- maxTokens: 4096,
1065
+ maxTokens: 16384,
1235
1066
  },
1236
1067
  "qwen.qwen3-235b-a22b-2507-v1:0": {
1237
1068
  id: "qwen.qwen3-235b-a22b-2507-v1:0",
@@ -1386,23 +1217,6 @@ export const MODELS = {
1386
1217
  contextWindow: 200000,
1387
1218
  maxTokens: 32000,
1388
1219
  },
1389
- "us.anthropic.claude-opus-4-20250514-v1:0": {
1390
- id: "us.anthropic.claude-opus-4-20250514-v1:0",
1391
- name: "Claude Opus 4 (US)",
1392
- api: "bedrock-converse-stream",
1393
- provider: "amazon-bedrock",
1394
- baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1395
- reasoning: true,
1396
- input: ["text", "image"],
1397
- cost: {
1398
- input: 15,
1399
- output: 75,
1400
- cacheRead: 1.5,
1401
- cacheWrite: 18.75,
1402
- },
1403
- contextWindow: 200000,
1404
- maxTokens: 32000,
1405
- },
1406
1220
  "us.anthropic.claude-opus-4-5-20251101-v1:0": {
1407
1221
  id: "us.anthropic.claude-opus-4-5-20251101-v1:0",
1408
1222
  name: "Claude Opus 4.5 (US)",
@@ -1456,9 +1270,9 @@ export const MODELS = {
1456
1270
  contextWindow: 1000000,
1457
1271
  maxTokens: 128000,
1458
1272
  },
1459
- "us.anthropic.claude-sonnet-4-20250514-v1:0": {
1460
- id: "us.anthropic.claude-sonnet-4-20250514-v1:0",
1461
- name: "Claude Sonnet 4 (US)",
1273
+ "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1274
+ id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1275
+ name: "Claude Sonnet 4.5 (US)",
1462
1276
  api: "bedrock-converse-stream",
1463
1277
  provider: "amazon-bedrock",
1464
1278
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -1473,9 +1287,9 @@ export const MODELS = {
1473
1287
  contextWindow: 200000,
1474
1288
  maxTokens: 64000,
1475
1289
  },
1476
- "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1477
- id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1478
- name: "Claude Sonnet 4.5 (US)",
1290
+ "us.anthropic.claude-sonnet-4-6": {
1291
+ id: "us.anthropic.claude-sonnet-4-6",
1292
+ name: "Claude Sonnet 4.6 (US)",
1479
1293
  api: "bedrock-converse-stream",
1480
1294
  provider: "amazon-bedrock",
1481
1295
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
@@ -1487,25 +1301,59 @@ export const MODELS = {
1487
1301
  cacheRead: 0.3,
1488
1302
  cacheWrite: 3.75,
1489
1303
  },
1490
- contextWindow: 200000,
1304
+ contextWindow: 1000000,
1491
1305
  maxTokens: 64000,
1492
1306
  },
1493
- "us.anthropic.claude-sonnet-4-6": {
1494
- id: "us.anthropic.claude-sonnet-4-6",
1495
- name: "Claude Sonnet 4.6 (US)",
1307
+ "us.deepseek.r1-v1:0": {
1308
+ id: "us.deepseek.r1-v1:0",
1309
+ name: "DeepSeek-R1 (US)",
1496
1310
  api: "bedrock-converse-stream",
1497
1311
  provider: "amazon-bedrock",
1498
1312
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1499
1313
  reasoning: true,
1314
+ input: ["text"],
1315
+ cost: {
1316
+ input: 1.35,
1317
+ output: 5.4,
1318
+ cacheRead: 0,
1319
+ cacheWrite: 0,
1320
+ },
1321
+ contextWindow: 128000,
1322
+ maxTokens: 32768,
1323
+ },
1324
+ "us.meta.llama4-maverick-17b-instruct-v1:0": {
1325
+ id: "us.meta.llama4-maverick-17b-instruct-v1:0",
1326
+ name: "Llama 4 Maverick 17B Instruct (US)",
1327
+ api: "bedrock-converse-stream",
1328
+ provider: "amazon-bedrock",
1329
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1330
+ reasoning: false,
1500
1331
  input: ["text", "image"],
1501
1332
  cost: {
1502
- input: 3,
1503
- output: 15,
1504
- cacheRead: 0.3,
1505
- cacheWrite: 3.75,
1333
+ input: 0.24,
1334
+ output: 0.97,
1335
+ cacheRead: 0,
1336
+ cacheWrite: 0,
1506
1337
  },
1507
1338
  contextWindow: 1000000,
1508
- maxTokens: 64000,
1339
+ maxTokens: 16384,
1340
+ },
1341
+ "us.meta.llama4-scout-17b-instruct-v1:0": {
1342
+ id: "us.meta.llama4-scout-17b-instruct-v1:0",
1343
+ name: "Llama 4 Scout 17B Instruct (US)",
1344
+ api: "bedrock-converse-stream",
1345
+ provider: "amazon-bedrock",
1346
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1347
+ reasoning: false,
1348
+ input: ["text", "image"],
1349
+ cost: {
1350
+ input: 0.17,
1351
+ output: 0.66,
1352
+ cacheRead: 0,
1353
+ cacheWrite: 0,
1354
+ },
1355
+ contextWindow: 3500000,
1356
+ maxTokens: 16384,
1509
1357
  },
1510
1358
  "writer.palmyra-x4-v1:0": {
1511
1359
  id: "writer.palmyra-x4-v1:0",
@@ -3601,6 +3449,7 @@ export const MODELS = {
3601
3449
  api: "anthropic-messages",
3602
3450
  provider: "fireworks",
3603
3451
  baseUrl: "https://api.fireworks.ai/inference",
3452
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3604
3453
  reasoning: true,
3605
3454
  input: ["text"],
3606
3455
  cost: {
@@ -3618,6 +3467,7 @@ export const MODELS = {
3618
3467
  api: "anthropic-messages",
3619
3468
  provider: "fireworks",
3620
3469
  baseUrl: "https://api.fireworks.ai/inference",
3470
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3621
3471
  reasoning: true,
3622
3472
  input: ["text"],
3623
3473
  cost: {
@@ -3635,6 +3485,7 @@ export const MODELS = {
3635
3485
  api: "anthropic-messages",
3636
3486
  provider: "fireworks",
3637
3487
  baseUrl: "https://api.fireworks.ai/inference",
3488
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3638
3489
  reasoning: true,
3639
3490
  input: ["text"],
3640
3491
  cost: {
@@ -3652,6 +3503,7 @@ export const MODELS = {
3652
3503
  api: "anthropic-messages",
3653
3504
  provider: "fireworks",
3654
3505
  baseUrl: "https://api.fireworks.ai/inference",
3506
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3655
3507
  reasoning: true,
3656
3508
  input: ["text"],
3657
3509
  cost: {
@@ -3669,6 +3521,7 @@ export const MODELS = {
3669
3521
  api: "anthropic-messages",
3670
3522
  provider: "fireworks",
3671
3523
  baseUrl: "https://api.fireworks.ai/inference",
3524
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3672
3525
  reasoning: true,
3673
3526
  input: ["text"],
3674
3527
  cost: {
@@ -3686,6 +3539,7 @@ export const MODELS = {
3686
3539
  api: "anthropic-messages",
3687
3540
  provider: "fireworks",
3688
3541
  baseUrl: "https://api.fireworks.ai/inference",
3542
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3689
3543
  reasoning: true,
3690
3544
  input: ["text"],
3691
3545
  cost: {
@@ -3703,6 +3557,7 @@ export const MODELS = {
3703
3557
  api: "anthropic-messages",
3704
3558
  provider: "fireworks",
3705
3559
  baseUrl: "https://api.fireworks.ai/inference",
3560
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3706
3561
  reasoning: true,
3707
3562
  input: ["text"],
3708
3563
  cost: {
@@ -3720,6 +3575,7 @@ export const MODELS = {
3720
3575
  api: "anthropic-messages",
3721
3576
  provider: "fireworks",
3722
3577
  baseUrl: "https://api.fireworks.ai/inference",
3578
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3723
3579
  reasoning: true,
3724
3580
  input: ["text"],
3725
3581
  cost: {
@@ -3737,6 +3593,7 @@ export const MODELS = {
3737
3593
  api: "anthropic-messages",
3738
3594
  provider: "fireworks",
3739
3595
  baseUrl: "https://api.fireworks.ai/inference",
3596
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3740
3597
  reasoning: true,
3741
3598
  input: ["text"],
3742
3599
  cost: {
@@ -3754,6 +3611,7 @@ export const MODELS = {
3754
3611
  api: "anthropic-messages",
3755
3612
  provider: "fireworks",
3756
3613
  baseUrl: "https://api.fireworks.ai/inference",
3614
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3757
3615
  reasoning: true,
3758
3616
  input: ["text"],
3759
3617
  cost: {
@@ -3771,6 +3629,7 @@ export const MODELS = {
3771
3629
  api: "anthropic-messages",
3772
3630
  provider: "fireworks",
3773
3631
  baseUrl: "https://api.fireworks.ai/inference",
3632
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3774
3633
  reasoning: false,
3775
3634
  input: ["text"],
3776
3635
  cost: {
@@ -3788,6 +3647,7 @@ export const MODELS = {
3788
3647
  api: "anthropic-messages",
3789
3648
  provider: "fireworks",
3790
3649
  baseUrl: "https://api.fireworks.ai/inference",
3650
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3791
3651
  reasoning: true,
3792
3652
  input: ["text"],
3793
3653
  cost: {
@@ -3805,6 +3665,7 @@ export const MODELS = {
3805
3665
  api: "anthropic-messages",
3806
3666
  provider: "fireworks",
3807
3667
  baseUrl: "https://api.fireworks.ai/inference",
3668
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3808
3669
  reasoning: true,
3809
3670
  input: ["text", "image"],
3810
3671
  cost: {
@@ -3822,6 +3683,7 @@ export const MODELS = {
3822
3683
  api: "anthropic-messages",
3823
3684
  provider: "fireworks",
3824
3685
  baseUrl: "https://api.fireworks.ai/inference",
3686
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3825
3687
  reasoning: true,
3826
3688
  input: ["text", "image"],
3827
3689
  cost: {
@@ -3839,6 +3701,7 @@ export const MODELS = {
3839
3701
  api: "anthropic-messages",
3840
3702
  provider: "fireworks",
3841
3703
  baseUrl: "https://api.fireworks.ai/inference",
3704
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3842
3705
  reasoning: true,
3843
3706
  input: ["text"],
3844
3707
  cost: {
@@ -3856,6 +3719,7 @@ export const MODELS = {
3856
3719
  api: "anthropic-messages",
3857
3720
  provider: "fireworks",
3858
3721
  baseUrl: "https://api.fireworks.ai/inference",
3722
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3859
3723
  reasoning: true,
3860
3724
  input: ["text"],
3861
3725
  cost: {
@@ -3873,6 +3737,7 @@ export const MODELS = {
3873
3737
  api: "anthropic-messages",
3874
3738
  provider: "fireworks",
3875
3739
  baseUrl: "https://api.fireworks.ai/inference",
3740
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3876
3741
  reasoning: true,
3877
3742
  input: ["text"],
3878
3743
  cost: {
@@ -3890,6 +3755,7 @@ export const MODELS = {
3890
3755
  api: "anthropic-messages",
3891
3756
  provider: "fireworks",
3892
3757
  baseUrl: "https://api.fireworks.ai/inference",
3758
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3893
3759
  reasoning: true,
3894
3760
  input: ["text", "image"],
3895
3761
  cost: {
@@ -3907,6 +3773,7 @@ export const MODELS = {
3907
3773
  api: "anthropic-messages",
3908
3774
  provider: "fireworks",
3909
3775
  baseUrl: "https://api.fireworks.ai/inference",
3776
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3910
3777
  reasoning: true,
3911
3778
  input: ["text", "image"],
3912
3779
  cost: {
@@ -3995,25 +3862,6 @@ export const MODELS = {
3995
3862
  contextWindow: 144000,
3996
3863
  maxTokens: 64000,
3997
3864
  },
3998
- "claude-sonnet-4": {
3999
- id: "claude-sonnet-4",
4000
- name: "Claude Sonnet 4",
4001
- api: "anthropic-messages",
4002
- provider: "github-copilot",
4003
- baseUrl: "https://api.individual.githubcopilot.com",
4004
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4005
- compat: { "supportsEagerToolInputStreaming": false },
4006
- reasoning: true,
4007
- input: ["text", "image"],
4008
- cost: {
4009
- input: 0,
4010
- output: 0,
4011
- cacheRead: 0,
4012
- cacheWrite: 0,
4013
- },
4014
- contextWindow: 216000,
4015
- maxTokens: 16000,
4016
- },
4017
3865
  "claude-sonnet-4.5": {
4018
3866
  id: "claude-sonnet-4.5",
4019
3867
  name: "Claude Sonnet 4.5",
@@ -4089,25 +3937,6 @@ export const MODELS = {
4089
3937
  contextWindow: 128000,
4090
3938
  maxTokens: 64000,
4091
3939
  },
4092
- "gemini-3-pro-preview": {
4093
- id: "gemini-3-pro-preview",
4094
- name: "Gemini 3 Pro Preview",
4095
- api: "openai-completions",
4096
- provider: "github-copilot",
4097
- baseUrl: "https://api.individual.githubcopilot.com",
4098
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4099
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4100
- reasoning: true,
4101
- input: ["text", "image"],
4102
- cost: {
4103
- input: 0,
4104
- output: 0,
4105
- cacheRead: 0,
4106
- cacheWrite: 0,
4107
- },
4108
- contextWindow: 128000,
4109
- maxTokens: 64000,
4110
- },
4111
3940
  "gemini-3.1-pro-preview": {
4112
3941
  id: "gemini-3.1-pro-preview",
4113
3942
  name: "Gemini 3.1 Pro Preview",
@@ -4165,25 +3994,6 @@ export const MODELS = {
4165
3994
  contextWindow: 128000,
4166
3995
  maxTokens: 4096,
4167
3996
  },
4168
- "gpt-5": {
4169
- id: "gpt-5",
4170
- name: "GPT-5",
4171
- api: "openai-responses",
4172
- provider: "github-copilot",
4173
- baseUrl: "https://api.individual.githubcopilot.com",
4174
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4175
- reasoning: true,
4176
- thinkingLevelMap: { "off": null },
4177
- input: ["text", "image"],
4178
- cost: {
4179
- input: 0,
4180
- output: 0,
4181
- cacheRead: 0,
4182
- cacheWrite: 0,
4183
- },
4184
- contextWindow: 128000,
4185
- maxTokens: 128000,
4186
- },
4187
3997
  "gpt-5-mini": {
4188
3998
  id: "gpt-5-mini",
4189
3999
  name: "GPT-5-mini",
@@ -4192,7 +4002,7 @@ export const MODELS = {
4192
4002
  baseUrl: "https://api.individual.githubcopilot.com",
4193
4003
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4194
4004
  reasoning: true,
4195
- thinkingLevelMap: { "off": null },
4005
+ thinkingLevelMap: { "off": null, "minimal": "low" },
4196
4006
  input: ["text", "image"],
4197
4007
  cost: {
4198
4008
  input: 0,
@@ -4203,15 +4013,15 @@ export const MODELS = {
4203
4013
  contextWindow: 264000,
4204
4014
  maxTokens: 64000,
4205
4015
  },
4206
- "gpt-5.1": {
4207
- id: "gpt-5.1",
4208
- name: "GPT-5.1",
4016
+ "gpt-5.2": {
4017
+ id: "gpt-5.2",
4018
+ name: "GPT-5.2",
4209
4019
  api: "openai-responses",
4210
4020
  provider: "github-copilot",
4211
4021
  baseUrl: "https://api.individual.githubcopilot.com",
4212
4022
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4213
4023
  reasoning: true,
4214
- thinkingLevelMap: { "off": null },
4024
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4215
4025
  input: ["text", "image"],
4216
4026
  cost: {
4217
4027
  input: 0,
@@ -4222,15 +4032,15 @@ export const MODELS = {
4222
4032
  contextWindow: 264000,
4223
4033
  maxTokens: 64000,
4224
4034
  },
4225
- "gpt-5.1-codex": {
4226
- id: "gpt-5.1-codex",
4227
- name: "GPT-5.1-Codex",
4035
+ "gpt-5.2-codex": {
4036
+ id: "gpt-5.2-codex",
4037
+ name: "GPT-5.2-Codex",
4228
4038
  api: "openai-responses",
4229
4039
  provider: "github-copilot",
4230
4040
  baseUrl: "https://api.individual.githubcopilot.com",
4231
4041
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4232
4042
  reasoning: true,
4233
- thinkingLevelMap: { "off": null },
4043
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4234
4044
  input: ["text", "image"],
4235
4045
  cost: {
4236
4046
  input: 0,
@@ -4241,15 +4051,15 @@ export const MODELS = {
4241
4051
  contextWindow: 400000,
4242
4052
  maxTokens: 128000,
4243
4053
  },
4244
- "gpt-5.1-codex-max": {
4245
- id: "gpt-5.1-codex-max",
4246
- name: "GPT-5.1-Codex-max",
4054
+ "gpt-5.3-codex": {
4055
+ id: "gpt-5.3-codex",
4056
+ name: "GPT-5.3-Codex",
4247
4057
  api: "openai-responses",
4248
4058
  provider: "github-copilot",
4249
4059
  baseUrl: "https://api.individual.githubcopilot.com",
4250
4060
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4251
4061
  reasoning: true,
4252
- thinkingLevelMap: { "off": null },
4062
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4253
4063
  input: ["text", "image"],
4254
4064
  cost: {
4255
4065
  input: 0,
@@ -4260,15 +4070,15 @@ export const MODELS = {
4260
4070
  contextWindow: 400000,
4261
4071
  maxTokens: 128000,
4262
4072
  },
4263
- "gpt-5.1-codex-mini": {
4264
- id: "gpt-5.1-codex-mini",
4265
- name: "GPT-5.1-Codex-mini",
4073
+ "gpt-5.4": {
4074
+ id: "gpt-5.4",
4075
+ name: "GPT-5.4",
4266
4076
  api: "openai-responses",
4267
4077
  provider: "github-copilot",
4268
4078
  baseUrl: "https://api.individual.githubcopilot.com",
4269
4079
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4270
4080
  reasoning: true,
4271
- thinkingLevelMap: { "off": null },
4081
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4272
4082
  input: ["text", "image"],
4273
4083
  cost: {
4274
4084
  input: 0,
@@ -4279,15 +4089,15 @@ export const MODELS = {
4279
4089
  contextWindow: 400000,
4280
4090
  maxTokens: 128000,
4281
4091
  },
4282
- "gpt-5.2": {
4283
- id: "gpt-5.2",
4284
- name: "GPT-5.2",
4092
+ "gpt-5.4-mini": {
4093
+ id: "gpt-5.4-mini",
4094
+ name: "GPT-5.4 Mini",
4285
4095
  api: "openai-responses",
4286
4096
  provider: "github-copilot",
4287
4097
  baseUrl: "https://api.individual.githubcopilot.com",
4288
4098
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4289
4099
  reasoning: true,
4290
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
4100
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4291
4101
  input: ["text", "image"],
4292
4102
  cost: {
4293
4103
  input: 0,
@@ -4295,18 +4105,18 @@ export const MODELS = {
4295
4105
  cacheRead: 0,
4296
4106
  cacheWrite: 0,
4297
4107
  },
4298
- contextWindow: 264000,
4299
- maxTokens: 64000,
4108
+ contextWindow: 400000,
4109
+ maxTokens: 128000,
4300
4110
  },
4301
- "gpt-5.2-codex": {
4302
- id: "gpt-5.2-codex",
4303
- name: "GPT-5.2-Codex",
4111
+ "gpt-5.5": {
4112
+ id: "gpt-5.5",
4113
+ name: "GPT-5.5",
4304
4114
  api: "openai-responses",
4305
4115
  provider: "github-copilot",
4306
4116
  baseUrl: "https://api.individual.githubcopilot.com",
4307
4117
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4308
4118
  reasoning: true,
4309
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
4119
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4310
4120
  input: ["text", "image"],
4311
4121
  cost: {
4312
4122
  input: 0,
@@ -4317,92 +4127,16 @@ export const MODELS = {
4317
4127
  contextWindow: 400000,
4318
4128
  maxTokens: 128000,
4319
4129
  },
4320
- "gpt-5.3-codex": {
4321
- id: "gpt-5.3-codex",
4322
- name: "GPT-5.3-Codex",
4323
- api: "openai-responses",
4130
+ "grok-code-fast-1": {
4131
+ id: "grok-code-fast-1",
4132
+ name: "Grok Code Fast 1",
4133
+ api: "openai-completions",
4324
4134
  provider: "github-copilot",
4325
4135
  baseUrl: "https://api.individual.githubcopilot.com",
4326
4136
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4137
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4327
4138
  reasoning: true,
4328
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
4329
- input: ["text", "image"],
4330
- cost: {
4331
- input: 0,
4332
- output: 0,
4333
- cacheRead: 0,
4334
- cacheWrite: 0,
4335
- },
4336
- contextWindow: 400000,
4337
- maxTokens: 128000,
4338
- },
4339
- "gpt-5.4": {
4340
- id: "gpt-5.4",
4341
- name: "GPT-5.4",
4342
- api: "openai-responses",
4343
- provider: "github-copilot",
4344
- baseUrl: "https://api.individual.githubcopilot.com",
4345
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4346
- reasoning: true,
4347
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
4348
- input: ["text", "image"],
4349
- cost: {
4350
- input: 0,
4351
- output: 0,
4352
- cacheRead: 0,
4353
- cacheWrite: 0,
4354
- },
4355
- contextWindow: 400000,
4356
- maxTokens: 128000,
4357
- },
4358
- "gpt-5.4-mini": {
4359
- id: "gpt-5.4-mini",
4360
- name: "GPT-5.4 Mini",
4361
- api: "openai-responses",
4362
- provider: "github-copilot",
4363
- baseUrl: "https://api.individual.githubcopilot.com",
4364
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4365
- reasoning: true,
4366
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
4367
- input: ["text", "image"],
4368
- cost: {
4369
- input: 0,
4370
- output: 0,
4371
- cacheRead: 0,
4372
- cacheWrite: 0,
4373
- },
4374
- contextWindow: 400000,
4375
- maxTokens: 128000,
4376
- },
4377
- "gpt-5.5": {
4378
- id: "gpt-5.5",
4379
- name: "GPT-5.5",
4380
- api: "openai-responses",
4381
- provider: "github-copilot",
4382
- baseUrl: "https://api.individual.githubcopilot.com",
4383
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4384
- reasoning: true,
4385
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
4386
- input: ["text", "image"],
4387
- cost: {
4388
- input: 0,
4389
- output: 0,
4390
- cacheRead: 0,
4391
- cacheWrite: 0,
4392
- },
4393
- contextWindow: 400000,
4394
- maxTokens: 128000,
4395
- },
4396
- "grok-code-fast-1": {
4397
- id: "grok-code-fast-1",
4398
- name: "Grok Code Fast 1",
4399
- api: "openai-completions",
4400
- provider: "github-copilot",
4401
- baseUrl: "https://api.individual.githubcopilot.com",
4402
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4403
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4404
- reasoning: true,
4405
- input: ["text"],
4139
+ input: ["text"],
4406
4140
  cost: {
4407
4141
  input: 0,
4408
4142
  output: 0,
@@ -4527,7 +4261,7 @@ export const MODELS = {
4527
4261
  cost: {
4528
4262
  input: 0.1,
4529
4263
  output: 0.4,
4530
- cacheRead: 0.025,
4264
+ cacheRead: 0.01,
4531
4265
  cacheWrite: 0,
4532
4266
  },
4533
4267
  contextWindow: 1048576,
@@ -4705,6 +4439,24 @@ export const MODELS = {
4705
4439
  contextWindow: 1000000,
4706
4440
  maxTokens: 64000,
4707
4441
  },
4442
+ "gemini-3.1-flash-lite": {
4443
+ id: "gemini-3.1-flash-lite",
4444
+ name: "Gemini 3.1 Flash Lite",
4445
+ api: "google-generative-ai",
4446
+ provider: "google",
4447
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4448
+ reasoning: true,
4449
+ thinkingLevelMap: { "off": null },
4450
+ input: ["text", "image"],
4451
+ cost: {
4452
+ input: 0.25,
4453
+ output: 1.5,
4454
+ cacheRead: 0.025,
4455
+ cacheWrite: 0,
4456
+ },
4457
+ contextWindow: 1048576,
4458
+ maxTokens: 65536,
4459
+ },
4708
4460
  "gemini-3.1-flash-lite-preview": {
4709
4461
  id: "gemini-3.1-flash-lite-preview",
4710
4462
  name: "Gemini 3.1 Flash Lite Preview",
@@ -4718,7 +4470,7 @@ export const MODELS = {
4718
4470
  input: 0.25,
4719
4471
  output: 1.5,
4720
4472
  cacheRead: 0.025,
4721
- cacheWrite: 1,
4473
+ cacheWrite: 0,
4722
4474
  },
4723
4475
  contextWindow: 1048576,
4724
4476
  maxTokens: 65536,
@@ -6945,7 +6697,7 @@ export const MODELS = {
6945
6697
  provider: "openai",
6946
6698
  baseUrl: "https://api.openai.com/v1",
6947
6699
  reasoning: true,
6948
- thinkingLevelMap: { "off": null },
6700
+ thinkingLevelMap: { "off": "none" },
6949
6701
  input: ["text", "image"],
6950
6702
  cost: {
6951
6703
  input: 1.25,
@@ -7035,7 +6787,7 @@ export const MODELS = {
7035
6787
  provider: "openai",
7036
6788
  baseUrl: "https://api.openai.com/v1",
7037
6789
  reasoning: true,
7038
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6790
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7039
6791
  input: ["text", "image"],
7040
6792
  cost: {
7041
6793
  input: 1.75,
@@ -7125,7 +6877,7 @@ export const MODELS = {
7125
6877
  provider: "openai",
7126
6878
  baseUrl: "https://api.openai.com/v1",
7127
6879
  reasoning: true,
7128
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6880
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7129
6881
  input: ["text", "image"],
7130
6882
  cost: {
7131
6883
  input: 1.75,
@@ -7161,7 +6913,7 @@ export const MODELS = {
7161
6913
  provider: "openai",
7162
6914
  baseUrl: "https://api.openai.com/v1",
7163
6915
  reasoning: true,
7164
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6916
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7165
6917
  input: ["text", "image"],
7166
6918
  cost: {
7167
6919
  input: 2.5,
@@ -7179,7 +6931,7 @@ export const MODELS = {
7179
6931
  provider: "openai",
7180
6932
  baseUrl: "https://api.openai.com/v1",
7181
6933
  reasoning: true,
7182
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6934
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7183
6935
  input: ["text", "image"],
7184
6936
  cost: {
7185
6937
  input: 0.75,
@@ -7197,7 +6949,7 @@ export const MODELS = {
7197
6949
  provider: "openai",
7198
6950
  baseUrl: "https://api.openai.com/v1",
7199
6951
  reasoning: true,
7200
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6952
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7201
6953
  input: ["text", "image"],
7202
6954
  cost: {
7203
6955
  input: 0.2,
@@ -7233,7 +6985,7 @@ export const MODELS = {
7233
6985
  provider: "openai",
7234
6986
  baseUrl: "https://api.openai.com/v1",
7235
6987
  reasoning: true,
7236
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6988
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7237
6989
  input: ["text", "image"],
7238
6990
  cost: {
7239
6991
  input: 5,
@@ -7400,67 +7152,51 @@ export const MODELS = {
7400
7152
  },
7401
7153
  },
7402
7154
  "openai-codex": {
7403
- "gpt-5.1": {
7404
- id: "gpt-5.1",
7405
- name: "GPT-5.1",
7406
- api: "openai-codex-responses",
7407
- provider: "openai-codex",
7408
- baseUrl: "https://chatgpt.com/backend-api",
7409
- reasoning: true,
7410
- input: ["text", "image"],
7411
- cost: {
7412
- input: 1.25,
7413
- output: 10,
7414
- cacheRead: 0.125,
7415
- cacheWrite: 0,
7416
- },
7417
- contextWindow: 272000,
7418
- maxTokens: 128000,
7419
- },
7420
- "gpt-5.1-codex-max": {
7421
- id: "gpt-5.1-codex-max",
7422
- name: "GPT-5.1 Codex Max",
7155
+ "gpt-5.2": {
7156
+ id: "gpt-5.2",
7157
+ name: "GPT-5.2",
7423
7158
  api: "openai-codex-responses",
7424
7159
  provider: "openai-codex",
7425
7160
  baseUrl: "https://chatgpt.com/backend-api",
7426
7161
  reasoning: true,
7162
+ thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7427
7163
  input: ["text", "image"],
7428
7164
  cost: {
7429
- input: 1.25,
7430
- output: 10,
7431
- cacheRead: 0.125,
7165
+ input: 1.75,
7166
+ output: 14,
7167
+ cacheRead: 0.175,
7432
7168
  cacheWrite: 0,
7433
7169
  },
7434
7170
  contextWindow: 272000,
7435
7171
  maxTokens: 128000,
7436
7172
  },
7437
- "gpt-5.1-codex-mini": {
7438
- id: "gpt-5.1-codex-mini",
7439
- name: "GPT-5.1 Codex Mini",
7173
+ "gpt-5.3-codex": {
7174
+ id: "gpt-5.3-codex",
7175
+ name: "GPT-5.3 Codex",
7440
7176
  api: "openai-codex-responses",
7441
7177
  provider: "openai-codex",
7442
7178
  baseUrl: "https://chatgpt.com/backend-api",
7443
7179
  reasoning: true,
7444
- thinkingLevelMap: { "minimal": "medium", "low": "medium", "medium": "medium", "high": "high" },
7180
+ thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7445
7181
  input: ["text", "image"],
7446
7182
  cost: {
7447
- input: 0.25,
7448
- output: 2,
7449
- cacheRead: 0.025,
7183
+ input: 1.75,
7184
+ output: 14,
7185
+ cacheRead: 0.175,
7450
7186
  cacheWrite: 0,
7451
7187
  },
7452
7188
  contextWindow: 272000,
7453
7189
  maxTokens: 128000,
7454
7190
  },
7455
- "gpt-5.2": {
7456
- id: "gpt-5.2",
7457
- name: "GPT-5.2",
7191
+ "gpt-5.3-codex-spark": {
7192
+ id: "gpt-5.3-codex-spark",
7193
+ name: "GPT-5.3 Codex Spark",
7458
7194
  api: "openai-codex-responses",
7459
7195
  provider: "openai-codex",
7460
7196
  baseUrl: "https://chatgpt.com/backend-api",
7461
7197
  reasoning: true,
7462
7198
  thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7463
- input: ["text", "image"],
7199
+ input: ["text"],
7464
7200
  cost: {
7465
7201
  input: 1.75,
7466
7202
  output: 14,
@@ -7470,9 +7206,9 @@ export const MODELS = {
7470
7206
  contextWindow: 272000,
7471
7207
  maxTokens: 128000,
7472
7208
  },
7473
- "gpt-5.2-codex": {
7474
- id: "gpt-5.2-codex",
7475
- name: "GPT-5.2 Codex",
7209
+ "gpt-5.4": {
7210
+ id: "gpt-5.4",
7211
+ name: "GPT-5.4",
7476
7212
  api: "openai-codex-responses",
7477
7213
  provider: "openai-codex",
7478
7214
  baseUrl: "https://chatgpt.com/backend-api",
@@ -7480,17 +7216,17 @@ export const MODELS = {
7480
7216
  thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7481
7217
  input: ["text", "image"],
7482
7218
  cost: {
7483
- input: 1.75,
7484
- output: 14,
7485
- cacheRead: 0.175,
7219
+ input: 2.5,
7220
+ output: 15,
7221
+ cacheRead: 0.25,
7486
7222
  cacheWrite: 0,
7487
7223
  },
7488
7224
  contextWindow: 272000,
7489
7225
  maxTokens: 128000,
7490
7226
  },
7491
- "gpt-5.3-codex": {
7492
- id: "gpt-5.3-codex",
7493
- name: "GPT-5.3 Codex",
7227
+ "gpt-5.4-fast": {
7228
+ id: "gpt-5.4-fast",
7229
+ name: "GPT-5.4 Fast",
7494
7230
  api: "openai-codex-responses",
7495
7231
  provider: "openai-codex",
7496
7232
  baseUrl: "https://chatgpt.com/backend-api",
@@ -7498,35 +7234,35 @@ export const MODELS = {
7498
7234
  thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7499
7235
  input: ["text", "image"],
7500
7236
  cost: {
7501
- input: 1.75,
7502
- output: 14,
7503
- cacheRead: 0.175,
7237
+ input: 5,
7238
+ output: 30,
7239
+ cacheRead: 0.5,
7504
7240
  cacheWrite: 0,
7505
7241
  },
7506
7242
  contextWindow: 272000,
7507
7243
  maxTokens: 128000,
7508
7244
  },
7509
- "gpt-5.3-codex-spark": {
7510
- id: "gpt-5.3-codex-spark",
7511
- name: "GPT-5.3 Codex Spark",
7245
+ "gpt-5.4-mini": {
7246
+ id: "gpt-5.4-mini",
7247
+ name: "GPT-5.4 mini",
7512
7248
  api: "openai-codex-responses",
7513
7249
  provider: "openai-codex",
7514
7250
  baseUrl: "https://chatgpt.com/backend-api",
7515
7251
  reasoning: true,
7516
7252
  thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7517
- input: ["text"],
7253
+ input: ["text", "image"],
7518
7254
  cost: {
7519
- input: 0,
7520
- output: 0,
7521
- cacheRead: 0,
7255
+ input: 0.75,
7256
+ output: 4.5,
7257
+ cacheRead: 0.075,
7522
7258
  cacheWrite: 0,
7523
7259
  },
7524
- contextWindow: 128000,
7260
+ contextWindow: 272000,
7525
7261
  maxTokens: 128000,
7526
7262
  },
7527
- "gpt-5.4": {
7528
- id: "gpt-5.4",
7529
- name: "GPT-5.4",
7263
+ "gpt-5.4-mini-fast": {
7264
+ id: "gpt-5.4-mini-fast",
7265
+ name: "GPT-5.4 mini Fast",
7530
7266
  api: "openai-codex-responses",
7531
7267
  provider: "openai-codex",
7532
7268
  baseUrl: "https://chatgpt.com/backend-api",
@@ -7534,17 +7270,17 @@ export const MODELS = {
7534
7270
  thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7535
7271
  input: ["text", "image"],
7536
7272
  cost: {
7537
- input: 2.5,
7538
- output: 15,
7539
- cacheRead: 0.25,
7273
+ input: 1.5,
7274
+ output: 9,
7275
+ cacheRead: 0.15,
7540
7276
  cacheWrite: 0,
7541
7277
  },
7542
7278
  contextWindow: 272000,
7543
7279
  maxTokens: 128000,
7544
7280
  },
7545
- "gpt-5.4-mini": {
7546
- id: "gpt-5.4-mini",
7547
- name: "GPT-5.4 Mini",
7281
+ "gpt-5.5": {
7282
+ id: "gpt-5.5",
7283
+ name: "GPT-5.5",
7548
7284
  api: "openai-codex-responses",
7549
7285
  provider: "openai-codex",
7550
7286
  baseUrl: "https://chatgpt.com/backend-api",
@@ -7552,17 +7288,17 @@ export const MODELS = {
7552
7288
  thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7553
7289
  input: ["text", "image"],
7554
7290
  cost: {
7555
- input: 0.75,
7556
- output: 4.5,
7557
- cacheRead: 0.075,
7291
+ input: 5,
7292
+ output: 30,
7293
+ cacheRead: 0.5,
7558
7294
  cacheWrite: 0,
7559
7295
  },
7560
7296
  contextWindow: 272000,
7561
7297
  maxTokens: 128000,
7562
7298
  },
7563
- "gpt-5.5": {
7564
- id: "gpt-5.5",
7565
- name: "GPT-5.5",
7299
+ "gpt-5.5-fast": {
7300
+ id: "gpt-5.5-fast",
7301
+ name: "GPT-5.5 Fast",
7566
7302
  api: "openai-codex-responses",
7567
7303
  provider: "openai-codex",
7568
7304
  baseUrl: "https://chatgpt.com/backend-api",
@@ -7570,9 +7306,9 @@ export const MODELS = {
7570
7306
  thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7571
7307
  input: ["text", "image"],
7572
7308
  cost: {
7573
- input: 5,
7574
- output: 30,
7575
- cacheRead: 0.5,
7309
+ input: 12.5,
7310
+ output: 75,
7311
+ cacheRead: 1.25,
7576
7312
  cacheWrite: 0,
7577
7313
  },
7578
7314
  contextWindow: 272000,
@@ -7735,6 +7471,25 @@ export const MODELS = {
7735
7471
  contextWindow: 1000000,
7736
7472
  maxTokens: 64000,
7737
7473
  },
7474
+ "deepseek-v4-flash-free": {
7475
+ id: "deepseek-v4-flash-free",
7476
+ name: "DeepSeek V4 Flash Free",
7477
+ api: "openai-completions",
7478
+ provider: "opencode",
7479
+ baseUrl: "https://opencode.ai/zen/v1",
7480
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7481
+ reasoning: true,
7482
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7483
+ input: ["text"],
7484
+ cost: {
7485
+ input: 0,
7486
+ output: 0,
7487
+ cacheRead: 0,
7488
+ cacheWrite: 0,
7489
+ },
7490
+ contextWindow: 200000,
7491
+ maxTokens: 128000,
7492
+ },
7738
7493
  "gemini-3-flash": {
7739
7494
  id: "gemini-3-flash",
7740
7495
  name: "Gemini 3 Flash",
@@ -8093,23 +7848,6 @@ export const MODELS = {
8093
7848
  contextWindow: 1050000,
8094
7849
  maxTokens: 128000,
8095
7850
  },
8096
- "hy3-preview-free": {
8097
- id: "hy3-preview-free",
8098
- name: "Hy3 preview Free",
8099
- api: "openai-completions",
8100
- provider: "opencode",
8101
- baseUrl: "https://opencode.ai/zen/v1",
8102
- reasoning: true,
8103
- input: ["text"],
8104
- cost: {
8105
- input: 0,
8106
- output: 0,
8107
- cacheRead: 0,
8108
- cacheWrite: 0,
8109
- },
8110
- contextWindow: 256000,
8111
- maxTokens: 64000,
8112
- },
8113
7851
  "kimi-k2.5": {
8114
7852
  id: "kimi-k2.5",
8115
7853
  name: "Kimi K2.5",
@@ -8246,17 +7984,34 @@ export const MODELS = {
8246
7984
  contextWindow: 262144,
8247
7985
  maxTokens: 65536,
8248
7986
  },
8249
- },
8250
- "opencode-go": {
8251
- "deepseek-v4-flash": {
8252
- id: "deepseek-v4-flash",
8253
- name: "DeepSeek V4 Flash",
8254
- api: "openai-completions",
8255
- provider: "opencode-go",
8256
- baseUrl: "https://opencode.ai/zen/go/v1",
8257
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8258
- reasoning: true,
8259
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7987
+ "qwen3.6-plus-free": {
7988
+ id: "qwen3.6-plus-free",
7989
+ name: "Qwen3.6 Plus Free",
7990
+ api: "anthropic-messages",
7991
+ provider: "opencode",
7992
+ baseUrl: "https://opencode.ai/zen",
7993
+ reasoning: true,
7994
+ input: ["text", "image"],
7995
+ cost: {
7996
+ input: 0,
7997
+ output: 0,
7998
+ cacheRead: 0,
7999
+ cacheWrite: 0,
8000
+ },
8001
+ contextWindow: 262144,
8002
+ maxTokens: 65536,
8003
+ },
8004
+ },
8005
+ "opencode-go": {
8006
+ "deepseek-v4-flash": {
8007
+ id: "deepseek-v4-flash",
8008
+ name: "DeepSeek V4 Flash",
8009
+ api: "openai-completions",
8010
+ provider: "opencode-go",
8011
+ baseUrl: "https://opencode.ai/zen/go/v1",
8012
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8013
+ reasoning: true,
8014
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8260
8015
  input: ["text"],
8261
8016
  cost: {
8262
8017
  input: 0.14,
@@ -8391,9 +8146,9 @@ export const MODELS = {
8391
8146
  "minimax-m2.5": {
8392
8147
  id: "minimax-m2.5",
8393
8148
  name: "MiniMax M2.5",
8394
- api: "openai-completions",
8149
+ api: "anthropic-messages",
8395
8150
  provider: "opencode-go",
8396
- baseUrl: "https://opencode.ai/zen/go/v1",
8151
+ baseUrl: "https://opencode.ai/zen/go",
8397
8152
  reasoning: true,
8398
8153
  input: ["text"],
8399
8154
  cost: {
@@ -8613,40 +8368,6 @@ export const MODELS = {
8613
8368
  contextWindow: 200000,
8614
8369
  maxTokens: 8192,
8615
8370
  },
8616
- "anthropic/claude-3.7-sonnet": {
8617
- id: "anthropic/claude-3.7-sonnet",
8618
- name: "Anthropic: Claude 3.7 Sonnet",
8619
- api: "openai-completions",
8620
- provider: "openrouter",
8621
- baseUrl: "https://openrouter.ai/api/v1",
8622
- reasoning: true,
8623
- input: ["text", "image"],
8624
- cost: {
8625
- input: 3,
8626
- output: 15,
8627
- cacheRead: 0.3,
8628
- cacheWrite: 3.75,
8629
- },
8630
- contextWindow: 200000,
8631
- maxTokens: 64000,
8632
- },
8633
- "anthropic/claude-3.7-sonnet:thinking": {
8634
- id: "anthropic/claude-3.7-sonnet:thinking",
8635
- name: "Anthropic: Claude 3.7 Sonnet (thinking)",
8636
- api: "openai-completions",
8637
- provider: "openrouter",
8638
- baseUrl: "https://openrouter.ai/api/v1",
8639
- reasoning: true,
8640
- input: ["text", "image"],
8641
- cost: {
8642
- input: 3,
8643
- output: 15,
8644
- cacheRead: 0.3,
8645
- cacheWrite: 3.75,
8646
- },
8647
- contextWindow: 200000,
8648
- maxTokens: 64000,
8649
- },
8650
8371
  "anthropic/claude-haiku-4.5": {
8651
8372
  id: "anthropic/claude-haiku-4.5",
8652
8373
  name: "Anthropic: Claude Haiku 4.5",
@@ -8769,6 +8490,24 @@ export const MODELS = {
8769
8490
  contextWindow: 1000000,
8770
8491
  maxTokens: 128000,
8771
8492
  },
8493
+ "anthropic/claude-opus-4.7-fast": {
8494
+ id: "anthropic/claude-opus-4.7-fast",
8495
+ name: "Anthropic: Claude Opus 4.7 (Fast)",
8496
+ api: "openai-completions",
8497
+ provider: "openrouter",
8498
+ baseUrl: "https://openrouter.ai/api/v1",
8499
+ reasoning: true,
8500
+ thinkingLevelMap: { "xhigh": "xhigh" },
8501
+ input: ["text", "image"],
8502
+ cost: {
8503
+ input: 30,
8504
+ output: 150,
8505
+ cacheRead: 3,
8506
+ cacheWrite: 37.5,
8507
+ },
8508
+ contextWindow: 1000000,
8509
+ maxTokens: 128000,
8510
+ },
8772
8511
  "anthropic/claude-sonnet-4": {
8773
8512
  id: "anthropic/claude-sonnet-4",
8774
8513
  name: "Anthropic: Claude Sonnet 4",
@@ -8854,6 +8593,23 @@ export const MODELS = {
8854
8593
  contextWindow: 262144,
8855
8594
  maxTokens: 262144,
8856
8595
  },
8596
+ "arcee-ai/trinity-large-thinking:free": {
8597
+ id: "arcee-ai/trinity-large-thinking:free",
8598
+ name: "Arcee AI: Trinity Large Thinking (free)",
8599
+ api: "openai-completions",
8600
+ provider: "openrouter",
8601
+ baseUrl: "https://openrouter.ai/api/v1",
8602
+ reasoning: true,
8603
+ input: ["text"],
8604
+ cost: {
8605
+ input: 0,
8606
+ output: 0,
8607
+ cacheRead: 0,
8608
+ cacheWrite: 0,
8609
+ },
8610
+ contextWindow: 262144,
8611
+ maxTokens: 80000,
8612
+ },
8857
8613
  "arcee-ai/trinity-mini": {
8858
8614
  id: "arcee-ai/trinity-mini",
8859
8615
  name: "Arcee AI: Trinity Mini",
@@ -8936,7 +8692,7 @@ export const MODELS = {
8936
8692
  cacheRead: 0,
8937
8693
  cacheWrite: 0,
8938
8694
  },
8939
- contextWindow: 120000,
8695
+ contextWindow: 131072,
8940
8696
  maxTokens: 8000,
8941
8697
  },
8942
8698
  "baidu/ernie-4.5-vl-28b-a3b": {
@@ -8953,7 +8709,7 @@ export const MODELS = {
8953
8709
  cacheRead: 0,
8954
8710
  cacheWrite: 0,
8955
8711
  },
8956
- contextWindow: 30000,
8712
+ contextWindow: 131072,
8957
8713
  maxTokens: 8000,
8958
8714
  },
8959
8715
  "bytedance-seed/seed-1.6": {
@@ -9101,13 +8857,13 @@ export const MODELS = {
9101
8857
  reasoning: true,
9102
8858
  input: ["text"],
9103
8859
  cost: {
9104
- input: 0.15,
9105
- output: 0.75,
9106
- cacheRead: 0,
8860
+ input: 0.21,
8861
+ output: 0.7899999999999999,
8862
+ cacheRead: 0.13,
9107
8863
  cacheWrite: 0,
9108
8864
  },
9109
- contextWindow: 32768,
9110
- maxTokens: 7168,
8865
+ contextWindow: 163840,
8866
+ maxTokens: 32768,
9111
8867
  },
9112
8868
  "deepseek/deepseek-r1": {
9113
8869
  id: "deepseek/deepseek-r1",
@@ -9123,7 +8879,7 @@ export const MODELS = {
9123
8879
  cacheRead: 0,
9124
8880
  cacheWrite: 0,
9125
8881
  },
9126
- contextWindow: 64000,
8882
+ contextWindow: 163840,
9127
8883
  maxTokens: 16000,
9128
8884
  },
9129
8885
  "deepseek/deepseek-r1-0528": {
@@ -9205,9 +8961,28 @@ export const MODELS = {
9205
8961
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
9206
8962
  input: ["text"],
9207
8963
  cost: {
9208
- input: 0.14,
9209
- output: 0.28,
9210
- cacheRead: 0.0028,
8964
+ input: 0.112,
8965
+ output: 0.224,
8966
+ cacheRead: 0.022,
8967
+ cacheWrite: 0,
8968
+ },
8969
+ contextWindow: 1048576,
8970
+ maxTokens: 4096,
8971
+ },
8972
+ "deepseek/deepseek-v4-flash:free": {
8973
+ id: "deepseek/deepseek-v4-flash:free",
8974
+ name: "DeepSeek: DeepSeek V4 Flash (free)",
8975
+ api: "openai-completions",
8976
+ provider: "openrouter",
8977
+ baseUrl: "https://openrouter.ai/api/v1",
8978
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8979
+ reasoning: true,
8980
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8981
+ input: ["text"],
8982
+ cost: {
8983
+ input: 0,
8984
+ output: 0,
8985
+ cacheRead: 0,
9211
8986
  cacheWrite: 0,
9212
8987
  },
9213
8988
  contextWindow: 1048576,
@@ -9402,6 +9177,23 @@ export const MODELS = {
9402
9177
  contextWindow: 1048576,
9403
9178
  maxTokens: 65536,
9404
9179
  },
9180
+ "google/gemini-3.1-flash-lite": {
9181
+ id: "google/gemini-3.1-flash-lite",
9182
+ name: "Google: Gemini 3.1 Flash Lite",
9183
+ api: "openai-completions",
9184
+ provider: "openrouter",
9185
+ baseUrl: "https://openrouter.ai/api/v1",
9186
+ reasoning: true,
9187
+ input: ["text", "image"],
9188
+ cost: {
9189
+ input: 0.25,
9190
+ output: 1.5,
9191
+ cacheRead: 0.024999999999999998,
9192
+ cacheWrite: 0.08333333333333334,
9193
+ },
9194
+ contextWindow: 1048576,
9195
+ maxTokens: 65536,
9196
+ },
9405
9197
  "google/gemini-3.1-flash-lite-preview": {
9406
9198
  id: "google/gemini-3.1-flash-lite-preview",
9407
9199
  name: "Google: Gemini 3.1 Flash Lite Preview",
@@ -9450,7 +9242,7 @@ export const MODELS = {
9450
9242
  cacheRead: 0.19999999999999998,
9451
9243
  cacheWrite: 0.375,
9452
9244
  },
9453
- contextWindow: 1048576,
9245
+ contextWindow: 1048756,
9454
9246
  maxTokens: 65536,
9455
9247
  },
9456
9248
  "google/gemma-3-12b-it": {
@@ -9530,8 +9322,8 @@ export const MODELS = {
9530
9322
  reasoning: true,
9531
9323
  input: ["text", "image"],
9532
9324
  cost: {
9533
- input: 0.13,
9534
- output: 0.38,
9325
+ input: 0.12,
9326
+ output: 0.37,
9535
9327
  cacheRead: 0,
9536
9328
  cacheWrite: 0,
9537
9329
  },
@@ -9579,6 +9371,7 @@ export const MODELS = {
9579
9371
  provider: "openrouter",
9580
9372
  baseUrl: "https://openrouter.ai/api/v1",
9581
9373
  reasoning: true,
9374
+ thinkingLevelMap: { "off": null },
9582
9375
  input: ["text"],
9583
9376
  cost: {
9584
9377
  input: 0.25,
@@ -9615,14 +9408,31 @@ export const MODELS = {
9615
9408
  reasoning: false,
9616
9409
  input: ["text"],
9617
9410
  cost: {
9618
- input: 0.08,
9619
- output: 0.24,
9620
- cacheRead: 0.016,
9411
+ input: 0.01,
9412
+ output: 0.03,
9413
+ cacheRead: 0.002,
9621
9414
  cacheWrite: 0,
9622
9415
  },
9623
9416
  contextWindow: 262144,
9624
9417
  maxTokens: 32768,
9625
9418
  },
9419
+ "inclusionai/ring-2.6-1t": {
9420
+ id: "inclusionai/ring-2.6-1t",
9421
+ name: "inclusionAI: Ring-2.6-1T",
9422
+ api: "openai-completions",
9423
+ provider: "openrouter",
9424
+ baseUrl: "https://openrouter.ai/api/v1",
9425
+ reasoning: true,
9426
+ input: ["text"],
9427
+ cost: {
9428
+ input: 0.075,
9429
+ output: 0.625,
9430
+ cacheRead: 0.015,
9431
+ cacheWrite: 0,
9432
+ },
9433
+ contextWindow: 262144,
9434
+ maxTokens: 65536,
9435
+ },
9626
9436
  "kwaipilot/kat-coder-pro-v2": {
9627
9437
  id: "kwaipilot/kat-coder-pro-v2",
9628
9438
  name: "Kwaipilot: KAT-Coder-Pro V2",
@@ -9671,7 +9481,7 @@ export const MODELS = {
9671
9481
  cacheRead: 0,
9672
9482
  cacheWrite: 0,
9673
9483
  },
9674
- contextWindow: 16384,
9484
+ contextWindow: 131072,
9675
9485
  maxTokens: 16384,
9676
9486
  },
9677
9487
  "meta-llama/llama-3.3-70b-instruct": {
@@ -9705,7 +9515,7 @@ export const MODELS = {
9705
9515
  cacheRead: 0,
9706
9516
  cacheWrite: 0,
9707
9517
  },
9708
- contextWindow: 65536,
9518
+ contextWindow: 131072,
9709
9519
  maxTokens: 4096,
9710
9520
  },
9711
9521
  "meta-llama/llama-4-scout": {
@@ -9722,7 +9532,7 @@ export const MODELS = {
9722
9532
  cacheRead: 0,
9723
9533
  cacheWrite: 0,
9724
9534
  },
9725
- contextWindow: 327680,
9535
+ contextWindow: 10000000,
9726
9536
  maxTokens: 16384,
9727
9537
  },
9728
9538
  "minimax/minimax-m1": {
@@ -9756,7 +9566,7 @@ export const MODELS = {
9756
9566
  cacheRead: 0.03,
9757
9567
  cacheWrite: 0,
9758
9568
  },
9759
- contextWindow: 196608,
9569
+ contextWindow: 204800,
9760
9570
  maxTokens: 196608,
9761
9571
  },
9762
9572
  "minimax/minimax-m2.1": {
@@ -9773,7 +9583,7 @@ export const MODELS = {
9773
9583
  cacheRead: 0.03,
9774
9584
  cacheWrite: 0,
9775
9585
  },
9776
- contextWindow: 196608,
9586
+ contextWindow: 204800,
9777
9587
  maxTokens: 196608,
9778
9588
  },
9779
9589
  "minimax/minimax-m2.5": {
@@ -9787,11 +9597,11 @@ export const MODELS = {
9787
9597
  cost: {
9788
9598
  input: 0.15,
9789
9599
  output: 1.15,
9790
- cacheRead: 0.03,
9600
+ cacheRead: 0,
9791
9601
  cacheWrite: 0,
9792
9602
  },
9793
- contextWindow: 196608,
9794
- maxTokens: 131072,
9603
+ contextWindow: 204800,
9604
+ maxTokens: 196608,
9795
9605
  },
9796
9606
  "minimax/minimax-m2.5:free": {
9797
9607
  id: "minimax/minimax-m2.5:free",
@@ -9807,7 +9617,7 @@ export const MODELS = {
9807
9617
  cacheRead: 0,
9808
9618
  cacheWrite: 0,
9809
9619
  },
9810
- contextWindow: 196608,
9620
+ contextWindow: 204800,
9811
9621
  maxTokens: 8192,
9812
9622
  },
9813
9623
  "minimax/minimax-m2.7": {
@@ -9819,13 +9629,13 @@ export const MODELS = {
9819
9629
  reasoning: true,
9820
9630
  input: ["text"],
9821
9631
  cost: {
9822
- input: 0.3,
9632
+ input: 0.27899999999999997,
9823
9633
  output: 1.2,
9824
- cacheRead: 0.059,
9634
+ cacheRead: 0,
9825
9635
  cacheWrite: 0,
9826
9636
  },
9827
- contextWindow: 196608,
9828
- maxTokens: 4096,
9637
+ contextWindow: 204800,
9638
+ maxTokens: 131072,
9829
9639
  },
9830
9640
  "mistralai/codestral-2508": {
9831
9641
  id: "mistralai/codestral-2508",
@@ -10150,23 +9960,6 @@ export const MODELS = {
10150
9960
  contextWindow: 65536,
10151
9961
  maxTokens: 4096,
10152
9962
  },
10153
- "mistralai/mixtral-8x7b-instruct": {
10154
- id: "mistralai/mixtral-8x7b-instruct",
10155
- name: "Mistral: Mixtral 8x7B Instruct",
10156
- api: "openai-completions",
10157
- provider: "openrouter",
10158
- baseUrl: "https://openrouter.ai/api/v1",
10159
- reasoning: false,
10160
- input: ["text"],
10161
- cost: {
10162
- input: 0.54,
10163
- output: 0.54,
10164
- cacheRead: 0,
10165
- cacheWrite: 0,
10166
- },
10167
- contextWindow: 32768,
10168
- maxTokens: 16384,
10169
- },
10170
9963
  "mistralai/pixtral-large-2411": {
10171
9964
  id: "mistralai/pixtral-large-2411",
10172
9965
  name: "Mistral: Pixtral Large 2411",
@@ -10227,8 +10020,8 @@ export const MODELS = {
10227
10020
  reasoning: false,
10228
10021
  input: ["text"],
10229
10022
  cost: {
10230
- input: 0.39999999999999997,
10231
- output: 2,
10023
+ input: 0.6,
10024
+ output: 2.5,
10232
10025
  cacheRead: 0,
10233
10026
  cacheWrite: 0,
10234
10027
  },
@@ -10246,7 +10039,7 @@ export const MODELS = {
10246
10039
  cost: {
10247
10040
  input: 0.6,
10248
10041
  output: 2.5,
10249
- cacheRead: 0.15,
10042
+ cacheRead: 0,
10250
10043
  cacheWrite: 0,
10251
10044
  },
10252
10045
  contextWindow: 262144,
@@ -10278,13 +10071,13 @@ export const MODELS = {
10278
10071
  reasoning: true,
10279
10072
  input: ["text", "image"],
10280
10073
  cost: {
10281
- input: 0.75,
10282
- output: 3.5,
10283
- cacheRead: 0.15,
10074
+ input: 0.73,
10075
+ output: 3.49,
10076
+ cacheRead: 0.25,
10284
10077
  cacheWrite: 0,
10285
10078
  },
10286
10079
  contextWindow: 262144,
10287
- maxTokens: 16384,
10080
+ maxTokens: 262142,
10288
10081
  },
10289
10082
  "nex-agi/deepseek-v3.1-nex-n1": {
10290
10083
  id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -10303,23 +10096,6 @@ export const MODELS = {
10303
10096
  contextWindow: 131072,
10304
10097
  maxTokens: 163840,
10305
10098
  },
10306
- "nvidia/llama-3.1-nemotron-70b-instruct": {
10307
- id: "nvidia/llama-3.1-nemotron-70b-instruct",
10308
- name: "NVIDIA: Llama 3.1 Nemotron 70B Instruct",
10309
- api: "openai-completions",
10310
- provider: "openrouter",
10311
- baseUrl: "https://openrouter.ai/api/v1",
10312
- reasoning: false,
10313
- input: ["text"],
10314
- cost: {
10315
- input: 1.2,
10316
- output: 1.2,
10317
- cacheRead: 0,
10318
- cacheWrite: 0,
10319
- },
10320
- contextWindow: 131072,
10321
- maxTokens: 16384,
10322
- },
10323
10099
  "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
10324
10100
  id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
10325
10101
  name: "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5",
@@ -10402,7 +10178,7 @@ export const MODELS = {
10402
10178
  cacheRead: 0,
10403
10179
  cacheWrite: 0,
10404
10180
  },
10405
- contextWindow: 262144,
10181
+ contextWindow: 1000000,
10406
10182
  maxTokens: 4096,
10407
10183
  },
10408
10184
  "nvidia/nemotron-3-super-120b-a12b:free": {
@@ -10419,7 +10195,7 @@ export const MODELS = {
10419
10195
  cacheRead: 0,
10420
10196
  cacheWrite: 0,
10421
10197
  },
10422
- contextWindow: 262144,
10198
+ contextWindow: 1000000,
10423
10199
  maxTokens: 262144,
10424
10200
  },
10425
10201
  "nvidia/nemotron-nano-12b-v2-vl:free": {
@@ -11570,7 +11346,7 @@ export const MODELS = {
11570
11346
  cacheRead: 0,
11571
11347
  cacheWrite: 0,
11572
11348
  },
11573
- contextWindow: 32768,
11349
+ contextWindow: 131072,
11574
11350
  maxTokens: 16384,
11575
11351
  },
11576
11352
  "qwen/qwen-2.5-7b-instruct": {
@@ -11587,26 +11363,9 @@ export const MODELS = {
11587
11363
  cacheRead: 0,
11588
11364
  cacheWrite: 0,
11589
11365
  },
11590
- contextWindow: 32768,
11366
+ contextWindow: 131072,
11591
11367
  maxTokens: 32768,
11592
11368
  },
11593
- "qwen/qwen-max": {
11594
- id: "qwen/qwen-max",
11595
- name: "Qwen: Qwen-Max ",
11596
- api: "openai-completions",
11597
- provider: "openrouter",
11598
- baseUrl: "https://openrouter.ai/api/v1",
11599
- reasoning: false,
11600
- input: ["text"],
11601
- cost: {
11602
- input: 1.04,
11603
- output: 4.16,
11604
- cacheRead: 0.20800000000000002,
11605
- cacheWrite: 0,
11606
- },
11607
- contextWindow: 32768,
11608
- maxTokens: 8192,
11609
- },
11610
11369
  "qwen/qwen-plus": {
11611
11370
  id: "qwen/qwen-plus",
11612
11371
  name: "Qwen: Qwen-Plus",
@@ -11658,40 +11417,6 @@ export const MODELS = {
11658
11417
  contextWindow: 1000000,
11659
11418
  maxTokens: 32768,
11660
11419
  },
11661
- "qwen/qwen-turbo": {
11662
- id: "qwen/qwen-turbo",
11663
- name: "Qwen: Qwen-Turbo",
11664
- api: "openai-completions",
11665
- provider: "openrouter",
11666
- baseUrl: "https://openrouter.ai/api/v1",
11667
- reasoning: false,
11668
- input: ["text"],
11669
- cost: {
11670
- input: 0.0325,
11671
- output: 0.13,
11672
- cacheRead: 0.006500000000000001,
11673
- cacheWrite: 0,
11674
- },
11675
- contextWindow: 131072,
11676
- maxTokens: 8192,
11677
- },
11678
- "qwen/qwen-vl-max": {
11679
- id: "qwen/qwen-vl-max",
11680
- name: "Qwen: Qwen VL Max",
11681
- api: "openai-completions",
11682
- provider: "openrouter",
11683
- baseUrl: "https://openrouter.ai/api/v1",
11684
- reasoning: false,
11685
- input: ["text", "image"],
11686
- cost: {
11687
- input: 0.52,
11688
- output: 2.08,
11689
- cacheRead: 0,
11690
- cacheWrite: 0,
11691
- },
11692
- contextWindow: 131072,
11693
- maxTokens: 32768,
11694
- },
11695
11420
  "qwen/qwen3-14b": {
11696
11421
  id: "qwen/qwen3-14b",
11697
11422
  name: "Qwen: Qwen3 14B",
@@ -11701,12 +11426,12 @@ export const MODELS = {
11701
11426
  reasoning: true,
11702
11427
  input: ["text"],
11703
11428
  cost: {
11704
- input: 0.06,
11429
+ input: 0.09999999999999999,
11705
11430
  output: 0.24,
11706
11431
  cacheRead: 0,
11707
11432
  cacheWrite: 0,
11708
11433
  },
11709
- contextWindow: 40960,
11434
+ contextWindow: 131702,
11710
11435
  maxTokens: 40960,
11711
11436
  },
11712
11437
  "qwen/qwen3-235b-a22b": {
@@ -11757,7 +11482,7 @@ export const MODELS = {
11757
11482
  cacheRead: 0,
11758
11483
  cacheWrite: 0,
11759
11484
  },
11760
- contextWindow: 131072,
11485
+ contextWindow: 262144,
11761
11486
  maxTokens: 4096,
11762
11487
  },
11763
11488
  "qwen/qwen3-30b-a3b": {
@@ -11774,7 +11499,7 @@ export const MODELS = {
11774
11499
  cacheRead: 0,
11775
11500
  cacheWrite: 0,
11776
11501
  },
11777
- contextWindow: 40960,
11502
+ contextWindow: 131072,
11778
11503
  maxTokens: 20000,
11779
11504
  },
11780
11505
  "qwen/qwen3-30b-a3b-instruct-2507": {
@@ -11821,12 +11546,12 @@ export const MODELS = {
11821
11546
  input: ["text"],
11822
11547
  cost: {
11823
11548
  input: 0.08,
11824
- output: 0.24,
11825
- cacheRead: 0.04,
11549
+ output: 0.28,
11550
+ cacheRead: 0,
11826
11551
  cacheWrite: 0,
11827
11552
  },
11828
- contextWindow: 40960,
11829
- maxTokens: 40960,
11553
+ contextWindow: 131072,
11554
+ maxTokens: 16384,
11830
11555
  },
11831
11556
  "qwen/qwen3-8b": {
11832
11557
  id: "qwen/qwen3-8b",
@@ -11842,7 +11567,7 @@ export const MODELS = {
11842
11567
  cacheRead: 0.049999999999999996,
11843
11568
  cacheWrite: 0,
11844
11569
  },
11845
- contextWindow: 40960,
11570
+ contextWindow: 131072,
11846
11571
  maxTokens: 8192,
11847
11572
  },
11848
11573
  "qwen/qwen3-coder": {
@@ -11859,7 +11584,7 @@ export const MODELS = {
11859
11584
  cacheRead: 0,
11860
11585
  cacheWrite: 0,
11861
11586
  },
11862
- contextWindow: 262144,
11587
+ contextWindow: 1048576,
11863
11588
  maxTokens: 65536,
11864
11589
  },
11865
11590
  "qwen/qwen3-coder-30b-a3b-instruct": {
@@ -11944,7 +11669,7 @@ export const MODELS = {
11944
11669
  cacheRead: 0,
11945
11670
  cacheWrite: 0,
11946
11671
  },
11947
- contextWindow: 262000,
11672
+ contextWindow: 1048576,
11948
11673
  maxTokens: 262000,
11949
11674
  },
11950
11675
  "qwen/qwen3-max": {
@@ -12029,7 +11754,7 @@ export const MODELS = {
12029
11754
  cacheRead: 0,
12030
11755
  cacheWrite: 0,
12031
11756
  },
12032
- contextWindow: 131072,
11757
+ contextWindow: 262144,
12033
11758
  maxTokens: 32768,
12034
11759
  },
12035
11760
  "qwen/qwen3-vl-235b-a22b-instruct": {
@@ -12080,7 +11805,7 @@ export const MODELS = {
12080
11805
  cacheRead: 0,
12081
11806
  cacheWrite: 0,
12082
11807
  },
12083
- contextWindow: 131072,
11808
+ contextWindow: 262144,
12084
11809
  maxTokens: 32768,
12085
11810
  },
12086
11811
  "qwen/qwen3-vl-30b-a3b-thinking": {
@@ -12114,7 +11839,7 @@ export const MODELS = {
12114
11839
  cacheRead: 0,
12115
11840
  cacheWrite: 0,
12116
11841
  },
12117
- contextWindow: 131072,
11842
+ contextWindow: 262144,
12118
11843
  maxTokens: 32768,
12119
11844
  },
12120
11845
  "qwen/qwen3-vl-8b-instruct": {
@@ -12131,7 +11856,7 @@ export const MODELS = {
12131
11856
  cacheRead: 0,
12132
11857
  cacheWrite: 0,
12133
11858
  },
12134
- contextWindow: 131072,
11859
+ contextWindow: 256000,
12135
11860
  maxTokens: 32768,
12136
11861
  },
12137
11862
  "qwen/qwen3-vl-8b-thinking": {
@@ -12148,7 +11873,7 @@ export const MODELS = {
12148
11873
  cacheRead: 0,
12149
11874
  cacheWrite: 0,
12150
11875
  },
12151
- contextWindow: 131072,
11876
+ contextWindow: 256000,
12152
11877
  maxTokens: 32768,
12153
11878
  },
12154
11879
  "qwen/qwen3.5-122b-a10b": {
@@ -12279,8 +12004,8 @@ export const MODELS = {
12279
12004
  reasoning: true,
12280
12005
  input: ["text", "image"],
12281
12006
  cost: {
12282
- input: 0.39999999999999997,
12283
- output: 2.4,
12007
+ input: 0.3,
12008
+ output: 1.7999999999999998,
12284
12009
  cacheRead: 0,
12285
12010
  cacheWrite: 0,
12286
12011
  },
@@ -12330,10 +12055,10 @@ export const MODELS = {
12330
12055
  reasoning: true,
12331
12056
  input: ["text", "image"],
12332
12057
  cost: {
12333
- input: 0.25,
12334
- output: 1.5,
12058
+ input: 0.1875,
12059
+ output: 1.125,
12335
12060
  cacheRead: 0,
12336
- cacheWrite: 0.3125,
12061
+ cacheWrite: 0.234375,
12337
12062
  },
12338
12063
  contextWindow: 1000000,
12339
12064
  maxTokens: 65536,
@@ -12457,18 +12182,18 @@ export const MODELS = {
12457
12182
  contextWindow: 262144,
12458
12183
  maxTokens: 65536,
12459
12184
  },
12460
- "tencent/hy3-preview:free": {
12461
- id: "tencent/hy3-preview:free",
12462
- name: "Tencent: Hy3 preview (free)",
12185
+ "tencent/hy3-preview": {
12186
+ id: "tencent/hy3-preview",
12187
+ name: "Tencent: Hy3 preview",
12463
12188
  api: "openai-completions",
12464
12189
  provider: "openrouter",
12465
12190
  baseUrl: "https://openrouter.ai/api/v1",
12466
12191
  reasoning: true,
12467
12192
  input: ["text"],
12468
12193
  cost: {
12469
- input: 0,
12470
- output: 0,
12471
- cacheRead: 0,
12194
+ input: 0.06599999999999999,
12195
+ output: 0.26,
12196
+ cacheRead: 0.029,
12472
12197
  cacheWrite: 0,
12473
12198
  },
12474
12199
  contextWindow: 262144,
@@ -12508,23 +12233,6 @@ export const MODELS = {
12508
12233
  contextWindow: 32768,
12509
12234
  maxTokens: 32768,
12510
12235
  },
12511
- "tngtech/deepseek-r1t2-chimera": {
12512
- id: "tngtech/deepseek-r1t2-chimera",
12513
- name: "TNG: DeepSeek R1T2 Chimera",
12514
- api: "openai-completions",
12515
- provider: "openrouter",
12516
- baseUrl: "https://openrouter.ai/api/v1",
12517
- reasoning: true,
12518
- input: ["text"],
12519
- cost: {
12520
- input: 0.3,
12521
- output: 1.1,
12522
- cacheRead: 0.15,
12523
- cacheWrite: 0,
12524
- },
12525
- contextWindow: 163840,
12526
- maxTokens: 163840,
12527
- },
12528
12236
  "upstage/solar-pro-3": {
12529
12237
  id: "upstage/solar-pro-3",
12530
12238
  name: "Upstage: Solar Pro 3",
@@ -12542,125 +12250,6 @@ export const MODELS = {
12542
12250
  contextWindow: 128000,
12543
12251
  maxTokens: 4096,
12544
12252
  },
12545
- "x-ai/grok-3": {
12546
- id: "x-ai/grok-3",
12547
- name: "xAI: Grok 3",
12548
- api: "openai-completions",
12549
- provider: "openrouter",
12550
- baseUrl: "https://openrouter.ai/api/v1",
12551
- reasoning: false,
12552
- input: ["text"],
12553
- cost: {
12554
- input: 3,
12555
- output: 15,
12556
- cacheRead: 0.75,
12557
- cacheWrite: 0,
12558
- },
12559
- contextWindow: 131072,
12560
- maxTokens: 4096,
12561
- },
12562
- "x-ai/grok-3-beta": {
12563
- id: "x-ai/grok-3-beta",
12564
- name: "xAI: Grok 3 Beta",
12565
- api: "openai-completions",
12566
- provider: "openrouter",
12567
- baseUrl: "https://openrouter.ai/api/v1",
12568
- reasoning: false,
12569
- input: ["text"],
12570
- cost: {
12571
- input: 3,
12572
- output: 15,
12573
- cacheRead: 0.75,
12574
- cacheWrite: 0,
12575
- },
12576
- contextWindow: 131072,
12577
- maxTokens: 4096,
12578
- },
12579
- "x-ai/grok-3-mini": {
12580
- id: "x-ai/grok-3-mini",
12581
- name: "xAI: Grok 3 Mini",
12582
- api: "openai-completions",
12583
- provider: "openrouter",
12584
- baseUrl: "https://openrouter.ai/api/v1",
12585
- reasoning: true,
12586
- input: ["text"],
12587
- cost: {
12588
- input: 0.3,
12589
- output: 0.5,
12590
- cacheRead: 0.075,
12591
- cacheWrite: 0,
12592
- },
12593
- contextWindow: 131072,
12594
- maxTokens: 4096,
12595
- },
12596
- "x-ai/grok-3-mini-beta": {
12597
- id: "x-ai/grok-3-mini-beta",
12598
- name: "xAI: Grok 3 Mini Beta",
12599
- api: "openai-completions",
12600
- provider: "openrouter",
12601
- baseUrl: "https://openrouter.ai/api/v1",
12602
- reasoning: true,
12603
- input: ["text"],
12604
- cost: {
12605
- input: 0.3,
12606
- output: 0.5,
12607
- cacheRead: 0.075,
12608
- cacheWrite: 0,
12609
- },
12610
- contextWindow: 131072,
12611
- maxTokens: 4096,
12612
- },
12613
- "x-ai/grok-4": {
12614
- id: "x-ai/grok-4",
12615
- name: "xAI: Grok 4",
12616
- api: "openai-completions",
12617
- provider: "openrouter",
12618
- baseUrl: "https://openrouter.ai/api/v1",
12619
- reasoning: true,
12620
- input: ["text", "image"],
12621
- cost: {
12622
- input: 3,
12623
- output: 15,
12624
- cacheRead: 0.75,
12625
- cacheWrite: 0,
12626
- },
12627
- contextWindow: 256000,
12628
- maxTokens: 4096,
12629
- },
12630
- "x-ai/grok-4-fast": {
12631
- id: "x-ai/grok-4-fast",
12632
- name: "xAI: Grok 4 Fast",
12633
- api: "openai-completions",
12634
- provider: "openrouter",
12635
- baseUrl: "https://openrouter.ai/api/v1",
12636
- reasoning: true,
12637
- input: ["text", "image"],
12638
- cost: {
12639
- input: 0.19999999999999998,
12640
- output: 0.5,
12641
- cacheRead: 0.049999999999999996,
12642
- cacheWrite: 0,
12643
- },
12644
- contextWindow: 2000000,
12645
- maxTokens: 30000,
12646
- },
12647
- "x-ai/grok-4.1-fast": {
12648
- id: "x-ai/grok-4.1-fast",
12649
- name: "xAI: Grok 4.1 Fast",
12650
- api: "openai-completions",
12651
- provider: "openrouter",
12652
- baseUrl: "https://openrouter.ai/api/v1",
12653
- reasoning: true,
12654
- input: ["text", "image"],
12655
- cost: {
12656
- input: 0.19999999999999998,
12657
- output: 0.5,
12658
- cacheRead: 0.049999999999999996,
12659
- cacheWrite: 0,
12660
- },
12661
- contextWindow: 2000000,
12662
- maxTokens: 30000,
12663
- },
12664
12253
  "x-ai/grok-4.20": {
12665
12254
  id: "x-ai/grok-4.20",
12666
12255
  name: "xAI: Grok 4.20",
@@ -12695,23 +12284,6 @@ export const MODELS = {
12695
12284
  contextWindow: 1000000,
12696
12285
  maxTokens: 4096,
12697
12286
  },
12698
- "x-ai/grok-code-fast-1": {
12699
- id: "x-ai/grok-code-fast-1",
12700
- name: "xAI: Grok Code Fast 1",
12701
- api: "openai-completions",
12702
- provider: "openrouter",
12703
- baseUrl: "https://openrouter.ai/api/v1",
12704
- reasoning: true,
12705
- input: ["text"],
12706
- cost: {
12707
- input: 0.19999999999999998,
12708
- output: 1.5,
12709
- cacheRead: 0.02,
12710
- cacheWrite: 0,
12711
- },
12712
- contextWindow: 256000,
12713
- maxTokens: 10000,
12714
- },
12715
12287
  "xiaomi/mimo-v2-flash": {
12716
12288
  id: "xiaomi/mimo-v2-flash",
12717
12289
  name: "Xiaomi: MiMo-V2-Flash",
@@ -12721,9 +12293,9 @@ export const MODELS = {
12721
12293
  reasoning: true,
12722
12294
  input: ["text"],
12723
12295
  cost: {
12724
- input: 0.09,
12725
- output: 0.29,
12726
- cacheRead: 0.045,
12296
+ input: 0.09999999999999999,
12297
+ output: 0.3,
12298
+ cacheRead: 0.01,
12727
12299
  cacheWrite: 0,
12728
12300
  },
12729
12301
  contextWindow: 262144,
@@ -12795,7 +12367,7 @@ export const MODELS = {
12795
12367
  cacheWrite: 0,
12796
12368
  },
12797
12369
  contextWindow: 1048576,
12798
- maxTokens: 131072,
12370
+ maxTokens: 16384,
12799
12371
  },
12800
12372
  "z-ai/glm-4-32b": {
12801
12373
  id: "z-ai/glm-4-32b",
@@ -12891,13 +12463,13 @@ export const MODELS = {
12891
12463
  reasoning: true,
12892
12464
  input: ["text"],
12893
12465
  cost: {
12894
- input: 0.39,
12895
- output: 1.9,
12896
- cacheRead: 0,
12466
+ input: 0.43,
12467
+ output: 1.74,
12468
+ cacheRead: 0.08,
12897
12469
  cacheWrite: 0,
12898
12470
  },
12899
- contextWindow: 204800,
12900
- maxTokens: 204800,
12471
+ contextWindow: 202752,
12472
+ maxTokens: 131072,
12901
12473
  },
12902
12474
  "z-ai/glm-4.6v": {
12903
12475
  id: "z-ai/glm-4.6v",
@@ -12925,13 +12497,13 @@ export const MODELS = {
12925
12497
  reasoning: true,
12926
12498
  input: ["text"],
12927
12499
  cost: {
12928
- input: 0.38,
12929
- output: 1.74,
12930
- cacheRead: 0,
12500
+ input: 0.39999999999999997,
12501
+ output: 1.75,
12502
+ cacheRead: 0.08,
12931
12503
  cacheWrite: 0,
12932
12504
  },
12933
12505
  contextWindow: 202752,
12934
- maxTokens: 4096,
12506
+ maxTokens: 131072,
12935
12507
  },
12936
12508
  "z-ai/glm-4.7-flash": {
12937
12509
  id: "z-ai/glm-4.7-flash",
@@ -12993,13 +12565,13 @@ export const MODELS = {
12993
12565
  reasoning: true,
12994
12566
  input: ["text"],
12995
12567
  cost: {
12996
- input: 1.0499999999999998,
12997
- output: 3.5,
12998
- cacheRead: 0.5249999999999999,
12568
+ input: 0.98,
12569
+ output: 3.08,
12570
+ cacheRead: 0.182,
12999
12571
  cacheWrite: 0,
13000
12572
  },
13001
12573
  contextWindow: 202752,
13002
- maxTokens: 65535,
12574
+ maxTokens: 4096,
13003
12575
  },
13004
12576
  "z-ai/glm-5v-turbo": {
13005
12577
  id: "z-ai/glm-5v-turbo",
@@ -13056,103 +12628,425 @@ export const MODELS = {
13056
12628
  id: "~anthropic/claude-sonnet-latest",
13057
12629
  name: "Anthropic Claude Sonnet Latest",
13058
12630
  api: "openai-completions",
13059
- provider: "openrouter",
13060
- baseUrl: "https://openrouter.ai/api/v1",
12631
+ provider: "openrouter",
12632
+ baseUrl: "https://openrouter.ai/api/v1",
12633
+ reasoning: true,
12634
+ input: ["text", "image"],
12635
+ cost: {
12636
+ input: 3,
12637
+ output: 15,
12638
+ cacheRead: 0.3,
12639
+ cacheWrite: 3.75,
12640
+ },
12641
+ contextWindow: 1000000,
12642
+ maxTokens: 128000,
12643
+ },
12644
+ "~google/gemini-flash-latest": {
12645
+ id: "~google/gemini-flash-latest",
12646
+ name: "Google Gemini Flash Latest",
12647
+ api: "openai-completions",
12648
+ provider: "openrouter",
12649
+ baseUrl: "https://openrouter.ai/api/v1",
12650
+ reasoning: true,
12651
+ input: ["text", "image"],
12652
+ cost: {
12653
+ input: 0.5,
12654
+ output: 3,
12655
+ cacheRead: 0.049999999999999996,
12656
+ cacheWrite: 0.08333333333333334,
12657
+ },
12658
+ contextWindow: 1048576,
12659
+ maxTokens: 65536,
12660
+ },
12661
+ "~google/gemini-pro-latest": {
12662
+ id: "~google/gemini-pro-latest",
12663
+ name: "Google Gemini Pro Latest",
12664
+ api: "openai-completions",
12665
+ provider: "openrouter",
12666
+ baseUrl: "https://openrouter.ai/api/v1",
12667
+ reasoning: true,
12668
+ input: ["text", "image"],
12669
+ cost: {
12670
+ input: 2,
12671
+ output: 12,
12672
+ cacheRead: 0.19999999999999998,
12673
+ cacheWrite: 0.375,
12674
+ },
12675
+ contextWindow: 1048576,
12676
+ maxTokens: 65536,
12677
+ },
12678
+ "~moonshotai/kimi-latest": {
12679
+ id: "~moonshotai/kimi-latest",
12680
+ name: "MoonshotAI Kimi Latest",
12681
+ api: "openai-completions",
12682
+ provider: "openrouter",
12683
+ baseUrl: "https://openrouter.ai/api/v1",
12684
+ reasoning: true,
12685
+ input: ["text", "image"],
12686
+ cost: {
12687
+ input: 0.73,
12688
+ output: 3.49,
12689
+ cacheRead: 0.25,
12690
+ cacheWrite: 0,
12691
+ },
12692
+ contextWindow: 262144,
12693
+ maxTokens: 262142,
12694
+ },
12695
+ "~openai/gpt-latest": {
12696
+ id: "~openai/gpt-latest",
12697
+ name: "OpenAI GPT Latest",
12698
+ api: "openai-completions",
12699
+ provider: "openrouter",
12700
+ baseUrl: "https://openrouter.ai/api/v1",
12701
+ reasoning: true,
12702
+ input: ["text", "image"],
12703
+ cost: {
12704
+ input: 5,
12705
+ output: 30,
12706
+ cacheRead: 0.5,
12707
+ cacheWrite: 0,
12708
+ },
12709
+ contextWindow: 1050000,
12710
+ maxTokens: 128000,
12711
+ },
12712
+ "~openai/gpt-mini-latest": {
12713
+ id: "~openai/gpt-mini-latest",
12714
+ name: "OpenAI GPT Mini Latest",
12715
+ api: "openai-completions",
12716
+ provider: "openrouter",
12717
+ baseUrl: "https://openrouter.ai/api/v1",
12718
+ reasoning: true,
12719
+ input: ["text", "image"],
12720
+ cost: {
12721
+ input: 0.75,
12722
+ output: 4.5,
12723
+ cacheRead: 0.075,
12724
+ cacheWrite: 0,
12725
+ },
12726
+ contextWindow: 400000,
12727
+ maxTokens: 128000,
12728
+ },
12729
+ },
12730
+ "together": {
12731
+ "MiniMaxAI/MiniMax-M2.5": {
12732
+ id: "MiniMaxAI/MiniMax-M2.5",
12733
+ name: "MiniMax-M2.5",
12734
+ api: "openai-completions",
12735
+ provider: "together",
12736
+ baseUrl: "https://api.together.ai/v1",
12737
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
12738
+ reasoning: true,
12739
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
12740
+ input: ["text"],
12741
+ cost: {
12742
+ input: 0.3,
12743
+ output: 1.2,
12744
+ cacheRead: 0.06,
12745
+ cacheWrite: 0,
12746
+ },
12747
+ contextWindow: 204800,
12748
+ maxTokens: 131072,
12749
+ },
12750
+ "MiniMaxAI/MiniMax-M2.7": {
12751
+ id: "MiniMaxAI/MiniMax-M2.7",
12752
+ name: "MiniMax-M2.7",
12753
+ api: "openai-completions",
12754
+ provider: "together",
12755
+ baseUrl: "https://api.together.ai/v1",
12756
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
12757
+ reasoning: true,
12758
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
12759
+ input: ["text"],
12760
+ cost: {
12761
+ input: 0.3,
12762
+ output: 1.2,
12763
+ cacheRead: 0.06,
12764
+ cacheWrite: 0,
12765
+ },
12766
+ contextWindow: 202752,
12767
+ maxTokens: 131072,
12768
+ },
12769
+ "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
12770
+ id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
12771
+ name: "Qwen3 235B A22B Instruct 2507 FP8",
12772
+ api: "openai-completions",
12773
+ provider: "together",
12774
+ baseUrl: "https://api.together.ai/v1",
12775
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12776
+ reasoning: true,
12777
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12778
+ input: ["text"],
12779
+ cost: {
12780
+ input: 0.2,
12781
+ output: 0.6,
12782
+ cacheRead: 0,
12783
+ cacheWrite: 0,
12784
+ },
12785
+ contextWindow: 262144,
12786
+ maxTokens: 262144,
12787
+ },
12788
+ "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8": {
12789
+ id: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
12790
+ name: "Qwen3 Coder 480B A35B Instruct",
12791
+ api: "openai-completions",
12792
+ provider: "together",
12793
+ baseUrl: "https://api.together.ai/v1",
12794
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
12795
+ reasoning: false,
12796
+ input: ["text"],
12797
+ cost: {
12798
+ input: 2,
12799
+ output: 2,
12800
+ cacheRead: 0,
12801
+ cacheWrite: 0,
12802
+ },
12803
+ contextWindow: 262144,
12804
+ maxTokens: 262144,
12805
+ },
12806
+ "Qwen/Qwen3-Coder-Next-FP8": {
12807
+ id: "Qwen/Qwen3-Coder-Next-FP8",
12808
+ name: "Qwen3 Coder Next FP8",
12809
+ api: "openai-completions",
12810
+ provider: "together",
12811
+ baseUrl: "https://api.together.ai/v1",
12812
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12813
+ reasoning: true,
12814
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12815
+ input: ["text"],
12816
+ cost: {
12817
+ input: 0.5,
12818
+ output: 1.2,
12819
+ cacheRead: 0,
12820
+ cacheWrite: 0,
12821
+ },
12822
+ contextWindow: 262144,
12823
+ maxTokens: 262144,
12824
+ },
12825
+ "Qwen/Qwen3.5-397B-A17B": {
12826
+ id: "Qwen/Qwen3.5-397B-A17B",
12827
+ name: "Qwen3.5 397B A17B",
12828
+ api: "openai-completions",
12829
+ provider: "together",
12830
+ baseUrl: "https://api.together.ai/v1",
12831
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12832
+ reasoning: true,
12833
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12834
+ input: ["text", "image"],
12835
+ cost: {
12836
+ input: 0.6,
12837
+ output: 3.6,
12838
+ cacheRead: 0,
12839
+ cacheWrite: 0,
12840
+ },
12841
+ contextWindow: 262144,
12842
+ maxTokens: 130000,
12843
+ },
12844
+ "Qwen/Qwen3.6-Plus": {
12845
+ id: "Qwen/Qwen3.6-Plus",
12846
+ name: "Qwen3.6 Plus",
12847
+ api: "openai-completions",
12848
+ provider: "together",
12849
+ baseUrl: "https://api.together.ai/v1",
12850
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12851
+ reasoning: true,
12852
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12853
+ input: ["text"],
12854
+ cost: {
12855
+ input: 0.5,
12856
+ output: 3,
12857
+ cacheRead: 0,
12858
+ cacheWrite: 0,
12859
+ },
12860
+ contextWindow: 1000000,
12861
+ maxTokens: 500000,
12862
+ },
12863
+ "deepseek-ai/DeepSeek-V3": {
12864
+ id: "deepseek-ai/DeepSeek-V3",
12865
+ name: "DeepSeek V3",
12866
+ api: "openai-completions",
12867
+ provider: "together",
12868
+ baseUrl: "https://api.together.ai/v1",
12869
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12870
+ reasoning: true,
12871
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12872
+ input: ["text"],
12873
+ cost: {
12874
+ input: 1.25,
12875
+ output: 1.25,
12876
+ cacheRead: 0,
12877
+ cacheWrite: 0,
12878
+ },
12879
+ contextWindow: 131072,
12880
+ maxTokens: 131072,
12881
+ },
12882
+ "deepseek-ai/DeepSeek-V3-1": {
12883
+ id: "deepseek-ai/DeepSeek-V3-1",
12884
+ name: "DeepSeek V3.1",
12885
+ api: "openai-completions",
12886
+ provider: "together",
12887
+ baseUrl: "https://api.together.ai/v1",
12888
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12889
+ reasoning: true,
12890
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12891
+ input: ["text"],
12892
+ cost: {
12893
+ input: 0.6,
12894
+ output: 1.7,
12895
+ cacheRead: 0,
12896
+ cacheWrite: 0,
12897
+ },
12898
+ contextWindow: 131072,
12899
+ maxTokens: 131072,
12900
+ },
12901
+ "deepseek-ai/DeepSeek-V4-Pro": {
12902
+ id: "deepseek-ai/DeepSeek-V4-Pro",
12903
+ name: "DeepSeek V4 Pro",
12904
+ api: "openai-completions",
12905
+ provider: "together",
12906
+ baseUrl: "https://api.together.ai/v1",
12907
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12908
+ reasoning: true,
12909
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": null },
12910
+ input: ["text"],
12911
+ cost: {
12912
+ input: 2.1,
12913
+ output: 4.4,
12914
+ cacheRead: 0.2,
12915
+ cacheWrite: 0,
12916
+ },
12917
+ contextWindow: 512000,
12918
+ maxTokens: 384000,
12919
+ },
12920
+ "essentialai/Rnj-1-Instruct": {
12921
+ id: "essentialai/Rnj-1-Instruct",
12922
+ name: "Rnj-1 Instruct",
12923
+ api: "openai-completions",
12924
+ provider: "together",
12925
+ baseUrl: "https://api.together.ai/v1",
12926
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
12927
+ reasoning: false,
12928
+ input: ["text"],
12929
+ cost: {
12930
+ input: 0.15,
12931
+ output: 0.15,
12932
+ cacheRead: 0,
12933
+ cacheWrite: 0,
12934
+ },
12935
+ contextWindow: 32768,
12936
+ maxTokens: 32768,
12937
+ },
12938
+ "google/gemma-4-31B-it": {
12939
+ id: "google/gemma-4-31B-it",
12940
+ name: "Gemma 4 31B Instruct",
12941
+ api: "openai-completions",
12942
+ provider: "together",
12943
+ baseUrl: "https://api.together.ai/v1",
12944
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13061
12945
  reasoning: true,
12946
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13062
12947
  input: ["text", "image"],
13063
12948
  cost: {
13064
- input: 3,
13065
- output: 15,
13066
- cacheRead: 0.3,
13067
- cacheWrite: 3.75,
12949
+ input: 0.2,
12950
+ output: 0.5,
12951
+ cacheRead: 0,
12952
+ cacheWrite: 0,
13068
12953
  },
13069
- contextWindow: 1000000,
13070
- maxTokens: 128000,
12954
+ contextWindow: 262144,
12955
+ maxTokens: 131072,
13071
12956
  },
13072
- "~google/gemini-flash-latest": {
13073
- id: "~google/gemini-flash-latest",
13074
- name: "Google Gemini Flash Latest",
12957
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo": {
12958
+ id: "meta-llama/Llama-3.3-70B-Instruct-Turbo",
12959
+ name: "Llama 3.3 70B",
13075
12960
  api: "openai-completions",
13076
- provider: "openrouter",
13077
- baseUrl: "https://openrouter.ai/api/v1",
13078
- reasoning: true,
13079
- input: ["text", "image"],
12961
+ provider: "together",
12962
+ baseUrl: "https://api.together.ai/v1",
12963
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
12964
+ reasoning: false,
12965
+ input: ["text"],
13080
12966
  cost: {
13081
- input: 0.5,
13082
- output: 3,
13083
- cacheRead: 0.049999999999999996,
13084
- cacheWrite: 0.08333333333333334,
12967
+ input: 0.88,
12968
+ output: 0.88,
12969
+ cacheRead: 0,
12970
+ cacheWrite: 0,
13085
12971
  },
13086
- contextWindow: 1048576,
13087
- maxTokens: 65536,
12972
+ contextWindow: 131072,
12973
+ maxTokens: 131072,
13088
12974
  },
13089
- "~google/gemini-pro-latest": {
13090
- id: "~google/gemini-pro-latest",
13091
- name: "Google Gemini Pro Latest",
12975
+ "moonshotai/Kimi-K2.5": {
12976
+ id: "moonshotai/Kimi-K2.5",
12977
+ name: "Kimi K2.5",
13092
12978
  api: "openai-completions",
13093
- provider: "openrouter",
13094
- baseUrl: "https://openrouter.ai/api/v1",
12979
+ provider: "together",
12980
+ baseUrl: "https://api.together.ai/v1",
12981
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13095
12982
  reasoning: true,
12983
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13096
12984
  input: ["text", "image"],
13097
12985
  cost: {
13098
- input: 2,
13099
- output: 12,
13100
- cacheRead: 0.19999999999999998,
13101
- cacheWrite: 0.375,
12986
+ input: 0.5,
12987
+ output: 2.8,
12988
+ cacheRead: 0,
12989
+ cacheWrite: 0,
13102
12990
  },
13103
- contextWindow: 1048576,
13104
- maxTokens: 65536,
12991
+ contextWindow: 262144,
12992
+ maxTokens: 262144,
13105
12993
  },
13106
- "~moonshotai/kimi-latest": {
13107
- id: "~moonshotai/kimi-latest",
13108
- name: "MoonshotAI Kimi Latest",
12994
+ "moonshotai/Kimi-K2.6": {
12995
+ id: "moonshotai/Kimi-K2.6",
12996
+ name: "Kimi K2.6",
13109
12997
  api: "openai-completions",
13110
- provider: "openrouter",
13111
- baseUrl: "https://openrouter.ai/api/v1",
12998
+ provider: "together",
12999
+ baseUrl: "https://api.together.ai/v1",
13000
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13112
13001
  reasoning: true,
13002
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13113
13003
  input: ["text", "image"],
13114
13004
  cost: {
13115
- input: 0.75,
13116
- output: 3.5,
13117
- cacheRead: 0.15,
13005
+ input: 1.2,
13006
+ output: 4.5,
13007
+ cacheRead: 0.2,
13118
13008
  cacheWrite: 0,
13119
13009
  },
13120
13010
  contextWindow: 262144,
13121
- maxTokens: 16384,
13011
+ maxTokens: 131000,
13122
13012
  },
13123
- "~openai/gpt-latest": {
13124
- id: "~openai/gpt-latest",
13125
- name: "OpenAI GPT Latest",
13013
+ "openai/gpt-oss-120b": {
13014
+ id: "openai/gpt-oss-120b",
13015
+ name: "GPT OSS 120B",
13126
13016
  api: "openai-completions",
13127
- provider: "openrouter",
13128
- baseUrl: "https://openrouter.ai/api/v1",
13017
+ provider: "together",
13018
+ baseUrl: "https://api.together.ai/v1",
13019
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "openai" },
13129
13020
  reasoning: true,
13130
- input: ["text", "image"],
13021
+ thinkingLevelMap: { "off": null, "minimal": null },
13022
+ input: ["text"],
13131
13023
  cost: {
13132
- input: 5,
13133
- output: 30,
13134
- cacheRead: 0.5,
13024
+ input: 0.15,
13025
+ output: 0.6,
13026
+ cacheRead: 0,
13135
13027
  cacheWrite: 0,
13136
13028
  },
13137
- contextWindow: 1050000,
13138
- maxTokens: 128000,
13029
+ contextWindow: 131072,
13030
+ maxTokens: 131072,
13139
13031
  },
13140
- "~openai/gpt-mini-latest": {
13141
- id: "~openai/gpt-mini-latest",
13142
- name: "OpenAI GPT Mini Latest",
13032
+ "zai-org/GLM-5.1": {
13033
+ id: "zai-org/GLM-5.1",
13034
+ name: "GLM-5.1",
13143
13035
  api: "openai-completions",
13144
- provider: "openrouter",
13145
- baseUrl: "https://openrouter.ai/api/v1",
13036
+ provider: "together",
13037
+ baseUrl: "https://api.together.ai/v1",
13038
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13146
13039
  reasoning: true,
13147
- input: ["text", "image"],
13040
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13041
+ input: ["text"],
13148
13042
  cost: {
13149
- input: 0.75,
13150
- output: 4.5,
13151
- cacheRead: 0.075,
13043
+ input: 1.4,
13044
+ output: 4.4,
13045
+ cacheRead: 0,
13152
13046
  cacheWrite: 0,
13153
13047
  },
13154
- contextWindow: 400000,
13155
- maxTokens: 128000,
13048
+ contextWindow: 202752,
13049
+ maxTokens: 131072,
13156
13050
  },
13157
13051
  },
13158
13052
  "vercel-ai-gateway": {
@@ -13496,23 +13390,6 @@ export const MODELS = {
13496
13390
  contextWindow: 200000,
13497
13391
  maxTokens: 8192,
13498
13392
  },
13499
- "anthropic/claude-3.7-sonnet": {
13500
- id: "anthropic/claude-3.7-sonnet",
13501
- name: "Claude 3.7 Sonnet",
13502
- api: "anthropic-messages",
13503
- provider: "vercel-ai-gateway",
13504
- baseUrl: "https://ai-gateway.vercel.sh",
13505
- reasoning: true,
13506
- input: ["text", "image"],
13507
- cost: {
13508
- input: 3,
13509
- output: 15,
13510
- cacheRead: 0.3,
13511
- cacheWrite: 3.75,
13512
- },
13513
- contextWindow: 200000,
13514
- maxTokens: 8192,
13515
- },
13516
13393
  "anthropic/claude-haiku-4.5": {
13517
13394
  id: "anthropic/claude-haiku-4.5",
13518
13395
  name: "Claude Haiku 4.5",
@@ -13991,6 +13868,23 @@ export const MODELS = {
13991
13868
  contextWindow: 1000000,
13992
13869
  maxTokens: 64000,
13993
13870
  },
13871
+ "google/gemini-3.1-flash-lite": {
13872
+ id: "google/gemini-3.1-flash-lite",
13873
+ name: "Gemini 3.1 Flash Lite",
13874
+ api: "anthropic-messages",
13875
+ provider: "vercel-ai-gateway",
13876
+ baseUrl: "https://ai-gateway.vercel.sh",
13877
+ reasoning: true,
13878
+ input: ["text", "image"],
13879
+ cost: {
13880
+ input: 0.25,
13881
+ output: 1.5,
13882
+ cacheRead: 0.03,
13883
+ cacheWrite: 0,
13884
+ },
13885
+ contextWindow: 1000000,
13886
+ maxTokens: 65000,
13887
+ },
13994
13888
  "google/gemini-3.1-flash-lite-preview": {
13995
13889
  id: "google/gemini-3.1-flash-lite-preview",
13996
13890
  name: "Gemini 3.1 Flash Lite Preview",
@@ -15178,7 +15072,7 @@ export const MODELS = {
15178
15072
  },
15179
15073
  "openai/gpt-oss-20b": {
15180
15074
  id: "openai/gpt-oss-20b",
15181
- name: "GPT OSS 120B",
15075
+ name: "GPT OSS 20B",
15182
15076
  api: "anthropic-messages",
15183
15077
  provider: "vercel-ai-gateway",
15184
15078
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -15257,213 +15151,94 @@ export const MODELS = {
15257
15151
  output: 40,
15258
15152
  cacheRead: 2.5,
15259
15153
  cacheWrite: 0,
15260
- },
15261
- contextWindow: 200000,
15262
- maxTokens: 100000,
15263
- },
15264
- "openai/o3-mini": {
15265
- id: "openai/o3-mini",
15266
- name: "o3-mini",
15267
- api: "anthropic-messages",
15268
- provider: "vercel-ai-gateway",
15269
- baseUrl: "https://ai-gateway.vercel.sh",
15270
- reasoning: true,
15271
- input: ["text"],
15272
- cost: {
15273
- input: 1.1,
15274
- output: 4.4,
15275
- cacheRead: 0.55,
15276
- cacheWrite: 0,
15277
- },
15278
- contextWindow: 200000,
15279
- maxTokens: 100000,
15280
- },
15281
- "openai/o3-pro": {
15282
- id: "openai/o3-pro",
15283
- name: "o3 Pro",
15284
- api: "anthropic-messages",
15285
- provider: "vercel-ai-gateway",
15286
- baseUrl: "https://ai-gateway.vercel.sh",
15287
- reasoning: true,
15288
- input: ["text", "image"],
15289
- cost: {
15290
- input: 20,
15291
- output: 80,
15292
- cacheRead: 0,
15293
- cacheWrite: 0,
15294
- },
15295
- contextWindow: 200000,
15296
- maxTokens: 100000,
15297
- },
15298
- "openai/o4-mini": {
15299
- id: "openai/o4-mini",
15300
- name: "o4-mini",
15301
- api: "anthropic-messages",
15302
- provider: "vercel-ai-gateway",
15303
- baseUrl: "https://ai-gateway.vercel.sh",
15304
- reasoning: true,
15305
- input: ["text", "image"],
15306
- cost: {
15307
- input: 1.1,
15308
- output: 4.4,
15309
- cacheRead: 0.275,
15310
- cacheWrite: 0,
15311
- },
15312
- contextWindow: 200000,
15313
- maxTokens: 100000,
15314
- },
15315
- "perplexity/sonar": {
15316
- id: "perplexity/sonar",
15317
- name: "Sonar",
15318
- api: "anthropic-messages",
15319
- provider: "vercel-ai-gateway",
15320
- baseUrl: "https://ai-gateway.vercel.sh",
15321
- reasoning: false,
15322
- input: ["text", "image"],
15323
- cost: {
15324
- input: 0,
15325
- output: 0,
15326
- cacheRead: 0,
15327
- cacheWrite: 0,
15328
- },
15329
- contextWindow: 127000,
15330
- maxTokens: 8000,
15331
- },
15332
- "perplexity/sonar-pro": {
15333
- id: "perplexity/sonar-pro",
15334
- name: "Sonar Pro",
15335
- api: "anthropic-messages",
15336
- provider: "vercel-ai-gateway",
15337
- baseUrl: "https://ai-gateway.vercel.sh",
15338
- reasoning: false,
15339
- input: ["text", "image"],
15340
- cost: {
15341
- input: 0,
15342
- output: 0,
15343
- cacheRead: 0,
15344
- cacheWrite: 0,
15345
- },
15346
- contextWindow: 200000,
15347
- maxTokens: 8000,
15348
- },
15349
- "xai/grok-3": {
15350
- id: "xai/grok-3",
15351
- name: "Grok 3 Beta",
15352
- api: "anthropic-messages",
15353
- provider: "vercel-ai-gateway",
15354
- baseUrl: "https://ai-gateway.vercel.sh",
15355
- reasoning: false,
15356
- input: ["text"],
15357
- cost: {
15358
- input: 3,
15359
- output: 15,
15360
- cacheRead: 0.75,
15361
- cacheWrite: 0,
15362
- },
15363
- contextWindow: 131072,
15364
- maxTokens: 131072,
15365
- },
15366
- "xai/grok-3-fast": {
15367
- id: "xai/grok-3-fast",
15368
- name: "Grok 3 Fast Beta",
15369
- api: "anthropic-messages",
15370
- provider: "vercel-ai-gateway",
15371
- baseUrl: "https://ai-gateway.vercel.sh",
15372
- reasoning: false,
15373
- input: ["text"],
15374
- cost: {
15375
- input: 5,
15376
- output: 25,
15377
- cacheRead: 1.25,
15378
- cacheWrite: 0,
15379
- },
15380
- contextWindow: 131072,
15381
- maxTokens: 131072,
15154
+ },
15155
+ contextWindow: 200000,
15156
+ maxTokens: 100000,
15382
15157
  },
15383
- "xai/grok-3-mini": {
15384
- id: "xai/grok-3-mini",
15385
- name: "Grok 3 Mini Beta",
15158
+ "openai/o3-mini": {
15159
+ id: "openai/o3-mini",
15160
+ name: "o3-mini",
15386
15161
  api: "anthropic-messages",
15387
15162
  provider: "vercel-ai-gateway",
15388
15163
  baseUrl: "https://ai-gateway.vercel.sh",
15389
- reasoning: false,
15164
+ reasoning: true,
15390
15165
  input: ["text"],
15391
15166
  cost: {
15392
- input: 0.3,
15393
- output: 0.5,
15394
- cacheRead: 0.075,
15167
+ input: 1.1,
15168
+ output: 4.4,
15169
+ cacheRead: 0.55,
15395
15170
  cacheWrite: 0,
15396
15171
  },
15397
- contextWindow: 131072,
15398
- maxTokens: 131072,
15172
+ contextWindow: 200000,
15173
+ maxTokens: 100000,
15399
15174
  },
15400
- "xai/grok-3-mini-fast": {
15401
- id: "xai/grok-3-mini-fast",
15402
- name: "Grok 3 Mini Fast Beta",
15175
+ "openai/o3-pro": {
15176
+ id: "openai/o3-pro",
15177
+ name: "o3 Pro",
15403
15178
  api: "anthropic-messages",
15404
15179
  provider: "vercel-ai-gateway",
15405
15180
  baseUrl: "https://ai-gateway.vercel.sh",
15406
- reasoning: false,
15407
- input: ["text"],
15181
+ reasoning: true,
15182
+ input: ["text", "image"],
15408
15183
  cost: {
15409
- input: 0.6,
15410
- output: 4,
15184
+ input: 20,
15185
+ output: 80,
15411
15186
  cacheRead: 0,
15412
15187
  cacheWrite: 0,
15413
15188
  },
15414
- contextWindow: 131072,
15415
- maxTokens: 131072,
15189
+ contextWindow: 200000,
15190
+ maxTokens: 100000,
15416
15191
  },
15417
- "xai/grok-4": {
15418
- id: "xai/grok-4",
15419
- name: "Grok 4",
15192
+ "openai/o4-mini": {
15193
+ id: "openai/o4-mini",
15194
+ name: "o4-mini",
15420
15195
  api: "anthropic-messages",
15421
15196
  provider: "vercel-ai-gateway",
15422
15197
  baseUrl: "https://ai-gateway.vercel.sh",
15423
15198
  reasoning: true,
15424
15199
  input: ["text", "image"],
15425
15200
  cost: {
15426
- input: 3,
15427
- output: 15,
15428
- cacheRead: 0.75,
15201
+ input: 1.1,
15202
+ output: 4.4,
15203
+ cacheRead: 0.275,
15429
15204
  cacheWrite: 0,
15430
15205
  },
15431
- contextWindow: 256000,
15432
- maxTokens: 256000,
15206
+ contextWindow: 200000,
15207
+ maxTokens: 100000,
15433
15208
  },
15434
- "xai/grok-4-fast-non-reasoning": {
15435
- id: "xai/grok-4-fast-non-reasoning",
15436
- name: "Grok 4 Fast Non-Reasoning",
15209
+ "perplexity/sonar": {
15210
+ id: "perplexity/sonar",
15211
+ name: "Sonar",
15437
15212
  api: "anthropic-messages",
15438
15213
  provider: "vercel-ai-gateway",
15439
15214
  baseUrl: "https://ai-gateway.vercel.sh",
15440
15215
  reasoning: false,
15441
15216
  input: ["text", "image"],
15442
15217
  cost: {
15443
- input: 0.19999999999999998,
15444
- output: 0.5,
15445
- cacheRead: 0.049999999999999996,
15218
+ input: 0,
15219
+ output: 0,
15220
+ cacheRead: 0,
15446
15221
  cacheWrite: 0,
15447
15222
  },
15448
- contextWindow: 2000000,
15449
- maxTokens: 256000,
15223
+ contextWindow: 127000,
15224
+ maxTokens: 8000,
15450
15225
  },
15451
- "xai/grok-4-fast-reasoning": {
15452
- id: "xai/grok-4-fast-reasoning",
15453
- name: "Grok 4 Fast Reasoning",
15226
+ "perplexity/sonar-pro": {
15227
+ id: "perplexity/sonar-pro",
15228
+ name: "Sonar Pro",
15454
15229
  api: "anthropic-messages",
15455
15230
  provider: "vercel-ai-gateway",
15456
15231
  baseUrl: "https://ai-gateway.vercel.sh",
15457
- reasoning: true,
15232
+ reasoning: false,
15458
15233
  input: ["text", "image"],
15459
15234
  cost: {
15460
- input: 0.19999999999999998,
15461
- output: 0.5,
15462
- cacheRead: 0.049999999999999996,
15235
+ input: 0,
15236
+ output: 0,
15237
+ cacheRead: 0,
15463
15238
  cacheWrite: 0,
15464
15239
  },
15465
- contextWindow: 2000000,
15466
- maxTokens: 256000,
15240
+ contextWindow: 200000,
15241
+ maxTokens: 8000,
15467
15242
  },
15468
15243
  "xai/grok-4.1-fast-non-reasoning": {
15469
15244
  id: "xai/grok-4.1-fast-non-reasoning",
@@ -15479,8 +15254,8 @@ export const MODELS = {
15479
15254
  cacheRead: 0.049999999999999996,
15480
15255
  cacheWrite: 0,
15481
15256
  },
15482
- contextWindow: 2000000,
15483
- maxTokens: 30000,
15257
+ contextWindow: 1000000,
15258
+ maxTokens: 1000000,
15484
15259
  },
15485
15260
  "xai/grok-4.1-fast-reasoning": {
15486
15261
  id: "xai/grok-4.1-fast-reasoning",
@@ -15496,8 +15271,8 @@ export const MODELS = {
15496
15271
  cacheRead: 0.049999999999999996,
15497
15272
  cacheWrite: 0,
15498
15273
  },
15499
- contextWindow: 2000000,
15500
- maxTokens: 30000,
15274
+ contextWindow: 1000000,
15275
+ maxTokens: 1000000,
15501
15276
  },
15502
15277
  "xai/grok-4.20-multi-agent": {
15503
15278
  id: "xai/grok-4.20-multi-agent",
@@ -15618,23 +15393,6 @@ export const MODELS = {
15618
15393
  contextWindow: 1000000,
15619
15394
  maxTokens: 1000000,
15620
15395
  },
15621
- "xai/grok-code-fast-1": {
15622
- id: "xai/grok-code-fast-1",
15623
- name: "Grok Code Fast 1",
15624
- api: "anthropic-messages",
15625
- provider: "vercel-ai-gateway",
15626
- baseUrl: "https://ai-gateway.vercel.sh",
15627
- reasoning: true,
15628
- input: ["text"],
15629
- cost: {
15630
- input: 0.19999999999999998,
15631
- output: 1.5,
15632
- cacheRead: 0.02,
15633
- cacheWrite: 0,
15634
- },
15635
- contextWindow: 256000,
15636
- maxTokens: 256000,
15637
- },
15638
15396
  "xiaomi/mimo-v2-flash": {
15639
15397
  id: "xiaomi/mimo-v2-flash",
15640
15398
  name: "MiMo V2 Flash",
@@ -16062,193 +15820,6 @@ export const MODELS = {
16062
15820
  contextWindow: 131072,
16063
15821
  maxTokens: 8192,
16064
15822
  },
16065
- "grok-3-fast-latest": {
16066
- id: "grok-3-fast-latest",
16067
- name: "Grok 3 Fast Latest",
16068
- api: "openai-completions",
16069
- provider: "xai",
16070
- baseUrl: "https://api.x.ai/v1",
16071
- reasoning: false,
16072
- input: ["text"],
16073
- cost: {
16074
- input: 5,
16075
- output: 25,
16076
- cacheRead: 1.25,
16077
- cacheWrite: 0,
16078
- },
16079
- contextWindow: 131072,
16080
- maxTokens: 8192,
16081
- },
16082
- "grok-3-latest": {
16083
- id: "grok-3-latest",
16084
- name: "Grok 3 Latest",
16085
- api: "openai-completions",
16086
- provider: "xai",
16087
- baseUrl: "https://api.x.ai/v1",
16088
- reasoning: false,
16089
- input: ["text"],
16090
- cost: {
16091
- input: 3,
16092
- output: 15,
16093
- cacheRead: 0.75,
16094
- cacheWrite: 0,
16095
- },
16096
- contextWindow: 131072,
16097
- maxTokens: 8192,
16098
- },
16099
- "grok-3-mini": {
16100
- id: "grok-3-mini",
16101
- name: "Grok 3 Mini",
16102
- api: "openai-completions",
16103
- provider: "xai",
16104
- baseUrl: "https://api.x.ai/v1",
16105
- reasoning: true,
16106
- input: ["text"],
16107
- cost: {
16108
- input: 0.3,
16109
- output: 0.5,
16110
- cacheRead: 0.075,
16111
- cacheWrite: 0,
16112
- },
16113
- contextWindow: 131072,
16114
- maxTokens: 8192,
16115
- },
16116
- "grok-3-mini-fast": {
16117
- id: "grok-3-mini-fast",
16118
- name: "Grok 3 Mini Fast",
16119
- api: "openai-completions",
16120
- provider: "xai",
16121
- baseUrl: "https://api.x.ai/v1",
16122
- reasoning: true,
16123
- input: ["text"],
16124
- cost: {
16125
- input: 0.6,
16126
- output: 4,
16127
- cacheRead: 0.15,
16128
- cacheWrite: 0,
16129
- },
16130
- contextWindow: 131072,
16131
- maxTokens: 8192,
16132
- },
16133
- "grok-3-mini-fast-latest": {
16134
- id: "grok-3-mini-fast-latest",
16135
- name: "Grok 3 Mini Fast Latest",
16136
- api: "openai-completions",
16137
- provider: "xai",
16138
- baseUrl: "https://api.x.ai/v1",
16139
- reasoning: true,
16140
- input: ["text"],
16141
- cost: {
16142
- input: 0.6,
16143
- output: 4,
16144
- cacheRead: 0.15,
16145
- cacheWrite: 0,
16146
- },
16147
- contextWindow: 131072,
16148
- maxTokens: 8192,
16149
- },
16150
- "grok-3-mini-latest": {
16151
- id: "grok-3-mini-latest",
16152
- name: "Grok 3 Mini Latest",
16153
- api: "openai-completions",
16154
- provider: "xai",
16155
- baseUrl: "https://api.x.ai/v1",
16156
- reasoning: true,
16157
- input: ["text"],
16158
- cost: {
16159
- input: 0.3,
16160
- output: 0.5,
16161
- cacheRead: 0.075,
16162
- cacheWrite: 0,
16163
- },
16164
- contextWindow: 131072,
16165
- maxTokens: 8192,
16166
- },
16167
- "grok-4": {
16168
- id: "grok-4",
16169
- name: "Grok 4",
16170
- api: "openai-completions",
16171
- provider: "xai",
16172
- baseUrl: "https://api.x.ai/v1",
16173
- reasoning: true,
16174
- input: ["text"],
16175
- cost: {
16176
- input: 3,
16177
- output: 15,
16178
- cacheRead: 0.75,
16179
- cacheWrite: 0,
16180
- },
16181
- contextWindow: 256000,
16182
- maxTokens: 64000,
16183
- },
16184
- "grok-4-1-fast": {
16185
- id: "grok-4-1-fast",
16186
- name: "Grok 4.1 Fast",
16187
- api: "openai-completions",
16188
- provider: "xai",
16189
- baseUrl: "https://api.x.ai/v1",
16190
- reasoning: true,
16191
- input: ["text", "image"],
16192
- cost: {
16193
- input: 0.2,
16194
- output: 0.5,
16195
- cacheRead: 0.05,
16196
- cacheWrite: 0,
16197
- },
16198
- contextWindow: 2000000,
16199
- maxTokens: 30000,
16200
- },
16201
- "grok-4-1-fast-non-reasoning": {
16202
- id: "grok-4-1-fast-non-reasoning",
16203
- name: "Grok 4.1 Fast (Non-Reasoning)",
16204
- api: "openai-completions",
16205
- provider: "xai",
16206
- baseUrl: "https://api.x.ai/v1",
16207
- reasoning: false,
16208
- input: ["text", "image"],
16209
- cost: {
16210
- input: 0.2,
16211
- output: 0.5,
16212
- cacheRead: 0.05,
16213
- cacheWrite: 0,
16214
- },
16215
- contextWindow: 2000000,
16216
- maxTokens: 30000,
16217
- },
16218
- "grok-4-fast": {
16219
- id: "grok-4-fast",
16220
- name: "Grok 4 Fast",
16221
- api: "openai-completions",
16222
- provider: "xai",
16223
- baseUrl: "https://api.x.ai/v1",
16224
- reasoning: true,
16225
- input: ["text", "image"],
16226
- cost: {
16227
- input: 0.2,
16228
- output: 0.5,
16229
- cacheRead: 0.05,
16230
- cacheWrite: 0,
16231
- },
16232
- contextWindow: 2000000,
16233
- maxTokens: 30000,
16234
- },
16235
- "grok-4-fast-non-reasoning": {
16236
- id: "grok-4-fast-non-reasoning",
16237
- name: "Grok 4 Fast (Non-Reasoning)",
16238
- api: "openai-completions",
16239
- provider: "xai",
16240
- baseUrl: "https://api.x.ai/v1",
16241
- reasoning: false,
16242
- input: ["text", "image"],
16243
- cost: {
16244
- input: 0.2,
16245
- output: 0.5,
16246
- cacheRead: 0.05,
16247
- cacheWrite: 0,
16248
- },
16249
- contextWindow: 2000000,
16250
- maxTokens: 30000,
16251
- },
16252
15823
  "grok-4.20-0309-non-reasoning": {
16253
15824
  id: "grok-4.20-0309-non-reasoning",
16254
15825
  name: "Grok 4.20 (Non-Reasoning)",
@@ -16323,7 +15894,7 @@ export const MODELS = {
16323
15894
  api: "openai-completions",
16324
15895
  provider: "xai",
16325
15896
  baseUrl: "https://api.x.ai/v1",
16326
- reasoning: true,
15897
+ reasoning: false,
16327
15898
  input: ["text"],
16328
15899
  cost: {
16329
15900
  input: 0.2,
@@ -16331,8 +15902,8 @@ export const MODELS = {
16331
15902
  cacheRead: 0.02,
16332
15903
  cacheWrite: 0,
16333
15904
  },
16334
- contextWindow: 256000,
16335
- maxTokens: 10000,
15905
+ contextWindow: 32768,
15906
+ maxTokens: 8192,
16336
15907
  },
16337
15908
  "grok-vision-beta": {
16338
15909
  id: "grok-vision-beta",