@fleetagent/pi-ai 0.0.6 → 0.0.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (42) hide show
  1. package/README.md +1 -1
  2. package/dist/image-models.generated.d.ts +15 -0
  3. package/dist/image-models.generated.d.ts.map +1 -1
  4. package/dist/image-models.generated.js +15 -0
  5. package/dist/image-models.generated.js.map +1 -1
  6. package/dist/models.generated.d.ts +863 -380
  7. package/dist/models.generated.d.ts.map +1 -1
  8. package/dist/models.generated.js +1064 -678
  9. package/dist/models.generated.js.map +1 -1
  10. package/dist/providers/anthropic.d.ts.map +1 -1
  11. package/dist/providers/anthropic.js +21 -12
  12. package/dist/providers/anthropic.js.map +1 -1
  13. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  14. package/dist/providers/azure-openai-responses.js +1 -1
  15. package/dist/providers/azure-openai-responses.js.map +1 -1
  16. package/dist/providers/images/openrouter.d.ts.map +1 -1
  17. package/dist/providers/images/openrouter.js +1 -1
  18. package/dist/providers/images/openrouter.js.map +1 -1
  19. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  20. package/dist/providers/openai-codex-responses.js +163 -81
  21. package/dist/providers/openai-codex-responses.js.map +1 -1
  22. package/dist/providers/openai-completions.d.ts.map +1 -1
  23. package/dist/providers/openai-completions.js +14 -4
  24. package/dist/providers/openai-completions.js.map +1 -1
  25. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  26. package/dist/providers/openai-responses-shared.js +4 -1
  27. package/dist/providers/openai-responses-shared.js.map +1 -1
  28. package/dist/providers/openai-responses.d.ts.map +1 -1
  29. package/dist/providers/openai-responses.js +1 -1
  30. package/dist/providers/openai-responses.js.map +1 -1
  31. package/dist/types.d.ts +26 -2
  32. package/dist/types.d.ts.map +1 -1
  33. package/dist/types.js.map +1 -1
  34. package/dist/utils/abort-signals.d.ts +6 -0
  35. package/dist/utils/abort-signals.d.ts.map +1 -0
  36. package/dist/utils/abort-signals.js +34 -0
  37. package/dist/utils/abort-signals.js.map +1 -0
  38. package/dist/utils/overflow.d.ts +2 -1
  39. package/dist/utils/overflow.d.ts.map +1 -1
  40. package/dist/utils/overflow.js +5 -2
  41. package/dist/utils/overflow.js.map +1 -1
  42. package/package.json +2 -1
@@ -157,6 +157,23 @@ export const MODELS = {
157
157
  contextWindow: 1000000,
158
158
  maxTokens: 128000,
159
159
  },
160
+ "anthropic.claude-opus-4-8": {
161
+ id: "anthropic.claude-opus-4-8",
162
+ name: "Claude Opus 4.8",
163
+ api: "bedrock-converse-stream",
164
+ provider: "amazon-bedrock",
165
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
166
+ reasoning: true,
167
+ input: ["text", "image"],
168
+ cost: {
169
+ input: 5,
170
+ output: 25,
171
+ cacheRead: 0.5,
172
+ cacheWrite: 6.25,
173
+ },
174
+ contextWindow: 1000000,
175
+ maxTokens: 128000,
176
+ },
160
177
  "anthropic.claude-sonnet-4-5-20250929-v1:0": {
161
178
  id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
162
179
  name: "Claude Sonnet 4.5",
@@ -226,6 +243,23 @@ export const MODELS = {
226
243
  contextWindow: 1000000,
227
244
  maxTokens: 128000,
228
245
  },
246
+ "au.anthropic.claude-opus-4-8": {
247
+ id: "au.anthropic.claude-opus-4-8",
248
+ name: "Claude Opus 4.8 (AU)",
249
+ api: "bedrock-converse-stream",
250
+ provider: "amazon-bedrock",
251
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
252
+ reasoning: true,
253
+ input: ["text", "image"],
254
+ cost: {
255
+ input: 5,
256
+ output: 25,
257
+ cacheRead: 0.5,
258
+ cacheWrite: 6.25,
259
+ },
260
+ contextWindow: 1000000,
261
+ maxTokens: 128000,
262
+ },
229
263
  "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
230
264
  id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
231
265
  name: "Claude Sonnet 4.5 (AU)",
@@ -355,8 +389,8 @@ export const MODELS = {
355
389
  thinkingLevelMap: { "xhigh": "max" },
356
390
  input: ["text", "image"],
357
391
  cost: {
358
- input: 5,
359
- output: 25,
392
+ input: 5.5,
393
+ output: 27.5,
360
394
  cacheRead: 0.5,
361
395
  cacheWrite: 6.25,
362
396
  },
@@ -373,10 +407,27 @@ export const MODELS = {
373
407
  thinkingLevelMap: { "xhigh": "xhigh" },
374
408
  input: ["text", "image"],
375
409
  cost: {
376
- input: 5,
377
- output: 25,
378
- cacheRead: 0.5,
379
- cacheWrite: 6.25,
410
+ input: 5.5,
411
+ output: 27.5,
412
+ cacheRead: 0.55,
413
+ cacheWrite: 6.875,
414
+ },
415
+ contextWindow: 1000000,
416
+ maxTokens: 128000,
417
+ },
418
+ "eu.anthropic.claude-opus-4-8": {
419
+ id: "eu.anthropic.claude-opus-4-8",
420
+ name: "Claude Opus 4.8 (EU)",
421
+ api: "bedrock-converse-stream",
422
+ provider: "amazon-bedrock",
423
+ baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
424
+ reasoning: true,
425
+ input: ["text", "image"],
426
+ cost: {
427
+ input: 5.5,
428
+ output: 27.5,
429
+ cacheRead: 0.55,
430
+ cacheWrite: 6.875,
380
431
  },
381
432
  contextWindow: 1000000,
382
433
  maxTokens: 128000,
@@ -390,10 +441,10 @@ export const MODELS = {
390
441
  reasoning: true,
391
442
  input: ["text", "image"],
392
443
  cost: {
393
- input: 3,
394
- output: 15,
395
- cacheRead: 0.3,
396
- cacheWrite: 3.75,
444
+ input: 3.3,
445
+ output: 16.5,
446
+ cacheRead: 0.33,
447
+ cacheWrite: 4.125,
397
448
  },
398
449
  contextWindow: 200000,
399
450
  maxTokens: 64000,
@@ -407,10 +458,10 @@ export const MODELS = {
407
458
  reasoning: true,
408
459
  input: ["text", "image"],
409
460
  cost: {
410
- input: 3,
411
- output: 15,
412
- cacheRead: 0.3,
413
- cacheWrite: 3.75,
461
+ input: 3.3,
462
+ output: 16.5,
463
+ cacheRead: 0.33,
464
+ cacheWrite: 4.125,
414
465
  },
415
466
  contextWindow: 1000000,
416
467
  maxTokens: 64000,
@@ -485,6 +536,23 @@ export const MODELS = {
485
536
  contextWindow: 1000000,
486
537
  maxTokens: 128000,
487
538
  },
539
+ "global.anthropic.claude-opus-4-8": {
540
+ id: "global.anthropic.claude-opus-4-8",
541
+ name: "Claude Opus 4.8 (Global)",
542
+ api: "bedrock-converse-stream",
543
+ provider: "amazon-bedrock",
544
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
545
+ reasoning: true,
546
+ input: ["text", "image"],
547
+ cost: {
548
+ input: 5,
549
+ output: 25,
550
+ cacheRead: 0.5,
551
+ cacheWrite: 6.25,
552
+ },
553
+ contextWindow: 1000000,
554
+ maxTokens: 128000,
555
+ },
488
556
  "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
489
557
  id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
490
558
  name: "Claude Sonnet 4.5 (Global)",
@@ -571,6 +639,23 @@ export const MODELS = {
571
639
  contextWindow: 1000000,
572
640
  maxTokens: 128000,
573
641
  },
642
+ "jp.anthropic.claude-opus-4-8": {
643
+ id: "jp.anthropic.claude-opus-4-8",
644
+ name: "Claude Opus 4.8 (JP)",
645
+ api: "bedrock-converse-stream",
646
+ provider: "amazon-bedrock",
647
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
648
+ reasoning: true,
649
+ input: ["text", "image"],
650
+ cost: {
651
+ input: 5,
652
+ output: 25,
653
+ cacheRead: 0.5,
654
+ cacheWrite: 6.25,
655
+ },
656
+ contextWindow: 1000000,
657
+ maxTokens: 128000,
658
+ },
574
659
  "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
575
660
  id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
576
661
  name: "Claude Sonnet 4.5 (JP)",
@@ -996,6 +1081,59 @@ export const MODELS = {
996
1081
  contextWindow: 262144,
997
1082
  maxTokens: 131072,
998
1083
  },
1084
+ "openai.gpt-5.4": {
1085
+ id: "openai.gpt-5.4",
1086
+ name: "GPT-5.4",
1087
+ api: "bedrock-converse-stream",
1088
+ provider: "amazon-bedrock",
1089
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1090
+ reasoning: true,
1091
+ thinkingLevelMap: { "xhigh": "xhigh" },
1092
+ input: ["text", "image"],
1093
+ cost: {
1094
+ input: 2.75,
1095
+ output: 16.5,
1096
+ cacheRead: 0.275,
1097
+ cacheWrite: 0,
1098
+ },
1099
+ contextWindow: 272000,
1100
+ maxTokens: 128000,
1101
+ },
1102
+ "openai.gpt-5.5": {
1103
+ id: "openai.gpt-5.5",
1104
+ name: "GPT-5.5",
1105
+ api: "bedrock-converse-stream",
1106
+ provider: "amazon-bedrock",
1107
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1108
+ reasoning: true,
1109
+ thinkingLevelMap: { "xhigh": "xhigh" },
1110
+ input: ["text", "image"],
1111
+ cost: {
1112
+ input: 5.5,
1113
+ output: 33,
1114
+ cacheRead: 0.55,
1115
+ cacheWrite: 0,
1116
+ },
1117
+ contextWindow: 272000,
1118
+ maxTokens: 128000,
1119
+ },
1120
+ "openai.gpt-oss-120b": {
1121
+ id: "openai.gpt-oss-120b",
1122
+ name: "gpt-oss-120b",
1123
+ api: "bedrock-converse-stream",
1124
+ provider: "amazon-bedrock",
1125
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1126
+ reasoning: false,
1127
+ input: ["text"],
1128
+ cost: {
1129
+ input: 0.15,
1130
+ output: 0.6,
1131
+ cacheRead: 0,
1132
+ cacheWrite: 0,
1133
+ },
1134
+ contextWindow: 128000,
1135
+ maxTokens: 16384,
1136
+ },
999
1137
  "openai.gpt-oss-120b-1:0": {
1000
1138
  id: "openai.gpt-oss-120b-1:0",
1001
1139
  name: "gpt-oss-120b",
@@ -1013,6 +1151,23 @@ export const MODELS = {
1013
1151
  contextWindow: 128000,
1014
1152
  maxTokens: 16384,
1015
1153
  },
1154
+ "openai.gpt-oss-20b": {
1155
+ id: "openai.gpt-oss-20b",
1156
+ name: "gpt-oss-20b",
1157
+ api: "bedrock-converse-stream",
1158
+ provider: "amazon-bedrock",
1159
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1160
+ reasoning: false,
1161
+ input: ["text"],
1162
+ cost: {
1163
+ input: 0.07,
1164
+ output: 0.3,
1165
+ cacheRead: 0,
1166
+ cacheWrite: 0,
1167
+ },
1168
+ contextWindow: 128000,
1169
+ maxTokens: 16384,
1170
+ },
1016
1171
  "openai.gpt-oss-20b-1:0": {
1017
1172
  id: "openai.gpt-oss-20b-1:0",
1018
1173
  name: "gpt-oss-20b",
@@ -1270,6 +1425,23 @@ export const MODELS = {
1270
1425
  contextWindow: 1000000,
1271
1426
  maxTokens: 128000,
1272
1427
  },
1428
+ "us.anthropic.claude-opus-4-8": {
1429
+ id: "us.anthropic.claude-opus-4-8",
1430
+ name: "Claude Opus 4.8 (US)",
1431
+ api: "bedrock-converse-stream",
1432
+ provider: "amazon-bedrock",
1433
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1434
+ reasoning: true,
1435
+ input: ["text", "image"],
1436
+ cost: {
1437
+ input: 5,
1438
+ output: 25,
1439
+ cacheRead: 0.5,
1440
+ cacheWrite: 6.25,
1441
+ },
1442
+ contextWindow: 1000000,
1443
+ maxTokens: 128000,
1444
+ },
1273
1445
  "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1274
1446
  id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1275
1447
  name: "Claude Sonnet 4.5 (US)",
@@ -1720,6 +1892,7 @@ export const MODELS = {
1720
1892
  api: "anthropic-messages",
1721
1893
  provider: "anthropic",
1722
1894
  baseUrl: "https://api.anthropic.com",
1895
+ compat: { "forceAdaptiveThinking": true },
1723
1896
  reasoning: true,
1724
1897
  thinkingLevelMap: { "xhigh": "max" },
1725
1898
  input: ["text", "image"],
@@ -1738,6 +1911,7 @@ export const MODELS = {
1738
1911
  api: "anthropic-messages",
1739
1912
  provider: "anthropic",
1740
1913
  baseUrl: "https://api.anthropic.com",
1914
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1741
1915
  reasoning: true,
1742
1916
  thinkingLevelMap: { "xhigh": "xhigh" },
1743
1917
  input: ["text", "image"],
@@ -1750,6 +1924,24 @@ export const MODELS = {
1750
1924
  contextWindow: 1000000,
1751
1925
  maxTokens: 128000,
1752
1926
  },
1927
+ "claude-opus-4-8": {
1928
+ id: "claude-opus-4-8",
1929
+ name: "Claude Opus 4.8",
1930
+ api: "anthropic-messages",
1931
+ provider: "anthropic",
1932
+ baseUrl: "https://api.anthropic.com",
1933
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1934
+ reasoning: true,
1935
+ input: ["text", "image"],
1936
+ cost: {
1937
+ input: 5,
1938
+ output: 25,
1939
+ cacheRead: 0.5,
1940
+ cacheWrite: 6.25,
1941
+ },
1942
+ contextWindow: 1000000,
1943
+ maxTokens: 128000,
1944
+ },
1753
1945
  "claude-sonnet-4-0": {
1754
1946
  id: "claude-sonnet-4-0",
1755
1947
  name: "Claude Sonnet 4 (latest)",
@@ -1824,6 +2016,7 @@ export const MODELS = {
1824
2016
  api: "anthropic-messages",
1825
2017
  provider: "anthropic",
1826
2018
  baseUrl: "https://api.anthropic.com",
2019
+ compat: { "forceAdaptiveThinking": true },
1827
2020
  reasoning: true,
1828
2021
  input: ["text", "image"],
1829
2022
  cost: {
@@ -1916,7 +2109,7 @@ export const MODELS = {
1916
2109
  cost: {
1917
2110
  input: 0.1,
1918
2111
  output: 0.4,
1919
- cacheRead: 0.03,
2112
+ cacheRead: 0.025,
1920
2113
  cacheWrite: 0,
1921
2114
  },
1922
2115
  contextWindow: 1047576,
@@ -2001,7 +2194,7 @@ export const MODELS = {
2001
2194
  cost: {
2002
2195
  input: 0.15,
2003
2196
  output: 0.6,
2004
- cacheRead: 0.08,
2197
+ cacheRead: 0.075,
2005
2198
  cacheWrite: 0,
2006
2199
  },
2007
2200
  contextWindow: 128000,
@@ -2127,7 +2320,7 @@ export const MODELS = {
2127
2320
  cost: {
2128
2321
  input: 1.25,
2129
2322
  output: 10,
2130
- cacheRead: 0.13,
2323
+ cacheRead: 0.125,
2131
2324
  cacheWrite: 0,
2132
2325
  },
2133
2326
  contextWindow: 400000,
@@ -2428,7 +2621,7 @@ export const MODELS = {
2428
2621
  provider: "azure-openai-responses",
2429
2622
  baseUrl: "",
2430
2623
  reasoning: true,
2431
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
2624
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
2432
2625
  input: ["text", "image"],
2433
2626
  cost: {
2434
2627
  input: 30,
@@ -2552,7 +2745,7 @@ export const MODELS = {
2552
2745
  cost: {
2553
2746
  input: 1.1,
2554
2747
  output: 4.4,
2555
- cacheRead: 0.28,
2748
+ cacheRead: 0.275,
2556
2749
  cacheWrite: 0,
2557
2750
  },
2558
2751
  contextWindow: 200000,
@@ -2611,23 +2804,6 @@ export const MODELS = {
2611
2804
  contextWindow: 32000,
2612
2805
  maxTokens: 8000,
2613
2806
  },
2614
- "qwen-3-235b-a22b-instruct-2507": {
2615
- id: "qwen-3-235b-a22b-instruct-2507",
2616
- name: "Qwen 3 235B Instruct",
2617
- api: "openai-completions",
2618
- provider: "cerebras",
2619
- baseUrl: "https://api.cerebras.ai/v1",
2620
- reasoning: false,
2621
- input: ["text"],
2622
- cost: {
2623
- input: 0.6,
2624
- output: 1.2,
2625
- cacheRead: 0,
2626
- cacheWrite: 0,
2627
- },
2628
- contextWindow: 131000,
2629
- maxTokens: 32000,
2630
- },
2631
2807
  "zai-glm-4.7": {
2632
2808
  id: "zai-glm-4.7",
2633
2809
  name: "Z.AI GLM-4.7",
@@ -2823,6 +2999,7 @@ export const MODELS = {
2823
2999
  api: "anthropic-messages",
2824
3000
  provider: "cloudflare-ai-gateway",
2825
3001
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3002
+ compat: { "forceAdaptiveThinking": true },
2826
3003
  reasoning: true,
2827
3004
  thinkingLevelMap: { "xhigh": "max" },
2828
3005
  input: ["text", "image"],
@@ -2841,6 +3018,7 @@ export const MODELS = {
2841
3018
  api: "anthropic-messages",
2842
3019
  provider: "cloudflare-ai-gateway",
2843
3020
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3021
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
2844
3022
  reasoning: true,
2845
3023
  thinkingLevelMap: { "xhigh": "xhigh" },
2846
3024
  input: ["text", "image"],
@@ -2853,6 +3031,24 @@ export const MODELS = {
2853
3031
  contextWindow: 1000000,
2854
3032
  maxTokens: 128000,
2855
3033
  },
3034
+ "claude-opus-4-8": {
3035
+ id: "claude-opus-4-8",
3036
+ name: "Claude Opus 4.8",
3037
+ api: "anthropic-messages",
3038
+ provider: "cloudflare-ai-gateway",
3039
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3040
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3041
+ reasoning: true,
3042
+ input: ["text", "image"],
3043
+ cost: {
3044
+ input: 5,
3045
+ output: 25,
3046
+ cacheRead: 0.5,
3047
+ cacheWrite: 6.25,
3048
+ },
3049
+ contextWindow: 1000000,
3050
+ maxTokens: 128000,
3051
+ },
2856
3052
  "claude-sonnet-4": {
2857
3053
  id: "claude-sonnet-4",
2858
3054
  name: "Claude Sonnet 4 (latest)",
@@ -2893,6 +3089,7 @@ export const MODELS = {
2893
3089
  api: "anthropic-messages",
2894
3090
  provider: "cloudflare-ai-gateway",
2895
3091
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3092
+ compat: { "forceAdaptiveThinking": true },
2896
3093
  reasoning: true,
2897
3094
  input: ["text", "image"],
2898
3095
  cost: {
@@ -3347,24 +3544,6 @@ export const MODELS = {
3347
3544
  contextWindow: 128000,
3348
3545
  maxTokens: 128000,
3349
3546
  },
3350
- "@cf/moonshotai/kimi-k2.5": {
3351
- id: "@cf/moonshotai/kimi-k2.5",
3352
- name: "Kimi K2.5",
3353
- api: "openai-completions",
3354
- provider: "cloudflare-workers-ai",
3355
- baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3356
- compat: { "sendSessionAffinityHeaders": true },
3357
- reasoning: true,
3358
- input: ["text", "image"],
3359
- cost: {
3360
- input: 0.6,
3361
- output: 3,
3362
- cacheRead: 0.1,
3363
- cacheWrite: 0,
3364
- },
3365
- contextWindow: 256000,
3366
- maxTokens: 256000,
3367
- },
3368
3547
  "@cf/moonshotai/kimi-k2.6": {
3369
3548
  id: "@cf/moonshotai/kimi-k2.6",
3370
3549
  name: "Kimi K2.6",
@@ -3692,8 +3871,8 @@ export const MODELS = {
3692
3871
  cacheRead: 0.1,
3693
3872
  cacheWrite: 0,
3694
3873
  },
3695
- contextWindow: 128000,
3696
- maxTokens: 8192,
3874
+ contextWindow: 262144,
3875
+ maxTokens: 65536,
3697
3876
  },
3698
3877
  "accounts/fireworks/routers/glm-5p1-fast": {
3699
3878
  id: "accounts/fireworks/routers/glm-5p1-fast",
@@ -3735,7 +3914,7 @@ export const MODELS = {
3735
3914
  "github-copilot": {
3736
3915
  "claude-haiku-4.5": {
3737
3916
  id: "claude-haiku-4.5",
3738
- name: "Claude Haiku 4.5",
3917
+ name: "Claude Haiku 4.5 (latest)",
3739
3918
  api: "anthropic-messages",
3740
3919
  provider: "github-copilot",
3741
3920
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3744,17 +3923,17 @@ export const MODELS = {
3744
3923
  reasoning: true,
3745
3924
  input: ["text", "image"],
3746
3925
  cost: {
3747
- input: 0,
3748
- output: 0,
3749
- cacheRead: 0,
3750
- cacheWrite: 0,
3926
+ input: 1,
3927
+ output: 5,
3928
+ cacheRead: 0.1,
3929
+ cacheWrite: 1.25,
3751
3930
  },
3752
- contextWindow: 144000,
3753
- maxTokens: 32000,
3931
+ contextWindow: 200000,
3932
+ maxTokens: 64000,
3754
3933
  },
3755
3934
  "claude-opus-4.5": {
3756
3935
  id: "claude-opus-4.5",
3757
- name: "Claude Opus 4.5",
3936
+ name: "Claude Opus 4.5 (latest)",
3758
3937
  api: "anthropic-messages",
3759
3938
  provider: "github-copilot",
3760
3939
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3762,13 +3941,13 @@ export const MODELS = {
3762
3941
  reasoning: true,
3763
3942
  input: ["text", "image"],
3764
3943
  cost: {
3765
- input: 0,
3766
- output: 0,
3767
- cacheRead: 0,
3768
- cacheWrite: 0,
3769
- },
3770
- contextWindow: 160000,
3771
- maxTokens: 32000,
3944
+ input: 5,
3945
+ output: 25,
3946
+ cacheRead: 0.5,
3947
+ cacheWrite: 6.25,
3948
+ },
3949
+ contextWindow: 200000,
3950
+ maxTokens: 32000,
3772
3951
  },
3773
3952
  "claude-opus-4.6": {
3774
3953
  id: "claude-opus-4.6",
@@ -3777,17 +3956,18 @@ export const MODELS = {
3777
3956
  provider: "github-copilot",
3778
3957
  baseUrl: "https://api.individual.githubcopilot.com",
3779
3958
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3959
+ compat: { "forceAdaptiveThinking": true },
3780
3960
  reasoning: true,
3781
3961
  thinkingLevelMap: { "xhigh": "max" },
3782
3962
  input: ["text", "image"],
3783
3963
  cost: {
3784
- input: 0,
3785
- output: 0,
3786
- cacheRead: 0,
3787
- cacheWrite: 0,
3964
+ input: 5,
3965
+ output: 25,
3966
+ cacheRead: 0.5,
3967
+ cacheWrite: 6.25,
3788
3968
  },
3789
3969
  contextWindow: 1000000,
3790
- maxTokens: 64000,
3970
+ maxTokens: 32000,
3791
3971
  },
3792
3972
  "claude-opus-4.7": {
3793
3973
  id: "claude-opus-4.7",
@@ -3796,21 +3976,60 @@ export const MODELS = {
3796
3976
  provider: "github-copilot",
3797
3977
  baseUrl: "https://api.individual.githubcopilot.com",
3798
3978
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3979
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3799
3980
  reasoning: true,
3800
3981
  thinkingLevelMap: { "xhigh": "xhigh" },
3801
3982
  input: ["text", "image"],
3802
3983
  cost: {
3803
- input: 0,
3804
- output: 0,
3805
- cacheRead: 0,
3806
- cacheWrite: 0,
3984
+ input: 5,
3985
+ output: 25,
3986
+ cacheRead: 0.5,
3987
+ cacheWrite: 6.25,
3988
+ },
3989
+ contextWindow: 200000,
3990
+ maxTokens: 32000,
3991
+ },
3992
+ "claude-opus-4.8": {
3993
+ id: "claude-opus-4.8",
3994
+ name: "Claude Opus 4.8",
3995
+ api: "anthropic-messages",
3996
+ provider: "github-copilot",
3997
+ baseUrl: "https://api.individual.githubcopilot.com",
3998
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3999
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
4000
+ reasoning: true,
4001
+ input: ["text", "image"],
4002
+ cost: {
4003
+ input: 5,
4004
+ output: 25,
4005
+ cacheRead: 0.5,
4006
+ cacheWrite: 6.25,
3807
4007
  },
3808
- contextWindow: 144000,
4008
+ contextWindow: 200000,
3809
4009
  maxTokens: 64000,
3810
4010
  },
4011
+ "claude-sonnet-4": {
4012
+ id: "claude-sonnet-4",
4013
+ name: "Claude Sonnet 4 (latest)",
4014
+ api: "anthropic-messages",
4015
+ provider: "github-copilot",
4016
+ baseUrl: "https://api.individual.githubcopilot.com",
4017
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4018
+ compat: { "supportsEagerToolInputStreaming": false },
4019
+ reasoning: true,
4020
+ input: ["text", "image"],
4021
+ cost: {
4022
+ input: 3,
4023
+ output: 15,
4024
+ cacheRead: 0.3,
4025
+ cacheWrite: 3.75,
4026
+ },
4027
+ contextWindow: 216000,
4028
+ maxTokens: 16000,
4029
+ },
3811
4030
  "claude-sonnet-4.5": {
3812
4031
  id: "claude-sonnet-4.5",
3813
- name: "Claude Sonnet 4.5",
4032
+ name: "Claude Sonnet 4.5 (latest)",
3814
4033
  api: "anthropic-messages",
3815
4034
  provider: "github-copilot",
3816
4035
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3819,12 +4038,12 @@ export const MODELS = {
3819
4038
  reasoning: true,
3820
4039
  input: ["text", "image"],
3821
4040
  cost: {
3822
- input: 0,
3823
- output: 0,
3824
- cacheRead: 0,
3825
- cacheWrite: 0,
4041
+ input: 3,
4042
+ output: 15,
4043
+ cacheRead: 0.3,
4044
+ cacheWrite: 3.75,
3826
4045
  },
3827
- contextWindow: 144000,
4046
+ contextWindow: 200000,
3828
4047
  maxTokens: 32000,
3829
4048
  },
3830
4049
  "claude-sonnet-4.6": {
@@ -3834,13 +4053,14 @@ export const MODELS = {
3834
4053
  provider: "github-copilot",
3835
4054
  baseUrl: "https://api.individual.githubcopilot.com",
3836
4055
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4056
+ compat: { "forceAdaptiveThinking": true },
3837
4057
  reasoning: true,
3838
4058
  input: ["text", "image"],
3839
4059
  cost: {
3840
- input: 0,
3841
- output: 0,
3842
- cacheRead: 0,
3843
- cacheWrite: 0,
4060
+ input: 3,
4061
+ output: 15,
4062
+ cacheRead: 0.3,
4063
+ cacheWrite: 3.75,
3844
4064
  },
3845
4065
  contextWindow: 1000000,
3846
4066
  maxTokens: 32000,
@@ -3853,12 +4073,12 @@ export const MODELS = {
3853
4073
  baseUrl: "https://api.individual.githubcopilot.com",
3854
4074
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3855
4075
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3856
- reasoning: false,
4076
+ reasoning: true,
3857
4077
  input: ["text", "image"],
3858
4078
  cost: {
3859
- input: 0,
3860
- output: 0,
3861
- cacheRead: 0,
4079
+ input: 1.25,
4080
+ output: 10,
4081
+ cacheRead: 0.125,
3862
4082
  cacheWrite: 0,
3863
4083
  },
3864
4084
  contextWindow: 128000,
@@ -3866,7 +4086,7 @@ export const MODELS = {
3866
4086
  },
3867
4087
  "gemini-3-flash-preview": {
3868
4088
  id: "gemini-3-flash-preview",
3869
- name: "Gemini 3 Flash",
4089
+ name: "Gemini 3 Flash Preview",
3870
4090
  api: "openai-completions",
3871
4091
  provider: "github-copilot",
3872
4092
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3875,9 +4095,9 @@ export const MODELS = {
3875
4095
  reasoning: true,
3876
4096
  input: ["text", "image"],
3877
4097
  cost: {
3878
- input: 0,
3879
- output: 0,
3880
- cacheRead: 0,
4098
+ input: 0.5,
4099
+ output: 3,
4100
+ cacheRead: 0.05,
3881
4101
  cacheWrite: 0,
3882
4102
  },
3883
4103
  contextWindow: 128000,
@@ -3894,12 +4114,12 @@ export const MODELS = {
3894
4114
  reasoning: true,
3895
4115
  input: ["text", "image"],
3896
4116
  cost: {
3897
- input: 0,
3898
- output: 0,
3899
- cacheRead: 0,
4117
+ input: 2,
4118
+ output: 12,
4119
+ cacheRead: 0.2,
3900
4120
  cacheWrite: 0,
3901
4121
  },
3902
- contextWindow: 128000,
4122
+ contextWindow: 200000,
3903
4123
  maxTokens: 64000,
3904
4124
  },
3905
4125
  "gemini-3.5-flash": {
@@ -3913,12 +4133,12 @@ export const MODELS = {
3913
4133
  reasoning: true,
3914
4134
  input: ["text", "image"],
3915
4135
  cost: {
3916
- input: 0,
3917
- output: 0,
3918
- cacheRead: 0,
4136
+ input: 1.5,
4137
+ output: 9,
4138
+ cacheRead: 0.15,
3919
4139
  cacheWrite: 0,
3920
4140
  },
3921
- contextWindow: 128000,
4141
+ contextWindow: 200000,
3922
4142
  maxTokens: 64000,
3923
4143
  },
3924
4144
  "gpt-4.1": {
@@ -3932,36 +4152,17 @@ export const MODELS = {
3932
4152
  reasoning: false,
3933
4153
  input: ["text", "image"],
3934
4154
  cost: {
3935
- input: 0,
3936
- output: 0,
3937
- cacheRead: 0,
4155
+ input: 2,
4156
+ output: 8,
4157
+ cacheRead: 0.5,
3938
4158
  cacheWrite: 0,
3939
4159
  },
3940
4160
  contextWindow: 128000,
3941
4161
  maxTokens: 16384,
3942
4162
  },
3943
- "gpt-4o": {
3944
- id: "gpt-4o",
3945
- name: "GPT-4o",
3946
- api: "openai-completions",
3947
- provider: "github-copilot",
3948
- baseUrl: "https://api.individual.githubcopilot.com",
3949
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3950
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3951
- reasoning: false,
3952
- input: ["text", "image"],
3953
- cost: {
3954
- input: 0,
3955
- output: 0,
3956
- cacheRead: 0,
3957
- cacheWrite: 0,
3958
- },
3959
- contextWindow: 128000,
3960
- maxTokens: 4096,
3961
- },
3962
4163
  "gpt-5-mini": {
3963
4164
  id: "gpt-5-mini",
3964
- name: "GPT-5-mini",
4165
+ name: "GPT-5 Mini",
3965
4166
  api: "openai-responses",
3966
4167
  provider: "github-copilot",
3967
4168
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3970,9 +4171,9 @@ export const MODELS = {
3970
4171
  thinkingLevelMap: { "off": null, "minimal": "low" },
3971
4172
  input: ["text", "image"],
3972
4173
  cost: {
3973
- input: 0,
3974
- output: 0,
3975
- cacheRead: 0,
4174
+ input: 0.25,
4175
+ output: 2,
4176
+ cacheRead: 0.025,
3976
4177
  cacheWrite: 0,
3977
4178
  },
3978
4179
  contextWindow: 264000,
@@ -3989,17 +4190,17 @@ export const MODELS = {
3989
4190
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
3990
4191
  input: ["text", "image"],
3991
4192
  cost: {
3992
- input: 0,
3993
- output: 0,
3994
- cacheRead: 0,
4193
+ input: 1.75,
4194
+ output: 14,
4195
+ cacheRead: 0.175,
3995
4196
  cacheWrite: 0,
3996
4197
  },
3997
- contextWindow: 264000,
3998
- maxTokens: 64000,
4198
+ contextWindow: 400000,
4199
+ maxTokens: 128000,
3999
4200
  },
4000
4201
  "gpt-5.2-codex": {
4001
4202
  id: "gpt-5.2-codex",
4002
- name: "GPT-5.2-Codex",
4203
+ name: "GPT-5.2 Codex",
4003
4204
  api: "openai-responses",
4004
4205
  provider: "github-copilot",
4005
4206
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4008,9 +4209,9 @@ export const MODELS = {
4008
4209
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4009
4210
  input: ["text", "image"],
4010
4211
  cost: {
4011
- input: 0,
4012
- output: 0,
4013
- cacheRead: 0,
4212
+ input: 1.75,
4213
+ output: 14,
4214
+ cacheRead: 0.175,
4014
4215
  cacheWrite: 0,
4015
4216
  },
4016
4217
  contextWindow: 400000,
@@ -4018,7 +4219,7 @@ export const MODELS = {
4018
4219
  },
4019
4220
  "gpt-5.3-codex": {
4020
4221
  id: "gpt-5.3-codex",
4021
- name: "GPT-5.3-Codex",
4222
+ name: "GPT-5.3 Codex",
4022
4223
  api: "openai-responses",
4023
4224
  provider: "github-copilot",
4024
4225
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4027,9 +4228,9 @@ export const MODELS = {
4027
4228
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4028
4229
  input: ["text", "image"],
4029
4230
  cost: {
4030
- input: 0,
4031
- output: 0,
4032
- cacheRead: 0,
4231
+ input: 1.75,
4232
+ output: 14,
4233
+ cacheRead: 0.175,
4033
4234
  cacheWrite: 0,
4034
4235
  },
4035
4236
  contextWindow: 400000,
@@ -4046,9 +4247,9 @@ export const MODELS = {
4046
4247
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4047
4248
  input: ["text", "image"],
4048
4249
  cost: {
4049
- input: 0,
4050
- output: 0,
4051
- cacheRead: 0,
4250
+ input: 2.5,
4251
+ output: 15,
4252
+ cacheRead: 0.25,
4052
4253
  cacheWrite: 0,
4053
4254
  },
4054
4255
  contextWindow: 400000,
@@ -4056,7 +4257,7 @@ export const MODELS = {
4056
4257
  },
4057
4258
  "gpt-5.4-mini": {
4058
4259
  id: "gpt-5.4-mini",
4059
- name: "GPT-5.4 Mini",
4260
+ name: "GPT-5.4 mini",
4060
4261
  api: "openai-responses",
4061
4262
  provider: "github-copilot",
4062
4263
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4065,9 +4266,28 @@ export const MODELS = {
4065
4266
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4066
4267
  input: ["text", "image"],
4067
4268
  cost: {
4068
- input: 0,
4069
- output: 0,
4070
- cacheRead: 0,
4269
+ input: 0.75,
4270
+ output: 4.5,
4271
+ cacheRead: 0.075,
4272
+ cacheWrite: 0,
4273
+ },
4274
+ contextWindow: 400000,
4275
+ maxTokens: 128000,
4276
+ },
4277
+ "gpt-5.4-nano": {
4278
+ id: "gpt-5.4-nano",
4279
+ name: "GPT-5.4 nano",
4280
+ api: "openai-responses",
4281
+ provider: "github-copilot",
4282
+ baseUrl: "https://api.individual.githubcopilot.com",
4283
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4284
+ reasoning: true,
4285
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4286
+ input: ["text", "image"],
4287
+ cost: {
4288
+ input: 0.2,
4289
+ output: 1.25,
4290
+ cacheRead: 0.02,
4071
4291
  cacheWrite: 0,
4072
4292
  },
4073
4293
  contextWindow: 400000,
@@ -4084,32 +4304,32 @@ export const MODELS = {
4084
4304
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4085
4305
  input: ["text", "image"],
4086
4306
  cost: {
4087
- input: 0,
4088
- output: 0,
4089
- cacheRead: 0,
4307
+ input: 5,
4308
+ output: 30,
4309
+ cacheRead: 0.5,
4090
4310
  cacheWrite: 0,
4091
4311
  },
4092
4312
  contextWindow: 400000,
4093
4313
  maxTokens: 128000,
4094
4314
  },
4095
- "grok-code-fast-1": {
4096
- id: "grok-code-fast-1",
4097
- name: "Grok Code Fast 1",
4315
+ "raptor-mini": {
4316
+ id: "raptor-mini",
4317
+ name: "Raptor mini",
4098
4318
  api: "openai-completions",
4099
4319
  provider: "github-copilot",
4100
4320
  baseUrl: "https://api.individual.githubcopilot.com",
4101
4321
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4102
4322
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4103
4323
  reasoning: true,
4104
- input: ["text"],
4324
+ input: ["text", "image"],
4105
4325
  cost: {
4106
- input: 0,
4107
- output: 0,
4108
- cacheRead: 0,
4326
+ input: 0.25,
4327
+ output: 2,
4328
+ cacheRead: 0.025,
4109
4329
  cacheWrite: 0,
4110
4330
  },
4111
- contextWindow: 128000,
4112
- maxTokens: 64000,
4331
+ contextWindow: 400000,
4332
+ maxTokens: 128000,
4113
4333
  },
4114
4334
  },
4115
4335
  "google": {
@@ -4838,7 +5058,7 @@ export const MODELS = {
4838
5058
  cost: {
4839
5059
  input: 1,
4840
5060
  output: 3,
4841
- cacheRead: 0,
5061
+ cacheRead: 0.5,
4842
5062
  cacheWrite: 0,
4843
5063
  },
4844
5064
  contextWindow: 262144,
@@ -4855,7 +5075,7 @@ export const MODELS = {
4855
5075
  cost: {
4856
5076
  input: 0.15,
4857
5077
  output: 0.6,
4858
- cacheRead: 0,
5078
+ cacheRead: 0.075,
4859
5079
  cacheWrite: 0,
4860
5080
  },
4861
5081
  contextWindow: 131072,
@@ -4872,7 +5092,7 @@ export const MODELS = {
4872
5092
  cost: {
4873
5093
  input: 0.075,
4874
5094
  output: 0.3,
4875
- cacheRead: 0,
5095
+ cacheRead: 0.0375,
4876
5096
  cacheWrite: 0,
4877
5097
  },
4878
5098
  contextWindow: 131072,
@@ -5158,9 +5378,9 @@ export const MODELS = {
5158
5378
  reasoning: true,
5159
5379
  input: ["text"],
5160
5380
  cost: {
5161
- input: 1.74,
5162
- output: 3.48,
5163
- cacheRead: 0.145,
5381
+ input: 0.435,
5382
+ output: 0.87,
5383
+ cacheRead: 0.003625,
5164
5384
  cacheWrite: 0,
5165
5385
  },
5166
5386
  contextWindow: 1048576,
@@ -5474,6 +5694,23 @@ export const MODELS = {
5474
5694
  contextWindow: 262144,
5475
5695
  maxTokens: 262144,
5476
5696
  },
5697
+ "devstral-latest": {
5698
+ id: "devstral-latest",
5699
+ name: "Devstral 2",
5700
+ api: "mistral-conversations",
5701
+ provider: "mistral",
5702
+ baseUrl: "https://api.mistral.ai",
5703
+ reasoning: false,
5704
+ input: ["text"],
5705
+ cost: {
5706
+ input: 0.4,
5707
+ output: 2,
5708
+ cacheRead: 0,
5709
+ cacheWrite: 0,
5710
+ },
5711
+ contextWindow: 262144,
5712
+ maxTokens: 262144,
5713
+ },
5477
5714
  "devstral-medium-2507": {
5478
5715
  id: "devstral-medium-2507",
5479
5716
  name: "Devstral Medium",
@@ -5752,11 +5989,11 @@ export const MODELS = {
5752
5989
  api: "mistral-conversations",
5753
5990
  provider: "mistral",
5754
5991
  baseUrl: "https://api.mistral.ai",
5755
- reasoning: true,
5992
+ reasoning: false,
5756
5993
  input: ["text", "image"],
5757
5994
  cost: {
5758
- input: 1.5,
5759
- output: 7.5,
5995
+ input: 0.4,
5996
+ output: 2,
5760
5997
  cacheRead: 0,
5761
5998
  cacheWrite: 0,
5762
5999
  },
@@ -5848,9 +6085,26 @@ export const MODELS = {
5848
6085
  contextWindow: 8000,
5849
6086
  maxTokens: 8000,
5850
6087
  },
5851
- "open-mixtral-8x22b": {
5852
- id: "open-mixtral-8x22b",
5853
- name: "Mixtral 8x22B",
6088
+ "open-mistral-nemo": {
6089
+ id: "open-mistral-nemo",
6090
+ name: "Open Mistral Nemo",
6091
+ api: "mistral-conversations",
6092
+ provider: "mistral",
6093
+ baseUrl: "https://api.mistral.ai",
6094
+ reasoning: false,
6095
+ input: ["text"],
6096
+ cost: {
6097
+ input: 0.15,
6098
+ output: 0.15,
6099
+ cacheRead: 0,
6100
+ cacheWrite: 0,
6101
+ },
6102
+ contextWindow: 128000,
6103
+ maxTokens: 128000,
6104
+ },
6105
+ "open-mixtral-8x22b": {
6106
+ id: "open-mixtral-8x22b",
6107
+ name: "Mixtral 8x22B",
5854
6108
  api: "mistral-conversations",
5855
6109
  provider: "mistral",
5856
6110
  baseUrl: "https://api.mistral.ai",
@@ -6253,7 +6507,7 @@ export const MODELS = {
6253
6507
  cost: {
6254
6508
  input: 0.1,
6255
6509
  output: 0.4,
6256
- cacheRead: 0.03,
6510
+ cacheRead: 0.025,
6257
6511
  cacheWrite: 0,
6258
6512
  },
6259
6513
  contextWindow: 1047576,
@@ -6338,7 +6592,7 @@ export const MODELS = {
6338
6592
  cost: {
6339
6593
  input: 0.15,
6340
6594
  output: 0.6,
6341
- cacheRead: 0.08,
6595
+ cacheRead: 0.075,
6342
6596
  cacheWrite: 0,
6343
6597
  },
6344
6598
  contextWindow: 128000,
@@ -6464,7 +6718,7 @@ export const MODELS = {
6464
6718
  cost: {
6465
6719
  input: 1.25,
6466
6720
  output: 10,
6467
- cacheRead: 0.13,
6721
+ cacheRead: 0.125,
6468
6722
  cacheWrite: 0,
6469
6723
  },
6470
6724
  contextWindow: 400000,
@@ -6747,7 +7001,7 @@ export const MODELS = {
6747
7001
  provider: "openai",
6748
7002
  baseUrl: "https://api.openai.com/v1",
6749
7003
  reasoning: true,
6750
- thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7004
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh", "minimal": null },
6751
7005
  input: ["text", "image"],
6752
7006
  cost: {
6753
7007
  input: 5,
@@ -6765,7 +7019,7 @@ export const MODELS = {
6765
7019
  provider: "openai",
6766
7020
  baseUrl: "https://api.openai.com/v1",
6767
7021
  reasoning: true,
6768
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
7022
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
6769
7023
  input: ["text", "image"],
6770
7024
  cost: {
6771
7025
  input: 30,
@@ -6889,7 +7143,7 @@ export const MODELS = {
6889
7143
  cost: {
6890
7144
  input: 1.1,
6891
7145
  output: 4.4,
6892
- cacheRead: 0.28,
7146
+ cacheRead: 0.275,
6893
7147
  cacheWrite: 0,
6894
7148
  },
6895
7149
  contextWindow: 200000,
@@ -6965,7 +7219,7 @@ export const MODELS = {
6965
7219
  cacheRead: 0.175,
6966
7220
  cacheWrite: 0,
6967
7221
  },
6968
- contextWindow: 272000,
7222
+ contextWindow: 128000,
6969
7223
  maxTokens: 128000,
6970
7224
  },
6971
7225
  "gpt-5.4": {
@@ -7039,7 +7293,7 @@ export const MODELS = {
7039
7293
  cacheWrite: 0,
7040
7294
  },
7041
7295
  contextWindow: 200000,
7042
- maxTokens: 128000,
7296
+ maxTokens: 32000,
7043
7297
  },
7044
7298
  "claude-haiku-4-5": {
7045
7299
  id: "claude-haiku-4-5",
@@ -7098,6 +7352,7 @@ export const MODELS = {
7098
7352
  api: "anthropic-messages",
7099
7353
  provider: "opencode",
7100
7354
  baseUrl: "https://opencode.ai/zen",
7355
+ compat: { "forceAdaptiveThinking": true },
7101
7356
  reasoning: true,
7102
7357
  thinkingLevelMap: { "xhigh": "max" },
7103
7358
  input: ["text", "image"],
@@ -7116,6 +7371,7 @@ export const MODELS = {
7116
7371
  api: "anthropic-messages",
7117
7372
  provider: "opencode",
7118
7373
  baseUrl: "https://opencode.ai/zen",
7374
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7119
7375
  reasoning: true,
7120
7376
  thinkingLevelMap: { "xhigh": "xhigh" },
7121
7377
  input: ["text", "image"],
@@ -7128,6 +7384,24 @@ export const MODELS = {
7128
7384
  contextWindow: 1000000,
7129
7385
  maxTokens: 128000,
7130
7386
  },
7387
+ "claude-opus-4-8": {
7388
+ id: "claude-opus-4-8",
7389
+ name: "Claude Opus 4.8",
7390
+ api: "anthropic-messages",
7391
+ provider: "opencode",
7392
+ baseUrl: "https://opencode.ai/zen",
7393
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7394
+ reasoning: true,
7395
+ input: ["text", "image"],
7396
+ cost: {
7397
+ input: 5,
7398
+ output: 25,
7399
+ cacheRead: 0.5,
7400
+ cacheWrite: 6.25,
7401
+ },
7402
+ contextWindow: 1000000,
7403
+ maxTokens: 128000,
7404
+ },
7131
7405
  "claude-sonnet-4": {
7132
7406
  id: "claude-sonnet-4",
7133
7407
  name: "Claude Sonnet 4",
@@ -7168,6 +7442,7 @@ export const MODELS = {
7168
7442
  api: "anthropic-messages",
7169
7443
  provider: "opencode",
7170
7444
  baseUrl: "https://opencode.ai/zen",
7445
+ compat: { "forceAdaptiveThinking": true },
7171
7446
  reasoning: true,
7172
7447
  input: ["text", "image"],
7173
7448
  cost: {
@@ -7179,6 +7454,25 @@ export const MODELS = {
7179
7454
  contextWindow: 1000000,
7180
7455
  maxTokens: 64000,
7181
7456
  },
7457
+ "deepseek-v4-flash": {
7458
+ id: "deepseek-v4-flash",
7459
+ name: "DeepSeek V4 Flash",
7460
+ api: "openai-completions",
7461
+ provider: "opencode",
7462
+ baseUrl: "https://opencode.ai/zen/v1",
7463
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7464
+ reasoning: true,
7465
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7466
+ input: ["text"],
7467
+ cost: {
7468
+ input: 0.14,
7469
+ output: 0.28,
7470
+ cacheRead: 0.03,
7471
+ cacheWrite: 0,
7472
+ },
7473
+ contextWindow: 1000000,
7474
+ maxTokens: 384000,
7475
+ },
7182
7476
  "deepseek-v4-flash-free": {
7183
7477
  id: "deepseek-v4-flash-free",
7184
7478
  name: "DeepSeek V4 Flash Free",
@@ -7563,7 +7857,7 @@ export const MODELS = {
7563
7857
  provider: "opencode",
7564
7858
  baseUrl: "https://opencode.ai/zen/v1",
7565
7859
  reasoning: true,
7566
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
7860
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
7567
7861
  input: ["text", "image"],
7568
7862
  cost: {
7569
7863
  input: 30,
@@ -7580,7 +7874,9 @@ export const MODELS = {
7580
7874
  api: "openai-completions",
7581
7875
  provider: "opencode",
7582
7876
  baseUrl: "https://opencode.ai/zen/v1",
7877
+ compat: { "supportsReasoningEffort": false },
7583
7878
  reasoning: true,
7879
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
7584
7880
  input: ["text", "image"],
7585
7881
  cost: {
7586
7882
  input: 1,
@@ -7614,6 +7910,7 @@ export const MODELS = {
7614
7910
  api: "openai-completions",
7615
7911
  provider: "opencode",
7616
7912
  baseUrl: "https://opencode.ai/zen/v1",
7913
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
7617
7914
  reasoning: true,
7618
7915
  input: ["text", "image"],
7619
7916
  cost: {
@@ -7625,6 +7922,23 @@ export const MODELS = {
7625
7922
  contextWindow: 262144,
7626
7923
  maxTokens: 65536,
7627
7924
  },
7925
+ "mimo-v2.5-free": {
7926
+ id: "mimo-v2.5-free",
7927
+ name: "MiMo V2.5 Free",
7928
+ api: "openai-completions",
7929
+ provider: "opencode",
7930
+ baseUrl: "https://opencode.ai/zen/v1",
7931
+ reasoning: true,
7932
+ input: ["text", "image"],
7933
+ cost: {
7934
+ input: 0,
7935
+ output: 0,
7936
+ cacheRead: 0,
7937
+ cacheWrite: 0,
7938
+ },
7939
+ contextWindow: 200000,
7940
+ maxTokens: 32000,
7941
+ },
7628
7942
  "minimax-m2.5": {
7629
7943
  id: "minimax-m2.5",
7630
7944
  name: "MiniMax M2.5",
@@ -7659,9 +7973,26 @@ export const MODELS = {
7659
7973
  contextWindow: 204800,
7660
7974
  maxTokens: 131072,
7661
7975
  },
7662
- "nemotron-3-super-free": {
7663
- id: "nemotron-3-super-free",
7664
- name: "Nemotron 3 Super Free",
7976
+ "minimax-m3-free": {
7977
+ id: "minimax-m3-free",
7978
+ name: "MiniMax M3 Free",
7979
+ api: "anthropic-messages",
7980
+ provider: "opencode",
7981
+ baseUrl: "https://opencode.ai/zen",
7982
+ reasoning: true,
7983
+ input: ["text", "image"],
7984
+ cost: {
7985
+ input: 0,
7986
+ output: 0,
7987
+ cacheRead: 0,
7988
+ cacheWrite: 0,
7989
+ },
7990
+ contextWindow: 200000,
7991
+ maxTokens: 32000,
7992
+ },
7993
+ "nemotron-3-ultra-free": {
7994
+ id: "nemotron-3-ultra-free",
7995
+ name: "Nemotron 3 Ultra Free",
7665
7996
  api: "openai-completions",
7666
7997
  provider: "opencode",
7667
7998
  baseUrl: "https://opencode.ai/zen/v1",
@@ -7673,7 +8004,7 @@ export const MODELS = {
7673
8004
  cacheRead: 0,
7674
8005
  cacheWrite: 0,
7675
8006
  },
7676
- contextWindow: 204800,
8007
+ contextWindow: 1000000,
7677
8008
  maxTokens: 128000,
7678
8009
  },
7679
8010
  "qwen3.5-plus": {
@@ -7807,7 +8138,9 @@ export const MODELS = {
7807
8138
  api: "openai-completions",
7808
8139
  provider: "opencode-go",
7809
8140
  baseUrl: "https://opencode.ai/zen/go/v1",
8141
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
7810
8142
  reasoning: true,
8143
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
7811
8144
  input: ["text", "image"],
7812
8145
  cost: {
7813
8146
  input: 0.95,
@@ -7827,9 +8160,9 @@ export const MODELS = {
7827
8160
  reasoning: true,
7828
8161
  input: ["text", "image"],
7829
8162
  cost: {
7830
- input: 0.4,
7831
- output: 2,
7832
- cacheRead: 0.08,
8163
+ input: 0.14,
8164
+ output: 0.28,
8165
+ cacheRead: 0.0028,
7833
8166
  cacheWrite: 0,
7834
8167
  },
7835
8168
  contextWindow: 1000000,
@@ -7844,9 +8177,9 @@ export const MODELS = {
7844
8177
  reasoning: true,
7845
8178
  input: ["text"],
7846
8179
  cost: {
7847
- input: 1,
7848
- output: 3,
7849
- cacheRead: 0.2,
8180
+ input: 1.74,
8181
+ output: 3.48,
8182
+ cacheRead: 0.0145,
7850
8183
  cacheWrite: 0,
7851
8184
  },
7852
8185
  contextWindow: 1048576,
@@ -7886,23 +8219,22 @@ export const MODELS = {
7886
8219
  contextWindow: 204800,
7887
8220
  maxTokens: 131072,
7888
8221
  },
7889
- "qwen3.5-plus": {
7890
- id: "qwen3.5-plus",
7891
- name: "Qwen3.5 Plus",
7892
- api: "openai-completions",
8222
+ "minimax-m3": {
8223
+ id: "minimax-m3",
8224
+ name: "MiniMax M3",
8225
+ api: "anthropic-messages",
7893
8226
  provider: "opencode-go",
7894
- baseUrl: "https://opencode.ai/zen/go/v1",
7895
- compat: { "thinkingFormat": "qwen" },
8227
+ baseUrl: "https://opencode.ai/zen/go",
7896
8228
  reasoning: true,
7897
8229
  input: ["text", "image"],
7898
8230
  cost: {
7899
- input: 0.2,
7900
- output: 1.2,
7901
- cacheRead: 0.02,
7902
- cacheWrite: 0.25,
8231
+ input: 0.6,
8232
+ output: 2.4,
8233
+ cacheRead: 0.12,
8234
+ cacheWrite: 0,
7903
8235
  },
7904
- contextWindow: 262144,
7905
- maxTokens: 65536,
8236
+ contextWindow: 512000,
8237
+ maxTokens: 131072,
7906
8238
  },
7907
8239
  "qwen3.6-plus": {
7908
8240
  id: "qwen3.6-plus",
@@ -7919,7 +8251,41 @@ export const MODELS = {
7919
8251
  cacheRead: 0.05,
7920
8252
  cacheWrite: 0.625,
7921
8253
  },
7922
- contextWindow: 262144,
8254
+ contextWindow: 1000000,
8255
+ maxTokens: 65536,
8256
+ },
8257
+ "qwen3.7-max": {
8258
+ id: "qwen3.7-max",
8259
+ name: "Qwen3.7 Max",
8260
+ api: "anthropic-messages",
8261
+ provider: "opencode-go",
8262
+ baseUrl: "https://opencode.ai/zen/go",
8263
+ reasoning: true,
8264
+ input: ["text"],
8265
+ cost: {
8266
+ input: 2.5,
8267
+ output: 7.5,
8268
+ cacheRead: 0.5,
8269
+ cacheWrite: 3.125,
8270
+ },
8271
+ contextWindow: 1000000,
8272
+ maxTokens: 65536,
8273
+ },
8274
+ "qwen3.7-plus": {
8275
+ id: "qwen3.7-plus",
8276
+ name: "Qwen3.7 Plus",
8277
+ api: "anthropic-messages",
8278
+ provider: "opencode-go",
8279
+ baseUrl: "https://opencode.ai/zen/go",
8280
+ reasoning: true,
8281
+ input: ["text", "image"],
8282
+ cost: {
8283
+ input: 0.4,
8284
+ output: 1.6,
8285
+ cacheRead: 0.04,
8286
+ cacheWrite: 0.5,
8287
+ },
8288
+ contextWindow: 1000000,
7923
8289
  maxTokens: 65536,
7924
8290
  },
7925
8291
  },
@@ -7941,23 +8307,6 @@ export const MODELS = {
7941
8307
  contextWindow: 256000,
7942
8308
  maxTokens: 4096,
7943
8309
  },
7944
- "alibaba/tongyi-deepresearch-30b-a3b": {
7945
- id: "alibaba/tongyi-deepresearch-30b-a3b",
7946
- name: "Tongyi DeepResearch 30B A3B",
7947
- api: "openai-completions",
7948
- provider: "openrouter",
7949
- baseUrl: "https://openrouter.ai/api/v1",
7950
- reasoning: true,
7951
- input: ["text"],
7952
- cost: {
7953
- input: 0.09,
7954
- output: 0.44999999999999996,
7955
- cacheRead: 0.09,
7956
- cacheWrite: 0,
7957
- },
7958
- contextWindow: 131072,
7959
- maxTokens: 131072,
7960
- },
7961
8310
  "amazon/nova-2-lite-v1": {
7962
8311
  id: "amazon/nova-2-lite-v1",
7963
8312
  name: "Amazon: Nova 2 Lite",
@@ -8217,6 +8566,40 @@ export const MODELS = {
8217
8566
  contextWindow: 1000000,
8218
8567
  maxTokens: 128000,
8219
8568
  },
8569
+ "anthropic/claude-opus-4.8": {
8570
+ id: "anthropic/claude-opus-4.8",
8571
+ name: "Anthropic: Claude Opus 4.8",
8572
+ api: "openai-completions",
8573
+ provider: "openrouter",
8574
+ baseUrl: "https://openrouter.ai/api/v1",
8575
+ reasoning: true,
8576
+ input: ["text", "image"],
8577
+ cost: {
8578
+ input: 5,
8579
+ output: 25,
8580
+ cacheRead: 0.5,
8581
+ cacheWrite: 6.25,
8582
+ },
8583
+ contextWindow: 1000000,
8584
+ maxTokens: 128000,
8585
+ },
8586
+ "anthropic/claude-opus-4.8-fast": {
8587
+ id: "anthropic/claude-opus-4.8-fast",
8588
+ name: "Anthropic: Claude Opus 4.8 (Fast)",
8589
+ api: "openai-completions",
8590
+ provider: "openrouter",
8591
+ baseUrl: "https://openrouter.ai/api/v1",
8592
+ reasoning: true,
8593
+ input: ["text", "image"],
8594
+ cost: {
8595
+ input: 10,
8596
+ output: 50,
8597
+ cacheRead: 1,
8598
+ cacheWrite: 12.5,
8599
+ },
8600
+ contextWindow: 1000000,
8601
+ maxTokens: 128000,
8602
+ },
8220
8603
  "anthropic/claude-sonnet-4": {
8221
8604
  id: "anthropic/claude-sonnet-4",
8222
8605
  name: "Anthropic: Claude Sonnet 4",
@@ -8285,23 +8668,6 @@ export const MODELS = {
8285
8668
  contextWindow: 262144,
8286
8669
  maxTokens: 262144,
8287
8670
  },
8288
- "arcee-ai/trinity-large-thinking:free": {
8289
- id: "arcee-ai/trinity-large-thinking:free",
8290
- name: "Arcee AI: Trinity Large Thinking (free)",
8291
- api: "openai-completions",
8292
- provider: "openrouter",
8293
- baseUrl: "https://openrouter.ai/api/v1",
8294
- reasoning: true,
8295
- input: ["text"],
8296
- cost: {
8297
- input: 0,
8298
- output: 0,
8299
- cacheRead: 0,
8300
- cacheWrite: 0,
8301
- },
8302
- contextWindow: 262144,
8303
- maxTokens: 80000,
8304
- },
8305
8671
  "arcee-ai/trinity-mini": {
8306
8672
  id: "arcee-ai/trinity-mini",
8307
8673
  name: "Arcee AI: Trinity Mini",
@@ -8353,40 +8719,6 @@ export const MODELS = {
8353
8719
  contextWindow: 2000000,
8354
8720
  maxTokens: 30000,
8355
8721
  },
8356
- "baidu/cobuddy:free": {
8357
- id: "baidu/cobuddy:free",
8358
- name: "Baidu Qianfan: CoBuddy (free)",
8359
- api: "openai-completions",
8360
- provider: "openrouter",
8361
- baseUrl: "https://openrouter.ai/api/v1",
8362
- reasoning: true,
8363
- input: ["text"],
8364
- cost: {
8365
- input: 0,
8366
- output: 0,
8367
- cacheRead: 0,
8368
- cacheWrite: 0,
8369
- },
8370
- contextWindow: 131072,
8371
- maxTokens: 65536,
8372
- },
8373
- "baidu/ernie-4.5-21b-a3b": {
8374
- id: "baidu/ernie-4.5-21b-a3b",
8375
- name: "Baidu: ERNIE 4.5 21B A3B",
8376
- api: "openai-completions",
8377
- provider: "openrouter",
8378
- baseUrl: "https://openrouter.ai/api/v1",
8379
- reasoning: false,
8380
- input: ["text"],
8381
- cost: {
8382
- input: 0.07,
8383
- output: 0.28,
8384
- cacheRead: 0,
8385
- cacheWrite: 0,
8386
- },
8387
- contextWindow: 131072,
8388
- maxTokens: 8000,
8389
- },
8390
8722
  "baidu/ernie-4.5-vl-28b-a3b": {
8391
8723
  id: "baidu/ernie-4.5-vl-28b-a3b",
8392
8724
  name: "Baidu: ERNIE 4.5 VL 28B A3B",
@@ -8515,13 +8847,13 @@ export const MODELS = {
8515
8847
  reasoning: false,
8516
8848
  input: ["text"],
8517
8849
  cost: {
8518
- input: 0.32,
8519
- output: 0.8899999999999999,
8850
+ input: 0.20020000000000002,
8851
+ output: 0.8000999999999999,
8520
8852
  cacheRead: 0,
8521
8853
  cacheWrite: 0,
8522
8854
  },
8523
- contextWindow: 163840,
8524
- maxTokens: 16384,
8855
+ contextWindow: 131072,
8856
+ maxTokens: 16000,
8525
8857
  },
8526
8858
  "deepseek/deepseek-chat-v3-0324": {
8527
8859
  id: "deepseek/deepseek-chat-v3-0324",
@@ -8617,13 +8949,13 @@ export const MODELS = {
8617
8949
  reasoning: true,
8618
8950
  input: ["text"],
8619
8951
  cost: {
8620
- input: 0.252,
8621
- output: 0.378,
8622
- cacheRead: 0.0252,
8952
+ input: 0.2288,
8953
+ output: 0.3432,
8954
+ cacheRead: 0,
8623
8955
  cacheWrite: 0,
8624
8956
  },
8625
8957
  contextWindow: 131072,
8626
- maxTokens: 65536,
8958
+ maxTokens: 64000,
8627
8959
  },
8628
8960
  "deepseek/deepseek-v3.2-exp": {
8629
8961
  id: "deepseek/deepseek-v3.2-exp",
@@ -8648,37 +8980,18 @@ export const MODELS = {
8648
8980
  api: "openai-completions",
8649
8981
  provider: "openrouter",
8650
8982
  baseUrl: "https://openrouter.ai/api/v1",
8651
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8983
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8652
8984
  reasoning: true,
8653
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8985
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8654
8986
  input: ["text"],
8655
8987
  cost: {
8656
- input: 0.09999999999999999,
8657
- output: 0.19999999999999998,
8658
- cacheRead: 0.02,
8988
+ input: 0.0983,
8989
+ output: 0.1966,
8990
+ cacheRead: 0.019700000000000002,
8659
8991
  cacheWrite: 0,
8660
8992
  },
8661
8993
  contextWindow: 1048576,
8662
- maxTokens: 16384,
8663
- },
8664
- "deepseek/deepseek-v4-flash:free": {
8665
- id: "deepseek/deepseek-v4-flash:free",
8666
- name: "DeepSeek: DeepSeek V4 Flash (free)",
8667
- api: "openai-completions",
8668
- provider: "openrouter",
8669
- baseUrl: "https://openrouter.ai/api/v1",
8670
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8671
- reasoning: true,
8672
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8673
- input: ["text"],
8674
- cost: {
8675
- input: 0,
8676
- output: 0,
8677
- cacheRead: 0,
8678
- cacheWrite: 0,
8679
- },
8680
- contextWindow: 1048576,
8681
- maxTokens: 384000,
8994
+ maxTokens: 131072,
8682
8995
  },
8683
8996
  "deepseek/deepseek-v4-pro": {
8684
8997
  id: "deepseek/deepseek-v4-pro",
@@ -8686,9 +8999,9 @@ export const MODELS = {
8686
8999
  api: "openai-completions",
8687
9000
  provider: "openrouter",
8688
9001
  baseUrl: "https://openrouter.ai/api/v1",
8689
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
9002
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8690
9003
  reasoning: true,
8691
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
9004
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8692
9005
  input: ["text"],
8693
9006
  cost: {
8694
9007
  input: 0.435,
@@ -8716,40 +9029,6 @@ export const MODELS = {
8716
9029
  contextWindow: 32768,
8717
9030
  maxTokens: 4096,
8718
9031
  },
8719
- "google/gemini-2.0-flash-001": {
8720
- id: "google/gemini-2.0-flash-001",
8721
- name: "Google: Gemini 2.0 Flash",
8722
- api: "openai-completions",
8723
- provider: "openrouter",
8724
- baseUrl: "https://openrouter.ai/api/v1",
8725
- reasoning: false,
8726
- input: ["text", "image"],
8727
- cost: {
8728
- input: 0.09999999999999999,
8729
- output: 0.39999999999999997,
8730
- cacheRead: 0.024999999999999998,
8731
- cacheWrite: 0.08333333333333334,
8732
- },
8733
- contextWindow: 1000000,
8734
- maxTokens: 8192,
8735
- },
8736
- "google/gemini-2.0-flash-lite-001": {
8737
- id: "google/gemini-2.0-flash-lite-001",
8738
- name: "Google: Gemini 2.0 Flash Lite",
8739
- api: "openai-completions",
8740
- provider: "openrouter",
8741
- baseUrl: "https://openrouter.ai/api/v1",
8742
- reasoning: false,
8743
- input: ["text", "image"],
8744
- cost: {
8745
- input: 0.075,
8746
- output: 0.3,
8747
- cacheRead: 0,
8748
- cacheWrite: 0,
8749
- },
8750
- contextWindow: 1048576,
8751
- maxTokens: 8192,
8752
- },
8753
9032
  "google/gemini-2.5-flash": {
8754
9033
  id: "google/gemini-2.5-flash",
8755
9034
  name: "Google: Gemini 2.5 Flash",
@@ -9186,7 +9465,7 @@ export const MODELS = {
9186
9465
  input: ["text"],
9187
9466
  cost: {
9188
9467
  input: 0.02,
9189
- output: 0.049999999999999996,
9468
+ output: 0.03,
9190
9469
  cacheRead: 0,
9191
9470
  cacheWrite: 0,
9192
9471
  },
@@ -9227,6 +9506,23 @@ export const MODELS = {
9227
9506
  contextWindow: 131072,
9228
9507
  maxTokens: 4096,
9229
9508
  },
9509
+ "meta-llama/llama-4-maverick": {
9510
+ id: "meta-llama/llama-4-maverick",
9511
+ name: "Meta: Llama 4 Maverick",
9512
+ api: "openai-completions",
9513
+ provider: "openrouter",
9514
+ baseUrl: "https://openrouter.ai/api/v1",
9515
+ reasoning: false,
9516
+ input: ["text", "image"],
9517
+ cost: {
9518
+ input: 0.15,
9519
+ output: 0.6,
9520
+ cacheRead: 0,
9521
+ cacheWrite: 0,
9522
+ },
9523
+ contextWindow: 1048576,
9524
+ maxTokens: 16384,
9525
+ },
9230
9526
  "meta-llama/llama-4-scout": {
9231
9527
  id: "meta-llama/llama-4-scout",
9232
9528
  name: "Meta: Llama 4 Scout",
@@ -9312,39 +9608,39 @@ export const MODELS = {
9312
9608
  contextWindow: 204800,
9313
9609
  maxTokens: 196608,
9314
9610
  },
9315
- "minimax/minimax-m2.5:free": {
9316
- id: "minimax/minimax-m2.5:free",
9317
- name: "MiniMax: MiniMax M2.5 (free)",
9611
+ "minimax/minimax-m2.7": {
9612
+ id: "minimax/minimax-m2.7",
9613
+ name: "MiniMax: MiniMax M2.7",
9318
9614
  api: "openai-completions",
9319
9615
  provider: "openrouter",
9320
9616
  baseUrl: "https://openrouter.ai/api/v1",
9321
9617
  reasoning: true,
9322
9618
  input: ["text"],
9323
9619
  cost: {
9324
- input: 0,
9325
- output: 0,
9620
+ input: 0.27899999999999997,
9621
+ output: 1.2,
9326
9622
  cacheRead: 0,
9327
9623
  cacheWrite: 0,
9328
9624
  },
9329
9625
  contextWindow: 204800,
9330
- maxTokens: 8192,
9626
+ maxTokens: 131072,
9331
9627
  },
9332
- "minimax/minimax-m2.7": {
9333
- id: "minimax/minimax-m2.7",
9334
- name: "MiniMax: MiniMax M2.7",
9628
+ "minimax/minimax-m3": {
9629
+ id: "minimax/minimax-m3",
9630
+ name: "MiniMax: MiniMax M3",
9335
9631
  api: "openai-completions",
9336
9632
  provider: "openrouter",
9337
9633
  baseUrl: "https://openrouter.ai/api/v1",
9338
9634
  reasoning: true,
9339
- input: ["text"],
9635
+ input: ["text", "image"],
9340
9636
  cost: {
9341
- input: 0.27899999999999997,
9637
+ input: 0.3,
9342
9638
  output: 1.2,
9343
- cacheRead: 0,
9639
+ cacheRead: 0.06,
9344
9640
  cacheWrite: 0,
9345
9641
  },
9346
- contextWindow: 204800,
9347
- maxTokens: 131072,
9642
+ contextWindow: 1048576,
9643
+ maxTokens: 512000,
9348
9644
  },
9349
9645
  "mistralai/codestral-2508": {
9350
9646
  id: "mistralai/codestral-2508",
@@ -9380,40 +9676,6 @@ export const MODELS = {
9380
9676
  contextWindow: 262144,
9381
9677
  maxTokens: 4096,
9382
9678
  },
9383
- "mistralai/devstral-medium": {
9384
- id: "mistralai/devstral-medium",
9385
- name: "Mistral: Devstral Medium",
9386
- api: "openai-completions",
9387
- provider: "openrouter",
9388
- baseUrl: "https://openrouter.ai/api/v1",
9389
- reasoning: false,
9390
- input: ["text"],
9391
- cost: {
9392
- input: 0.39999999999999997,
9393
- output: 2,
9394
- cacheRead: 0.04,
9395
- cacheWrite: 0,
9396
- },
9397
- contextWindow: 131072,
9398
- maxTokens: 4096,
9399
- },
9400
- "mistralai/devstral-small": {
9401
- id: "mistralai/devstral-small",
9402
- name: "Mistral: Devstral Small 1.1",
9403
- api: "openai-completions",
9404
- provider: "openrouter",
9405
- baseUrl: "https://openrouter.ai/api/v1",
9406
- reasoning: false,
9407
- input: ["text"],
9408
- cost: {
9409
- input: 0.09999999999999999,
9410
- output: 0.3,
9411
- cacheRead: 0.01,
9412
- cacheWrite: 0,
9413
- },
9414
- contextWindow: 131072,
9415
- maxTokens: 4096,
9416
- },
9417
9679
  "mistralai/ministral-14b-2512": {
9418
9680
  id: "mistralai/ministral-14b-2512",
9419
9681
  name: "Mistral: Ministral 3 14B 2512",
@@ -9499,23 +9761,6 @@ export const MODELS = {
9499
9761
  contextWindow: 131072,
9500
9762
  maxTokens: 4096,
9501
9763
  },
9502
- "mistralai/mistral-large-2411": {
9503
- id: "mistralai/mistral-large-2411",
9504
- name: "Mistral Large 2411",
9505
- api: "openai-completions",
9506
- provider: "openrouter",
9507
- baseUrl: "https://openrouter.ai/api/v1",
9508
- reasoning: false,
9509
- input: ["text"],
9510
- cost: {
9511
- input: 2,
9512
- output: 6,
9513
- cacheRead: 0.19999999999999998,
9514
- cacheWrite: 0,
9515
- },
9516
- contextWindow: 131072,
9517
- maxTokens: 4096,
9518
- },
9519
9764
  "mistralai/mistral-large-2512": {
9520
9765
  id: "mistralai/mistral-large-2512",
9521
9766
  name: "Mistral: Mistral Large 3 2512",
@@ -9669,23 +9914,6 @@ export const MODELS = {
9669
9914
  contextWindow: 65536,
9670
9915
  maxTokens: 4096,
9671
9916
  },
9672
- "mistralai/pixtral-large-2411": {
9673
- id: "mistralai/pixtral-large-2411",
9674
- name: "Mistral: Pixtral Large 2411",
9675
- api: "openai-completions",
9676
- provider: "openrouter",
9677
- baseUrl: "https://openrouter.ai/api/v1",
9678
- reasoning: false,
9679
- input: ["text", "image"],
9680
- cost: {
9681
- input: 2,
9682
- output: 6,
9683
- cacheRead: 0.19999999999999998,
9684
- cacheWrite: 0,
9685
- },
9686
- contextWindow: 131072,
9687
- maxTokens: 4096,
9688
- },
9689
9917
  "mistralai/voxtral-small-24b-2507": {
9690
9918
  id: "mistralai/voxtral-small-24b-2507",
9691
9919
  name: "Mistral: Voxtral Small 24B 2507",
@@ -9777,16 +10005,35 @@ export const MODELS = {
9777
10005
  api: "openai-completions",
9778
10006
  provider: "openrouter",
9779
10007
  baseUrl: "https://openrouter.ai/api/v1",
10008
+ compat: { "supportsDeveloperRole": false },
9780
10009
  reasoning: true,
9781
10010
  input: ["text", "image"],
9782
10011
  cost: {
9783
- input: 0.73,
9784
- output: 3.49,
9785
- cacheRead: 0.25,
10012
+ input: 0.684,
10013
+ output: 3.42,
10014
+ cacheRead: 0.144,
10015
+ cacheWrite: 0,
10016
+ },
10017
+ contextWindow: 262144,
10018
+ maxTokens: 262144,
10019
+ },
10020
+ "moonshotai/kimi-k2.6:free": {
10021
+ id: "moonshotai/kimi-k2.6:free",
10022
+ name: "MoonshotAI: Kimi K2.6 (free)",
10023
+ api: "openai-completions",
10024
+ provider: "openrouter",
10025
+ baseUrl: "https://openrouter.ai/api/v1",
10026
+ compat: { "supportsDeveloperRole": false },
10027
+ reasoning: true,
10028
+ input: ["text", "image"],
10029
+ cost: {
10030
+ input: 0,
10031
+ output: 0,
10032
+ cacheRead: 0,
9786
10033
  cacheWrite: 0,
9787
10034
  },
9788
10035
  contextWindow: 262144,
9789
- maxTokens: 262142,
10036
+ maxTokens: 4096,
9790
10037
  },
9791
10038
  "nex-agi/deepseek-v3.1-nex-n1": {
9792
10039
  id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -9888,11 +10135,45 @@ export const MODELS = {
9888
10135
  cacheWrite: 0,
9889
10136
  },
9890
10137
  contextWindow: 1000000,
9891
- maxTokens: 4096,
10138
+ maxTokens: 4096,
10139
+ },
10140
+ "nvidia/nemotron-3-super-120b-a12b:free": {
10141
+ id: "nvidia/nemotron-3-super-120b-a12b:free",
10142
+ name: "NVIDIA: Nemotron 3 Super (free)",
10143
+ api: "openai-completions",
10144
+ provider: "openrouter",
10145
+ baseUrl: "https://openrouter.ai/api/v1",
10146
+ reasoning: true,
10147
+ input: ["text"],
10148
+ cost: {
10149
+ input: 0,
10150
+ output: 0,
10151
+ cacheRead: 0,
10152
+ cacheWrite: 0,
10153
+ },
10154
+ contextWindow: 1000000,
10155
+ maxTokens: 262144,
10156
+ },
10157
+ "nvidia/nemotron-3-ultra-550b-a55b": {
10158
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
10159
+ name: "NVIDIA: Nemotron 3 Ultra",
10160
+ api: "openai-completions",
10161
+ provider: "openrouter",
10162
+ baseUrl: "https://openrouter.ai/api/v1",
10163
+ reasoning: true,
10164
+ input: ["text"],
10165
+ cost: {
10166
+ input: 0.5,
10167
+ output: 2.5,
10168
+ cacheRead: 0.15,
10169
+ cacheWrite: 0,
10170
+ },
10171
+ contextWindow: 1000000,
10172
+ maxTokens: 16384,
9892
10173
  },
9893
- "nvidia/nemotron-3-super-120b-a12b:free": {
9894
- id: "nvidia/nemotron-3-super-120b-a12b:free",
9895
- name: "NVIDIA: Nemotron 3 Super (free)",
10174
+ "nvidia/nemotron-3-ultra-550b-a55b:free": {
10175
+ id: "nvidia/nemotron-3-ultra-550b-a55b:free",
10176
+ name: "NVIDIA: Nemotron 3 Ultra (free)",
9896
10177
  api: "openai-completions",
9897
10178
  provider: "openrouter",
9898
10179
  baseUrl: "https://openrouter.ai/api/v1",
@@ -9905,7 +10186,7 @@ export const MODELS = {
9905
10186
  cacheWrite: 0,
9906
10187
  },
9907
10188
  contextWindow: 1000000,
9908
- maxTokens: 262144,
10189
+ maxTokens: 65536,
9909
10190
  },
9910
10191
  "nvidia/nemotron-nano-12b-v2-vl:free": {
9911
10192
  id: "nvidia/nemotron-nano-12b-v2-vl:free",
@@ -10026,23 +10307,6 @@ export const MODELS = {
10026
10307
  contextWindow: 8191,
10027
10308
  maxTokens: 4096,
10028
10309
  },
10029
- "openai/gpt-4-0314": {
10030
- id: "openai/gpt-4-0314",
10031
- name: "OpenAI: GPT-4 (older v0314)",
10032
- api: "openai-completions",
10033
- provider: "openrouter",
10034
- baseUrl: "https://openrouter.ai/api/v1",
10035
- reasoning: false,
10036
- input: ["text"],
10037
- cost: {
10038
- input: 30,
10039
- output: 60,
10040
- cacheRead: 0,
10041
- cacheWrite: 0,
10042
- },
10043
- contextWindow: 8191,
10044
- maxTokens: 4096,
10045
- },
10046
10310
  "openai/gpt-4-1106-preview": {
10047
10311
  id: "openai/gpt-4-1106-preview",
10048
10312
  name: "OpenAI: GPT-4 Turbo (older v1106)",
@@ -10213,23 +10477,6 @@ export const MODELS = {
10213
10477
  contextWindow: 128000,
10214
10478
  maxTokens: 16384,
10215
10479
  },
10216
- "openai/gpt-4o-audio-preview": {
10217
- id: "openai/gpt-4o-audio-preview",
10218
- name: "OpenAI: GPT-4o Audio",
10219
- api: "openai-completions",
10220
- provider: "openrouter",
10221
- baseUrl: "https://openrouter.ai/api/v1",
10222
- reasoning: false,
10223
- input: ["text"],
10224
- cost: {
10225
- input: 2.5,
10226
- output: 10,
10227
- cacheRead: 0,
10228
- cacheWrite: 0,
10229
- },
10230
- contextWindow: 128000,
10231
- maxTokens: 16384,
10232
- },
10233
10480
  "openai/gpt-4o-mini": {
10234
10481
  id: "openai/gpt-4o-mini",
10235
10482
  name: "OpenAI: GPT-4o-mini",
@@ -10377,11 +10624,11 @@ export const MODELS = {
10377
10624
  cost: {
10378
10625
  input: 1.25,
10379
10626
  output: 10,
10380
- cacheRead: 0.125,
10627
+ cacheRead: 0.13,
10381
10628
  cacheWrite: 0,
10382
10629
  },
10383
10630
  contextWindow: 128000,
10384
- maxTokens: 16384,
10631
+ maxTokens: 32000,
10385
10632
  },
10386
10633
  "openai/gpt-5.1-codex": {
10387
10634
  id: "openai/gpt-5.1-codex",
@@ -10394,7 +10641,7 @@ export const MODELS = {
10394
10641
  cost: {
10395
10642
  input: 1.25,
10396
10643
  output: 10,
10397
- cacheRead: 0.125,
10644
+ cacheRead: 0.13,
10398
10645
  cacheWrite: 0,
10399
10646
  },
10400
10647
  contextWindow: 400000,
@@ -10428,11 +10675,11 @@ export const MODELS = {
10428
10675
  cost: {
10429
10676
  input: 0.25,
10430
10677
  output: 2,
10431
- cacheRead: 0.03,
10678
+ cacheRead: 0.024999999999999998,
10432
10679
  cacheWrite: 0,
10433
10680
  },
10434
10681
  contextWindow: 400000,
10435
- maxTokens: 128000,
10682
+ maxTokens: 100000,
10436
10683
  },
10437
10684
  "openai/gpt-5.2": {
10438
10685
  id: "openai/gpt-5.2",
@@ -10468,7 +10715,7 @@ export const MODELS = {
10468
10715
  cacheWrite: 0,
10469
10716
  },
10470
10717
  contextWindow: 128000,
10471
- maxTokens: 32000,
10718
+ maxTokens: 16384,
10472
10719
  },
10473
10720
  "openai/gpt-5.2-codex": {
10474
10721
  id: "openai/gpt-5.2-codex",
@@ -10639,7 +10886,7 @@ export const MODELS = {
10639
10886
  provider: "openrouter",
10640
10887
  baseUrl: "https://openrouter.ai/api/v1",
10641
10888
  reasoning: true,
10642
- thinkingLevelMap: { "xhigh": "xhigh" },
10889
+ thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
10643
10890
  input: ["text", "image"],
10644
10891
  cost: {
10645
10892
  input: 30,
@@ -10744,13 +10991,13 @@ export const MODELS = {
10744
10991
  reasoning: true,
10745
10992
  input: ["text"],
10746
10993
  cost: {
10747
- input: 0.03,
10994
+ input: 0.029,
10748
10995
  output: 0.14,
10749
10996
  cacheRead: 0,
10750
10997
  cacheWrite: 0,
10751
10998
  },
10752
10999
  contextWindow: 131072,
10753
- maxTokens: 131072,
11000
+ maxTokens: 4096,
10754
11001
  },
10755
11002
  "openai/gpt-oss-20b:free": {
10756
11003
  id: "openai/gpt-oss-20b:free",
@@ -11004,8 +11251,8 @@ export const MODELS = {
11004
11251
  cacheRead: 0,
11005
11252
  cacheWrite: 0,
11006
11253
  },
11007
- contextWindow: 131072,
11008
- maxTokens: 8192,
11254
+ contextWindow: 262144,
11255
+ maxTokens: 32768,
11009
11256
  },
11010
11257
  "poolside/laguna-xs.2:free": {
11011
11258
  id: "poolside/laguna-xs.2:free",
@@ -11021,8 +11268,8 @@ export const MODELS = {
11021
11268
  cacheRead: 0,
11022
11269
  cacheWrite: 0,
11023
11270
  },
11024
- contextWindow: 131072,
11025
- maxTokens: 8192,
11271
+ contextWindow: 262144,
11272
+ maxTokens: 32768,
11026
11273
  },
11027
11274
  "prime-intellect/intellect-3": {
11028
11275
  id: "prime-intellect/intellect-3",
@@ -11058,23 +11305,6 @@ export const MODELS = {
11058
11305
  contextWindow: 131072,
11059
11306
  maxTokens: 16384,
11060
11307
  },
11061
- "qwen/qwen-2.5-7b-instruct": {
11062
- id: "qwen/qwen-2.5-7b-instruct",
11063
- name: "Qwen: Qwen2.5 7B Instruct",
11064
- api: "openai-completions",
11065
- provider: "openrouter",
11066
- baseUrl: "https://openrouter.ai/api/v1",
11067
- reasoning: false,
11068
- input: ["text"],
11069
- cost: {
11070
- input: 0.04,
11071
- output: 0.09999999999999999,
11072
- cacheRead: 0,
11073
- cacheWrite: 0,
11074
- },
11075
- contextWindow: 131072,
11076
- maxTokens: 32768,
11077
- },
11078
11308
  "qwen/qwen-plus": {
11079
11309
  id: "qwen/qwen-plus",
11080
11310
  name: "Qwen: Qwen-Plus",
@@ -11104,7 +11334,7 @@ export const MODELS = {
11104
11334
  input: 0.26,
11105
11335
  output: 0.78,
11106
11336
  cacheRead: 0,
11107
- cacheWrite: 0.325,
11337
+ cacheWrite: 0,
11108
11338
  },
11109
11339
  contextWindow: 1000000,
11110
11340
  maxTokens: 32768,
@@ -11186,13 +11416,13 @@ export const MODELS = {
11186
11416
  reasoning: true,
11187
11417
  input: ["text"],
11188
11418
  cost: {
11189
- input: 0.14950000000000002,
11190
- output: 1.495,
11191
- cacheRead: 0,
11419
+ input: 0.09999999999999999,
11420
+ output: 0.09999999999999999,
11421
+ cacheRead: 0.09999999999999999,
11192
11422
  cacheWrite: 0,
11193
11423
  },
11194
11424
  contextWindow: 262144,
11195
- maxTokens: 4096,
11425
+ maxTokens: 262144,
11196
11426
  },
11197
11427
  "qwen/qwen3-30b-a3b": {
11198
11428
  id: "qwen/qwen3-30b-a3b",
@@ -11209,7 +11439,7 @@ export const MODELS = {
11209
11439
  cacheWrite: 0,
11210
11440
  },
11211
11441
  contextWindow: 131072,
11212
- maxTokens: 20000,
11442
+ maxTokens: 16384,
11213
11443
  },
11214
11444
  "qwen/qwen3-30b-a3b-instruct-2507": {
11215
11445
  id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -11220,13 +11450,13 @@ export const MODELS = {
11220
11450
  reasoning: false,
11221
11451
  input: ["text"],
11222
11452
  cost: {
11223
- input: 0.09,
11224
- output: 0.3,
11453
+ input: 0.04815,
11454
+ output: 0.19305,
11225
11455
  cacheRead: 0,
11226
11456
  cacheWrite: 0,
11227
11457
  },
11228
- contextWindow: 262144,
11229
- maxTokens: 262144,
11458
+ contextWindow: 131072,
11459
+ maxTokens: 32000,
11230
11460
  },
11231
11461
  "qwen/qwen3-30b-a3b-thinking-2507": {
11232
11462
  id: "qwen/qwen3-30b-a3b-thinking-2507",
@@ -11628,13 +11858,13 @@ export const MODELS = {
11628
11858
  reasoning: true,
11629
11859
  input: ["text", "image"],
11630
11860
  cost: {
11631
- input: 0.13899999999999998,
11861
+ input: 0.14,
11632
11862
  output: 1,
11633
- cacheRead: 0,
11863
+ cacheRead: 0.049999999999999996,
11634
11864
  cacheWrite: 0,
11635
11865
  },
11636
11866
  contextWindow: 262144,
11637
- maxTokens: 4096,
11867
+ maxTokens: 262144,
11638
11868
  },
11639
11869
  "qwen/qwen3.5-397b-a17b": {
11640
11870
  id: "qwen/qwen3.5-397b-a17b",
@@ -11682,7 +11912,7 @@ export const MODELS = {
11682
11912
  input: 0.065,
11683
11913
  output: 0.26,
11684
11914
  cacheRead: 0,
11685
- cacheWrite: 0.08125,
11915
+ cacheWrite: 0,
11686
11916
  },
11687
11917
  contextWindow: 1000000,
11688
11918
  maxTokens: 65536,
@@ -11699,7 +11929,7 @@ export const MODELS = {
11699
11929
  input: 0.26,
11700
11930
  output: 1.56,
11701
11931
  cacheRead: 0,
11702
- cacheWrite: 0.325,
11932
+ cacheWrite: 0,
11703
11933
  },
11704
11934
  contextWindow: 1000000,
11705
11935
  maxTokens: 65536,
@@ -11716,7 +11946,7 @@ export const MODELS = {
11716
11946
  input: 0.3,
11717
11947
  output: 1.7999999999999998,
11718
11948
  cacheRead: 0,
11719
- cacheWrite: 0,
11949
+ cacheWrite: 0.375,
11720
11950
  },
11721
11951
  contextWindow: 1000000,
11722
11952
  maxTokens: 65536,
@@ -11730,13 +11960,13 @@ export const MODELS = {
11730
11960
  reasoning: true,
11731
11961
  input: ["text", "image"],
11732
11962
  cost: {
11733
- input: 0.3,
11963
+ input: 0.29,
11734
11964
  output: 3.1999999999999997,
11735
11965
  cacheRead: 0,
11736
11966
  cacheWrite: 0,
11737
11967
  },
11738
11968
  contextWindow: 262144,
11739
- maxTokens: 262144,
11969
+ maxTokens: 262140,
11740
11970
  },
11741
11971
  "qwen/qwen3.6-35b-a3b": {
11742
11972
  id: "qwen/qwen3.6-35b-a3b",
@@ -11747,7 +11977,7 @@ export const MODELS = {
11747
11977
  reasoning: true,
11748
11978
  input: ["text", "image"],
11749
11979
  cost: {
11750
- input: 0.15,
11980
+ input: 0.14,
11751
11981
  output: 1,
11752
11982
  cacheRead: 0,
11753
11983
  cacheWrite: 0,
@@ -11815,10 +12045,27 @@ export const MODELS = {
11815
12045
  reasoning: true,
11816
12046
  input: ["text"],
11817
12047
  cost: {
11818
- input: 2.5,
11819
- output: 7.5,
11820
- cacheRead: 0,
11821
- cacheWrite: 3.125,
12048
+ input: 1.25,
12049
+ output: 3.75,
12050
+ cacheRead: 0.25,
12051
+ cacheWrite: 1.5625,
12052
+ },
12053
+ contextWindow: 1000000,
12054
+ maxTokens: 65536,
12055
+ },
12056
+ "qwen/qwen3.7-plus": {
12057
+ id: "qwen/qwen3.7-plus",
12058
+ name: "Qwen: Qwen3.7 Plus",
12059
+ api: "openai-completions",
12060
+ provider: "openrouter",
12061
+ baseUrl: "https://openrouter.ai/api/v1",
12062
+ reasoning: true,
12063
+ input: ["text", "image"],
12064
+ cost: {
12065
+ input: 0.39999999999999997,
12066
+ output: 1.5999999999999999,
12067
+ cacheRead: 0.08,
12068
+ cacheWrite: 0.5,
11822
12069
  },
11823
12070
  contextWindow: 1000000,
11824
12071
  maxTokens: 65536,
@@ -11908,6 +12155,23 @@ export const MODELS = {
11908
12155
  contextWindow: 262144,
11909
12156
  maxTokens: 16384,
11910
12157
  },
12158
+ "stepfun/step-3.7-flash": {
12159
+ id: "stepfun/step-3.7-flash",
12160
+ name: "StepFun: Step 3.7 Flash",
12161
+ api: "openai-completions",
12162
+ provider: "openrouter",
12163
+ baseUrl: "https://openrouter.ai/api/v1",
12164
+ reasoning: true,
12165
+ input: ["text", "image"],
12166
+ cost: {
12167
+ input: 0.19999999999999998,
12168
+ output: 1.15,
12169
+ cacheRead: 0.04,
12170
+ cacheWrite: 0,
12171
+ },
12172
+ contextWindow: 256000,
12173
+ maxTokens: 256000,
12174
+ },
11911
12175
  "tencent/hy3-preview": {
11912
12176
  id: "tencent/hy3-preview",
11913
12177
  name: "Tencent: Hy3 preview",
@@ -11917,13 +12181,13 @@ export const MODELS = {
11917
12181
  reasoning: true,
11918
12182
  input: ["text"],
11919
12183
  cost: {
11920
- input: 0.06599999999999999,
11921
- output: 0.26,
11922
- cacheRead: 0.029,
12184
+ input: 0.063,
12185
+ output: 0.21,
12186
+ cacheRead: 0.020999999999999998,
11923
12187
  cacheWrite: 0,
11924
12188
  },
11925
12189
  contextWindow: 262144,
11926
- maxTokens: 262144,
12190
+ maxTokens: 4096,
11927
12191
  },
11928
12192
  "thedrummer/rocinante-12b": {
11929
12193
  id: "thedrummer/rocinante-12b",
@@ -12044,40 +12308,6 @@ export const MODELS = {
12044
12308
  contextWindow: 262144,
12045
12309
  maxTokens: 65536,
12046
12310
  },
12047
- "xiaomi/mimo-v2-omni": {
12048
- id: "xiaomi/mimo-v2-omni",
12049
- name: "Xiaomi: MiMo-V2-Omni",
12050
- api: "openai-completions",
12051
- provider: "openrouter",
12052
- baseUrl: "https://openrouter.ai/api/v1",
12053
- reasoning: true,
12054
- input: ["text", "image"],
12055
- cost: {
12056
- input: 0.39999999999999997,
12057
- output: 2,
12058
- cacheRead: 0.08,
12059
- cacheWrite: 0,
12060
- },
12061
- contextWindow: 262144,
12062
- maxTokens: 65536,
12063
- },
12064
- "xiaomi/mimo-v2-pro": {
12065
- id: "xiaomi/mimo-v2-pro",
12066
- name: "Xiaomi: MiMo-V2-Pro",
12067
- api: "openai-completions",
12068
- provider: "openrouter",
12069
- baseUrl: "https://openrouter.ai/api/v1",
12070
- reasoning: true,
12071
- input: ["text"],
12072
- cost: {
12073
- input: 1,
12074
- output: 3,
12075
- cacheRead: 0.19999999999999998,
12076
- cacheWrite: 0,
12077
- },
12078
- contextWindow: 1048576,
12079
- maxTokens: 131072,
12080
- },
12081
12311
  "xiaomi/mimo-v2.5": {
12082
12312
  id: "xiaomi/mimo-v2.5",
12083
12313
  name: "Xiaomi: MiMo-V2.5",
@@ -12087,9 +12317,9 @@ export const MODELS = {
12087
12317
  reasoning: true,
12088
12318
  input: ["text", "image"],
12089
12319
  cost: {
12090
- input: 0.39999999999999997,
12091
- output: 2,
12092
- cacheRead: 0.08,
12320
+ input: 0.14,
12321
+ output: 0.28,
12322
+ cacheRead: 0.0028,
12093
12323
  cacheWrite: 0,
12094
12324
  },
12095
12325
  contextWindow: 1048576,
@@ -12104,13 +12334,13 @@ export const MODELS = {
12104
12334
  reasoning: true,
12105
12335
  input: ["text"],
12106
12336
  cost: {
12107
- input: 1,
12108
- output: 3,
12109
- cacheRead: 0.19999999999999998,
12337
+ input: 0.435,
12338
+ output: 0.87,
12339
+ cacheRead: 0.0036,
12110
12340
  cacheWrite: 0,
12111
12341
  },
12112
12342
  contextWindow: 1048576,
12113
- maxTokens: 16384,
12343
+ maxTokens: 131072,
12114
12344
  },
12115
12345
  "z-ai/glm-4-32b": {
12116
12346
  id: "z-ai/glm-4-32b",
@@ -12155,13 +12385,13 @@ export const MODELS = {
12155
12385
  reasoning: true,
12156
12386
  input: ["text"],
12157
12387
  cost: {
12158
- input: 0.13,
12388
+ input: 0.125,
12159
12389
  output: 0.85,
12160
- cacheRead: 0.024999999999999998,
12390
+ cacheRead: 0.06,
12161
12391
  cacheWrite: 0,
12162
12392
  },
12163
12393
  contextWindow: 131072,
12164
- maxTokens: 98304,
12394
+ maxTokens: 131070,
12165
12395
  },
12166
12396
  "z-ai/glm-4.5-air:free": {
12167
12397
  id: "z-ai/glm-4.5-air:free",
@@ -12427,13 +12657,13 @@ export const MODELS = {
12427
12657
  reasoning: true,
12428
12658
  input: ["text", "image"],
12429
12659
  cost: {
12430
- input: 0.73,
12431
- output: 3.49,
12432
- cacheRead: 0.25,
12660
+ input: 0.684,
12661
+ output: 3.42,
12662
+ cacheRead: 0.144,
12433
12663
  cacheWrite: 0,
12434
12664
  },
12435
12665
  contextWindow: 262144,
12436
- maxTokens: 262142,
12666
+ maxTokens: 262144,
12437
12667
  },
12438
12668
  "~openai/gpt-latest": {
12439
12669
  id: "~openai/gpt-latest",
@@ -12624,7 +12854,7 @@ export const MODELS = {
12624
12854
  },
12625
12855
  "deepseek-ai/DeepSeek-V3": {
12626
12856
  id: "deepseek-ai/DeepSeek-V3",
12627
- name: "DeepSeek V3",
12857
+ name: "DeepSeek-V3",
12628
12858
  api: "openai-completions",
12629
12859
  provider: "together",
12630
12860
  baseUrl: "https://api.together.ai/v1",
@@ -12772,6 +13002,25 @@ export const MODELS = {
12772
13002
  contextWindow: 262144,
12773
13003
  maxTokens: 131000,
12774
13004
  },
13005
+ "nvidia/nemotron-3-ultra-550b-a55b": {
13006
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
13007
+ name: "Nemotron 3 Ultra 550B A55B",
13008
+ api: "openai-completions",
13009
+ provider: "together",
13010
+ baseUrl: "https://api.together.ai/v1",
13011
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13012
+ reasoning: true,
13013
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13014
+ input: ["text"],
13015
+ cost: {
13016
+ input: 0.6,
13017
+ output: 3.6,
13018
+ cacheRead: 0.2,
13019
+ cacheWrite: 0,
13020
+ },
13021
+ contextWindow: 512300,
13022
+ maxTokens: 512300,
13023
+ },
12775
13024
  "openai/gpt-oss-120b": {
12776
13025
  id: "openai/gpt-oss-120b",
12777
13026
  name: "GPT OSS 120B",
@@ -12831,20 +13080,20 @@ export const MODELS = {
12831
13080
  },
12832
13081
  "alibaba/qwen-3-235b": {
12833
13082
  id: "alibaba/qwen-3-235b",
12834
- name: "Qwen3 235B A22b Instruct 2507",
13083
+ name: "Qwen3 235B A22B",
12835
13084
  api: "anthropic-messages",
12836
13085
  provider: "vercel-ai-gateway",
12837
13086
  baseUrl: "https://ai-gateway.vercel.sh",
12838
- reasoning: false,
13087
+ reasoning: true,
12839
13088
  input: ["text"],
12840
13089
  cost: {
12841
- input: 0.6,
12842
- output: 1.2,
12843
- cacheRead: 0.6,
13090
+ input: 0.22,
13091
+ output: 0.88,
13092
+ cacheRead: 0,
12844
13093
  cacheWrite: 0,
12845
13094
  },
12846
- contextWindow: 131000,
12847
- maxTokens: 40000,
13095
+ contextWindow: 262144,
13096
+ maxTokens: 16384,
12848
13097
  },
12849
13098
  "alibaba/qwen-3-30b": {
12850
13099
  id: "alibaba/qwen-3-30b",
@@ -12887,7 +13136,7 @@ export const MODELS = {
12887
13136
  provider: "vercel-ai-gateway",
12888
13137
  baseUrl: "https://ai-gateway.vercel.sh",
12889
13138
  reasoning: true,
12890
- input: ["text", "image"],
13139
+ input: ["text"],
12891
13140
  cost: {
12892
13141
  input: 1.3,
12893
13142
  output: 7.8,
@@ -12920,7 +13169,7 @@ export const MODELS = {
12920
13169
  api: "anthropic-messages",
12921
13170
  provider: "vercel-ai-gateway",
12922
13171
  baseUrl: "https://ai-gateway.vercel.sh",
12923
- reasoning: false,
13172
+ reasoning: true,
12924
13173
  input: ["text"],
12925
13174
  cost: {
12926
13175
  input: 1.5,
@@ -12954,7 +13203,7 @@ export const MODELS = {
12954
13203
  api: "anthropic-messages",
12955
13204
  provider: "vercel-ai-gateway",
12956
13205
  baseUrl: "https://ai-gateway.vercel.sh",
12957
- reasoning: false,
13206
+ reasoning: true,
12958
13207
  input: ["text"],
12959
13208
  cost: {
12960
13209
  input: 0.5,
@@ -13013,25 +13262,59 @@ export const MODELS = {
13013
13262
  cacheRead: 0.24,
13014
13263
  cacheWrite: 0,
13015
13264
  },
13016
- contextWindow: 262144,
13265
+ contextWindow: 262144,
13266
+ maxTokens: 32768,
13267
+ },
13268
+ "alibaba/qwen3-max-thinking": {
13269
+ id: "alibaba/qwen3-max-thinking",
13270
+ name: "Qwen 3 Max Thinking",
13271
+ api: "anthropic-messages",
13272
+ provider: "vercel-ai-gateway",
13273
+ baseUrl: "https://ai-gateway.vercel.sh",
13274
+ reasoning: true,
13275
+ input: ["text"],
13276
+ cost: {
13277
+ input: 1.2,
13278
+ output: 6,
13279
+ cacheRead: 0.24,
13280
+ cacheWrite: 0,
13281
+ },
13282
+ contextWindow: 256000,
13283
+ maxTokens: 65536,
13284
+ },
13285
+ "alibaba/qwen3-next-80b-a3b-instruct": {
13286
+ id: "alibaba/qwen3-next-80b-a3b-instruct",
13287
+ name: "Qwen3 Next 80B A3B Instruct",
13288
+ api: "anthropic-messages",
13289
+ provider: "vercel-ai-gateway",
13290
+ baseUrl: "https://ai-gateway.vercel.sh",
13291
+ reasoning: false,
13292
+ input: ["text"],
13293
+ cost: {
13294
+ input: 0.15,
13295
+ output: 1.2,
13296
+ cacheRead: 0,
13297
+ cacheWrite: 0,
13298
+ },
13299
+ contextWindow: 131072,
13017
13300
  maxTokens: 32768,
13018
13301
  },
13019
- "alibaba/qwen3-max-thinking": {
13020
- id: "alibaba/qwen3-max-thinking",
13021
- name: "Qwen 3 Max Thinking",
13302
+ "alibaba/qwen3-next-80b-a3b-thinking": {
13303
+ id: "alibaba/qwen3-next-80b-a3b-thinking",
13304
+ name: "Qwen3 Next 80B A3B Thinking",
13022
13305
  api: "anthropic-messages",
13023
13306
  provider: "vercel-ai-gateway",
13024
13307
  baseUrl: "https://ai-gateway.vercel.sh",
13025
13308
  reasoning: true,
13026
13309
  input: ["text"],
13027
13310
  cost: {
13028
- input: 1.2,
13029
- output: 6,
13030
- cacheRead: 0.24,
13311
+ input: 0.15,
13312
+ output: 1.2,
13313
+ cacheRead: 0,
13031
13314
  cacheWrite: 0,
13032
13315
  },
13033
- contextWindow: 256000,
13034
- maxTokens: 65536,
13316
+ contextWindow: 131072,
13317
+ maxTokens: 32768,
13035
13318
  },
13036
13319
  "alibaba/qwen3-vl-thinking": {
13037
13320
  id: "alibaba/qwen3-vl-thinking",
@@ -13125,7 +13408,7 @@ export const MODELS = {
13125
13408
  provider: "vercel-ai-gateway",
13126
13409
  baseUrl: "https://ai-gateway.vercel.sh",
13127
13410
  reasoning: true,
13128
- input: ["text", "image"],
13411
+ input: ["text"],
13129
13412
  cost: {
13130
13413
  input: 1.25,
13131
13414
  output: 3.75,
@@ -13135,6 +13418,23 @@ export const MODELS = {
13135
13418
  contextWindow: 991000,
13136
13419
  maxTokens: 64000,
13137
13420
  },
13421
+ "alibaba/qwen3.7-plus": {
13422
+ id: "alibaba/qwen3.7-plus",
13423
+ name: "Qwen 3.7 Plus",
13424
+ api: "anthropic-messages",
13425
+ provider: "vercel-ai-gateway",
13426
+ baseUrl: "https://ai-gateway.vercel.sh",
13427
+ reasoning: true,
13428
+ input: ["text", "image"],
13429
+ cost: {
13430
+ input: 0.39999999999999997,
13431
+ output: 1.5999999999999999,
13432
+ cacheRead: 0.08,
13433
+ cacheWrite: 0.5,
13434
+ },
13435
+ contextWindow: 1000000,
13436
+ maxTokens: 64000,
13437
+ },
13138
13438
  "anthropic/claude-3-haiku": {
13139
13439
  id: "anthropic/claude-3-haiku",
13140
13440
  name: "Claude 3 Haiku",
@@ -13243,6 +13543,7 @@ export const MODELS = {
13243
13543
  api: "anthropic-messages",
13244
13544
  provider: "vercel-ai-gateway",
13245
13545
  baseUrl: "https://ai-gateway.vercel.sh",
13546
+ compat: { "forceAdaptiveThinking": true },
13246
13547
  reasoning: true,
13247
13548
  thinkingLevelMap: { "xhigh": "max" },
13248
13549
  input: ["text", "image"],
@@ -13261,6 +13562,7 @@ export const MODELS = {
13261
13562
  api: "anthropic-messages",
13262
13563
  provider: "vercel-ai-gateway",
13263
13564
  baseUrl: "https://ai-gateway.vercel.sh",
13565
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13264
13566
  reasoning: true,
13265
13567
  thinkingLevelMap: { "xhigh": "xhigh" },
13266
13568
  input: ["text", "image"],
@@ -13273,6 +13575,24 @@ export const MODELS = {
13273
13575
  contextWindow: 1000000,
13274
13576
  maxTokens: 128000,
13275
13577
  },
13578
+ "anthropic/claude-opus-4.8": {
13579
+ id: "anthropic/claude-opus-4.8",
13580
+ name: "Claude Opus 4.8",
13581
+ api: "anthropic-messages",
13582
+ provider: "vercel-ai-gateway",
13583
+ baseUrl: "https://ai-gateway.vercel.sh",
13584
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13585
+ reasoning: true,
13586
+ input: ["text", "image"],
13587
+ cost: {
13588
+ input: 5,
13589
+ output: 25,
13590
+ cacheRead: 0.5,
13591
+ cacheWrite: 6.25,
13592
+ },
13593
+ contextWindow: 1000000,
13594
+ maxTokens: 128000,
13595
+ },
13276
13596
  "anthropic/claude-sonnet-4": {
13277
13597
  id: "anthropic/claude-sonnet-4",
13278
13598
  name: "Claude Sonnet 4",
@@ -13313,6 +13633,7 @@ export const MODELS = {
13313
13633
  api: "anthropic-messages",
13314
13634
  provider: "vercel-ai-gateway",
13315
13635
  baseUrl: "https://ai-gateway.vercel.sh",
13636
+ compat: { "forceAdaptiveThinking": true },
13316
13637
  reasoning: true,
13317
13638
  input: ["text", "image"],
13318
13639
  cost: {
@@ -13418,17 +13739,17 @@ export const MODELS = {
13418
13739
  reasoning: false,
13419
13740
  input: ["text"],
13420
13741
  cost: {
13421
- input: 0.77,
13422
- output: 0.77,
13423
- cacheRead: 0,
13742
+ input: 0.27,
13743
+ output: 1.12,
13744
+ cacheRead: 0.135,
13424
13745
  cacheWrite: 0,
13425
13746
  },
13426
13747
  contextWindow: 163840,
13427
- maxTokens: 16384,
13748
+ maxTokens: 163840,
13428
13749
  },
13429
13750
  "deepseek/deepseek-v3.1": {
13430
13751
  id: "deepseek/deepseek-v3.1",
13431
- name: "DeepSeek-V3.1",
13752
+ name: "DeepSeek V3.1",
13432
13753
  api: "anthropic-messages",
13433
13754
  provider: "vercel-ai-gateway",
13434
13755
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -13466,8 +13787,8 @@ export const MODELS = {
13466
13787
  api: "anthropic-messages",
13467
13788
  provider: "vercel-ai-gateway",
13468
13789
  baseUrl: "https://ai-gateway.vercel.sh",
13469
- reasoning: false,
13470
- input: ["text"],
13790
+ reasoning: true,
13791
+ input: ["text", "image"],
13471
13792
  cost: {
13472
13793
  input: 0.28,
13473
13794
  output: 0.42,
@@ -13483,8 +13804,8 @@ export const MODELS = {
13483
13804
  api: "anthropic-messages",
13484
13805
  provider: "vercel-ai-gateway",
13485
13806
  baseUrl: "https://ai-gateway.vercel.sh",
13486
- reasoning: false,
13487
- input: ["text"],
13807
+ reasoning: true,
13808
+ input: ["text", "image"],
13488
13809
  cost: {
13489
13810
  input: 0.62,
13490
13811
  output: 1.85,
@@ -13501,7 +13822,7 @@ export const MODELS = {
13501
13822
  provider: "vercel-ai-gateway",
13502
13823
  baseUrl: "https://ai-gateway.vercel.sh",
13503
13824
  reasoning: true,
13504
- input: ["text"],
13825
+ input: ["text", "image"],
13505
13826
  cost: {
13506
13827
  input: 0.14,
13507
13828
  output: 0.28,
@@ -13721,12 +14042,12 @@ export const MODELS = {
13721
14042
  api: "anthropic-messages",
13722
14043
  provider: "vercel-ai-gateway",
13723
14044
  baseUrl: "https://ai-gateway.vercel.sh",
13724
- reasoning: false,
14045
+ reasoning: true,
13725
14046
  input: ["text", "image"],
13726
14047
  cost: {
13727
- input: 0.13,
13728
- output: 0.39999999999999997,
13729
- cacheRead: 0,
14048
+ input: 0.15,
14049
+ output: 0.6,
14050
+ cacheRead: 0.015,
13730
14051
  cacheWrite: 0,
13731
14052
  },
13732
14053
  contextWindow: 262144,
@@ -14028,7 +14349,7 @@ export const MODELS = {
14028
14349
  provider: "vercel-ai-gateway",
14029
14350
  baseUrl: "https://ai-gateway.vercel.sh",
14030
14351
  reasoning: true,
14031
- input: ["text", "image"],
14352
+ input: ["text"],
14032
14353
  cost: {
14033
14354
  input: 0.3,
14034
14355
  output: 1.2,
@@ -14045,7 +14366,7 @@ export const MODELS = {
14045
14366
  provider: "vercel-ai-gateway",
14046
14367
  baseUrl: "https://ai-gateway.vercel.sh",
14047
14368
  reasoning: true,
14048
- input: ["text", "image"],
14369
+ input: ["text"],
14049
14370
  cost: {
14050
14371
  input: 0.6,
14051
14372
  output: 2.4,
@@ -14055,6 +14376,23 @@ export const MODELS = {
14055
14376
  contextWindow: 204800,
14056
14377
  maxTokens: 131100,
14057
14378
  },
14379
+ "minimax/minimax-m3": {
14380
+ id: "minimax/minimax-m3",
14381
+ name: "MiniMax M3",
14382
+ api: "anthropic-messages",
14383
+ provider: "vercel-ai-gateway",
14384
+ baseUrl: "https://ai-gateway.vercel.sh",
14385
+ reasoning: true,
14386
+ input: ["text", "image"],
14387
+ cost: {
14388
+ input: 0.3,
14389
+ output: 1.2,
14390
+ cacheRead: 0.06,
14391
+ cacheWrite: 0,
14392
+ },
14393
+ contextWindow: 1000000,
14394
+ maxTokens: 1000000,
14395
+ },
14058
14396
  "mistral/codestral": {
14059
14397
  id: "mistral/codestral",
14060
14398
  name: "Mistral Codestral",
@@ -14191,6 +14529,23 @@ export const MODELS = {
14191
14529
  contextWindow: 256000,
14192
14530
  maxTokens: 256000,
14193
14531
  },
14532
+ "mistral/mistral-nemo": {
14533
+ id: "mistral/mistral-nemo",
14534
+ name: "Mistral Nemo 12B",
14535
+ api: "anthropic-messages",
14536
+ provider: "vercel-ai-gateway",
14537
+ baseUrl: "https://ai-gateway.vercel.sh",
14538
+ reasoning: false,
14539
+ input: ["text"],
14540
+ cost: {
14541
+ input: 0.02,
14542
+ output: 0.04,
14543
+ cacheRead: 0,
14544
+ cacheWrite: 0,
14545
+ },
14546
+ contextWindow: 131072,
14547
+ maxTokens: 131072,
14548
+ },
14194
14549
  "mistral/mistral-small": {
14195
14550
  id: "mistral/mistral-small",
14196
14551
  name: "Mistral Small",
@@ -14344,6 +14699,40 @@ export const MODELS = {
14344
14699
  contextWindow: 262000,
14345
14700
  maxTokens: 262000,
14346
14701
  },
14702
+ "nvidia/nemotron-3-super-120b-a12b": {
14703
+ id: "nvidia/nemotron-3-super-120b-a12b",
14704
+ name: "NVIDIA Nemotron 3 Super 120B A12B",
14705
+ api: "anthropic-messages",
14706
+ provider: "vercel-ai-gateway",
14707
+ baseUrl: "https://ai-gateway.vercel.sh",
14708
+ reasoning: true,
14709
+ input: ["text"],
14710
+ cost: {
14711
+ input: 0.15,
14712
+ output: 0.65,
14713
+ cacheRead: 0,
14714
+ cacheWrite: 0,
14715
+ },
14716
+ contextWindow: 256000,
14717
+ maxTokens: 32000,
14718
+ },
14719
+ "nvidia/nemotron-3-ultra-550b-a55b": {
14720
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
14721
+ name: "Nemotron 3 Ultra",
14722
+ api: "anthropic-messages",
14723
+ provider: "vercel-ai-gateway",
14724
+ baseUrl: "https://ai-gateway.vercel.sh",
14725
+ reasoning: true,
14726
+ input: ["text"],
14727
+ cost: {
14728
+ input: 0.6,
14729
+ output: 2.4,
14730
+ cacheRead: 0.12,
14731
+ cacheWrite: 0,
14732
+ },
14733
+ contextWindow: 1000000,
14734
+ maxTokens: 65000,
14735
+ },
14347
14736
  "nvidia/nemotron-nano-12b-v2-vl": {
14348
14737
  id: "nvidia/nemotron-nano-12b-v2-vl",
14349
14738
  name: "Nvidia Nemotron Nano 12B V2 VL",
@@ -14521,7 +14910,7 @@ export const MODELS = {
14521
14910
  provider: "vercel-ai-gateway",
14522
14911
  baseUrl: "https://ai-gateway.vercel.sh",
14523
14912
  reasoning: true,
14524
- input: ["text"],
14913
+ input: ["text", "image"],
14525
14914
  cost: {
14526
14915
  input: 1.25,
14527
14916
  output: 10,
@@ -14872,7 +15261,7 @@ export const MODELS = {
14872
15261
  provider: "vercel-ai-gateway",
14873
15262
  baseUrl: "https://ai-gateway.vercel.sh",
14874
15263
  reasoning: true,
14875
- thinkingLevelMap: { "xhigh": "xhigh" },
15264
+ thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
14876
15265
  input: ["text", "image"],
14877
15266
  cost: {
14878
15267
  input: 30,
@@ -14883,6 +15272,23 @@ export const MODELS = {
14883
15272
  contextWindow: 1000000,
14884
15273
  maxTokens: 128000,
14885
15274
  },
15275
+ "openai/gpt-oss-120b": {
15276
+ id: "openai/gpt-oss-120b",
15277
+ name: "GPT OSS 120B",
15278
+ api: "anthropic-messages",
15279
+ provider: "vercel-ai-gateway",
15280
+ baseUrl: "https://ai-gateway.vercel.sh",
15281
+ reasoning: true,
15282
+ input: ["text"],
15283
+ cost: {
15284
+ input: 0.35,
15285
+ output: 0.75,
15286
+ cacheRead: 0.25,
15287
+ cacheWrite: 0,
15288
+ },
15289
+ contextWindow: 131072,
15290
+ maxTokens: 131000,
15291
+ },
14886
15292
  "openai/gpt-oss-20b": {
14887
15293
  id: "openai/gpt-oss-20b",
14888
15294
  name: "GPT OSS 20B",
@@ -15053,6 +15459,40 @@ export const MODELS = {
15053
15459
  contextWindow: 200000,
15054
15460
  maxTokens: 8000,
15055
15461
  },
15462
+ "stepfun/step-3.5-flash": {
15463
+ id: "stepfun/step-3.5-flash",
15464
+ name: "StepFun 3.5 Flash",
15465
+ api: "anthropic-messages",
15466
+ provider: "vercel-ai-gateway",
15467
+ baseUrl: "https://ai-gateway.vercel.sh",
15468
+ reasoning: true,
15469
+ input: ["text"],
15470
+ cost: {
15471
+ input: 0.09,
15472
+ output: 0.3,
15473
+ cacheRead: 0,
15474
+ cacheWrite: 0.02,
15475
+ },
15476
+ contextWindow: 262114,
15477
+ maxTokens: 262114,
15478
+ },
15479
+ "stepfun/step-3.7-flash": {
15480
+ id: "stepfun/step-3.7-flash",
15481
+ name: "Step 3.7 Flash",
15482
+ api: "anthropic-messages",
15483
+ provider: "vercel-ai-gateway",
15484
+ baseUrl: "https://ai-gateway.vercel.sh",
15485
+ reasoning: true,
15486
+ input: ["text", "image"],
15487
+ cost: {
15488
+ input: 0.19999999999999998,
15489
+ output: 1.15,
15490
+ cacheRead: 0.04,
15491
+ cacheWrite: 0,
15492
+ },
15493
+ contextWindow: 256000,
15494
+ maxTokens: 256000,
15495
+ },
15056
15496
  "xai/grok-4.1-fast-non-reasoning": {
15057
15497
  id: "xai/grok-4.1-fast-non-reasoning",
15058
15498
  name: "Grok 4.1 Fast Non-Reasoning",
@@ -15266,9 +15706,9 @@ export const MODELS = {
15266
15706
  reasoning: true,
15267
15707
  input: ["text", "image"],
15268
15708
  cost: {
15269
- input: 0.39999999999999997,
15270
- output: 2,
15271
- cacheRead: 0.08,
15709
+ input: 0.14,
15710
+ output: 0.28,
15711
+ cacheRead: 0.0028,
15272
15712
  cacheWrite: 0,
15273
15713
  },
15274
15714
  contextWindow: 1050000,
@@ -15283,9 +15723,9 @@ export const MODELS = {
15283
15723
  reasoning: true,
15284
15724
  input: ["text", "image"],
15285
15725
  cost: {
15286
- input: 1,
15287
- output: 3,
15288
- cacheRead: 0.19999999999999998,
15726
+ input: 0.435,
15727
+ output: 0.87,
15728
+ cacheRead: 0.0036,
15289
15729
  cacheWrite: 0,
15290
15730
  },
15291
15731
  contextWindow: 1050000,
@@ -15331,7 +15771,7 @@ export const MODELS = {
15331
15771
  api: "anthropic-messages",
15332
15772
  provider: "vercel-ai-gateway",
15333
15773
  baseUrl: "https://ai-gateway.vercel.sh",
15334
- reasoning: false,
15774
+ reasoning: true,
15335
15775
  input: ["text", "image"],
15336
15776
  cost: {
15337
15777
  input: 0.6,
@@ -15485,7 +15925,7 @@ export const MODELS = {
15485
15925
  provider: "vercel-ai-gateway",
15486
15926
  baseUrl: "https://ai-gateway.vercel.sh",
15487
15927
  reasoning: true,
15488
- input: ["text"],
15928
+ input: ["text", "image"],
15489
15929
  cost: {
15490
15930
  input: 1.4,
15491
15931
  output: 4.4,
@@ -15727,24 +16167,6 @@ export const MODELS = {
15727
16167
  },
15728
16168
  },
15729
16169
  "xiaomi-token-plan-ams": {
15730
- "mimo-v2-flash": {
15731
- id: "mimo-v2-flash",
15732
- name: "MiMo-V2-Flash",
15733
- api: "openai-completions",
15734
- provider: "xiaomi-token-plan-ams",
15735
- baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
15736
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15737
- reasoning: true,
15738
- input: ["text"],
15739
- cost: {
15740
- input: 0.1,
15741
- output: 0.3,
15742
- cacheRead: 0.01,
15743
- cacheWrite: 0,
15744
- },
15745
- contextWindow: 262144,
15746
- maxTokens: 65536,
15747
- },
15748
16170
  "mimo-v2-omni": {
15749
16171
  id: "mimo-v2-omni",
15750
16172
  name: "MiMo-V2-Omni",
@@ -15819,24 +16241,6 @@ export const MODELS = {
15819
16241
  },
15820
16242
  },
15821
16243
  "xiaomi-token-plan-cn": {
15822
- "mimo-v2-flash": {
15823
- id: "mimo-v2-flash",
15824
- name: "MiMo-V2-Flash",
15825
- api: "openai-completions",
15826
- provider: "xiaomi-token-plan-cn",
15827
- baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
15828
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15829
- reasoning: true,
15830
- input: ["text"],
15831
- cost: {
15832
- input: 0.1,
15833
- output: 0.3,
15834
- cacheRead: 0.01,
15835
- cacheWrite: 0,
15836
- },
15837
- contextWindow: 262144,
15838
- maxTokens: 65536,
15839
- },
15840
16244
  "mimo-v2-omni": {
15841
16245
  id: "mimo-v2-omni",
15842
16246
  name: "MiMo-V2-Omni",
@@ -15911,24 +16315,6 @@ export const MODELS = {
15911
16315
  },
15912
16316
  },
15913
16317
  "xiaomi-token-plan-sgp": {
15914
- "mimo-v2-flash": {
15915
- id: "mimo-v2-flash",
15916
- name: "MiMo-V2-Flash",
15917
- api: "openai-completions",
15918
- provider: "xiaomi-token-plan-sgp",
15919
- baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
15920
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15921
- reasoning: true,
15922
- input: ["text"],
15923
- cost: {
15924
- input: 0.1,
15925
- output: 0.3,
15926
- cacheRead: 0.01,
15927
- cacheWrite: 0,
15928
- },
15929
- contextWindow: 262144,
15930
- maxTokens: 65536,
15931
- },
15932
16318
  "mimo-v2-omni": {
15933
16319
  id: "mimo-v2-omni",
15934
16320
  name: "MiMo-V2-Omni",