@fleetagent/pi-ai 0.0.6 → 0.0.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (42) hide show
  1. package/README.md +1 -1
  2. package/dist/image-models.generated.d.ts +15 -0
  3. package/dist/image-models.generated.d.ts.map +1 -1
  4. package/dist/image-models.generated.js +15 -0
  5. package/dist/image-models.generated.js.map +1 -1
  6. package/dist/models.generated.d.ts +754 -376
  7. package/dist/models.generated.d.ts.map +1 -1
  8. package/dist/models.generated.js +987 -690
  9. package/dist/models.generated.js.map +1 -1
  10. package/dist/providers/anthropic.d.ts.map +1 -1
  11. package/dist/providers/anthropic.js +21 -12
  12. package/dist/providers/anthropic.js.map +1 -1
  13. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  14. package/dist/providers/azure-openai-responses.js +1 -1
  15. package/dist/providers/azure-openai-responses.js.map +1 -1
  16. package/dist/providers/images/openrouter.d.ts.map +1 -1
  17. package/dist/providers/images/openrouter.js +1 -1
  18. package/dist/providers/images/openrouter.js.map +1 -1
  19. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  20. package/dist/providers/openai-codex-responses.js +163 -81
  21. package/dist/providers/openai-codex-responses.js.map +1 -1
  22. package/dist/providers/openai-completions.d.ts.map +1 -1
  23. package/dist/providers/openai-completions.js +14 -4
  24. package/dist/providers/openai-completions.js.map +1 -1
  25. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  26. package/dist/providers/openai-responses-shared.js +4 -1
  27. package/dist/providers/openai-responses-shared.js.map +1 -1
  28. package/dist/providers/openai-responses.d.ts.map +1 -1
  29. package/dist/providers/openai-responses.js +1 -1
  30. package/dist/providers/openai-responses.js.map +1 -1
  31. package/dist/types.d.ts +26 -2
  32. package/dist/types.d.ts.map +1 -1
  33. package/dist/types.js.map +1 -1
  34. package/dist/utils/abort-signals.d.ts +6 -0
  35. package/dist/utils/abort-signals.d.ts.map +1 -0
  36. package/dist/utils/abort-signals.js +34 -0
  37. package/dist/utils/abort-signals.js.map +1 -0
  38. package/dist/utils/overflow.d.ts +2 -1
  39. package/dist/utils/overflow.d.ts.map +1 -1
  40. package/dist/utils/overflow.js +5 -2
  41. package/dist/utils/overflow.js.map +1 -1
  42. package/package.json +2 -1
@@ -157,6 +157,23 @@ export const MODELS = {
157
157
  contextWindow: 1000000,
158
158
  maxTokens: 128000,
159
159
  },
160
+ "anthropic.claude-opus-4-8": {
161
+ id: "anthropic.claude-opus-4-8",
162
+ name: "Claude Opus 4.8",
163
+ api: "bedrock-converse-stream",
164
+ provider: "amazon-bedrock",
165
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
166
+ reasoning: true,
167
+ input: ["text", "image"],
168
+ cost: {
169
+ input: 5,
170
+ output: 25,
171
+ cacheRead: 0.5,
172
+ cacheWrite: 6.25,
173
+ },
174
+ contextWindow: 1000000,
175
+ maxTokens: 128000,
176
+ },
160
177
  "anthropic.claude-sonnet-4-5-20250929-v1:0": {
161
178
  id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
162
179
  name: "Claude Sonnet 4.5",
@@ -226,6 +243,23 @@ export const MODELS = {
226
243
  contextWindow: 1000000,
227
244
  maxTokens: 128000,
228
245
  },
246
+ "au.anthropic.claude-opus-4-8": {
247
+ id: "au.anthropic.claude-opus-4-8",
248
+ name: "Claude Opus 4.8 (AU)",
249
+ api: "bedrock-converse-stream",
250
+ provider: "amazon-bedrock",
251
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
252
+ reasoning: true,
253
+ input: ["text", "image"],
254
+ cost: {
255
+ input: 5,
256
+ output: 25,
257
+ cacheRead: 0.5,
258
+ cacheWrite: 6.25,
259
+ },
260
+ contextWindow: 1000000,
261
+ maxTokens: 128000,
262
+ },
229
263
  "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
230
264
  id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
231
265
  name: "Claude Sonnet 4.5 (AU)",
@@ -355,8 +389,8 @@ export const MODELS = {
355
389
  thinkingLevelMap: { "xhigh": "max" },
356
390
  input: ["text", "image"],
357
391
  cost: {
358
- input: 5,
359
- output: 25,
392
+ input: 5.5,
393
+ output: 27.5,
360
394
  cacheRead: 0.5,
361
395
  cacheWrite: 6.25,
362
396
  },
@@ -373,10 +407,27 @@ export const MODELS = {
373
407
  thinkingLevelMap: { "xhigh": "xhigh" },
374
408
  input: ["text", "image"],
375
409
  cost: {
376
- input: 5,
377
- output: 25,
378
- cacheRead: 0.5,
379
- cacheWrite: 6.25,
410
+ input: 5.5,
411
+ output: 27.5,
412
+ cacheRead: 0.55,
413
+ cacheWrite: 6.875,
414
+ },
415
+ contextWindow: 1000000,
416
+ maxTokens: 128000,
417
+ },
418
+ "eu.anthropic.claude-opus-4-8": {
419
+ id: "eu.anthropic.claude-opus-4-8",
420
+ name: "Claude Opus 4.8 (EU)",
421
+ api: "bedrock-converse-stream",
422
+ provider: "amazon-bedrock",
423
+ baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
424
+ reasoning: true,
425
+ input: ["text", "image"],
426
+ cost: {
427
+ input: 5.5,
428
+ output: 27.5,
429
+ cacheRead: 0.55,
430
+ cacheWrite: 6.875,
380
431
  },
381
432
  contextWindow: 1000000,
382
433
  maxTokens: 128000,
@@ -390,10 +441,10 @@ export const MODELS = {
390
441
  reasoning: true,
391
442
  input: ["text", "image"],
392
443
  cost: {
393
- input: 3,
394
- output: 15,
395
- cacheRead: 0.3,
396
- cacheWrite: 3.75,
444
+ input: 3.3,
445
+ output: 16.5,
446
+ cacheRead: 0.33,
447
+ cacheWrite: 4.125,
397
448
  },
398
449
  contextWindow: 200000,
399
450
  maxTokens: 64000,
@@ -407,10 +458,10 @@ export const MODELS = {
407
458
  reasoning: true,
408
459
  input: ["text", "image"],
409
460
  cost: {
410
- input: 3,
411
- output: 15,
412
- cacheRead: 0.3,
413
- cacheWrite: 3.75,
461
+ input: 3.3,
462
+ output: 16.5,
463
+ cacheRead: 0.33,
464
+ cacheWrite: 4.125,
414
465
  },
415
466
  contextWindow: 1000000,
416
467
  maxTokens: 64000,
@@ -485,6 +536,23 @@ export const MODELS = {
485
536
  contextWindow: 1000000,
486
537
  maxTokens: 128000,
487
538
  },
539
+ "global.anthropic.claude-opus-4-8": {
540
+ id: "global.anthropic.claude-opus-4-8",
541
+ name: "Claude Opus 4.8 (Global)",
542
+ api: "bedrock-converse-stream",
543
+ provider: "amazon-bedrock",
544
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
545
+ reasoning: true,
546
+ input: ["text", "image"],
547
+ cost: {
548
+ input: 5,
549
+ output: 25,
550
+ cacheRead: 0.5,
551
+ cacheWrite: 6.25,
552
+ },
553
+ contextWindow: 1000000,
554
+ maxTokens: 128000,
555
+ },
488
556
  "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
489
557
  id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
490
558
  name: "Claude Sonnet 4.5 (Global)",
@@ -571,6 +639,23 @@ export const MODELS = {
571
639
  contextWindow: 1000000,
572
640
  maxTokens: 128000,
573
641
  },
642
+ "jp.anthropic.claude-opus-4-8": {
643
+ id: "jp.anthropic.claude-opus-4-8",
644
+ name: "Claude Opus 4.8 (JP)",
645
+ api: "bedrock-converse-stream",
646
+ provider: "amazon-bedrock",
647
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
648
+ reasoning: true,
649
+ input: ["text", "image"],
650
+ cost: {
651
+ input: 5,
652
+ output: 25,
653
+ cacheRead: 0.5,
654
+ cacheWrite: 6.25,
655
+ },
656
+ contextWindow: 1000000,
657
+ maxTokens: 128000,
658
+ },
574
659
  "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
575
660
  id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
576
661
  name: "Claude Sonnet 4.5 (JP)",
@@ -1270,6 +1355,23 @@ export const MODELS = {
1270
1355
  contextWindow: 1000000,
1271
1356
  maxTokens: 128000,
1272
1357
  },
1358
+ "us.anthropic.claude-opus-4-8": {
1359
+ id: "us.anthropic.claude-opus-4-8",
1360
+ name: "Claude Opus 4.8 (US)",
1361
+ api: "bedrock-converse-stream",
1362
+ provider: "amazon-bedrock",
1363
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1364
+ reasoning: true,
1365
+ input: ["text", "image"],
1366
+ cost: {
1367
+ input: 5,
1368
+ output: 25,
1369
+ cacheRead: 0.5,
1370
+ cacheWrite: 6.25,
1371
+ },
1372
+ contextWindow: 1000000,
1373
+ maxTokens: 128000,
1374
+ },
1273
1375
  "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1274
1376
  id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1275
1377
  name: "Claude Sonnet 4.5 (US)",
@@ -1720,6 +1822,7 @@ export const MODELS = {
1720
1822
  api: "anthropic-messages",
1721
1823
  provider: "anthropic",
1722
1824
  baseUrl: "https://api.anthropic.com",
1825
+ compat: { "forceAdaptiveThinking": true },
1723
1826
  reasoning: true,
1724
1827
  thinkingLevelMap: { "xhigh": "max" },
1725
1828
  input: ["text", "image"],
@@ -1738,6 +1841,7 @@ export const MODELS = {
1738
1841
  api: "anthropic-messages",
1739
1842
  provider: "anthropic",
1740
1843
  baseUrl: "https://api.anthropic.com",
1844
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1741
1845
  reasoning: true,
1742
1846
  thinkingLevelMap: { "xhigh": "xhigh" },
1743
1847
  input: ["text", "image"],
@@ -1750,6 +1854,24 @@ export const MODELS = {
1750
1854
  contextWindow: 1000000,
1751
1855
  maxTokens: 128000,
1752
1856
  },
1857
+ "claude-opus-4-8": {
1858
+ id: "claude-opus-4-8",
1859
+ name: "Claude Opus 4.8",
1860
+ api: "anthropic-messages",
1861
+ provider: "anthropic",
1862
+ baseUrl: "https://api.anthropic.com",
1863
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1864
+ reasoning: true,
1865
+ input: ["text", "image"],
1866
+ cost: {
1867
+ input: 5,
1868
+ output: 25,
1869
+ cacheRead: 0.5,
1870
+ cacheWrite: 6.25,
1871
+ },
1872
+ contextWindow: 1000000,
1873
+ maxTokens: 128000,
1874
+ },
1753
1875
  "claude-sonnet-4-0": {
1754
1876
  id: "claude-sonnet-4-0",
1755
1877
  name: "Claude Sonnet 4 (latest)",
@@ -1824,6 +1946,7 @@ export const MODELS = {
1824
1946
  api: "anthropic-messages",
1825
1947
  provider: "anthropic",
1826
1948
  baseUrl: "https://api.anthropic.com",
1949
+ compat: { "forceAdaptiveThinking": true },
1827
1950
  reasoning: true,
1828
1951
  input: ["text", "image"],
1829
1952
  cost: {
@@ -1916,7 +2039,7 @@ export const MODELS = {
1916
2039
  cost: {
1917
2040
  input: 0.1,
1918
2041
  output: 0.4,
1919
- cacheRead: 0.03,
2042
+ cacheRead: 0.025,
1920
2043
  cacheWrite: 0,
1921
2044
  },
1922
2045
  contextWindow: 1047576,
@@ -2001,7 +2124,7 @@ export const MODELS = {
2001
2124
  cost: {
2002
2125
  input: 0.15,
2003
2126
  output: 0.6,
2004
- cacheRead: 0.08,
2127
+ cacheRead: 0.075,
2005
2128
  cacheWrite: 0,
2006
2129
  },
2007
2130
  contextWindow: 128000,
@@ -2127,7 +2250,7 @@ export const MODELS = {
2127
2250
  cost: {
2128
2251
  input: 1.25,
2129
2252
  output: 10,
2130
- cacheRead: 0.13,
2253
+ cacheRead: 0.125,
2131
2254
  cacheWrite: 0,
2132
2255
  },
2133
2256
  contextWindow: 400000,
@@ -2428,7 +2551,7 @@ export const MODELS = {
2428
2551
  provider: "azure-openai-responses",
2429
2552
  baseUrl: "",
2430
2553
  reasoning: true,
2431
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
2554
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
2432
2555
  input: ["text", "image"],
2433
2556
  cost: {
2434
2557
  input: 30,
@@ -2552,7 +2675,7 @@ export const MODELS = {
2552
2675
  cost: {
2553
2676
  input: 1.1,
2554
2677
  output: 4.4,
2555
- cacheRead: 0.28,
2678
+ cacheRead: 0.275,
2556
2679
  cacheWrite: 0,
2557
2680
  },
2558
2681
  contextWindow: 200000,
@@ -2611,23 +2734,6 @@ export const MODELS = {
2611
2734
  contextWindow: 32000,
2612
2735
  maxTokens: 8000,
2613
2736
  },
2614
- "qwen-3-235b-a22b-instruct-2507": {
2615
- id: "qwen-3-235b-a22b-instruct-2507",
2616
- name: "Qwen 3 235B Instruct",
2617
- api: "openai-completions",
2618
- provider: "cerebras",
2619
- baseUrl: "https://api.cerebras.ai/v1",
2620
- reasoning: false,
2621
- input: ["text"],
2622
- cost: {
2623
- input: 0.6,
2624
- output: 1.2,
2625
- cacheRead: 0,
2626
- cacheWrite: 0,
2627
- },
2628
- contextWindow: 131000,
2629
- maxTokens: 32000,
2630
- },
2631
2737
  "zai-glm-4.7": {
2632
2738
  id: "zai-glm-4.7",
2633
2739
  name: "Z.AI GLM-4.7",
@@ -2823,6 +2929,7 @@ export const MODELS = {
2823
2929
  api: "anthropic-messages",
2824
2930
  provider: "cloudflare-ai-gateway",
2825
2931
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2932
+ compat: { "forceAdaptiveThinking": true },
2826
2933
  reasoning: true,
2827
2934
  thinkingLevelMap: { "xhigh": "max" },
2828
2935
  input: ["text", "image"],
@@ -2841,6 +2948,7 @@ export const MODELS = {
2841
2948
  api: "anthropic-messages",
2842
2949
  provider: "cloudflare-ai-gateway",
2843
2950
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2951
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
2844
2952
  reasoning: true,
2845
2953
  thinkingLevelMap: { "xhigh": "xhigh" },
2846
2954
  input: ["text", "image"],
@@ -2853,6 +2961,24 @@ export const MODELS = {
2853
2961
  contextWindow: 1000000,
2854
2962
  maxTokens: 128000,
2855
2963
  },
2964
+ "claude-opus-4-8": {
2965
+ id: "claude-opus-4-8",
2966
+ name: "Claude Opus 4.8",
2967
+ api: "anthropic-messages",
2968
+ provider: "cloudflare-ai-gateway",
2969
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2970
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
2971
+ reasoning: true,
2972
+ input: ["text", "image"],
2973
+ cost: {
2974
+ input: 5,
2975
+ output: 25,
2976
+ cacheRead: 0.5,
2977
+ cacheWrite: 6.25,
2978
+ },
2979
+ contextWindow: 1000000,
2980
+ maxTokens: 128000,
2981
+ },
2856
2982
  "claude-sonnet-4": {
2857
2983
  id: "claude-sonnet-4",
2858
2984
  name: "Claude Sonnet 4 (latest)",
@@ -2893,6 +3019,7 @@ export const MODELS = {
2893
3019
  api: "anthropic-messages",
2894
3020
  provider: "cloudflare-ai-gateway",
2895
3021
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3022
+ compat: { "forceAdaptiveThinking": true },
2896
3023
  reasoning: true,
2897
3024
  input: ["text", "image"],
2898
3025
  cost: {
@@ -3347,24 +3474,6 @@ export const MODELS = {
3347
3474
  contextWindow: 128000,
3348
3475
  maxTokens: 128000,
3349
3476
  },
3350
- "@cf/moonshotai/kimi-k2.5": {
3351
- id: "@cf/moonshotai/kimi-k2.5",
3352
- name: "Kimi K2.5",
3353
- api: "openai-completions",
3354
- provider: "cloudflare-workers-ai",
3355
- baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3356
- compat: { "sendSessionAffinityHeaders": true },
3357
- reasoning: true,
3358
- input: ["text", "image"],
3359
- cost: {
3360
- input: 0.6,
3361
- output: 3,
3362
- cacheRead: 0.1,
3363
- cacheWrite: 0,
3364
- },
3365
- contextWindow: 256000,
3366
- maxTokens: 256000,
3367
- },
3368
3477
  "@cf/moonshotai/kimi-k2.6": {
3369
3478
  id: "@cf/moonshotai/kimi-k2.6",
3370
3479
  name: "Kimi K2.6",
@@ -3692,8 +3801,8 @@ export const MODELS = {
3692
3801
  cacheRead: 0.1,
3693
3802
  cacheWrite: 0,
3694
3803
  },
3695
- contextWindow: 128000,
3696
- maxTokens: 8192,
3804
+ contextWindow: 262144,
3805
+ maxTokens: 65536,
3697
3806
  },
3698
3807
  "accounts/fireworks/routers/glm-5p1-fast": {
3699
3808
  id: "accounts/fireworks/routers/glm-5p1-fast",
@@ -3735,7 +3844,7 @@ export const MODELS = {
3735
3844
  "github-copilot": {
3736
3845
  "claude-haiku-4.5": {
3737
3846
  id: "claude-haiku-4.5",
3738
- name: "Claude Haiku 4.5",
3847
+ name: "Claude Haiku 4.5 (latest)",
3739
3848
  api: "anthropic-messages",
3740
3849
  provider: "github-copilot",
3741
3850
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3744,17 +3853,17 @@ export const MODELS = {
3744
3853
  reasoning: true,
3745
3854
  input: ["text", "image"],
3746
3855
  cost: {
3747
- input: 0,
3748
- output: 0,
3749
- cacheRead: 0,
3750
- cacheWrite: 0,
3856
+ input: 1,
3857
+ output: 5,
3858
+ cacheRead: 0.1,
3859
+ cacheWrite: 1.25,
3751
3860
  },
3752
- contextWindow: 144000,
3753
- maxTokens: 32000,
3861
+ contextWindow: 200000,
3862
+ maxTokens: 64000,
3754
3863
  },
3755
3864
  "claude-opus-4.5": {
3756
3865
  id: "claude-opus-4.5",
3757
- name: "Claude Opus 4.5",
3866
+ name: "Claude Opus 4.5 (latest)",
3758
3867
  api: "anthropic-messages",
3759
3868
  provider: "github-copilot",
3760
3869
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3762,12 +3871,12 @@ export const MODELS = {
3762
3871
  reasoning: true,
3763
3872
  input: ["text", "image"],
3764
3873
  cost: {
3765
- input: 0,
3766
- output: 0,
3767
- cacheRead: 0,
3768
- cacheWrite: 0,
3874
+ input: 5,
3875
+ output: 25,
3876
+ cacheRead: 0.5,
3877
+ cacheWrite: 6.25,
3769
3878
  },
3770
- contextWindow: 160000,
3879
+ contextWindow: 200000,
3771
3880
  maxTokens: 32000,
3772
3881
  },
3773
3882
  "claude-opus-4.6": {
@@ -3777,17 +3886,18 @@ export const MODELS = {
3777
3886
  provider: "github-copilot",
3778
3887
  baseUrl: "https://api.individual.githubcopilot.com",
3779
3888
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3889
+ compat: { "forceAdaptiveThinking": true },
3780
3890
  reasoning: true,
3781
3891
  thinkingLevelMap: { "xhigh": "max" },
3782
3892
  input: ["text", "image"],
3783
3893
  cost: {
3784
- input: 0,
3785
- output: 0,
3786
- cacheRead: 0,
3787
- cacheWrite: 0,
3894
+ input: 5,
3895
+ output: 25,
3896
+ cacheRead: 0.5,
3897
+ cacheWrite: 6.25,
3788
3898
  },
3789
3899
  contextWindow: 1000000,
3790
- maxTokens: 64000,
3900
+ maxTokens: 32000,
3791
3901
  },
3792
3902
  "claude-opus-4.7": {
3793
3903
  id: "claude-opus-4.7",
@@ -3796,69 +3906,109 @@ export const MODELS = {
3796
3906
  provider: "github-copilot",
3797
3907
  baseUrl: "https://api.individual.githubcopilot.com",
3798
3908
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3909
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3799
3910
  reasoning: true,
3800
3911
  thinkingLevelMap: { "xhigh": "xhigh" },
3801
3912
  input: ["text", "image"],
3802
3913
  cost: {
3803
- input: 0,
3804
- output: 0,
3805
- cacheRead: 0,
3806
- cacheWrite: 0,
3914
+ input: 5,
3915
+ output: 25,
3916
+ cacheRead: 0.5,
3917
+ cacheWrite: 6.25,
3807
3918
  },
3808
- contextWindow: 144000,
3809
- maxTokens: 64000,
3919
+ contextWindow: 200000,
3920
+ maxTokens: 32000,
3810
3921
  },
3811
- "claude-sonnet-4.5": {
3812
- id: "claude-sonnet-4.5",
3813
- name: "Claude Sonnet 4.5",
3922
+ "claude-opus-4.8": {
3923
+ id: "claude-opus-4.8",
3924
+ name: "Claude Opus 4.8",
3814
3925
  api: "anthropic-messages",
3815
3926
  provider: "github-copilot",
3816
3927
  baseUrl: "https://api.individual.githubcopilot.com",
3817
3928
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3818
- compat: { "supportsEagerToolInputStreaming": false },
3929
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3819
3930
  reasoning: true,
3820
3931
  input: ["text", "image"],
3821
3932
  cost: {
3822
- input: 0,
3823
- output: 0,
3824
- cacheRead: 0,
3825
- cacheWrite: 0,
3933
+ input: 5,
3934
+ output: 25,
3935
+ cacheRead: 0.5,
3936
+ cacheWrite: 6.25,
3826
3937
  },
3827
- contextWindow: 144000,
3828
- maxTokens: 32000,
3938
+ contextWindow: 200000,
3939
+ maxTokens: 64000,
3829
3940
  },
3830
- "claude-sonnet-4.6": {
3831
- id: "claude-sonnet-4.6",
3832
- name: "Claude Sonnet 4.6",
3941
+ "claude-sonnet-4": {
3942
+ id: "claude-sonnet-4",
3943
+ name: "Claude Sonnet 4 (latest)",
3833
3944
  api: "anthropic-messages",
3834
3945
  provider: "github-copilot",
3835
3946
  baseUrl: "https://api.individual.githubcopilot.com",
3836
3947
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3948
+ compat: { "supportsEagerToolInputStreaming": false },
3837
3949
  reasoning: true,
3838
3950
  input: ["text", "image"],
3839
3951
  cost: {
3840
- input: 0,
3841
- output: 0,
3842
- cacheRead: 0,
3843
- cacheWrite: 0,
3952
+ input: 3,
3953
+ output: 15,
3954
+ cacheRead: 0.3,
3955
+ cacheWrite: 3.75,
3844
3956
  },
3845
- contextWindow: 1000000,
3846
- maxTokens: 32000,
3957
+ contextWindow: 216000,
3958
+ maxTokens: 16000,
3847
3959
  },
3848
- "gemini-2.5-pro": {
3849
- id: "gemini-2.5-pro",
3960
+ "claude-sonnet-4.5": {
3961
+ id: "claude-sonnet-4.5",
3962
+ name: "Claude Sonnet 4.5 (latest)",
3963
+ api: "anthropic-messages",
3964
+ provider: "github-copilot",
3965
+ baseUrl: "https://api.individual.githubcopilot.com",
3966
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3967
+ compat: { "supportsEagerToolInputStreaming": false },
3968
+ reasoning: true,
3969
+ input: ["text", "image"],
3970
+ cost: {
3971
+ input: 3,
3972
+ output: 15,
3973
+ cacheRead: 0.3,
3974
+ cacheWrite: 3.75,
3975
+ },
3976
+ contextWindow: 200000,
3977
+ maxTokens: 32000,
3978
+ },
3979
+ "claude-sonnet-4.6": {
3980
+ id: "claude-sonnet-4.6",
3981
+ name: "Claude Sonnet 4.6",
3982
+ api: "anthropic-messages",
3983
+ provider: "github-copilot",
3984
+ baseUrl: "https://api.individual.githubcopilot.com",
3985
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3986
+ compat: { "forceAdaptiveThinking": true },
3987
+ reasoning: true,
3988
+ input: ["text", "image"],
3989
+ cost: {
3990
+ input: 3,
3991
+ output: 15,
3992
+ cacheRead: 0.3,
3993
+ cacheWrite: 3.75,
3994
+ },
3995
+ contextWindow: 1000000,
3996
+ maxTokens: 32000,
3997
+ },
3998
+ "gemini-2.5-pro": {
3999
+ id: "gemini-2.5-pro",
3850
4000
  name: "Gemini 2.5 Pro",
3851
4001
  api: "openai-completions",
3852
4002
  provider: "github-copilot",
3853
4003
  baseUrl: "https://api.individual.githubcopilot.com",
3854
4004
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3855
4005
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3856
- reasoning: false,
4006
+ reasoning: true,
3857
4007
  input: ["text", "image"],
3858
4008
  cost: {
3859
- input: 0,
3860
- output: 0,
3861
- cacheRead: 0,
4009
+ input: 1.25,
4010
+ output: 10,
4011
+ cacheRead: 0.125,
3862
4012
  cacheWrite: 0,
3863
4013
  },
3864
4014
  contextWindow: 128000,
@@ -3866,7 +4016,7 @@ export const MODELS = {
3866
4016
  },
3867
4017
  "gemini-3-flash-preview": {
3868
4018
  id: "gemini-3-flash-preview",
3869
- name: "Gemini 3 Flash",
4019
+ name: "Gemini 3 Flash Preview",
3870
4020
  api: "openai-completions",
3871
4021
  provider: "github-copilot",
3872
4022
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3875,9 +4025,9 @@ export const MODELS = {
3875
4025
  reasoning: true,
3876
4026
  input: ["text", "image"],
3877
4027
  cost: {
3878
- input: 0,
3879
- output: 0,
3880
- cacheRead: 0,
4028
+ input: 0.5,
4029
+ output: 3,
4030
+ cacheRead: 0.05,
3881
4031
  cacheWrite: 0,
3882
4032
  },
3883
4033
  contextWindow: 128000,
@@ -3894,12 +4044,12 @@ export const MODELS = {
3894
4044
  reasoning: true,
3895
4045
  input: ["text", "image"],
3896
4046
  cost: {
3897
- input: 0,
3898
- output: 0,
3899
- cacheRead: 0,
4047
+ input: 2,
4048
+ output: 12,
4049
+ cacheRead: 0.2,
3900
4050
  cacheWrite: 0,
3901
4051
  },
3902
- contextWindow: 128000,
4052
+ contextWindow: 200000,
3903
4053
  maxTokens: 64000,
3904
4054
  },
3905
4055
  "gemini-3.5-flash": {
@@ -3913,12 +4063,12 @@ export const MODELS = {
3913
4063
  reasoning: true,
3914
4064
  input: ["text", "image"],
3915
4065
  cost: {
3916
- input: 0,
3917
- output: 0,
3918
- cacheRead: 0,
4066
+ input: 1.5,
4067
+ output: 9,
4068
+ cacheRead: 0.15,
3919
4069
  cacheWrite: 0,
3920
4070
  },
3921
- contextWindow: 128000,
4071
+ contextWindow: 200000,
3922
4072
  maxTokens: 64000,
3923
4073
  },
3924
4074
  "gpt-4.1": {
@@ -3932,36 +4082,17 @@ export const MODELS = {
3932
4082
  reasoning: false,
3933
4083
  input: ["text", "image"],
3934
4084
  cost: {
3935
- input: 0,
3936
- output: 0,
3937
- cacheRead: 0,
4085
+ input: 2,
4086
+ output: 8,
4087
+ cacheRead: 0.5,
3938
4088
  cacheWrite: 0,
3939
4089
  },
3940
4090
  contextWindow: 128000,
3941
4091
  maxTokens: 16384,
3942
4092
  },
3943
- "gpt-4o": {
3944
- id: "gpt-4o",
3945
- name: "GPT-4o",
3946
- api: "openai-completions",
3947
- provider: "github-copilot",
3948
- baseUrl: "https://api.individual.githubcopilot.com",
3949
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3950
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3951
- reasoning: false,
3952
- input: ["text", "image"],
3953
- cost: {
3954
- input: 0,
3955
- output: 0,
3956
- cacheRead: 0,
3957
- cacheWrite: 0,
3958
- },
3959
- contextWindow: 128000,
3960
- maxTokens: 4096,
3961
- },
3962
4093
  "gpt-5-mini": {
3963
4094
  id: "gpt-5-mini",
3964
- name: "GPT-5-mini",
4095
+ name: "GPT-5 Mini",
3965
4096
  api: "openai-responses",
3966
4097
  provider: "github-copilot",
3967
4098
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3970,9 +4101,9 @@ export const MODELS = {
3970
4101
  thinkingLevelMap: { "off": null, "minimal": "low" },
3971
4102
  input: ["text", "image"],
3972
4103
  cost: {
3973
- input: 0,
3974
- output: 0,
3975
- cacheRead: 0,
4104
+ input: 0.25,
4105
+ output: 2,
4106
+ cacheRead: 0.025,
3976
4107
  cacheWrite: 0,
3977
4108
  },
3978
4109
  contextWindow: 264000,
@@ -3989,17 +4120,17 @@ export const MODELS = {
3989
4120
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
3990
4121
  input: ["text", "image"],
3991
4122
  cost: {
3992
- input: 0,
3993
- output: 0,
3994
- cacheRead: 0,
4123
+ input: 1.75,
4124
+ output: 14,
4125
+ cacheRead: 0.175,
3995
4126
  cacheWrite: 0,
3996
4127
  },
3997
- contextWindow: 264000,
3998
- maxTokens: 64000,
4128
+ contextWindow: 400000,
4129
+ maxTokens: 128000,
3999
4130
  },
4000
4131
  "gpt-5.2-codex": {
4001
4132
  id: "gpt-5.2-codex",
4002
- name: "GPT-5.2-Codex",
4133
+ name: "GPT-5.2 Codex",
4003
4134
  api: "openai-responses",
4004
4135
  provider: "github-copilot",
4005
4136
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4008,9 +4139,9 @@ export const MODELS = {
4008
4139
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4009
4140
  input: ["text", "image"],
4010
4141
  cost: {
4011
- input: 0,
4012
- output: 0,
4013
- cacheRead: 0,
4142
+ input: 1.75,
4143
+ output: 14,
4144
+ cacheRead: 0.175,
4014
4145
  cacheWrite: 0,
4015
4146
  },
4016
4147
  contextWindow: 400000,
@@ -4018,7 +4149,7 @@ export const MODELS = {
4018
4149
  },
4019
4150
  "gpt-5.3-codex": {
4020
4151
  id: "gpt-5.3-codex",
4021
- name: "GPT-5.3-Codex",
4152
+ name: "GPT-5.3 Codex",
4022
4153
  api: "openai-responses",
4023
4154
  provider: "github-copilot",
4024
4155
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4027,9 +4158,9 @@ export const MODELS = {
4027
4158
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4028
4159
  input: ["text", "image"],
4029
4160
  cost: {
4030
- input: 0,
4031
- output: 0,
4032
- cacheRead: 0,
4161
+ input: 1.75,
4162
+ output: 14,
4163
+ cacheRead: 0.175,
4033
4164
  cacheWrite: 0,
4034
4165
  },
4035
4166
  contextWindow: 400000,
@@ -4046,9 +4177,9 @@ export const MODELS = {
4046
4177
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4047
4178
  input: ["text", "image"],
4048
4179
  cost: {
4049
- input: 0,
4050
- output: 0,
4051
- cacheRead: 0,
4180
+ input: 2.5,
4181
+ output: 15,
4182
+ cacheRead: 0.25,
4052
4183
  cacheWrite: 0,
4053
4184
  },
4054
4185
  contextWindow: 400000,
@@ -4056,7 +4187,7 @@ export const MODELS = {
4056
4187
  },
4057
4188
  "gpt-5.4-mini": {
4058
4189
  id: "gpt-5.4-mini",
4059
- name: "GPT-5.4 Mini",
4190
+ name: "GPT-5.4 mini",
4060
4191
  api: "openai-responses",
4061
4192
  provider: "github-copilot",
4062
4193
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4065,9 +4196,28 @@ export const MODELS = {
4065
4196
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4066
4197
  input: ["text", "image"],
4067
4198
  cost: {
4068
- input: 0,
4069
- output: 0,
4070
- cacheRead: 0,
4199
+ input: 0.75,
4200
+ output: 4.5,
4201
+ cacheRead: 0.075,
4202
+ cacheWrite: 0,
4203
+ },
4204
+ contextWindow: 400000,
4205
+ maxTokens: 128000,
4206
+ },
4207
+ "gpt-5.4-nano": {
4208
+ id: "gpt-5.4-nano",
4209
+ name: "GPT-5.4 nano",
4210
+ api: "openai-responses",
4211
+ provider: "github-copilot",
4212
+ baseUrl: "https://api.individual.githubcopilot.com",
4213
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4214
+ reasoning: true,
4215
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4216
+ input: ["text", "image"],
4217
+ cost: {
4218
+ input: 0.2,
4219
+ output: 1.25,
4220
+ cacheRead: 0.02,
4071
4221
  cacheWrite: 0,
4072
4222
  },
4073
4223
  contextWindow: 400000,
@@ -4084,32 +4234,32 @@ export const MODELS = {
4084
4234
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4085
4235
  input: ["text", "image"],
4086
4236
  cost: {
4087
- input: 0,
4088
- output: 0,
4089
- cacheRead: 0,
4237
+ input: 5,
4238
+ output: 30,
4239
+ cacheRead: 0.5,
4090
4240
  cacheWrite: 0,
4091
4241
  },
4092
4242
  contextWindow: 400000,
4093
4243
  maxTokens: 128000,
4094
4244
  },
4095
- "grok-code-fast-1": {
4096
- id: "grok-code-fast-1",
4097
- name: "Grok Code Fast 1",
4245
+ "raptor-mini": {
4246
+ id: "raptor-mini",
4247
+ name: "Raptor mini",
4098
4248
  api: "openai-completions",
4099
4249
  provider: "github-copilot",
4100
4250
  baseUrl: "https://api.individual.githubcopilot.com",
4101
4251
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4102
4252
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4103
4253
  reasoning: true,
4104
- input: ["text"],
4254
+ input: ["text", "image"],
4105
4255
  cost: {
4106
- input: 0,
4107
- output: 0,
4108
- cacheRead: 0,
4256
+ input: 0.25,
4257
+ output: 2,
4258
+ cacheRead: 0.025,
4109
4259
  cacheWrite: 0,
4110
4260
  },
4111
- contextWindow: 128000,
4112
- maxTokens: 64000,
4261
+ contextWindow: 400000,
4262
+ maxTokens: 128000,
4113
4263
  },
4114
4264
  },
4115
4265
  "google": {
@@ -4838,7 +4988,7 @@ export const MODELS = {
4838
4988
  cost: {
4839
4989
  input: 1,
4840
4990
  output: 3,
4841
- cacheRead: 0,
4991
+ cacheRead: 0.5,
4842
4992
  cacheWrite: 0,
4843
4993
  },
4844
4994
  contextWindow: 262144,
@@ -4855,7 +5005,7 @@ export const MODELS = {
4855
5005
  cost: {
4856
5006
  input: 0.15,
4857
5007
  output: 0.6,
4858
- cacheRead: 0,
5008
+ cacheRead: 0.075,
4859
5009
  cacheWrite: 0,
4860
5010
  },
4861
5011
  contextWindow: 131072,
@@ -4872,7 +5022,7 @@ export const MODELS = {
4872
5022
  cost: {
4873
5023
  input: 0.075,
4874
5024
  output: 0.3,
4875
- cacheRead: 0,
5025
+ cacheRead: 0.0375,
4876
5026
  cacheWrite: 0,
4877
5027
  },
4878
5028
  contextWindow: 131072,
@@ -5158,9 +5308,9 @@ export const MODELS = {
5158
5308
  reasoning: true,
5159
5309
  input: ["text"],
5160
5310
  cost: {
5161
- input: 1.74,
5162
- output: 3.48,
5163
- cacheRead: 0.145,
5311
+ input: 0.435,
5312
+ output: 0.87,
5313
+ cacheRead: 0.003625,
5164
5314
  cacheWrite: 0,
5165
5315
  },
5166
5316
  contextWindow: 1048576,
@@ -5474,6 +5624,23 @@ export const MODELS = {
5474
5624
  contextWindow: 262144,
5475
5625
  maxTokens: 262144,
5476
5626
  },
5627
+ "devstral-latest": {
5628
+ id: "devstral-latest",
5629
+ name: "Devstral 2",
5630
+ api: "mistral-conversations",
5631
+ provider: "mistral",
5632
+ baseUrl: "https://api.mistral.ai",
5633
+ reasoning: false,
5634
+ input: ["text"],
5635
+ cost: {
5636
+ input: 0.4,
5637
+ output: 2,
5638
+ cacheRead: 0,
5639
+ cacheWrite: 0,
5640
+ },
5641
+ contextWindow: 262144,
5642
+ maxTokens: 262144,
5643
+ },
5477
5644
  "devstral-medium-2507": {
5478
5645
  id: "devstral-medium-2507",
5479
5646
  name: "Devstral Medium",
@@ -5848,6 +6015,23 @@ export const MODELS = {
5848
6015
  contextWindow: 8000,
5849
6016
  maxTokens: 8000,
5850
6017
  },
6018
+ "open-mistral-nemo": {
6019
+ id: "open-mistral-nemo",
6020
+ name: "Open Mistral Nemo",
6021
+ api: "mistral-conversations",
6022
+ provider: "mistral",
6023
+ baseUrl: "https://api.mistral.ai",
6024
+ reasoning: false,
6025
+ input: ["text"],
6026
+ cost: {
6027
+ input: 0.15,
6028
+ output: 0.15,
6029
+ cacheRead: 0,
6030
+ cacheWrite: 0,
6031
+ },
6032
+ contextWindow: 128000,
6033
+ maxTokens: 128000,
6034
+ },
5851
6035
  "open-mixtral-8x22b": {
5852
6036
  id: "open-mixtral-8x22b",
5853
6037
  name: "Mixtral 8x22B",
@@ -6253,7 +6437,7 @@ export const MODELS = {
6253
6437
  cost: {
6254
6438
  input: 0.1,
6255
6439
  output: 0.4,
6256
- cacheRead: 0.03,
6440
+ cacheRead: 0.025,
6257
6441
  cacheWrite: 0,
6258
6442
  },
6259
6443
  contextWindow: 1047576,
@@ -6338,7 +6522,7 @@ export const MODELS = {
6338
6522
  cost: {
6339
6523
  input: 0.15,
6340
6524
  output: 0.6,
6341
- cacheRead: 0.08,
6525
+ cacheRead: 0.075,
6342
6526
  cacheWrite: 0,
6343
6527
  },
6344
6528
  contextWindow: 128000,
@@ -6464,7 +6648,7 @@ export const MODELS = {
6464
6648
  cost: {
6465
6649
  input: 1.25,
6466
6650
  output: 10,
6467
- cacheRead: 0.13,
6651
+ cacheRead: 0.125,
6468
6652
  cacheWrite: 0,
6469
6653
  },
6470
6654
  contextWindow: 400000,
@@ -6747,7 +6931,7 @@ export const MODELS = {
6747
6931
  provider: "openai",
6748
6932
  baseUrl: "https://api.openai.com/v1",
6749
6933
  reasoning: true,
6750
- thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
6934
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh", "minimal": null },
6751
6935
  input: ["text", "image"],
6752
6936
  cost: {
6753
6937
  input: 5,
@@ -6765,7 +6949,7 @@ export const MODELS = {
6765
6949
  provider: "openai",
6766
6950
  baseUrl: "https://api.openai.com/v1",
6767
6951
  reasoning: true,
6768
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6952
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
6769
6953
  input: ["text", "image"],
6770
6954
  cost: {
6771
6955
  input: 30,
@@ -6889,7 +7073,7 @@ export const MODELS = {
6889
7073
  cost: {
6890
7074
  input: 1.1,
6891
7075
  output: 4.4,
6892
- cacheRead: 0.28,
7076
+ cacheRead: 0.275,
6893
7077
  cacheWrite: 0,
6894
7078
  },
6895
7079
  contextWindow: 200000,
@@ -6965,7 +7149,7 @@ export const MODELS = {
6965
7149
  cacheRead: 0.175,
6966
7150
  cacheWrite: 0,
6967
7151
  },
6968
- contextWindow: 272000,
7152
+ contextWindow: 128000,
6969
7153
  maxTokens: 128000,
6970
7154
  },
6971
7155
  "gpt-5.4": {
@@ -7039,7 +7223,7 @@ export const MODELS = {
7039
7223
  cacheWrite: 0,
7040
7224
  },
7041
7225
  contextWindow: 200000,
7042
- maxTokens: 128000,
7226
+ maxTokens: 32000,
7043
7227
  },
7044
7228
  "claude-haiku-4-5": {
7045
7229
  id: "claude-haiku-4-5",
@@ -7098,6 +7282,7 @@ export const MODELS = {
7098
7282
  api: "anthropic-messages",
7099
7283
  provider: "opencode",
7100
7284
  baseUrl: "https://opencode.ai/zen",
7285
+ compat: { "forceAdaptiveThinking": true },
7101
7286
  reasoning: true,
7102
7287
  thinkingLevelMap: { "xhigh": "max" },
7103
7288
  input: ["text", "image"],
@@ -7116,6 +7301,7 @@ export const MODELS = {
7116
7301
  api: "anthropic-messages",
7117
7302
  provider: "opencode",
7118
7303
  baseUrl: "https://opencode.ai/zen",
7304
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7119
7305
  reasoning: true,
7120
7306
  thinkingLevelMap: { "xhigh": "xhigh" },
7121
7307
  input: ["text", "image"],
@@ -7128,6 +7314,24 @@ export const MODELS = {
7128
7314
  contextWindow: 1000000,
7129
7315
  maxTokens: 128000,
7130
7316
  },
7317
+ "claude-opus-4-8": {
7318
+ id: "claude-opus-4-8",
7319
+ name: "Claude Opus 4.8",
7320
+ api: "anthropic-messages",
7321
+ provider: "opencode",
7322
+ baseUrl: "https://opencode.ai/zen",
7323
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7324
+ reasoning: true,
7325
+ input: ["text", "image"],
7326
+ cost: {
7327
+ input: 5,
7328
+ output: 25,
7329
+ cacheRead: 0.5,
7330
+ cacheWrite: 6.25,
7331
+ },
7332
+ contextWindow: 1000000,
7333
+ maxTokens: 128000,
7334
+ },
7131
7335
  "claude-sonnet-4": {
7132
7336
  id: "claude-sonnet-4",
7133
7337
  name: "Claude Sonnet 4",
@@ -7168,6 +7372,7 @@ export const MODELS = {
7168
7372
  api: "anthropic-messages",
7169
7373
  provider: "opencode",
7170
7374
  baseUrl: "https://opencode.ai/zen",
7375
+ compat: { "forceAdaptiveThinking": true },
7171
7376
  reasoning: true,
7172
7377
  input: ["text", "image"],
7173
7378
  cost: {
@@ -7179,9 +7384,28 @@ export const MODELS = {
7179
7384
  contextWindow: 1000000,
7180
7385
  maxTokens: 64000,
7181
7386
  },
7182
- "deepseek-v4-flash-free": {
7183
- id: "deepseek-v4-flash-free",
7184
- name: "DeepSeek V4 Flash Free",
7387
+ "deepseek-v4-flash": {
7388
+ id: "deepseek-v4-flash",
7389
+ name: "DeepSeek V4 Flash",
7390
+ api: "openai-completions",
7391
+ provider: "opencode",
7392
+ baseUrl: "https://opencode.ai/zen/v1",
7393
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7394
+ reasoning: true,
7395
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7396
+ input: ["text"],
7397
+ cost: {
7398
+ input: 0.14,
7399
+ output: 0.28,
7400
+ cacheRead: 0.03,
7401
+ cacheWrite: 0,
7402
+ },
7403
+ contextWindow: 1000000,
7404
+ maxTokens: 384000,
7405
+ },
7406
+ "deepseek-v4-flash-free": {
7407
+ id: "deepseek-v4-flash-free",
7408
+ name: "DeepSeek V4 Flash Free",
7185
7409
  api: "openai-completions",
7186
7410
  provider: "opencode",
7187
7411
  baseUrl: "https://opencode.ai/zen/v1",
@@ -7563,7 +7787,7 @@ export const MODELS = {
7563
7787
  provider: "opencode",
7564
7788
  baseUrl: "https://opencode.ai/zen/v1",
7565
7789
  reasoning: true,
7566
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
7790
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
7567
7791
  input: ["text", "image"],
7568
7792
  cost: {
7569
7793
  input: 30,
@@ -7580,7 +7804,9 @@ export const MODELS = {
7580
7804
  api: "openai-completions",
7581
7805
  provider: "opencode",
7582
7806
  baseUrl: "https://opencode.ai/zen/v1",
7807
+ compat: { "supportsReasoningEffort": false },
7583
7808
  reasoning: true,
7809
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
7584
7810
  input: ["text", "image"],
7585
7811
  cost: {
7586
7812
  input: 1,
@@ -7614,6 +7840,7 @@ export const MODELS = {
7614
7840
  api: "openai-completions",
7615
7841
  provider: "opencode",
7616
7842
  baseUrl: "https://opencode.ai/zen/v1",
7843
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
7617
7844
  reasoning: true,
7618
7845
  input: ["text", "image"],
7619
7846
  cost: {
@@ -7625,6 +7852,23 @@ export const MODELS = {
7625
7852
  contextWindow: 262144,
7626
7853
  maxTokens: 65536,
7627
7854
  },
7855
+ "mimo-v2.5-free": {
7856
+ id: "mimo-v2.5-free",
7857
+ name: "MiMo V2.5 Free",
7858
+ api: "openai-completions",
7859
+ provider: "opencode",
7860
+ baseUrl: "https://opencode.ai/zen/v1",
7861
+ reasoning: true,
7862
+ input: ["text", "image"],
7863
+ cost: {
7864
+ input: 0,
7865
+ output: 0,
7866
+ cacheRead: 0,
7867
+ cacheWrite: 0,
7868
+ },
7869
+ contextWindow: 200000,
7870
+ maxTokens: 32000,
7871
+ },
7628
7872
  "minimax-m2.5": {
7629
7873
  id: "minimax-m2.5",
7630
7874
  name: "MiniMax M2.5",
@@ -7659,9 +7903,26 @@ export const MODELS = {
7659
7903
  contextWindow: 204800,
7660
7904
  maxTokens: 131072,
7661
7905
  },
7662
- "nemotron-3-super-free": {
7663
- id: "nemotron-3-super-free",
7664
- name: "Nemotron 3 Super Free",
7906
+ "minimax-m3-free": {
7907
+ id: "minimax-m3-free",
7908
+ name: "MiniMax M3 Free",
7909
+ api: "anthropic-messages",
7910
+ provider: "opencode",
7911
+ baseUrl: "https://opencode.ai/zen",
7912
+ reasoning: true,
7913
+ input: ["text", "image"],
7914
+ cost: {
7915
+ input: 0,
7916
+ output: 0,
7917
+ cacheRead: 0,
7918
+ cacheWrite: 0,
7919
+ },
7920
+ contextWindow: 200000,
7921
+ maxTokens: 32000,
7922
+ },
7923
+ "nemotron-3-ultra-free": {
7924
+ id: "nemotron-3-ultra-free",
7925
+ name: "Nemotron 3 Ultra Free",
7665
7926
  api: "openai-completions",
7666
7927
  provider: "opencode",
7667
7928
  baseUrl: "https://opencode.ai/zen/v1",
@@ -7673,7 +7934,7 @@ export const MODELS = {
7673
7934
  cacheRead: 0,
7674
7935
  cacheWrite: 0,
7675
7936
  },
7676
- contextWindow: 204800,
7937
+ contextWindow: 1000000,
7677
7938
  maxTokens: 128000,
7678
7939
  },
7679
7940
  "qwen3.5-plus": {
@@ -7807,7 +8068,9 @@ export const MODELS = {
7807
8068
  api: "openai-completions",
7808
8069
  provider: "opencode-go",
7809
8070
  baseUrl: "https://opencode.ai/zen/go/v1",
8071
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
7810
8072
  reasoning: true,
8073
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
7811
8074
  input: ["text", "image"],
7812
8075
  cost: {
7813
8076
  input: 0.95,
@@ -7827,9 +8090,9 @@ export const MODELS = {
7827
8090
  reasoning: true,
7828
8091
  input: ["text", "image"],
7829
8092
  cost: {
7830
- input: 0.4,
7831
- output: 2,
7832
- cacheRead: 0.08,
8093
+ input: 0.14,
8094
+ output: 0.28,
8095
+ cacheRead: 0.0028,
7833
8096
  cacheWrite: 0,
7834
8097
  },
7835
8098
  contextWindow: 1000000,
@@ -7844,9 +8107,9 @@ export const MODELS = {
7844
8107
  reasoning: true,
7845
8108
  input: ["text"],
7846
8109
  cost: {
7847
- input: 1,
7848
- output: 3,
7849
- cacheRead: 0.2,
8110
+ input: 1.74,
8111
+ output: 3.48,
8112
+ cacheRead: 0.0145,
7850
8113
  cacheWrite: 0,
7851
8114
  },
7852
8115
  contextWindow: 1048576,
@@ -7886,23 +8149,22 @@ export const MODELS = {
7886
8149
  contextWindow: 204800,
7887
8150
  maxTokens: 131072,
7888
8151
  },
7889
- "qwen3.5-plus": {
7890
- id: "qwen3.5-plus",
7891
- name: "Qwen3.5 Plus",
7892
- api: "openai-completions",
8152
+ "minimax-m3": {
8153
+ id: "minimax-m3",
8154
+ name: "MiniMax M3",
8155
+ api: "anthropic-messages",
7893
8156
  provider: "opencode-go",
7894
- baseUrl: "https://opencode.ai/zen/go/v1",
7895
- compat: { "thinkingFormat": "qwen" },
8157
+ baseUrl: "https://opencode.ai/zen/go",
7896
8158
  reasoning: true,
7897
8159
  input: ["text", "image"],
7898
8160
  cost: {
7899
- input: 0.2,
7900
- output: 1.2,
7901
- cacheRead: 0.02,
7902
- cacheWrite: 0.25,
8161
+ input: 0.6,
8162
+ output: 2.4,
8163
+ cacheRead: 0.12,
8164
+ cacheWrite: 0,
7903
8165
  },
7904
- contextWindow: 262144,
7905
- maxTokens: 65536,
8166
+ contextWindow: 512000,
8167
+ maxTokens: 131072,
7906
8168
  },
7907
8169
  "qwen3.6-plus": {
7908
8170
  id: "qwen3.6-plus",
@@ -7922,6 +8184,40 @@ export const MODELS = {
7922
8184
  contextWindow: 262144,
7923
8185
  maxTokens: 65536,
7924
8186
  },
8187
+ "qwen3.7-max": {
8188
+ id: "qwen3.7-max",
8189
+ name: "Qwen3.7 Max",
8190
+ api: "anthropic-messages",
8191
+ provider: "opencode-go",
8192
+ baseUrl: "https://opencode.ai/zen/go",
8193
+ reasoning: true,
8194
+ input: ["text"],
8195
+ cost: {
8196
+ input: 2.5,
8197
+ output: 7.5,
8198
+ cacheRead: 0.5,
8199
+ cacheWrite: 3.125,
8200
+ },
8201
+ contextWindow: 1000000,
8202
+ maxTokens: 65536,
8203
+ },
8204
+ "qwen3.7-plus": {
8205
+ id: "qwen3.7-plus",
8206
+ name: "Qwen3.7 Plus",
8207
+ api: "anthropic-messages",
8208
+ provider: "opencode-go",
8209
+ baseUrl: "https://opencode.ai/zen/go",
8210
+ reasoning: true,
8211
+ input: ["text", "image"],
8212
+ cost: {
8213
+ input: 0.4,
8214
+ output: 1.6,
8215
+ cacheRead: 0.04,
8216
+ cacheWrite: 0.5,
8217
+ },
8218
+ contextWindow: 262144,
8219
+ maxTokens: 65536,
8220
+ },
7925
8221
  },
7926
8222
  "openrouter": {
7927
8223
  "ai21/jamba-large-1.7": {
@@ -7941,23 +8237,6 @@ export const MODELS = {
7941
8237
  contextWindow: 256000,
7942
8238
  maxTokens: 4096,
7943
8239
  },
7944
- "alibaba/tongyi-deepresearch-30b-a3b": {
7945
- id: "alibaba/tongyi-deepresearch-30b-a3b",
7946
- name: "Tongyi DeepResearch 30B A3B",
7947
- api: "openai-completions",
7948
- provider: "openrouter",
7949
- baseUrl: "https://openrouter.ai/api/v1",
7950
- reasoning: true,
7951
- input: ["text"],
7952
- cost: {
7953
- input: 0.09,
7954
- output: 0.44999999999999996,
7955
- cacheRead: 0.09,
7956
- cacheWrite: 0,
7957
- },
7958
- contextWindow: 131072,
7959
- maxTokens: 131072,
7960
- },
7961
8240
  "amazon/nova-2-lite-v1": {
7962
8241
  id: "amazon/nova-2-lite-v1",
7963
8242
  name: "Amazon: Nova 2 Lite",
@@ -8217,6 +8496,40 @@ export const MODELS = {
8217
8496
  contextWindow: 1000000,
8218
8497
  maxTokens: 128000,
8219
8498
  },
8499
+ "anthropic/claude-opus-4.8": {
8500
+ id: "anthropic/claude-opus-4.8",
8501
+ name: "Anthropic: Claude Opus 4.8",
8502
+ api: "openai-completions",
8503
+ provider: "openrouter",
8504
+ baseUrl: "https://openrouter.ai/api/v1",
8505
+ reasoning: true,
8506
+ input: ["text", "image"],
8507
+ cost: {
8508
+ input: 5,
8509
+ output: 25,
8510
+ cacheRead: 0.5,
8511
+ cacheWrite: 6.25,
8512
+ },
8513
+ contextWindow: 1000000,
8514
+ maxTokens: 128000,
8515
+ },
8516
+ "anthropic/claude-opus-4.8-fast": {
8517
+ id: "anthropic/claude-opus-4.8-fast",
8518
+ name: "Anthropic: Claude Opus 4.8 (Fast)",
8519
+ api: "openai-completions",
8520
+ provider: "openrouter",
8521
+ baseUrl: "https://openrouter.ai/api/v1",
8522
+ reasoning: true,
8523
+ input: ["text", "image"],
8524
+ cost: {
8525
+ input: 10,
8526
+ output: 50,
8527
+ cacheRead: 1,
8528
+ cacheWrite: 12.5,
8529
+ },
8530
+ contextWindow: 1000000,
8531
+ maxTokens: 128000,
8532
+ },
8220
8533
  "anthropic/claude-sonnet-4": {
8221
8534
  id: "anthropic/claude-sonnet-4",
8222
8535
  name: "Anthropic: Claude Sonnet 4",
@@ -8285,23 +8598,6 @@ export const MODELS = {
8285
8598
  contextWindow: 262144,
8286
8599
  maxTokens: 262144,
8287
8600
  },
8288
- "arcee-ai/trinity-large-thinking:free": {
8289
- id: "arcee-ai/trinity-large-thinking:free",
8290
- name: "Arcee AI: Trinity Large Thinking (free)",
8291
- api: "openai-completions",
8292
- provider: "openrouter",
8293
- baseUrl: "https://openrouter.ai/api/v1",
8294
- reasoning: true,
8295
- input: ["text"],
8296
- cost: {
8297
- input: 0,
8298
- output: 0,
8299
- cacheRead: 0,
8300
- cacheWrite: 0,
8301
- },
8302
- contextWindow: 262144,
8303
- maxTokens: 80000,
8304
- },
8305
8601
  "arcee-ai/trinity-mini": {
8306
8602
  id: "arcee-ai/trinity-mini",
8307
8603
  name: "Arcee AI: Trinity Mini",
@@ -8353,40 +8649,6 @@ export const MODELS = {
8353
8649
  contextWindow: 2000000,
8354
8650
  maxTokens: 30000,
8355
8651
  },
8356
- "baidu/cobuddy:free": {
8357
- id: "baidu/cobuddy:free",
8358
- name: "Baidu Qianfan: CoBuddy (free)",
8359
- api: "openai-completions",
8360
- provider: "openrouter",
8361
- baseUrl: "https://openrouter.ai/api/v1",
8362
- reasoning: true,
8363
- input: ["text"],
8364
- cost: {
8365
- input: 0,
8366
- output: 0,
8367
- cacheRead: 0,
8368
- cacheWrite: 0,
8369
- },
8370
- contextWindow: 131072,
8371
- maxTokens: 65536,
8372
- },
8373
- "baidu/ernie-4.5-21b-a3b": {
8374
- id: "baidu/ernie-4.5-21b-a3b",
8375
- name: "Baidu: ERNIE 4.5 21B A3B",
8376
- api: "openai-completions",
8377
- provider: "openrouter",
8378
- baseUrl: "https://openrouter.ai/api/v1",
8379
- reasoning: false,
8380
- input: ["text"],
8381
- cost: {
8382
- input: 0.07,
8383
- output: 0.28,
8384
- cacheRead: 0,
8385
- cacheWrite: 0,
8386
- },
8387
- contextWindow: 131072,
8388
- maxTokens: 8000,
8389
- },
8390
8652
  "baidu/ernie-4.5-vl-28b-a3b": {
8391
8653
  id: "baidu/ernie-4.5-vl-28b-a3b",
8392
8654
  name: "Baidu: ERNIE 4.5 VL 28B A3B",
@@ -8515,13 +8777,13 @@ export const MODELS = {
8515
8777
  reasoning: false,
8516
8778
  input: ["text"],
8517
8779
  cost: {
8518
- input: 0.32,
8519
- output: 0.8899999999999999,
8780
+ input: 0.20020000000000002,
8781
+ output: 0.8000999999999999,
8520
8782
  cacheRead: 0,
8521
8783
  cacheWrite: 0,
8522
8784
  },
8523
- contextWindow: 163840,
8524
- maxTokens: 16384,
8785
+ contextWindow: 131072,
8786
+ maxTokens: 16000,
8525
8787
  },
8526
8788
  "deepseek/deepseek-chat-v3-0324": {
8527
8789
  id: "deepseek/deepseek-chat-v3-0324",
@@ -8617,13 +8879,13 @@ export const MODELS = {
8617
8879
  reasoning: true,
8618
8880
  input: ["text"],
8619
8881
  cost: {
8620
- input: 0.252,
8621
- output: 0.378,
8622
- cacheRead: 0.0252,
8882
+ input: 0.2288,
8883
+ output: 0.3432,
8884
+ cacheRead: 0,
8623
8885
  cacheWrite: 0,
8624
8886
  },
8625
8887
  contextWindow: 131072,
8626
- maxTokens: 65536,
8888
+ maxTokens: 64000,
8627
8889
  },
8628
8890
  "deepseek/deepseek-v3.2-exp": {
8629
8891
  id: "deepseek/deepseek-v3.2-exp",
@@ -8648,37 +8910,18 @@ export const MODELS = {
8648
8910
  api: "openai-completions",
8649
8911
  provider: "openrouter",
8650
8912
  baseUrl: "https://openrouter.ai/api/v1",
8651
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8913
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8652
8914
  reasoning: true,
8653
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8915
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8654
8916
  input: ["text"],
8655
8917
  cost: {
8656
- input: 0.09999999999999999,
8657
- output: 0.19999999999999998,
8658
- cacheRead: 0.02,
8918
+ input: 0.0983,
8919
+ output: 0.1966,
8920
+ cacheRead: 0.019700000000000002,
8659
8921
  cacheWrite: 0,
8660
8922
  },
8661
8923
  contextWindow: 1048576,
8662
- maxTokens: 16384,
8663
- },
8664
- "deepseek/deepseek-v4-flash:free": {
8665
- id: "deepseek/deepseek-v4-flash:free",
8666
- name: "DeepSeek: DeepSeek V4 Flash (free)",
8667
- api: "openai-completions",
8668
- provider: "openrouter",
8669
- baseUrl: "https://openrouter.ai/api/v1",
8670
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8671
- reasoning: true,
8672
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8673
- input: ["text"],
8674
- cost: {
8675
- input: 0,
8676
- output: 0,
8677
- cacheRead: 0,
8678
- cacheWrite: 0,
8679
- },
8680
- contextWindow: 1048576,
8681
- maxTokens: 384000,
8924
+ maxTokens: 131072,
8682
8925
  },
8683
8926
  "deepseek/deepseek-v4-pro": {
8684
8927
  id: "deepseek/deepseek-v4-pro",
@@ -8686,9 +8929,9 @@ export const MODELS = {
8686
8929
  api: "openai-completions",
8687
8930
  provider: "openrouter",
8688
8931
  baseUrl: "https://openrouter.ai/api/v1",
8689
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8932
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8690
8933
  reasoning: true,
8691
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8934
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8692
8935
  input: ["text"],
8693
8936
  cost: {
8694
8937
  input: 0.435,
@@ -8716,40 +8959,6 @@ export const MODELS = {
8716
8959
  contextWindow: 32768,
8717
8960
  maxTokens: 4096,
8718
8961
  },
8719
- "google/gemini-2.0-flash-001": {
8720
- id: "google/gemini-2.0-flash-001",
8721
- name: "Google: Gemini 2.0 Flash",
8722
- api: "openai-completions",
8723
- provider: "openrouter",
8724
- baseUrl: "https://openrouter.ai/api/v1",
8725
- reasoning: false,
8726
- input: ["text", "image"],
8727
- cost: {
8728
- input: 0.09999999999999999,
8729
- output: 0.39999999999999997,
8730
- cacheRead: 0.024999999999999998,
8731
- cacheWrite: 0.08333333333333334,
8732
- },
8733
- contextWindow: 1000000,
8734
- maxTokens: 8192,
8735
- },
8736
- "google/gemini-2.0-flash-lite-001": {
8737
- id: "google/gemini-2.0-flash-lite-001",
8738
- name: "Google: Gemini 2.0 Flash Lite",
8739
- api: "openai-completions",
8740
- provider: "openrouter",
8741
- baseUrl: "https://openrouter.ai/api/v1",
8742
- reasoning: false,
8743
- input: ["text", "image"],
8744
- cost: {
8745
- input: 0.075,
8746
- output: 0.3,
8747
- cacheRead: 0,
8748
- cacheWrite: 0,
8749
- },
8750
- contextWindow: 1048576,
8751
- maxTokens: 8192,
8752
- },
8753
8962
  "google/gemini-2.5-flash": {
8754
8963
  id: "google/gemini-2.5-flash",
8755
8964
  name: "Google: Gemini 2.5 Flash",
@@ -9227,6 +9436,23 @@ export const MODELS = {
9227
9436
  contextWindow: 131072,
9228
9437
  maxTokens: 4096,
9229
9438
  },
9439
+ "meta-llama/llama-4-maverick": {
9440
+ id: "meta-llama/llama-4-maverick",
9441
+ name: "Meta: Llama 4 Maverick",
9442
+ api: "openai-completions",
9443
+ provider: "openrouter",
9444
+ baseUrl: "https://openrouter.ai/api/v1",
9445
+ reasoning: false,
9446
+ input: ["text", "image"],
9447
+ cost: {
9448
+ input: 0.15,
9449
+ output: 0.6,
9450
+ cacheRead: 0,
9451
+ cacheWrite: 0,
9452
+ },
9453
+ contextWindow: 1048576,
9454
+ maxTokens: 16384,
9455
+ },
9230
9456
  "meta-llama/llama-4-scout": {
9231
9457
  id: "meta-llama/llama-4-scout",
9232
9458
  name: "Meta: Llama 4 Scout",
@@ -9312,39 +9538,39 @@ export const MODELS = {
9312
9538
  contextWindow: 204800,
9313
9539
  maxTokens: 196608,
9314
9540
  },
9315
- "minimax/minimax-m2.5:free": {
9316
- id: "minimax/minimax-m2.5:free",
9317
- name: "MiniMax: MiniMax M2.5 (free)",
9541
+ "minimax/minimax-m2.7": {
9542
+ id: "minimax/minimax-m2.7",
9543
+ name: "MiniMax: MiniMax M2.7",
9318
9544
  api: "openai-completions",
9319
9545
  provider: "openrouter",
9320
9546
  baseUrl: "https://openrouter.ai/api/v1",
9321
9547
  reasoning: true,
9322
9548
  input: ["text"],
9323
9549
  cost: {
9324
- input: 0,
9325
- output: 0,
9550
+ input: 0.27899999999999997,
9551
+ output: 1.2,
9326
9552
  cacheRead: 0,
9327
9553
  cacheWrite: 0,
9328
9554
  },
9329
9555
  contextWindow: 204800,
9330
- maxTokens: 8192,
9556
+ maxTokens: 131072,
9331
9557
  },
9332
- "minimax/minimax-m2.7": {
9333
- id: "minimax/minimax-m2.7",
9334
- name: "MiniMax: MiniMax M2.7",
9558
+ "minimax/minimax-m3": {
9559
+ id: "minimax/minimax-m3",
9560
+ name: "MiniMax: MiniMax M3",
9335
9561
  api: "openai-completions",
9336
9562
  provider: "openrouter",
9337
9563
  baseUrl: "https://openrouter.ai/api/v1",
9338
9564
  reasoning: true,
9339
- input: ["text"],
9565
+ input: ["text", "image"],
9340
9566
  cost: {
9341
- input: 0.27899999999999997,
9567
+ input: 0.3,
9342
9568
  output: 1.2,
9343
- cacheRead: 0,
9569
+ cacheRead: 0.06,
9344
9570
  cacheWrite: 0,
9345
9571
  },
9346
- contextWindow: 204800,
9347
- maxTokens: 131072,
9572
+ contextWindow: 1048576,
9573
+ maxTokens: 512000,
9348
9574
  },
9349
9575
  "mistralai/codestral-2508": {
9350
9576
  id: "mistralai/codestral-2508",
@@ -9380,40 +9606,6 @@ export const MODELS = {
9380
9606
  contextWindow: 262144,
9381
9607
  maxTokens: 4096,
9382
9608
  },
9383
- "mistralai/devstral-medium": {
9384
- id: "mistralai/devstral-medium",
9385
- name: "Mistral: Devstral Medium",
9386
- api: "openai-completions",
9387
- provider: "openrouter",
9388
- baseUrl: "https://openrouter.ai/api/v1",
9389
- reasoning: false,
9390
- input: ["text"],
9391
- cost: {
9392
- input: 0.39999999999999997,
9393
- output: 2,
9394
- cacheRead: 0.04,
9395
- cacheWrite: 0,
9396
- },
9397
- contextWindow: 131072,
9398
- maxTokens: 4096,
9399
- },
9400
- "mistralai/devstral-small": {
9401
- id: "mistralai/devstral-small",
9402
- name: "Mistral: Devstral Small 1.1",
9403
- api: "openai-completions",
9404
- provider: "openrouter",
9405
- baseUrl: "https://openrouter.ai/api/v1",
9406
- reasoning: false,
9407
- input: ["text"],
9408
- cost: {
9409
- input: 0.09999999999999999,
9410
- output: 0.3,
9411
- cacheRead: 0.01,
9412
- cacheWrite: 0,
9413
- },
9414
- contextWindow: 131072,
9415
- maxTokens: 4096,
9416
- },
9417
9609
  "mistralai/ministral-14b-2512": {
9418
9610
  id: "mistralai/ministral-14b-2512",
9419
9611
  name: "Mistral: Ministral 3 14B 2512",
@@ -9499,23 +9691,6 @@ export const MODELS = {
9499
9691
  contextWindow: 131072,
9500
9692
  maxTokens: 4096,
9501
9693
  },
9502
- "mistralai/mistral-large-2411": {
9503
- id: "mistralai/mistral-large-2411",
9504
- name: "Mistral Large 2411",
9505
- api: "openai-completions",
9506
- provider: "openrouter",
9507
- baseUrl: "https://openrouter.ai/api/v1",
9508
- reasoning: false,
9509
- input: ["text"],
9510
- cost: {
9511
- input: 2,
9512
- output: 6,
9513
- cacheRead: 0.19999999999999998,
9514
- cacheWrite: 0,
9515
- },
9516
- contextWindow: 131072,
9517
- maxTokens: 4096,
9518
- },
9519
9694
  "mistralai/mistral-large-2512": {
9520
9695
  id: "mistralai/mistral-large-2512",
9521
9696
  name: "Mistral: Mistral Large 3 2512",
@@ -9669,23 +9844,6 @@ export const MODELS = {
9669
9844
  contextWindow: 65536,
9670
9845
  maxTokens: 4096,
9671
9846
  },
9672
- "mistralai/pixtral-large-2411": {
9673
- id: "mistralai/pixtral-large-2411",
9674
- name: "Mistral: Pixtral Large 2411",
9675
- api: "openai-completions",
9676
- provider: "openrouter",
9677
- baseUrl: "https://openrouter.ai/api/v1",
9678
- reasoning: false,
9679
- input: ["text", "image"],
9680
- cost: {
9681
- input: 2,
9682
- output: 6,
9683
- cacheRead: 0.19999999999999998,
9684
- cacheWrite: 0,
9685
- },
9686
- contextWindow: 131072,
9687
- maxTokens: 4096,
9688
- },
9689
9847
  "mistralai/voxtral-small-24b-2507": {
9690
9848
  id: "mistralai/voxtral-small-24b-2507",
9691
9849
  name: "Mistral: Voxtral Small 24B 2507",
@@ -9777,16 +9935,35 @@ export const MODELS = {
9777
9935
  api: "openai-completions",
9778
9936
  provider: "openrouter",
9779
9937
  baseUrl: "https://openrouter.ai/api/v1",
9938
+ compat: { "supportsDeveloperRole": false },
9780
9939
  reasoning: true,
9781
9940
  input: ["text", "image"],
9782
9941
  cost: {
9783
- input: 0.73,
9784
- output: 3.49,
9785
- cacheRead: 0.25,
9942
+ input: 0.684,
9943
+ output: 3.42,
9944
+ cacheRead: 0.144,
9945
+ cacheWrite: 0,
9946
+ },
9947
+ contextWindow: 262144,
9948
+ maxTokens: 262144,
9949
+ },
9950
+ "moonshotai/kimi-k2.6:free": {
9951
+ id: "moonshotai/kimi-k2.6:free",
9952
+ name: "MoonshotAI: Kimi K2.6 (free)",
9953
+ api: "openai-completions",
9954
+ provider: "openrouter",
9955
+ baseUrl: "https://openrouter.ai/api/v1",
9956
+ compat: { "supportsDeveloperRole": false },
9957
+ reasoning: true,
9958
+ input: ["text", "image"],
9959
+ cost: {
9960
+ input: 0,
9961
+ output: 0,
9962
+ cacheRead: 0,
9786
9963
  cacheWrite: 0,
9787
9964
  },
9788
9965
  contextWindow: 262144,
9789
- maxTokens: 262142,
9966
+ maxTokens: 4096,
9790
9967
  },
9791
9968
  "nex-agi/deepseek-v3.1-nex-n1": {
9792
9969
  id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -9863,36 +10040,70 @@ export const MODELS = {
9863
10040
  provider: "openrouter",
9864
10041
  baseUrl: "https://openrouter.ai/api/v1",
9865
10042
  reasoning: true,
9866
- input: ["text", "image"],
10043
+ input: ["text", "image"],
10044
+ cost: {
10045
+ input: 0,
10046
+ output: 0,
10047
+ cacheRead: 0,
10048
+ cacheWrite: 0,
10049
+ },
10050
+ contextWindow: 256000,
10051
+ maxTokens: 65536,
10052
+ },
10053
+ "nvidia/nemotron-3-super-120b-a12b": {
10054
+ id: "nvidia/nemotron-3-super-120b-a12b",
10055
+ name: "NVIDIA: Nemotron 3 Super",
10056
+ api: "openai-completions",
10057
+ provider: "openrouter",
10058
+ baseUrl: "https://openrouter.ai/api/v1",
10059
+ reasoning: true,
10060
+ input: ["text"],
10061
+ cost: {
10062
+ input: 0.09,
10063
+ output: 0.44999999999999996,
10064
+ cacheRead: 0,
10065
+ cacheWrite: 0,
10066
+ },
10067
+ contextWindow: 1000000,
10068
+ maxTokens: 4096,
10069
+ },
10070
+ "nvidia/nemotron-3-super-120b-a12b:free": {
10071
+ id: "nvidia/nemotron-3-super-120b-a12b:free",
10072
+ name: "NVIDIA: Nemotron 3 Super (free)",
10073
+ api: "openai-completions",
10074
+ provider: "openrouter",
10075
+ baseUrl: "https://openrouter.ai/api/v1",
10076
+ reasoning: true,
10077
+ input: ["text"],
9867
10078
  cost: {
9868
10079
  input: 0,
9869
10080
  output: 0,
9870
10081
  cacheRead: 0,
9871
10082
  cacheWrite: 0,
9872
10083
  },
9873
- contextWindow: 256000,
9874
- maxTokens: 65536,
10084
+ contextWindow: 1000000,
10085
+ maxTokens: 262144,
9875
10086
  },
9876
- "nvidia/nemotron-3-super-120b-a12b": {
9877
- id: "nvidia/nemotron-3-super-120b-a12b",
9878
- name: "NVIDIA: Nemotron 3 Super",
10087
+ "nvidia/nemotron-3-ultra-550b-a55b": {
10088
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
10089
+ name: "NVIDIA: Nemotron 3 Ultra",
9879
10090
  api: "openai-completions",
9880
10091
  provider: "openrouter",
9881
10092
  baseUrl: "https://openrouter.ai/api/v1",
9882
10093
  reasoning: true,
9883
10094
  input: ["text"],
9884
10095
  cost: {
9885
- input: 0.09,
9886
- output: 0.44999999999999996,
9887
- cacheRead: 0,
10096
+ input: 0.5,
10097
+ output: 2.5,
10098
+ cacheRead: 0.15,
9888
10099
  cacheWrite: 0,
9889
10100
  },
9890
10101
  contextWindow: 1000000,
9891
- maxTokens: 4096,
10102
+ maxTokens: 16384,
9892
10103
  },
9893
- "nvidia/nemotron-3-super-120b-a12b:free": {
9894
- id: "nvidia/nemotron-3-super-120b-a12b:free",
9895
- name: "NVIDIA: Nemotron 3 Super (free)",
10104
+ "nvidia/nemotron-3-ultra-550b-a55b:free": {
10105
+ id: "nvidia/nemotron-3-ultra-550b-a55b:free",
10106
+ name: "NVIDIA: Nemotron 3 Ultra (free)",
9896
10107
  api: "openai-completions",
9897
10108
  provider: "openrouter",
9898
10109
  baseUrl: "https://openrouter.ai/api/v1",
@@ -9905,7 +10116,7 @@ export const MODELS = {
9905
10116
  cacheWrite: 0,
9906
10117
  },
9907
10118
  contextWindow: 1000000,
9908
- maxTokens: 262144,
10119
+ maxTokens: 65536,
9909
10120
  },
9910
10121
  "nvidia/nemotron-nano-12b-v2-vl:free": {
9911
10122
  id: "nvidia/nemotron-nano-12b-v2-vl:free",
@@ -10026,23 +10237,6 @@ export const MODELS = {
10026
10237
  contextWindow: 8191,
10027
10238
  maxTokens: 4096,
10028
10239
  },
10029
- "openai/gpt-4-0314": {
10030
- id: "openai/gpt-4-0314",
10031
- name: "OpenAI: GPT-4 (older v0314)",
10032
- api: "openai-completions",
10033
- provider: "openrouter",
10034
- baseUrl: "https://openrouter.ai/api/v1",
10035
- reasoning: false,
10036
- input: ["text"],
10037
- cost: {
10038
- input: 30,
10039
- output: 60,
10040
- cacheRead: 0,
10041
- cacheWrite: 0,
10042
- },
10043
- contextWindow: 8191,
10044
- maxTokens: 4096,
10045
- },
10046
10240
  "openai/gpt-4-1106-preview": {
10047
10241
  id: "openai/gpt-4-1106-preview",
10048
10242
  name: "OpenAI: GPT-4 Turbo (older v1106)",
@@ -10213,23 +10407,6 @@ export const MODELS = {
10213
10407
  contextWindow: 128000,
10214
10408
  maxTokens: 16384,
10215
10409
  },
10216
- "openai/gpt-4o-audio-preview": {
10217
- id: "openai/gpt-4o-audio-preview",
10218
- name: "OpenAI: GPT-4o Audio",
10219
- api: "openai-completions",
10220
- provider: "openrouter",
10221
- baseUrl: "https://openrouter.ai/api/v1",
10222
- reasoning: false,
10223
- input: ["text"],
10224
- cost: {
10225
- input: 2.5,
10226
- output: 10,
10227
- cacheRead: 0,
10228
- cacheWrite: 0,
10229
- },
10230
- contextWindow: 128000,
10231
- maxTokens: 16384,
10232
- },
10233
10410
  "openai/gpt-4o-mini": {
10234
10411
  id: "openai/gpt-4o-mini",
10235
10412
  name: "OpenAI: GPT-4o-mini",
@@ -10377,11 +10554,11 @@ export const MODELS = {
10377
10554
  cost: {
10378
10555
  input: 1.25,
10379
10556
  output: 10,
10380
- cacheRead: 0.125,
10557
+ cacheRead: 0.13,
10381
10558
  cacheWrite: 0,
10382
10559
  },
10383
10560
  contextWindow: 128000,
10384
- maxTokens: 16384,
10561
+ maxTokens: 32000,
10385
10562
  },
10386
10563
  "openai/gpt-5.1-codex": {
10387
10564
  id: "openai/gpt-5.1-codex",
@@ -10394,7 +10571,7 @@ export const MODELS = {
10394
10571
  cost: {
10395
10572
  input: 1.25,
10396
10573
  output: 10,
10397
- cacheRead: 0.125,
10574
+ cacheRead: 0.13,
10398
10575
  cacheWrite: 0,
10399
10576
  },
10400
10577
  contextWindow: 400000,
@@ -10428,11 +10605,11 @@ export const MODELS = {
10428
10605
  cost: {
10429
10606
  input: 0.25,
10430
10607
  output: 2,
10431
- cacheRead: 0.03,
10608
+ cacheRead: 0.024999999999999998,
10432
10609
  cacheWrite: 0,
10433
10610
  },
10434
10611
  contextWindow: 400000,
10435
- maxTokens: 128000,
10612
+ maxTokens: 100000,
10436
10613
  },
10437
10614
  "openai/gpt-5.2": {
10438
10615
  id: "openai/gpt-5.2",
@@ -10468,7 +10645,7 @@ export const MODELS = {
10468
10645
  cacheWrite: 0,
10469
10646
  },
10470
10647
  contextWindow: 128000,
10471
- maxTokens: 32000,
10648
+ maxTokens: 16384,
10472
10649
  },
10473
10650
  "openai/gpt-5.2-codex": {
10474
10651
  id: "openai/gpt-5.2-codex",
@@ -10639,7 +10816,7 @@ export const MODELS = {
10639
10816
  provider: "openrouter",
10640
10817
  baseUrl: "https://openrouter.ai/api/v1",
10641
10818
  reasoning: true,
10642
- thinkingLevelMap: { "xhigh": "xhigh" },
10819
+ thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
10643
10820
  input: ["text", "image"],
10644
10821
  cost: {
10645
10822
  input: 30,
@@ -10744,13 +10921,13 @@ export const MODELS = {
10744
10921
  reasoning: true,
10745
10922
  input: ["text"],
10746
10923
  cost: {
10747
- input: 0.03,
10924
+ input: 0.029,
10748
10925
  output: 0.14,
10749
10926
  cacheRead: 0,
10750
10927
  cacheWrite: 0,
10751
10928
  },
10752
10929
  contextWindow: 131072,
10753
- maxTokens: 131072,
10930
+ maxTokens: 4096,
10754
10931
  },
10755
10932
  "openai/gpt-oss-20b:free": {
10756
10933
  id: "openai/gpt-oss-20b:free",
@@ -11004,8 +11181,8 @@ export const MODELS = {
11004
11181
  cacheRead: 0,
11005
11182
  cacheWrite: 0,
11006
11183
  },
11007
- contextWindow: 131072,
11008
- maxTokens: 8192,
11184
+ contextWindow: 262144,
11185
+ maxTokens: 32768,
11009
11186
  },
11010
11187
  "poolside/laguna-xs.2:free": {
11011
11188
  id: "poolside/laguna-xs.2:free",
@@ -11021,8 +11198,8 @@ export const MODELS = {
11021
11198
  cacheRead: 0,
11022
11199
  cacheWrite: 0,
11023
11200
  },
11024
- contextWindow: 131072,
11025
- maxTokens: 8192,
11201
+ contextWindow: 262144,
11202
+ maxTokens: 32768,
11026
11203
  },
11027
11204
  "prime-intellect/intellect-3": {
11028
11205
  id: "prime-intellect/intellect-3",
@@ -11058,23 +11235,6 @@ export const MODELS = {
11058
11235
  contextWindow: 131072,
11059
11236
  maxTokens: 16384,
11060
11237
  },
11061
- "qwen/qwen-2.5-7b-instruct": {
11062
- id: "qwen/qwen-2.5-7b-instruct",
11063
- name: "Qwen: Qwen2.5 7B Instruct",
11064
- api: "openai-completions",
11065
- provider: "openrouter",
11066
- baseUrl: "https://openrouter.ai/api/v1",
11067
- reasoning: false,
11068
- input: ["text"],
11069
- cost: {
11070
- input: 0.04,
11071
- output: 0.09999999999999999,
11072
- cacheRead: 0,
11073
- cacheWrite: 0,
11074
- },
11075
- contextWindow: 131072,
11076
- maxTokens: 32768,
11077
- },
11078
11238
  "qwen/qwen-plus": {
11079
11239
  id: "qwen/qwen-plus",
11080
11240
  name: "Qwen: Qwen-Plus",
@@ -11104,7 +11264,7 @@ export const MODELS = {
11104
11264
  input: 0.26,
11105
11265
  output: 0.78,
11106
11266
  cacheRead: 0,
11107
- cacheWrite: 0.325,
11267
+ cacheWrite: 0,
11108
11268
  },
11109
11269
  contextWindow: 1000000,
11110
11270
  maxTokens: 32768,
@@ -11186,13 +11346,13 @@ export const MODELS = {
11186
11346
  reasoning: true,
11187
11347
  input: ["text"],
11188
11348
  cost: {
11189
- input: 0.14950000000000002,
11190
- output: 1.495,
11191
- cacheRead: 0,
11349
+ input: 0.09999999999999999,
11350
+ output: 0.09999999999999999,
11351
+ cacheRead: 0.09999999999999999,
11192
11352
  cacheWrite: 0,
11193
11353
  },
11194
11354
  contextWindow: 262144,
11195
- maxTokens: 4096,
11355
+ maxTokens: 262144,
11196
11356
  },
11197
11357
  "qwen/qwen3-30b-a3b": {
11198
11358
  id: "qwen/qwen3-30b-a3b",
@@ -11220,13 +11380,13 @@ export const MODELS = {
11220
11380
  reasoning: false,
11221
11381
  input: ["text"],
11222
11382
  cost: {
11223
- input: 0.09,
11224
- output: 0.3,
11383
+ input: 0.04815,
11384
+ output: 0.19305,
11225
11385
  cacheRead: 0,
11226
11386
  cacheWrite: 0,
11227
11387
  },
11228
- contextWindow: 262144,
11229
- maxTokens: 262144,
11388
+ contextWindow: 131072,
11389
+ maxTokens: 32000,
11230
11390
  },
11231
11391
  "qwen/qwen3-30b-a3b-thinking-2507": {
11232
11392
  id: "qwen/qwen3-30b-a3b-thinking-2507",
@@ -11628,13 +11788,13 @@ export const MODELS = {
11628
11788
  reasoning: true,
11629
11789
  input: ["text", "image"],
11630
11790
  cost: {
11631
- input: 0.13899999999999998,
11791
+ input: 0.14,
11632
11792
  output: 1,
11633
- cacheRead: 0,
11793
+ cacheRead: 0.049999999999999996,
11634
11794
  cacheWrite: 0,
11635
11795
  },
11636
11796
  contextWindow: 262144,
11637
- maxTokens: 4096,
11797
+ maxTokens: 262144,
11638
11798
  },
11639
11799
  "qwen/qwen3.5-397b-a17b": {
11640
11800
  id: "qwen/qwen3.5-397b-a17b",
@@ -11682,7 +11842,7 @@ export const MODELS = {
11682
11842
  input: 0.065,
11683
11843
  output: 0.26,
11684
11844
  cacheRead: 0,
11685
- cacheWrite: 0.08125,
11845
+ cacheWrite: 0,
11686
11846
  },
11687
11847
  contextWindow: 1000000,
11688
11848
  maxTokens: 65536,
@@ -11699,7 +11859,7 @@ export const MODELS = {
11699
11859
  input: 0.26,
11700
11860
  output: 1.56,
11701
11861
  cacheRead: 0,
11702
- cacheWrite: 0.325,
11862
+ cacheWrite: 0,
11703
11863
  },
11704
11864
  contextWindow: 1000000,
11705
11865
  maxTokens: 65536,
@@ -11716,7 +11876,7 @@ export const MODELS = {
11716
11876
  input: 0.3,
11717
11877
  output: 1.7999999999999998,
11718
11878
  cacheRead: 0,
11719
- cacheWrite: 0,
11879
+ cacheWrite: 0.375,
11720
11880
  },
11721
11881
  contextWindow: 1000000,
11722
11882
  maxTokens: 65536,
@@ -11730,13 +11890,13 @@ export const MODELS = {
11730
11890
  reasoning: true,
11731
11891
  input: ["text", "image"],
11732
11892
  cost: {
11733
- input: 0.3,
11893
+ input: 0.29,
11734
11894
  output: 3.1999999999999997,
11735
11895
  cacheRead: 0,
11736
11896
  cacheWrite: 0,
11737
11897
  },
11738
11898
  contextWindow: 262144,
11739
- maxTokens: 262144,
11899
+ maxTokens: 262140,
11740
11900
  },
11741
11901
  "qwen/qwen3.6-35b-a3b": {
11742
11902
  id: "qwen/qwen3.6-35b-a3b",
@@ -11747,7 +11907,7 @@ export const MODELS = {
11747
11907
  reasoning: true,
11748
11908
  input: ["text", "image"],
11749
11909
  cost: {
11750
- input: 0.15,
11910
+ input: 0.14,
11751
11911
  output: 1,
11752
11912
  cacheRead: 0,
11753
11913
  cacheWrite: 0,
@@ -11815,10 +11975,27 @@ export const MODELS = {
11815
11975
  reasoning: true,
11816
11976
  input: ["text"],
11817
11977
  cost: {
11818
- input: 2.5,
11819
- output: 7.5,
11820
- cacheRead: 0,
11821
- cacheWrite: 3.125,
11978
+ input: 1.25,
11979
+ output: 3.75,
11980
+ cacheRead: 0.25,
11981
+ cacheWrite: 1.5625,
11982
+ },
11983
+ contextWindow: 1000000,
11984
+ maxTokens: 65536,
11985
+ },
11986
+ "qwen/qwen3.7-plus": {
11987
+ id: "qwen/qwen3.7-plus",
11988
+ name: "Qwen: Qwen3.7 Plus",
11989
+ api: "openai-completions",
11990
+ provider: "openrouter",
11991
+ baseUrl: "https://openrouter.ai/api/v1",
11992
+ reasoning: true,
11993
+ input: ["text", "image"],
11994
+ cost: {
11995
+ input: 0.39999999999999997,
11996
+ output: 1.5999999999999999,
11997
+ cacheRead: 0.08,
11998
+ cacheWrite: 0.5,
11822
11999
  },
11823
12000
  contextWindow: 1000000,
11824
12001
  maxTokens: 65536,
@@ -11908,6 +12085,23 @@ export const MODELS = {
11908
12085
  contextWindow: 262144,
11909
12086
  maxTokens: 16384,
11910
12087
  },
12088
+ "stepfun/step-3.7-flash": {
12089
+ id: "stepfun/step-3.7-flash",
12090
+ name: "StepFun: Step 3.7 Flash",
12091
+ api: "openai-completions",
12092
+ provider: "openrouter",
12093
+ baseUrl: "https://openrouter.ai/api/v1",
12094
+ reasoning: true,
12095
+ input: ["text", "image"],
12096
+ cost: {
12097
+ input: 0.19999999999999998,
12098
+ output: 1.15,
12099
+ cacheRead: 0.04,
12100
+ cacheWrite: 0,
12101
+ },
12102
+ contextWindow: 256000,
12103
+ maxTokens: 256000,
12104
+ },
11911
12105
  "tencent/hy3-preview": {
11912
12106
  id: "tencent/hy3-preview",
11913
12107
  name: "Tencent: Hy3 preview",
@@ -11917,13 +12111,13 @@ export const MODELS = {
11917
12111
  reasoning: true,
11918
12112
  input: ["text"],
11919
12113
  cost: {
11920
- input: 0.06599999999999999,
11921
- output: 0.26,
11922
- cacheRead: 0.029,
12114
+ input: 0.063,
12115
+ output: 0.21,
12116
+ cacheRead: 0.020999999999999998,
11923
12117
  cacheWrite: 0,
11924
12118
  },
11925
12119
  contextWindow: 262144,
11926
- maxTokens: 262144,
12120
+ maxTokens: 4096,
11927
12121
  },
11928
12122
  "thedrummer/rocinante-12b": {
11929
12123
  id: "thedrummer/rocinante-12b",
@@ -12044,40 +12238,6 @@ export const MODELS = {
12044
12238
  contextWindow: 262144,
12045
12239
  maxTokens: 65536,
12046
12240
  },
12047
- "xiaomi/mimo-v2-omni": {
12048
- id: "xiaomi/mimo-v2-omni",
12049
- name: "Xiaomi: MiMo-V2-Omni",
12050
- api: "openai-completions",
12051
- provider: "openrouter",
12052
- baseUrl: "https://openrouter.ai/api/v1",
12053
- reasoning: true,
12054
- input: ["text", "image"],
12055
- cost: {
12056
- input: 0.39999999999999997,
12057
- output: 2,
12058
- cacheRead: 0.08,
12059
- cacheWrite: 0,
12060
- },
12061
- contextWindow: 262144,
12062
- maxTokens: 65536,
12063
- },
12064
- "xiaomi/mimo-v2-pro": {
12065
- id: "xiaomi/mimo-v2-pro",
12066
- name: "Xiaomi: MiMo-V2-Pro",
12067
- api: "openai-completions",
12068
- provider: "openrouter",
12069
- baseUrl: "https://openrouter.ai/api/v1",
12070
- reasoning: true,
12071
- input: ["text"],
12072
- cost: {
12073
- input: 1,
12074
- output: 3,
12075
- cacheRead: 0.19999999999999998,
12076
- cacheWrite: 0,
12077
- },
12078
- contextWindow: 1048576,
12079
- maxTokens: 131072,
12080
- },
12081
12241
  "xiaomi/mimo-v2.5": {
12082
12242
  id: "xiaomi/mimo-v2.5",
12083
12243
  name: "Xiaomi: MiMo-V2.5",
@@ -12087,9 +12247,9 @@ export const MODELS = {
12087
12247
  reasoning: true,
12088
12248
  input: ["text", "image"],
12089
12249
  cost: {
12090
- input: 0.39999999999999997,
12091
- output: 2,
12092
- cacheRead: 0.08,
12250
+ input: 0.14,
12251
+ output: 0.28,
12252
+ cacheRead: 0.0028,
12093
12253
  cacheWrite: 0,
12094
12254
  },
12095
12255
  contextWindow: 1048576,
@@ -12104,13 +12264,13 @@ export const MODELS = {
12104
12264
  reasoning: true,
12105
12265
  input: ["text"],
12106
12266
  cost: {
12107
- input: 1,
12108
- output: 3,
12109
- cacheRead: 0.19999999999999998,
12267
+ input: 0.435,
12268
+ output: 0.87,
12269
+ cacheRead: 0.0036,
12110
12270
  cacheWrite: 0,
12111
12271
  },
12112
12272
  contextWindow: 1048576,
12113
- maxTokens: 16384,
12273
+ maxTokens: 131072,
12114
12274
  },
12115
12275
  "z-ai/glm-4-32b": {
12116
12276
  id: "z-ai/glm-4-32b",
@@ -12155,13 +12315,13 @@ export const MODELS = {
12155
12315
  reasoning: true,
12156
12316
  input: ["text"],
12157
12317
  cost: {
12158
- input: 0.13,
12318
+ input: 0.125,
12159
12319
  output: 0.85,
12160
- cacheRead: 0.024999999999999998,
12320
+ cacheRead: 0.06,
12161
12321
  cacheWrite: 0,
12162
12322
  },
12163
12323
  contextWindow: 131072,
12164
- maxTokens: 98304,
12324
+ maxTokens: 131070,
12165
12325
  },
12166
12326
  "z-ai/glm-4.5-air:free": {
12167
12327
  id: "z-ai/glm-4.5-air:free",
@@ -12427,13 +12587,13 @@ export const MODELS = {
12427
12587
  reasoning: true,
12428
12588
  input: ["text", "image"],
12429
12589
  cost: {
12430
- input: 0.73,
12431
- output: 3.49,
12432
- cacheRead: 0.25,
12590
+ input: 0.684,
12591
+ output: 3.42,
12592
+ cacheRead: 0.144,
12433
12593
  cacheWrite: 0,
12434
12594
  },
12435
12595
  contextWindow: 262144,
12436
- maxTokens: 262142,
12596
+ maxTokens: 262144,
12437
12597
  },
12438
12598
  "~openai/gpt-latest": {
12439
12599
  id: "~openai/gpt-latest",
@@ -12831,20 +12991,20 @@ export const MODELS = {
12831
12991
  },
12832
12992
  "alibaba/qwen-3-235b": {
12833
12993
  id: "alibaba/qwen-3-235b",
12834
- name: "Qwen3 235B A22b Instruct 2507",
12994
+ name: "Qwen3 235B A22B",
12835
12995
  api: "anthropic-messages",
12836
12996
  provider: "vercel-ai-gateway",
12837
12997
  baseUrl: "https://ai-gateway.vercel.sh",
12838
- reasoning: false,
12998
+ reasoning: true,
12839
12999
  input: ["text"],
12840
13000
  cost: {
12841
- input: 0.6,
12842
- output: 1.2,
12843
- cacheRead: 0.6,
13001
+ input: 0.22,
13002
+ output: 0.88,
13003
+ cacheRead: 0,
12844
13004
  cacheWrite: 0,
12845
13005
  },
12846
- contextWindow: 131000,
12847
- maxTokens: 40000,
13006
+ contextWindow: 262144,
13007
+ maxTokens: 16384,
12848
13008
  },
12849
13009
  "alibaba/qwen-3-30b": {
12850
13010
  id: "alibaba/qwen-3-30b",
@@ -12887,7 +13047,7 @@ export const MODELS = {
12887
13047
  provider: "vercel-ai-gateway",
12888
13048
  baseUrl: "https://ai-gateway.vercel.sh",
12889
13049
  reasoning: true,
12890
- input: ["text", "image"],
13050
+ input: ["text"],
12891
13051
  cost: {
12892
13052
  input: 1.3,
12893
13053
  output: 7.8,
@@ -12920,7 +13080,7 @@ export const MODELS = {
12920
13080
  api: "anthropic-messages",
12921
13081
  provider: "vercel-ai-gateway",
12922
13082
  baseUrl: "https://ai-gateway.vercel.sh",
12923
- reasoning: false,
13083
+ reasoning: true,
12924
13084
  input: ["text"],
12925
13085
  cost: {
12926
13086
  input: 1.5,
@@ -12954,7 +13114,7 @@ export const MODELS = {
12954
13114
  api: "anthropic-messages",
12955
13115
  provider: "vercel-ai-gateway",
12956
13116
  baseUrl: "https://ai-gateway.vercel.sh",
12957
- reasoning: false,
13117
+ reasoning: true,
12958
13118
  input: ["text"],
12959
13119
  cost: {
12960
13120
  input: 0.5,
@@ -13013,25 +13173,59 @@ export const MODELS = {
13013
13173
  cacheRead: 0.24,
13014
13174
  cacheWrite: 0,
13015
13175
  },
13016
- contextWindow: 262144,
13176
+ contextWindow: 262144,
13177
+ maxTokens: 32768,
13178
+ },
13179
+ "alibaba/qwen3-max-thinking": {
13180
+ id: "alibaba/qwen3-max-thinking",
13181
+ name: "Qwen 3 Max Thinking",
13182
+ api: "anthropic-messages",
13183
+ provider: "vercel-ai-gateway",
13184
+ baseUrl: "https://ai-gateway.vercel.sh",
13185
+ reasoning: true,
13186
+ input: ["text"],
13187
+ cost: {
13188
+ input: 1.2,
13189
+ output: 6,
13190
+ cacheRead: 0.24,
13191
+ cacheWrite: 0,
13192
+ },
13193
+ contextWindow: 256000,
13194
+ maxTokens: 65536,
13195
+ },
13196
+ "alibaba/qwen3-next-80b-a3b-instruct": {
13197
+ id: "alibaba/qwen3-next-80b-a3b-instruct",
13198
+ name: "Qwen3 Next 80B A3B Instruct",
13199
+ api: "anthropic-messages",
13200
+ provider: "vercel-ai-gateway",
13201
+ baseUrl: "https://ai-gateway.vercel.sh",
13202
+ reasoning: false,
13203
+ input: ["text"],
13204
+ cost: {
13205
+ input: 0.15,
13206
+ output: 1.2,
13207
+ cacheRead: 0,
13208
+ cacheWrite: 0,
13209
+ },
13210
+ contextWindow: 131072,
13017
13211
  maxTokens: 32768,
13018
13212
  },
13019
- "alibaba/qwen3-max-thinking": {
13020
- id: "alibaba/qwen3-max-thinking",
13021
- name: "Qwen 3 Max Thinking",
13213
+ "alibaba/qwen3-next-80b-a3b-thinking": {
13214
+ id: "alibaba/qwen3-next-80b-a3b-thinking",
13215
+ name: "Qwen3 Next 80B A3B Thinking",
13022
13216
  api: "anthropic-messages",
13023
13217
  provider: "vercel-ai-gateway",
13024
13218
  baseUrl: "https://ai-gateway.vercel.sh",
13025
13219
  reasoning: true,
13026
13220
  input: ["text"],
13027
13221
  cost: {
13028
- input: 1.2,
13029
- output: 6,
13030
- cacheRead: 0.24,
13222
+ input: 0.15,
13223
+ output: 1.2,
13224
+ cacheRead: 0,
13031
13225
  cacheWrite: 0,
13032
13226
  },
13033
- contextWindow: 256000,
13034
- maxTokens: 65536,
13227
+ contextWindow: 131072,
13228
+ maxTokens: 32768,
13035
13229
  },
13036
13230
  "alibaba/qwen3-vl-thinking": {
13037
13231
  id: "alibaba/qwen3-vl-thinking",
@@ -13125,7 +13319,7 @@ export const MODELS = {
13125
13319
  provider: "vercel-ai-gateway",
13126
13320
  baseUrl: "https://ai-gateway.vercel.sh",
13127
13321
  reasoning: true,
13128
- input: ["text", "image"],
13322
+ input: ["text"],
13129
13323
  cost: {
13130
13324
  input: 1.25,
13131
13325
  output: 3.75,
@@ -13135,6 +13329,23 @@ export const MODELS = {
13135
13329
  contextWindow: 991000,
13136
13330
  maxTokens: 64000,
13137
13331
  },
13332
+ "alibaba/qwen3.7-plus": {
13333
+ id: "alibaba/qwen3.7-plus",
13334
+ name: "Qwen 3.7 Plus",
13335
+ api: "anthropic-messages",
13336
+ provider: "vercel-ai-gateway",
13337
+ baseUrl: "https://ai-gateway.vercel.sh",
13338
+ reasoning: true,
13339
+ input: ["text", "image"],
13340
+ cost: {
13341
+ input: 0.39999999999999997,
13342
+ output: 1.5999999999999999,
13343
+ cacheRead: 0.08,
13344
+ cacheWrite: 0.5,
13345
+ },
13346
+ contextWindow: 1000000,
13347
+ maxTokens: 64000,
13348
+ },
13138
13349
  "anthropic/claude-3-haiku": {
13139
13350
  id: "anthropic/claude-3-haiku",
13140
13351
  name: "Claude 3 Haiku",
@@ -13243,6 +13454,7 @@ export const MODELS = {
13243
13454
  api: "anthropic-messages",
13244
13455
  provider: "vercel-ai-gateway",
13245
13456
  baseUrl: "https://ai-gateway.vercel.sh",
13457
+ compat: { "forceAdaptiveThinking": true },
13246
13458
  reasoning: true,
13247
13459
  thinkingLevelMap: { "xhigh": "max" },
13248
13460
  input: ["text", "image"],
@@ -13261,6 +13473,7 @@ export const MODELS = {
13261
13473
  api: "anthropic-messages",
13262
13474
  provider: "vercel-ai-gateway",
13263
13475
  baseUrl: "https://ai-gateway.vercel.sh",
13476
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13264
13477
  reasoning: true,
13265
13478
  thinkingLevelMap: { "xhigh": "xhigh" },
13266
13479
  input: ["text", "image"],
@@ -13273,6 +13486,24 @@ export const MODELS = {
13273
13486
  contextWindow: 1000000,
13274
13487
  maxTokens: 128000,
13275
13488
  },
13489
+ "anthropic/claude-opus-4.8": {
13490
+ id: "anthropic/claude-opus-4.8",
13491
+ name: "Claude Opus 4.8",
13492
+ api: "anthropic-messages",
13493
+ provider: "vercel-ai-gateway",
13494
+ baseUrl: "https://ai-gateway.vercel.sh",
13495
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13496
+ reasoning: true,
13497
+ input: ["text", "image"],
13498
+ cost: {
13499
+ input: 5,
13500
+ output: 25,
13501
+ cacheRead: 0.5,
13502
+ cacheWrite: 6.25,
13503
+ },
13504
+ contextWindow: 1000000,
13505
+ maxTokens: 128000,
13506
+ },
13276
13507
  "anthropic/claude-sonnet-4": {
13277
13508
  id: "anthropic/claude-sonnet-4",
13278
13509
  name: "Claude Sonnet 4",
@@ -13313,6 +13544,7 @@ export const MODELS = {
13313
13544
  api: "anthropic-messages",
13314
13545
  provider: "vercel-ai-gateway",
13315
13546
  baseUrl: "https://ai-gateway.vercel.sh",
13547
+ compat: { "forceAdaptiveThinking": true },
13316
13548
  reasoning: true,
13317
13549
  input: ["text", "image"],
13318
13550
  cost: {
@@ -13418,17 +13650,17 @@ export const MODELS = {
13418
13650
  reasoning: false,
13419
13651
  input: ["text"],
13420
13652
  cost: {
13421
- input: 0.77,
13422
- output: 0.77,
13423
- cacheRead: 0,
13653
+ input: 0.27,
13654
+ output: 1.12,
13655
+ cacheRead: 0.135,
13424
13656
  cacheWrite: 0,
13425
13657
  },
13426
13658
  contextWindow: 163840,
13427
- maxTokens: 16384,
13659
+ maxTokens: 163840,
13428
13660
  },
13429
13661
  "deepseek/deepseek-v3.1": {
13430
13662
  id: "deepseek/deepseek-v3.1",
13431
- name: "DeepSeek-V3.1",
13663
+ name: "DeepSeek V3.1",
13432
13664
  api: "anthropic-messages",
13433
13665
  provider: "vercel-ai-gateway",
13434
13666
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -13466,8 +13698,8 @@ export const MODELS = {
13466
13698
  api: "anthropic-messages",
13467
13699
  provider: "vercel-ai-gateway",
13468
13700
  baseUrl: "https://ai-gateway.vercel.sh",
13469
- reasoning: false,
13470
- input: ["text"],
13701
+ reasoning: true,
13702
+ input: ["text", "image"],
13471
13703
  cost: {
13472
13704
  input: 0.28,
13473
13705
  output: 0.42,
@@ -13483,8 +13715,8 @@ export const MODELS = {
13483
13715
  api: "anthropic-messages",
13484
13716
  provider: "vercel-ai-gateway",
13485
13717
  baseUrl: "https://ai-gateway.vercel.sh",
13486
- reasoning: false,
13487
- input: ["text"],
13718
+ reasoning: true,
13719
+ input: ["text", "image"],
13488
13720
  cost: {
13489
13721
  input: 0.62,
13490
13722
  output: 1.85,
@@ -13501,7 +13733,7 @@ export const MODELS = {
13501
13733
  provider: "vercel-ai-gateway",
13502
13734
  baseUrl: "https://ai-gateway.vercel.sh",
13503
13735
  reasoning: true,
13504
- input: ["text"],
13736
+ input: ["text", "image"],
13505
13737
  cost: {
13506
13738
  input: 0.14,
13507
13739
  output: 0.28,
@@ -13721,12 +13953,12 @@ export const MODELS = {
13721
13953
  api: "anthropic-messages",
13722
13954
  provider: "vercel-ai-gateway",
13723
13955
  baseUrl: "https://ai-gateway.vercel.sh",
13724
- reasoning: false,
13956
+ reasoning: true,
13725
13957
  input: ["text", "image"],
13726
13958
  cost: {
13727
- input: 0.13,
13728
- output: 0.39999999999999997,
13729
- cacheRead: 0,
13959
+ input: 0.15,
13960
+ output: 0.6,
13961
+ cacheRead: 0.015,
13730
13962
  cacheWrite: 0,
13731
13963
  },
13732
13964
  contextWindow: 262144,
@@ -14028,7 +14260,7 @@ export const MODELS = {
14028
14260
  provider: "vercel-ai-gateway",
14029
14261
  baseUrl: "https://ai-gateway.vercel.sh",
14030
14262
  reasoning: true,
14031
- input: ["text", "image"],
14263
+ input: ["text"],
14032
14264
  cost: {
14033
14265
  input: 0.3,
14034
14266
  output: 1.2,
@@ -14045,7 +14277,7 @@ export const MODELS = {
14045
14277
  provider: "vercel-ai-gateway",
14046
14278
  baseUrl: "https://ai-gateway.vercel.sh",
14047
14279
  reasoning: true,
14048
- input: ["text", "image"],
14280
+ input: ["text"],
14049
14281
  cost: {
14050
14282
  input: 0.6,
14051
14283
  output: 2.4,
@@ -14055,6 +14287,23 @@ export const MODELS = {
14055
14287
  contextWindow: 204800,
14056
14288
  maxTokens: 131100,
14057
14289
  },
14290
+ "minimax/minimax-m3": {
14291
+ id: "minimax/minimax-m3",
14292
+ name: "MiniMax M3",
14293
+ api: "anthropic-messages",
14294
+ provider: "vercel-ai-gateway",
14295
+ baseUrl: "https://ai-gateway.vercel.sh",
14296
+ reasoning: true,
14297
+ input: ["text", "image"],
14298
+ cost: {
14299
+ input: 0.3,
14300
+ output: 1.2,
14301
+ cacheRead: 0.06,
14302
+ cacheWrite: 0,
14303
+ },
14304
+ contextWindow: 1000000,
14305
+ maxTokens: 1000000,
14306
+ },
14058
14307
  "mistral/codestral": {
14059
14308
  id: "mistral/codestral",
14060
14309
  name: "Mistral Codestral",
@@ -14191,6 +14440,23 @@ export const MODELS = {
14191
14440
  contextWindow: 256000,
14192
14441
  maxTokens: 256000,
14193
14442
  },
14443
+ "mistral/mistral-nemo": {
14444
+ id: "mistral/mistral-nemo",
14445
+ name: "Mistral Nemo 12B",
14446
+ api: "anthropic-messages",
14447
+ provider: "vercel-ai-gateway",
14448
+ baseUrl: "https://ai-gateway.vercel.sh",
14449
+ reasoning: false,
14450
+ input: ["text"],
14451
+ cost: {
14452
+ input: 0.02,
14453
+ output: 0.04,
14454
+ cacheRead: 0,
14455
+ cacheWrite: 0,
14456
+ },
14457
+ contextWindow: 131072,
14458
+ maxTokens: 131072,
14459
+ },
14194
14460
  "mistral/mistral-small": {
14195
14461
  id: "mistral/mistral-small",
14196
14462
  name: "Mistral Small",
@@ -14344,6 +14610,40 @@ export const MODELS = {
14344
14610
  contextWindow: 262000,
14345
14611
  maxTokens: 262000,
14346
14612
  },
14613
+ "nvidia/nemotron-3-super-120b-a12b": {
14614
+ id: "nvidia/nemotron-3-super-120b-a12b",
14615
+ name: "NVIDIA Nemotron 3 Super 120B A12B",
14616
+ api: "anthropic-messages",
14617
+ provider: "vercel-ai-gateway",
14618
+ baseUrl: "https://ai-gateway.vercel.sh",
14619
+ reasoning: true,
14620
+ input: ["text"],
14621
+ cost: {
14622
+ input: 0.15,
14623
+ output: 0.65,
14624
+ cacheRead: 0,
14625
+ cacheWrite: 0,
14626
+ },
14627
+ contextWindow: 256000,
14628
+ maxTokens: 32000,
14629
+ },
14630
+ "nvidia/nemotron-3-ultra-550b-a55b": {
14631
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
14632
+ name: "Nemotron 3 Ultra",
14633
+ api: "anthropic-messages",
14634
+ provider: "vercel-ai-gateway",
14635
+ baseUrl: "https://ai-gateway.vercel.sh",
14636
+ reasoning: true,
14637
+ input: ["text"],
14638
+ cost: {
14639
+ input: 0.5,
14640
+ output: 2.5,
14641
+ cacheRead: 0.15,
14642
+ cacheWrite: 0,
14643
+ },
14644
+ contextWindow: 262144,
14645
+ maxTokens: 65000,
14646
+ },
14347
14647
  "nvidia/nemotron-nano-12b-v2-vl": {
14348
14648
  id: "nvidia/nemotron-nano-12b-v2-vl",
14349
14649
  name: "Nvidia Nemotron Nano 12B V2 VL",
@@ -14521,7 +14821,7 @@ export const MODELS = {
14521
14821
  provider: "vercel-ai-gateway",
14522
14822
  baseUrl: "https://ai-gateway.vercel.sh",
14523
14823
  reasoning: true,
14524
- input: ["text"],
14824
+ input: ["text", "image"],
14525
14825
  cost: {
14526
14826
  input: 1.25,
14527
14827
  output: 10,
@@ -14872,7 +15172,7 @@ export const MODELS = {
14872
15172
  provider: "vercel-ai-gateway",
14873
15173
  baseUrl: "https://ai-gateway.vercel.sh",
14874
15174
  reasoning: true,
14875
- thinkingLevelMap: { "xhigh": "xhigh" },
15175
+ thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
14876
15176
  input: ["text", "image"],
14877
15177
  cost: {
14878
15178
  input: 30,
@@ -14883,6 +15183,23 @@ export const MODELS = {
14883
15183
  contextWindow: 1000000,
14884
15184
  maxTokens: 128000,
14885
15185
  },
15186
+ "openai/gpt-oss-120b": {
15187
+ id: "openai/gpt-oss-120b",
15188
+ name: "GPT OSS 120B",
15189
+ api: "anthropic-messages",
15190
+ provider: "vercel-ai-gateway",
15191
+ baseUrl: "https://ai-gateway.vercel.sh",
15192
+ reasoning: true,
15193
+ input: ["text"],
15194
+ cost: {
15195
+ input: 0.35,
15196
+ output: 0.75,
15197
+ cacheRead: 0.25,
15198
+ cacheWrite: 0,
15199
+ },
15200
+ contextWindow: 131072,
15201
+ maxTokens: 131000,
15202
+ },
14886
15203
  "openai/gpt-oss-20b": {
14887
15204
  id: "openai/gpt-oss-20b",
14888
15205
  name: "GPT OSS 20B",
@@ -15053,6 +15370,40 @@ export const MODELS = {
15053
15370
  contextWindow: 200000,
15054
15371
  maxTokens: 8000,
15055
15372
  },
15373
+ "stepfun/step-3.5-flash": {
15374
+ id: "stepfun/step-3.5-flash",
15375
+ name: "StepFun 3.5 Flash",
15376
+ api: "anthropic-messages",
15377
+ provider: "vercel-ai-gateway",
15378
+ baseUrl: "https://ai-gateway.vercel.sh",
15379
+ reasoning: true,
15380
+ input: ["text"],
15381
+ cost: {
15382
+ input: 0.09,
15383
+ output: 0.3,
15384
+ cacheRead: 0,
15385
+ cacheWrite: 0.02,
15386
+ },
15387
+ contextWindow: 262114,
15388
+ maxTokens: 262114,
15389
+ },
15390
+ "stepfun/step-3.7-flash": {
15391
+ id: "stepfun/step-3.7-flash",
15392
+ name: "Step 3.7 Flash",
15393
+ api: "anthropic-messages",
15394
+ provider: "vercel-ai-gateway",
15395
+ baseUrl: "https://ai-gateway.vercel.sh",
15396
+ reasoning: true,
15397
+ input: ["text", "image"],
15398
+ cost: {
15399
+ input: 0.19999999999999998,
15400
+ output: 1.15,
15401
+ cacheRead: 0.04,
15402
+ cacheWrite: 0,
15403
+ },
15404
+ contextWindow: 256000,
15405
+ maxTokens: 256000,
15406
+ },
15056
15407
  "xai/grok-4.1-fast-non-reasoning": {
15057
15408
  id: "xai/grok-4.1-fast-non-reasoning",
15058
15409
  name: "Grok 4.1 Fast Non-Reasoning",
@@ -15266,9 +15617,9 @@ export const MODELS = {
15266
15617
  reasoning: true,
15267
15618
  input: ["text", "image"],
15268
15619
  cost: {
15269
- input: 0.39999999999999997,
15270
- output: 2,
15271
- cacheRead: 0.08,
15620
+ input: 0.14,
15621
+ output: 0.28,
15622
+ cacheRead: 0.0028,
15272
15623
  cacheWrite: 0,
15273
15624
  },
15274
15625
  contextWindow: 1050000,
@@ -15283,9 +15634,9 @@ export const MODELS = {
15283
15634
  reasoning: true,
15284
15635
  input: ["text", "image"],
15285
15636
  cost: {
15286
- input: 1,
15287
- output: 3,
15288
- cacheRead: 0.19999999999999998,
15637
+ input: 0.435,
15638
+ output: 0.87,
15639
+ cacheRead: 0.0036,
15289
15640
  cacheWrite: 0,
15290
15641
  },
15291
15642
  contextWindow: 1050000,
@@ -15331,7 +15682,7 @@ export const MODELS = {
15331
15682
  api: "anthropic-messages",
15332
15683
  provider: "vercel-ai-gateway",
15333
15684
  baseUrl: "https://ai-gateway.vercel.sh",
15334
- reasoning: false,
15685
+ reasoning: true,
15335
15686
  input: ["text", "image"],
15336
15687
  cost: {
15337
15688
  input: 0.6,
@@ -15485,7 +15836,7 @@ export const MODELS = {
15485
15836
  provider: "vercel-ai-gateway",
15486
15837
  baseUrl: "https://ai-gateway.vercel.sh",
15487
15838
  reasoning: true,
15488
- input: ["text"],
15839
+ input: ["text", "image"],
15489
15840
  cost: {
15490
15841
  input: 1.4,
15491
15842
  output: 4.4,
@@ -15727,24 +16078,6 @@ export const MODELS = {
15727
16078
  },
15728
16079
  },
15729
16080
  "xiaomi-token-plan-ams": {
15730
- "mimo-v2-flash": {
15731
- id: "mimo-v2-flash",
15732
- name: "MiMo-V2-Flash",
15733
- api: "openai-completions",
15734
- provider: "xiaomi-token-plan-ams",
15735
- baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
15736
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15737
- reasoning: true,
15738
- input: ["text"],
15739
- cost: {
15740
- input: 0.1,
15741
- output: 0.3,
15742
- cacheRead: 0.01,
15743
- cacheWrite: 0,
15744
- },
15745
- contextWindow: 262144,
15746
- maxTokens: 65536,
15747
- },
15748
16081
  "mimo-v2-omni": {
15749
16082
  id: "mimo-v2-omni",
15750
16083
  name: "MiMo-V2-Omni",
@@ -15819,24 +16152,6 @@ export const MODELS = {
15819
16152
  },
15820
16153
  },
15821
16154
  "xiaomi-token-plan-cn": {
15822
- "mimo-v2-flash": {
15823
- id: "mimo-v2-flash",
15824
- name: "MiMo-V2-Flash",
15825
- api: "openai-completions",
15826
- provider: "xiaomi-token-plan-cn",
15827
- baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
15828
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15829
- reasoning: true,
15830
- input: ["text"],
15831
- cost: {
15832
- input: 0.1,
15833
- output: 0.3,
15834
- cacheRead: 0.01,
15835
- cacheWrite: 0,
15836
- },
15837
- contextWindow: 262144,
15838
- maxTokens: 65536,
15839
- },
15840
16155
  "mimo-v2-omni": {
15841
16156
  id: "mimo-v2-omni",
15842
16157
  name: "MiMo-V2-Omni",
@@ -15911,24 +16226,6 @@ export const MODELS = {
15911
16226
  },
15912
16227
  },
15913
16228
  "xiaomi-token-plan-sgp": {
15914
- "mimo-v2-flash": {
15915
- id: "mimo-v2-flash",
15916
- name: "MiMo-V2-Flash",
15917
- api: "openai-completions",
15918
- provider: "xiaomi-token-plan-sgp",
15919
- baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
15920
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15921
- reasoning: true,
15922
- input: ["text"],
15923
- cost: {
15924
- input: 0.1,
15925
- output: 0.3,
15926
- cacheRead: 0.01,
15927
- cacheWrite: 0,
15928
- },
15929
- contextWindow: 262144,
15930
- maxTokens: 65536,
15931
- },
15932
16229
  "mimo-v2-omni": {
15933
16230
  id: "mimo-v2-omni",
15934
16231
  name: "MiMo-V2-Omni",