@caupulican/pi-ai 0.75.6 → 0.78.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (71) hide show
  1. package/README.md +1 -1
  2. package/dist/image-models.generated.d.ts.map +1 -1
  3. package/dist/image-models.generated.js +146 -146
  4. package/dist/image-models.generated.js.map +1 -1
  5. package/dist/models.generated.d.ts +500 -298
  6. package/dist/models.generated.d.ts.map +1 -1
  7. package/dist/models.generated.js +617 -491
  8. package/dist/models.generated.js.map +1 -1
  9. package/dist/providers/amazon-bedrock.d.ts +1 -1
  10. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  11. package/dist/providers/amazon-bedrock.js +48 -5
  12. package/dist/providers/amazon-bedrock.js.map +1 -1
  13. package/dist/providers/anthropic.d.ts.map +1 -1
  14. package/dist/providers/anthropic.js +51 -15
  15. package/dist/providers/anthropic.js.map +1 -1
  16. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  17. package/dist/providers/azure-openai-responses.js +6 -10
  18. package/dist/providers/azure-openai-responses.js.map +1 -1
  19. package/dist/providers/google-vertex.d.ts.map +1 -1
  20. package/dist/providers/google-vertex.js +1 -1
  21. package/dist/providers/google-vertex.js.map +1 -1
  22. package/dist/providers/google.d.ts.map +1 -1
  23. package/dist/providers/google.js +5 -3
  24. package/dist/providers/google.js.map +1 -1
  25. package/dist/providers/images/openrouter.d.ts.map +1 -1
  26. package/dist/providers/images/openrouter.js +3 -4
  27. package/dist/providers/images/openrouter.js.map +1 -1
  28. package/dist/providers/mistral.d.ts.map +1 -1
  29. package/dist/providers/mistral.js +2 -3
  30. package/dist/providers/mistral.js.map +1 -1
  31. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  32. package/dist/providers/openai-codex-responses.js +159 -78
  33. package/dist/providers/openai-codex-responses.js.map +1 -1
  34. package/dist/providers/openai-completions.d.ts.map +1 -1
  35. package/dist/providers/openai-completions.js +44 -18
  36. package/dist/providers/openai-completions.js.map +1 -1
  37. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  38. package/dist/providers/openai-responses-shared.js +4 -1
  39. package/dist/providers/openai-responses-shared.js.map +1 -1
  40. package/dist/providers/openai-responses.d.ts.map +1 -1
  41. package/dist/providers/openai-responses.js +6 -10
  42. package/dist/providers/openai-responses.js.map +1 -1
  43. package/dist/providers/simple-options.d.ts.map +1 -1
  44. package/dist/providers/simple-options.js +1 -0
  45. package/dist/providers/simple-options.js.map +1 -1
  46. package/dist/stream.d.ts.map +1 -1
  47. package/dist/stream.js +14 -2
  48. package/dist/stream.js.map +1 -1
  49. package/dist/types.d.ts +21 -5
  50. package/dist/types.d.ts.map +1 -1
  51. package/dist/types.js.map +1 -1
  52. package/dist/utils/abort-signals.d.ts +6 -0
  53. package/dist/utils/abort-signals.d.ts.map +1 -0
  54. package/dist/utils/abort-signals.js +34 -0
  55. package/dist/utils/abort-signals.js.map +1 -0
  56. package/dist/utils/oauth/device-code.d.ts +9 -7
  57. package/dist/utils/oauth/device-code.d.ts.map +1 -1
  58. package/dist/utils/oauth/device-code.js +8 -7
  59. package/dist/utils/oauth/device-code.js.map +1 -1
  60. package/dist/utils/oauth/github-copilot.d.ts.map +1 -1
  61. package/dist/utils/oauth/github-copilot.js +1 -1
  62. package/dist/utils/oauth/github-copilot.js.map +1 -1
  63. package/dist/utils/oauth/index.d.ts +1 -1
  64. package/dist/utils/oauth/index.d.ts.map +1 -1
  65. package/dist/utils/oauth/index.js +1 -1
  66. package/dist/utils/oauth/index.js.map +1 -1
  67. package/dist/utils/oauth/openai-codex.d.ts +10 -1
  68. package/dist/utils/oauth/openai-codex.d.ts.map +1 -1
  69. package/dist/utils/oauth/openai-codex.js +179 -79
  70. package/dist/utils/oauth/openai-codex.js.map +1 -1
  71. package/package.json +104 -91
@@ -157,6 +157,24 @@ export const MODELS = {
157
157
  contextWindow: 1000000,
158
158
  maxTokens: 128000,
159
159
  },
160
+ "anthropic.claude-opus-4-8": {
161
+ id: "anthropic.claude-opus-4-8",
162
+ name: "Claude Opus 4.8",
163
+ api: "bedrock-converse-stream",
164
+ provider: "amazon-bedrock",
165
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
166
+ reasoning: true,
167
+ thinkingLevelMap: { "xhigh": "xhigh" },
168
+ input: ["text", "image"],
169
+ cost: {
170
+ input: 5,
171
+ output: 25,
172
+ cacheRead: 0.5,
173
+ cacheWrite: 6.25,
174
+ },
175
+ contextWindow: 1000000,
176
+ maxTokens: 128000,
177
+ },
160
178
  "anthropic.claude-sonnet-4-5-20250929-v1:0": {
161
179
  id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
162
180
  name: "Claude Sonnet 4.5",
@@ -226,6 +244,24 @@ export const MODELS = {
226
244
  contextWindow: 1000000,
227
245
  maxTokens: 128000,
228
246
  },
247
+ "au.anthropic.claude-opus-4-8": {
248
+ id: "au.anthropic.claude-opus-4-8",
249
+ name: "Claude Opus 4.8 (AU)",
250
+ api: "bedrock-converse-stream",
251
+ provider: "amazon-bedrock",
252
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
253
+ reasoning: true,
254
+ thinkingLevelMap: { "xhigh": "xhigh" },
255
+ input: ["text", "image"],
256
+ cost: {
257
+ input: 5,
258
+ output: 25,
259
+ cacheRead: 0.5,
260
+ cacheWrite: 6.25,
261
+ },
262
+ contextWindow: 1000000,
263
+ maxTokens: 128000,
264
+ },
229
265
  "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
230
266
  id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
231
267
  name: "Claude Sonnet 4.5 (AU)",
@@ -355,8 +391,8 @@ export const MODELS = {
355
391
  thinkingLevelMap: { "xhigh": "max" },
356
392
  input: ["text", "image"],
357
393
  cost: {
358
- input: 5,
359
- output: 25,
394
+ input: 5.5,
395
+ output: 27.5,
360
396
  cacheRead: 0.5,
361
397
  cacheWrite: 6.25,
362
398
  },
@@ -373,10 +409,28 @@ export const MODELS = {
373
409
  thinkingLevelMap: { "xhigh": "xhigh" },
374
410
  input: ["text", "image"],
375
411
  cost: {
376
- input: 5,
377
- output: 25,
378
- cacheRead: 0.5,
379
- cacheWrite: 6.25,
412
+ input: 5.5,
413
+ output: 27.5,
414
+ cacheRead: 0.55,
415
+ cacheWrite: 6.875,
416
+ },
417
+ contextWindow: 1000000,
418
+ maxTokens: 128000,
419
+ },
420
+ "eu.anthropic.claude-opus-4-8": {
421
+ id: "eu.anthropic.claude-opus-4-8",
422
+ name: "Claude Opus 4.8 (EU)",
423
+ api: "bedrock-converse-stream",
424
+ provider: "amazon-bedrock",
425
+ baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
426
+ reasoning: true,
427
+ thinkingLevelMap: { "xhigh": "xhigh" },
428
+ input: ["text", "image"],
429
+ cost: {
430
+ input: 5.5,
431
+ output: 27.5,
432
+ cacheRead: 0.55,
433
+ cacheWrite: 6.875,
380
434
  },
381
435
  contextWindow: 1000000,
382
436
  maxTokens: 128000,
@@ -390,10 +444,10 @@ export const MODELS = {
390
444
  reasoning: true,
391
445
  input: ["text", "image"],
392
446
  cost: {
393
- input: 3,
394
- output: 15,
395
- cacheRead: 0.3,
396
- cacheWrite: 3.75,
447
+ input: 3.3,
448
+ output: 16.5,
449
+ cacheRead: 0.33,
450
+ cacheWrite: 4.125,
397
451
  },
398
452
  contextWindow: 200000,
399
453
  maxTokens: 64000,
@@ -407,10 +461,10 @@ export const MODELS = {
407
461
  reasoning: true,
408
462
  input: ["text", "image"],
409
463
  cost: {
410
- input: 3,
411
- output: 15,
412
- cacheRead: 0.3,
413
- cacheWrite: 3.75,
464
+ input: 3.3,
465
+ output: 16.5,
466
+ cacheRead: 0.33,
467
+ cacheWrite: 4.125,
414
468
  },
415
469
  contextWindow: 1000000,
416
470
  maxTokens: 64000,
@@ -485,6 +539,24 @@ export const MODELS = {
485
539
  contextWindow: 1000000,
486
540
  maxTokens: 128000,
487
541
  },
542
+ "global.anthropic.claude-opus-4-8": {
543
+ id: "global.anthropic.claude-opus-4-8",
544
+ name: "Claude Opus 4.8 (Global)",
545
+ api: "bedrock-converse-stream",
546
+ provider: "amazon-bedrock",
547
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
548
+ reasoning: true,
549
+ thinkingLevelMap: { "xhigh": "xhigh" },
550
+ input: ["text", "image"],
551
+ cost: {
552
+ input: 5,
553
+ output: 25,
554
+ cacheRead: 0.5,
555
+ cacheWrite: 6.25,
556
+ },
557
+ contextWindow: 1000000,
558
+ maxTokens: 128000,
559
+ },
488
560
  "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
489
561
  id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
490
562
  name: "Claude Sonnet 4.5 (Global)",
@@ -571,6 +643,24 @@ export const MODELS = {
571
643
  contextWindow: 1000000,
572
644
  maxTokens: 128000,
573
645
  },
646
+ "jp.anthropic.claude-opus-4-8": {
647
+ id: "jp.anthropic.claude-opus-4-8",
648
+ name: "Claude Opus 4.8 (JP)",
649
+ api: "bedrock-converse-stream",
650
+ provider: "amazon-bedrock",
651
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
652
+ reasoning: true,
653
+ thinkingLevelMap: { "xhigh": "xhigh" },
654
+ input: ["text", "image"],
655
+ cost: {
656
+ input: 5,
657
+ output: 25,
658
+ cacheRead: 0.5,
659
+ cacheWrite: 6.25,
660
+ },
661
+ contextWindow: 1000000,
662
+ maxTokens: 128000,
663
+ },
574
664
  "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
575
665
  id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
576
666
  name: "Claude Sonnet 4.5 (JP)",
@@ -1270,6 +1360,24 @@ export const MODELS = {
1270
1360
  contextWindow: 1000000,
1271
1361
  maxTokens: 128000,
1272
1362
  },
1363
+ "us.anthropic.claude-opus-4-8": {
1364
+ id: "us.anthropic.claude-opus-4-8",
1365
+ name: "Claude Opus 4.8 (US)",
1366
+ api: "bedrock-converse-stream",
1367
+ provider: "amazon-bedrock",
1368
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1369
+ reasoning: true,
1370
+ thinkingLevelMap: { "xhigh": "xhigh" },
1371
+ input: ["text", "image"],
1372
+ cost: {
1373
+ input: 5,
1374
+ output: 25,
1375
+ cacheRead: 0.5,
1376
+ cacheWrite: 6.25,
1377
+ },
1378
+ contextWindow: 1000000,
1379
+ maxTokens: 128000,
1380
+ },
1273
1381
  "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1274
1382
  id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1275
1383
  name: "Claude Sonnet 4.5 (US)",
@@ -1739,7 +1847,26 @@ export const MODELS = {
1739
1847
  api: "anthropic-messages",
1740
1848
  provider: "anthropic",
1741
1849
  baseUrl: "https://api.anthropic.com",
1742
- compat: { "forceAdaptiveThinking": true },
1850
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1851
+ reasoning: true,
1852
+ thinkingLevelMap: { "xhigh": "xhigh" },
1853
+ input: ["text", "image"],
1854
+ cost: {
1855
+ input: 5,
1856
+ output: 25,
1857
+ cacheRead: 0.5,
1858
+ cacheWrite: 6.25,
1859
+ },
1860
+ contextWindow: 1000000,
1861
+ maxTokens: 128000,
1862
+ },
1863
+ "claude-opus-4-8": {
1864
+ id: "claude-opus-4-8",
1865
+ name: "Claude Opus 4.8",
1866
+ api: "anthropic-messages",
1867
+ provider: "anthropic",
1868
+ baseUrl: "https://api.anthropic.com",
1869
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1743
1870
  reasoning: true,
1744
1871
  thinkingLevelMap: { "xhigh": "xhigh" },
1745
1872
  input: ["text", "image"],
@@ -1919,7 +2046,7 @@ export const MODELS = {
1919
2046
  cost: {
1920
2047
  input: 0.1,
1921
2048
  output: 0.4,
1922
- cacheRead: 0.03,
2049
+ cacheRead: 0.025,
1923
2050
  cacheWrite: 0,
1924
2051
  },
1925
2052
  contextWindow: 1047576,
@@ -2004,7 +2131,7 @@ export const MODELS = {
2004
2131
  cost: {
2005
2132
  input: 0.15,
2006
2133
  output: 0.6,
2007
- cacheRead: 0.08,
2134
+ cacheRead: 0.075,
2008
2135
  cacheWrite: 0,
2009
2136
  },
2010
2137
  contextWindow: 128000,
@@ -2130,7 +2257,7 @@ export const MODELS = {
2130
2257
  cost: {
2131
2258
  input: 1.25,
2132
2259
  output: 10,
2133
- cacheRead: 0.13,
2260
+ cacheRead: 0.125,
2134
2261
  cacheWrite: 0,
2135
2262
  },
2136
2263
  contextWindow: 400000,
@@ -2431,7 +2558,7 @@ export const MODELS = {
2431
2558
  provider: "azure-openai-responses",
2432
2559
  baseUrl: "",
2433
2560
  reasoning: true,
2434
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
2561
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
2435
2562
  input: ["text", "image"],
2436
2563
  cost: {
2437
2564
  input: 30,
@@ -2555,7 +2682,7 @@ export const MODELS = {
2555
2682
  cost: {
2556
2683
  input: 1.1,
2557
2684
  output: 4.4,
2558
- cacheRead: 0.28,
2685
+ cacheRead: 0.275,
2559
2686
  cacheWrite: 0,
2560
2687
  },
2561
2688
  contextWindow: 200000,
@@ -2614,23 +2741,6 @@ export const MODELS = {
2614
2741
  contextWindow: 32000,
2615
2742
  maxTokens: 8000,
2616
2743
  },
2617
- "qwen-3-235b-a22b-instruct-2507": {
2618
- id: "qwen-3-235b-a22b-instruct-2507",
2619
- name: "Qwen 3 235B Instruct",
2620
- api: "openai-completions",
2621
- provider: "cerebras",
2622
- baseUrl: "https://api.cerebras.ai/v1",
2623
- reasoning: false,
2624
- input: ["text"],
2625
- cost: {
2626
- input: 0.6,
2627
- output: 1.2,
2628
- cacheRead: 0,
2629
- cacheWrite: 0,
2630
- },
2631
- contextWindow: 131000,
2632
- maxTokens: 32000,
2633
- },
2634
2744
  "zai-glm-4.7": {
2635
2745
  id: "zai-glm-4.7",
2636
2746
  name: "Z.AI GLM-4.7",
@@ -2845,7 +2955,26 @@ export const MODELS = {
2845
2955
  api: "anthropic-messages",
2846
2956
  provider: "cloudflare-ai-gateway",
2847
2957
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2848
- compat: { "forceAdaptiveThinking": true },
2958
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
2959
+ reasoning: true,
2960
+ thinkingLevelMap: { "xhigh": "xhigh" },
2961
+ input: ["text", "image"],
2962
+ cost: {
2963
+ input: 5,
2964
+ output: 25,
2965
+ cacheRead: 0.5,
2966
+ cacheWrite: 6.25,
2967
+ },
2968
+ contextWindow: 1000000,
2969
+ maxTokens: 128000,
2970
+ },
2971
+ "claude-opus-4-8": {
2972
+ id: "claude-opus-4-8",
2973
+ name: "Claude Opus 4.8",
2974
+ api: "anthropic-messages",
2975
+ provider: "cloudflare-ai-gateway",
2976
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2977
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
2849
2978
  reasoning: true,
2850
2979
  thinkingLevelMap: { "xhigh": "xhigh" },
2851
2980
  input: ["text", "image"],
@@ -3353,24 +3482,6 @@ export const MODELS = {
3353
3482
  contextWindow: 128000,
3354
3483
  maxTokens: 128000,
3355
3484
  },
3356
- "@cf/moonshotai/kimi-k2.5": {
3357
- id: "@cf/moonshotai/kimi-k2.5",
3358
- name: "Kimi K2.5",
3359
- api: "openai-completions",
3360
- provider: "cloudflare-workers-ai",
3361
- baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3362
- compat: { "sendSessionAffinityHeaders": true },
3363
- reasoning: true,
3364
- input: ["text", "image"],
3365
- cost: {
3366
- input: 0.6,
3367
- output: 3,
3368
- cacheRead: 0.1,
3369
- cacheWrite: 0,
3370
- },
3371
- contextWindow: 256000,
3372
- maxTokens: 256000,
3373
- },
3374
3485
  "@cf/moonshotai/kimi-k2.6": {
3375
3486
  id: "@cf/moonshotai/kimi-k2.6",
3376
3487
  name: "Kimi K2.6",
@@ -3755,8 +3866,8 @@ export const MODELS = {
3755
3866
  cacheRead: 0,
3756
3867
  cacheWrite: 0,
3757
3868
  },
3758
- contextWindow: 144000,
3759
- maxTokens: 32000,
3869
+ contextWindow: 200000,
3870
+ maxTokens: 64000,
3760
3871
  },
3761
3872
  "claude-opus-4.5": {
3762
3873
  id: "claude-opus-4.5",
@@ -3773,7 +3884,7 @@ export const MODELS = {
3773
3884
  cacheRead: 0,
3774
3885
  cacheWrite: 0,
3775
3886
  },
3776
- contextWindow: 160000,
3887
+ contextWindow: 200000,
3777
3888
  maxTokens: 32000,
3778
3889
  },
3779
3890
  "claude-opus-4.6": {
@@ -3794,7 +3905,7 @@ export const MODELS = {
3794
3905
  cacheWrite: 0,
3795
3906
  },
3796
3907
  contextWindow: 1000000,
3797
- maxTokens: 64000,
3908
+ maxTokens: 32000,
3798
3909
  },
3799
3910
  "claude-opus-4.7": {
3800
3911
  id: "claude-opus-4.7",
@@ -3803,7 +3914,27 @@ export const MODELS = {
3803
3914
  provider: "github-copilot",
3804
3915
  baseUrl: "https://api.individual.githubcopilot.com",
3805
3916
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3806
- compat: { "forceAdaptiveThinking": true },
3917
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3918
+ reasoning: true,
3919
+ thinkingLevelMap: { "xhigh": "xhigh" },
3920
+ input: ["text", "image"],
3921
+ cost: {
3922
+ input: 0,
3923
+ output: 0,
3924
+ cacheRead: 0,
3925
+ cacheWrite: 0,
3926
+ },
3927
+ contextWindow: 200000,
3928
+ maxTokens: 32000,
3929
+ },
3930
+ "claude-opus-4.8": {
3931
+ id: "claude-opus-4.8",
3932
+ name: "Claude Opus 4.8",
3933
+ api: "anthropic-messages",
3934
+ provider: "github-copilot",
3935
+ baseUrl: "https://api.individual.githubcopilot.com",
3936
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3937
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3807
3938
  reasoning: true,
3808
3939
  thinkingLevelMap: { "xhigh": "xhigh" },
3809
3940
  input: ["text", "image"],
@@ -3813,7 +3944,7 @@ export const MODELS = {
3813
3944
  cacheRead: 0,
3814
3945
  cacheWrite: 0,
3815
3946
  },
3816
- contextWindow: 144000,
3947
+ contextWindow: 200000,
3817
3948
  maxTokens: 64000,
3818
3949
  },
3819
3950
  "claude-sonnet-4.5": {
@@ -3832,7 +3963,7 @@ export const MODELS = {
3832
3963
  cacheRead: 0,
3833
3964
  cacheWrite: 0,
3834
3965
  },
3835
- contextWindow: 144000,
3966
+ contextWindow: 200000,
3836
3967
  maxTokens: 32000,
3837
3968
  },
3838
3969
  "claude-sonnet-4.6": {
@@ -3908,7 +4039,7 @@ export const MODELS = {
3908
4039
  cacheRead: 0,
3909
4040
  cacheWrite: 0,
3910
4041
  },
3911
- contextWindow: 128000,
4042
+ contextWindow: 200000,
3912
4043
  maxTokens: 64000,
3913
4044
  },
3914
4045
  "gemini-3.5-flash": {
@@ -3927,7 +4058,7 @@ export const MODELS = {
3927
4058
  cacheRead: 0,
3928
4059
  cacheWrite: 0,
3929
4060
  },
3930
- contextWindow: 128000,
4061
+ contextWindow: 200000,
3931
4062
  maxTokens: 64000,
3932
4063
  },
3933
4064
  "gpt-4.1": {
@@ -4003,8 +4134,8 @@ export const MODELS = {
4003
4134
  cacheRead: 0,
4004
4135
  cacheWrite: 0,
4005
4136
  },
4006
- contextWindow: 264000,
4007
- maxTokens: 64000,
4137
+ contextWindow: 400000,
4138
+ maxTokens: 128000,
4008
4139
  },
4009
4140
  "gpt-5.2-codex": {
4010
4141
  id: "gpt-5.2-codex",
@@ -4847,7 +4978,7 @@ export const MODELS = {
4847
4978
  cost: {
4848
4979
  input: 1,
4849
4980
  output: 3,
4850
- cacheRead: 0,
4981
+ cacheRead: 0.5,
4851
4982
  cacheWrite: 0,
4852
4983
  },
4853
4984
  contextWindow: 262144,
@@ -4864,7 +4995,7 @@ export const MODELS = {
4864
4995
  cost: {
4865
4996
  input: 0.15,
4866
4997
  output: 0.6,
4867
- cacheRead: 0,
4998
+ cacheRead: 0.075,
4868
4999
  cacheWrite: 0,
4869
5000
  },
4870
5001
  contextWindow: 131072,
@@ -4881,7 +5012,7 @@ export const MODELS = {
4881
5012
  cost: {
4882
5013
  input: 0.075,
4883
5014
  output: 0.3,
4884
- cacheRead: 0,
5015
+ cacheRead: 0.0375,
4885
5016
  cacheWrite: 0,
4886
5017
  },
4887
5018
  contextWindow: 131072,
@@ -5167,9 +5298,9 @@ export const MODELS = {
5167
5298
  reasoning: true,
5168
5299
  input: ["text"],
5169
5300
  cost: {
5170
- input: 1.74,
5171
- output: 3.48,
5172
- cacheRead: 0.145,
5301
+ input: 0.435,
5302
+ output: 0.87,
5303
+ cacheRead: 0.003625,
5173
5304
  cacheWrite: 0,
5174
5305
  },
5175
5306
  contextWindow: 1048576,
@@ -5376,6 +5507,26 @@ export const MODELS = {
5376
5507
  maxTokens: 32768,
5377
5508
  },
5378
5509
  },
5510
+ "llama-cpp": {
5511
+ "local": {
5512
+ id: "local",
5513
+ name: "llama.cpp local server",
5514
+ api: "openai-completions",
5515
+ provider: "llama-cpp",
5516
+ baseUrl: "http://127.0.0.1:8080/v1",
5517
+ compat: { "supportsDeveloperRole": false, "supportsStore": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
5518
+ reasoning: false,
5519
+ input: ["text"],
5520
+ cost: {
5521
+ input: 0,
5522
+ output: 0,
5523
+ cacheRead: 0,
5524
+ cacheWrite: 0,
5525
+ },
5526
+ contextWindow: 32768,
5527
+ maxTokens: 4096,
5528
+ },
5529
+ },
5379
5530
  "minimax": {
5380
5531
  "MiniMax-M2.7": {
5381
5532
  id: "MiniMax-M2.7",
@@ -6262,7 +6413,7 @@ export const MODELS = {
6262
6413
  cost: {
6263
6414
  input: 0.1,
6264
6415
  output: 0.4,
6265
- cacheRead: 0.03,
6416
+ cacheRead: 0.025,
6266
6417
  cacheWrite: 0,
6267
6418
  },
6268
6419
  contextWindow: 1047576,
@@ -6347,7 +6498,7 @@ export const MODELS = {
6347
6498
  cost: {
6348
6499
  input: 0.15,
6349
6500
  output: 0.6,
6350
- cacheRead: 0.08,
6501
+ cacheRead: 0.075,
6351
6502
  cacheWrite: 0,
6352
6503
  },
6353
6504
  contextWindow: 128000,
@@ -6473,7 +6624,7 @@ export const MODELS = {
6473
6624
  cost: {
6474
6625
  input: 1.25,
6475
6626
  output: 10,
6476
- cacheRead: 0.13,
6627
+ cacheRead: 0.125,
6477
6628
  cacheWrite: 0,
6478
6629
  },
6479
6630
  contextWindow: 400000,
@@ -6756,7 +6907,7 @@ export const MODELS = {
6756
6907
  provider: "openai",
6757
6908
  baseUrl: "https://api.openai.com/v1",
6758
6909
  reasoning: true,
6759
- thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
6910
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh", "minimal": null },
6760
6911
  input: ["text", "image"],
6761
6912
  cost: {
6762
6913
  input: 5,
@@ -6774,7 +6925,7 @@ export const MODELS = {
6774
6925
  provider: "openai",
6775
6926
  baseUrl: "https://api.openai.com/v1",
6776
6927
  reasoning: true,
6777
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6928
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
6778
6929
  input: ["text", "image"],
6779
6930
  cost: {
6780
6931
  input: 30,
@@ -6898,7 +7049,7 @@ export const MODELS = {
6898
7049
  cost: {
6899
7050
  input: 1.1,
6900
7051
  output: 4.4,
6901
- cacheRead: 0.28,
7052
+ cacheRead: 0.275,
6902
7053
  cacheWrite: 0,
6903
7054
  },
6904
7055
  contextWindow: 200000,
@@ -7048,7 +7199,7 @@ export const MODELS = {
7048
7199
  cacheWrite: 0,
7049
7200
  },
7050
7201
  contextWindow: 200000,
7051
- maxTokens: 128000,
7202
+ maxTokens: 32000,
7052
7203
  },
7053
7204
  "claude-haiku-4-5": {
7054
7205
  id: "claude-haiku-4-5",
@@ -7126,7 +7277,7 @@ export const MODELS = {
7126
7277
  api: "anthropic-messages",
7127
7278
  provider: "opencode",
7128
7279
  baseUrl: "https://opencode.ai/zen",
7129
- compat: { "forceAdaptiveThinking": true },
7280
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7130
7281
  reasoning: true,
7131
7282
  thinkingLevelMap: { "xhigh": "xhigh" },
7132
7283
  input: ["text", "image"],
@@ -7139,9 +7290,28 @@ export const MODELS = {
7139
7290
  contextWindow: 1000000,
7140
7291
  maxTokens: 128000,
7141
7292
  },
7142
- "claude-sonnet-4": {
7143
- id: "claude-sonnet-4",
7144
- name: "Claude Sonnet 4",
7293
+ "claude-opus-4-8": {
7294
+ id: "claude-opus-4-8",
7295
+ name: "Claude Opus 4.8",
7296
+ api: "anthropic-messages",
7297
+ provider: "opencode",
7298
+ baseUrl: "https://opencode.ai/zen",
7299
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7300
+ reasoning: true,
7301
+ thinkingLevelMap: { "xhigh": "xhigh" },
7302
+ input: ["text", "image"],
7303
+ cost: {
7304
+ input: 5,
7305
+ output: 25,
7306
+ cacheRead: 0.5,
7307
+ cacheWrite: 6.25,
7308
+ },
7309
+ contextWindow: 1000000,
7310
+ maxTokens: 128000,
7311
+ },
7312
+ "claude-sonnet-4": {
7313
+ id: "claude-sonnet-4",
7314
+ name: "Claude Sonnet 4",
7145
7315
  api: "anthropic-messages",
7146
7316
  provider: "opencode",
7147
7317
  baseUrl: "https://opencode.ai/zen",
@@ -7191,6 +7361,25 @@ export const MODELS = {
7191
7361
  contextWindow: 1000000,
7192
7362
  maxTokens: 64000,
7193
7363
  },
7364
+ "deepseek-v4-flash": {
7365
+ id: "deepseek-v4-flash",
7366
+ name: "DeepSeek V4 Flash",
7367
+ api: "openai-completions",
7368
+ provider: "opencode",
7369
+ baseUrl: "https://opencode.ai/zen/v1",
7370
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7371
+ reasoning: true,
7372
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7373
+ input: ["text"],
7374
+ cost: {
7375
+ input: 0.14,
7376
+ output: 0.28,
7377
+ cacheRead: 0.03,
7378
+ cacheWrite: 0,
7379
+ },
7380
+ contextWindow: 1000000,
7381
+ maxTokens: 384000,
7382
+ },
7194
7383
  "deepseek-v4-flash-free": {
7195
7384
  id: "deepseek-v4-flash-free",
7196
7385
  name: "DeepSeek V4 Flash Free",
@@ -7575,7 +7764,7 @@ export const MODELS = {
7575
7764
  provider: "opencode",
7576
7765
  baseUrl: "https://opencode.ai/zen/v1",
7577
7766
  reasoning: true,
7578
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
7767
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
7579
7768
  input: ["text", "image"],
7580
7769
  cost: {
7581
7770
  input: 30,
@@ -7592,7 +7781,9 @@ export const MODELS = {
7592
7781
  api: "openai-completions",
7593
7782
  provider: "opencode",
7594
7783
  baseUrl: "https://opencode.ai/zen/v1",
7784
+ compat: { "supportsReasoningEffort": false },
7595
7785
  reasoning: true,
7786
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
7596
7787
  input: ["text", "image"],
7597
7788
  cost: {
7598
7789
  input: 1,
@@ -7626,6 +7817,7 @@ export const MODELS = {
7626
7817
  api: "openai-completions",
7627
7818
  provider: "opencode",
7628
7819
  baseUrl: "https://opencode.ai/zen/v1",
7820
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
7629
7821
  reasoning: true,
7630
7822
  input: ["text", "image"],
7631
7823
  cost: {
@@ -7637,6 +7829,23 @@ export const MODELS = {
7637
7829
  contextWindow: 262144,
7638
7830
  maxTokens: 65536,
7639
7831
  },
7832
+ "mimo-v2.5-free": {
7833
+ id: "mimo-v2.5-free",
7834
+ name: "MiMo V2.5 Free",
7835
+ api: "openai-completions",
7836
+ provider: "opencode",
7837
+ baseUrl: "https://opencode.ai/zen/v1",
7838
+ reasoning: true,
7839
+ input: ["text", "image"],
7840
+ cost: {
7841
+ input: 0,
7842
+ output: 0,
7843
+ cacheRead: 0,
7844
+ cacheWrite: 0,
7845
+ },
7846
+ contextWindow: 200000,
7847
+ maxTokens: 32000,
7848
+ },
7640
7849
  "minimax-m2.5": {
7641
7850
  id: "minimax-m2.5",
7642
7851
  name: "MiniMax M2.5",
@@ -7671,6 +7880,23 @@ export const MODELS = {
7671
7880
  contextWindow: 204800,
7672
7881
  maxTokens: 131072,
7673
7882
  },
7883
+ "minimax-m3-free": {
7884
+ id: "minimax-m3-free",
7885
+ name: "MiniMax M3 Free",
7886
+ api: "anthropic-messages",
7887
+ provider: "opencode",
7888
+ baseUrl: "https://opencode.ai/zen",
7889
+ reasoning: true,
7890
+ input: ["text", "image"],
7891
+ cost: {
7892
+ input: 0,
7893
+ output: 0,
7894
+ cacheRead: 0,
7895
+ cacheWrite: 0,
7896
+ },
7897
+ contextWindow: 200000,
7898
+ maxTokens: 32000,
7899
+ },
7674
7900
  "nemotron-3-super-free": {
7675
7901
  id: "nemotron-3-super-free",
7676
7902
  name: "Nemotron 3 Super Free",
@@ -7819,7 +8045,9 @@ export const MODELS = {
7819
8045
  api: "openai-completions",
7820
8046
  provider: "opencode-go",
7821
8047
  baseUrl: "https://opencode.ai/zen/go/v1",
8048
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
7822
8049
  reasoning: true,
8050
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
7823
8051
  input: ["text", "image"],
7824
8052
  cost: {
7825
8053
  input: 0.95,
@@ -7839,9 +8067,9 @@ export const MODELS = {
7839
8067
  reasoning: true,
7840
8068
  input: ["text", "image"],
7841
8069
  cost: {
7842
- input: 0.4,
7843
- output: 2,
7844
- cacheRead: 0.08,
8070
+ input: 0.14,
8071
+ output: 0.28,
8072
+ cacheRead: 0.0028,
7845
8073
  cacheWrite: 0,
7846
8074
  },
7847
8075
  contextWindow: 1000000,
@@ -7856,9 +8084,9 @@ export const MODELS = {
7856
8084
  reasoning: true,
7857
8085
  input: ["text"],
7858
8086
  cost: {
7859
- input: 1,
7860
- output: 3,
7861
- cacheRead: 0.2,
8087
+ input: 1.74,
8088
+ output: 3.48,
8089
+ cacheRead: 0.0145,
7862
8090
  cacheWrite: 0,
7863
8091
  },
7864
8092
  contextWindow: 1048576,
@@ -7898,23 +8126,22 @@ export const MODELS = {
7898
8126
  contextWindow: 204800,
7899
8127
  maxTokens: 131072,
7900
8128
  },
7901
- "qwen3.5-plus": {
7902
- id: "qwen3.5-plus",
7903
- name: "Qwen3.5 Plus",
7904
- api: "openai-completions",
8129
+ "minimax-m3": {
8130
+ id: "minimax-m3",
8131
+ name: "MiniMax M3",
8132
+ api: "anthropic-messages",
7905
8133
  provider: "opencode-go",
7906
- baseUrl: "https://opencode.ai/zen/go/v1",
7907
- compat: { "thinkingFormat": "qwen" },
8134
+ baseUrl: "https://opencode.ai/zen/go",
7908
8135
  reasoning: true,
7909
8136
  input: ["text", "image"],
7910
8137
  cost: {
7911
- input: 0.2,
7912
- output: 1.2,
7913
- cacheRead: 0.02,
7914
- cacheWrite: 0.25,
8138
+ input: 0.6,
8139
+ output: 2.4,
8140
+ cacheRead: 0.12,
8141
+ cacheWrite: 0,
7915
8142
  },
7916
- contextWindow: 262144,
7917
- maxTokens: 65536,
8143
+ contextWindow: 512000,
8144
+ maxTokens: 131072,
7918
8145
  },
7919
8146
  "qwen3.6-plus": {
7920
8147
  id: "qwen3.6-plus",
@@ -7934,6 +8161,23 @@ export const MODELS = {
7934
8161
  contextWindow: 262144,
7935
8162
  maxTokens: 65536,
7936
8163
  },
8164
+ "qwen3.7-max": {
8165
+ id: "qwen3.7-max",
8166
+ name: "Qwen3.7 Max",
8167
+ api: "anthropic-messages",
8168
+ provider: "opencode-go",
8169
+ baseUrl: "https://opencode.ai/zen/go",
8170
+ reasoning: true,
8171
+ input: ["text"],
8172
+ cost: {
8173
+ input: 2.5,
8174
+ output: 7.5,
8175
+ cacheRead: 0.5,
8176
+ cacheWrite: 3.125,
8177
+ },
8178
+ contextWindow: 1000000,
8179
+ maxTokens: 65536,
8180
+ },
7937
8181
  },
7938
8182
  "openrouter": {
7939
8183
  "ai21/jamba-large-1.7": {
@@ -7953,23 +8197,6 @@ export const MODELS = {
7953
8197
  contextWindow: 256000,
7954
8198
  maxTokens: 4096,
7955
8199
  },
7956
- "alibaba/tongyi-deepresearch-30b-a3b": {
7957
- id: "alibaba/tongyi-deepresearch-30b-a3b",
7958
- name: "Tongyi DeepResearch 30B A3B",
7959
- api: "openai-completions",
7960
- provider: "openrouter",
7961
- baseUrl: "https://openrouter.ai/api/v1",
7962
- reasoning: true,
7963
- input: ["text"],
7964
- cost: {
7965
- input: 0.09,
7966
- output: 0.44999999999999996,
7967
- cacheRead: 0.09,
7968
- cacheWrite: 0,
7969
- },
7970
- contextWindow: 131072,
7971
- maxTokens: 131072,
7972
- },
7973
8200
  "amazon/nova-2-lite-v1": {
7974
8201
  id: "amazon/nova-2-lite-v1",
7975
8202
  name: "Amazon: Nova 2 Lite",
@@ -8229,6 +8456,42 @@ export const MODELS = {
8229
8456
  contextWindow: 1000000,
8230
8457
  maxTokens: 128000,
8231
8458
  },
8459
+ "anthropic/claude-opus-4.8": {
8460
+ id: "anthropic/claude-opus-4.8",
8461
+ name: "Anthropic: Claude Opus 4.8",
8462
+ api: "openai-completions",
8463
+ provider: "openrouter",
8464
+ baseUrl: "https://openrouter.ai/api/v1",
8465
+ reasoning: true,
8466
+ thinkingLevelMap: { "xhigh": "xhigh" },
8467
+ input: ["text", "image"],
8468
+ cost: {
8469
+ input: 5,
8470
+ output: 25,
8471
+ cacheRead: 0.5,
8472
+ cacheWrite: 6.25,
8473
+ },
8474
+ contextWindow: 1000000,
8475
+ maxTokens: 128000,
8476
+ },
8477
+ "anthropic/claude-opus-4.8-fast": {
8478
+ id: "anthropic/claude-opus-4.8-fast",
8479
+ name: "Anthropic: Claude Opus 4.8 (Fast)",
8480
+ api: "openai-completions",
8481
+ provider: "openrouter",
8482
+ baseUrl: "https://openrouter.ai/api/v1",
8483
+ reasoning: true,
8484
+ thinkingLevelMap: { "xhigh": "xhigh" },
8485
+ input: ["text", "image"],
8486
+ cost: {
8487
+ input: 10,
8488
+ output: 50,
8489
+ cacheRead: 1,
8490
+ cacheWrite: 12.5,
8491
+ },
8492
+ contextWindow: 1000000,
8493
+ maxTokens: 128000,
8494
+ },
8232
8495
  "anthropic/claude-sonnet-4": {
8233
8496
  id: "anthropic/claude-sonnet-4",
8234
8497
  name: "Anthropic: Claude Sonnet 4",
@@ -8297,23 +8560,6 @@ export const MODELS = {
8297
8560
  contextWindow: 262144,
8298
8561
  maxTokens: 262144,
8299
8562
  },
8300
- "arcee-ai/trinity-large-thinking:free": {
8301
- id: "arcee-ai/trinity-large-thinking:free",
8302
- name: "Arcee AI: Trinity Large Thinking (free)",
8303
- api: "openai-completions",
8304
- provider: "openrouter",
8305
- baseUrl: "https://openrouter.ai/api/v1",
8306
- reasoning: true,
8307
- input: ["text"],
8308
- cost: {
8309
- input: 0,
8310
- output: 0,
8311
- cacheRead: 0,
8312
- cacheWrite: 0,
8313
- },
8314
- contextWindow: 262144,
8315
- maxTokens: 80000,
8316
- },
8317
8563
  "arcee-ai/trinity-mini": {
8318
8564
  id: "arcee-ai/trinity-mini",
8319
8565
  name: "Arcee AI: Trinity Mini",
@@ -8365,40 +8611,6 @@ export const MODELS = {
8365
8611
  contextWindow: 2000000,
8366
8612
  maxTokens: 30000,
8367
8613
  },
8368
- "baidu/cobuddy:free": {
8369
- id: "baidu/cobuddy:free",
8370
- name: "Baidu Qianfan: CoBuddy (free)",
8371
- api: "openai-completions",
8372
- provider: "openrouter",
8373
- baseUrl: "https://openrouter.ai/api/v1",
8374
- reasoning: true,
8375
- input: ["text"],
8376
- cost: {
8377
- input: 0,
8378
- output: 0,
8379
- cacheRead: 0,
8380
- cacheWrite: 0,
8381
- },
8382
- contextWindow: 131072,
8383
- maxTokens: 65536,
8384
- },
8385
- "baidu/ernie-4.5-21b-a3b": {
8386
- id: "baidu/ernie-4.5-21b-a3b",
8387
- name: "Baidu: ERNIE 4.5 21B A3B",
8388
- api: "openai-completions",
8389
- provider: "openrouter",
8390
- baseUrl: "https://openrouter.ai/api/v1",
8391
- reasoning: false,
8392
- input: ["text"],
8393
- cost: {
8394
- input: 0.07,
8395
- output: 0.28,
8396
- cacheRead: 0,
8397
- cacheWrite: 0,
8398
- },
8399
- contextWindow: 131072,
8400
- maxTokens: 8000,
8401
- },
8402
8614
  "baidu/ernie-4.5-vl-28b-a3b": {
8403
8615
  id: "baidu/ernie-4.5-vl-28b-a3b",
8404
8616
  name: "Baidu: ERNIE 4.5 VL 28B A3B",
@@ -8527,13 +8739,13 @@ export const MODELS = {
8527
8739
  reasoning: false,
8528
8740
  input: ["text"],
8529
8741
  cost: {
8530
- input: 0.32,
8531
- output: 0.8899999999999999,
8742
+ input: 0.2288,
8743
+ output: 0.9144,
8532
8744
  cacheRead: 0,
8533
8745
  cacheWrite: 0,
8534
8746
  },
8535
- contextWindow: 163840,
8536
- maxTokens: 16384,
8747
+ contextWindow: 131072,
8748
+ maxTokens: 16000,
8537
8749
  },
8538
8750
  "deepseek/deepseek-chat-v3-0324": {
8539
8751
  id: "deepseek/deepseek-chat-v3-0324",
@@ -8660,37 +8872,18 @@ export const MODELS = {
8660
8872
  api: "openai-completions",
8661
8873
  provider: "openrouter",
8662
8874
  baseUrl: "https://openrouter.ai/api/v1",
8663
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8875
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8664
8876
  reasoning: true,
8665
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8877
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8666
8878
  input: ["text"],
8667
8879
  cost: {
8668
- input: 0.09999999999999999,
8669
- output: 0.19999999999999998,
8670
- cacheRead: 0.02,
8880
+ input: 0.0983,
8881
+ output: 0.1966,
8882
+ cacheRead: 0.019700000000000002,
8671
8883
  cacheWrite: 0,
8672
8884
  },
8673
8885
  contextWindow: 1048576,
8674
- maxTokens: 16384,
8675
- },
8676
- "deepseek/deepseek-v4-flash:free": {
8677
- id: "deepseek/deepseek-v4-flash:free",
8678
- name: "DeepSeek: DeepSeek V4 Flash (free)",
8679
- api: "openai-completions",
8680
- provider: "openrouter",
8681
- baseUrl: "https://openrouter.ai/api/v1",
8682
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8683
- reasoning: true,
8684
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8685
- input: ["text"],
8686
- cost: {
8687
- input: 0,
8688
- output: 0,
8689
- cacheRead: 0,
8690
- cacheWrite: 0,
8691
- },
8692
- contextWindow: 1048576,
8693
- maxTokens: 384000,
8886
+ maxTokens: 131072,
8694
8887
  },
8695
8888
  "deepseek/deepseek-v4-pro": {
8696
8889
  id: "deepseek/deepseek-v4-pro",
@@ -8698,9 +8891,9 @@ export const MODELS = {
8698
8891
  api: "openai-completions",
8699
8892
  provider: "openrouter",
8700
8893
  baseUrl: "https://openrouter.ai/api/v1",
8701
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8894
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8702
8895
  reasoning: true,
8703
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8896
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8704
8897
  input: ["text"],
8705
8898
  cost: {
8706
8899
  input: 0.435,
@@ -8742,7 +8935,7 @@ export const MODELS = {
8742
8935
  cacheRead: 0.024999999999999998,
8743
8936
  cacheWrite: 0.08333333333333334,
8744
8937
  },
8745
- contextWindow: 1000000,
8938
+ contextWindow: 1048576,
8746
8939
  maxTokens: 8192,
8747
8940
  },
8748
8941
  "google/gemini-2.0-flash-lite-001": {
@@ -9146,9 +9339,9 @@ export const MODELS = {
9146
9339
  reasoning: true,
9147
9340
  input: ["text"],
9148
9341
  cost: {
9149
- input: 0.075,
9150
- output: 0.625,
9151
- cacheRead: 0.015,
9342
+ input: 0.3,
9343
+ output: 2.5,
9344
+ cacheRead: 0.06,
9152
9345
  cacheWrite: 0,
9153
9346
  },
9154
9347
  contextWindow: 262144,
@@ -9239,6 +9432,23 @@ export const MODELS = {
9239
9432
  contextWindow: 131072,
9240
9433
  maxTokens: 4096,
9241
9434
  },
9435
+ "meta-llama/llama-4-maverick": {
9436
+ id: "meta-llama/llama-4-maverick",
9437
+ name: "Meta: Llama 4 Maverick",
9438
+ api: "openai-completions",
9439
+ provider: "openrouter",
9440
+ baseUrl: "https://openrouter.ai/api/v1",
9441
+ reasoning: false,
9442
+ input: ["text", "image"],
9443
+ cost: {
9444
+ input: 0.15,
9445
+ output: 0.6,
9446
+ cacheRead: 0,
9447
+ cacheWrite: 0,
9448
+ },
9449
+ contextWindow: 1048576,
9450
+ maxTokens: 16384,
9451
+ },
9242
9452
  "meta-llama/llama-4-scout": {
9243
9453
  id: "meta-llama/llama-4-scout",
9244
9454
  name: "Meta: Llama 4 Scout",
@@ -9324,39 +9534,39 @@ export const MODELS = {
9324
9534
  contextWindow: 204800,
9325
9535
  maxTokens: 196608,
9326
9536
  },
9327
- "minimax/minimax-m2.5:free": {
9328
- id: "minimax/minimax-m2.5:free",
9329
- name: "MiniMax: MiniMax M2.5 (free)",
9537
+ "minimax/minimax-m2.7": {
9538
+ id: "minimax/minimax-m2.7",
9539
+ name: "MiniMax: MiniMax M2.7",
9330
9540
  api: "openai-completions",
9331
9541
  provider: "openrouter",
9332
9542
  baseUrl: "https://openrouter.ai/api/v1",
9333
9543
  reasoning: true,
9334
9544
  input: ["text"],
9335
9545
  cost: {
9336
- input: 0,
9337
- output: 0,
9546
+ input: 0.26,
9547
+ output: 1.2,
9338
9548
  cacheRead: 0,
9339
9549
  cacheWrite: 0,
9340
9550
  },
9341
9551
  contextWindow: 204800,
9342
- maxTokens: 8192,
9552
+ maxTokens: 4096,
9343
9553
  },
9344
- "minimax/minimax-m2.7": {
9345
- id: "minimax/minimax-m2.7",
9346
- name: "MiniMax: MiniMax M2.7",
9554
+ "minimax/minimax-m3": {
9555
+ id: "minimax/minimax-m3",
9556
+ name: "MiniMax: MiniMax M3",
9347
9557
  api: "openai-completions",
9348
9558
  provider: "openrouter",
9349
9559
  baseUrl: "https://openrouter.ai/api/v1",
9350
9560
  reasoning: true,
9351
- input: ["text"],
9561
+ input: ["text", "image"],
9352
9562
  cost: {
9353
- input: 0.27899999999999997,
9563
+ input: 0.3,
9354
9564
  output: 1.2,
9355
- cacheRead: 0,
9565
+ cacheRead: 0.06,
9356
9566
  cacheWrite: 0,
9357
9567
  },
9358
- contextWindow: 204800,
9359
- maxTokens: 131072,
9568
+ contextWindow: 1048576,
9569
+ maxTokens: 512000,
9360
9570
  },
9361
9571
  "mistralai/codestral-2508": {
9362
9572
  id: "mistralai/codestral-2508",
@@ -9392,40 +9602,6 @@ export const MODELS = {
9392
9602
  contextWindow: 262144,
9393
9603
  maxTokens: 4096,
9394
9604
  },
9395
- "mistralai/devstral-medium": {
9396
- id: "mistralai/devstral-medium",
9397
- name: "Mistral: Devstral Medium",
9398
- api: "openai-completions",
9399
- provider: "openrouter",
9400
- baseUrl: "https://openrouter.ai/api/v1",
9401
- reasoning: false,
9402
- input: ["text"],
9403
- cost: {
9404
- input: 0.39999999999999997,
9405
- output: 2,
9406
- cacheRead: 0.04,
9407
- cacheWrite: 0,
9408
- },
9409
- contextWindow: 131072,
9410
- maxTokens: 4096,
9411
- },
9412
- "mistralai/devstral-small": {
9413
- id: "mistralai/devstral-small",
9414
- name: "Mistral: Devstral Small 1.1",
9415
- api: "openai-completions",
9416
- provider: "openrouter",
9417
- baseUrl: "https://openrouter.ai/api/v1",
9418
- reasoning: false,
9419
- input: ["text"],
9420
- cost: {
9421
- input: 0.09999999999999999,
9422
- output: 0.3,
9423
- cacheRead: 0.01,
9424
- cacheWrite: 0,
9425
- },
9426
- contextWindow: 131072,
9427
- maxTokens: 4096,
9428
- },
9429
9605
  "mistralai/ministral-14b-2512": {
9430
9606
  id: "mistralai/ministral-14b-2512",
9431
9607
  name: "Mistral: Ministral 3 14B 2512",
@@ -9511,23 +9687,6 @@ export const MODELS = {
9511
9687
  contextWindow: 131072,
9512
9688
  maxTokens: 4096,
9513
9689
  },
9514
- "mistralai/mistral-large-2411": {
9515
- id: "mistralai/mistral-large-2411",
9516
- name: "Mistral Large 2411",
9517
- api: "openai-completions",
9518
- provider: "openrouter",
9519
- baseUrl: "https://openrouter.ai/api/v1",
9520
- reasoning: false,
9521
- input: ["text"],
9522
- cost: {
9523
- input: 2,
9524
- output: 6,
9525
- cacheRead: 0.19999999999999998,
9526
- cacheWrite: 0,
9527
- },
9528
- contextWindow: 131072,
9529
- maxTokens: 4096,
9530
- },
9531
9690
  "mistralai/mistral-large-2512": {
9532
9691
  id: "mistralai/mistral-large-2512",
9533
9692
  name: "Mistral: Mistral Large 3 2512",
@@ -9681,23 +9840,6 @@ export const MODELS = {
9681
9840
  contextWindow: 65536,
9682
9841
  maxTokens: 4096,
9683
9842
  },
9684
- "mistralai/pixtral-large-2411": {
9685
- id: "mistralai/pixtral-large-2411",
9686
- name: "Mistral: Pixtral Large 2411",
9687
- api: "openai-completions",
9688
- provider: "openrouter",
9689
- baseUrl: "https://openrouter.ai/api/v1",
9690
- reasoning: false,
9691
- input: ["text", "image"],
9692
- cost: {
9693
- input: 2,
9694
- output: 6,
9695
- cacheRead: 0.19999999999999998,
9696
- cacheWrite: 0,
9697
- },
9698
- contextWindow: 131072,
9699
- maxTokens: 4096,
9700
- },
9701
9843
  "mistralai/voxtral-small-24b-2507": {
9702
9844
  id: "mistralai/voxtral-small-24b-2507",
9703
9845
  name: "Mistral: Voxtral Small 24B 2507",
@@ -9789,16 +9931,35 @@ export const MODELS = {
9789
9931
  api: "openai-completions",
9790
9932
  provider: "openrouter",
9791
9933
  baseUrl: "https://openrouter.ai/api/v1",
9934
+ compat: { "supportsDeveloperRole": false },
9792
9935
  reasoning: true,
9793
9936
  input: ["text", "image"],
9794
9937
  cost: {
9795
- input: 0.73,
9796
- output: 3.49,
9797
- cacheRead: 0.25,
9938
+ input: 0.684,
9939
+ output: 3.42,
9940
+ cacheRead: 0.144,
9798
9941
  cacheWrite: 0,
9799
9942
  },
9800
9943
  contextWindow: 262144,
9801
- maxTokens: 262142,
9944
+ maxTokens: 262144,
9945
+ },
9946
+ "moonshotai/kimi-k2.6:free": {
9947
+ id: "moonshotai/kimi-k2.6:free",
9948
+ name: "MoonshotAI: Kimi K2.6 (free)",
9949
+ api: "openai-completions",
9950
+ provider: "openrouter",
9951
+ baseUrl: "https://openrouter.ai/api/v1",
9952
+ compat: { "supportsDeveloperRole": false },
9953
+ reasoning: true,
9954
+ input: ["text", "image"],
9955
+ cost: {
9956
+ input: 0,
9957
+ output: 0,
9958
+ cacheRead: 0,
9959
+ cacheWrite: 0,
9960
+ },
9961
+ contextWindow: 262144,
9962
+ maxTokens: 4096,
9802
9963
  },
9803
9964
  "nex-agi/deepseek-v3.1-nex-n1": {
9804
9965
  id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -10225,23 +10386,6 @@ export const MODELS = {
10225
10386
  contextWindow: 128000,
10226
10387
  maxTokens: 16384,
10227
10388
  },
10228
- "openai/gpt-4o-audio-preview": {
10229
- id: "openai/gpt-4o-audio-preview",
10230
- name: "OpenAI: GPT-4o Audio",
10231
- api: "openai-completions",
10232
- provider: "openrouter",
10233
- baseUrl: "https://openrouter.ai/api/v1",
10234
- reasoning: false,
10235
- input: ["text"],
10236
- cost: {
10237
- input: 2.5,
10238
- output: 10,
10239
- cacheRead: 0,
10240
- cacheWrite: 0,
10241
- },
10242
- contextWindow: 128000,
10243
- maxTokens: 16384,
10244
- },
10245
10389
  "openai/gpt-4o-mini": {
10246
10390
  id: "openai/gpt-4o-mini",
10247
10391
  name: "OpenAI: GPT-4o-mini",
@@ -10389,11 +10533,11 @@ export const MODELS = {
10389
10533
  cost: {
10390
10534
  input: 1.25,
10391
10535
  output: 10,
10392
- cacheRead: 0.125,
10536
+ cacheRead: 0.13,
10393
10537
  cacheWrite: 0,
10394
10538
  },
10395
10539
  contextWindow: 128000,
10396
- maxTokens: 16384,
10540
+ maxTokens: 32000,
10397
10541
  },
10398
10542
  "openai/gpt-5.1-codex": {
10399
10543
  id: "openai/gpt-5.1-codex",
@@ -10406,7 +10550,7 @@ export const MODELS = {
10406
10550
  cost: {
10407
10551
  input: 1.25,
10408
10552
  output: 10,
10409
- cacheRead: 0.125,
10553
+ cacheRead: 0.13,
10410
10554
  cacheWrite: 0,
10411
10555
  },
10412
10556
  contextWindow: 400000,
@@ -10440,11 +10584,11 @@ export const MODELS = {
10440
10584
  cost: {
10441
10585
  input: 0.25,
10442
10586
  output: 2,
10443
- cacheRead: 0.03,
10587
+ cacheRead: 0.024999999999999998,
10444
10588
  cacheWrite: 0,
10445
10589
  },
10446
10590
  contextWindow: 400000,
10447
- maxTokens: 128000,
10591
+ maxTokens: 100000,
10448
10592
  },
10449
10593
  "openai/gpt-5.2": {
10450
10594
  id: "openai/gpt-5.2",
@@ -10480,7 +10624,7 @@ export const MODELS = {
10480
10624
  cacheWrite: 0,
10481
10625
  },
10482
10626
  contextWindow: 128000,
10483
- maxTokens: 32000,
10627
+ maxTokens: 16384,
10484
10628
  },
10485
10629
  "openai/gpt-5.2-codex": {
10486
10630
  id: "openai/gpt-5.2-codex",
@@ -10651,7 +10795,7 @@ export const MODELS = {
10651
10795
  provider: "openrouter",
10652
10796
  baseUrl: "https://openrouter.ai/api/v1",
10653
10797
  reasoning: true,
10654
- thinkingLevelMap: { "xhigh": "xhigh" },
10798
+ thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
10655
10799
  input: ["text", "image"],
10656
10800
  cost: {
10657
10801
  input: 30,
@@ -10756,13 +10900,13 @@ export const MODELS = {
10756
10900
  reasoning: true,
10757
10901
  input: ["text"],
10758
10902
  cost: {
10759
- input: 0.03,
10903
+ input: 0.029,
10760
10904
  output: 0.14,
10761
10905
  cacheRead: 0,
10762
10906
  cacheWrite: 0,
10763
10907
  },
10764
10908
  contextWindow: 131072,
10765
- maxTokens: 131072,
10909
+ maxTokens: 4096,
10766
10910
  },
10767
10911
  "openai/gpt-oss-20b:free": {
10768
10912
  id: "openai/gpt-oss-20b:free",
@@ -11016,8 +11160,8 @@ export const MODELS = {
11016
11160
  cacheRead: 0,
11017
11161
  cacheWrite: 0,
11018
11162
  },
11019
- contextWindow: 131072,
11020
- maxTokens: 8192,
11163
+ contextWindow: 262144,
11164
+ maxTokens: 32768,
11021
11165
  },
11022
11166
  "poolside/laguna-xs.2:free": {
11023
11167
  id: "poolside/laguna-xs.2:free",
@@ -11033,8 +11177,8 @@ export const MODELS = {
11033
11177
  cacheRead: 0,
11034
11178
  cacheWrite: 0,
11035
11179
  },
11036
- contextWindow: 131072,
11037
- maxTokens: 8192,
11180
+ contextWindow: 262144,
11181
+ maxTokens: 32768,
11038
11182
  },
11039
11183
  "prime-intellect/intellect-3": {
11040
11184
  id: "prime-intellect/intellect-3",
@@ -11045,47 +11189,30 @@ export const MODELS = {
11045
11189
  reasoning: true,
11046
11190
  input: ["text"],
11047
11191
  cost: {
11048
- input: 0.19999999999999998,
11049
- output: 1.1,
11050
- cacheRead: 0,
11051
- cacheWrite: 0,
11052
- },
11053
- contextWindow: 131072,
11054
- maxTokens: 131072,
11055
- },
11056
- "qwen/qwen-2.5-72b-instruct": {
11057
- id: "qwen/qwen-2.5-72b-instruct",
11058
- name: "Qwen2.5 72B Instruct",
11059
- api: "openai-completions",
11060
- provider: "openrouter",
11061
- baseUrl: "https://openrouter.ai/api/v1",
11062
- reasoning: false,
11063
- input: ["text"],
11064
- cost: {
11065
- input: 0.36,
11066
- output: 0.39999999999999997,
11192
+ input: 0.19999999999999998,
11193
+ output: 1.1,
11067
11194
  cacheRead: 0,
11068
11195
  cacheWrite: 0,
11069
11196
  },
11070
11197
  contextWindow: 131072,
11071
- maxTokens: 16384,
11198
+ maxTokens: 131072,
11072
11199
  },
11073
- "qwen/qwen-2.5-7b-instruct": {
11074
- id: "qwen/qwen-2.5-7b-instruct",
11075
- name: "Qwen: Qwen2.5 7B Instruct",
11200
+ "qwen/qwen-2.5-72b-instruct": {
11201
+ id: "qwen/qwen-2.5-72b-instruct",
11202
+ name: "Qwen2.5 72B Instruct",
11076
11203
  api: "openai-completions",
11077
11204
  provider: "openrouter",
11078
11205
  baseUrl: "https://openrouter.ai/api/v1",
11079
11206
  reasoning: false,
11080
11207
  input: ["text"],
11081
11208
  cost: {
11082
- input: 0.04,
11083
- output: 0.09999999999999999,
11209
+ input: 0.36,
11210
+ output: 0.39999999999999997,
11084
11211
  cacheRead: 0,
11085
11212
  cacheWrite: 0,
11086
11213
  },
11087
11214
  contextWindow: 131072,
11088
- maxTokens: 32768,
11215
+ maxTokens: 16384,
11089
11216
  },
11090
11217
  "qwen/qwen-plus": {
11091
11218
  id: "qwen/qwen-plus",
@@ -11116,7 +11243,7 @@ export const MODELS = {
11116
11243
  input: 0.26,
11117
11244
  output: 0.78,
11118
11245
  cacheRead: 0,
11119
- cacheWrite: 0.325,
11246
+ cacheWrite: 0,
11120
11247
  },
11121
11248
  contextWindow: 1000000,
11122
11249
  maxTokens: 32768,
@@ -11198,13 +11325,13 @@ export const MODELS = {
11198
11325
  reasoning: true,
11199
11326
  input: ["text"],
11200
11327
  cost: {
11201
- input: 0.14950000000000002,
11202
- output: 1.495,
11203
- cacheRead: 0,
11328
+ input: 0.09999999999999999,
11329
+ output: 0.09999999999999999,
11330
+ cacheRead: 0.09999999999999999,
11204
11331
  cacheWrite: 0,
11205
11332
  },
11206
11333
  contextWindow: 262144,
11207
- maxTokens: 4096,
11334
+ maxTokens: 262144,
11208
11335
  },
11209
11336
  "qwen/qwen3-30b-a3b": {
11210
11337
  id: "qwen/qwen3-30b-a3b",
@@ -11640,13 +11767,13 @@ export const MODELS = {
11640
11767
  reasoning: true,
11641
11768
  input: ["text", "image"],
11642
11769
  cost: {
11643
- input: 0.13899999999999998,
11770
+ input: 0.14,
11644
11771
  output: 1,
11645
- cacheRead: 0,
11772
+ cacheRead: 0.049999999999999996,
11646
11773
  cacheWrite: 0,
11647
11774
  },
11648
11775
  contextWindow: 262144,
11649
- maxTokens: 4096,
11776
+ maxTokens: 262144,
11650
11777
  },
11651
11778
  "qwen/qwen3.5-397b-a17b": {
11652
11779
  id: "qwen/qwen3.5-397b-a17b",
@@ -11694,7 +11821,7 @@ export const MODELS = {
11694
11821
  input: 0.065,
11695
11822
  output: 0.26,
11696
11823
  cacheRead: 0,
11697
- cacheWrite: 0.08125,
11824
+ cacheWrite: 0,
11698
11825
  },
11699
11826
  contextWindow: 1000000,
11700
11827
  maxTokens: 65536,
@@ -11711,7 +11838,7 @@ export const MODELS = {
11711
11838
  input: 0.26,
11712
11839
  output: 1.56,
11713
11840
  cacheRead: 0,
11714
- cacheWrite: 0.325,
11841
+ cacheWrite: 0,
11715
11842
  },
11716
11843
  contextWindow: 1000000,
11717
11844
  maxTokens: 65536,
@@ -11728,7 +11855,7 @@ export const MODELS = {
11728
11855
  input: 0.3,
11729
11856
  output: 1.7999999999999998,
11730
11857
  cacheRead: 0,
11731
- cacheWrite: 0,
11858
+ cacheWrite: 0.375,
11732
11859
  },
11733
11860
  contextWindow: 1000000,
11734
11861
  maxTokens: 65536,
@@ -11742,13 +11869,13 @@ export const MODELS = {
11742
11869
  reasoning: true,
11743
11870
  input: ["text", "image"],
11744
11871
  cost: {
11745
- input: 0.3,
11872
+ input: 0.29,
11746
11873
  output: 3.1999999999999997,
11747
11874
  cacheRead: 0,
11748
11875
  cacheWrite: 0,
11749
11876
  },
11750
11877
  contextWindow: 262144,
11751
- maxTokens: 262144,
11878
+ maxTokens: 262140,
11752
11879
  },
11753
11880
  "qwen/qwen3.6-35b-a3b": {
11754
11881
  id: "qwen/qwen3.6-35b-a3b",
@@ -11759,7 +11886,7 @@ export const MODELS = {
11759
11886
  reasoning: true,
11760
11887
  input: ["text", "image"],
11761
11888
  cost: {
11762
- input: 0.15,
11889
+ input: 0.14,
11763
11890
  output: 1,
11764
11891
  cacheRead: 0,
11765
11892
  cacheWrite: 0,
@@ -11827,10 +11954,10 @@ export const MODELS = {
11827
11954
  reasoning: true,
11828
11955
  input: ["text"],
11829
11956
  cost: {
11830
- input: 2.5,
11831
- output: 7.5,
11832
- cacheRead: 0,
11833
- cacheWrite: 3.125,
11957
+ input: 1.25,
11958
+ output: 3.75,
11959
+ cacheRead: 0.25,
11960
+ cacheWrite: 1.5625,
11834
11961
  },
11835
11962
  contextWindow: 1000000,
11836
11963
  maxTokens: 65536,
@@ -11920,6 +12047,23 @@ export const MODELS = {
11920
12047
  contextWindow: 262144,
11921
12048
  maxTokens: 16384,
11922
12049
  },
12050
+ "stepfun/step-3.7-flash": {
12051
+ id: "stepfun/step-3.7-flash",
12052
+ name: "StepFun: Step 3.7 Flash",
12053
+ api: "openai-completions",
12054
+ provider: "openrouter",
12055
+ baseUrl: "https://openrouter.ai/api/v1",
12056
+ reasoning: true,
12057
+ input: ["text", "image"],
12058
+ cost: {
12059
+ input: 0.19999999999999998,
12060
+ output: 1.15,
12061
+ cacheRead: 0.04,
12062
+ cacheWrite: 0,
12063
+ },
12064
+ contextWindow: 256000,
12065
+ maxTokens: 256000,
12066
+ },
11923
12067
  "tencent/hy3-preview": {
11924
12068
  id: "tencent/hy3-preview",
11925
12069
  name: "Tencent: Hy3 preview",
@@ -11929,13 +12073,13 @@ export const MODELS = {
11929
12073
  reasoning: true,
11930
12074
  input: ["text"],
11931
12075
  cost: {
11932
- input: 0.06599999999999999,
11933
- output: 0.26,
11934
- cacheRead: 0.029,
12076
+ input: 0.063,
12077
+ output: 0.21,
12078
+ cacheRead: 0.020999999999999998,
11935
12079
  cacheWrite: 0,
11936
12080
  },
11937
12081
  contextWindow: 262144,
11938
- maxTokens: 262144,
12082
+ maxTokens: 4096,
11939
12083
  },
11940
12084
  "thedrummer/rocinante-12b": {
11941
12085
  id: "thedrummer/rocinante-12b",
@@ -12056,40 +12200,6 @@ export const MODELS = {
12056
12200
  contextWindow: 262144,
12057
12201
  maxTokens: 65536,
12058
12202
  },
12059
- "xiaomi/mimo-v2-omni": {
12060
- id: "xiaomi/mimo-v2-omni",
12061
- name: "Xiaomi: MiMo-V2-Omni",
12062
- api: "openai-completions",
12063
- provider: "openrouter",
12064
- baseUrl: "https://openrouter.ai/api/v1",
12065
- reasoning: true,
12066
- input: ["text", "image"],
12067
- cost: {
12068
- input: 0.39999999999999997,
12069
- output: 2,
12070
- cacheRead: 0.08,
12071
- cacheWrite: 0,
12072
- },
12073
- contextWindow: 262144,
12074
- maxTokens: 65536,
12075
- },
12076
- "xiaomi/mimo-v2-pro": {
12077
- id: "xiaomi/mimo-v2-pro",
12078
- name: "Xiaomi: MiMo-V2-Pro",
12079
- api: "openai-completions",
12080
- provider: "openrouter",
12081
- baseUrl: "https://openrouter.ai/api/v1",
12082
- reasoning: true,
12083
- input: ["text"],
12084
- cost: {
12085
- input: 1,
12086
- output: 3,
12087
- cacheRead: 0.19999999999999998,
12088
- cacheWrite: 0,
12089
- },
12090
- contextWindow: 1048576,
12091
- maxTokens: 131072,
12092
- },
12093
12203
  "xiaomi/mimo-v2.5": {
12094
12204
  id: "xiaomi/mimo-v2.5",
12095
12205
  name: "Xiaomi: MiMo-V2.5",
@@ -12099,9 +12209,9 @@ export const MODELS = {
12099
12209
  reasoning: true,
12100
12210
  input: ["text", "image"],
12101
12211
  cost: {
12102
- input: 0.39999999999999997,
12103
- output: 2,
12104
- cacheRead: 0.08,
12212
+ input: 0.14,
12213
+ output: 0.28,
12214
+ cacheRead: 0.0028,
12105
12215
  cacheWrite: 0,
12106
12216
  },
12107
12217
  contextWindow: 1048576,
@@ -12116,13 +12226,13 @@ export const MODELS = {
12116
12226
  reasoning: true,
12117
12227
  input: ["text"],
12118
12228
  cost: {
12119
- input: 1,
12120
- output: 3,
12121
- cacheRead: 0.19999999999999998,
12229
+ input: 0.435,
12230
+ output: 0.87,
12231
+ cacheRead: 0.0036,
12122
12232
  cacheWrite: 0,
12123
12233
  },
12124
12234
  contextWindow: 1048576,
12125
- maxTokens: 16384,
12235
+ maxTokens: 131072,
12126
12236
  },
12127
12237
  "z-ai/glm-4-32b": {
12128
12238
  id: "z-ai/glm-4-32b",
@@ -12167,13 +12277,13 @@ export const MODELS = {
12167
12277
  reasoning: true,
12168
12278
  input: ["text"],
12169
12279
  cost: {
12170
- input: 0.13,
12280
+ input: 0.125,
12171
12281
  output: 0.85,
12172
- cacheRead: 0.024999999999999998,
12282
+ cacheRead: 0.06,
12173
12283
  cacheWrite: 0,
12174
12284
  },
12175
12285
  contextWindow: 131072,
12176
- maxTokens: 98304,
12286
+ maxTokens: 131070,
12177
12287
  },
12178
12288
  "z-ai/glm-4.5-air:free": {
12179
12289
  id: "z-ai/glm-4.5-air:free",
@@ -12439,13 +12549,13 @@ export const MODELS = {
12439
12549
  reasoning: true,
12440
12550
  input: ["text", "image"],
12441
12551
  cost: {
12442
- input: 0.73,
12443
- output: 3.49,
12444
- cacheRead: 0.25,
12552
+ input: 0.684,
12553
+ output: 3.42,
12554
+ cacheRead: 0.144,
12445
12555
  cacheWrite: 0,
12446
12556
  },
12447
12557
  contextWindow: 262144,
12448
- maxTokens: 262142,
12558
+ maxTokens: 262144,
12449
12559
  },
12450
12560
  "~openai/gpt-latest": {
12451
12561
  id: "~openai/gpt-latest",
@@ -12843,20 +12953,20 @@ export const MODELS = {
12843
12953
  },
12844
12954
  "alibaba/qwen-3-235b": {
12845
12955
  id: "alibaba/qwen-3-235b",
12846
- name: "Qwen3 235B A22b Instruct 2507",
12956
+ name: "Qwen3 235B A22B",
12847
12957
  api: "anthropic-messages",
12848
12958
  provider: "vercel-ai-gateway",
12849
12959
  baseUrl: "https://ai-gateway.vercel.sh",
12850
12960
  reasoning: false,
12851
12961
  input: ["text"],
12852
12962
  cost: {
12853
- input: 0.6,
12854
- output: 1.2,
12855
- cacheRead: 0.6,
12963
+ input: 0.22,
12964
+ output: 0.88,
12965
+ cacheRead: 0,
12856
12966
  cacheWrite: 0,
12857
12967
  },
12858
- contextWindow: 131000,
12859
- maxTokens: 40000,
12968
+ contextWindow: 262144,
12969
+ maxTokens: 16384,
12860
12970
  },
12861
12971
  "alibaba/qwen-3-30b": {
12862
12972
  id: "alibaba/qwen-3-30b",
@@ -13274,7 +13384,26 @@ export const MODELS = {
13274
13384
  api: "anthropic-messages",
13275
13385
  provider: "vercel-ai-gateway",
13276
13386
  baseUrl: "https://ai-gateway.vercel.sh",
13277
- compat: { "forceAdaptiveThinking": true },
13387
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13388
+ reasoning: true,
13389
+ thinkingLevelMap: { "xhigh": "xhigh" },
13390
+ input: ["text", "image"],
13391
+ cost: {
13392
+ input: 5,
13393
+ output: 25,
13394
+ cacheRead: 0.5,
13395
+ cacheWrite: 6.25,
13396
+ },
13397
+ contextWindow: 1000000,
13398
+ maxTokens: 128000,
13399
+ },
13400
+ "anthropic/claude-opus-4.8": {
13401
+ id: "anthropic/claude-opus-4.8",
13402
+ name: "Claude Opus 4.8",
13403
+ api: "anthropic-messages",
13404
+ provider: "vercel-ai-gateway",
13405
+ baseUrl: "https://ai-gateway.vercel.sh",
13406
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13278
13407
  reasoning: true,
13279
13408
  thinkingLevelMap: { "xhigh": "xhigh" },
13280
13409
  input: ["text", "image"],
@@ -13433,17 +13562,17 @@ export const MODELS = {
13433
13562
  reasoning: false,
13434
13563
  input: ["text"],
13435
13564
  cost: {
13436
- input: 0.77,
13437
- output: 0.77,
13438
- cacheRead: 0,
13565
+ input: 0.27,
13566
+ output: 1.12,
13567
+ cacheRead: 0.135,
13439
13568
  cacheWrite: 0,
13440
13569
  },
13441
13570
  contextWindow: 163840,
13442
- maxTokens: 16384,
13571
+ maxTokens: 163840,
13443
13572
  },
13444
13573
  "deepseek/deepseek-v3.1": {
13445
13574
  id: "deepseek/deepseek-v3.1",
13446
- name: "DeepSeek-V3.1",
13575
+ name: "DeepSeek V3.1",
13447
13576
  api: "anthropic-messages",
13448
13577
  provider: "vercel-ai-gateway",
13449
13578
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -14070,6 +14199,23 @@ export const MODELS = {
14070
14199
  contextWindow: 204800,
14071
14200
  maxTokens: 131100,
14072
14201
  },
14202
+ "minimax/minimax-m3": {
14203
+ id: "minimax/minimax-m3",
14204
+ name: "MiniMax M3",
14205
+ api: "anthropic-messages",
14206
+ provider: "vercel-ai-gateway",
14207
+ baseUrl: "https://ai-gateway.vercel.sh",
14208
+ reasoning: true,
14209
+ input: ["text", "image"],
14210
+ cost: {
14211
+ input: 0.3,
14212
+ output: 1.2,
14213
+ cacheRead: 0.06,
14214
+ cacheWrite: 0,
14215
+ },
14216
+ contextWindow: 1000000,
14217
+ maxTokens: 1000000,
14218
+ },
14073
14219
  "mistral/codestral": {
14074
14220
  id: "mistral/codestral",
14075
14221
  name: "Mistral Codestral",
@@ -14887,7 +15033,7 @@ export const MODELS = {
14887
15033
  provider: "vercel-ai-gateway",
14888
15034
  baseUrl: "https://ai-gateway.vercel.sh",
14889
15035
  reasoning: true,
14890
- thinkingLevelMap: { "xhigh": "xhigh" },
15036
+ thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
14891
15037
  input: ["text", "image"],
14892
15038
  cost: {
14893
15039
  input: 30,
@@ -15068,6 +15214,40 @@ export const MODELS = {
15068
15214
  contextWindow: 200000,
15069
15215
  maxTokens: 8000,
15070
15216
  },
15217
+ "stepfun/step-3.5-flash": {
15218
+ id: "stepfun/step-3.5-flash",
15219
+ name: "StepFun 3.5 Flash",
15220
+ api: "anthropic-messages",
15221
+ provider: "vercel-ai-gateway",
15222
+ baseUrl: "https://ai-gateway.vercel.sh",
15223
+ reasoning: true,
15224
+ input: ["text"],
15225
+ cost: {
15226
+ input: 0.09,
15227
+ output: 0.3,
15228
+ cacheRead: 0,
15229
+ cacheWrite: 0.02,
15230
+ },
15231
+ contextWindow: 262114,
15232
+ maxTokens: 262114,
15233
+ },
15234
+ "stepfun/step-3.7-flash": {
15235
+ id: "stepfun/step-3.7-flash",
15236
+ name: "Step 3.7 Flash",
15237
+ api: "anthropic-messages",
15238
+ provider: "vercel-ai-gateway",
15239
+ baseUrl: "https://ai-gateway.vercel.sh",
15240
+ reasoning: true,
15241
+ input: ["text", "image"],
15242
+ cost: {
15243
+ input: 0.19999999999999998,
15244
+ output: 1.15,
15245
+ cacheRead: 0.04,
15246
+ cacheWrite: 0,
15247
+ },
15248
+ contextWindow: 256000,
15249
+ maxTokens: 256000,
15250
+ },
15071
15251
  "xai/grok-4.1-fast-non-reasoning": {
15072
15252
  id: "xai/grok-4.1-fast-non-reasoning",
15073
15253
  name: "Grok 4.1 Fast Non-Reasoning",
@@ -15281,9 +15461,9 @@ export const MODELS = {
15281
15461
  reasoning: true,
15282
15462
  input: ["text", "image"],
15283
15463
  cost: {
15284
- input: 0.39999999999999997,
15285
- output: 2,
15286
- cacheRead: 0.08,
15464
+ input: 0.14,
15465
+ output: 0.28,
15466
+ cacheRead: 0.0028,
15287
15467
  cacheWrite: 0,
15288
15468
  },
15289
15469
  contextWindow: 1050000,
@@ -15298,9 +15478,9 @@ export const MODELS = {
15298
15478
  reasoning: true,
15299
15479
  input: ["text", "image"],
15300
15480
  cost: {
15301
- input: 1,
15302
- output: 3,
15303
- cacheRead: 0.19999999999999998,
15481
+ input: 0.435,
15482
+ output: 0.87,
15483
+ cacheRead: 0.0036,
15304
15484
  cacheWrite: 0,
15305
15485
  },
15306
15486
  contextWindow: 1050000,
@@ -15742,24 +15922,6 @@ export const MODELS = {
15742
15922
  },
15743
15923
  },
15744
15924
  "xiaomi-token-plan-ams": {
15745
- "mimo-v2-flash": {
15746
- id: "mimo-v2-flash",
15747
- name: "MiMo-V2-Flash",
15748
- api: "openai-completions",
15749
- provider: "xiaomi-token-plan-ams",
15750
- baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
15751
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15752
- reasoning: true,
15753
- input: ["text"],
15754
- cost: {
15755
- input: 0.1,
15756
- output: 0.3,
15757
- cacheRead: 0.01,
15758
- cacheWrite: 0,
15759
- },
15760
- contextWindow: 262144,
15761
- maxTokens: 65536,
15762
- },
15763
15925
  "mimo-v2-omni": {
15764
15926
  id: "mimo-v2-omni",
15765
15927
  name: "MiMo-V2-Omni",
@@ -15834,24 +15996,6 @@ export const MODELS = {
15834
15996
  },
15835
15997
  },
15836
15998
  "xiaomi-token-plan-cn": {
15837
- "mimo-v2-flash": {
15838
- id: "mimo-v2-flash",
15839
- name: "MiMo-V2-Flash",
15840
- api: "openai-completions",
15841
- provider: "xiaomi-token-plan-cn",
15842
- baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
15843
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15844
- reasoning: true,
15845
- input: ["text"],
15846
- cost: {
15847
- input: 0.1,
15848
- output: 0.3,
15849
- cacheRead: 0.01,
15850
- cacheWrite: 0,
15851
- },
15852
- contextWindow: 262144,
15853
- maxTokens: 65536,
15854
- },
15855
15999
  "mimo-v2-omni": {
15856
16000
  id: "mimo-v2-omni",
15857
16001
  name: "MiMo-V2-Omni",
@@ -15926,24 +16070,6 @@ export const MODELS = {
15926
16070
  },
15927
16071
  },
15928
16072
  "xiaomi-token-plan-sgp": {
15929
- "mimo-v2-flash": {
15930
- id: "mimo-v2-flash",
15931
- name: "MiMo-V2-Flash",
15932
- api: "openai-completions",
15933
- provider: "xiaomi-token-plan-sgp",
15934
- baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
15935
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15936
- reasoning: true,
15937
- input: ["text"],
15938
- cost: {
15939
- input: 0.1,
15940
- output: 0.3,
15941
- cacheRead: 0.01,
15942
- cacheWrite: 0,
15943
- },
15944
- contextWindow: 262144,
15945
- maxTokens: 65536,
15946
- },
15947
16073
  "mimo-v2-omni": {
15948
16074
  id: "mimo-v2-omni",
15949
16075
  name: "MiMo-V2-Omni",