@earendil-works/pi-ai 0.75.4 → 0.76.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (62) hide show
  1. package/dist/cli.d.ts.map +1 -1
  2. package/dist/cli.js +14 -0
  3. package/dist/cli.js.map +1 -1
  4. package/dist/index.d.ts +1 -1
  5. package/dist/index.d.ts.map +1 -1
  6. package/dist/index.js.map +1 -1
  7. package/dist/models.generated.d.ts +364 -687
  8. package/dist/models.generated.d.ts.map +1 -1
  9. package/dist/models.generated.js +407 -749
  10. package/dist/models.generated.js.map +1 -1
  11. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  12. package/dist/providers/amazon-bedrock.js +2 -1
  13. package/dist/providers/amazon-bedrock.js.map +1 -1
  14. package/dist/providers/anthropic.d.ts +22 -5
  15. package/dist/providers/anthropic.d.ts.map +1 -1
  16. package/dist/providers/anthropic.js +8 -22
  17. package/dist/providers/anthropic.js.map +1 -1
  18. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  19. package/dist/providers/azure-openai-responses.js +1 -1
  20. package/dist/providers/azure-openai-responses.js.map +1 -1
  21. package/dist/providers/images/openrouter.d.ts.map +1 -1
  22. package/dist/providers/images/openrouter.js +1 -1
  23. package/dist/providers/images/openrouter.js.map +1 -1
  24. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  25. package/dist/providers/openai-codex-responses.js +148 -76
  26. package/dist/providers/openai-codex-responses.js.map +1 -1
  27. package/dist/providers/openai-completions.d.ts.map +1 -1
  28. package/dist/providers/openai-completions.js +1 -1
  29. package/dist/providers/openai-completions.js.map +1 -1
  30. package/dist/providers/openai-responses.d.ts.map +1 -1
  31. package/dist/providers/openai-responses.js +1 -1
  32. package/dist/providers/openai-responses.js.map +1 -1
  33. package/dist/providers/simple-options.d.ts.map +1 -1
  34. package/dist/providers/simple-options.js +1 -0
  35. package/dist/providers/simple-options.js.map +1 -1
  36. package/dist/types.d.ts +16 -0
  37. package/dist/types.d.ts.map +1 -1
  38. package/dist/types.js.map +1 -1
  39. package/dist/utils/abort-signals.d.ts +6 -0
  40. package/dist/utils/abort-signals.d.ts.map +1 -0
  41. package/dist/utils/abort-signals.js +34 -0
  42. package/dist/utils/abort-signals.js.map +1 -0
  43. package/dist/utils/oauth/device-code.d.ts +19 -0
  44. package/dist/utils/oauth/device-code.d.ts.map +1 -0
  45. package/dist/utils/oauth/device-code.js +55 -0
  46. package/dist/utils/oauth/device-code.js.map +1 -0
  47. package/dist/utils/oauth/github-copilot.d.ts +3 -3
  48. package/dist/utils/oauth/github-copilot.d.ts.map +1 -1
  49. package/dist/utils/oauth/github-copilot.js +45 -69
  50. package/dist/utils/oauth/github-copilot.js.map +1 -1
  51. package/dist/utils/oauth/index.d.ts +1 -0
  52. package/dist/utils/oauth/index.d.ts.map +1 -1
  53. package/dist/utils/oauth/index.js +1 -0
  54. package/dist/utils/oauth/index.js.map +1 -1
  55. package/dist/utils/oauth/types.d.ts +8 -1
  56. package/dist/utils/oauth/types.d.ts.map +1 -1
  57. package/dist/utils/oauth/types.js.map +1 -1
  58. package/dist/utils/overflow.d.ts +2 -1
  59. package/dist/utils/overflow.d.ts.map +1 -1
  60. package/dist/utils/overflow.js +5 -2
  61. package/dist/utils/overflow.js.map +1 -1
  62. package/package.json +2 -1
@@ -1720,6 +1720,7 @@ export const MODELS = {
1720
1720
  api: "anthropic-messages",
1721
1721
  provider: "anthropic",
1722
1722
  baseUrl: "https://api.anthropic.com",
1723
+ compat: { "forceAdaptiveThinking": true },
1723
1724
  reasoning: true,
1724
1725
  thinkingLevelMap: { "xhigh": "max" },
1725
1726
  input: ["text", "image"],
@@ -1738,6 +1739,7 @@ export const MODELS = {
1738
1739
  api: "anthropic-messages",
1739
1740
  provider: "anthropic",
1740
1741
  baseUrl: "https://api.anthropic.com",
1742
+ compat: { "forceAdaptiveThinking": true },
1741
1743
  reasoning: true,
1742
1744
  thinkingLevelMap: { "xhigh": "xhigh" },
1743
1745
  input: ["text", "image"],
@@ -1824,6 +1826,7 @@ export const MODELS = {
1824
1826
  api: "anthropic-messages",
1825
1827
  provider: "anthropic",
1826
1828
  baseUrl: "https://api.anthropic.com",
1829
+ compat: { "forceAdaptiveThinking": true },
1827
1830
  reasoning: true,
1828
1831
  input: ["text", "image"],
1829
1832
  cost: {
@@ -1916,7 +1919,7 @@ export const MODELS = {
1916
1919
  cost: {
1917
1920
  input: 0.1,
1918
1921
  output: 0.4,
1919
- cacheRead: 0.03,
1922
+ cacheRead: 0.025,
1920
1923
  cacheWrite: 0,
1921
1924
  },
1922
1925
  contextWindow: 1047576,
@@ -2001,7 +2004,7 @@ export const MODELS = {
2001
2004
  cost: {
2002
2005
  input: 0.15,
2003
2006
  output: 0.6,
2004
- cacheRead: 0.08,
2007
+ cacheRead: 0.075,
2005
2008
  cacheWrite: 0,
2006
2009
  },
2007
2010
  contextWindow: 128000,
@@ -2127,7 +2130,7 @@ export const MODELS = {
2127
2130
  cost: {
2128
2131
  input: 1.25,
2129
2132
  output: 10,
2130
- cacheRead: 0.13,
2133
+ cacheRead: 0.125,
2131
2134
  cacheWrite: 0,
2132
2135
  },
2133
2136
  contextWindow: 400000,
@@ -2552,7 +2555,7 @@ export const MODELS = {
2552
2555
  cost: {
2553
2556
  input: 1.1,
2554
2557
  output: 4.4,
2555
- cacheRead: 0.28,
2558
+ cacheRead: 0.275,
2556
2559
  cacheWrite: 0,
2557
2560
  },
2558
2561
  contextWindow: 200000,
@@ -2611,23 +2614,6 @@ export const MODELS = {
2611
2614
  contextWindow: 32000,
2612
2615
  maxTokens: 8000,
2613
2616
  },
2614
- "qwen-3-235b-a22b-instruct-2507": {
2615
- id: "qwen-3-235b-a22b-instruct-2507",
2616
- name: "Qwen 3 235B Instruct",
2617
- api: "openai-completions",
2618
- provider: "cerebras",
2619
- baseUrl: "https://api.cerebras.ai/v1",
2620
- reasoning: false,
2621
- input: ["text"],
2622
- cost: {
2623
- input: 0.6,
2624
- output: 1.2,
2625
- cacheRead: 0,
2626
- cacheWrite: 0,
2627
- },
2628
- contextWindow: 131000,
2629
- maxTokens: 32000,
2630
- },
2631
2617
  "zai-glm-4.7": {
2632
2618
  id: "zai-glm-4.7",
2633
2619
  name: "Z.AI GLM-4.7",
@@ -2823,6 +2809,7 @@ export const MODELS = {
2823
2809
  api: "anthropic-messages",
2824
2810
  provider: "cloudflare-ai-gateway",
2825
2811
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2812
+ compat: { "forceAdaptiveThinking": true },
2826
2813
  reasoning: true,
2827
2814
  thinkingLevelMap: { "xhigh": "max" },
2828
2815
  input: ["text", "image"],
@@ -2841,6 +2828,7 @@ export const MODELS = {
2841
2828
  api: "anthropic-messages",
2842
2829
  provider: "cloudflare-ai-gateway",
2843
2830
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2831
+ compat: { "forceAdaptiveThinking": true },
2844
2832
  reasoning: true,
2845
2833
  thinkingLevelMap: { "xhigh": "xhigh" },
2846
2834
  input: ["text", "image"],
@@ -2893,6 +2881,7 @@ export const MODELS = {
2893
2881
  api: "anthropic-messages",
2894
2882
  provider: "cloudflare-ai-gateway",
2895
2883
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2884
+ compat: { "forceAdaptiveThinking": true },
2896
2885
  reasoning: true,
2897
2886
  input: ["text", "image"],
2898
2887
  cost: {
@@ -3275,6 +3264,42 @@ export const MODELS = {
3275
3264
  contextWindow: 256000,
3276
3265
  maxTokens: 16384,
3277
3266
  },
3267
+ "@cf/ibm-granite/granite-4.0-h-micro": {
3268
+ id: "@cf/ibm-granite/granite-4.0-h-micro",
3269
+ name: "Granite 4.0 H Micro",
3270
+ api: "openai-completions",
3271
+ provider: "cloudflare-workers-ai",
3272
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3273
+ compat: { "sendSessionAffinityHeaders": true },
3274
+ reasoning: false,
3275
+ input: ["text"],
3276
+ cost: {
3277
+ input: 0.017,
3278
+ output: 0.112,
3279
+ cacheRead: 0,
3280
+ cacheWrite: 0,
3281
+ },
3282
+ contextWindow: 131000,
3283
+ maxTokens: 131000,
3284
+ },
3285
+ "@cf/meta/llama-3.3-70b-instruct-fp8-fast": {
3286
+ id: "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
3287
+ name: "Llama 3.3 70B Instruct fp8 Fast",
3288
+ api: "openai-completions",
3289
+ provider: "cloudflare-workers-ai",
3290
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3291
+ compat: { "sendSessionAffinityHeaders": true },
3292
+ reasoning: false,
3293
+ input: ["text"],
3294
+ cost: {
3295
+ input: 0.293,
3296
+ output: 2.253,
3297
+ cacheRead: 0,
3298
+ cacheWrite: 0,
3299
+ },
3300
+ contextWindow: 24000,
3301
+ maxTokens: 24000,
3302
+ },
3278
3303
  "@cf/meta/llama-4-scout-17b-16e-instruct": {
3279
3304
  id: "@cf/meta/llama-4-scout-17b-16e-instruct",
3280
3305
  name: "Llama 4 Scout 17B 16E Instruct",
@@ -3290,9 +3315,27 @@ export const MODELS = {
3290
3315
  cacheRead: 0,
3291
3316
  cacheWrite: 0,
3292
3317
  },
3293
- contextWindow: 128000,
3318
+ contextWindow: 131000,
3294
3319
  maxTokens: 16384,
3295
3320
  },
3321
+ "@cf/mistralai/mistral-small-3.1-24b-instruct": {
3322
+ id: "@cf/mistralai/mistral-small-3.1-24b-instruct",
3323
+ name: "Mistral Small 3.1 24B Instruct",
3324
+ api: "openai-completions",
3325
+ provider: "cloudflare-workers-ai",
3326
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3327
+ compat: { "sendSessionAffinityHeaders": true },
3328
+ reasoning: false,
3329
+ input: ["text"],
3330
+ cost: {
3331
+ input: 0.351,
3332
+ output: 0.555,
3333
+ cacheRead: 0,
3334
+ cacheWrite: 0,
3335
+ },
3336
+ contextWindow: 128000,
3337
+ maxTokens: 128000,
3338
+ },
3296
3339
  "@cf/moonshotai/kimi-k2.5": {
3297
3340
  id: "@cf/moonshotai/kimi-k2.5",
3298
3341
  name: "Kimi K2.5",
@@ -3326,7 +3369,7 @@ export const MODELS = {
3326
3369
  cacheRead: 0.16,
3327
3370
  cacheWrite: 0,
3328
3371
  },
3329
- contextWindow: 256000,
3372
+ contextWindow: 262144,
3330
3373
  maxTokens: 256000,
3331
3374
  },
3332
3375
  "@cf/nvidia/nemotron-3-120b-a12b": {
@@ -3383,6 +3426,24 @@ export const MODELS = {
3383
3426
  contextWindow: 128000,
3384
3427
  maxTokens: 16384,
3385
3428
  },
3429
+ "@cf/qwen/qwen3-30b-a3b-fp8": {
3430
+ id: "@cf/qwen/qwen3-30b-a3b-fp8",
3431
+ name: "Qwen3 30B A3b fp8",
3432
+ api: "openai-completions",
3433
+ provider: "cloudflare-workers-ai",
3434
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3435
+ compat: { "sendSessionAffinityHeaders": true },
3436
+ reasoning: true,
3437
+ input: ["text"],
3438
+ cost: {
3439
+ input: 0.0509,
3440
+ output: 0.335,
3441
+ cacheRead: 0,
3442
+ cacheWrite: 0,
3443
+ },
3444
+ contextWindow: 32768,
3445
+ maxTokens: 32768,
3446
+ },
3386
3447
  "@cf/zai-org/glm-4.7-flash": {
3387
3448
  id: "@cf/zai-org/glm-4.7-flash",
3388
3449
  name: "GLM-4.7-Flash",
@@ -3393,7 +3454,7 @@ export const MODELS = {
3393
3454
  reasoning: true,
3394
3455
  input: ["text"],
3395
3456
  cost: {
3396
- input: 0.06,
3457
+ input: 0.0605,
3397
3458
  output: 0.4,
3398
3459
  cacheRead: 0,
3399
3460
  cacheWrite: 0,
@@ -3443,42 +3504,6 @@ export const MODELS = {
3443
3504
  },
3444
3505
  },
3445
3506
  "fireworks": {
3446
- "accounts/fireworks/models/deepseek-v3p1": {
3447
- id: "accounts/fireworks/models/deepseek-v3p1",
3448
- name: "DeepSeek V3.1",
3449
- api: "anthropic-messages",
3450
- provider: "fireworks",
3451
- baseUrl: "https://api.fireworks.ai/inference",
3452
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3453
- reasoning: true,
3454
- input: ["text"],
3455
- cost: {
3456
- input: 0.56,
3457
- output: 1.68,
3458
- cacheRead: 0,
3459
- cacheWrite: 0,
3460
- },
3461
- contextWindow: 163840,
3462
- maxTokens: 163840,
3463
- },
3464
- "accounts/fireworks/models/deepseek-v3p2": {
3465
- id: "accounts/fireworks/models/deepseek-v3p2",
3466
- name: "DeepSeek V3.2",
3467
- api: "anthropic-messages",
3468
- provider: "fireworks",
3469
- baseUrl: "https://api.fireworks.ai/inference",
3470
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3471
- reasoning: true,
3472
- input: ["text"],
3473
- cost: {
3474
- input: 0.56,
3475
- output: 1.68,
3476
- cacheRead: 0.28,
3477
- cacheWrite: 0,
3478
- },
3479
- contextWindow: 160000,
3480
- maxTokens: 160000,
3481
- },
3482
3507
  "accounts/fireworks/models/deepseek-v4-flash": {
3483
3508
  id: "accounts/fireworks/models/deepseek-v4-flash",
3484
3509
  name: "DeepSeek V4 Flash",
@@ -3509,84 +3534,12 @@ export const MODELS = {
3509
3534
  cost: {
3510
3535
  input: 1.74,
3511
3536
  output: 3.48,
3512
- cacheRead: 0.15,
3537
+ cacheRead: 0.145,
3513
3538
  cacheWrite: 0,
3514
3539
  },
3515
3540
  contextWindow: 1000000,
3516
3541
  maxTokens: 384000,
3517
3542
  },
3518
- "accounts/fireworks/models/glm-4p5": {
3519
- id: "accounts/fireworks/models/glm-4p5",
3520
- name: "GLM 4.5",
3521
- api: "anthropic-messages",
3522
- provider: "fireworks",
3523
- baseUrl: "https://api.fireworks.ai/inference",
3524
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3525
- reasoning: true,
3526
- input: ["text"],
3527
- cost: {
3528
- input: 0.55,
3529
- output: 2.19,
3530
- cacheRead: 0,
3531
- cacheWrite: 0,
3532
- },
3533
- contextWindow: 131072,
3534
- maxTokens: 131072,
3535
- },
3536
- "accounts/fireworks/models/glm-4p5-air": {
3537
- id: "accounts/fireworks/models/glm-4p5-air",
3538
- name: "GLM 4.5 Air",
3539
- api: "anthropic-messages",
3540
- provider: "fireworks",
3541
- baseUrl: "https://api.fireworks.ai/inference",
3542
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3543
- reasoning: true,
3544
- input: ["text"],
3545
- cost: {
3546
- input: 0.22,
3547
- output: 0.88,
3548
- cacheRead: 0,
3549
- cacheWrite: 0,
3550
- },
3551
- contextWindow: 131072,
3552
- maxTokens: 131072,
3553
- },
3554
- "accounts/fireworks/models/glm-4p7": {
3555
- id: "accounts/fireworks/models/glm-4p7",
3556
- name: "GLM 4.7",
3557
- api: "anthropic-messages",
3558
- provider: "fireworks",
3559
- baseUrl: "https://api.fireworks.ai/inference",
3560
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3561
- reasoning: true,
3562
- input: ["text"],
3563
- cost: {
3564
- input: 0.6,
3565
- output: 2.2,
3566
- cacheRead: 0.3,
3567
- cacheWrite: 0,
3568
- },
3569
- contextWindow: 198000,
3570
- maxTokens: 198000,
3571
- },
3572
- "accounts/fireworks/models/glm-5": {
3573
- id: "accounts/fireworks/models/glm-5",
3574
- name: "GLM 5",
3575
- api: "anthropic-messages",
3576
- provider: "fireworks",
3577
- baseUrl: "https://api.fireworks.ai/inference",
3578
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3579
- reasoning: true,
3580
- input: ["text"],
3581
- cost: {
3582
- input: 1,
3583
- output: 3.2,
3584
- cacheRead: 0.5,
3585
- cacheWrite: 0,
3586
- },
3587
- contextWindow: 202752,
3588
- maxTokens: 131072,
3589
- },
3590
3543
  "accounts/fireworks/models/glm-5p1": {
3591
3544
  id: "accounts/fireworks/models/glm-5p1",
3592
3545
  name: "GLM 5.1",
@@ -3617,7 +3570,7 @@ export const MODELS = {
3617
3570
  cost: {
3618
3571
  input: 0.15,
3619
3572
  output: 0.6,
3620
- cacheRead: 0,
3573
+ cacheRead: 0.015,
3621
3574
  cacheWrite: 0,
3622
3575
  },
3623
3576
  contextWindow: 131072,
@@ -3633,50 +3586,14 @@ export const MODELS = {
3633
3586
  reasoning: true,
3634
3587
  input: ["text"],
3635
3588
  cost: {
3636
- input: 0.05,
3637
- output: 0.2,
3638
- cacheRead: 0,
3589
+ input: 0.07,
3590
+ output: 0.3,
3591
+ cacheRead: 0.035,
3639
3592
  cacheWrite: 0,
3640
3593
  },
3641
3594
  contextWindow: 131072,
3642
3595
  maxTokens: 32768,
3643
3596
  },
3644
- "accounts/fireworks/models/kimi-k2-instruct": {
3645
- id: "accounts/fireworks/models/kimi-k2-instruct",
3646
- name: "Kimi K2 Instruct",
3647
- api: "anthropic-messages",
3648
- provider: "fireworks",
3649
- baseUrl: "https://api.fireworks.ai/inference",
3650
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3651
- reasoning: false,
3652
- input: ["text"],
3653
- cost: {
3654
- input: 1,
3655
- output: 3,
3656
- cacheRead: 0,
3657
- cacheWrite: 0,
3658
- },
3659
- contextWindow: 128000,
3660
- maxTokens: 16384,
3661
- },
3662
- "accounts/fireworks/models/kimi-k2-thinking": {
3663
- id: "accounts/fireworks/models/kimi-k2-thinking",
3664
- name: "Kimi K2 Thinking",
3665
- api: "anthropic-messages",
3666
- provider: "fireworks",
3667
- baseUrl: "https://api.fireworks.ai/inference",
3668
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3669
- reasoning: true,
3670
- input: ["text"],
3671
- cost: {
3672
- input: 0.6,
3673
- output: 2.5,
3674
- cacheRead: 0.3,
3675
- cacheWrite: 0,
3676
- },
3677
- contextWindow: 256000,
3678
- maxTokens: 256000,
3679
- },
3680
3597
  "accounts/fireworks/models/kimi-k2p5": {
3681
3598
  id: "accounts/fireworks/models/kimi-k2p5",
3682
3599
  name: "Kimi K2.5",
@@ -3713,24 +3630,6 @@ export const MODELS = {
3713
3630
  contextWindow: 262000,
3714
3631
  maxTokens: 262000,
3715
3632
  },
3716
- "accounts/fireworks/models/minimax-m2p1": {
3717
- id: "accounts/fireworks/models/minimax-m2p1",
3718
- name: "MiniMax-M2.1",
3719
- api: "anthropic-messages",
3720
- provider: "fireworks",
3721
- baseUrl: "https://api.fireworks.ai/inference",
3722
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3723
- reasoning: true,
3724
- input: ["text"],
3725
- cost: {
3726
- input: 0.3,
3727
- output: 1.2,
3728
- cacheRead: 0.03,
3729
- cacheWrite: 0,
3730
- },
3731
- contextWindow: 200000,
3732
- maxTokens: 200000,
3733
- },
3734
3633
  "accounts/fireworks/models/minimax-m2p5": {
3735
3634
  id: "accounts/fireworks/models/minimax-m2p5",
3736
3635
  name: "MiniMax-M2.5",
@@ -3761,7 +3660,7 @@ export const MODELS = {
3761
3660
  cost: {
3762
3661
  input: 0.3,
3763
3662
  output: 1.2,
3764
- cacheRead: 0.03,
3663
+ cacheRead: 0.06,
3765
3664
  cacheWrite: 0,
3766
3665
  },
3767
3666
  contextWindow: 196608,
@@ -3785,9 +3684,27 @@ export const MODELS = {
3785
3684
  contextWindow: 128000,
3786
3685
  maxTokens: 8192,
3787
3686
  },
3788
- "accounts/fireworks/routers/kimi-k2p5-turbo": {
3789
- id: "accounts/fireworks/routers/kimi-k2p5-turbo",
3790
- name: "Kimi K2.5 Turbo",
3687
+ "accounts/fireworks/routers/glm-5p1-fast": {
3688
+ id: "accounts/fireworks/routers/glm-5p1-fast",
3689
+ name: "GLM 5.1 Fast",
3690
+ api: "anthropic-messages",
3691
+ provider: "fireworks",
3692
+ baseUrl: "https://api.fireworks.ai/inference",
3693
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3694
+ reasoning: true,
3695
+ input: ["text"],
3696
+ cost: {
3697
+ input: 2.8,
3698
+ output: 8.8,
3699
+ cacheRead: 0.52,
3700
+ cacheWrite: 0,
3701
+ },
3702
+ contextWindow: 202800,
3703
+ maxTokens: 131072,
3704
+ },
3705
+ "accounts/fireworks/routers/kimi-k2p6-turbo": {
3706
+ id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3707
+ name: "Kimi K2.6 Turbo",
3791
3708
  api: "anthropic-messages",
3792
3709
  provider: "fireworks",
3793
3710
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3795,13 +3712,13 @@ export const MODELS = {
3795
3712
  reasoning: true,
3796
3713
  input: ["text", "image"],
3797
3714
  cost: {
3798
- input: 0,
3799
- output: 0,
3800
- cacheRead: 0,
3715
+ input: 2,
3716
+ output: 8,
3717
+ cacheRead: 0.3,
3801
3718
  cacheWrite: 0,
3802
3719
  },
3803
- contextWindow: 256000,
3804
- maxTokens: 256000,
3720
+ contextWindow: 262000,
3721
+ maxTokens: 262000,
3805
3722
  },
3806
3723
  },
3807
3724
  "github-copilot": {
@@ -3849,6 +3766,7 @@ export const MODELS = {
3849
3766
  provider: "github-copilot",
3850
3767
  baseUrl: "https://api.individual.githubcopilot.com",
3851
3768
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3769
+ compat: { "forceAdaptiveThinking": true },
3852
3770
  reasoning: true,
3853
3771
  thinkingLevelMap: { "xhigh": "max" },
3854
3772
  input: ["text", "image"],
@@ -3868,6 +3786,7 @@ export const MODELS = {
3868
3786
  provider: "github-copilot",
3869
3787
  baseUrl: "https://api.individual.githubcopilot.com",
3870
3788
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3789
+ compat: { "forceAdaptiveThinking": true },
3871
3790
  reasoning: true,
3872
3791
  thinkingLevelMap: { "xhigh": "xhigh" },
3873
3792
  input: ["text", "image"],
@@ -3906,6 +3825,7 @@ export const MODELS = {
3906
3825
  provider: "github-copilot",
3907
3826
  baseUrl: "https://api.individual.githubcopilot.com",
3908
3827
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3828
+ compat: { "forceAdaptiveThinking": true },
3909
3829
  reasoning: true,
3910
3830
  input: ["text", "image"],
3911
3831
  cost: {
@@ -3974,6 +3894,25 @@ export const MODELS = {
3974
3894
  contextWindow: 128000,
3975
3895
  maxTokens: 64000,
3976
3896
  },
3897
+ "gemini-3.5-flash": {
3898
+ id: "gemini-3.5-flash",
3899
+ name: "Gemini 3.5 Flash",
3900
+ api: "openai-completions",
3901
+ provider: "github-copilot",
3902
+ baseUrl: "https://api.individual.githubcopilot.com",
3903
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3904
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3905
+ reasoning: true,
3906
+ input: ["text", "image"],
3907
+ cost: {
3908
+ input: 0,
3909
+ output: 0,
3910
+ cacheRead: 0,
3911
+ cacheWrite: 0,
3912
+ },
3913
+ contextWindow: 128000,
3914
+ maxTokens: 64000,
3915
+ },
3977
3916
  "gpt-4.1": {
3978
3917
  id: "gpt-4.1",
3979
3918
  name: "GPT-4.1",
@@ -4166,57 +4105,6 @@ export const MODELS = {
4166
4105
  },
4167
4106
  },
4168
4107
  "google": {
4169
- "gemini-1.5-flash": {
4170
- id: "gemini-1.5-flash",
4171
- name: "Gemini 1.5 Flash",
4172
- api: "google-generative-ai",
4173
- provider: "google",
4174
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4175
- reasoning: false,
4176
- input: ["text", "image"],
4177
- cost: {
4178
- input: 0.075,
4179
- output: 0.3,
4180
- cacheRead: 0.01875,
4181
- cacheWrite: 0,
4182
- },
4183
- contextWindow: 1000000,
4184
- maxTokens: 8192,
4185
- },
4186
- "gemini-1.5-flash-8b": {
4187
- id: "gemini-1.5-flash-8b",
4188
- name: "Gemini 1.5 Flash-8B",
4189
- api: "google-generative-ai",
4190
- provider: "google",
4191
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4192
- reasoning: false,
4193
- input: ["text", "image"],
4194
- cost: {
4195
- input: 0.0375,
4196
- output: 0.15,
4197
- cacheRead: 0.01,
4198
- cacheWrite: 0,
4199
- },
4200
- contextWindow: 1000000,
4201
- maxTokens: 8192,
4202
- },
4203
- "gemini-1.5-pro": {
4204
- id: "gemini-1.5-pro",
4205
- name: "Gemini 1.5 Pro",
4206
- api: "google-generative-ai",
4207
- provider: "google",
4208
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4209
- reasoning: false,
4210
- input: ["text", "image"],
4211
- cost: {
4212
- input: 1.25,
4213
- output: 5,
4214
- cacheRead: 0.3125,
4215
- cacheWrite: 0,
4216
- },
4217
- contextWindow: 1000000,
4218
- maxTokens: 8192,
4219
- },
4220
4108
  "gemini-2.0-flash": {
4221
4109
  id: "gemini-2.0-flash",
4222
4110
  name: "Gemini 2.0 Flash",
@@ -4236,7 +4124,7 @@ export const MODELS = {
4236
4124
  },
4237
4125
  "gemini-2.0-flash-lite": {
4238
4126
  id: "gemini-2.0-flash-lite",
4239
- name: "Gemini 2.0 Flash Lite",
4127
+ name: "Gemini 2.0 Flash-Lite",
4240
4128
  api: "google-generative-ai",
4241
4129
  provider: "google",
4242
4130
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4270,143 +4158,24 @@ export const MODELS = {
4270
4158
  },
4271
4159
  "gemini-2.5-flash-lite": {
4272
4160
  id: "gemini-2.5-flash-lite",
4273
- name: "Gemini 2.5 Flash Lite",
4161
+ name: "Gemini 2.5 Flash-Lite",
4274
4162
  api: "google-generative-ai",
4275
4163
  provider: "google",
4276
4164
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4277
4165
  reasoning: true,
4278
4166
  input: ["text", "image"],
4279
- cost: {
4280
- input: 0.1,
4281
- output: 0.4,
4282
- cacheRead: 0.01,
4283
- cacheWrite: 0,
4284
- },
4285
- contextWindow: 1048576,
4286
- maxTokens: 65536,
4287
- },
4288
- "gemini-2.5-flash-lite-preview-06-17": {
4289
- id: "gemini-2.5-flash-lite-preview-06-17",
4290
- name: "Gemini 2.5 Flash Lite Preview 06-17",
4291
- api: "google-generative-ai",
4292
- provider: "google",
4293
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4294
- reasoning: true,
4295
- input: ["text", "image"],
4296
- cost: {
4297
- input: 0.1,
4298
- output: 0.4,
4299
- cacheRead: 0.025,
4300
- cacheWrite: 0,
4301
- },
4302
- contextWindow: 1048576,
4303
- maxTokens: 65536,
4304
- },
4305
- "gemini-2.5-flash-lite-preview-09-2025": {
4306
- id: "gemini-2.5-flash-lite-preview-09-2025",
4307
- name: "Gemini 2.5 Flash Lite Preview 09-25",
4308
- api: "google-generative-ai",
4309
- provider: "google",
4310
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4311
- reasoning: true,
4312
- input: ["text", "image"],
4313
- cost: {
4314
- input: 0.1,
4315
- output: 0.4,
4316
- cacheRead: 0.025,
4317
- cacheWrite: 0,
4318
- },
4319
- contextWindow: 1048576,
4320
- maxTokens: 65536,
4321
- },
4322
- "gemini-2.5-flash-preview-04-17": {
4323
- id: "gemini-2.5-flash-preview-04-17",
4324
- name: "Gemini 2.5 Flash Preview 04-17",
4325
- api: "google-generative-ai",
4326
- provider: "google",
4327
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4328
- reasoning: true,
4329
- input: ["text", "image"],
4330
- cost: {
4331
- input: 0.15,
4332
- output: 0.6,
4333
- cacheRead: 0.0375,
4334
- cacheWrite: 0,
4335
- },
4336
- contextWindow: 1048576,
4337
- maxTokens: 65536,
4338
- },
4339
- "gemini-2.5-flash-preview-05-20": {
4340
- id: "gemini-2.5-flash-preview-05-20",
4341
- name: "Gemini 2.5 Flash Preview 05-20",
4342
- api: "google-generative-ai",
4343
- provider: "google",
4344
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4345
- reasoning: true,
4346
- input: ["text", "image"],
4347
- cost: {
4348
- input: 0.15,
4349
- output: 0.6,
4350
- cacheRead: 0.0375,
4351
- cacheWrite: 0,
4352
- },
4353
- contextWindow: 1048576,
4354
- maxTokens: 65536,
4355
- },
4356
- "gemini-2.5-flash-preview-09-2025": {
4357
- id: "gemini-2.5-flash-preview-09-2025",
4358
- name: "Gemini 2.5 Flash Preview 09-25",
4359
- api: "google-generative-ai",
4360
- provider: "google",
4361
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4362
- reasoning: true,
4363
- input: ["text", "image"],
4364
- cost: {
4365
- input: 0.3,
4366
- output: 2.5,
4367
- cacheRead: 0.075,
4368
- cacheWrite: 0,
4369
- },
4370
- contextWindow: 1048576,
4371
- maxTokens: 65536,
4372
- },
4373
- "gemini-2.5-pro": {
4374
- id: "gemini-2.5-pro",
4375
- name: "Gemini 2.5 Pro",
4376
- api: "google-generative-ai",
4377
- provider: "google",
4378
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4379
- reasoning: true,
4380
- input: ["text", "image"],
4381
- cost: {
4382
- input: 1.25,
4383
- output: 10,
4384
- cacheRead: 0.125,
4385
- cacheWrite: 0,
4386
- },
4387
- contextWindow: 1048576,
4388
- maxTokens: 65536,
4389
- },
4390
- "gemini-2.5-pro-preview-05-06": {
4391
- id: "gemini-2.5-pro-preview-05-06",
4392
- name: "Gemini 2.5 Pro Preview 05-06",
4393
- api: "google-generative-ai",
4394
- provider: "google",
4395
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4396
- reasoning: true,
4397
- input: ["text", "image"],
4398
- cost: {
4399
- input: 1.25,
4400
- output: 10,
4401
- cacheRead: 0.31,
4167
+ cost: {
4168
+ input: 0.1,
4169
+ output: 0.4,
4170
+ cacheRead: 0.01,
4402
4171
  cacheWrite: 0,
4403
4172
  },
4404
4173
  contextWindow: 1048576,
4405
4174
  maxTokens: 65536,
4406
4175
  },
4407
- "gemini-2.5-pro-preview-06-05": {
4408
- id: "gemini-2.5-pro-preview-06-05",
4409
- name: "Gemini 2.5 Pro Preview 06-05",
4176
+ "gemini-2.5-pro": {
4177
+ id: "gemini-2.5-pro",
4178
+ name: "Gemini 2.5 Pro",
4410
4179
  api: "google-generative-ai",
4411
4180
  provider: "google",
4412
4181
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4415,7 +4184,7 @@ export const MODELS = {
4415
4184
  cost: {
4416
4185
  input: 1.25,
4417
4186
  output: 10,
4418
- cacheRead: 0.31,
4187
+ cacheRead: 0.125,
4419
4188
  cacheWrite: 0,
4420
4189
  },
4421
4190
  contextWindow: 1048576,
@@ -4454,8 +4223,8 @@ export const MODELS = {
4454
4223
  cacheRead: 0.2,
4455
4224
  cacheWrite: 0,
4456
4225
  },
4457
- contextWindow: 1000000,
4458
- maxTokens: 64000,
4226
+ contextWindow: 1048576,
4227
+ maxTokens: 65536,
4459
4228
  },
4460
4229
  "gemini-3.1-flash-lite": {
4461
4230
  id: "gemini-3.1-flash-lite",
@@ -4581,60 +4350,9 @@ export const MODELS = {
4581
4350
  contextWindow: 1048576,
4582
4351
  maxTokens: 65536,
4583
4352
  },
4584
- "gemini-live-2.5-flash": {
4585
- id: "gemini-live-2.5-flash",
4586
- name: "Gemini Live 2.5 Flash",
4587
- api: "google-generative-ai",
4588
- provider: "google",
4589
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4590
- reasoning: true,
4591
- input: ["text", "image"],
4592
- cost: {
4593
- input: 0.5,
4594
- output: 2,
4595
- cacheRead: 0,
4596
- cacheWrite: 0,
4597
- },
4598
- contextWindow: 128000,
4599
- maxTokens: 8000,
4600
- },
4601
- "gemini-live-2.5-flash-preview-native-audio": {
4602
- id: "gemini-live-2.5-flash-preview-native-audio",
4603
- name: "Gemini Live 2.5 Flash Preview Native Audio",
4604
- api: "google-generative-ai",
4605
- provider: "google",
4606
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4607
- reasoning: true,
4608
- input: ["text"],
4609
- cost: {
4610
- input: 0.5,
4611
- output: 2,
4612
- cacheRead: 0,
4613
- cacheWrite: 0,
4614
- },
4615
- contextWindow: 131072,
4616
- maxTokens: 65536,
4617
- },
4618
- "gemma-3-27b-it": {
4619
- id: "gemma-3-27b-it",
4620
- name: "Gemma 3 27B",
4621
- api: "google-generative-ai",
4622
- provider: "google",
4623
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4624
- reasoning: false,
4625
- input: ["text", "image"],
4626
- cost: {
4627
- input: 0,
4628
- output: 0,
4629
- cacheRead: 0,
4630
- cacheWrite: 0,
4631
- },
4632
- contextWindow: 131072,
4633
- maxTokens: 8192,
4634
- },
4635
4353
  "gemma-4-26b-a4b-it": {
4636
4354
  id: "gemma-4-26b-a4b-it",
4637
- name: "Gemma 4 26B",
4355
+ name: "Gemma 4 26B A4B IT",
4638
4356
  api: "google-generative-ai",
4639
4357
  provider: "google",
4640
4358
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4647,12 +4365,12 @@ export const MODELS = {
4647
4365
  cacheRead: 0,
4648
4366
  cacheWrite: 0,
4649
4367
  },
4650
- contextWindow: 256000,
4651
- maxTokens: 8192,
4368
+ contextWindow: 262144,
4369
+ maxTokens: 32768,
4652
4370
  },
4653
4371
  "gemma-4-31b-it": {
4654
4372
  id: "gemma-4-31b-it",
4655
- name: "Gemma 4 31B",
4373
+ name: "Gemma 4 31B IT",
4656
4374
  api: "google-generative-ai",
4657
4375
  provider: "google",
4658
4376
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4665,8 +4383,8 @@ export const MODELS = {
4665
4383
  cacheRead: 0,
4666
4384
  cacheWrite: 0,
4667
4385
  },
4668
- contextWindow: 256000,
4669
- maxTokens: 8192,
4386
+ contextWindow: 262144,
4387
+ maxTokens: 32768,
4670
4388
  },
4671
4389
  },
4672
4390
  "google-vertex": {
@@ -5112,7 +4830,7 @@ export const MODELS = {
5112
4830
  cost: {
5113
4831
  input: 1,
5114
4832
  output: 3,
5115
- cacheRead: 0,
4833
+ cacheRead: 0.5,
5116
4834
  cacheWrite: 0,
5117
4835
  },
5118
4836
  contextWindow: 262144,
@@ -5129,7 +4847,7 @@ export const MODELS = {
5129
4847
  cost: {
5130
4848
  input: 0.15,
5131
4849
  output: 0.6,
5132
- cacheRead: 0,
4850
+ cacheRead: 0.075,
5133
4851
  cacheWrite: 0,
5134
4852
  },
5135
4853
  contextWindow: 131072,
@@ -5146,7 +4864,7 @@ export const MODELS = {
5146
4864
  cost: {
5147
4865
  input: 0.075,
5148
4866
  output: 0.3,
5149
- cacheRead: 0,
4867
+ cacheRead: 0.0375,
5150
4868
  cacheWrite: 0,
5151
4869
  },
5152
4870
  contextWindow: 131072,
@@ -5432,9 +5150,9 @@ export const MODELS = {
5432
5150
  reasoning: true,
5433
5151
  input: ["text"],
5434
5152
  cost: {
5435
- input: 1.74,
5436
- output: 3.48,
5437
- cacheRead: 0.145,
5153
+ input: 0.435,
5154
+ output: 0.87,
5155
+ cacheRead: 0.003625,
5438
5156
  cacheWrite: 0,
5439
5157
  },
5440
5158
  contextWindow: 1048576,
@@ -6527,7 +6245,7 @@ export const MODELS = {
6527
6245
  cost: {
6528
6246
  input: 0.1,
6529
6247
  output: 0.4,
6530
- cacheRead: 0.03,
6248
+ cacheRead: 0.025,
6531
6249
  cacheWrite: 0,
6532
6250
  },
6533
6251
  contextWindow: 1047576,
@@ -6612,7 +6330,7 @@ export const MODELS = {
6612
6330
  cost: {
6613
6331
  input: 0.15,
6614
6332
  output: 0.6,
6615
- cacheRead: 0.08,
6333
+ cacheRead: 0.075,
6616
6334
  cacheWrite: 0,
6617
6335
  },
6618
6336
  contextWindow: 128000,
@@ -6738,7 +6456,7 @@ export const MODELS = {
6738
6456
  cost: {
6739
6457
  input: 1.25,
6740
6458
  output: 10,
6741
- cacheRead: 0.13,
6459
+ cacheRead: 0.125,
6742
6460
  cacheWrite: 0,
6743
6461
  },
6744
6462
  contextWindow: 400000,
@@ -7163,7 +6881,7 @@ export const MODELS = {
7163
6881
  cost: {
7164
6882
  input: 1.1,
7165
6883
  output: 4.4,
7166
- cacheRead: 0.28,
6884
+ cacheRead: 0.275,
7167
6885
  cacheWrite: 0,
7168
6886
  },
7169
6887
  contextWindow: 200000,
@@ -7239,7 +6957,7 @@ export const MODELS = {
7239
6957
  cacheRead: 0.175,
7240
6958
  cacheWrite: 0,
7241
6959
  },
7242
- contextWindow: 272000,
6960
+ contextWindow: 128000,
7243
6961
  maxTokens: 128000,
7244
6962
  },
7245
6963
  "gpt-5.4": {
@@ -7313,7 +7031,7 @@ export const MODELS = {
7313
7031
  cacheWrite: 0,
7314
7032
  },
7315
7033
  contextWindow: 200000,
7316
- maxTokens: 128000,
7034
+ maxTokens: 32000,
7317
7035
  },
7318
7036
  "claude-haiku-4-5": {
7319
7037
  id: "claude-haiku-4-5",
@@ -7372,6 +7090,7 @@ export const MODELS = {
7372
7090
  api: "anthropic-messages",
7373
7091
  provider: "opencode",
7374
7092
  baseUrl: "https://opencode.ai/zen",
7093
+ compat: { "forceAdaptiveThinking": true },
7375
7094
  reasoning: true,
7376
7095
  thinkingLevelMap: { "xhigh": "max" },
7377
7096
  input: ["text", "image"],
@@ -7390,6 +7109,7 @@ export const MODELS = {
7390
7109
  api: "anthropic-messages",
7391
7110
  provider: "opencode",
7392
7111
  baseUrl: "https://opencode.ai/zen",
7112
+ compat: { "forceAdaptiveThinking": true },
7393
7113
  reasoning: true,
7394
7114
  thinkingLevelMap: { "xhigh": "xhigh" },
7395
7115
  input: ["text", "image"],
@@ -7442,6 +7162,7 @@ export const MODELS = {
7442
7162
  api: "anthropic-messages",
7443
7163
  provider: "opencode",
7444
7164
  baseUrl: "https://opencode.ai/zen",
7165
+ compat: { "forceAdaptiveThinking": true },
7445
7166
  reasoning: true,
7446
7167
  input: ["text", "image"],
7447
7168
  cost: {
@@ -7848,6 +7569,23 @@ export const MODELS = {
7848
7569
  contextWindow: 1050000,
7849
7570
  maxTokens: 128000,
7850
7571
  },
7572
+ "grok-build-0.1": {
7573
+ id: "grok-build-0.1",
7574
+ name: "Grok Build 0.1",
7575
+ api: "openai-completions",
7576
+ provider: "opencode",
7577
+ baseUrl: "https://opencode.ai/zen/v1",
7578
+ reasoning: true,
7579
+ input: ["text", "image"],
7580
+ cost: {
7581
+ input: 1,
7582
+ output: 2,
7583
+ cacheRead: 0.2,
7584
+ cacheWrite: 0,
7585
+ },
7586
+ contextWindow: 256000,
7587
+ maxTokens: 256000,
7588
+ },
7851
7589
  "kimi-k2.5": {
7852
7590
  id: "kimi-k2.5",
7853
7591
  name: "Kimi K2.5",
@@ -7882,35 +7620,35 @@ export const MODELS = {
7882
7620
  contextWindow: 262144,
7883
7621
  maxTokens: 65536,
7884
7622
  },
7885
- "minimax-m2.5": {
7886
- id: "minimax-m2.5",
7887
- name: "MiniMax M2.5",
7623
+ "mimo-v2.5-free": {
7624
+ id: "mimo-v2.5-free",
7625
+ name: "MiMo V2.5 Free",
7888
7626
  api: "openai-completions",
7889
7627
  provider: "opencode",
7890
7628
  baseUrl: "https://opencode.ai/zen/v1",
7891
7629
  reasoning: true,
7892
- input: ["text"],
7630
+ input: ["text", "image"],
7893
7631
  cost: {
7894
- input: 0.3,
7895
- output: 1.2,
7896
- cacheRead: 0.06,
7632
+ input: 0,
7633
+ output: 0,
7634
+ cacheRead: 0,
7897
7635
  cacheWrite: 0,
7898
7636
  },
7899
- contextWindow: 204800,
7900
- maxTokens: 131072,
7637
+ contextWindow: 1000000,
7638
+ maxTokens: 128000,
7901
7639
  },
7902
- "minimax-m2.5-free": {
7903
- id: "minimax-m2.5-free",
7904
- name: "MiniMax M2.5 Free",
7905
- api: "anthropic-messages",
7640
+ "minimax-m2.5": {
7641
+ id: "minimax-m2.5",
7642
+ name: "MiniMax M2.5",
7643
+ api: "openai-completions",
7906
7644
  provider: "opencode",
7907
- baseUrl: "https://opencode.ai/zen",
7645
+ baseUrl: "https://opencode.ai/zen/v1",
7908
7646
  reasoning: true,
7909
7647
  input: ["text"],
7910
7648
  cost: {
7911
- input: 0,
7912
- output: 0,
7913
- cacheRead: 0,
7649
+ input: 0.3,
7650
+ output: 1.2,
7651
+ cacheRead: 0.06,
7914
7652
  cacheWrite: 0,
7915
7653
  },
7916
7654
  contextWindow: 204800,
@@ -7984,23 +7722,6 @@ export const MODELS = {
7984
7722
  contextWindow: 262144,
7985
7723
  maxTokens: 65536,
7986
7724
  },
7987
- "qwen3.6-plus-free": {
7988
- id: "qwen3.6-plus-free",
7989
- name: "Qwen3.6 Plus Free",
7990
- api: "anthropic-messages",
7991
- provider: "opencode",
7992
- baseUrl: "https://opencode.ai/zen",
7993
- reasoning: true,
7994
- input: ["text", "image"],
7995
- cost: {
7996
- input: 0,
7997
- output: 0,
7998
- cacheRead: 0,
7999
- cacheWrite: 0,
8000
- },
8001
- contextWindow: 262144,
8002
- maxTokens: 65536,
8003
- },
8004
7725
  },
8005
7726
  "opencode-go": {
8006
7727
  "deepseek-v4-flash": {
@@ -8118,9 +7839,9 @@ export const MODELS = {
8118
7839
  reasoning: true,
8119
7840
  input: ["text", "image"],
8120
7841
  cost: {
8121
- input: 0.4,
8122
- output: 2,
8123
- cacheRead: 0.08,
7842
+ input: 0.14,
7843
+ output: 0.28,
7844
+ cacheRead: 0.0028,
8124
7845
  cacheWrite: 0,
8125
7846
  },
8126
7847
  contextWindow: 1000000,
@@ -8135,9 +7856,9 @@ export const MODELS = {
8135
7856
  reasoning: true,
8136
7857
  input: ["text"],
8137
7858
  cost: {
8138
- input: 1,
8139
- output: 3,
8140
- cacheRead: 0.2,
7859
+ input: 1.74,
7860
+ output: 3.48,
7861
+ cacheRead: 0.0145,
8141
7862
  cacheWrite: 0,
8142
7863
  },
8143
7864
  contextWindow: 1048576,
@@ -8213,6 +7934,23 @@ export const MODELS = {
8213
7934
  contextWindow: 262144,
8214
7935
  maxTokens: 65536,
8215
7936
  },
7937
+ "qwen3.7-max": {
7938
+ id: "qwen3.7-max",
7939
+ name: "Qwen3.7 Max",
7940
+ api: "anthropic-messages",
7941
+ provider: "opencode-go",
7942
+ baseUrl: "https://opencode.ai/zen/go",
7943
+ reasoning: true,
7944
+ input: ["text"],
7945
+ cost: {
7946
+ input: 2.5,
7947
+ output: 7.5,
7948
+ cacheRead: 0.5,
7949
+ cacheWrite: 3.125,
7950
+ },
7951
+ contextWindow: 1000000,
7952
+ maxTokens: 65536,
7953
+ },
8216
7954
  },
8217
7955
  "openrouter": {
8218
7956
  "ai21/jamba-large-1.7": {
@@ -8232,23 +7970,6 @@ export const MODELS = {
8232
7970
  contextWindow: 256000,
8233
7971
  maxTokens: 4096,
8234
7972
  },
8235
- "alibaba/tongyi-deepresearch-30b-a3b": {
8236
- id: "alibaba/tongyi-deepresearch-30b-a3b",
8237
- name: "Tongyi DeepResearch 30B A3B",
8238
- api: "openai-completions",
8239
- provider: "openrouter",
8240
- baseUrl: "https://openrouter.ai/api/v1",
8241
- reasoning: true,
8242
- input: ["text"],
8243
- cost: {
8244
- input: 0.09,
8245
- output: 0.44999999999999996,
8246
- cacheRead: 0.09,
8247
- cacheWrite: 0,
8248
- },
8249
- contextWindow: 131072,
8250
- maxTokens: 131072,
8251
- },
8252
7973
  "amazon/nova-2-lite-v1": {
8253
7974
  id: "amazon/nova-2-lite-v1",
8254
7975
  name: "Amazon: Nova 2 Lite",
@@ -8559,23 +8280,6 @@ export const MODELS = {
8559
8280
  contextWindow: 1000000,
8560
8281
  maxTokens: 128000,
8561
8282
  },
8562
- "arcee-ai/trinity-large-preview": {
8563
- id: "arcee-ai/trinity-large-preview",
8564
- name: "Arcee AI: Trinity Large Preview",
8565
- api: "openai-completions",
8566
- provider: "openrouter",
8567
- baseUrl: "https://openrouter.ai/api/v1",
8568
- reasoning: false,
8569
- input: ["text"],
8570
- cost: {
8571
- input: 0.15,
8572
- output: 0.44999999999999996,
8573
- cacheRead: 0,
8574
- cacheWrite: 0,
8575
- },
8576
- contextWindow: 131000,
8577
- maxTokens: 4096,
8578
- },
8579
8283
  "arcee-ai/trinity-large-thinking": {
8580
8284
  id: "arcee-ai/trinity-large-thinking",
8581
8285
  name: "Arcee AI: Trinity Large Thinking",
@@ -8593,23 +8297,6 @@ export const MODELS = {
8593
8297
  contextWindow: 262144,
8594
8298
  maxTokens: 262144,
8595
8299
  },
8596
- "arcee-ai/trinity-large-thinking:free": {
8597
- id: "arcee-ai/trinity-large-thinking:free",
8598
- name: "Arcee AI: Trinity Large Thinking (free)",
8599
- api: "openai-completions",
8600
- provider: "openrouter",
8601
- baseUrl: "https://openrouter.ai/api/v1",
8602
- reasoning: true,
8603
- input: ["text"],
8604
- cost: {
8605
- input: 0,
8606
- output: 0,
8607
- cacheRead: 0,
8608
- cacheWrite: 0,
8609
- },
8610
- contextWindow: 262144,
8611
- maxTokens: 80000,
8612
- },
8613
8300
  "arcee-ai/trinity-mini": {
8614
8301
  id: "arcee-ai/trinity-mini",
8615
8302
  name: "Arcee AI: Trinity Mini",
@@ -8661,23 +8348,6 @@ export const MODELS = {
8661
8348
  contextWindow: 2000000,
8662
8349
  maxTokens: 30000,
8663
8350
  },
8664
- "baidu/cobuddy:free": {
8665
- id: "baidu/cobuddy:free",
8666
- name: "Baidu Qianfan: CoBuddy (free)",
8667
- api: "openai-completions",
8668
- provider: "openrouter",
8669
- baseUrl: "https://openrouter.ai/api/v1",
8670
- reasoning: true,
8671
- input: ["text"],
8672
- cost: {
8673
- input: 0,
8674
- output: 0,
8675
- cacheRead: 0,
8676
- cacheWrite: 0,
8677
- },
8678
- contextWindow: 131072,
8679
- maxTokens: 65536,
8680
- },
8681
8351
  "baidu/ernie-4.5-21b-a3b": {
8682
8352
  id: "baidu/ernie-4.5-21b-a3b",
8683
8353
  name: "Baidu: ERNIE 4.5 21B A3B",
@@ -8823,13 +8493,13 @@ export const MODELS = {
8823
8493
  reasoning: false,
8824
8494
  input: ["text"],
8825
8495
  cost: {
8826
- input: 0.32,
8827
- output: 0.8899999999999999,
8496
+ input: 0.2288,
8497
+ output: 0.9144,
8828
8498
  cacheRead: 0,
8829
8499
  cacheWrite: 0,
8830
8500
  },
8831
- contextWindow: 163840,
8832
- maxTokens: 16384,
8501
+ contextWindow: 131072,
8502
+ maxTokens: 16000,
8833
8503
  },
8834
8504
  "deepseek/deepseek-chat-v3-0324": {
8835
8505
  id: "deepseek/deepseek-chat-v3-0324",
@@ -8961,13 +8631,13 @@ export const MODELS = {
8961
8631
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8962
8632
  input: ["text"],
8963
8633
  cost: {
8964
- input: 0.112,
8965
- output: 0.224,
8966
- cacheRead: 0.022,
8634
+ input: 0.09999999999999999,
8635
+ output: 0.19999999999999998,
8636
+ cacheRead: 0.02,
8967
8637
  cacheWrite: 0,
8968
8638
  },
8969
8639
  contextWindow: 1048576,
8970
- maxTokens: 4096,
8640
+ maxTokens: 16384,
8971
8641
  },
8972
8642
  "deepseek/deepseek-v4-flash:free": {
8973
8643
  id: "deepseek/deepseek-v4-flash:free",
@@ -9408,9 +9078,9 @@ export const MODELS = {
9408
9078
  reasoning: false,
9409
9079
  input: ["text"],
9410
9080
  cost: {
9411
- input: 0.3,
9412
- output: 2.5,
9413
- cacheRead: 0.06,
9081
+ input: 0.075,
9082
+ output: 0.625,
9083
+ cacheRead: 0.015,
9414
9084
  cacheWrite: 0,
9415
9085
  },
9416
9086
  contextWindow: 262144,
@@ -10096,6 +9766,23 @@ export const MODELS = {
10096
9766
  contextWindow: 262144,
10097
9767
  maxTokens: 262142,
10098
9768
  },
9769
+ "moonshotai/kimi-k2.6:free": {
9770
+ id: "moonshotai/kimi-k2.6:free",
9771
+ name: "MoonshotAI: Kimi K2.6 (free)",
9772
+ api: "openai-completions",
9773
+ provider: "openrouter",
9774
+ baseUrl: "https://openrouter.ai/api/v1",
9775
+ reasoning: true,
9776
+ input: ["text", "image"],
9777
+ cost: {
9778
+ input: 0,
9779
+ output: 0,
9780
+ cacheRead: 0,
9781
+ cacheWrite: 0,
9782
+ },
9783
+ contextWindow: 262144,
9784
+ maxTokens: 4096,
9785
+ },
10099
9786
  "nex-agi/deepseek-v3.1-nex-n1": {
10100
9787
  id: "nex-agi/deepseek-v3.1-nex-n1",
10101
9788
  name: "Nex AGI: DeepSeek V3.1 Nex N1",
@@ -10685,11 +10372,11 @@ export const MODELS = {
10685
10372
  cost: {
10686
10373
  input: 1.25,
10687
10374
  output: 10,
10688
- cacheRead: 0.125,
10375
+ cacheRead: 0.13,
10689
10376
  cacheWrite: 0,
10690
10377
  },
10691
10378
  contextWindow: 128000,
10692
- maxTokens: 16384,
10379
+ maxTokens: 32000,
10693
10380
  },
10694
10381
  "openai/gpt-5.1-codex": {
10695
10382
  id: "openai/gpt-5.1-codex",
@@ -10702,7 +10389,7 @@ export const MODELS = {
10702
10389
  cost: {
10703
10390
  input: 1.25,
10704
10391
  output: 10,
10705
- cacheRead: 0.125,
10392
+ cacheRead: 0.13,
10706
10393
  cacheWrite: 0,
10707
10394
  },
10708
10395
  contextWindow: 400000,
@@ -10736,11 +10423,11 @@ export const MODELS = {
10736
10423
  cost: {
10737
10424
  input: 0.25,
10738
10425
  output: 2,
10739
- cacheRead: 0.03,
10426
+ cacheRead: 0.024999999999999998,
10740
10427
  cacheWrite: 0,
10741
10428
  },
10742
10429
  contextWindow: 400000,
10743
- maxTokens: 128000,
10430
+ maxTokens: 100000,
10744
10431
  },
10745
10432
  "openai/gpt-5.2": {
10746
10433
  id: "openai/gpt-5.2",
@@ -10776,7 +10463,7 @@ export const MODELS = {
10776
10463
  cacheWrite: 0,
10777
10464
  },
10778
10465
  contextWindow: 128000,
10779
- maxTokens: 32000,
10466
+ maxTokens: 16384,
10780
10467
  },
10781
10468
  "openai/gpt-5.2-codex": {
10782
10469
  id: "openai/gpt-5.2-codex",
@@ -11312,8 +10999,8 @@ export const MODELS = {
11312
10999
  cacheRead: 0,
11313
11000
  cacheWrite: 0,
11314
11001
  },
11315
- contextWindow: 131072,
11316
- maxTokens: 8192,
11002
+ contextWindow: 262144,
11003
+ maxTokens: 32768,
11317
11004
  },
11318
11005
  "poolside/laguna-xs.2:free": {
11319
11006
  id: "poolside/laguna-xs.2:free",
@@ -11329,8 +11016,8 @@ export const MODELS = {
11329
11016
  cacheRead: 0,
11330
11017
  cacheWrite: 0,
11331
11018
  },
11332
- contextWindow: 131072,
11333
- maxTokens: 8192,
11019
+ contextWindow: 262144,
11020
+ maxTokens: 32768,
11334
11021
  },
11335
11022
  "prime-intellect/intellect-3": {
11336
11023
  id: "prime-intellect/intellect-3",
@@ -11412,7 +11099,7 @@ export const MODELS = {
11412
11099
  input: 0.26,
11413
11100
  output: 0.78,
11414
11101
  cacheRead: 0,
11415
- cacheWrite: 0.325,
11102
+ cacheWrite: 0,
11416
11103
  },
11417
11104
  contextWindow: 1000000,
11418
11105
  maxTokens: 32768,
@@ -11908,7 +11595,7 @@ export const MODELS = {
11908
11595
  cacheWrite: 0,
11909
11596
  },
11910
11597
  contextWindow: 262144,
11911
- maxTokens: 65536,
11598
+ maxTokens: 262144,
11912
11599
  },
11913
11600
  "qwen/qwen3.5-27b": {
11914
11601
  id: "qwen/qwen3.5-27b",
@@ -11955,7 +11642,7 @@ export const MODELS = {
11955
11642
  cost: {
11956
11643
  input: 0.39,
11957
11644
  output: 2.34,
11958
- cacheRead: 0.195,
11645
+ cacheRead: 0,
11959
11646
  cacheWrite: 0,
11960
11647
  },
11961
11648
  contextWindow: 262144,
@@ -11990,7 +11677,7 @@ export const MODELS = {
11990
11677
  input: 0.065,
11991
11678
  output: 0.26,
11992
11679
  cacheRead: 0,
11993
- cacheWrite: 0.08125,
11680
+ cacheWrite: 0,
11994
11681
  },
11995
11682
  contextWindow: 1000000,
11996
11683
  maxTokens: 65536,
@@ -12007,7 +11694,7 @@ export const MODELS = {
12007
11694
  input: 0.26,
12008
11695
  output: 1.56,
12009
11696
  cacheRead: 0,
12010
- cacheWrite: 0.325,
11697
+ cacheWrite: 0,
12011
11698
  },
12012
11699
  contextWindow: 1000000,
12013
11700
  maxTokens: 65536,
@@ -12024,7 +11711,7 @@ export const MODELS = {
12024
11711
  input: 0.3,
12025
11712
  output: 1.7999999999999998,
12026
11713
  cacheRead: 0,
12027
- cacheWrite: 0,
11714
+ cacheWrite: 0.375,
12028
11715
  },
12029
11716
  contextWindow: 1000000,
12030
11717
  maxTokens: 65536,
@@ -12038,13 +11725,13 @@ export const MODELS = {
12038
11725
  reasoning: true,
12039
11726
  input: ["text", "image"],
12040
11727
  cost: {
12041
- input: 0.32,
11728
+ input: 0.29,
12042
11729
  output: 3.1999999999999997,
12043
11730
  cacheRead: 0,
12044
11731
  cacheWrite: 0,
12045
11732
  },
12046
11733
  contextWindow: 262144,
12047
- maxTokens: 81920,
11734
+ maxTokens: 262140,
12048
11735
  },
12049
11736
  "qwen/qwen3.6-35b-a3b": {
12050
11737
  id: "qwen/qwen3.6-35b-a3b",
@@ -12055,13 +11742,13 @@ export const MODELS = {
12055
11742
  reasoning: true,
12056
11743
  input: ["text", "image"],
12057
11744
  cost: {
12058
- input: 0.149,
11745
+ input: 0.14,
12059
11746
  output: 1,
12060
11747
  cacheRead: 0,
12061
11748
  cacheWrite: 0,
12062
11749
  },
12063
11750
  contextWindow: 262144,
12064
- maxTokens: 4096,
11751
+ maxTokens: 262140,
12065
11752
  },
12066
11753
  "qwen/qwen3.6-flash": {
12067
11754
  id: "qwen/qwen3.6-flash",
@@ -12114,6 +11801,23 @@ export const MODELS = {
12114
11801
  contextWindow: 1000000,
12115
11802
  maxTokens: 65536,
12116
11803
  },
11804
+ "qwen/qwen3.7-max": {
11805
+ id: "qwen/qwen3.7-max",
11806
+ name: "Qwen: Qwen3.7 Max",
11807
+ api: "openai-completions",
11808
+ provider: "openrouter",
11809
+ baseUrl: "https://openrouter.ai/api/v1",
11810
+ reasoning: true,
11811
+ input: ["text"],
11812
+ cost: {
11813
+ input: 1.25,
11814
+ output: 3.75,
11815
+ cacheRead: 0.25,
11816
+ cacheWrite: 1.5625,
11817
+ },
11818
+ contextWindow: 1000000,
11819
+ maxTokens: 65536,
11820
+ },
12117
11821
  "rekaai/reka-edge": {
12118
11822
  id: "rekaai/reka-edge",
12119
11823
  name: "Reka Edge",
@@ -12191,13 +11895,13 @@ export const MODELS = {
12191
11895
  reasoning: true,
12192
11896
  input: ["text"],
12193
11897
  cost: {
12194
- input: 0.09999999999999999,
11898
+ input: 0.09,
12195
11899
  output: 0.3,
12196
- cacheRead: 0,
11900
+ cacheRead: 0.02,
12197
11901
  cacheWrite: 0,
12198
11902
  },
12199
11903
  contextWindow: 262144,
12200
- maxTokens: 65536,
11904
+ maxTokens: 16384,
12201
11905
  },
12202
11906
  "tencent/hy3-preview": {
12203
11907
  id: "tencent/hy3-preview",
@@ -12301,6 +12005,23 @@ export const MODELS = {
12301
12005
  contextWindow: 1000000,
12302
12006
  maxTokens: 4096,
12303
12007
  },
12008
+ "x-ai/grok-build-0.1": {
12009
+ id: "x-ai/grok-build-0.1",
12010
+ name: "xAI: Grok Build 0.1",
12011
+ api: "openai-completions",
12012
+ provider: "openrouter",
12013
+ baseUrl: "https://openrouter.ai/api/v1",
12014
+ reasoning: true,
12015
+ input: ["text", "image"],
12016
+ cost: {
12017
+ input: 1,
12018
+ output: 2,
12019
+ cacheRead: 0.19999999999999998,
12020
+ cacheWrite: 0,
12021
+ },
12022
+ contextWindow: 256000,
12023
+ maxTokens: 4096,
12024
+ },
12304
12025
  "xiaomi/mimo-v2-flash": {
12305
12026
  id: "xiaomi/mimo-v2-flash",
12306
12027
  name: "Xiaomi: MiMo-V2-Flash",
@@ -12361,9 +12082,9 @@ export const MODELS = {
12361
12082
  reasoning: true,
12362
12083
  input: ["text", "image"],
12363
12084
  cost: {
12364
- input: 0.39999999999999997,
12365
- output: 2,
12366
- cacheRead: 0.08,
12085
+ input: 0.14,
12086
+ output: 0.28,
12087
+ cacheRead: 0.0028,
12367
12088
  cacheWrite: 0,
12368
12089
  },
12369
12090
  contextWindow: 1048576,
@@ -12378,13 +12099,13 @@ export const MODELS = {
12378
12099
  reasoning: true,
12379
12100
  input: ["text"],
12380
12101
  cost: {
12381
- input: 1,
12382
- output: 3,
12383
- cacheRead: 0.19999999999999998,
12102
+ input: 0.435,
12103
+ output: 0.87,
12104
+ cacheRead: 0.0036,
12384
12105
  cacheWrite: 0,
12385
12106
  },
12386
12107
  contextWindow: 1048576,
12387
- maxTokens: 16384,
12108
+ maxTokens: 131072,
12388
12109
  },
12389
12110
  "z-ai/glm-4-32b": {
12390
12111
  id: "z-ai/glm-4-32b",
@@ -12429,13 +12150,13 @@ export const MODELS = {
12429
12150
  reasoning: true,
12430
12151
  input: ["text"],
12431
12152
  cost: {
12432
- input: 0.13,
12433
- output: 0.85,
12434
- cacheRead: 0.024999999999999998,
12153
+ input: 0.125,
12154
+ output: 0.84,
12155
+ cacheRead: 0,
12435
12156
  cacheWrite: 0,
12436
12157
  },
12437
12158
  contextWindow: 131072,
12438
- maxTokens: 98304,
12159
+ maxTokens: 131070,
12439
12160
  },
12440
12161
  "z-ai/glm-4.5-air:free": {
12441
12162
  id: "z-ai/glm-4.5-air:free",
@@ -12582,13 +12303,13 @@ export const MODELS = {
12582
12303
  reasoning: true,
12583
12304
  input: ["text"],
12584
12305
  cost: {
12585
- input: 0,
12586
- output: 0,
12587
- cacheRead: 0,
12306
+ input: 0.98,
12307
+ output: 3.08,
12308
+ cacheRead: 0.182,
12588
12309
  cacheWrite: 0,
12589
12310
  },
12590
- contextWindow: 202800,
12591
- maxTokens: 202800,
12311
+ contextWindow: 202752,
12312
+ maxTokens: 4096,
12592
12313
  },
12593
12314
  "z-ai/glm-5v-turbo": {
12594
12315
  id: "z-ai/glm-5v-turbo",
@@ -12877,6 +12598,25 @@ export const MODELS = {
12877
12598
  contextWindow: 1000000,
12878
12599
  maxTokens: 500000,
12879
12600
  },
12601
+ "Qwen/Qwen3.7-Max": {
12602
+ id: "Qwen/Qwen3.7-Max",
12603
+ name: "Qwen3.7 Max",
12604
+ api: "openai-completions",
12605
+ provider: "together",
12606
+ baseUrl: "https://api.together.ai/v1",
12607
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12608
+ reasoning: true,
12609
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12610
+ input: ["text"],
12611
+ cost: {
12612
+ input: 2.5,
12613
+ output: 7.5,
12614
+ cacheRead: 0,
12615
+ cacheWrite: 0,
12616
+ },
12617
+ contextWindow: 1000000,
12618
+ maxTokens: 500000,
12619
+ },
12880
12620
  "deepseek-ai/DeepSeek-V3": {
12881
12621
  id: "deepseek-ai/DeepSeek-V3",
12882
12622
  name: "DeepSeek V3",
@@ -13373,6 +13113,23 @@ export const MODELS = {
13373
13113
  contextWindow: 1000000,
13374
13114
  maxTokens: 64000,
13375
13115
  },
13116
+ "alibaba/qwen3.7-max": {
13117
+ id: "alibaba/qwen3.7-max",
13118
+ name: "Qwen 3.7 Max",
13119
+ api: "anthropic-messages",
13120
+ provider: "vercel-ai-gateway",
13121
+ baseUrl: "https://ai-gateway.vercel.sh",
13122
+ reasoning: true,
13123
+ input: ["text", "image"],
13124
+ cost: {
13125
+ input: 1.25,
13126
+ output: 3.75,
13127
+ cacheRead: 0.25,
13128
+ cacheWrite: 1.5625,
13129
+ },
13130
+ contextWindow: 991000,
13131
+ maxTokens: 64000,
13132
+ },
13376
13133
  "anthropic/claude-3-haiku": {
13377
13134
  id: "anthropic/claude-3-haiku",
13378
13135
  name: "Claude 3 Haiku",
@@ -13481,6 +13238,7 @@ export const MODELS = {
13481
13238
  api: "anthropic-messages",
13482
13239
  provider: "vercel-ai-gateway",
13483
13240
  baseUrl: "https://ai-gateway.vercel.sh",
13241
+ compat: { "forceAdaptiveThinking": true },
13484
13242
  reasoning: true,
13485
13243
  thinkingLevelMap: { "xhigh": "max" },
13486
13244
  input: ["text", "image"],
@@ -13499,6 +13257,7 @@ export const MODELS = {
13499
13257
  api: "anthropic-messages",
13500
13258
  provider: "vercel-ai-gateway",
13501
13259
  baseUrl: "https://ai-gateway.vercel.sh",
13260
+ compat: { "forceAdaptiveThinking": true },
13502
13261
  reasoning: true,
13503
13262
  thinkingLevelMap: { "xhigh": "xhigh" },
13504
13263
  input: ["text", "image"],
@@ -13551,6 +13310,7 @@ export const MODELS = {
13551
13310
  api: "anthropic-messages",
13552
13311
  provider: "vercel-ai-gateway",
13553
13312
  baseUrl: "https://ai-gateway.vercel.sh",
13313
+ compat: { "forceAdaptiveThinking": true },
13554
13314
  reasoning: true,
13555
13315
  input: ["text", "image"],
13556
13316
  cost: {
@@ -14261,7 +14021,7 @@ export const MODELS = {
14261
14021
  },
14262
14022
  "minimax/minimax-m2.7": {
14263
14023
  id: "minimax/minimax-m2.7",
14264
- name: "Minimax M2.7",
14024
+ name: "MiniMax M2.7",
14265
14025
  api: "anthropic-messages",
14266
14026
  provider: "vercel-ai-gateway",
14267
14027
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -15444,6 +15204,23 @@ export const MODELS = {
15444
15204
  contextWindow: 1000000,
15445
15205
  maxTokens: 1000000,
15446
15206
  },
15207
+ "xai/grok-build-0.1": {
15208
+ id: "xai/grok-build-0.1",
15209
+ name: "Grok Build 0.1",
15210
+ api: "anthropic-messages",
15211
+ provider: "vercel-ai-gateway",
15212
+ baseUrl: "https://ai-gateway.vercel.sh",
15213
+ reasoning: true,
15214
+ input: ["text", "image"],
15215
+ cost: {
15216
+ input: 1,
15217
+ output: 2,
15218
+ cacheRead: 0.19999999999999998,
15219
+ cacheWrite: 0,
15220
+ },
15221
+ contextWindow: 256000,
15222
+ maxTokens: 256000,
15223
+ },
15447
15224
  "xiaomi/mimo-v2-flash": {
15448
15225
  id: "xiaomi/mimo-v2-flash",
15449
15226
  name: "MiMo V2 Flash",
@@ -15487,9 +15264,9 @@ export const MODELS = {
15487
15264
  reasoning: true,
15488
15265
  input: ["text", "image"],
15489
15266
  cost: {
15490
- input: 0.39999999999999997,
15491
- output: 2,
15492
- cacheRead: 0.08,
15267
+ input: 0.14,
15268
+ output: 0.28,
15269
+ cacheRead: 0.0028,
15493
15270
  cacheWrite: 0,
15494
15271
  },
15495
15272
  contextWindow: 1050000,
@@ -15504,9 +15281,9 @@ export const MODELS = {
15504
15281
  reasoning: true,
15505
15282
  input: ["text", "image"],
15506
15283
  cost: {
15507
- input: 1,
15508
- output: 3,
15509
- cacheRead: 0.19999999999999998,
15284
+ input: 0.435,
15285
+ output: 0.87,
15286
+ cacheRead: 0.0036,
15510
15287
  cacheWrite: 0,
15511
15288
  },
15512
15289
  contextWindow: 1050000,
@@ -15735,108 +15512,6 @@ export const MODELS = {
15735
15512
  },
15736
15513
  },
15737
15514
  "xai": {
15738
- "grok-2": {
15739
- id: "grok-2",
15740
- name: "Grok 2",
15741
- api: "openai-completions",
15742
- provider: "xai",
15743
- baseUrl: "https://api.x.ai/v1",
15744
- reasoning: false,
15745
- input: ["text"],
15746
- cost: {
15747
- input: 2,
15748
- output: 10,
15749
- cacheRead: 2,
15750
- cacheWrite: 0,
15751
- },
15752
- contextWindow: 131072,
15753
- maxTokens: 8192,
15754
- },
15755
- "grok-2-1212": {
15756
- id: "grok-2-1212",
15757
- name: "Grok 2 (1212)",
15758
- api: "openai-completions",
15759
- provider: "xai",
15760
- baseUrl: "https://api.x.ai/v1",
15761
- reasoning: false,
15762
- input: ["text"],
15763
- cost: {
15764
- input: 2,
15765
- output: 10,
15766
- cacheRead: 2,
15767
- cacheWrite: 0,
15768
- },
15769
- contextWindow: 131072,
15770
- maxTokens: 8192,
15771
- },
15772
- "grok-2-latest": {
15773
- id: "grok-2-latest",
15774
- name: "Grok 2 Latest",
15775
- api: "openai-completions",
15776
- provider: "xai",
15777
- baseUrl: "https://api.x.ai/v1",
15778
- reasoning: false,
15779
- input: ["text"],
15780
- cost: {
15781
- input: 2,
15782
- output: 10,
15783
- cacheRead: 2,
15784
- cacheWrite: 0,
15785
- },
15786
- contextWindow: 131072,
15787
- maxTokens: 8192,
15788
- },
15789
- "grok-2-vision": {
15790
- id: "grok-2-vision",
15791
- name: "Grok 2 Vision",
15792
- api: "openai-completions",
15793
- provider: "xai",
15794
- baseUrl: "https://api.x.ai/v1",
15795
- reasoning: false,
15796
- input: ["text", "image"],
15797
- cost: {
15798
- input: 2,
15799
- output: 10,
15800
- cacheRead: 2,
15801
- cacheWrite: 0,
15802
- },
15803
- contextWindow: 8192,
15804
- maxTokens: 4096,
15805
- },
15806
- "grok-2-vision-1212": {
15807
- id: "grok-2-vision-1212",
15808
- name: "Grok 2 Vision (1212)",
15809
- api: "openai-completions",
15810
- provider: "xai",
15811
- baseUrl: "https://api.x.ai/v1",
15812
- reasoning: false,
15813
- input: ["text", "image"],
15814
- cost: {
15815
- input: 2,
15816
- output: 10,
15817
- cacheRead: 2,
15818
- cacheWrite: 0,
15819
- },
15820
- contextWindow: 8192,
15821
- maxTokens: 4096,
15822
- },
15823
- "grok-2-vision-latest": {
15824
- id: "grok-2-vision-latest",
15825
- name: "Grok 2 Vision Latest",
15826
- api: "openai-completions",
15827
- provider: "xai",
15828
- baseUrl: "https://api.x.ai/v1",
15829
- reasoning: false,
15830
- input: ["text", "image"],
15831
- cost: {
15832
- input: 2,
15833
- output: 10,
15834
- cacheRead: 2,
15835
- cacheWrite: 0,
15836
- },
15837
- contextWindow: 8192,
15838
- maxTokens: 4096,
15839
- },
15840
15515
  "grok-3": {
15841
15516
  id: "grok-3",
15842
15517
  name: "Grok 3",
@@ -15880,8 +15555,8 @@ export const MODELS = {
15880
15555
  reasoning: false,
15881
15556
  input: ["text", "image"],
15882
15557
  cost: {
15883
- input: 2,
15884
- output: 6,
15558
+ input: 1.25,
15559
+ output: 2.5,
15885
15560
  cacheRead: 0.2,
15886
15561
  cacheWrite: 0,
15887
15562
  },
@@ -15897,8 +15572,8 @@ export const MODELS = {
15897
15572
  reasoning: true,
15898
15573
  input: ["text", "image"],
15899
15574
  cost: {
15900
- input: 2,
15901
- output: 6,
15575
+ input: 1.25,
15576
+ output: 2.5,
15902
15577
  cacheRead: 0.2,
15903
15578
  cacheWrite: 0,
15904
15579
  },
@@ -15922,22 +15597,22 @@ export const MODELS = {
15922
15597
  contextWindow: 1000000,
15923
15598
  maxTokens: 30000,
15924
15599
  },
15925
- "grok-beta": {
15926
- id: "grok-beta",
15927
- name: "Grok Beta",
15600
+ "grok-build-0.1": {
15601
+ id: "grok-build-0.1",
15602
+ name: "Grok Build 0.1",
15928
15603
  api: "openai-completions",
15929
15604
  provider: "xai",
15930
15605
  baseUrl: "https://api.x.ai/v1",
15931
- reasoning: false,
15932
- input: ["text"],
15606
+ reasoning: true,
15607
+ input: ["text", "image"],
15933
15608
  cost: {
15934
- input: 5,
15935
- output: 15,
15936
- cacheRead: 5,
15609
+ input: 1,
15610
+ output: 2,
15611
+ cacheRead: 0.2,
15937
15612
  cacheWrite: 0,
15938
15613
  },
15939
- contextWindow: 131072,
15940
- maxTokens: 4096,
15614
+ contextWindow: 256000,
15615
+ maxTokens: 256000,
15941
15616
  },
15942
15617
  "grok-code-fast-1": {
15943
15618
  id: "grok-code-fast-1",
@@ -15956,23 +15631,6 @@ export const MODELS = {
15956
15631
  contextWindow: 32768,
15957
15632
  maxTokens: 8192,
15958
15633
  },
15959
- "grok-vision-beta": {
15960
- id: "grok-vision-beta",
15961
- name: "Grok Vision Beta",
15962
- api: "openai-completions",
15963
- provider: "xai",
15964
- baseUrl: "https://api.x.ai/v1",
15965
- reasoning: false,
15966
- input: ["text", "image"],
15967
- cost: {
15968
- input: 5,
15969
- output: 15,
15970
- cacheRead: 5,
15971
- cacheWrite: 0,
15972
- },
15973
- contextWindow: 8192,
15974
- maxTokens: 4096,
15975
- },
15976
15634
  },
15977
15635
  "xiaomi": {
15978
15636
  "mimo-v2-flash": {