@earendil-works/pi-ai 0.75.4 → 0.75.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (36) hide show
  1. package/dist/cli.d.ts.map +1 -1
  2. package/dist/cli.js +14 -0
  3. package/dist/cli.js.map +1 -1
  4. package/dist/index.d.ts +1 -1
  5. package/dist/index.d.ts.map +1 -1
  6. package/dist/index.js.map +1 -1
  7. package/dist/models.generated.d.ts +243 -549
  8. package/dist/models.generated.d.ts.map +1 -1
  9. package/dist/models.generated.js +299 -624
  10. package/dist/models.generated.js.map +1 -1
  11. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  12. package/dist/providers/amazon-bedrock.js +2 -1
  13. package/dist/providers/amazon-bedrock.js.map +1 -1
  14. package/dist/providers/anthropic.d.ts +22 -5
  15. package/dist/providers/anthropic.d.ts.map +1 -1
  16. package/dist/providers/anthropic.js +7 -21
  17. package/dist/providers/anthropic.js.map +1 -1
  18. package/dist/types.d.ts +10 -0
  19. package/dist/types.d.ts.map +1 -1
  20. package/dist/types.js.map +1 -1
  21. package/dist/utils/oauth/device-code.d.ts +19 -0
  22. package/dist/utils/oauth/device-code.d.ts.map +1 -0
  23. package/dist/utils/oauth/device-code.js +55 -0
  24. package/dist/utils/oauth/device-code.js.map +1 -0
  25. package/dist/utils/oauth/github-copilot.d.ts +3 -3
  26. package/dist/utils/oauth/github-copilot.d.ts.map +1 -1
  27. package/dist/utils/oauth/github-copilot.js +45 -69
  28. package/dist/utils/oauth/github-copilot.js.map +1 -1
  29. package/dist/utils/oauth/index.d.ts +1 -0
  30. package/dist/utils/oauth/index.d.ts.map +1 -1
  31. package/dist/utils/oauth/index.js +1 -0
  32. package/dist/utils/oauth/index.js.map +1 -1
  33. package/dist/utils/oauth/types.d.ts +8 -1
  34. package/dist/utils/oauth/types.d.ts.map +1 -1
  35. package/dist/utils/oauth/types.js.map +1 -1
  36. package/package.json +2 -1
@@ -1720,6 +1720,7 @@ export const MODELS = {
1720
1720
  api: "anthropic-messages",
1721
1721
  provider: "anthropic",
1722
1722
  baseUrl: "https://api.anthropic.com",
1723
+ compat: { "forceAdaptiveThinking": true },
1723
1724
  reasoning: true,
1724
1725
  thinkingLevelMap: { "xhigh": "max" },
1725
1726
  input: ["text", "image"],
@@ -1738,6 +1739,7 @@ export const MODELS = {
1738
1739
  api: "anthropic-messages",
1739
1740
  provider: "anthropic",
1740
1741
  baseUrl: "https://api.anthropic.com",
1742
+ compat: { "forceAdaptiveThinking": true },
1741
1743
  reasoning: true,
1742
1744
  thinkingLevelMap: { "xhigh": "xhigh" },
1743
1745
  input: ["text", "image"],
@@ -1824,6 +1826,7 @@ export const MODELS = {
1824
1826
  api: "anthropic-messages",
1825
1827
  provider: "anthropic",
1826
1828
  baseUrl: "https://api.anthropic.com",
1829
+ compat: { "forceAdaptiveThinking": true },
1827
1830
  reasoning: true,
1828
1831
  input: ["text", "image"],
1829
1832
  cost: {
@@ -2823,6 +2826,7 @@ export const MODELS = {
2823
2826
  api: "anthropic-messages",
2824
2827
  provider: "cloudflare-ai-gateway",
2825
2828
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2829
+ compat: { "forceAdaptiveThinking": true },
2826
2830
  reasoning: true,
2827
2831
  thinkingLevelMap: { "xhigh": "max" },
2828
2832
  input: ["text", "image"],
@@ -2841,6 +2845,7 @@ export const MODELS = {
2841
2845
  api: "anthropic-messages",
2842
2846
  provider: "cloudflare-ai-gateway",
2843
2847
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2848
+ compat: { "forceAdaptiveThinking": true },
2844
2849
  reasoning: true,
2845
2850
  thinkingLevelMap: { "xhigh": "xhigh" },
2846
2851
  input: ["text", "image"],
@@ -2893,6 +2898,7 @@ export const MODELS = {
2893
2898
  api: "anthropic-messages",
2894
2899
  provider: "cloudflare-ai-gateway",
2895
2900
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2901
+ compat: { "forceAdaptiveThinking": true },
2896
2902
  reasoning: true,
2897
2903
  input: ["text", "image"],
2898
2904
  cost: {
@@ -3275,6 +3281,42 @@ export const MODELS = {
3275
3281
  contextWindow: 256000,
3276
3282
  maxTokens: 16384,
3277
3283
  },
3284
+ "@cf/ibm-granite/granite-4.0-h-micro": {
3285
+ id: "@cf/ibm-granite/granite-4.0-h-micro",
3286
+ name: "Granite 4.0 H Micro",
3287
+ api: "openai-completions",
3288
+ provider: "cloudflare-workers-ai",
3289
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3290
+ compat: { "sendSessionAffinityHeaders": true },
3291
+ reasoning: false,
3292
+ input: ["text"],
3293
+ cost: {
3294
+ input: 0.017,
3295
+ output: 0.112,
3296
+ cacheRead: 0,
3297
+ cacheWrite: 0,
3298
+ },
3299
+ contextWindow: 131000,
3300
+ maxTokens: 131000,
3301
+ },
3302
+ "@cf/meta/llama-3.3-70b-instruct-fp8-fast": {
3303
+ id: "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
3304
+ name: "Llama 3.3 70B Instruct fp8 Fast",
3305
+ api: "openai-completions",
3306
+ provider: "cloudflare-workers-ai",
3307
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3308
+ compat: { "sendSessionAffinityHeaders": true },
3309
+ reasoning: false,
3310
+ input: ["text"],
3311
+ cost: {
3312
+ input: 0.293,
3313
+ output: 2.253,
3314
+ cacheRead: 0,
3315
+ cacheWrite: 0,
3316
+ },
3317
+ contextWindow: 24000,
3318
+ maxTokens: 24000,
3319
+ },
3278
3320
  "@cf/meta/llama-4-scout-17b-16e-instruct": {
3279
3321
  id: "@cf/meta/llama-4-scout-17b-16e-instruct",
3280
3322
  name: "Llama 4 Scout 17B 16E Instruct",
@@ -3290,9 +3332,27 @@ export const MODELS = {
3290
3332
  cacheRead: 0,
3291
3333
  cacheWrite: 0,
3292
3334
  },
3293
- contextWindow: 128000,
3335
+ contextWindow: 131000,
3294
3336
  maxTokens: 16384,
3295
3337
  },
3338
+ "@cf/mistralai/mistral-small-3.1-24b-instruct": {
3339
+ id: "@cf/mistralai/mistral-small-3.1-24b-instruct",
3340
+ name: "Mistral Small 3.1 24B Instruct",
3341
+ api: "openai-completions",
3342
+ provider: "cloudflare-workers-ai",
3343
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3344
+ compat: { "sendSessionAffinityHeaders": true },
3345
+ reasoning: false,
3346
+ input: ["text"],
3347
+ cost: {
3348
+ input: 0.351,
3349
+ output: 0.555,
3350
+ cacheRead: 0,
3351
+ cacheWrite: 0,
3352
+ },
3353
+ contextWindow: 128000,
3354
+ maxTokens: 128000,
3355
+ },
3296
3356
  "@cf/moonshotai/kimi-k2.5": {
3297
3357
  id: "@cf/moonshotai/kimi-k2.5",
3298
3358
  name: "Kimi K2.5",
@@ -3326,7 +3386,7 @@ export const MODELS = {
3326
3386
  cacheRead: 0.16,
3327
3387
  cacheWrite: 0,
3328
3388
  },
3329
- contextWindow: 256000,
3389
+ contextWindow: 262144,
3330
3390
  maxTokens: 256000,
3331
3391
  },
3332
3392
  "@cf/nvidia/nemotron-3-120b-a12b": {
@@ -3383,6 +3443,24 @@ export const MODELS = {
3383
3443
  contextWindow: 128000,
3384
3444
  maxTokens: 16384,
3385
3445
  },
3446
+ "@cf/qwen/qwen3-30b-a3b-fp8": {
3447
+ id: "@cf/qwen/qwen3-30b-a3b-fp8",
3448
+ name: "Qwen3 30B A3b fp8",
3449
+ api: "openai-completions",
3450
+ provider: "cloudflare-workers-ai",
3451
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3452
+ compat: { "sendSessionAffinityHeaders": true },
3453
+ reasoning: true,
3454
+ input: ["text"],
3455
+ cost: {
3456
+ input: 0.0509,
3457
+ output: 0.335,
3458
+ cacheRead: 0,
3459
+ cacheWrite: 0,
3460
+ },
3461
+ contextWindow: 32768,
3462
+ maxTokens: 32768,
3463
+ },
3386
3464
  "@cf/zai-org/glm-4.7-flash": {
3387
3465
  id: "@cf/zai-org/glm-4.7-flash",
3388
3466
  name: "GLM-4.7-Flash",
@@ -3393,7 +3471,7 @@ export const MODELS = {
3393
3471
  reasoning: true,
3394
3472
  input: ["text"],
3395
3473
  cost: {
3396
- input: 0.06,
3474
+ input: 0.0605,
3397
3475
  output: 0.4,
3398
3476
  cacheRead: 0,
3399
3477
  cacheWrite: 0,
@@ -3443,42 +3521,6 @@ export const MODELS = {
3443
3521
  },
3444
3522
  },
3445
3523
  "fireworks": {
3446
- "accounts/fireworks/models/deepseek-v3p1": {
3447
- id: "accounts/fireworks/models/deepseek-v3p1",
3448
- name: "DeepSeek V3.1",
3449
- api: "anthropic-messages",
3450
- provider: "fireworks",
3451
- baseUrl: "https://api.fireworks.ai/inference",
3452
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3453
- reasoning: true,
3454
- input: ["text"],
3455
- cost: {
3456
- input: 0.56,
3457
- output: 1.68,
3458
- cacheRead: 0,
3459
- cacheWrite: 0,
3460
- },
3461
- contextWindow: 163840,
3462
- maxTokens: 163840,
3463
- },
3464
- "accounts/fireworks/models/deepseek-v3p2": {
3465
- id: "accounts/fireworks/models/deepseek-v3p2",
3466
- name: "DeepSeek V3.2",
3467
- api: "anthropic-messages",
3468
- provider: "fireworks",
3469
- baseUrl: "https://api.fireworks.ai/inference",
3470
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3471
- reasoning: true,
3472
- input: ["text"],
3473
- cost: {
3474
- input: 0.56,
3475
- output: 1.68,
3476
- cacheRead: 0.28,
3477
- cacheWrite: 0,
3478
- },
3479
- contextWindow: 160000,
3480
- maxTokens: 160000,
3481
- },
3482
3524
  "accounts/fireworks/models/deepseek-v4-flash": {
3483
3525
  id: "accounts/fireworks/models/deepseek-v4-flash",
3484
3526
  name: "DeepSeek V4 Flash",
@@ -3509,84 +3551,12 @@ export const MODELS = {
3509
3551
  cost: {
3510
3552
  input: 1.74,
3511
3553
  output: 3.48,
3512
- cacheRead: 0.15,
3554
+ cacheRead: 0.145,
3513
3555
  cacheWrite: 0,
3514
3556
  },
3515
3557
  contextWindow: 1000000,
3516
3558
  maxTokens: 384000,
3517
3559
  },
3518
- "accounts/fireworks/models/glm-4p5": {
3519
- id: "accounts/fireworks/models/glm-4p5",
3520
- name: "GLM 4.5",
3521
- api: "anthropic-messages",
3522
- provider: "fireworks",
3523
- baseUrl: "https://api.fireworks.ai/inference",
3524
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3525
- reasoning: true,
3526
- input: ["text"],
3527
- cost: {
3528
- input: 0.55,
3529
- output: 2.19,
3530
- cacheRead: 0,
3531
- cacheWrite: 0,
3532
- },
3533
- contextWindow: 131072,
3534
- maxTokens: 131072,
3535
- },
3536
- "accounts/fireworks/models/glm-4p5-air": {
3537
- id: "accounts/fireworks/models/glm-4p5-air",
3538
- name: "GLM 4.5 Air",
3539
- api: "anthropic-messages",
3540
- provider: "fireworks",
3541
- baseUrl: "https://api.fireworks.ai/inference",
3542
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3543
- reasoning: true,
3544
- input: ["text"],
3545
- cost: {
3546
- input: 0.22,
3547
- output: 0.88,
3548
- cacheRead: 0,
3549
- cacheWrite: 0,
3550
- },
3551
- contextWindow: 131072,
3552
- maxTokens: 131072,
3553
- },
3554
- "accounts/fireworks/models/glm-4p7": {
3555
- id: "accounts/fireworks/models/glm-4p7",
3556
- name: "GLM 4.7",
3557
- api: "anthropic-messages",
3558
- provider: "fireworks",
3559
- baseUrl: "https://api.fireworks.ai/inference",
3560
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3561
- reasoning: true,
3562
- input: ["text"],
3563
- cost: {
3564
- input: 0.6,
3565
- output: 2.2,
3566
- cacheRead: 0.3,
3567
- cacheWrite: 0,
3568
- },
3569
- contextWindow: 198000,
3570
- maxTokens: 198000,
3571
- },
3572
- "accounts/fireworks/models/glm-5": {
3573
- id: "accounts/fireworks/models/glm-5",
3574
- name: "GLM 5",
3575
- api: "anthropic-messages",
3576
- provider: "fireworks",
3577
- baseUrl: "https://api.fireworks.ai/inference",
3578
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3579
- reasoning: true,
3580
- input: ["text"],
3581
- cost: {
3582
- input: 1,
3583
- output: 3.2,
3584
- cacheRead: 0.5,
3585
- cacheWrite: 0,
3586
- },
3587
- contextWindow: 202752,
3588
- maxTokens: 131072,
3589
- },
3590
3560
  "accounts/fireworks/models/glm-5p1": {
3591
3561
  id: "accounts/fireworks/models/glm-5p1",
3592
3562
  name: "GLM 5.1",
@@ -3617,7 +3587,7 @@ export const MODELS = {
3617
3587
  cost: {
3618
3588
  input: 0.15,
3619
3589
  output: 0.6,
3620
- cacheRead: 0,
3590
+ cacheRead: 0.015,
3621
3591
  cacheWrite: 0,
3622
3592
  },
3623
3593
  contextWindow: 131072,
@@ -3633,50 +3603,14 @@ export const MODELS = {
3633
3603
  reasoning: true,
3634
3604
  input: ["text"],
3635
3605
  cost: {
3636
- input: 0.05,
3637
- output: 0.2,
3638
- cacheRead: 0,
3606
+ input: 0.07,
3607
+ output: 0.3,
3608
+ cacheRead: 0.035,
3639
3609
  cacheWrite: 0,
3640
3610
  },
3641
3611
  contextWindow: 131072,
3642
3612
  maxTokens: 32768,
3643
3613
  },
3644
- "accounts/fireworks/models/kimi-k2-instruct": {
3645
- id: "accounts/fireworks/models/kimi-k2-instruct",
3646
- name: "Kimi K2 Instruct",
3647
- api: "anthropic-messages",
3648
- provider: "fireworks",
3649
- baseUrl: "https://api.fireworks.ai/inference",
3650
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3651
- reasoning: false,
3652
- input: ["text"],
3653
- cost: {
3654
- input: 1,
3655
- output: 3,
3656
- cacheRead: 0,
3657
- cacheWrite: 0,
3658
- },
3659
- contextWindow: 128000,
3660
- maxTokens: 16384,
3661
- },
3662
- "accounts/fireworks/models/kimi-k2-thinking": {
3663
- id: "accounts/fireworks/models/kimi-k2-thinking",
3664
- name: "Kimi K2 Thinking",
3665
- api: "anthropic-messages",
3666
- provider: "fireworks",
3667
- baseUrl: "https://api.fireworks.ai/inference",
3668
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3669
- reasoning: true,
3670
- input: ["text"],
3671
- cost: {
3672
- input: 0.6,
3673
- output: 2.5,
3674
- cacheRead: 0.3,
3675
- cacheWrite: 0,
3676
- },
3677
- contextWindow: 256000,
3678
- maxTokens: 256000,
3679
- },
3680
3614
  "accounts/fireworks/models/kimi-k2p5": {
3681
3615
  id: "accounts/fireworks/models/kimi-k2p5",
3682
3616
  name: "Kimi K2.5",
@@ -3713,24 +3647,6 @@ export const MODELS = {
3713
3647
  contextWindow: 262000,
3714
3648
  maxTokens: 262000,
3715
3649
  },
3716
- "accounts/fireworks/models/minimax-m2p1": {
3717
- id: "accounts/fireworks/models/minimax-m2p1",
3718
- name: "MiniMax-M2.1",
3719
- api: "anthropic-messages",
3720
- provider: "fireworks",
3721
- baseUrl: "https://api.fireworks.ai/inference",
3722
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3723
- reasoning: true,
3724
- input: ["text"],
3725
- cost: {
3726
- input: 0.3,
3727
- output: 1.2,
3728
- cacheRead: 0.03,
3729
- cacheWrite: 0,
3730
- },
3731
- contextWindow: 200000,
3732
- maxTokens: 200000,
3733
- },
3734
3650
  "accounts/fireworks/models/minimax-m2p5": {
3735
3651
  id: "accounts/fireworks/models/minimax-m2p5",
3736
3652
  name: "MiniMax-M2.5",
@@ -3761,7 +3677,7 @@ export const MODELS = {
3761
3677
  cost: {
3762
3678
  input: 0.3,
3763
3679
  output: 1.2,
3764
- cacheRead: 0.03,
3680
+ cacheRead: 0.06,
3765
3681
  cacheWrite: 0,
3766
3682
  },
3767
3683
  contextWindow: 196608,
@@ -3785,9 +3701,27 @@ export const MODELS = {
3785
3701
  contextWindow: 128000,
3786
3702
  maxTokens: 8192,
3787
3703
  },
3788
- "accounts/fireworks/routers/kimi-k2p5-turbo": {
3789
- id: "accounts/fireworks/routers/kimi-k2p5-turbo",
3790
- name: "Kimi K2.5 Turbo",
3704
+ "accounts/fireworks/routers/glm-5p1-fast": {
3705
+ id: "accounts/fireworks/routers/glm-5p1-fast",
3706
+ name: "GLM 5.1 Fast",
3707
+ api: "anthropic-messages",
3708
+ provider: "fireworks",
3709
+ baseUrl: "https://api.fireworks.ai/inference",
3710
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3711
+ reasoning: true,
3712
+ input: ["text"],
3713
+ cost: {
3714
+ input: 2.8,
3715
+ output: 8.8,
3716
+ cacheRead: 0.52,
3717
+ cacheWrite: 0,
3718
+ },
3719
+ contextWindow: 202800,
3720
+ maxTokens: 131072,
3721
+ },
3722
+ "accounts/fireworks/routers/kimi-k2p6-turbo": {
3723
+ id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3724
+ name: "Kimi K2.6 Turbo",
3791
3725
  api: "anthropic-messages",
3792
3726
  provider: "fireworks",
3793
3727
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3795,13 +3729,13 @@ export const MODELS = {
3795
3729
  reasoning: true,
3796
3730
  input: ["text", "image"],
3797
3731
  cost: {
3798
- input: 0,
3799
- output: 0,
3800
- cacheRead: 0,
3732
+ input: 2,
3733
+ output: 8,
3734
+ cacheRead: 0.3,
3801
3735
  cacheWrite: 0,
3802
3736
  },
3803
- contextWindow: 256000,
3804
- maxTokens: 256000,
3737
+ contextWindow: 262000,
3738
+ maxTokens: 262000,
3805
3739
  },
3806
3740
  },
3807
3741
  "github-copilot": {
@@ -3849,6 +3783,7 @@ export const MODELS = {
3849
3783
  provider: "github-copilot",
3850
3784
  baseUrl: "https://api.individual.githubcopilot.com",
3851
3785
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3786
+ compat: { "forceAdaptiveThinking": true },
3852
3787
  reasoning: true,
3853
3788
  thinkingLevelMap: { "xhigh": "max" },
3854
3789
  input: ["text", "image"],
@@ -3868,6 +3803,7 @@ export const MODELS = {
3868
3803
  provider: "github-copilot",
3869
3804
  baseUrl: "https://api.individual.githubcopilot.com",
3870
3805
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3806
+ compat: { "forceAdaptiveThinking": true },
3871
3807
  reasoning: true,
3872
3808
  thinkingLevelMap: { "xhigh": "xhigh" },
3873
3809
  input: ["text", "image"],
@@ -3906,6 +3842,7 @@ export const MODELS = {
3906
3842
  provider: "github-copilot",
3907
3843
  baseUrl: "https://api.individual.githubcopilot.com",
3908
3844
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3845
+ compat: { "forceAdaptiveThinking": true },
3909
3846
  reasoning: true,
3910
3847
  input: ["text", "image"],
3911
3848
  cost: {
@@ -3974,6 +3911,25 @@ export const MODELS = {
3974
3911
  contextWindow: 128000,
3975
3912
  maxTokens: 64000,
3976
3913
  },
3914
+ "gemini-3.5-flash": {
3915
+ id: "gemini-3.5-flash",
3916
+ name: "Gemini 3.5 Flash",
3917
+ api: "openai-completions",
3918
+ provider: "github-copilot",
3919
+ baseUrl: "https://api.individual.githubcopilot.com",
3920
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3921
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3922
+ reasoning: true,
3923
+ input: ["text", "image"],
3924
+ cost: {
3925
+ input: 0,
3926
+ output: 0,
3927
+ cacheRead: 0,
3928
+ cacheWrite: 0,
3929
+ },
3930
+ contextWindow: 128000,
3931
+ maxTokens: 64000,
3932
+ },
3977
3933
  "gpt-4.1": {
3978
3934
  id: "gpt-4.1",
3979
3935
  name: "GPT-4.1",
@@ -4166,57 +4122,6 @@ export const MODELS = {
4166
4122
  },
4167
4123
  },
4168
4124
  "google": {
4169
- "gemini-1.5-flash": {
4170
- id: "gemini-1.5-flash",
4171
- name: "Gemini 1.5 Flash",
4172
- api: "google-generative-ai",
4173
- provider: "google",
4174
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4175
- reasoning: false,
4176
- input: ["text", "image"],
4177
- cost: {
4178
- input: 0.075,
4179
- output: 0.3,
4180
- cacheRead: 0.01875,
4181
- cacheWrite: 0,
4182
- },
4183
- contextWindow: 1000000,
4184
- maxTokens: 8192,
4185
- },
4186
- "gemini-1.5-flash-8b": {
4187
- id: "gemini-1.5-flash-8b",
4188
- name: "Gemini 1.5 Flash-8B",
4189
- api: "google-generative-ai",
4190
- provider: "google",
4191
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4192
- reasoning: false,
4193
- input: ["text", "image"],
4194
- cost: {
4195
- input: 0.0375,
4196
- output: 0.15,
4197
- cacheRead: 0.01,
4198
- cacheWrite: 0,
4199
- },
4200
- contextWindow: 1000000,
4201
- maxTokens: 8192,
4202
- },
4203
- "gemini-1.5-pro": {
4204
- id: "gemini-1.5-pro",
4205
- name: "Gemini 1.5 Pro",
4206
- api: "google-generative-ai",
4207
- provider: "google",
4208
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4209
- reasoning: false,
4210
- input: ["text", "image"],
4211
- cost: {
4212
- input: 1.25,
4213
- output: 5,
4214
- cacheRead: 0.3125,
4215
- cacheWrite: 0,
4216
- },
4217
- contextWindow: 1000000,
4218
- maxTokens: 8192,
4219
- },
4220
4125
  "gemini-2.0-flash": {
4221
4126
  id: "gemini-2.0-flash",
4222
4127
  name: "Gemini 2.0 Flash",
@@ -4236,7 +4141,7 @@ export const MODELS = {
4236
4141
  },
4237
4142
  "gemini-2.0-flash-lite": {
4238
4143
  id: "gemini-2.0-flash-lite",
4239
- name: "Gemini 2.0 Flash Lite",
4144
+ name: "Gemini 2.0 Flash-Lite",
4240
4145
  api: "google-generative-ai",
4241
4146
  provider: "google",
4242
4147
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4270,7 +4175,7 @@ export const MODELS = {
4270
4175
  },
4271
4176
  "gemini-2.5-flash-lite": {
4272
4177
  id: "gemini-2.5-flash-lite",
4273
- name: "Gemini 2.5 Flash Lite",
4178
+ name: "Gemini 2.5 Flash-Lite",
4274
4179
  api: "google-generative-ai",
4275
4180
  provider: "google",
4276
4181
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4285,91 +4190,6 @@ export const MODELS = {
4285
4190
  contextWindow: 1048576,
4286
4191
  maxTokens: 65536,
4287
4192
  },
4288
- "gemini-2.5-flash-lite-preview-06-17": {
4289
- id: "gemini-2.5-flash-lite-preview-06-17",
4290
- name: "Gemini 2.5 Flash Lite Preview 06-17",
4291
- api: "google-generative-ai",
4292
- provider: "google",
4293
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4294
- reasoning: true,
4295
- input: ["text", "image"],
4296
- cost: {
4297
- input: 0.1,
4298
- output: 0.4,
4299
- cacheRead: 0.025,
4300
- cacheWrite: 0,
4301
- },
4302
- contextWindow: 1048576,
4303
- maxTokens: 65536,
4304
- },
4305
- "gemini-2.5-flash-lite-preview-09-2025": {
4306
- id: "gemini-2.5-flash-lite-preview-09-2025",
4307
- name: "Gemini 2.5 Flash Lite Preview 09-25",
4308
- api: "google-generative-ai",
4309
- provider: "google",
4310
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4311
- reasoning: true,
4312
- input: ["text", "image"],
4313
- cost: {
4314
- input: 0.1,
4315
- output: 0.4,
4316
- cacheRead: 0.025,
4317
- cacheWrite: 0,
4318
- },
4319
- contextWindow: 1048576,
4320
- maxTokens: 65536,
4321
- },
4322
- "gemini-2.5-flash-preview-04-17": {
4323
- id: "gemini-2.5-flash-preview-04-17",
4324
- name: "Gemini 2.5 Flash Preview 04-17",
4325
- api: "google-generative-ai",
4326
- provider: "google",
4327
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4328
- reasoning: true,
4329
- input: ["text", "image"],
4330
- cost: {
4331
- input: 0.15,
4332
- output: 0.6,
4333
- cacheRead: 0.0375,
4334
- cacheWrite: 0,
4335
- },
4336
- contextWindow: 1048576,
4337
- maxTokens: 65536,
4338
- },
4339
- "gemini-2.5-flash-preview-05-20": {
4340
- id: "gemini-2.5-flash-preview-05-20",
4341
- name: "Gemini 2.5 Flash Preview 05-20",
4342
- api: "google-generative-ai",
4343
- provider: "google",
4344
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4345
- reasoning: true,
4346
- input: ["text", "image"],
4347
- cost: {
4348
- input: 0.15,
4349
- output: 0.6,
4350
- cacheRead: 0.0375,
4351
- cacheWrite: 0,
4352
- },
4353
- contextWindow: 1048576,
4354
- maxTokens: 65536,
4355
- },
4356
- "gemini-2.5-flash-preview-09-2025": {
4357
- id: "gemini-2.5-flash-preview-09-2025",
4358
- name: "Gemini 2.5 Flash Preview 09-25",
4359
- api: "google-generative-ai",
4360
- provider: "google",
4361
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4362
- reasoning: true,
4363
- input: ["text", "image"],
4364
- cost: {
4365
- input: 0.3,
4366
- output: 2.5,
4367
- cacheRead: 0.075,
4368
- cacheWrite: 0,
4369
- },
4370
- contextWindow: 1048576,
4371
- maxTokens: 65536,
4372
- },
4373
4193
  "gemini-2.5-pro": {
4374
4194
  id: "gemini-2.5-pro",
4375
4195
  name: "Gemini 2.5 Pro",
@@ -4387,40 +4207,6 @@ export const MODELS = {
4387
4207
  contextWindow: 1048576,
4388
4208
  maxTokens: 65536,
4389
4209
  },
4390
- "gemini-2.5-pro-preview-05-06": {
4391
- id: "gemini-2.5-pro-preview-05-06",
4392
- name: "Gemini 2.5 Pro Preview 05-06",
4393
- api: "google-generative-ai",
4394
- provider: "google",
4395
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4396
- reasoning: true,
4397
- input: ["text", "image"],
4398
- cost: {
4399
- input: 1.25,
4400
- output: 10,
4401
- cacheRead: 0.31,
4402
- cacheWrite: 0,
4403
- },
4404
- contextWindow: 1048576,
4405
- maxTokens: 65536,
4406
- },
4407
- "gemini-2.5-pro-preview-06-05": {
4408
- id: "gemini-2.5-pro-preview-06-05",
4409
- name: "Gemini 2.5 Pro Preview 06-05",
4410
- api: "google-generative-ai",
4411
- provider: "google",
4412
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4413
- reasoning: true,
4414
- input: ["text", "image"],
4415
- cost: {
4416
- input: 1.25,
4417
- output: 10,
4418
- cacheRead: 0.31,
4419
- cacheWrite: 0,
4420
- },
4421
- contextWindow: 1048576,
4422
- maxTokens: 65536,
4423
- },
4424
4210
  "gemini-3-flash-preview": {
4425
4211
  id: "gemini-3-flash-preview",
4426
4212
  name: "Gemini 3 Flash Preview",
@@ -4454,8 +4240,8 @@ export const MODELS = {
4454
4240
  cacheRead: 0.2,
4455
4241
  cacheWrite: 0,
4456
4242
  },
4457
- contextWindow: 1000000,
4458
- maxTokens: 64000,
4243
+ contextWindow: 1048576,
4244
+ maxTokens: 65536,
4459
4245
  },
4460
4246
  "gemini-3.1-flash-lite": {
4461
4247
  id: "gemini-3.1-flash-lite",
@@ -4581,60 +4367,9 @@ export const MODELS = {
4581
4367
  contextWindow: 1048576,
4582
4368
  maxTokens: 65536,
4583
4369
  },
4584
- "gemini-live-2.5-flash": {
4585
- id: "gemini-live-2.5-flash",
4586
- name: "Gemini Live 2.5 Flash",
4587
- api: "google-generative-ai",
4588
- provider: "google",
4589
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4590
- reasoning: true,
4591
- input: ["text", "image"],
4592
- cost: {
4593
- input: 0.5,
4594
- output: 2,
4595
- cacheRead: 0,
4596
- cacheWrite: 0,
4597
- },
4598
- contextWindow: 128000,
4599
- maxTokens: 8000,
4600
- },
4601
- "gemini-live-2.5-flash-preview-native-audio": {
4602
- id: "gemini-live-2.5-flash-preview-native-audio",
4603
- name: "Gemini Live 2.5 Flash Preview Native Audio",
4604
- api: "google-generative-ai",
4605
- provider: "google",
4606
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4607
- reasoning: true,
4608
- input: ["text"],
4609
- cost: {
4610
- input: 0.5,
4611
- output: 2,
4612
- cacheRead: 0,
4613
- cacheWrite: 0,
4614
- },
4615
- contextWindow: 131072,
4616
- maxTokens: 65536,
4617
- },
4618
- "gemma-3-27b-it": {
4619
- id: "gemma-3-27b-it",
4620
- name: "Gemma 3 27B",
4621
- api: "google-generative-ai",
4622
- provider: "google",
4623
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4624
- reasoning: false,
4625
- input: ["text", "image"],
4626
- cost: {
4627
- input: 0,
4628
- output: 0,
4629
- cacheRead: 0,
4630
- cacheWrite: 0,
4631
- },
4632
- contextWindow: 131072,
4633
- maxTokens: 8192,
4634
- },
4635
4370
  "gemma-4-26b-a4b-it": {
4636
4371
  id: "gemma-4-26b-a4b-it",
4637
- name: "Gemma 4 26B",
4372
+ name: "Gemma 4 26B A4B IT",
4638
4373
  api: "google-generative-ai",
4639
4374
  provider: "google",
4640
4375
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4647,12 +4382,12 @@ export const MODELS = {
4647
4382
  cacheRead: 0,
4648
4383
  cacheWrite: 0,
4649
4384
  },
4650
- contextWindow: 256000,
4651
- maxTokens: 8192,
4385
+ contextWindow: 262144,
4386
+ maxTokens: 32768,
4652
4387
  },
4653
4388
  "gemma-4-31b-it": {
4654
4389
  id: "gemma-4-31b-it",
4655
- name: "Gemma 4 31B",
4390
+ name: "Gemma 4 31B IT",
4656
4391
  api: "google-generative-ai",
4657
4392
  provider: "google",
4658
4393
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4665,8 +4400,8 @@ export const MODELS = {
4665
4400
  cacheRead: 0,
4666
4401
  cacheWrite: 0,
4667
4402
  },
4668
- contextWindow: 256000,
4669
- maxTokens: 8192,
4403
+ contextWindow: 262144,
4404
+ maxTokens: 32768,
4670
4405
  },
4671
4406
  },
4672
4407
  "google-vertex": {
@@ -7372,6 +7107,7 @@ export const MODELS = {
7372
7107
  api: "anthropic-messages",
7373
7108
  provider: "opencode",
7374
7109
  baseUrl: "https://opencode.ai/zen",
7110
+ compat: { "forceAdaptiveThinking": true },
7375
7111
  reasoning: true,
7376
7112
  thinkingLevelMap: { "xhigh": "max" },
7377
7113
  input: ["text", "image"],
@@ -7390,6 +7126,7 @@ export const MODELS = {
7390
7126
  api: "anthropic-messages",
7391
7127
  provider: "opencode",
7392
7128
  baseUrl: "https://opencode.ai/zen",
7129
+ compat: { "forceAdaptiveThinking": true },
7393
7130
  reasoning: true,
7394
7131
  thinkingLevelMap: { "xhigh": "xhigh" },
7395
7132
  input: ["text", "image"],
@@ -7442,6 +7179,7 @@ export const MODELS = {
7442
7179
  api: "anthropic-messages",
7443
7180
  provider: "opencode",
7444
7181
  baseUrl: "https://opencode.ai/zen",
7182
+ compat: { "forceAdaptiveThinking": true },
7445
7183
  reasoning: true,
7446
7184
  input: ["text", "image"],
7447
7185
  cost: {
@@ -7848,6 +7586,23 @@ export const MODELS = {
7848
7586
  contextWindow: 1050000,
7849
7587
  maxTokens: 128000,
7850
7588
  },
7589
+ "grok-build-0.1": {
7590
+ id: "grok-build-0.1",
7591
+ name: "Grok Build 0.1",
7592
+ api: "openai-completions",
7593
+ provider: "opencode",
7594
+ baseUrl: "https://opencode.ai/zen/v1",
7595
+ reasoning: true,
7596
+ input: ["text", "image"],
7597
+ cost: {
7598
+ input: 1,
7599
+ output: 2,
7600
+ cacheRead: 0.2,
7601
+ cacheWrite: 0,
7602
+ },
7603
+ contextWindow: 256000,
7604
+ maxTokens: 256000,
7605
+ },
7851
7606
  "kimi-k2.5": {
7852
7607
  id: "kimi-k2.5",
7853
7608
  name: "Kimi K2.5",
@@ -7882,35 +7637,18 @@ export const MODELS = {
7882
7637
  contextWindow: 262144,
7883
7638
  maxTokens: 65536,
7884
7639
  },
7885
- "minimax-m2.5": {
7886
- id: "minimax-m2.5",
7887
- name: "MiniMax M2.5",
7888
- api: "openai-completions",
7889
- provider: "opencode",
7890
- baseUrl: "https://opencode.ai/zen/v1",
7891
- reasoning: true,
7892
- input: ["text"],
7893
- cost: {
7894
- input: 0.3,
7895
- output: 1.2,
7896
- cacheRead: 0.06,
7897
- cacheWrite: 0,
7898
- },
7899
- contextWindow: 204800,
7900
- maxTokens: 131072,
7901
- },
7902
- "minimax-m2.5-free": {
7903
- id: "minimax-m2.5-free",
7904
- name: "MiniMax M2.5 Free",
7905
- api: "anthropic-messages",
7640
+ "minimax-m2.5": {
7641
+ id: "minimax-m2.5",
7642
+ name: "MiniMax M2.5",
7643
+ api: "openai-completions",
7906
7644
  provider: "opencode",
7907
- baseUrl: "https://opencode.ai/zen",
7645
+ baseUrl: "https://opencode.ai/zen/v1",
7908
7646
  reasoning: true,
7909
7647
  input: ["text"],
7910
7648
  cost: {
7911
- input: 0,
7912
- output: 0,
7913
- cacheRead: 0,
7649
+ input: 0.3,
7650
+ output: 1.2,
7651
+ cacheRead: 0.06,
7914
7652
  cacheWrite: 0,
7915
7653
  },
7916
7654
  contextWindow: 204800,
@@ -7984,23 +7722,6 @@ export const MODELS = {
7984
7722
  contextWindow: 262144,
7985
7723
  maxTokens: 65536,
7986
7724
  },
7987
- "qwen3.6-plus-free": {
7988
- id: "qwen3.6-plus-free",
7989
- name: "Qwen3.6 Plus Free",
7990
- api: "anthropic-messages",
7991
- provider: "opencode",
7992
- baseUrl: "https://opencode.ai/zen",
7993
- reasoning: true,
7994
- input: ["text", "image"],
7995
- cost: {
7996
- input: 0,
7997
- output: 0,
7998
- cacheRead: 0,
7999
- cacheWrite: 0,
8000
- },
8001
- contextWindow: 262144,
8002
- maxTokens: 65536,
8003
- },
8004
7725
  },
8005
7726
  "opencode-go": {
8006
7727
  "deepseek-v4-flash": {
@@ -8559,23 +8280,6 @@ export const MODELS = {
8559
8280
  contextWindow: 1000000,
8560
8281
  maxTokens: 128000,
8561
8282
  },
8562
- "arcee-ai/trinity-large-preview": {
8563
- id: "arcee-ai/trinity-large-preview",
8564
- name: "Arcee AI: Trinity Large Preview",
8565
- api: "openai-completions",
8566
- provider: "openrouter",
8567
- baseUrl: "https://openrouter.ai/api/v1",
8568
- reasoning: false,
8569
- input: ["text"],
8570
- cost: {
8571
- input: 0.15,
8572
- output: 0.44999999999999996,
8573
- cacheRead: 0,
8574
- cacheWrite: 0,
8575
- },
8576
- contextWindow: 131000,
8577
- maxTokens: 4096,
8578
- },
8579
8283
  "arcee-ai/trinity-large-thinking": {
8580
8284
  id: "arcee-ai/trinity-large-thinking",
8581
8285
  name: "Arcee AI: Trinity Large Thinking",
@@ -8961,13 +8665,13 @@ export const MODELS = {
8961
8665
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8962
8666
  input: ["text"],
8963
8667
  cost: {
8964
- input: 0.112,
8965
- output: 0.224,
8966
- cacheRead: 0.022,
8668
+ input: 0.09999999999999999,
8669
+ output: 0.19999999999999998,
8670
+ cacheRead: 0.02,
8967
8671
  cacheWrite: 0,
8968
8672
  },
8969
8673
  contextWindow: 1048576,
8970
- maxTokens: 4096,
8674
+ maxTokens: 16384,
8971
8675
  },
8972
8676
  "deepseek/deepseek-v4-flash:free": {
8973
8677
  id: "deepseek/deepseek-v4-flash:free",
@@ -9408,9 +9112,9 @@ export const MODELS = {
9408
9112
  reasoning: false,
9409
9113
  input: ["text"],
9410
9114
  cost: {
9411
- input: 0.3,
9412
- output: 2.5,
9413
- cacheRead: 0.06,
9115
+ input: 0.075,
9116
+ output: 0.625,
9117
+ cacheRead: 0.015,
9414
9118
  cacheWrite: 0,
9415
9119
  },
9416
9120
  contextWindow: 262144,
@@ -11908,7 +11612,7 @@ export const MODELS = {
11908
11612
  cacheWrite: 0,
11909
11613
  },
11910
11614
  contextWindow: 262144,
11911
- maxTokens: 65536,
11615
+ maxTokens: 262144,
11912
11616
  },
11913
11617
  "qwen/qwen3.5-27b": {
11914
11618
  id: "qwen/qwen3.5-27b",
@@ -11955,7 +11659,7 @@ export const MODELS = {
11955
11659
  cost: {
11956
11660
  input: 0.39,
11957
11661
  output: 2.34,
11958
- cacheRead: 0.195,
11662
+ cacheRead: 0,
11959
11663
  cacheWrite: 0,
11960
11664
  },
11961
11665
  contextWindow: 262144,
@@ -12038,13 +11742,13 @@ export const MODELS = {
12038
11742
  reasoning: true,
12039
11743
  input: ["text", "image"],
12040
11744
  cost: {
12041
- input: 0.32,
11745
+ input: 0.3,
12042
11746
  output: 3.1999999999999997,
12043
11747
  cacheRead: 0,
12044
11748
  cacheWrite: 0,
12045
11749
  },
12046
11750
  contextWindow: 262144,
12047
- maxTokens: 81920,
11751
+ maxTokens: 262144,
12048
11752
  },
12049
11753
  "qwen/qwen3.6-35b-a3b": {
12050
11754
  id: "qwen/qwen3.6-35b-a3b",
@@ -12055,13 +11759,13 @@ export const MODELS = {
12055
11759
  reasoning: true,
12056
11760
  input: ["text", "image"],
12057
11761
  cost: {
12058
- input: 0.149,
11762
+ input: 0.15,
12059
11763
  output: 1,
12060
11764
  cacheRead: 0,
12061
11765
  cacheWrite: 0,
12062
11766
  },
12063
11767
  contextWindow: 262144,
12064
- maxTokens: 4096,
11768
+ maxTokens: 262140,
12065
11769
  },
12066
11770
  "qwen/qwen3.6-flash": {
12067
11771
  id: "qwen/qwen3.6-flash",
@@ -12114,6 +11818,23 @@ export const MODELS = {
12114
11818
  contextWindow: 1000000,
12115
11819
  maxTokens: 65536,
12116
11820
  },
11821
+ "qwen/qwen3.7-max": {
11822
+ id: "qwen/qwen3.7-max",
11823
+ name: "Qwen: Qwen3.7 Max",
11824
+ api: "openai-completions",
11825
+ provider: "openrouter",
11826
+ baseUrl: "https://openrouter.ai/api/v1",
11827
+ reasoning: true,
11828
+ input: ["text"],
11829
+ cost: {
11830
+ input: 2.5,
11831
+ output: 7.5,
11832
+ cacheRead: 0,
11833
+ cacheWrite: 3.125,
11834
+ },
11835
+ contextWindow: 1000000,
11836
+ maxTokens: 65536,
11837
+ },
12117
11838
  "rekaai/reka-edge": {
12118
11839
  id: "rekaai/reka-edge",
12119
11840
  name: "Reka Edge",
@@ -12191,13 +11912,13 @@ export const MODELS = {
12191
11912
  reasoning: true,
12192
11913
  input: ["text"],
12193
11914
  cost: {
12194
- input: 0.09999999999999999,
11915
+ input: 0.09,
12195
11916
  output: 0.3,
12196
- cacheRead: 0,
11917
+ cacheRead: 0.02,
12197
11918
  cacheWrite: 0,
12198
11919
  },
12199
11920
  contextWindow: 262144,
12200
- maxTokens: 65536,
11921
+ maxTokens: 16384,
12201
11922
  },
12202
11923
  "tencent/hy3-preview": {
12203
11924
  id: "tencent/hy3-preview",
@@ -12301,6 +12022,23 @@ export const MODELS = {
12301
12022
  contextWindow: 1000000,
12302
12023
  maxTokens: 4096,
12303
12024
  },
12025
+ "x-ai/grok-build-0.1": {
12026
+ id: "x-ai/grok-build-0.1",
12027
+ name: "xAI: Grok Build 0.1",
12028
+ api: "openai-completions",
12029
+ provider: "openrouter",
12030
+ baseUrl: "https://openrouter.ai/api/v1",
12031
+ reasoning: true,
12032
+ input: ["text", "image"],
12033
+ cost: {
12034
+ input: 1,
12035
+ output: 2,
12036
+ cacheRead: 0.19999999999999998,
12037
+ cacheWrite: 0,
12038
+ },
12039
+ contextWindow: 256000,
12040
+ maxTokens: 4096,
12041
+ },
12304
12042
  "xiaomi/mimo-v2-flash": {
12305
12043
  id: "xiaomi/mimo-v2-flash",
12306
12044
  name: "Xiaomi: MiMo-V2-Flash",
@@ -12582,13 +12320,13 @@ export const MODELS = {
12582
12320
  reasoning: true,
12583
12321
  input: ["text"],
12584
12322
  cost: {
12585
- input: 0,
12586
- output: 0,
12587
- cacheRead: 0,
12323
+ input: 0.98,
12324
+ output: 3.08,
12325
+ cacheRead: 0.182,
12588
12326
  cacheWrite: 0,
12589
12327
  },
12590
- contextWindow: 202800,
12591
- maxTokens: 202800,
12328
+ contextWindow: 202752,
12329
+ maxTokens: 4096,
12592
12330
  },
12593
12331
  "z-ai/glm-5v-turbo": {
12594
12332
  id: "z-ai/glm-5v-turbo",
@@ -12877,6 +12615,25 @@ export const MODELS = {
12877
12615
  contextWindow: 1000000,
12878
12616
  maxTokens: 500000,
12879
12617
  },
12618
+ "Qwen/Qwen3.7-Max": {
12619
+ id: "Qwen/Qwen3.7-Max",
12620
+ name: "Qwen3.7 Max",
12621
+ api: "openai-completions",
12622
+ provider: "together",
12623
+ baseUrl: "https://api.together.ai/v1",
12624
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12625
+ reasoning: true,
12626
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12627
+ input: ["text"],
12628
+ cost: {
12629
+ input: 2.5,
12630
+ output: 7.5,
12631
+ cacheRead: 0,
12632
+ cacheWrite: 0,
12633
+ },
12634
+ contextWindow: 1000000,
12635
+ maxTokens: 500000,
12636
+ },
12880
12637
  "deepseek-ai/DeepSeek-V3": {
12881
12638
  id: "deepseek-ai/DeepSeek-V3",
12882
12639
  name: "DeepSeek V3",
@@ -13373,6 +13130,23 @@ export const MODELS = {
13373
13130
  contextWindow: 1000000,
13374
13131
  maxTokens: 64000,
13375
13132
  },
13133
+ "alibaba/qwen3.7-max": {
13134
+ id: "alibaba/qwen3.7-max",
13135
+ name: "Qwen 3.7 Max",
13136
+ api: "anthropic-messages",
13137
+ provider: "vercel-ai-gateway",
13138
+ baseUrl: "https://ai-gateway.vercel.sh",
13139
+ reasoning: true,
13140
+ input: ["text", "image"],
13141
+ cost: {
13142
+ input: 1.25,
13143
+ output: 3.75,
13144
+ cacheRead: 0.25,
13145
+ cacheWrite: 1.5625,
13146
+ },
13147
+ contextWindow: 991000,
13148
+ maxTokens: 64000,
13149
+ },
13376
13150
  "anthropic/claude-3-haiku": {
13377
13151
  id: "anthropic/claude-3-haiku",
13378
13152
  name: "Claude 3 Haiku",
@@ -13481,6 +13255,7 @@ export const MODELS = {
13481
13255
  api: "anthropic-messages",
13482
13256
  provider: "vercel-ai-gateway",
13483
13257
  baseUrl: "https://ai-gateway.vercel.sh",
13258
+ compat: { "forceAdaptiveThinking": true },
13484
13259
  reasoning: true,
13485
13260
  thinkingLevelMap: { "xhigh": "max" },
13486
13261
  input: ["text", "image"],
@@ -13499,6 +13274,7 @@ export const MODELS = {
13499
13274
  api: "anthropic-messages",
13500
13275
  provider: "vercel-ai-gateway",
13501
13276
  baseUrl: "https://ai-gateway.vercel.sh",
13277
+ compat: { "forceAdaptiveThinking": true },
13502
13278
  reasoning: true,
13503
13279
  thinkingLevelMap: { "xhigh": "xhigh" },
13504
13280
  input: ["text", "image"],
@@ -13551,6 +13327,7 @@ export const MODELS = {
13551
13327
  api: "anthropic-messages",
13552
13328
  provider: "vercel-ai-gateway",
13553
13329
  baseUrl: "https://ai-gateway.vercel.sh",
13330
+ compat: { "forceAdaptiveThinking": true },
13554
13331
  reasoning: true,
13555
13332
  input: ["text", "image"],
13556
13333
  cost: {
@@ -14261,7 +14038,7 @@ export const MODELS = {
14261
14038
  },
14262
14039
  "minimax/minimax-m2.7": {
14263
14040
  id: "minimax/minimax-m2.7",
14264
- name: "Minimax M2.7",
14041
+ name: "MiniMax M2.7",
14265
14042
  api: "anthropic-messages",
14266
14043
  provider: "vercel-ai-gateway",
14267
14044
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -15444,6 +15221,23 @@ export const MODELS = {
15444
15221
  contextWindow: 1000000,
15445
15222
  maxTokens: 1000000,
15446
15223
  },
15224
+ "xai/grok-build-0.1": {
15225
+ id: "xai/grok-build-0.1",
15226
+ name: "Grok Build 0.1",
15227
+ api: "anthropic-messages",
15228
+ provider: "vercel-ai-gateway",
15229
+ baseUrl: "https://ai-gateway.vercel.sh",
15230
+ reasoning: true,
15231
+ input: ["text", "image"],
15232
+ cost: {
15233
+ input: 1,
15234
+ output: 2,
15235
+ cacheRead: 0.19999999999999998,
15236
+ cacheWrite: 0,
15237
+ },
15238
+ contextWindow: 256000,
15239
+ maxTokens: 256000,
15240
+ },
15447
15241
  "xiaomi/mimo-v2-flash": {
15448
15242
  id: "xiaomi/mimo-v2-flash",
15449
15243
  name: "MiMo V2 Flash",
@@ -15735,108 +15529,6 @@ export const MODELS = {
15735
15529
  },
15736
15530
  },
15737
15531
  "xai": {
15738
- "grok-2": {
15739
- id: "grok-2",
15740
- name: "Grok 2",
15741
- api: "openai-completions",
15742
- provider: "xai",
15743
- baseUrl: "https://api.x.ai/v1",
15744
- reasoning: false,
15745
- input: ["text"],
15746
- cost: {
15747
- input: 2,
15748
- output: 10,
15749
- cacheRead: 2,
15750
- cacheWrite: 0,
15751
- },
15752
- contextWindow: 131072,
15753
- maxTokens: 8192,
15754
- },
15755
- "grok-2-1212": {
15756
- id: "grok-2-1212",
15757
- name: "Grok 2 (1212)",
15758
- api: "openai-completions",
15759
- provider: "xai",
15760
- baseUrl: "https://api.x.ai/v1",
15761
- reasoning: false,
15762
- input: ["text"],
15763
- cost: {
15764
- input: 2,
15765
- output: 10,
15766
- cacheRead: 2,
15767
- cacheWrite: 0,
15768
- },
15769
- contextWindow: 131072,
15770
- maxTokens: 8192,
15771
- },
15772
- "grok-2-latest": {
15773
- id: "grok-2-latest",
15774
- name: "Grok 2 Latest",
15775
- api: "openai-completions",
15776
- provider: "xai",
15777
- baseUrl: "https://api.x.ai/v1",
15778
- reasoning: false,
15779
- input: ["text"],
15780
- cost: {
15781
- input: 2,
15782
- output: 10,
15783
- cacheRead: 2,
15784
- cacheWrite: 0,
15785
- },
15786
- contextWindow: 131072,
15787
- maxTokens: 8192,
15788
- },
15789
- "grok-2-vision": {
15790
- id: "grok-2-vision",
15791
- name: "Grok 2 Vision",
15792
- api: "openai-completions",
15793
- provider: "xai",
15794
- baseUrl: "https://api.x.ai/v1",
15795
- reasoning: false,
15796
- input: ["text", "image"],
15797
- cost: {
15798
- input: 2,
15799
- output: 10,
15800
- cacheRead: 2,
15801
- cacheWrite: 0,
15802
- },
15803
- contextWindow: 8192,
15804
- maxTokens: 4096,
15805
- },
15806
- "grok-2-vision-1212": {
15807
- id: "grok-2-vision-1212",
15808
- name: "Grok 2 Vision (1212)",
15809
- api: "openai-completions",
15810
- provider: "xai",
15811
- baseUrl: "https://api.x.ai/v1",
15812
- reasoning: false,
15813
- input: ["text", "image"],
15814
- cost: {
15815
- input: 2,
15816
- output: 10,
15817
- cacheRead: 2,
15818
- cacheWrite: 0,
15819
- },
15820
- contextWindow: 8192,
15821
- maxTokens: 4096,
15822
- },
15823
- "grok-2-vision-latest": {
15824
- id: "grok-2-vision-latest",
15825
- name: "Grok 2 Vision Latest",
15826
- api: "openai-completions",
15827
- provider: "xai",
15828
- baseUrl: "https://api.x.ai/v1",
15829
- reasoning: false,
15830
- input: ["text", "image"],
15831
- cost: {
15832
- input: 2,
15833
- output: 10,
15834
- cacheRead: 2,
15835
- cacheWrite: 0,
15836
- },
15837
- contextWindow: 8192,
15838
- maxTokens: 4096,
15839
- },
15840
15532
  "grok-3": {
15841
15533
  id: "grok-3",
15842
15534
  name: "Grok 3",
@@ -15880,8 +15572,8 @@ export const MODELS = {
15880
15572
  reasoning: false,
15881
15573
  input: ["text", "image"],
15882
15574
  cost: {
15883
- input: 2,
15884
- output: 6,
15575
+ input: 1.25,
15576
+ output: 2.5,
15885
15577
  cacheRead: 0.2,
15886
15578
  cacheWrite: 0,
15887
15579
  },
@@ -15897,8 +15589,8 @@ export const MODELS = {
15897
15589
  reasoning: true,
15898
15590
  input: ["text", "image"],
15899
15591
  cost: {
15900
- input: 2,
15901
- output: 6,
15592
+ input: 1.25,
15593
+ output: 2.5,
15902
15594
  cacheRead: 0.2,
15903
15595
  cacheWrite: 0,
15904
15596
  },
@@ -15922,22 +15614,22 @@ export const MODELS = {
15922
15614
  contextWindow: 1000000,
15923
15615
  maxTokens: 30000,
15924
15616
  },
15925
- "grok-beta": {
15926
- id: "grok-beta",
15927
- name: "Grok Beta",
15617
+ "grok-build-0.1": {
15618
+ id: "grok-build-0.1",
15619
+ name: "Grok Build 0.1",
15928
15620
  api: "openai-completions",
15929
15621
  provider: "xai",
15930
15622
  baseUrl: "https://api.x.ai/v1",
15931
- reasoning: false,
15932
- input: ["text"],
15623
+ reasoning: true,
15624
+ input: ["text", "image"],
15933
15625
  cost: {
15934
- input: 5,
15935
- output: 15,
15936
- cacheRead: 5,
15626
+ input: 1,
15627
+ output: 2,
15628
+ cacheRead: 0.2,
15937
15629
  cacheWrite: 0,
15938
15630
  },
15939
- contextWindow: 131072,
15940
- maxTokens: 4096,
15631
+ contextWindow: 256000,
15632
+ maxTokens: 256000,
15941
15633
  },
15942
15634
  "grok-code-fast-1": {
15943
15635
  id: "grok-code-fast-1",
@@ -15956,23 +15648,6 @@ export const MODELS = {
15956
15648
  contextWindow: 32768,
15957
15649
  maxTokens: 8192,
15958
15650
  },
15959
- "grok-vision-beta": {
15960
- id: "grok-vision-beta",
15961
- name: "Grok Vision Beta",
15962
- api: "openai-completions",
15963
- provider: "xai",
15964
- baseUrl: "https://api.x.ai/v1",
15965
- reasoning: false,
15966
- input: ["text", "image"],
15967
- cost: {
15968
- input: 5,
15969
- output: 15,
15970
- cacheRead: 5,
15971
- cacheWrite: 0,
15972
- },
15973
- contextWindow: 8192,
15974
- maxTokens: 4096,
15975
- },
15976
15651
  },
15977
15652
  "xiaomi": {
15978
15653
  "mimo-v2-flash": {