@kolisachint/hoocode-ai 0.2.5 → 0.2.6

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -157,6 +157,23 @@ export const MODELS = {
157
157
  contextWindow: 1000000,
158
158
  maxTokens: 128000,
159
159
  },
160
+ "anthropic.claude-opus-4-8": {
161
+ id: "anthropic.claude-opus-4-8",
162
+ name: "Claude Opus 4.8",
163
+ api: "bedrock-converse-stream",
164
+ provider: "amazon-bedrock",
165
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
166
+ reasoning: true,
167
+ input: ["text", "image"],
168
+ cost: {
169
+ input: 5,
170
+ output: 25,
171
+ cacheRead: 0.5,
172
+ cacheWrite: 6.25,
173
+ },
174
+ contextWindow: 1000000,
175
+ maxTokens: 128000,
176
+ },
160
177
  "anthropic.claude-sonnet-4-5-20250929-v1:0": {
161
178
  id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
162
179
  name: "Claude Sonnet 4.5",
@@ -226,6 +243,23 @@ export const MODELS = {
226
243
  contextWindow: 1000000,
227
244
  maxTokens: 128000,
228
245
  },
246
+ "au.anthropic.claude-opus-4-8": {
247
+ id: "au.anthropic.claude-opus-4-8",
248
+ name: "Claude Opus 4.8 (AU)",
249
+ api: "bedrock-converse-stream",
250
+ provider: "amazon-bedrock",
251
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
252
+ reasoning: true,
253
+ input: ["text", "image"],
254
+ cost: {
255
+ input: 5,
256
+ output: 25,
257
+ cacheRead: 0.5,
258
+ cacheWrite: 6.25,
259
+ },
260
+ contextWindow: 1000000,
261
+ maxTokens: 128000,
262
+ },
229
263
  "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
230
264
  id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
231
265
  name: "Claude Sonnet 4.5 (AU)",
@@ -381,6 +415,23 @@ export const MODELS = {
381
415
  contextWindow: 1000000,
382
416
  maxTokens: 128000,
383
417
  },
418
+ "eu.anthropic.claude-opus-4-8": {
419
+ id: "eu.anthropic.claude-opus-4-8",
420
+ name: "Claude Opus 4.8 (EU)",
421
+ api: "bedrock-converse-stream",
422
+ provider: "amazon-bedrock",
423
+ baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
424
+ reasoning: true,
425
+ input: ["text", "image"],
426
+ cost: {
427
+ input: 5,
428
+ output: 25,
429
+ cacheRead: 0.5,
430
+ cacheWrite: 6.25,
431
+ },
432
+ contextWindow: 1000000,
433
+ maxTokens: 128000,
434
+ },
384
435
  "eu.anthropic.claude-sonnet-4-5-20250929-v1:0": {
385
436
  id: "eu.anthropic.claude-sonnet-4-5-20250929-v1:0",
386
437
  name: "Claude Sonnet 4.5 (EU)",
@@ -485,6 +536,23 @@ export const MODELS = {
485
536
  contextWindow: 1000000,
486
537
  maxTokens: 128000,
487
538
  },
539
+ "global.anthropic.claude-opus-4-8": {
540
+ id: "global.anthropic.claude-opus-4-8",
541
+ name: "Claude Opus 4.8 (Global)",
542
+ api: "bedrock-converse-stream",
543
+ provider: "amazon-bedrock",
544
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
545
+ reasoning: true,
546
+ input: ["text", "image"],
547
+ cost: {
548
+ input: 5,
549
+ output: 25,
550
+ cacheRead: 0.5,
551
+ cacheWrite: 6.25,
552
+ },
553
+ contextWindow: 1000000,
554
+ maxTokens: 128000,
555
+ },
488
556
  "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
489
557
  id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
490
558
  name: "Claude Sonnet 4.5 (Global)",
@@ -571,6 +639,23 @@ export const MODELS = {
571
639
  contextWindow: 1000000,
572
640
  maxTokens: 128000,
573
641
  },
642
+ "jp.anthropic.claude-opus-4-8": {
643
+ id: "jp.anthropic.claude-opus-4-8",
644
+ name: "Claude Opus 4.8 (JP)",
645
+ api: "bedrock-converse-stream",
646
+ provider: "amazon-bedrock",
647
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
648
+ reasoning: true,
649
+ input: ["text", "image"],
650
+ cost: {
651
+ input: 5,
652
+ output: 25,
653
+ cacheRead: 0.5,
654
+ cacheWrite: 6.25,
655
+ },
656
+ contextWindow: 1000000,
657
+ maxTokens: 128000,
658
+ },
574
659
  "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
575
660
  id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
576
661
  name: "Claude Sonnet 4.5 (JP)",
@@ -908,8 +993,8 @@ export const MODELS = {
908
993
  cacheRead: 0,
909
994
  cacheWrite: 0,
910
995
  },
911
- contextWindow: 256000,
912
- maxTokens: 256000,
996
+ contextWindow: 262143,
997
+ maxTokens: 16000,
913
998
  },
914
999
  "moonshotai.kimi-k2.5": {
915
1000
  id: "moonshotai.kimi-k2.5",
@@ -925,8 +1010,8 @@ export const MODELS = {
925
1010
  cacheRead: 0,
926
1011
  cacheWrite: 0,
927
1012
  },
928
- contextWindow: 256000,
929
- maxTokens: 256000,
1013
+ contextWindow: 262143,
1014
+ maxTokens: 16000,
930
1015
  },
931
1016
  "nvidia.nemotron-nano-12b-v2": {
932
1017
  id: "nvidia.nemotron-nano-12b-v2",
@@ -1270,6 +1355,23 @@ export const MODELS = {
1270
1355
  contextWindow: 1000000,
1271
1356
  maxTokens: 128000,
1272
1357
  },
1358
+ "us.anthropic.claude-opus-4-8": {
1359
+ id: "us.anthropic.claude-opus-4-8",
1360
+ name: "Claude Opus 4.8 (US)",
1361
+ api: "bedrock-converse-stream",
1362
+ provider: "amazon-bedrock",
1363
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1364
+ reasoning: true,
1365
+ input: ["text", "image"],
1366
+ cost: {
1367
+ input: 5,
1368
+ output: 25,
1369
+ cacheRead: 0.5,
1370
+ cacheWrite: 6.25,
1371
+ },
1372
+ contextWindow: 1000000,
1373
+ maxTokens: 128000,
1374
+ },
1273
1375
  "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1274
1376
  id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1275
1377
  name: "Claude Sonnet 4.5 (US)",
@@ -1750,6 +1852,23 @@ export const MODELS = {
1750
1852
  contextWindow: 1000000,
1751
1853
  maxTokens: 128000,
1752
1854
  },
1855
+ "claude-opus-4-8": {
1856
+ id: "claude-opus-4-8",
1857
+ name: "Claude Opus 4.8",
1858
+ api: "anthropic-messages",
1859
+ provider: "anthropic",
1860
+ baseUrl: "https://api.anthropic.com",
1861
+ reasoning: true,
1862
+ input: ["text", "image"],
1863
+ cost: {
1864
+ input: 5,
1865
+ output: 25,
1866
+ cacheRead: 0.5,
1867
+ cacheWrite: 6.25,
1868
+ },
1869
+ contextWindow: 1000000,
1870
+ maxTokens: 128000,
1871
+ },
1753
1872
  "claude-sonnet-4-0": {
1754
1873
  id: "claude-sonnet-4-0",
1755
1874
  name: "Claude Sonnet 4 (latest)",
@@ -1916,7 +2035,7 @@ export const MODELS = {
1916
2035
  cost: {
1917
2036
  input: 0.1,
1918
2037
  output: 0.4,
1919
- cacheRead: 0.03,
2038
+ cacheRead: 0.025,
1920
2039
  cacheWrite: 0,
1921
2040
  },
1922
2041
  contextWindow: 1047576,
@@ -2001,7 +2120,7 @@ export const MODELS = {
2001
2120
  cost: {
2002
2121
  input: 0.15,
2003
2122
  output: 0.6,
2004
- cacheRead: 0.08,
2123
+ cacheRead: 0.075,
2005
2124
  cacheWrite: 0,
2006
2125
  },
2007
2126
  contextWindow: 128000,
@@ -2127,7 +2246,7 @@ export const MODELS = {
2127
2246
  cost: {
2128
2247
  input: 1.25,
2129
2248
  output: 10,
2130
- cacheRead: 0.13,
2249
+ cacheRead: 0.125,
2131
2250
  cacheWrite: 0,
2132
2251
  },
2133
2252
  contextWindow: 400000,
@@ -2552,7 +2671,7 @@ export const MODELS = {
2552
2671
  cost: {
2553
2672
  input: 1.1,
2554
2673
  output: 4.4,
2555
- cacheRead: 0.28,
2674
+ cacheRead: 0.275,
2556
2675
  cacheWrite: 0,
2557
2676
  },
2558
2677
  contextWindow: 200000,
@@ -2611,23 +2730,6 @@ export const MODELS = {
2611
2730
  contextWindow: 32000,
2612
2731
  maxTokens: 8000,
2613
2732
  },
2614
- "qwen-3-235b-a22b-instruct-2507": {
2615
- id: "qwen-3-235b-a22b-instruct-2507",
2616
- name: "Qwen 3 235B Instruct",
2617
- api: "openai-completions",
2618
- provider: "cerebras",
2619
- baseUrl: "https://api.cerebras.ai/v1",
2620
- reasoning: false,
2621
- input: ["text"],
2622
- cost: {
2623
- input: 0.6,
2624
- output: 1.2,
2625
- cacheRead: 0,
2626
- cacheWrite: 0,
2627
- },
2628
- contextWindow: 131000,
2629
- maxTokens: 32000,
2630
- },
2631
2733
  "zai-glm-4.7": {
2632
2734
  id: "zai-glm-4.7",
2633
2735
  name: "Z.AI GLM-4.7",
@@ -3275,6 +3377,42 @@ export const MODELS = {
3275
3377
  contextWindow: 256000,
3276
3378
  maxTokens: 16384,
3277
3379
  },
3380
+ "@cf/ibm-granite/granite-4.0-h-micro": {
3381
+ id: "@cf/ibm-granite/granite-4.0-h-micro",
3382
+ name: "Granite 4.0 H Micro",
3383
+ api: "openai-completions",
3384
+ provider: "cloudflare-workers-ai",
3385
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3386
+ compat: { "sendSessionAffinityHeaders": true },
3387
+ reasoning: false,
3388
+ input: ["text"],
3389
+ cost: {
3390
+ input: 0.017,
3391
+ output: 0.112,
3392
+ cacheRead: 0,
3393
+ cacheWrite: 0,
3394
+ },
3395
+ contextWindow: 131000,
3396
+ maxTokens: 131000,
3397
+ },
3398
+ "@cf/meta/llama-3.3-70b-instruct-fp8-fast": {
3399
+ id: "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
3400
+ name: "Llama 3.3 70B Instruct fp8 Fast",
3401
+ api: "openai-completions",
3402
+ provider: "cloudflare-workers-ai",
3403
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3404
+ compat: { "sendSessionAffinityHeaders": true },
3405
+ reasoning: false,
3406
+ input: ["text"],
3407
+ cost: {
3408
+ input: 0.293,
3409
+ output: 2.253,
3410
+ cacheRead: 0,
3411
+ cacheWrite: 0,
3412
+ },
3413
+ contextWindow: 24000,
3414
+ maxTokens: 24000,
3415
+ },
3278
3416
  "@cf/meta/llama-4-scout-17b-16e-instruct": {
3279
3417
  id: "@cf/meta/llama-4-scout-17b-16e-instruct",
3280
3418
  name: "Llama 4 Scout 17B 16E Instruct",
@@ -3290,9 +3428,27 @@ export const MODELS = {
3290
3428
  cacheRead: 0,
3291
3429
  cacheWrite: 0,
3292
3430
  },
3293
- contextWindow: 128000,
3431
+ contextWindow: 131000,
3294
3432
  maxTokens: 16384,
3295
3433
  },
3434
+ "@cf/mistralai/mistral-small-3.1-24b-instruct": {
3435
+ id: "@cf/mistralai/mistral-small-3.1-24b-instruct",
3436
+ name: "Mistral Small 3.1 24B Instruct",
3437
+ api: "openai-completions",
3438
+ provider: "cloudflare-workers-ai",
3439
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3440
+ compat: { "sendSessionAffinityHeaders": true },
3441
+ reasoning: false,
3442
+ input: ["text"],
3443
+ cost: {
3444
+ input: 0.351,
3445
+ output: 0.555,
3446
+ cacheRead: 0,
3447
+ cacheWrite: 0,
3448
+ },
3449
+ contextWindow: 128000,
3450
+ maxTokens: 128000,
3451
+ },
3296
3452
  "@cf/moonshotai/kimi-k2.5": {
3297
3453
  id: "@cf/moonshotai/kimi-k2.5",
3298
3454
  name: "Kimi K2.5",
@@ -3326,7 +3482,7 @@ export const MODELS = {
3326
3482
  cacheRead: 0.16,
3327
3483
  cacheWrite: 0,
3328
3484
  },
3329
- contextWindow: 256000,
3485
+ contextWindow: 262144,
3330
3486
  maxTokens: 256000,
3331
3487
  },
3332
3488
  "@cf/nvidia/nemotron-3-120b-a12b": {
@@ -3383,6 +3539,24 @@ export const MODELS = {
3383
3539
  contextWindow: 128000,
3384
3540
  maxTokens: 16384,
3385
3541
  },
3542
+ "@cf/qwen/qwen3-30b-a3b-fp8": {
3543
+ id: "@cf/qwen/qwen3-30b-a3b-fp8",
3544
+ name: "Qwen3 30B A3b fp8",
3545
+ api: "openai-completions",
3546
+ provider: "cloudflare-workers-ai",
3547
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3548
+ compat: { "sendSessionAffinityHeaders": true },
3549
+ reasoning: true,
3550
+ input: ["text"],
3551
+ cost: {
3552
+ input: 0.0509,
3553
+ output: 0.335,
3554
+ cacheRead: 0,
3555
+ cacheWrite: 0,
3556
+ },
3557
+ contextWindow: 32768,
3558
+ maxTokens: 32768,
3559
+ },
3386
3560
  "@cf/zai-org/glm-4.7-flash": {
3387
3561
  id: "@cf/zai-org/glm-4.7-flash",
3388
3562
  name: "GLM-4.7-Flash",
@@ -3393,7 +3567,7 @@ export const MODELS = {
3393
3567
  reasoning: true,
3394
3568
  input: ["text"],
3395
3569
  cost: {
3396
- input: 0.06,
3570
+ input: 0.0605,
3397
3571
  output: 0.4,
3398
3572
  cacheRead: 0,
3399
3573
  cacheWrite: 0,
@@ -3443,39 +3617,22 @@ export const MODELS = {
3443
3617
  },
3444
3618
  },
3445
3619
  "fireworks": {
3446
- "accounts/fireworks/models/deepseek-v3p1": {
3447
- id: "accounts/fireworks/models/deepseek-v3p1",
3448
- name: "DeepSeek V3.1",
3449
- api: "anthropic-messages",
3450
- provider: "fireworks",
3451
- baseUrl: "https://api.fireworks.ai/inference",
3452
- reasoning: true,
3453
- input: ["text"],
3454
- cost: {
3455
- input: 0.56,
3456
- output: 1.68,
3457
- cacheRead: 0,
3458
- cacheWrite: 0,
3459
- },
3460
- contextWindow: 163840,
3461
- maxTokens: 163840,
3462
- },
3463
- "accounts/fireworks/models/deepseek-v3p2": {
3464
- id: "accounts/fireworks/models/deepseek-v3p2",
3465
- name: "DeepSeek V3.2",
3620
+ "accounts/fireworks/models/deepseek-v4-flash": {
3621
+ id: "accounts/fireworks/models/deepseek-v4-flash",
3622
+ name: "DeepSeek V4 Flash",
3466
3623
  api: "anthropic-messages",
3467
3624
  provider: "fireworks",
3468
3625
  baseUrl: "https://api.fireworks.ai/inference",
3469
3626
  reasoning: true,
3470
3627
  input: ["text"],
3471
3628
  cost: {
3472
- input: 0.56,
3473
- output: 1.68,
3474
- cacheRead: 0.28,
3629
+ input: 0.14,
3630
+ output: 0.28,
3631
+ cacheRead: 0.03,
3475
3632
  cacheWrite: 0,
3476
3633
  },
3477
- contextWindow: 160000,
3478
- maxTokens: 160000,
3634
+ contextWindow: 1000000,
3635
+ maxTokens: 384000,
3479
3636
  },
3480
3637
  "accounts/fireworks/models/deepseek-v4-pro": {
3481
3638
  id: "accounts/fireworks/models/deepseek-v4-pro",
@@ -3488,177 +3645,75 @@ export const MODELS = {
3488
3645
  cost: {
3489
3646
  input: 1.74,
3490
3647
  output: 3.48,
3491
- cacheRead: 0.15,
3648
+ cacheRead: 0.145,
3492
3649
  cacheWrite: 0,
3493
3650
  },
3494
3651
  contextWindow: 1000000,
3495
3652
  maxTokens: 384000,
3496
3653
  },
3497
- "accounts/fireworks/models/glm-4p5": {
3498
- id: "accounts/fireworks/models/glm-4p5",
3499
- name: "GLM 4.5",
3654
+ "accounts/fireworks/models/glm-5p1": {
3655
+ id: "accounts/fireworks/models/glm-5p1",
3656
+ name: "GLM 5.1",
3500
3657
  api: "anthropic-messages",
3501
3658
  provider: "fireworks",
3502
3659
  baseUrl: "https://api.fireworks.ai/inference",
3503
3660
  reasoning: true,
3504
3661
  input: ["text"],
3505
3662
  cost: {
3506
- input: 0.55,
3507
- output: 2.19,
3508
- cacheRead: 0,
3663
+ input: 1.4,
3664
+ output: 4.4,
3665
+ cacheRead: 0.26,
3509
3666
  cacheWrite: 0,
3510
3667
  },
3511
- contextWindow: 131072,
3668
+ contextWindow: 202800,
3512
3669
  maxTokens: 131072,
3513
3670
  },
3514
- "accounts/fireworks/models/glm-4p5-air": {
3515
- id: "accounts/fireworks/models/glm-4p5-air",
3516
- name: "GLM 4.5 Air",
3671
+ "accounts/fireworks/models/gpt-oss-120b": {
3672
+ id: "accounts/fireworks/models/gpt-oss-120b",
3673
+ name: "GPT OSS 120B",
3517
3674
  api: "anthropic-messages",
3518
3675
  provider: "fireworks",
3519
3676
  baseUrl: "https://api.fireworks.ai/inference",
3520
3677
  reasoning: true,
3521
3678
  input: ["text"],
3522
3679
  cost: {
3523
- input: 0.22,
3524
- output: 0.88,
3525
- cacheRead: 0,
3680
+ input: 0.15,
3681
+ output: 0.6,
3682
+ cacheRead: 0.015,
3526
3683
  cacheWrite: 0,
3527
3684
  },
3528
3685
  contextWindow: 131072,
3529
- maxTokens: 131072,
3686
+ maxTokens: 32768,
3530
3687
  },
3531
- "accounts/fireworks/models/glm-4p7": {
3532
- id: "accounts/fireworks/models/glm-4p7",
3533
- name: "GLM 4.7",
3688
+ "accounts/fireworks/models/gpt-oss-20b": {
3689
+ id: "accounts/fireworks/models/gpt-oss-20b",
3690
+ name: "GPT OSS 20B",
3534
3691
  api: "anthropic-messages",
3535
3692
  provider: "fireworks",
3536
3693
  baseUrl: "https://api.fireworks.ai/inference",
3537
3694
  reasoning: true,
3538
3695
  input: ["text"],
3539
3696
  cost: {
3540
- input: 0.6,
3541
- output: 2.2,
3542
- cacheRead: 0.3,
3697
+ input: 0.07,
3698
+ output: 0.3,
3699
+ cacheRead: 0.035,
3543
3700
  cacheWrite: 0,
3544
3701
  },
3545
- contextWindow: 198000,
3546
- maxTokens: 198000,
3702
+ contextWindow: 131072,
3703
+ maxTokens: 32768,
3547
3704
  },
3548
- "accounts/fireworks/models/glm-5": {
3549
- id: "accounts/fireworks/models/glm-5",
3550
- name: "GLM 5",
3705
+ "accounts/fireworks/models/kimi-k2p5": {
3706
+ id: "accounts/fireworks/models/kimi-k2p5",
3707
+ name: "Kimi K2.5",
3551
3708
  api: "anthropic-messages",
3552
3709
  provider: "fireworks",
3553
3710
  baseUrl: "https://api.fireworks.ai/inference",
3554
3711
  reasoning: true,
3555
- input: ["text"],
3712
+ input: ["text", "image"],
3556
3713
  cost: {
3557
- input: 1,
3558
- output: 3.2,
3559
- cacheRead: 0.5,
3560
- cacheWrite: 0,
3561
- },
3562
- contextWindow: 202752,
3563
- maxTokens: 131072,
3564
- },
3565
- "accounts/fireworks/models/glm-5p1": {
3566
- id: "accounts/fireworks/models/glm-5p1",
3567
- name: "GLM 5.1",
3568
- api: "anthropic-messages",
3569
- provider: "fireworks",
3570
- baseUrl: "https://api.fireworks.ai/inference",
3571
- reasoning: true,
3572
- input: ["text"],
3573
- cost: {
3574
- input: 1.4,
3575
- output: 4.4,
3576
- cacheRead: 0.26,
3577
- cacheWrite: 0,
3578
- },
3579
- contextWindow: 202800,
3580
- maxTokens: 131072,
3581
- },
3582
- "accounts/fireworks/models/gpt-oss-120b": {
3583
- id: "accounts/fireworks/models/gpt-oss-120b",
3584
- name: "GPT OSS 120B",
3585
- api: "anthropic-messages",
3586
- provider: "fireworks",
3587
- baseUrl: "https://api.fireworks.ai/inference",
3588
- reasoning: true,
3589
- input: ["text"],
3590
- cost: {
3591
- input: 0.15,
3592
- output: 0.6,
3593
- cacheRead: 0,
3594
- cacheWrite: 0,
3595
- },
3596
- contextWindow: 131072,
3597
- maxTokens: 32768,
3598
- },
3599
- "accounts/fireworks/models/gpt-oss-20b": {
3600
- id: "accounts/fireworks/models/gpt-oss-20b",
3601
- name: "GPT OSS 20B",
3602
- api: "anthropic-messages",
3603
- provider: "fireworks",
3604
- baseUrl: "https://api.fireworks.ai/inference",
3605
- reasoning: true,
3606
- input: ["text"],
3607
- cost: {
3608
- input: 0.05,
3609
- output: 0.2,
3610
- cacheRead: 0,
3611
- cacheWrite: 0,
3612
- },
3613
- contextWindow: 131072,
3614
- maxTokens: 32768,
3615
- },
3616
- "accounts/fireworks/models/kimi-k2-instruct": {
3617
- id: "accounts/fireworks/models/kimi-k2-instruct",
3618
- name: "Kimi K2 Instruct",
3619
- api: "anthropic-messages",
3620
- provider: "fireworks",
3621
- baseUrl: "https://api.fireworks.ai/inference",
3622
- reasoning: false,
3623
- input: ["text"],
3624
- cost: {
3625
- input: 1,
3626
- output: 3,
3627
- cacheRead: 0,
3628
- cacheWrite: 0,
3629
- },
3630
- contextWindow: 128000,
3631
- maxTokens: 16384,
3632
- },
3633
- "accounts/fireworks/models/kimi-k2-thinking": {
3634
- id: "accounts/fireworks/models/kimi-k2-thinking",
3635
- name: "Kimi K2 Thinking",
3636
- api: "anthropic-messages",
3637
- provider: "fireworks",
3638
- baseUrl: "https://api.fireworks.ai/inference",
3639
- reasoning: true,
3640
- input: ["text"],
3641
- cost: {
3642
- input: 0.6,
3643
- output: 2.5,
3644
- cacheRead: 0.3,
3645
- cacheWrite: 0,
3646
- },
3647
- contextWindow: 256000,
3648
- maxTokens: 256000,
3649
- },
3650
- "accounts/fireworks/models/kimi-k2p5": {
3651
- id: "accounts/fireworks/models/kimi-k2p5",
3652
- name: "Kimi K2.5",
3653
- api: "anthropic-messages",
3654
- provider: "fireworks",
3655
- baseUrl: "https://api.fireworks.ai/inference",
3656
- reasoning: true,
3657
- input: ["text", "image"],
3658
- cost: {
3659
- input: 0.6,
3660
- output: 3,
3661
- cacheRead: 0.1,
3714
+ input: 0.6,
3715
+ output: 3,
3716
+ cacheRead: 0.1,
3662
3717
  cacheWrite: 0,
3663
3718
  },
3664
3719
  contextWindow: 256000,
@@ -3681,23 +3736,6 @@ export const MODELS = {
3681
3736
  contextWindow: 262000,
3682
3737
  maxTokens: 262000,
3683
3738
  },
3684
- "accounts/fireworks/models/minimax-m2p1": {
3685
- id: "accounts/fireworks/models/minimax-m2p1",
3686
- name: "MiniMax-M2.1",
3687
- api: "anthropic-messages",
3688
- provider: "fireworks",
3689
- baseUrl: "https://api.fireworks.ai/inference",
3690
- reasoning: true,
3691
- input: ["text"],
3692
- cost: {
3693
- input: 0.3,
3694
- output: 1.2,
3695
- cacheRead: 0.03,
3696
- cacheWrite: 0,
3697
- },
3698
- contextWindow: 200000,
3699
- maxTokens: 200000,
3700
- },
3701
3739
  "accounts/fireworks/models/minimax-m2p5": {
3702
3740
  id: "accounts/fireworks/models/minimax-m2p5",
3703
3741
  name: "MiniMax-M2.5",
@@ -3726,7 +3764,7 @@ export const MODELS = {
3726
3764
  cost: {
3727
3765
  input: 0.3,
3728
3766
  output: 1.2,
3729
- cacheRead: 0.03,
3767
+ cacheRead: 0.06,
3730
3768
  cacheWrite: 0,
3731
3769
  },
3732
3770
  contextWindow: 196608,
@@ -3749,22 +3787,39 @@ export const MODELS = {
3749
3787
  contextWindow: 128000,
3750
3788
  maxTokens: 8192,
3751
3789
  },
3752
- "accounts/fireworks/routers/kimi-k2p5-turbo": {
3753
- id: "accounts/fireworks/routers/kimi-k2p5-turbo",
3754
- name: "Kimi K2.5 Turbo",
3790
+ "accounts/fireworks/routers/glm-5p1-fast": {
3791
+ id: "accounts/fireworks/routers/glm-5p1-fast",
3792
+ name: "GLM 5.1 Fast",
3793
+ api: "anthropic-messages",
3794
+ provider: "fireworks",
3795
+ baseUrl: "https://api.fireworks.ai/inference",
3796
+ reasoning: true,
3797
+ input: ["text"],
3798
+ cost: {
3799
+ input: 2.8,
3800
+ output: 8.8,
3801
+ cacheRead: 0.52,
3802
+ cacheWrite: 0,
3803
+ },
3804
+ contextWindow: 202800,
3805
+ maxTokens: 131072,
3806
+ },
3807
+ "accounts/fireworks/routers/kimi-k2p6-turbo": {
3808
+ id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3809
+ name: "Kimi K2.6 Turbo",
3755
3810
  api: "anthropic-messages",
3756
3811
  provider: "fireworks",
3757
3812
  baseUrl: "https://api.fireworks.ai/inference",
3758
3813
  reasoning: true,
3759
3814
  input: ["text", "image"],
3760
3815
  cost: {
3761
- input: 0,
3762
- output: 0,
3763
- cacheRead: 0,
3816
+ input: 2,
3817
+ output: 8,
3818
+ cacheRead: 0.3,
3764
3819
  cacheWrite: 0,
3765
3820
  },
3766
- contextWindow: 256000,
3767
- maxTokens: 256000,
3821
+ contextWindow: 262000,
3822
+ maxTokens: 262000,
3768
3823
  },
3769
3824
  },
3770
3825
  "github-copilot": {
@@ -3784,8 +3839,8 @@ export const MODELS = {
3784
3839
  cacheRead: 0,
3785
3840
  cacheWrite: 0,
3786
3841
  },
3787
- contextWindow: 144000,
3788
- maxTokens: 32000,
3842
+ contextWindow: 200000,
3843
+ maxTokens: 64000,
3789
3844
  },
3790
3845
  "claude-opus-4.5": {
3791
3846
  id: "claude-opus-4.5",
@@ -3802,7 +3857,7 @@ export const MODELS = {
3802
3857
  cacheRead: 0,
3803
3858
  cacheWrite: 0,
3804
3859
  },
3805
- contextWindow: 160000,
3860
+ contextWindow: 200000,
3806
3861
  maxTokens: 32000,
3807
3862
  },
3808
3863
  "claude-opus-4.6": {
@@ -3822,7 +3877,7 @@ export const MODELS = {
3822
3877
  cacheWrite: 0,
3823
3878
  },
3824
3879
  contextWindow: 1000000,
3825
- maxTokens: 64000,
3880
+ maxTokens: 32000,
3826
3881
  },
3827
3882
  "claude-opus-4.7": {
3828
3883
  id: "claude-opus-4.7",
@@ -3840,7 +3895,25 @@ export const MODELS = {
3840
3895
  cacheRead: 0,
3841
3896
  cacheWrite: 0,
3842
3897
  },
3843
- contextWindow: 144000,
3898
+ contextWindow: 200000,
3899
+ maxTokens: 32000,
3900
+ },
3901
+ "claude-opus-4.8": {
3902
+ id: "claude-opus-4.8",
3903
+ name: "Claude Opus 4.8",
3904
+ api: "anthropic-messages",
3905
+ provider: "github-copilot",
3906
+ baseUrl: "https://api.individual.githubcopilot.com",
3907
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3908
+ reasoning: true,
3909
+ input: ["text", "image"],
3910
+ cost: {
3911
+ input: 0,
3912
+ output: 0,
3913
+ cacheRead: 0,
3914
+ cacheWrite: 0,
3915
+ },
3916
+ contextWindow: 200000,
3844
3917
  maxTokens: 64000,
3845
3918
  },
3846
3919
  "claude-sonnet-4.5": {
@@ -3859,7 +3932,7 @@ export const MODELS = {
3859
3932
  cacheRead: 0,
3860
3933
  cacheWrite: 0,
3861
3934
  },
3862
- contextWindow: 144000,
3935
+ contextWindow: 200000,
3863
3936
  maxTokens: 32000,
3864
3937
  },
3865
3938
  "claude-sonnet-4.6": {
@@ -3934,7 +4007,26 @@ export const MODELS = {
3934
4007
  cacheRead: 0,
3935
4008
  cacheWrite: 0,
3936
4009
  },
3937
- contextWindow: 128000,
4010
+ contextWindow: 200000,
4011
+ maxTokens: 64000,
4012
+ },
4013
+ "gemini-3.5-flash": {
4014
+ id: "gemini-3.5-flash",
4015
+ name: "Gemini 3.5 Flash",
4016
+ api: "openai-completions",
4017
+ provider: "github-copilot",
4018
+ baseUrl: "https://api.individual.githubcopilot.com",
4019
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4020
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4021
+ reasoning: true,
4022
+ input: ["text", "image"],
4023
+ cost: {
4024
+ input: 0,
4025
+ output: 0,
4026
+ cacheRead: 0,
4027
+ cacheWrite: 0,
4028
+ },
4029
+ contextWindow: 200000,
3938
4030
  maxTokens: 64000,
3939
4031
  },
3940
4032
  "gpt-4.1": {
@@ -4010,8 +4102,8 @@ export const MODELS = {
4010
4102
  cacheRead: 0,
4011
4103
  cacheWrite: 0,
4012
4104
  },
4013
- contextWindow: 264000,
4014
- maxTokens: 64000,
4105
+ contextWindow: 400000,
4106
+ maxTokens: 128000,
4015
4107
  },
4016
4108
  "gpt-5.2-codex": {
4017
4109
  id: "gpt-5.2-codex",
@@ -4129,57 +4221,6 @@ export const MODELS = {
4129
4221
  },
4130
4222
  },
4131
4223
  "google": {
4132
- "gemini-1.5-flash": {
4133
- id: "gemini-1.5-flash",
4134
- name: "Gemini 1.5 Flash",
4135
- api: "google-generative-ai",
4136
- provider: "google",
4137
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4138
- reasoning: false,
4139
- input: ["text", "image"],
4140
- cost: {
4141
- input: 0.075,
4142
- output: 0.3,
4143
- cacheRead: 0.01875,
4144
- cacheWrite: 0,
4145
- },
4146
- contextWindow: 1000000,
4147
- maxTokens: 8192,
4148
- },
4149
- "gemini-1.5-flash-8b": {
4150
- id: "gemini-1.5-flash-8b",
4151
- name: "Gemini 1.5 Flash-8B",
4152
- api: "google-generative-ai",
4153
- provider: "google",
4154
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4155
- reasoning: false,
4156
- input: ["text", "image"],
4157
- cost: {
4158
- input: 0.0375,
4159
- output: 0.15,
4160
- cacheRead: 0.01,
4161
- cacheWrite: 0,
4162
- },
4163
- contextWindow: 1000000,
4164
- maxTokens: 8192,
4165
- },
4166
- "gemini-1.5-pro": {
4167
- id: "gemini-1.5-pro",
4168
- name: "Gemini 1.5 Pro",
4169
- api: "google-generative-ai",
4170
- provider: "google",
4171
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4172
- reasoning: false,
4173
- input: ["text", "image"],
4174
- cost: {
4175
- input: 1.25,
4176
- output: 5,
4177
- cacheRead: 0.3125,
4178
- cacheWrite: 0,
4179
- },
4180
- contextWindow: 1000000,
4181
- maxTokens: 8192,
4182
- },
4183
4224
  "gemini-2.0-flash": {
4184
4225
  id: "gemini-2.0-flash",
4185
4226
  name: "Gemini 2.0 Flash",
@@ -4199,7 +4240,7 @@ export const MODELS = {
4199
4240
  },
4200
4241
  "gemini-2.0-flash-lite": {
4201
4242
  id: "gemini-2.0-flash-lite",
4202
- name: "Gemini 2.0 Flash Lite",
4243
+ name: "Gemini 2.0 Flash-Lite",
4203
4244
  api: "google-generative-ai",
4204
4245
  provider: "google",
4205
4246
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4233,7 +4274,7 @@ export const MODELS = {
4233
4274
  },
4234
4275
  "gemini-2.5-flash-lite": {
4235
4276
  id: "gemini-2.5-flash-lite",
4236
- name: "Gemini 2.5 Flash Lite",
4277
+ name: "Gemini 2.5 Flash-Lite",
4237
4278
  api: "google-generative-ai",
4238
4279
  provider: "google",
4239
4280
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4248,168 +4289,49 @@ export const MODELS = {
4248
4289
  contextWindow: 1048576,
4249
4290
  maxTokens: 65536,
4250
4291
  },
4251
- "gemini-2.5-flash-lite-preview-06-17": {
4252
- id: "gemini-2.5-flash-lite-preview-06-17",
4253
- name: "Gemini 2.5 Flash Lite Preview 06-17",
4292
+ "gemini-2.5-pro": {
4293
+ id: "gemini-2.5-pro",
4294
+ name: "Gemini 2.5 Pro",
4254
4295
  api: "google-generative-ai",
4255
4296
  provider: "google",
4256
4297
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4257
4298
  reasoning: true,
4258
4299
  input: ["text", "image"],
4259
4300
  cost: {
4260
- input: 0.1,
4261
- output: 0.4,
4262
- cacheRead: 0.025,
4301
+ input: 1.25,
4302
+ output: 10,
4303
+ cacheRead: 0.125,
4263
4304
  cacheWrite: 0,
4264
4305
  },
4265
4306
  contextWindow: 1048576,
4266
4307
  maxTokens: 65536,
4267
4308
  },
4268
- "gemini-2.5-flash-lite-preview-09-2025": {
4269
- id: "gemini-2.5-flash-lite-preview-09-2025",
4270
- name: "Gemini 2.5 Flash Lite Preview 09-25",
4309
+ "gemini-3-flash-preview": {
4310
+ id: "gemini-3-flash-preview",
4311
+ name: "Gemini 3 Flash Preview",
4271
4312
  api: "google-generative-ai",
4272
4313
  provider: "google",
4273
4314
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4274
4315
  reasoning: true,
4316
+ thinkingLevelMap: { "off": null },
4275
4317
  input: ["text", "image"],
4276
4318
  cost: {
4277
- input: 0.1,
4278
- output: 0.4,
4279
- cacheRead: 0.025,
4319
+ input: 0.5,
4320
+ output: 3,
4321
+ cacheRead: 0.05,
4280
4322
  cacheWrite: 0,
4281
4323
  },
4282
4324
  contextWindow: 1048576,
4283
4325
  maxTokens: 65536,
4284
4326
  },
4285
- "gemini-2.5-flash-preview-04-17": {
4286
- id: "gemini-2.5-flash-preview-04-17",
4287
- name: "Gemini 2.5 Flash Preview 04-17",
4327
+ "gemini-3-pro-preview": {
4328
+ id: "gemini-3-pro-preview",
4329
+ name: "Gemini 3 Pro Preview",
4288
4330
  api: "google-generative-ai",
4289
4331
  provider: "google",
4290
4332
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4291
4333
  reasoning: true,
4292
- input: ["text", "image"],
4293
- cost: {
4294
- input: 0.15,
4295
- output: 0.6,
4296
- cacheRead: 0.0375,
4297
- cacheWrite: 0,
4298
- },
4299
- contextWindow: 1048576,
4300
- maxTokens: 65536,
4301
- },
4302
- "gemini-2.5-flash-preview-05-20": {
4303
- id: "gemini-2.5-flash-preview-05-20",
4304
- name: "Gemini 2.5 Flash Preview 05-20",
4305
- api: "google-generative-ai",
4306
- provider: "google",
4307
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4308
- reasoning: true,
4309
- input: ["text", "image"],
4310
- cost: {
4311
- input: 0.15,
4312
- output: 0.6,
4313
- cacheRead: 0.0375,
4314
- cacheWrite: 0,
4315
- },
4316
- contextWindow: 1048576,
4317
- maxTokens: 65536,
4318
- },
4319
- "gemini-2.5-flash-preview-09-2025": {
4320
- id: "gemini-2.5-flash-preview-09-2025",
4321
- name: "Gemini 2.5 Flash Preview 09-25",
4322
- api: "google-generative-ai",
4323
- provider: "google",
4324
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4325
- reasoning: true,
4326
- input: ["text", "image"],
4327
- cost: {
4328
- input: 0.3,
4329
- output: 2.5,
4330
- cacheRead: 0.075,
4331
- cacheWrite: 0,
4332
- },
4333
- contextWindow: 1048576,
4334
- maxTokens: 65536,
4335
- },
4336
- "gemini-2.5-pro": {
4337
- id: "gemini-2.5-pro",
4338
- name: "Gemini 2.5 Pro",
4339
- api: "google-generative-ai",
4340
- provider: "google",
4341
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4342
- reasoning: true,
4343
- input: ["text", "image"],
4344
- cost: {
4345
- input: 1.25,
4346
- output: 10,
4347
- cacheRead: 0.125,
4348
- cacheWrite: 0,
4349
- },
4350
- contextWindow: 1048576,
4351
- maxTokens: 65536,
4352
- },
4353
- "gemini-2.5-pro-preview-05-06": {
4354
- id: "gemini-2.5-pro-preview-05-06",
4355
- name: "Gemini 2.5 Pro Preview 05-06",
4356
- api: "google-generative-ai",
4357
- provider: "google",
4358
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4359
- reasoning: true,
4360
- input: ["text", "image"],
4361
- cost: {
4362
- input: 1.25,
4363
- output: 10,
4364
- cacheRead: 0.31,
4365
- cacheWrite: 0,
4366
- },
4367
- contextWindow: 1048576,
4368
- maxTokens: 65536,
4369
- },
4370
- "gemini-2.5-pro-preview-06-05": {
4371
- id: "gemini-2.5-pro-preview-06-05",
4372
- name: "Gemini 2.5 Pro Preview 06-05",
4373
- api: "google-generative-ai",
4374
- provider: "google",
4375
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4376
- reasoning: true,
4377
- input: ["text", "image"],
4378
- cost: {
4379
- input: 1.25,
4380
- output: 10,
4381
- cacheRead: 0.31,
4382
- cacheWrite: 0,
4383
- },
4384
- contextWindow: 1048576,
4385
- maxTokens: 65536,
4386
- },
4387
- "gemini-3-flash-preview": {
4388
- id: "gemini-3-flash-preview",
4389
- name: "Gemini 3 Flash Preview",
4390
- api: "google-generative-ai",
4391
- provider: "google",
4392
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4393
- reasoning: true,
4394
- thinkingLevelMap: { "off": null },
4395
- input: ["text", "image"],
4396
- cost: {
4397
- input: 0.5,
4398
- output: 3,
4399
- cacheRead: 0.05,
4400
- cacheWrite: 0,
4401
- },
4402
- contextWindow: 1048576,
4403
- maxTokens: 65536,
4404
- },
4405
- "gemini-3-pro-preview": {
4406
- id: "gemini-3-pro-preview",
4407
- name: "Gemini 3 Pro Preview",
4408
- api: "google-generative-ai",
4409
- provider: "google",
4410
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4411
- reasoning: true,
4412
- thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4334
+ thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4413
4335
  input: ["text", "image"],
4414
4336
  cost: {
4415
4337
  input: 2,
@@ -4417,8 +4339,8 @@ export const MODELS = {
4417
4339
  cacheRead: 0.2,
4418
4340
  cacheWrite: 0,
4419
4341
  },
4420
- contextWindow: 1000000,
4421
- maxTokens: 64000,
4342
+ contextWindow: 1048576,
4343
+ maxTokens: 65536,
4422
4344
  },
4423
4345
  "gemini-3.1-flash-lite": {
4424
4346
  id: "gemini-3.1-flash-lite",
@@ -4492,6 +4414,24 @@ export const MODELS = {
4492
4414
  contextWindow: 1048576,
4493
4415
  maxTokens: 65536,
4494
4416
  },
4417
+ "gemini-3.5-flash": {
4418
+ id: "gemini-3.5-flash",
4419
+ name: "Gemini 3.5 Flash",
4420
+ api: "google-generative-ai",
4421
+ provider: "google",
4422
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4423
+ reasoning: true,
4424
+ thinkingLevelMap: { "off": null },
4425
+ input: ["text", "image"],
4426
+ cost: {
4427
+ input: 1.5,
4428
+ output: 9,
4429
+ cacheRead: 0.15,
4430
+ cacheWrite: 0,
4431
+ },
4432
+ contextWindow: 1048576,
4433
+ maxTokens: 65536,
4434
+ },
4495
4435
  "gemini-flash-latest": {
4496
4436
  id: "gemini-flash-latest",
4497
4437
  name: "Gemini Flash Latest",
@@ -4526,60 +4466,9 @@ export const MODELS = {
4526
4466
  contextWindow: 1048576,
4527
4467
  maxTokens: 65536,
4528
4468
  },
4529
- "gemini-live-2.5-flash": {
4530
- id: "gemini-live-2.5-flash",
4531
- name: "Gemini Live 2.5 Flash",
4532
- api: "google-generative-ai",
4533
- provider: "google",
4534
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4535
- reasoning: true,
4536
- input: ["text", "image"],
4537
- cost: {
4538
- input: 0.5,
4539
- output: 2,
4540
- cacheRead: 0,
4541
- cacheWrite: 0,
4542
- },
4543
- contextWindow: 128000,
4544
- maxTokens: 8000,
4545
- },
4546
- "gemini-live-2.5-flash-preview-native-audio": {
4547
- id: "gemini-live-2.5-flash-preview-native-audio",
4548
- name: "Gemini Live 2.5 Flash Preview Native Audio",
4549
- api: "google-generative-ai",
4550
- provider: "google",
4551
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4552
- reasoning: true,
4553
- input: ["text"],
4554
- cost: {
4555
- input: 0.5,
4556
- output: 2,
4557
- cacheRead: 0,
4558
- cacheWrite: 0,
4559
- },
4560
- contextWindow: 131072,
4561
- maxTokens: 65536,
4562
- },
4563
- "gemma-3-27b-it": {
4564
- id: "gemma-3-27b-it",
4565
- name: "Gemma 3 27B",
4566
- api: "google-generative-ai",
4567
- provider: "google",
4568
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4569
- reasoning: false,
4570
- input: ["text", "image"],
4571
- cost: {
4572
- input: 0,
4573
- output: 0,
4574
- cacheRead: 0,
4575
- cacheWrite: 0,
4576
- },
4577
- contextWindow: 131072,
4578
- maxTokens: 8192,
4579
- },
4580
4469
  "gemma-4-26b-a4b-it": {
4581
4470
  id: "gemma-4-26b-a4b-it",
4582
- name: "Gemma 4 26B",
4471
+ name: "Gemma 4 26B A4B IT",
4583
4472
  api: "google-generative-ai",
4584
4473
  provider: "google",
4585
4474
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4592,12 +4481,12 @@ export const MODELS = {
4592
4481
  cacheRead: 0,
4593
4482
  cacheWrite: 0,
4594
4483
  },
4595
- contextWindow: 256000,
4596
- maxTokens: 8192,
4484
+ contextWindow: 262144,
4485
+ maxTokens: 32768,
4597
4486
  },
4598
4487
  "gemma-4-31b-it": {
4599
4488
  id: "gemma-4-31b-it",
4600
- name: "Gemma 4 31B",
4489
+ name: "Gemma 4 31B IT",
4601
4490
  api: "google-generative-ai",
4602
4491
  provider: "google",
4603
4492
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4610,8 +4499,8 @@ export const MODELS = {
4610
4499
  cacheRead: 0,
4611
4500
  cacheWrite: 0,
4612
4501
  },
4613
- contextWindow: 256000,
4614
- maxTokens: 8192,
4502
+ contextWindow: 262144,
4503
+ maxTokens: 32768,
4615
4504
  },
4616
4505
  },
4617
4506
  "google-vertex": {
@@ -5057,7 +4946,7 @@ export const MODELS = {
5057
4946
  cost: {
5058
4947
  input: 1,
5059
4948
  output: 3,
5060
- cacheRead: 0,
4949
+ cacheRead: 0.5,
5061
4950
  cacheWrite: 0,
5062
4951
  },
5063
4952
  contextWindow: 262144,
@@ -5074,7 +4963,7 @@ export const MODELS = {
5074
4963
  cost: {
5075
4964
  input: 0.15,
5076
4965
  output: 0.6,
5077
- cacheRead: 0,
4966
+ cacheRead: 0.075,
5078
4967
  cacheWrite: 0,
5079
4968
  },
5080
4969
  contextWindow: 131072,
@@ -5091,7 +4980,7 @@ export const MODELS = {
5091
4980
  cost: {
5092
4981
  input: 0.075,
5093
4982
  output: 0.3,
5094
- cacheRead: 0,
4983
+ cacheRead: 0.0375,
5095
4984
  cacheWrite: 0,
5096
4985
  },
5097
4986
  contextWindow: 131072,
@@ -5377,9 +5266,9 @@ export const MODELS = {
5377
5266
  reasoning: true,
5378
5267
  input: ["text"],
5379
5268
  cost: {
5380
- input: 1.74,
5381
- output: 3.48,
5382
- cacheRead: 0.145,
5269
+ input: 0.435,
5270
+ output: 0.87,
5271
+ cacheRead: 0.003625,
5383
5272
  cacheWrite: 0,
5384
5273
  },
5385
5274
  contextWindow: 1048576,
@@ -6474,7 +6363,7 @@ export const MODELS = {
6474
6363
  cost: {
6475
6364
  input: 0.14,
6476
6365
  output: 0.28,
6477
- cacheRead: 0.028,
6366
+ cacheRead: 0.0028,
6478
6367
  cacheWrite: 0,
6479
6368
  },
6480
6369
  contextWindow: 1048576,
@@ -6491,9 +6380,9 @@ export const MODELS = {
6491
6380
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
6492
6381
  input: ["text"],
6493
6382
  cost: {
6494
- input: 1.74,
6495
- output: 3.48,
6496
- cacheRead: 0.145,
6383
+ input: 0.435,
6384
+ output: 0.87,
6385
+ cacheRead: 0.003625,
6497
6386
  cacheWrite: 0,
6498
6387
  },
6499
6388
  contextWindow: 1048576,
@@ -7362,7 +7251,7 @@ export const MODELS = {
7362
7251
  cost: {
7363
7252
  input: 0.1,
7364
7253
  output: 0.4,
7365
- cacheRead: 0.03,
7254
+ cacheRead: 0.025,
7366
7255
  cacheWrite: 0,
7367
7256
  },
7368
7257
  contextWindow: 1047576,
@@ -7447,7 +7336,7 @@ export const MODELS = {
7447
7336
  cost: {
7448
7337
  input: 0.15,
7449
7338
  output: 0.6,
7450
- cacheRead: 0.08,
7339
+ cacheRead: 0.075,
7451
7340
  cacheWrite: 0,
7452
7341
  },
7453
7342
  contextWindow: 128000,
@@ -7573,7 +7462,7 @@ export const MODELS = {
7573
7462
  cost: {
7574
7463
  input: 1.25,
7575
7464
  output: 10,
7576
- cacheRead: 0.13,
7465
+ cacheRead: 0.125,
7577
7466
  cacheWrite: 0,
7578
7467
  },
7579
7468
  contextWindow: 400000,
@@ -7998,7 +7887,7 @@ export const MODELS = {
7998
7887
  cost: {
7999
7888
  input: 1.1,
8000
7889
  output: 4.4,
8001
- cacheRead: 0.28,
7890
+ cacheRead: 0.275,
8002
7891
  cacheWrite: 0,
8003
7892
  },
8004
7893
  contextWindow: 200000,
@@ -8218,7 +8107,7 @@ export const MODELS = {
8218
8107
  cacheWrite: 0,
8219
8108
  },
8220
8109
  contextWindow: 200000,
8221
- maxTokens: 128000,
8110
+ maxTokens: 32000,
8222
8111
  },
8223
8112
  "claude-haiku-4-5": {
8224
8113
  id: "claude-haiku-4-5",
@@ -8307,6 +8196,23 @@ export const MODELS = {
8307
8196
  contextWindow: 1000000,
8308
8197
  maxTokens: 128000,
8309
8198
  },
8199
+ "claude-opus-4-8": {
8200
+ id: "claude-opus-4-8",
8201
+ name: "Claude Opus 4.8",
8202
+ api: "anthropic-messages",
8203
+ provider: "opencode",
8204
+ baseUrl: "https://opencode.ai/zen",
8205
+ reasoning: true,
8206
+ input: ["text", "image"],
8207
+ cost: {
8208
+ input: 5,
8209
+ output: 25,
8210
+ cacheRead: 0.5,
8211
+ cacheWrite: 6.25,
8212
+ },
8213
+ contextWindow: 1000000,
8214
+ maxTokens: 128000,
8215
+ },
8310
8216
  "claude-sonnet-4": {
8311
8217
  id: "claude-sonnet-4",
8312
8218
  name: "Claude Sonnet 4",
@@ -8374,8 +8280,8 @@ export const MODELS = {
8374
8280
  cacheRead: 0,
8375
8281
  cacheWrite: 0,
8376
8282
  },
8377
- contextWindow: 1000000,
8378
- maxTokens: 384000,
8283
+ contextWindow: 200000,
8284
+ maxTokens: 128000,
8379
8285
  },
8380
8286
  "gemini-3-flash": {
8381
8287
  id: "gemini-3-flash",
@@ -8413,6 +8319,24 @@ export const MODELS = {
8413
8319
  contextWindow: 1048576,
8414
8320
  maxTokens: 65536,
8415
8321
  },
8322
+ "gemini-3.5-flash": {
8323
+ id: "gemini-3.5-flash",
8324
+ name: "Gemini 3.5 Flash",
8325
+ api: "google-generative-ai",
8326
+ provider: "opencode",
8327
+ baseUrl: "https://opencode.ai/zen/v1",
8328
+ reasoning: true,
8329
+ thinkingLevelMap: { "off": null },
8330
+ input: ["text", "image"],
8331
+ cost: {
8332
+ input: 1.5,
8333
+ output: 9,
8334
+ cacheRead: 0.15,
8335
+ cacheWrite: 0,
8336
+ },
8337
+ contextWindow: 1048576,
8338
+ maxTokens: 65536,
8339
+ },
8416
8340
  "glm-5": {
8417
8341
  id: "glm-5",
8418
8342
  name: "GLM-5",
@@ -8735,6 +8659,23 @@ export const MODELS = {
8735
8659
  contextWindow: 1050000,
8736
8660
  maxTokens: 128000,
8737
8661
  },
8662
+ "grok-build-0.1": {
8663
+ id: "grok-build-0.1",
8664
+ name: "Grok Build 0.1",
8665
+ api: "openai-completions",
8666
+ provider: "opencode",
8667
+ baseUrl: "https://opencode.ai/zen/v1",
8668
+ reasoning: true,
8669
+ input: ["text", "image"],
8670
+ cost: {
8671
+ input: 1,
8672
+ output: 2,
8673
+ cacheRead: 0.2,
8674
+ cacheWrite: 0,
8675
+ },
8676
+ contextWindow: 256000,
8677
+ maxTokens: 256000,
8678
+ },
8738
8679
  "kimi-k2.5": {
8739
8680
  id: "kimi-k2.5",
8740
8681
  name: "Kimi K2.5",
@@ -8769,35 +8710,35 @@ export const MODELS = {
8769
8710
  contextWindow: 262144,
8770
8711
  maxTokens: 65536,
8771
8712
  },
8772
- "minimax-m2.5": {
8773
- id: "minimax-m2.5",
8774
- name: "MiniMax M2.5",
8713
+ "mimo-v2.5-free": {
8714
+ id: "mimo-v2.5-free",
8715
+ name: "MiMo V2.5 Free",
8775
8716
  api: "openai-completions",
8776
8717
  provider: "opencode",
8777
8718
  baseUrl: "https://opencode.ai/zen/v1",
8778
8719
  reasoning: true,
8779
- input: ["text"],
8720
+ input: ["text", "image"],
8780
8721
  cost: {
8781
- input: 0.3,
8782
- output: 1.2,
8783
- cacheRead: 0.06,
8722
+ input: 0,
8723
+ output: 0,
8724
+ cacheRead: 0,
8784
8725
  cacheWrite: 0,
8785
8726
  },
8786
- contextWindow: 204800,
8787
- maxTokens: 131072,
8727
+ contextWindow: 1000000,
8728
+ maxTokens: 128000,
8788
8729
  },
8789
- "minimax-m2.5-free": {
8790
- id: "minimax-m2.5-free",
8791
- name: "MiniMax M2.5 Free",
8792
- api: "anthropic-messages",
8730
+ "minimax-m2.5": {
8731
+ id: "minimax-m2.5",
8732
+ name: "MiniMax M2.5",
8733
+ api: "openai-completions",
8793
8734
  provider: "opencode",
8794
- baseUrl: "https://opencode.ai/zen",
8735
+ baseUrl: "https://opencode.ai/zen/v1",
8795
8736
  reasoning: true,
8796
8737
  input: ["text"],
8797
8738
  cost: {
8798
- input: 0,
8799
- output: 0,
8800
- cacheRead: 0,
8739
+ input: 0.3,
8740
+ output: 1.2,
8741
+ cacheRead: 0.06,
8801
8742
  cacheWrite: 0,
8802
8743
  },
8803
8744
  contextWindow: 204800,
@@ -8871,23 +8812,6 @@ export const MODELS = {
8871
8812
  contextWindow: 262144,
8872
8813
  maxTokens: 65536,
8873
8814
  },
8874
- "qwen3.6-plus-free": {
8875
- id: "qwen3.6-plus-free",
8876
- name: "Qwen3.6 Plus Free",
8877
- api: "anthropic-messages",
8878
- provider: "opencode",
8879
- baseUrl: "https://opencode.ai/zen",
8880
- reasoning: true,
8881
- input: ["text", "image"],
8882
- cost: {
8883
- input: 0,
8884
- output: 0,
8885
- cacheRead: 0,
8886
- cacheWrite: 0,
8887
- },
8888
- contextWindow: 262144,
8889
- maxTokens: 65536,
8890
- },
8891
8815
  },
8892
8816
  "opencode-go": {
8893
8817
  "deepseek-v4-flash": {
@@ -9005,9 +8929,9 @@ export const MODELS = {
9005
8929
  reasoning: true,
9006
8930
  input: ["text", "image"],
9007
8931
  cost: {
9008
- input: 0.4,
9009
- output: 2,
9010
- cacheRead: 0.08,
8932
+ input: 0.14,
8933
+ output: 0.28,
8934
+ cacheRead: 0.0028,
9011
8935
  cacheWrite: 0,
9012
8936
  },
9013
8937
  contextWindow: 1000000,
@@ -9022,9 +8946,9 @@ export const MODELS = {
9022
8946
  reasoning: true,
9023
8947
  input: ["text"],
9024
8948
  cost: {
9025
- input: 1,
9026
- output: 3,
9027
- cacheRead: 0.2,
8949
+ input: 1.74,
8950
+ output: 3.48,
8951
+ cacheRead: 0.0145,
9028
8952
  cacheWrite: 0,
9029
8953
  },
9030
8954
  contextWindow: 1048576,
@@ -9064,24 +8988,6 @@ export const MODELS = {
9064
8988
  contextWindow: 204800,
9065
8989
  maxTokens: 131072,
9066
8990
  },
9067
- "qwen3.5-plus": {
9068
- id: "qwen3.5-plus",
9069
- name: "Qwen3.5 Plus",
9070
- api: "openai-completions",
9071
- provider: "opencode-go",
9072
- baseUrl: "https://opencode.ai/zen/go/v1",
9073
- compat: { "thinkingFormat": "qwen" },
9074
- reasoning: true,
9075
- input: ["text", "image"],
9076
- cost: {
9077
- input: 0.2,
9078
- output: 1.2,
9079
- cacheRead: 0.02,
9080
- cacheWrite: 0.25,
9081
- },
9082
- contextWindow: 262144,
9083
- maxTokens: 65536,
9084
- },
9085
8991
  "qwen3.6-plus": {
9086
8992
  id: "qwen3.6-plus",
9087
8993
  name: "Qwen3.6 Plus",
@@ -9100,6 +9006,23 @@ export const MODELS = {
9100
9006
  contextWindow: 262144,
9101
9007
  maxTokens: 65536,
9102
9008
  },
9009
+ "qwen3.7-max": {
9010
+ id: "qwen3.7-max",
9011
+ name: "Qwen3.7 Max",
9012
+ api: "anthropic-messages",
9013
+ provider: "opencode-go",
9014
+ baseUrl: "https://opencode.ai/zen/go",
9015
+ reasoning: true,
9016
+ input: ["text"],
9017
+ cost: {
9018
+ input: 2.5,
9019
+ output: 7.5,
9020
+ cacheRead: 0.5,
9021
+ cacheWrite: 3.125,
9022
+ },
9023
+ contextWindow: 1000000,
9024
+ maxTokens: 65536,
9025
+ },
9103
9026
  },
9104
9027
  "openrouter": {
9105
9028
  "ai21/jamba-large-1.7": {
@@ -9119,23 +9042,6 @@ export const MODELS = {
9119
9042
  contextWindow: 256000,
9120
9043
  maxTokens: 4096,
9121
9044
  },
9122
- "alibaba/tongyi-deepresearch-30b-a3b": {
9123
- id: "alibaba/tongyi-deepresearch-30b-a3b",
9124
- name: "Tongyi DeepResearch 30B A3B",
9125
- api: "openai-completions",
9126
- provider: "openrouter",
9127
- baseUrl: "https://openrouter.ai/api/v1",
9128
- reasoning: true,
9129
- input: ["text"],
9130
- cost: {
9131
- input: 0.09,
9132
- output: 0.44999999999999996,
9133
- cacheRead: 0.09,
9134
- cacheWrite: 0,
9135
- },
9136
- contextWindow: 131072,
9137
- maxTokens: 131072,
9138
- },
9139
9045
  "amazon/nova-2-lite-v1": {
9140
9046
  id: "amazon/nova-2-lite-v1",
9141
9047
  name: "Amazon: Nova 2 Lite",
@@ -9395,6 +9301,40 @@ export const MODELS = {
9395
9301
  contextWindow: 1000000,
9396
9302
  maxTokens: 128000,
9397
9303
  },
9304
+ "anthropic/claude-opus-4.8": {
9305
+ id: "anthropic/claude-opus-4.8",
9306
+ name: "Anthropic: Claude Opus 4.8",
9307
+ api: "openai-completions",
9308
+ provider: "openrouter",
9309
+ baseUrl: "https://openrouter.ai/api/v1",
9310
+ reasoning: true,
9311
+ input: ["text", "image"],
9312
+ cost: {
9313
+ input: 5,
9314
+ output: 25,
9315
+ cacheRead: 0.5,
9316
+ cacheWrite: 6.25,
9317
+ },
9318
+ contextWindow: 1000000,
9319
+ maxTokens: 128000,
9320
+ },
9321
+ "anthropic/claude-opus-4.8-fast": {
9322
+ id: "anthropic/claude-opus-4.8-fast",
9323
+ name: "Anthropic: Claude Opus 4.8 (Fast)",
9324
+ api: "openai-completions",
9325
+ provider: "openrouter",
9326
+ baseUrl: "https://openrouter.ai/api/v1",
9327
+ reasoning: true,
9328
+ input: ["text", "image"],
9329
+ cost: {
9330
+ input: 10,
9331
+ output: 50,
9332
+ cacheRead: 1,
9333
+ cacheWrite: 12.5,
9334
+ },
9335
+ contextWindow: 1000000,
9336
+ maxTokens: 128000,
9337
+ },
9398
9338
  "anthropic/claude-sonnet-4": {
9399
9339
  id: "anthropic/claude-sonnet-4",
9400
9340
  name: "Anthropic: Claude Sonnet 4",
@@ -9446,23 +9386,6 @@ export const MODELS = {
9446
9386
  contextWindow: 1000000,
9447
9387
  maxTokens: 128000,
9448
9388
  },
9449
- "arcee-ai/trinity-large-preview": {
9450
- id: "arcee-ai/trinity-large-preview",
9451
- name: "Arcee AI: Trinity Large Preview",
9452
- api: "openai-completions",
9453
- provider: "openrouter",
9454
- baseUrl: "https://openrouter.ai/api/v1",
9455
- reasoning: false,
9456
- input: ["text"],
9457
- cost: {
9458
- input: 0.15,
9459
- output: 0.44999999999999996,
9460
- cacheRead: 0,
9461
- cacheWrite: 0,
9462
- },
9463
- contextWindow: 131000,
9464
- maxTokens: 4096,
9465
- },
9466
9389
  "arcee-ai/trinity-large-thinking": {
9467
9390
  id: "arcee-ai/trinity-large-thinking",
9468
9391
  name: "Arcee AI: Trinity Large Thinking",
@@ -9480,23 +9403,6 @@ export const MODELS = {
9480
9403
  contextWindow: 262144,
9481
9404
  maxTokens: 262144,
9482
9405
  },
9483
- "arcee-ai/trinity-large-thinking:free": {
9484
- id: "arcee-ai/trinity-large-thinking:free",
9485
- name: "Arcee AI: Trinity Large Thinking (free)",
9486
- api: "openai-completions",
9487
- provider: "openrouter",
9488
- baseUrl: "https://openrouter.ai/api/v1",
9489
- reasoning: true,
9490
- input: ["text"],
9491
- cost: {
9492
- input: 0,
9493
- output: 0,
9494
- cacheRead: 0,
9495
- cacheWrite: 0,
9496
- },
9497
- contextWindow: 262144,
9498
- maxTokens: 80000,
9499
- },
9500
9406
  "arcee-ai/trinity-mini": {
9501
9407
  id: "arcee-ai/trinity-mini",
9502
9408
  name: "Arcee AI: Trinity Mini",
@@ -9548,23 +9454,6 @@ export const MODELS = {
9548
9454
  contextWindow: 2000000,
9549
9455
  maxTokens: 30000,
9550
9456
  },
9551
- "baidu/cobuddy:free": {
9552
- id: "baidu/cobuddy:free",
9553
- name: "Baidu Qianfan: CoBuddy (free)",
9554
- api: "openai-completions",
9555
- provider: "openrouter",
9556
- baseUrl: "https://openrouter.ai/api/v1",
9557
- reasoning: true,
9558
- input: ["text"],
9559
- cost: {
9560
- input: 0,
9561
- output: 0,
9562
- cacheRead: 0,
9563
- cacheWrite: 0,
9564
- },
9565
- contextWindow: 131072,
9566
- maxTokens: 65536,
9567
- },
9568
9457
  "baidu/ernie-4.5-21b-a3b": {
9569
9458
  id: "baidu/ernie-4.5-21b-a3b",
9570
9459
  name: "Baidu: ERNIE 4.5 21B A3B",
@@ -9579,7 +9468,7 @@ export const MODELS = {
9579
9468
  cacheRead: 0,
9580
9469
  cacheWrite: 0,
9581
9470
  },
9582
- contextWindow: 120000,
9471
+ contextWindow: 131072,
9583
9472
  maxTokens: 8000,
9584
9473
  },
9585
9474
  "baidu/ernie-4.5-vl-28b-a3b": {
@@ -9596,7 +9485,7 @@ export const MODELS = {
9596
9485
  cacheRead: 0,
9597
9486
  cacheWrite: 0,
9598
9487
  },
9599
- contextWindow: 30000,
9488
+ contextWindow: 131072,
9600
9489
  maxTokens: 8000,
9601
9490
  },
9602
9491
  "bytedance-seed/seed-1.6": {
@@ -9710,13 +9599,13 @@ export const MODELS = {
9710
9599
  reasoning: false,
9711
9600
  input: ["text"],
9712
9601
  cost: {
9713
- input: 0.32,
9714
- output: 0.8899999999999999,
9602
+ input: 0.2288,
9603
+ output: 0.9144,
9715
9604
  cacheRead: 0,
9716
9605
  cacheWrite: 0,
9717
9606
  },
9718
- contextWindow: 163840,
9719
- maxTokens: 16384,
9607
+ contextWindow: 131072,
9608
+ maxTokens: 16000,
9720
9609
  },
9721
9610
  "deepseek/deepseek-chat-v3-0324": {
9722
9611
  id: "deepseek/deepseek-chat-v3-0324",
@@ -9766,7 +9655,7 @@ export const MODELS = {
9766
9655
  cacheRead: 0,
9767
9656
  cacheWrite: 0,
9768
9657
  },
9769
- contextWindow: 64000,
9658
+ contextWindow: 163840,
9770
9659
  maxTokens: 16000,
9771
9660
  },
9772
9661
  "deepseek/deepseek-r1-0528": {
@@ -9848,13 +9737,13 @@ export const MODELS = {
9848
9737
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
9849
9738
  input: ["text"],
9850
9739
  cost: {
9851
- input: 0.126,
9852
- output: 0.252,
9853
- cacheRead: 0.0252,
9740
+ input: 0.09999999999999999,
9741
+ output: 0.19999999999999998,
9742
+ cacheRead: 0.02,
9854
9743
  cacheWrite: 0,
9855
9744
  },
9856
9745
  contextWindow: 1048576,
9857
- maxTokens: 131072,
9746
+ maxTokens: 16384,
9858
9747
  },
9859
9748
  "deepseek/deepseek-v4-flash:free": {
9860
9749
  id: "deepseek/deepseek-v4-flash:free",
@@ -10129,6 +10018,23 @@ export const MODELS = {
10129
10018
  cacheRead: 0.19999999999999998,
10130
10019
  cacheWrite: 0.375,
10131
10020
  },
10021
+ contextWindow: 1048756,
10022
+ maxTokens: 65536,
10023
+ },
10024
+ "google/gemini-3.5-flash": {
10025
+ id: "google/gemini-3.5-flash",
10026
+ name: "Google: Gemini 3.5 Flash",
10027
+ api: "openai-completions",
10028
+ provider: "openrouter",
10029
+ baseUrl: "https://openrouter.ai/api/v1",
10030
+ reasoning: true,
10031
+ input: ["text", "image"],
10032
+ cost: {
10033
+ input: 1.5,
10034
+ output: 9,
10035
+ cacheRead: 0.15,
10036
+ cacheWrite: 0.08333333333333334,
10037
+ },
10132
10038
  contextWindow: 1048576,
10133
10039
  maxTokens: 65536,
10134
10040
  },
@@ -10277,9 +10183,9 @@ export const MODELS = {
10277
10183
  reasoning: false,
10278
10184
  input: ["text"],
10279
10185
  cost: {
10280
- input: 0.3,
10281
- output: 2.5,
10282
- cacheRead: 0.06,
10186
+ input: 0.075,
10187
+ output: 0.625,
10188
+ cacheRead: 0.015,
10283
10189
  cacheWrite: 0,
10284
10190
  },
10285
10191
  contextWindow: 262144,
@@ -10302,18 +10208,18 @@ export const MODELS = {
10302
10208
  contextWindow: 262144,
10303
10209
  maxTokens: 32768,
10304
10210
  },
10305
- "inclusionai/ring-2.6-1t:free": {
10306
- id: "inclusionai/ring-2.6-1t:free",
10307
- name: "inclusionAI: Ring-2.6-1T (free)",
10211
+ "inclusionai/ring-2.6-1t": {
10212
+ id: "inclusionai/ring-2.6-1t",
10213
+ name: "inclusionAI: Ring-2.6-1T",
10308
10214
  api: "openai-completions",
10309
10215
  provider: "openrouter",
10310
10216
  baseUrl: "https://openrouter.ai/api/v1",
10311
10217
  reasoning: true,
10312
10218
  input: ["text"],
10313
10219
  cost: {
10314
- input: 0,
10315
- output: 0,
10316
- cacheRead: 0,
10220
+ input: 0.075,
10221
+ output: 0.625,
10222
+ cacheRead: 0.015,
10317
10223
  cacheWrite: 0,
10318
10224
  },
10319
10225
  contextWindow: 262144,
@@ -10367,7 +10273,7 @@ export const MODELS = {
10367
10273
  cacheRead: 0,
10368
10274
  cacheWrite: 0,
10369
10275
  },
10370
- contextWindow: 16384,
10276
+ contextWindow: 131072,
10371
10277
  maxTokens: 16384,
10372
10278
  },
10373
10279
  "meta-llama/llama-3.3-70b-instruct": {
@@ -10401,7 +10307,7 @@ export const MODELS = {
10401
10307
  cacheRead: 0,
10402
10308
  cacheWrite: 0,
10403
10309
  },
10404
- contextWindow: 65536,
10310
+ contextWindow: 131072,
10405
10311
  maxTokens: 4096,
10406
10312
  },
10407
10313
  "meta-llama/llama-4-scout": {
@@ -10418,7 +10324,7 @@ export const MODELS = {
10418
10324
  cacheRead: 0,
10419
10325
  cacheWrite: 0,
10420
10326
  },
10421
- contextWindow: 327680,
10327
+ contextWindow: 10000000,
10422
10328
  maxTokens: 16384,
10423
10329
  },
10424
10330
  "minimax/minimax-m1": {
@@ -10452,7 +10358,7 @@ export const MODELS = {
10452
10358
  cacheRead: 0.03,
10453
10359
  cacheWrite: 0,
10454
10360
  },
10455
- contextWindow: 196608,
10361
+ contextWindow: 204800,
10456
10362
  maxTokens: 196608,
10457
10363
  },
10458
10364
  "minimax/minimax-m2.1": {
@@ -10469,7 +10375,7 @@ export const MODELS = {
10469
10375
  cacheRead: 0.03,
10470
10376
  cacheWrite: 0,
10471
10377
  },
10472
- contextWindow: 196608,
10378
+ contextWindow: 204800,
10473
10379
  maxTokens: 196608,
10474
10380
  },
10475
10381
  "minimax/minimax-m2.5": {
@@ -10486,7 +10392,7 @@ export const MODELS = {
10486
10392
  cacheRead: 0,
10487
10393
  cacheWrite: 0,
10488
10394
  },
10489
- contextWindow: 196608,
10395
+ contextWindow: 204800,
10490
10396
  maxTokens: 196608,
10491
10397
  },
10492
10398
  "minimax/minimax-m2.5:free": {
@@ -10503,7 +10409,7 @@ export const MODELS = {
10503
10409
  cacheRead: 0,
10504
10410
  cacheWrite: 0,
10505
10411
  },
10506
- contextWindow: 196608,
10412
+ contextWindow: 204800,
10507
10413
  maxTokens: 8192,
10508
10414
  },
10509
10415
  "minimax/minimax-m2.7": {
@@ -10520,7 +10426,7 @@ export const MODELS = {
10520
10426
  cacheRead: 0,
10521
10427
  cacheWrite: 0,
10522
10428
  },
10523
- contextWindow: 196608,
10429
+ contextWindow: 204800,
10524
10430
  maxTokens: 131072,
10525
10431
  },
10526
10432
  "mistralai/codestral-2508": {
@@ -10925,7 +10831,7 @@ export const MODELS = {
10925
10831
  cost: {
10926
10832
  input: 0.6,
10927
10833
  output: 2.5,
10928
- cacheRead: 0.15,
10834
+ cacheRead: 0,
10929
10835
  cacheWrite: 0,
10930
10836
  },
10931
10837
  contextWindow: 262144,
@@ -10962,9 +10868,26 @@ export const MODELS = {
10962
10868
  cacheRead: 0.25,
10963
10869
  cacheWrite: 0,
10964
10870
  },
10965
- contextWindow: 262142,
10871
+ contextWindow: 262144,
10966
10872
  maxTokens: 262142,
10967
10873
  },
10874
+ "moonshotai/kimi-k2.6:free": {
10875
+ id: "moonshotai/kimi-k2.6:free",
10876
+ name: "MoonshotAI: Kimi K2.6 (free)",
10877
+ api: "openai-completions",
10878
+ provider: "openrouter",
10879
+ baseUrl: "https://openrouter.ai/api/v1",
10880
+ reasoning: true,
10881
+ input: ["text", "image"],
10882
+ cost: {
10883
+ input: 0,
10884
+ output: 0,
10885
+ cacheRead: 0,
10886
+ cacheWrite: 0,
10887
+ },
10888
+ contextWindow: 262144,
10889
+ maxTokens: 4096,
10890
+ },
10968
10891
  "nex-agi/deepseek-v3.1-nex-n1": {
10969
10892
  id: "nex-agi/deepseek-v3.1-nex-n1",
10970
10893
  name: "Nex AGI: DeepSeek V3.1 Nex N1",
@@ -11064,7 +10987,7 @@ export const MODELS = {
11064
10987
  cacheRead: 0,
11065
10988
  cacheWrite: 0,
11066
10989
  },
11067
- contextWindow: 262144,
10990
+ contextWindow: 1000000,
11068
10991
  maxTokens: 4096,
11069
10992
  },
11070
10993
  "nvidia/nemotron-3-super-120b-a12b:free": {
@@ -11081,7 +11004,7 @@ export const MODELS = {
11081
11004
  cacheRead: 0,
11082
11005
  cacheWrite: 0,
11083
11006
  },
11084
- contextWindow: 262144,
11007
+ contextWindow: 1000000,
11085
11008
  maxTokens: 262144,
11086
11009
  },
11087
11010
  "nvidia/nemotron-nano-12b-v2-vl:free": {
@@ -11554,11 +11477,11 @@ export const MODELS = {
11554
11477
  cost: {
11555
11478
  input: 1.25,
11556
11479
  output: 10,
11557
- cacheRead: 0.125,
11480
+ cacheRead: 0.13,
11558
11481
  cacheWrite: 0,
11559
11482
  },
11560
11483
  contextWindow: 128000,
11561
- maxTokens: 16384,
11484
+ maxTokens: 32000,
11562
11485
  },
11563
11486
  "openai/gpt-5.1-codex": {
11564
11487
  id: "openai/gpt-5.1-codex",
@@ -11571,7 +11494,7 @@ export const MODELS = {
11571
11494
  cost: {
11572
11495
  input: 1.25,
11573
11496
  output: 10,
11574
- cacheRead: 0.125,
11497
+ cacheRead: 0.13,
11575
11498
  cacheWrite: 0,
11576
11499
  },
11577
11500
  contextWindow: 400000,
@@ -11605,11 +11528,11 @@ export const MODELS = {
11605
11528
  cost: {
11606
11529
  input: 0.25,
11607
11530
  output: 2,
11608
- cacheRead: 0.03,
11531
+ cacheRead: 0.024999999999999998,
11609
11532
  cacheWrite: 0,
11610
11533
  },
11611
11534
  contextWindow: 400000,
11612
- maxTokens: 128000,
11535
+ maxTokens: 100000,
11613
11536
  },
11614
11537
  "openai/gpt-5.2": {
11615
11538
  id: "openai/gpt-5.2",
@@ -11645,7 +11568,7 @@ export const MODELS = {
11645
11568
  cacheWrite: 0,
11646
11569
  },
11647
11570
  contextWindow: 128000,
11648
- maxTokens: 32000,
11571
+ maxTokens: 16384,
11649
11572
  },
11650
11573
  "openai/gpt-5.2-codex": {
11651
11574
  id: "openai/gpt-5.2-codex",
@@ -12181,8 +12104,8 @@ export const MODELS = {
12181
12104
  cacheRead: 0,
12182
12105
  cacheWrite: 0,
12183
12106
  },
12184
- contextWindow: 131072,
12185
- maxTokens: 8192,
12107
+ contextWindow: 262144,
12108
+ maxTokens: 32768,
12186
12109
  },
12187
12110
  "poolside/laguna-xs.2:free": {
12188
12111
  id: "poolside/laguna-xs.2:free",
@@ -12198,8 +12121,8 @@ export const MODELS = {
12198
12121
  cacheRead: 0,
12199
12122
  cacheWrite: 0,
12200
12123
  },
12201
- contextWindow: 131072,
12202
- maxTokens: 8192,
12124
+ contextWindow: 262144,
12125
+ maxTokens: 32768,
12203
12126
  },
12204
12127
  "prime-intellect/intellect-3": {
12205
12128
  id: "prime-intellect/intellect-3",
@@ -12232,7 +12155,7 @@ export const MODELS = {
12232
12155
  cacheRead: 0,
12233
12156
  cacheWrite: 0,
12234
12157
  },
12235
- contextWindow: 32768,
12158
+ contextWindow: 131072,
12236
12159
  maxTokens: 16384,
12237
12160
  },
12238
12161
  "qwen/qwen-2.5-7b-instruct": {
@@ -12249,7 +12172,7 @@ export const MODELS = {
12249
12172
  cacheRead: 0,
12250
12173
  cacheWrite: 0,
12251
12174
  },
12252
- contextWindow: 32768,
12175
+ contextWindow: 131072,
12253
12176
  maxTokens: 32768,
12254
12177
  },
12255
12178
  "qwen/qwen-plus": {
@@ -12281,7 +12204,7 @@ export const MODELS = {
12281
12204
  input: 0.26,
12282
12205
  output: 0.78,
12283
12206
  cacheRead: 0,
12284
- cacheWrite: 0.325,
12207
+ cacheWrite: 0,
12285
12208
  },
12286
12209
  contextWindow: 1000000,
12287
12210
  maxTokens: 32768,
@@ -12317,7 +12240,7 @@ export const MODELS = {
12317
12240
  cacheRead: 0,
12318
12241
  cacheWrite: 0,
12319
12242
  },
12320
- contextWindow: 40960,
12243
+ contextWindow: 131702,
12321
12244
  maxTokens: 40960,
12322
12245
  },
12323
12246
  "qwen/qwen3-235b-a22b": {
@@ -12368,7 +12291,7 @@ export const MODELS = {
12368
12291
  cacheRead: 0,
12369
12292
  cacheWrite: 0,
12370
12293
  },
12371
- contextWindow: 131072,
12294
+ contextWindow: 262144,
12372
12295
  maxTokens: 4096,
12373
12296
  },
12374
12297
  "qwen/qwen3-30b-a3b": {
@@ -12385,7 +12308,7 @@ export const MODELS = {
12385
12308
  cacheRead: 0,
12386
12309
  cacheWrite: 0,
12387
12310
  },
12388
- contextWindow: 40960,
12311
+ contextWindow: 131072,
12389
12312
  maxTokens: 20000,
12390
12313
  },
12391
12314
  "qwen/qwen3-30b-a3b-instruct-2507": {
@@ -12436,7 +12359,7 @@ export const MODELS = {
12436
12359
  cacheRead: 0,
12437
12360
  cacheWrite: 0,
12438
12361
  },
12439
- contextWindow: 40960,
12362
+ contextWindow: 131072,
12440
12363
  maxTokens: 16384,
12441
12364
  },
12442
12365
  "qwen/qwen3-8b": {
@@ -12453,7 +12376,7 @@ export const MODELS = {
12453
12376
  cacheRead: 0.049999999999999996,
12454
12377
  cacheWrite: 0,
12455
12378
  },
12456
- contextWindow: 40960,
12379
+ contextWindow: 131072,
12457
12380
  maxTokens: 8192,
12458
12381
  },
12459
12382
  "qwen/qwen3-coder": {
@@ -12470,7 +12393,7 @@ export const MODELS = {
12470
12393
  cacheRead: 0,
12471
12394
  cacheWrite: 0,
12472
12395
  },
12473
- contextWindow: 262144,
12396
+ contextWindow: 1048576,
12474
12397
  maxTokens: 65536,
12475
12398
  },
12476
12399
  "qwen/qwen3-coder-30b-a3b-instruct": {
@@ -12555,7 +12478,7 @@ export const MODELS = {
12555
12478
  cacheRead: 0,
12556
12479
  cacheWrite: 0,
12557
12480
  },
12558
- contextWindow: 262000,
12481
+ contextWindow: 1048576,
12559
12482
  maxTokens: 262000,
12560
12483
  },
12561
12484
  "qwen/qwen3-max": {
@@ -12640,7 +12563,7 @@ export const MODELS = {
12640
12563
  cacheRead: 0,
12641
12564
  cacheWrite: 0,
12642
12565
  },
12643
- contextWindow: 131072,
12566
+ contextWindow: 262144,
12644
12567
  maxTokens: 32768,
12645
12568
  },
12646
12569
  "qwen/qwen3-vl-235b-a22b-instruct": {
@@ -12691,7 +12614,7 @@ export const MODELS = {
12691
12614
  cacheRead: 0,
12692
12615
  cacheWrite: 0,
12693
12616
  },
12694
- contextWindow: 131072,
12617
+ contextWindow: 262144,
12695
12618
  maxTokens: 32768,
12696
12619
  },
12697
12620
  "qwen/qwen3-vl-30b-a3b-thinking": {
@@ -12725,7 +12648,7 @@ export const MODELS = {
12725
12648
  cacheRead: 0,
12726
12649
  cacheWrite: 0,
12727
12650
  },
12728
- contextWindow: 131072,
12651
+ contextWindow: 262144,
12729
12652
  maxTokens: 32768,
12730
12653
  },
12731
12654
  "qwen/qwen3-vl-8b-instruct": {
@@ -12742,7 +12665,7 @@ export const MODELS = {
12742
12665
  cacheRead: 0,
12743
12666
  cacheWrite: 0,
12744
12667
  },
12745
- contextWindow: 131072,
12668
+ contextWindow: 256000,
12746
12669
  maxTokens: 32768,
12747
12670
  },
12748
12671
  "qwen/qwen3-vl-8b-thinking": {
@@ -12759,7 +12682,7 @@ export const MODELS = {
12759
12682
  cacheRead: 0,
12760
12683
  cacheWrite: 0,
12761
12684
  },
12762
- contextWindow: 131072,
12685
+ contextWindow: 256000,
12763
12686
  maxTokens: 32768,
12764
12687
  },
12765
12688
  "qwen/qwen3.5-122b-a10b": {
@@ -12777,7 +12700,7 @@ export const MODELS = {
12777
12700
  cacheWrite: 0,
12778
12701
  },
12779
12702
  contextWindow: 262144,
12780
- maxTokens: 65536,
12703
+ maxTokens: 262144,
12781
12704
  },
12782
12705
  "qwen/qwen3.5-27b": {
12783
12706
  id: "qwen/qwen3.5-27b",
@@ -12805,13 +12728,13 @@ export const MODELS = {
12805
12728
  reasoning: true,
12806
12729
  input: ["text", "image"],
12807
12730
  cost: {
12808
- input: 0.14,
12731
+ input: 0.13899999999999998,
12809
12732
  output: 1,
12810
- cacheRead: 0.049999999999999996,
12733
+ cacheRead: 0,
12811
12734
  cacheWrite: 0,
12812
12735
  },
12813
12736
  contextWindow: 262144,
12814
- maxTokens: 81920,
12737
+ maxTokens: 4096,
12815
12738
  },
12816
12739
  "qwen/qwen3.5-397b-a17b": {
12817
12740
  id: "qwen/qwen3.5-397b-a17b",
@@ -12824,7 +12747,7 @@ export const MODELS = {
12824
12747
  cost: {
12825
12748
  input: 0.39,
12826
12749
  output: 2.34,
12827
- cacheRead: 0.195,
12750
+ cacheRead: 0,
12828
12751
  cacheWrite: 0,
12829
12752
  },
12830
12753
  contextWindow: 262144,
@@ -12859,7 +12782,7 @@ export const MODELS = {
12859
12782
  input: 0.065,
12860
12783
  output: 0.26,
12861
12784
  cacheRead: 0,
12862
- cacheWrite: 0.08125,
12785
+ cacheWrite: 0,
12863
12786
  },
12864
12787
  contextWindow: 1000000,
12865
12788
  maxTokens: 65536,
@@ -12876,7 +12799,7 @@ export const MODELS = {
12876
12799
  input: 0.26,
12877
12800
  output: 1.56,
12878
12801
  cacheRead: 0,
12879
- cacheWrite: 0.325,
12802
+ cacheWrite: 0,
12880
12803
  },
12881
12804
  contextWindow: 1000000,
12882
12805
  maxTokens: 65536,
@@ -12893,7 +12816,7 @@ export const MODELS = {
12893
12816
  input: 0.3,
12894
12817
  output: 1.7999999999999998,
12895
12818
  cacheRead: 0,
12896
- cacheWrite: 0,
12819
+ cacheWrite: 0.375,
12897
12820
  },
12898
12821
  contextWindow: 1000000,
12899
12822
  maxTokens: 65536,
@@ -12907,13 +12830,13 @@ export const MODELS = {
12907
12830
  reasoning: true,
12908
12831
  input: ["text", "image"],
12909
12832
  cost: {
12910
- input: 0.32,
12833
+ input: 0.29,
12911
12834
  output: 3.1999999999999997,
12912
12835
  cacheRead: 0,
12913
12836
  cacheWrite: 0,
12914
12837
  },
12915
12838
  contextWindow: 262144,
12916
- maxTokens: 81920,
12839
+ maxTokens: 262140,
12917
12840
  },
12918
12841
  "qwen/qwen3.6-35b-a3b": {
12919
12842
  id: "qwen/qwen3.6-35b-a3b",
@@ -12924,13 +12847,13 @@ export const MODELS = {
12924
12847
  reasoning: true,
12925
12848
  input: ["text", "image"],
12926
12849
  cost: {
12927
- input: 0.15,
12850
+ input: 0.14,
12928
12851
  output: 1,
12929
- cacheRead: 0.049999999999999996,
12852
+ cacheRead: 0,
12930
12853
  cacheWrite: 0,
12931
12854
  },
12932
12855
  contextWindow: 262144,
12933
- maxTokens: 262144,
12856
+ maxTokens: 262140,
12934
12857
  },
12935
12858
  "qwen/qwen3.6-flash": {
12936
12859
  id: "qwen/qwen3.6-flash",
@@ -12983,6 +12906,23 @@ export const MODELS = {
12983
12906
  contextWindow: 1000000,
12984
12907
  maxTokens: 65536,
12985
12908
  },
12909
+ "qwen/qwen3.7-max": {
12910
+ id: "qwen/qwen3.7-max",
12911
+ name: "Qwen: Qwen3.7 Max",
12912
+ api: "openai-completions",
12913
+ provider: "openrouter",
12914
+ baseUrl: "https://openrouter.ai/api/v1",
12915
+ reasoning: true,
12916
+ input: ["text"],
12917
+ cost: {
12918
+ input: 1.25,
12919
+ output: 3.75,
12920
+ cacheRead: 0.25,
12921
+ cacheWrite: 1.5625,
12922
+ },
12923
+ contextWindow: 1000000,
12924
+ maxTokens: 65536,
12925
+ },
12986
12926
  "rekaai/reka-edge": {
12987
12927
  id: "rekaai/reka-edge",
12988
12928
  name: "Reka Edge",
@@ -13060,13 +13000,30 @@ export const MODELS = {
13060
13000
  reasoning: true,
13061
13001
  input: ["text"],
13062
13002
  cost: {
13063
- input: 0.09999999999999999,
13003
+ input: 0.09,
13064
13004
  output: 0.3,
13065
- cacheRead: 0,
13005
+ cacheRead: 0.02,
13066
13006
  cacheWrite: 0,
13067
13007
  },
13068
13008
  contextWindow: 262144,
13069
- maxTokens: 65536,
13009
+ maxTokens: 16384,
13010
+ },
13011
+ "stepfun/step-3.7-flash": {
13012
+ id: "stepfun/step-3.7-flash",
13013
+ name: "StepFun: Step 3.7 Flash",
13014
+ api: "openai-completions",
13015
+ provider: "openrouter",
13016
+ baseUrl: "https://openrouter.ai/api/v1",
13017
+ reasoning: true,
13018
+ input: ["text", "image"],
13019
+ cost: {
13020
+ input: 0.19999999999999998,
13021
+ output: 1.15,
13022
+ cacheRead: 0.04,
13023
+ cacheWrite: 0,
13024
+ },
13025
+ contextWindow: 256000,
13026
+ maxTokens: 256000,
13070
13027
  },
13071
13028
  "tencent/hy3-preview": {
13072
13029
  id: "tencent/hy3-preview",
@@ -13077,13 +13034,13 @@ export const MODELS = {
13077
13034
  reasoning: true,
13078
13035
  input: ["text"],
13079
13036
  cost: {
13080
- input: 0.06599999999999999,
13081
- output: 0.26,
13082
- cacheRead: 0.029,
13037
+ input: 0.063,
13038
+ output: 0.21,
13039
+ cacheRead: 0.020999999999999998,
13083
13040
  cacheWrite: 0,
13084
13041
  },
13085
13042
  contextWindow: 262144,
13086
- maxTokens: 262144,
13043
+ maxTokens: 4096,
13087
13044
  },
13088
13045
  "thedrummer/rocinante-12b": {
13089
13046
  id: "thedrummer/rocinante-12b",
@@ -13136,125 +13093,6 @@ export const MODELS = {
13136
13093
  contextWindow: 128000,
13137
13094
  maxTokens: 4096,
13138
13095
  },
13139
- "x-ai/grok-3": {
13140
- id: "x-ai/grok-3",
13141
- name: "xAI: Grok 3",
13142
- api: "openai-completions",
13143
- provider: "openrouter",
13144
- baseUrl: "https://openrouter.ai/api/v1",
13145
- reasoning: false,
13146
- input: ["text"],
13147
- cost: {
13148
- input: 3,
13149
- output: 15,
13150
- cacheRead: 0.75,
13151
- cacheWrite: 0,
13152
- },
13153
- contextWindow: 131072,
13154
- maxTokens: 4096,
13155
- },
13156
- "x-ai/grok-3-beta": {
13157
- id: "x-ai/grok-3-beta",
13158
- name: "xAI: Grok 3 Beta",
13159
- api: "openai-completions",
13160
- provider: "openrouter",
13161
- baseUrl: "https://openrouter.ai/api/v1",
13162
- reasoning: false,
13163
- input: ["text"],
13164
- cost: {
13165
- input: 3,
13166
- output: 15,
13167
- cacheRead: 0.75,
13168
- cacheWrite: 0,
13169
- },
13170
- contextWindow: 131072,
13171
- maxTokens: 4096,
13172
- },
13173
- "x-ai/grok-3-mini": {
13174
- id: "x-ai/grok-3-mini",
13175
- name: "xAI: Grok 3 Mini",
13176
- api: "openai-completions",
13177
- provider: "openrouter",
13178
- baseUrl: "https://openrouter.ai/api/v1",
13179
- reasoning: true,
13180
- input: ["text"],
13181
- cost: {
13182
- input: 0.3,
13183
- output: 0.5,
13184
- cacheRead: 0.075,
13185
- cacheWrite: 0,
13186
- },
13187
- contextWindow: 131072,
13188
- maxTokens: 4096,
13189
- },
13190
- "x-ai/grok-3-mini-beta": {
13191
- id: "x-ai/grok-3-mini-beta",
13192
- name: "xAI: Grok 3 Mini Beta",
13193
- api: "openai-completions",
13194
- provider: "openrouter",
13195
- baseUrl: "https://openrouter.ai/api/v1",
13196
- reasoning: true,
13197
- input: ["text"],
13198
- cost: {
13199
- input: 0.3,
13200
- output: 0.5,
13201
- cacheRead: 0.075,
13202
- cacheWrite: 0,
13203
- },
13204
- contextWindow: 131072,
13205
- maxTokens: 4096,
13206
- },
13207
- "x-ai/grok-4": {
13208
- id: "x-ai/grok-4",
13209
- name: "xAI: Grok 4",
13210
- api: "openai-completions",
13211
- provider: "openrouter",
13212
- baseUrl: "https://openrouter.ai/api/v1",
13213
- reasoning: true,
13214
- input: ["text", "image"],
13215
- cost: {
13216
- input: 3,
13217
- output: 15,
13218
- cacheRead: 0.75,
13219
- cacheWrite: 0,
13220
- },
13221
- contextWindow: 256000,
13222
- maxTokens: 4096,
13223
- },
13224
- "x-ai/grok-4-fast": {
13225
- id: "x-ai/grok-4-fast",
13226
- name: "xAI: Grok 4 Fast",
13227
- api: "openai-completions",
13228
- provider: "openrouter",
13229
- baseUrl: "https://openrouter.ai/api/v1",
13230
- reasoning: true,
13231
- input: ["text", "image"],
13232
- cost: {
13233
- input: 0.19999999999999998,
13234
- output: 0.5,
13235
- cacheRead: 0.049999999999999996,
13236
- cacheWrite: 0,
13237
- },
13238
- contextWindow: 2000000,
13239
- maxTokens: 30000,
13240
- },
13241
- "x-ai/grok-4.1-fast": {
13242
- id: "x-ai/grok-4.1-fast",
13243
- name: "xAI: Grok 4.1 Fast",
13244
- api: "openai-completions",
13245
- provider: "openrouter",
13246
- baseUrl: "https://openrouter.ai/api/v1",
13247
- reasoning: true,
13248
- input: ["text", "image"],
13249
- cost: {
13250
- input: 0.19999999999999998,
13251
- output: 0.5,
13252
- cacheRead: 0.049999999999999996,
13253
- cacheWrite: 0,
13254
- },
13255
- contextWindow: 2000000,
13256
- maxTokens: 30000,
13257
- },
13258
13096
  "x-ai/grok-4.20": {
13259
13097
  id: "x-ai/grok-4.20",
13260
13098
  name: "xAI: Grok 4.20",
@@ -13289,22 +13127,22 @@ export const MODELS = {
13289
13127
  contextWindow: 1000000,
13290
13128
  maxTokens: 4096,
13291
13129
  },
13292
- "x-ai/grok-code-fast-1": {
13293
- id: "x-ai/grok-code-fast-1",
13294
- name: "xAI: Grok Code Fast 1",
13130
+ "x-ai/grok-build-0.1": {
13131
+ id: "x-ai/grok-build-0.1",
13132
+ name: "xAI: Grok Build 0.1",
13295
13133
  api: "openai-completions",
13296
13134
  provider: "openrouter",
13297
13135
  baseUrl: "https://openrouter.ai/api/v1",
13298
13136
  reasoning: true,
13299
- input: ["text"],
13137
+ input: ["text", "image"],
13300
13138
  cost: {
13301
- input: 0.19999999999999998,
13302
- output: 1.5,
13303
- cacheRead: 0.02,
13139
+ input: 1,
13140
+ output: 2,
13141
+ cacheRead: 0.19999999999999998,
13304
13142
  cacheWrite: 0,
13305
13143
  },
13306
13144
  contextWindow: 256000,
13307
- maxTokens: 10000,
13145
+ maxTokens: 4096,
13308
13146
  },
13309
13147
  "xiaomi/mimo-v2-flash": {
13310
13148
  id: "xiaomi/mimo-v2-flash",
@@ -13366,9 +13204,9 @@ export const MODELS = {
13366
13204
  reasoning: true,
13367
13205
  input: ["text", "image"],
13368
13206
  cost: {
13369
- input: 0.39999999999999997,
13370
- output: 2,
13371
- cacheRead: 0.08,
13207
+ input: 0.14,
13208
+ output: 0.28,
13209
+ cacheRead: 0.0028,
13372
13210
  cacheWrite: 0,
13373
13211
  },
13374
13212
  contextWindow: 1048576,
@@ -13383,13 +13221,13 @@ export const MODELS = {
13383
13221
  reasoning: true,
13384
13222
  input: ["text"],
13385
13223
  cost: {
13386
- input: 1,
13387
- output: 3,
13388
- cacheRead: 0.19999999999999998,
13224
+ input: 0.435,
13225
+ output: 0.87,
13226
+ cacheRead: 0.0036,
13389
13227
  cacheWrite: 0,
13390
13228
  },
13391
13229
  contextWindow: 1048576,
13392
- maxTokens: 16384,
13230
+ maxTokens: 131072,
13393
13231
  },
13394
13232
  "z-ai/glm-4-32b": {
13395
13233
  id: "z-ai/glm-4-32b",
@@ -13434,13 +13272,13 @@ export const MODELS = {
13434
13272
  reasoning: true,
13435
13273
  input: ["text"],
13436
13274
  cost: {
13437
- input: 0.13,
13275
+ input: 0.125,
13438
13276
  output: 0.85,
13439
- cacheRead: 0.024999999999999998,
13277
+ cacheRead: 0.06,
13440
13278
  cacheWrite: 0,
13441
13279
  },
13442
13280
  contextWindow: 131072,
13443
- maxTokens: 98304,
13281
+ maxTokens: 131070,
13444
13282
  },
13445
13283
  "z-ai/glm-4.5-air:free": {
13446
13284
  id: "z-ai/glm-4.5-air:free",
@@ -13672,9 +13510,9 @@ export const MODELS = {
13672
13510
  reasoning: true,
13673
13511
  input: ["text", "image"],
13674
13512
  cost: {
13675
- input: 0.5,
13676
- output: 3,
13677
- cacheRead: 0.049999999999999996,
13513
+ input: 1.5,
13514
+ output: 9,
13515
+ cacheRead: 0.15,
13678
13516
  cacheWrite: 0.08333333333333334,
13679
13517
  },
13680
13518
  contextWindow: 1048576,
@@ -13711,7 +13549,7 @@ export const MODELS = {
13711
13549
  cacheRead: 0.25,
13712
13550
  cacheWrite: 0,
13713
13551
  },
13714
- contextWindow: 262142,
13552
+ contextWindow: 262144,
13715
13553
  maxTokens: 262142,
13716
13554
  },
13717
13555
  "~openai/gpt-latest": {
@@ -13882,6 +13720,25 @@ export const MODELS = {
13882
13720
  contextWindow: 1000000,
13883
13721
  maxTokens: 500000,
13884
13722
  },
13723
+ "Qwen/Qwen3.7-Max": {
13724
+ id: "Qwen/Qwen3.7-Max",
13725
+ name: "Qwen3.7 Max",
13726
+ api: "openai-completions",
13727
+ provider: "together",
13728
+ baseUrl: "https://api.together.ai/v1",
13729
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13730
+ reasoning: true,
13731
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13732
+ input: ["text"],
13733
+ cost: {
13734
+ input: 2.5,
13735
+ output: 7.5,
13736
+ cacheRead: 0,
13737
+ cacheWrite: 0,
13738
+ },
13739
+ contextWindow: 1000000,
13740
+ maxTokens: 500000,
13741
+ },
13885
13742
  "deepseek-ai/DeepSeek-V3": {
13886
13743
  id: "deepseek-ai/DeepSeek-V3",
13887
13744
  name: "DeepSeek V3",
@@ -14378,6 +14235,23 @@ export const MODELS = {
14378
14235
  contextWindow: 1000000,
14379
14236
  maxTokens: 64000,
14380
14237
  },
14238
+ "alibaba/qwen3.7-max": {
14239
+ id: "alibaba/qwen3.7-max",
14240
+ name: "Qwen 3.7 Max",
14241
+ api: "anthropic-messages",
14242
+ provider: "vercel-ai-gateway",
14243
+ baseUrl: "https://ai-gateway.vercel.sh",
14244
+ reasoning: true,
14245
+ input: ["text", "image"],
14246
+ cost: {
14247
+ input: 1.25,
14248
+ output: 3.75,
14249
+ cacheRead: 0.25,
14250
+ cacheWrite: 1.5625,
14251
+ },
14252
+ contextWindow: 991000,
14253
+ maxTokens: 64000,
14254
+ },
14381
14255
  "anthropic/claude-3-haiku": {
14382
14256
  id: "anthropic/claude-3-haiku",
14383
14257
  name: "Claude 3 Haiku",
@@ -14516,6 +14390,23 @@ export const MODELS = {
14516
14390
  contextWindow: 1000000,
14517
14391
  maxTokens: 128000,
14518
14392
  },
14393
+ "anthropic/claude-opus-4.8": {
14394
+ id: "anthropic/claude-opus-4.8",
14395
+ name: "Claude Opus 4.8",
14396
+ api: "anthropic-messages",
14397
+ provider: "vercel-ai-gateway",
14398
+ baseUrl: "https://ai-gateway.vercel.sh",
14399
+ reasoning: true,
14400
+ input: ["text", "image"],
14401
+ cost: {
14402
+ input: 5,
14403
+ output: 25,
14404
+ cacheRead: 0.5,
14405
+ cacheWrite: 6.25,
14406
+ },
14407
+ contextWindow: 1000000,
14408
+ maxTokens: 128000,
14409
+ },
14519
14410
  "anthropic/claude-sonnet-4": {
14520
14411
  id: "anthropic/claude-sonnet-4",
14521
14412
  name: "Claude Sonnet 4",
@@ -14941,13 +14832,30 @@ export const MODELS = {
14941
14832
  contextWindow: 1000000,
14942
14833
  maxTokens: 64000,
14943
14834
  },
14944
- "google/gemma-4-26b-a4b-it": {
14945
- id: "google/gemma-4-26b-a4b-it",
14946
- name: "Gemma 4 26B A4B IT",
14835
+ "google/gemini-3.5-flash": {
14836
+ id: "google/gemini-3.5-flash",
14837
+ name: "Gemini 3.5 Flash",
14947
14838
  api: "anthropic-messages",
14948
14839
  provider: "vercel-ai-gateway",
14949
14840
  baseUrl: "https://ai-gateway.vercel.sh",
14950
- reasoning: false,
14841
+ reasoning: true,
14842
+ input: ["text", "image"],
14843
+ cost: {
14844
+ input: 1.5,
14845
+ output: 9,
14846
+ cacheRead: 0.15,
14847
+ cacheWrite: 0,
14848
+ },
14849
+ contextWindow: 1000000,
14850
+ maxTokens: 64000,
14851
+ },
14852
+ "google/gemma-4-26b-a4b-it": {
14853
+ id: "google/gemma-4-26b-a4b-it",
14854
+ name: "Gemma 4 26B A4B IT",
14855
+ api: "anthropic-messages",
14856
+ provider: "vercel-ai-gateway",
14857
+ baseUrl: "https://ai-gateway.vercel.sh",
14858
+ reasoning: false,
14951
14859
  input: ["text", "image"],
14952
14860
  cost: {
14953
14861
  input: 0.13,
@@ -15249,7 +15157,7 @@ export const MODELS = {
15249
15157
  },
15250
15158
  "minimax/minimax-m2.7": {
15251
15159
  id: "minimax/minimax-m2.7",
15252
- name: "Minimax M2.7",
15160
+ name: "MiniMax M2.7",
15253
15161
  api: "anthropic-messages",
15254
15162
  provider: "vercel-ai-gateway",
15255
15163
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -15400,6 +15308,23 @@ export const MODELS = {
15400
15308
  contextWindow: 128000,
15401
15309
  maxTokens: 64000,
15402
15310
  },
15311
+ "mistral/mistral-medium-3.5": {
15312
+ id: "mistral/mistral-medium-3.5",
15313
+ name: "Mistral Medium Latest",
15314
+ api: "anthropic-messages",
15315
+ provider: "vercel-ai-gateway",
15316
+ baseUrl: "https://ai-gateway.vercel.sh",
15317
+ reasoning: true,
15318
+ input: ["text"],
15319
+ cost: {
15320
+ input: 1.5,
15321
+ output: 7.5,
15322
+ cacheRead: 0,
15323
+ cacheWrite: 0,
15324
+ },
15325
+ contextWindow: 256000,
15326
+ maxTokens: 256000,
15327
+ },
15403
15328
  "mistral/mistral-small": {
15404
15329
  id: "mistral/mistral-small",
15405
15330
  name: "Mistral Small",
@@ -16262,125 +16187,6 @@ export const MODELS = {
16262
16187
  contextWindow: 200000,
16263
16188
  maxTokens: 8000,
16264
16189
  },
16265
- "xai/grok-3": {
16266
- id: "xai/grok-3",
16267
- name: "Grok 3 Beta",
16268
- api: "anthropic-messages",
16269
- provider: "vercel-ai-gateway",
16270
- baseUrl: "https://ai-gateway.vercel.sh",
16271
- reasoning: false,
16272
- input: ["text"],
16273
- cost: {
16274
- input: 3,
16275
- output: 15,
16276
- cacheRead: 0.75,
16277
- cacheWrite: 0,
16278
- },
16279
- contextWindow: 131072,
16280
- maxTokens: 131072,
16281
- },
16282
- "xai/grok-3-fast": {
16283
- id: "xai/grok-3-fast",
16284
- name: "Grok 3 Fast Beta",
16285
- api: "anthropic-messages",
16286
- provider: "vercel-ai-gateway",
16287
- baseUrl: "https://ai-gateway.vercel.sh",
16288
- reasoning: false,
16289
- input: ["text"],
16290
- cost: {
16291
- input: 5,
16292
- output: 25,
16293
- cacheRead: 1.25,
16294
- cacheWrite: 0,
16295
- },
16296
- contextWindow: 131072,
16297
- maxTokens: 131072,
16298
- },
16299
- "xai/grok-3-mini": {
16300
- id: "xai/grok-3-mini",
16301
- name: "Grok 3 Mini Beta",
16302
- api: "anthropic-messages",
16303
- provider: "vercel-ai-gateway",
16304
- baseUrl: "https://ai-gateway.vercel.sh",
16305
- reasoning: false,
16306
- input: ["text"],
16307
- cost: {
16308
- input: 0.3,
16309
- output: 0.5,
16310
- cacheRead: 0.075,
16311
- cacheWrite: 0,
16312
- },
16313
- contextWindow: 131072,
16314
- maxTokens: 131072,
16315
- },
16316
- "xai/grok-3-mini-fast": {
16317
- id: "xai/grok-3-mini-fast",
16318
- name: "Grok 3 Mini Fast Beta",
16319
- api: "anthropic-messages",
16320
- provider: "vercel-ai-gateway",
16321
- baseUrl: "https://ai-gateway.vercel.sh",
16322
- reasoning: false,
16323
- input: ["text"],
16324
- cost: {
16325
- input: 0.6,
16326
- output: 4,
16327
- cacheRead: 0,
16328
- cacheWrite: 0,
16329
- },
16330
- contextWindow: 131072,
16331
- maxTokens: 131072,
16332
- },
16333
- "xai/grok-4": {
16334
- id: "xai/grok-4",
16335
- name: "Grok 4",
16336
- api: "anthropic-messages",
16337
- provider: "vercel-ai-gateway",
16338
- baseUrl: "https://ai-gateway.vercel.sh",
16339
- reasoning: true,
16340
- input: ["text", "image"],
16341
- cost: {
16342
- input: 3,
16343
- output: 15,
16344
- cacheRead: 0.75,
16345
- cacheWrite: 0,
16346
- },
16347
- contextWindow: 256000,
16348
- maxTokens: 256000,
16349
- },
16350
- "xai/grok-4-fast-non-reasoning": {
16351
- id: "xai/grok-4-fast-non-reasoning",
16352
- name: "Grok 4 Fast Non-Reasoning",
16353
- api: "anthropic-messages",
16354
- provider: "vercel-ai-gateway",
16355
- baseUrl: "https://ai-gateway.vercel.sh",
16356
- reasoning: false,
16357
- input: ["text", "image"],
16358
- cost: {
16359
- input: 0.19999999999999998,
16360
- output: 0.5,
16361
- cacheRead: 0.049999999999999996,
16362
- cacheWrite: 0,
16363
- },
16364
- contextWindow: 2000000,
16365
- maxTokens: 256000,
16366
- },
16367
- "xai/grok-4-fast-reasoning": {
16368
- id: "xai/grok-4-fast-reasoning",
16369
- name: "Grok 4 Fast Reasoning",
16370
- api: "anthropic-messages",
16371
- provider: "vercel-ai-gateway",
16372
- baseUrl: "https://ai-gateway.vercel.sh",
16373
- reasoning: true,
16374
- input: ["text", "image"],
16375
- cost: {
16376
- input: 0.19999999999999998,
16377
- output: 0.5,
16378
- cacheRead: 0.049999999999999996,
16379
- cacheWrite: 0,
16380
- },
16381
- contextWindow: 2000000,
16382
- maxTokens: 256000,
16383
- },
16384
16190
  "xai/grok-4.1-fast-non-reasoning": {
16385
16191
  id: "xai/grok-4.1-fast-non-reasoning",
16386
16192
  name: "Grok 4.1 Fast Non-Reasoning",
@@ -16395,8 +16201,8 @@ export const MODELS = {
16395
16201
  cacheRead: 0.049999999999999996,
16396
16202
  cacheWrite: 0,
16397
16203
  },
16398
- contextWindow: 2000000,
16399
- maxTokens: 30000,
16204
+ contextWindow: 1000000,
16205
+ maxTokens: 1000000,
16400
16206
  },
16401
16207
  "xai/grok-4.1-fast-reasoning": {
16402
16208
  id: "xai/grok-4.1-fast-reasoning",
@@ -16412,8 +16218,8 @@ export const MODELS = {
16412
16218
  cacheRead: 0.049999999999999996,
16413
16219
  cacheWrite: 0,
16414
16220
  },
16415
- contextWindow: 2000000,
16416
- maxTokens: 30000,
16221
+ contextWindow: 1000000,
16222
+ maxTokens: 1000000,
16417
16223
  },
16418
16224
  "xai/grok-4.20-multi-agent": {
16419
16225
  id: "xai/grok-4.20-multi-agent",
@@ -16534,18 +16340,18 @@ export const MODELS = {
16534
16340
  contextWindow: 1000000,
16535
16341
  maxTokens: 1000000,
16536
16342
  },
16537
- "xai/grok-code-fast-1": {
16538
- id: "xai/grok-code-fast-1",
16539
- name: "Grok Code Fast 1",
16343
+ "xai/grok-build-0.1": {
16344
+ id: "xai/grok-build-0.1",
16345
+ name: "Grok Build 0.1",
16540
16346
  api: "anthropic-messages",
16541
16347
  provider: "vercel-ai-gateway",
16542
16348
  baseUrl: "https://ai-gateway.vercel.sh",
16543
16349
  reasoning: true,
16544
- input: ["text"],
16350
+ input: ["text", "image"],
16545
16351
  cost: {
16546
- input: 0.19999999999999998,
16547
- output: 1.5,
16548
- cacheRead: 0.02,
16352
+ input: 1,
16353
+ output: 2,
16354
+ cacheRead: 0.19999999999999998,
16549
16355
  cacheWrite: 0,
16550
16356
  },
16551
16357
  contextWindow: 256000,
@@ -16594,9 +16400,9 @@ export const MODELS = {
16594
16400
  reasoning: true,
16595
16401
  input: ["text", "image"],
16596
16402
  cost: {
16597
- input: 0.39999999999999997,
16598
- output: 2,
16599
- cacheRead: 0.08,
16403
+ input: 0.14,
16404
+ output: 0.28,
16405
+ cacheRead: 0.0028,
16600
16406
  cacheWrite: 0,
16601
16407
  },
16602
16408
  contextWindow: 1050000,
@@ -16611,9 +16417,9 @@ export const MODELS = {
16611
16417
  reasoning: true,
16612
16418
  input: ["text", "image"],
16613
16419
  cost: {
16614
- input: 1,
16615
- output: 3,
16616
- cacheRead: 0.19999999999999998,
16420
+ input: 0.435,
16421
+ output: 0.87,
16422
+ cacheRead: 0.0036,
16617
16423
  cacheWrite: 0,
16618
16424
  },
16619
16425
  contextWindow: 1050000,
@@ -16842,329 +16648,6 @@ export const MODELS = {
16842
16648
  },
16843
16649
  },
16844
16650
  "xai": {
16845
- "grok-2": {
16846
- id: "grok-2",
16847
- name: "Grok 2",
16848
- api: "openai-completions",
16849
- provider: "xai",
16850
- baseUrl: "https://api.x.ai/v1",
16851
- reasoning: false,
16852
- input: ["text"],
16853
- cost: {
16854
- input: 2,
16855
- output: 10,
16856
- cacheRead: 2,
16857
- cacheWrite: 0,
16858
- },
16859
- contextWindow: 131072,
16860
- maxTokens: 8192,
16861
- },
16862
- "grok-2-1212": {
16863
- id: "grok-2-1212",
16864
- name: "Grok 2 (1212)",
16865
- api: "openai-completions",
16866
- provider: "xai",
16867
- baseUrl: "https://api.x.ai/v1",
16868
- reasoning: false,
16869
- input: ["text"],
16870
- cost: {
16871
- input: 2,
16872
- output: 10,
16873
- cacheRead: 2,
16874
- cacheWrite: 0,
16875
- },
16876
- contextWindow: 131072,
16877
- maxTokens: 8192,
16878
- },
16879
- "grok-2-latest": {
16880
- id: "grok-2-latest",
16881
- name: "Grok 2 Latest",
16882
- api: "openai-completions",
16883
- provider: "xai",
16884
- baseUrl: "https://api.x.ai/v1",
16885
- reasoning: false,
16886
- input: ["text"],
16887
- cost: {
16888
- input: 2,
16889
- output: 10,
16890
- cacheRead: 2,
16891
- cacheWrite: 0,
16892
- },
16893
- contextWindow: 131072,
16894
- maxTokens: 8192,
16895
- },
16896
- "grok-2-vision": {
16897
- id: "grok-2-vision",
16898
- name: "Grok 2 Vision",
16899
- api: "openai-completions",
16900
- provider: "xai",
16901
- baseUrl: "https://api.x.ai/v1",
16902
- reasoning: false,
16903
- input: ["text", "image"],
16904
- cost: {
16905
- input: 2,
16906
- output: 10,
16907
- cacheRead: 2,
16908
- cacheWrite: 0,
16909
- },
16910
- contextWindow: 8192,
16911
- maxTokens: 4096,
16912
- },
16913
- "grok-2-vision-1212": {
16914
- id: "grok-2-vision-1212",
16915
- name: "Grok 2 Vision (1212)",
16916
- api: "openai-completions",
16917
- provider: "xai",
16918
- baseUrl: "https://api.x.ai/v1",
16919
- reasoning: false,
16920
- input: ["text", "image"],
16921
- cost: {
16922
- input: 2,
16923
- output: 10,
16924
- cacheRead: 2,
16925
- cacheWrite: 0,
16926
- },
16927
- contextWindow: 8192,
16928
- maxTokens: 4096,
16929
- },
16930
- "grok-2-vision-latest": {
16931
- id: "grok-2-vision-latest",
16932
- name: "Grok 2 Vision Latest",
16933
- api: "openai-completions",
16934
- provider: "xai",
16935
- baseUrl: "https://api.x.ai/v1",
16936
- reasoning: false,
16937
- input: ["text", "image"],
16938
- cost: {
16939
- input: 2,
16940
- output: 10,
16941
- cacheRead: 2,
16942
- cacheWrite: 0,
16943
- },
16944
- contextWindow: 8192,
16945
- maxTokens: 4096,
16946
- },
16947
- "grok-3": {
16948
- id: "grok-3",
16949
- name: "Grok 3",
16950
- api: "openai-completions",
16951
- provider: "xai",
16952
- baseUrl: "https://api.x.ai/v1",
16953
- reasoning: false,
16954
- input: ["text"],
16955
- cost: {
16956
- input: 3,
16957
- output: 15,
16958
- cacheRead: 0.75,
16959
- cacheWrite: 0,
16960
- },
16961
- contextWindow: 131072,
16962
- maxTokens: 8192,
16963
- },
16964
- "grok-3-fast": {
16965
- id: "grok-3-fast",
16966
- name: "Grok 3 Fast",
16967
- api: "openai-completions",
16968
- provider: "xai",
16969
- baseUrl: "https://api.x.ai/v1",
16970
- reasoning: false,
16971
- input: ["text"],
16972
- cost: {
16973
- input: 5,
16974
- output: 25,
16975
- cacheRead: 1.25,
16976
- cacheWrite: 0,
16977
- },
16978
- contextWindow: 131072,
16979
- maxTokens: 8192,
16980
- },
16981
- "grok-3-fast-latest": {
16982
- id: "grok-3-fast-latest",
16983
- name: "Grok 3 Fast Latest",
16984
- api: "openai-completions",
16985
- provider: "xai",
16986
- baseUrl: "https://api.x.ai/v1",
16987
- reasoning: false,
16988
- input: ["text"],
16989
- cost: {
16990
- input: 5,
16991
- output: 25,
16992
- cacheRead: 1.25,
16993
- cacheWrite: 0,
16994
- },
16995
- contextWindow: 131072,
16996
- maxTokens: 8192,
16997
- },
16998
- "grok-3-latest": {
16999
- id: "grok-3-latest",
17000
- name: "Grok 3 Latest",
17001
- api: "openai-completions",
17002
- provider: "xai",
17003
- baseUrl: "https://api.x.ai/v1",
17004
- reasoning: false,
17005
- input: ["text"],
17006
- cost: {
17007
- input: 3,
17008
- output: 15,
17009
- cacheRead: 0.75,
17010
- cacheWrite: 0,
17011
- },
17012
- contextWindow: 131072,
17013
- maxTokens: 8192,
17014
- },
17015
- "grok-3-mini": {
17016
- id: "grok-3-mini",
17017
- name: "Grok 3 Mini",
17018
- api: "openai-completions",
17019
- provider: "xai",
17020
- baseUrl: "https://api.x.ai/v1",
17021
- reasoning: true,
17022
- input: ["text"],
17023
- cost: {
17024
- input: 0.3,
17025
- output: 0.5,
17026
- cacheRead: 0.075,
17027
- cacheWrite: 0,
17028
- },
17029
- contextWindow: 131072,
17030
- maxTokens: 8192,
17031
- },
17032
- "grok-3-mini-fast": {
17033
- id: "grok-3-mini-fast",
17034
- name: "Grok 3 Mini Fast",
17035
- api: "openai-completions",
17036
- provider: "xai",
17037
- baseUrl: "https://api.x.ai/v1",
17038
- reasoning: true,
17039
- input: ["text"],
17040
- cost: {
17041
- input: 0.6,
17042
- output: 4,
17043
- cacheRead: 0.15,
17044
- cacheWrite: 0,
17045
- },
17046
- contextWindow: 131072,
17047
- maxTokens: 8192,
17048
- },
17049
- "grok-3-mini-fast-latest": {
17050
- id: "grok-3-mini-fast-latest",
17051
- name: "Grok 3 Mini Fast Latest",
17052
- api: "openai-completions",
17053
- provider: "xai",
17054
- baseUrl: "https://api.x.ai/v1",
17055
- reasoning: true,
17056
- input: ["text"],
17057
- cost: {
17058
- input: 0.6,
17059
- output: 4,
17060
- cacheRead: 0.15,
17061
- cacheWrite: 0,
17062
- },
17063
- contextWindow: 131072,
17064
- maxTokens: 8192,
17065
- },
17066
- "grok-3-mini-latest": {
17067
- id: "grok-3-mini-latest",
17068
- name: "Grok 3 Mini Latest",
17069
- api: "openai-completions",
17070
- provider: "xai",
17071
- baseUrl: "https://api.x.ai/v1",
17072
- reasoning: true,
17073
- input: ["text"],
17074
- cost: {
17075
- input: 0.3,
17076
- output: 0.5,
17077
- cacheRead: 0.075,
17078
- cacheWrite: 0,
17079
- },
17080
- contextWindow: 131072,
17081
- maxTokens: 8192,
17082
- },
17083
- "grok-4": {
17084
- id: "grok-4",
17085
- name: "Grok 4",
17086
- api: "openai-completions",
17087
- provider: "xai",
17088
- baseUrl: "https://api.x.ai/v1",
17089
- reasoning: true,
17090
- input: ["text"],
17091
- cost: {
17092
- input: 3,
17093
- output: 15,
17094
- cacheRead: 0.75,
17095
- cacheWrite: 0,
17096
- },
17097
- contextWindow: 256000,
17098
- maxTokens: 64000,
17099
- },
17100
- "grok-4-1-fast": {
17101
- id: "grok-4-1-fast",
17102
- name: "Grok 4.1 Fast",
17103
- api: "openai-completions",
17104
- provider: "xai",
17105
- baseUrl: "https://api.x.ai/v1",
17106
- reasoning: true,
17107
- input: ["text", "image"],
17108
- cost: {
17109
- input: 0.2,
17110
- output: 0.5,
17111
- cacheRead: 0.05,
17112
- cacheWrite: 0,
17113
- },
17114
- contextWindow: 2000000,
17115
- maxTokens: 30000,
17116
- },
17117
- "grok-4-1-fast-non-reasoning": {
17118
- id: "grok-4-1-fast-non-reasoning",
17119
- name: "Grok 4.1 Fast (Non-Reasoning)",
17120
- api: "openai-completions",
17121
- provider: "xai",
17122
- baseUrl: "https://api.x.ai/v1",
17123
- reasoning: false,
17124
- input: ["text", "image"],
17125
- cost: {
17126
- input: 0.2,
17127
- output: 0.5,
17128
- cacheRead: 0.05,
17129
- cacheWrite: 0,
17130
- },
17131
- contextWindow: 2000000,
17132
- maxTokens: 30000,
17133
- },
17134
- "grok-4-fast": {
17135
- id: "grok-4-fast",
17136
- name: "Grok 4 Fast",
17137
- api: "openai-completions",
17138
- provider: "xai",
17139
- baseUrl: "https://api.x.ai/v1",
17140
- reasoning: true,
17141
- input: ["text", "image"],
17142
- cost: {
17143
- input: 0.2,
17144
- output: 0.5,
17145
- cacheRead: 0.05,
17146
- cacheWrite: 0,
17147
- },
17148
- contextWindow: 2000000,
17149
- maxTokens: 30000,
17150
- },
17151
- "grok-4-fast-non-reasoning": {
17152
- id: "grok-4-fast-non-reasoning",
17153
- name: "Grok 4 Fast (Non-Reasoning)",
17154
- api: "openai-completions",
17155
- provider: "xai",
17156
- baseUrl: "https://api.x.ai/v1",
17157
- reasoning: false,
17158
- input: ["text", "image"],
17159
- cost: {
17160
- input: 0.2,
17161
- output: 0.5,
17162
- cacheRead: 0.05,
17163
- cacheWrite: 0,
17164
- },
17165
- contextWindow: 2000000,
17166
- maxTokens: 30000,
17167
- },
17168
16651
  "grok-4.20-0309-non-reasoning": {
17169
16652
  id: "grok-4.20-0309-non-reasoning",
17170
16653
  name: "Grok 4.20 (Non-Reasoning)",
@@ -17174,8 +16657,8 @@ export const MODELS = {
17174
16657
  reasoning: false,
17175
16658
  input: ["text", "image"],
17176
16659
  cost: {
17177
- input: 2,
17178
- output: 6,
16660
+ input: 1.25,
16661
+ output: 2.5,
17179
16662
  cacheRead: 0.2,
17180
16663
  cacheWrite: 0,
17181
16664
  },
@@ -17191,8 +16674,8 @@ export const MODELS = {
17191
16674
  reasoning: true,
17192
16675
  input: ["text", "image"],
17193
16676
  cost: {
17194
- input: 2,
17195
- output: 6,
16677
+ input: 1.25,
16678
+ output: 2.5,
17196
16679
  cacheRead: 0.2,
17197
16680
  cacheWrite: 0,
17198
16681
  },
@@ -17216,22 +16699,22 @@ export const MODELS = {
17216
16699
  contextWindow: 1000000,
17217
16700
  maxTokens: 30000,
17218
16701
  },
17219
- "grok-beta": {
17220
- id: "grok-beta",
17221
- name: "Grok Beta",
16702
+ "grok-build-0.1": {
16703
+ id: "grok-build-0.1",
16704
+ name: "Grok Build 0.1",
17222
16705
  api: "openai-completions",
17223
16706
  provider: "xai",
17224
16707
  baseUrl: "https://api.x.ai/v1",
17225
- reasoning: false,
17226
- input: ["text"],
16708
+ reasoning: true,
16709
+ input: ["text", "image"],
17227
16710
  cost: {
17228
- input: 5,
17229
- output: 15,
17230
- cacheRead: 5,
16711
+ input: 1,
16712
+ output: 2,
16713
+ cacheRead: 0.2,
17231
16714
  cacheWrite: 0,
17232
16715
  },
17233
- contextWindow: 131072,
17234
- maxTokens: 4096,
16716
+ contextWindow: 256000,
16717
+ maxTokens: 256000,
17235
16718
  },
17236
16719
  "grok-code-fast-1": {
17237
16720
  id: "grok-code-fast-1",
@@ -17239,7 +16722,7 @@ export const MODELS = {
17239
16722
  api: "openai-completions",
17240
16723
  provider: "xai",
17241
16724
  baseUrl: "https://api.x.ai/v1",
17242
- reasoning: true,
16725
+ reasoning: false,
17243
16726
  input: ["text"],
17244
16727
  cost: {
17245
16728
  input: 0.2,
@@ -17247,25 +16730,8 @@ export const MODELS = {
17247
16730
  cacheRead: 0.02,
17248
16731
  cacheWrite: 0,
17249
16732
  },
17250
- contextWindow: 256000,
17251
- maxTokens: 10000,
17252
- },
17253
- "grok-vision-beta": {
17254
- id: "grok-vision-beta",
17255
- name: "Grok Vision Beta",
17256
- api: "openai-completions",
17257
- provider: "xai",
17258
- baseUrl: "https://api.x.ai/v1",
17259
- reasoning: false,
17260
- input: ["text", "image"],
17261
- cost: {
17262
- input: 5,
17263
- output: 15,
17264
- cacheRead: 5,
17265
- cacheWrite: 0,
17266
- },
17267
- contextWindow: 8192,
17268
- maxTokens: 4096,
16733
+ contextWindow: 32768,
16734
+ maxTokens: 8192,
17269
16735
  },
17270
16736
  },
17271
16737
  "xiaomi": {