@kolisachint/hoocode-ai 0.2.5 → 0.2.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -157,6 +157,23 @@ export const MODELS = {
157
157
  contextWindow: 1000000,
158
158
  maxTokens: 128000,
159
159
  },
160
+ "anthropic.claude-opus-4-8": {
161
+ id: "anthropic.claude-opus-4-8",
162
+ name: "Claude Opus 4.8",
163
+ api: "bedrock-converse-stream",
164
+ provider: "amazon-bedrock",
165
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
166
+ reasoning: true,
167
+ input: ["text", "image"],
168
+ cost: {
169
+ input: 5,
170
+ output: 25,
171
+ cacheRead: 0.5,
172
+ cacheWrite: 6.25,
173
+ },
174
+ contextWindow: 1000000,
175
+ maxTokens: 128000,
176
+ },
160
177
  "anthropic.claude-sonnet-4-5-20250929-v1:0": {
161
178
  id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
162
179
  name: "Claude Sonnet 4.5",
@@ -226,6 +243,23 @@ export const MODELS = {
226
243
  contextWindow: 1000000,
227
244
  maxTokens: 128000,
228
245
  },
246
+ "au.anthropic.claude-opus-4-8": {
247
+ id: "au.anthropic.claude-opus-4-8",
248
+ name: "Claude Opus 4.8 (AU)",
249
+ api: "bedrock-converse-stream",
250
+ provider: "amazon-bedrock",
251
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
252
+ reasoning: true,
253
+ input: ["text", "image"],
254
+ cost: {
255
+ input: 5,
256
+ output: 25,
257
+ cacheRead: 0.5,
258
+ cacheWrite: 6.25,
259
+ },
260
+ contextWindow: 1000000,
261
+ maxTokens: 128000,
262
+ },
229
263
  "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
230
264
  id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
231
265
  name: "Claude Sonnet 4.5 (AU)",
@@ -381,6 +415,23 @@ export const MODELS = {
381
415
  contextWindow: 1000000,
382
416
  maxTokens: 128000,
383
417
  },
418
+ "eu.anthropic.claude-opus-4-8": {
419
+ id: "eu.anthropic.claude-opus-4-8",
420
+ name: "Claude Opus 4.8 (EU)",
421
+ api: "bedrock-converse-stream",
422
+ provider: "amazon-bedrock",
423
+ baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
424
+ reasoning: true,
425
+ input: ["text", "image"],
426
+ cost: {
427
+ input: 5,
428
+ output: 25,
429
+ cacheRead: 0.5,
430
+ cacheWrite: 6.25,
431
+ },
432
+ contextWindow: 1000000,
433
+ maxTokens: 128000,
434
+ },
384
435
  "eu.anthropic.claude-sonnet-4-5-20250929-v1:0": {
385
436
  id: "eu.anthropic.claude-sonnet-4-5-20250929-v1:0",
386
437
  name: "Claude Sonnet 4.5 (EU)",
@@ -485,6 +536,23 @@ export const MODELS = {
485
536
  contextWindow: 1000000,
486
537
  maxTokens: 128000,
487
538
  },
539
+ "global.anthropic.claude-opus-4-8": {
540
+ id: "global.anthropic.claude-opus-4-8",
541
+ name: "Claude Opus 4.8 (Global)",
542
+ api: "bedrock-converse-stream",
543
+ provider: "amazon-bedrock",
544
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
545
+ reasoning: true,
546
+ input: ["text", "image"],
547
+ cost: {
548
+ input: 5,
549
+ output: 25,
550
+ cacheRead: 0.5,
551
+ cacheWrite: 6.25,
552
+ },
553
+ contextWindow: 1000000,
554
+ maxTokens: 128000,
555
+ },
488
556
  "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
489
557
  id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
490
558
  name: "Claude Sonnet 4.5 (Global)",
@@ -571,6 +639,23 @@ export const MODELS = {
571
639
  contextWindow: 1000000,
572
640
  maxTokens: 128000,
573
641
  },
642
+ "jp.anthropic.claude-opus-4-8": {
643
+ id: "jp.anthropic.claude-opus-4-8",
644
+ name: "Claude Opus 4.8 (JP)",
645
+ api: "bedrock-converse-stream",
646
+ provider: "amazon-bedrock",
647
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
648
+ reasoning: true,
649
+ input: ["text", "image"],
650
+ cost: {
651
+ input: 5,
652
+ output: 25,
653
+ cacheRead: 0.5,
654
+ cacheWrite: 6.25,
655
+ },
656
+ contextWindow: 1000000,
657
+ maxTokens: 128000,
658
+ },
574
659
  "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
575
660
  id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
576
661
  name: "Claude Sonnet 4.5 (JP)",
@@ -908,8 +993,8 @@ export const MODELS = {
908
993
  cacheRead: 0,
909
994
  cacheWrite: 0,
910
995
  },
911
- contextWindow: 256000,
912
- maxTokens: 256000,
996
+ contextWindow: 262143,
997
+ maxTokens: 16000,
913
998
  },
914
999
  "moonshotai.kimi-k2.5": {
915
1000
  id: "moonshotai.kimi-k2.5",
@@ -925,8 +1010,8 @@ export const MODELS = {
925
1010
  cacheRead: 0,
926
1011
  cacheWrite: 0,
927
1012
  },
928
- contextWindow: 256000,
929
- maxTokens: 256000,
1013
+ contextWindow: 262143,
1014
+ maxTokens: 16000,
930
1015
  },
931
1016
  "nvidia.nemotron-nano-12b-v2": {
932
1017
  id: "nvidia.nemotron-nano-12b-v2",
@@ -1270,6 +1355,23 @@ export const MODELS = {
1270
1355
  contextWindow: 1000000,
1271
1356
  maxTokens: 128000,
1272
1357
  },
1358
+ "us.anthropic.claude-opus-4-8": {
1359
+ id: "us.anthropic.claude-opus-4-8",
1360
+ name: "Claude Opus 4.8 (US)",
1361
+ api: "bedrock-converse-stream",
1362
+ provider: "amazon-bedrock",
1363
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1364
+ reasoning: true,
1365
+ input: ["text", "image"],
1366
+ cost: {
1367
+ input: 5,
1368
+ output: 25,
1369
+ cacheRead: 0.5,
1370
+ cacheWrite: 6.25,
1371
+ },
1372
+ contextWindow: 1000000,
1373
+ maxTokens: 128000,
1374
+ },
1273
1375
  "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1274
1376
  id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1275
1377
  name: "Claude Sonnet 4.5 (US)",
@@ -1750,6 +1852,23 @@ export const MODELS = {
1750
1852
  contextWindow: 1000000,
1751
1853
  maxTokens: 128000,
1752
1854
  },
1855
+ "claude-opus-4-8": {
1856
+ id: "claude-opus-4-8",
1857
+ name: "Claude Opus 4.8",
1858
+ api: "anthropic-messages",
1859
+ provider: "anthropic",
1860
+ baseUrl: "https://api.anthropic.com",
1861
+ reasoning: true,
1862
+ input: ["text", "image"],
1863
+ cost: {
1864
+ input: 5,
1865
+ output: 25,
1866
+ cacheRead: 0.5,
1867
+ cacheWrite: 6.25,
1868
+ },
1869
+ contextWindow: 1000000,
1870
+ maxTokens: 128000,
1871
+ },
1753
1872
  "claude-sonnet-4-0": {
1754
1873
  id: "claude-sonnet-4-0",
1755
1874
  name: "Claude Sonnet 4 (latest)",
@@ -1916,7 +2035,7 @@ export const MODELS = {
1916
2035
  cost: {
1917
2036
  input: 0.1,
1918
2037
  output: 0.4,
1919
- cacheRead: 0.03,
2038
+ cacheRead: 0.025,
1920
2039
  cacheWrite: 0,
1921
2040
  },
1922
2041
  contextWindow: 1047576,
@@ -2001,7 +2120,7 @@ export const MODELS = {
2001
2120
  cost: {
2002
2121
  input: 0.15,
2003
2122
  output: 0.6,
2004
- cacheRead: 0.08,
2123
+ cacheRead: 0.075,
2005
2124
  cacheWrite: 0,
2006
2125
  },
2007
2126
  contextWindow: 128000,
@@ -2127,7 +2246,7 @@ export const MODELS = {
2127
2246
  cost: {
2128
2247
  input: 1.25,
2129
2248
  output: 10,
2130
- cacheRead: 0.13,
2249
+ cacheRead: 0.125,
2131
2250
  cacheWrite: 0,
2132
2251
  },
2133
2252
  contextWindow: 400000,
@@ -2552,7 +2671,7 @@ export const MODELS = {
2552
2671
  cost: {
2553
2672
  input: 1.1,
2554
2673
  output: 4.4,
2555
- cacheRead: 0.28,
2674
+ cacheRead: 0.275,
2556
2675
  cacheWrite: 0,
2557
2676
  },
2558
2677
  contextWindow: 200000,
@@ -2611,23 +2730,6 @@ export const MODELS = {
2611
2730
  contextWindow: 32000,
2612
2731
  maxTokens: 8000,
2613
2732
  },
2614
- "qwen-3-235b-a22b-instruct-2507": {
2615
- id: "qwen-3-235b-a22b-instruct-2507",
2616
- name: "Qwen 3 235B Instruct",
2617
- api: "openai-completions",
2618
- provider: "cerebras",
2619
- baseUrl: "https://api.cerebras.ai/v1",
2620
- reasoning: false,
2621
- input: ["text"],
2622
- cost: {
2623
- input: 0.6,
2624
- output: 1.2,
2625
- cacheRead: 0,
2626
- cacheWrite: 0,
2627
- },
2628
- contextWindow: 131000,
2629
- maxTokens: 32000,
2630
- },
2631
2733
  "zai-glm-4.7": {
2632
2734
  id: "zai-glm-4.7",
2633
2735
  name: "Z.AI GLM-4.7",
@@ -3275,6 +3377,42 @@ export const MODELS = {
3275
3377
  contextWindow: 256000,
3276
3378
  maxTokens: 16384,
3277
3379
  },
3380
+ "@cf/ibm-granite/granite-4.0-h-micro": {
3381
+ id: "@cf/ibm-granite/granite-4.0-h-micro",
3382
+ name: "Granite 4.0 H Micro",
3383
+ api: "openai-completions",
3384
+ provider: "cloudflare-workers-ai",
3385
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3386
+ compat: { "sendSessionAffinityHeaders": true },
3387
+ reasoning: false,
3388
+ input: ["text"],
3389
+ cost: {
3390
+ input: 0.017,
3391
+ output: 0.112,
3392
+ cacheRead: 0,
3393
+ cacheWrite: 0,
3394
+ },
3395
+ contextWindow: 131000,
3396
+ maxTokens: 131000,
3397
+ },
3398
+ "@cf/meta/llama-3.3-70b-instruct-fp8-fast": {
3399
+ id: "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
3400
+ name: "Llama 3.3 70B Instruct fp8 Fast",
3401
+ api: "openai-completions",
3402
+ provider: "cloudflare-workers-ai",
3403
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3404
+ compat: { "sendSessionAffinityHeaders": true },
3405
+ reasoning: false,
3406
+ input: ["text"],
3407
+ cost: {
3408
+ input: 0.293,
3409
+ output: 2.253,
3410
+ cacheRead: 0,
3411
+ cacheWrite: 0,
3412
+ },
3413
+ contextWindow: 24000,
3414
+ maxTokens: 24000,
3415
+ },
3278
3416
  "@cf/meta/llama-4-scout-17b-16e-instruct": {
3279
3417
  id: "@cf/meta/llama-4-scout-17b-16e-instruct",
3280
3418
  name: "Llama 4 Scout 17B 16E Instruct",
@@ -3290,9 +3428,27 @@ export const MODELS = {
3290
3428
  cacheRead: 0,
3291
3429
  cacheWrite: 0,
3292
3430
  },
3293
- contextWindow: 128000,
3431
+ contextWindow: 131000,
3294
3432
  maxTokens: 16384,
3295
3433
  },
3434
+ "@cf/mistralai/mistral-small-3.1-24b-instruct": {
3435
+ id: "@cf/mistralai/mistral-small-3.1-24b-instruct",
3436
+ name: "Mistral Small 3.1 24B Instruct",
3437
+ api: "openai-completions",
3438
+ provider: "cloudflare-workers-ai",
3439
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3440
+ compat: { "sendSessionAffinityHeaders": true },
3441
+ reasoning: false,
3442
+ input: ["text"],
3443
+ cost: {
3444
+ input: 0.351,
3445
+ output: 0.555,
3446
+ cacheRead: 0,
3447
+ cacheWrite: 0,
3448
+ },
3449
+ contextWindow: 128000,
3450
+ maxTokens: 128000,
3451
+ },
3296
3452
  "@cf/moonshotai/kimi-k2.5": {
3297
3453
  id: "@cf/moonshotai/kimi-k2.5",
3298
3454
  name: "Kimi K2.5",
@@ -3326,7 +3482,7 @@ export const MODELS = {
3326
3482
  cacheRead: 0.16,
3327
3483
  cacheWrite: 0,
3328
3484
  },
3329
- contextWindow: 256000,
3485
+ contextWindow: 262144,
3330
3486
  maxTokens: 256000,
3331
3487
  },
3332
3488
  "@cf/nvidia/nemotron-3-120b-a12b": {
@@ -3383,6 +3539,24 @@ export const MODELS = {
3383
3539
  contextWindow: 128000,
3384
3540
  maxTokens: 16384,
3385
3541
  },
3542
+ "@cf/qwen/qwen3-30b-a3b-fp8": {
3543
+ id: "@cf/qwen/qwen3-30b-a3b-fp8",
3544
+ name: "Qwen3 30B A3b fp8",
3545
+ api: "openai-completions",
3546
+ provider: "cloudflare-workers-ai",
3547
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3548
+ compat: { "sendSessionAffinityHeaders": true },
3549
+ reasoning: true,
3550
+ input: ["text"],
3551
+ cost: {
3552
+ input: 0.0509,
3553
+ output: 0.335,
3554
+ cacheRead: 0,
3555
+ cacheWrite: 0,
3556
+ },
3557
+ contextWindow: 32768,
3558
+ maxTokens: 32768,
3559
+ },
3386
3560
  "@cf/zai-org/glm-4.7-flash": {
3387
3561
  id: "@cf/zai-org/glm-4.7-flash",
3388
3562
  name: "GLM-4.7-Flash",
@@ -3393,7 +3567,7 @@ export const MODELS = {
3393
3567
  reasoning: true,
3394
3568
  input: ["text"],
3395
3569
  cost: {
3396
- input: 0.06,
3570
+ input: 0.0605,
3397
3571
  output: 0.4,
3398
3572
  cacheRead: 0,
3399
3573
  cacheWrite: 0,
@@ -3443,39 +3617,22 @@ export const MODELS = {
3443
3617
  },
3444
3618
  },
3445
3619
  "fireworks": {
3446
- "accounts/fireworks/models/deepseek-v3p1": {
3447
- id: "accounts/fireworks/models/deepseek-v3p1",
3448
- name: "DeepSeek V3.1",
3449
- api: "anthropic-messages",
3450
- provider: "fireworks",
3451
- baseUrl: "https://api.fireworks.ai/inference",
3452
- reasoning: true,
3453
- input: ["text"],
3454
- cost: {
3455
- input: 0.56,
3456
- output: 1.68,
3457
- cacheRead: 0,
3458
- cacheWrite: 0,
3459
- },
3460
- contextWindow: 163840,
3461
- maxTokens: 163840,
3462
- },
3463
- "accounts/fireworks/models/deepseek-v3p2": {
3464
- id: "accounts/fireworks/models/deepseek-v3p2",
3465
- name: "DeepSeek V3.2",
3620
+ "accounts/fireworks/models/deepseek-v4-flash": {
3621
+ id: "accounts/fireworks/models/deepseek-v4-flash",
3622
+ name: "DeepSeek V4 Flash",
3466
3623
  api: "anthropic-messages",
3467
3624
  provider: "fireworks",
3468
3625
  baseUrl: "https://api.fireworks.ai/inference",
3469
3626
  reasoning: true,
3470
3627
  input: ["text"],
3471
3628
  cost: {
3472
- input: 0.56,
3473
- output: 1.68,
3474
- cacheRead: 0.28,
3629
+ input: 0.14,
3630
+ output: 0.28,
3631
+ cacheRead: 0.03,
3475
3632
  cacheWrite: 0,
3476
3633
  },
3477
- contextWindow: 160000,
3478
- maxTokens: 160000,
3634
+ contextWindow: 1000000,
3635
+ maxTokens: 384000,
3479
3636
  },
3480
3637
  "accounts/fireworks/models/deepseek-v4-pro": {
3481
3638
  id: "accounts/fireworks/models/deepseek-v4-pro",
@@ -3488,177 +3645,75 @@ export const MODELS = {
3488
3645
  cost: {
3489
3646
  input: 1.74,
3490
3647
  output: 3.48,
3491
- cacheRead: 0.15,
3648
+ cacheRead: 0.145,
3492
3649
  cacheWrite: 0,
3493
3650
  },
3494
3651
  contextWindow: 1000000,
3495
3652
  maxTokens: 384000,
3496
3653
  },
3497
- "accounts/fireworks/models/glm-4p5": {
3498
- id: "accounts/fireworks/models/glm-4p5",
3499
- name: "GLM 4.5",
3654
+ "accounts/fireworks/models/glm-5p1": {
3655
+ id: "accounts/fireworks/models/glm-5p1",
3656
+ name: "GLM 5.1",
3500
3657
  api: "anthropic-messages",
3501
3658
  provider: "fireworks",
3502
3659
  baseUrl: "https://api.fireworks.ai/inference",
3503
3660
  reasoning: true,
3504
3661
  input: ["text"],
3505
3662
  cost: {
3506
- input: 0.55,
3507
- output: 2.19,
3508
- cacheRead: 0,
3663
+ input: 1.4,
3664
+ output: 4.4,
3665
+ cacheRead: 0.26,
3509
3666
  cacheWrite: 0,
3510
3667
  },
3511
- contextWindow: 131072,
3668
+ contextWindow: 202800,
3512
3669
  maxTokens: 131072,
3513
3670
  },
3514
- "accounts/fireworks/models/glm-4p5-air": {
3515
- id: "accounts/fireworks/models/glm-4p5-air",
3516
- name: "GLM 4.5 Air",
3671
+ "accounts/fireworks/models/gpt-oss-120b": {
3672
+ id: "accounts/fireworks/models/gpt-oss-120b",
3673
+ name: "GPT OSS 120B",
3517
3674
  api: "anthropic-messages",
3518
3675
  provider: "fireworks",
3519
3676
  baseUrl: "https://api.fireworks.ai/inference",
3520
3677
  reasoning: true,
3521
3678
  input: ["text"],
3522
3679
  cost: {
3523
- input: 0.22,
3524
- output: 0.88,
3525
- cacheRead: 0,
3680
+ input: 0.15,
3681
+ output: 0.6,
3682
+ cacheRead: 0.015,
3526
3683
  cacheWrite: 0,
3527
3684
  },
3528
3685
  contextWindow: 131072,
3529
- maxTokens: 131072,
3686
+ maxTokens: 32768,
3530
3687
  },
3531
- "accounts/fireworks/models/glm-4p7": {
3532
- id: "accounts/fireworks/models/glm-4p7",
3533
- name: "GLM 4.7",
3688
+ "accounts/fireworks/models/gpt-oss-20b": {
3689
+ id: "accounts/fireworks/models/gpt-oss-20b",
3690
+ name: "GPT OSS 20B",
3534
3691
  api: "anthropic-messages",
3535
3692
  provider: "fireworks",
3536
3693
  baseUrl: "https://api.fireworks.ai/inference",
3537
3694
  reasoning: true,
3538
3695
  input: ["text"],
3539
3696
  cost: {
3540
- input: 0.6,
3541
- output: 2.2,
3542
- cacheRead: 0.3,
3697
+ input: 0.07,
3698
+ output: 0.3,
3699
+ cacheRead: 0.035,
3543
3700
  cacheWrite: 0,
3544
3701
  },
3545
- contextWindow: 198000,
3546
- maxTokens: 198000,
3702
+ contextWindow: 131072,
3703
+ maxTokens: 32768,
3547
3704
  },
3548
- "accounts/fireworks/models/glm-5": {
3549
- id: "accounts/fireworks/models/glm-5",
3550
- name: "GLM 5",
3705
+ "accounts/fireworks/models/kimi-k2p5": {
3706
+ id: "accounts/fireworks/models/kimi-k2p5",
3707
+ name: "Kimi K2.5",
3551
3708
  api: "anthropic-messages",
3552
3709
  provider: "fireworks",
3553
3710
  baseUrl: "https://api.fireworks.ai/inference",
3554
3711
  reasoning: true,
3555
- input: ["text"],
3712
+ input: ["text", "image"],
3556
3713
  cost: {
3557
- input: 1,
3558
- output: 3.2,
3559
- cacheRead: 0.5,
3560
- cacheWrite: 0,
3561
- },
3562
- contextWindow: 202752,
3563
- maxTokens: 131072,
3564
- },
3565
- "accounts/fireworks/models/glm-5p1": {
3566
- id: "accounts/fireworks/models/glm-5p1",
3567
- name: "GLM 5.1",
3568
- api: "anthropic-messages",
3569
- provider: "fireworks",
3570
- baseUrl: "https://api.fireworks.ai/inference",
3571
- reasoning: true,
3572
- input: ["text"],
3573
- cost: {
3574
- input: 1.4,
3575
- output: 4.4,
3576
- cacheRead: 0.26,
3577
- cacheWrite: 0,
3578
- },
3579
- contextWindow: 202800,
3580
- maxTokens: 131072,
3581
- },
3582
- "accounts/fireworks/models/gpt-oss-120b": {
3583
- id: "accounts/fireworks/models/gpt-oss-120b",
3584
- name: "GPT OSS 120B",
3585
- api: "anthropic-messages",
3586
- provider: "fireworks",
3587
- baseUrl: "https://api.fireworks.ai/inference",
3588
- reasoning: true,
3589
- input: ["text"],
3590
- cost: {
3591
- input: 0.15,
3592
- output: 0.6,
3593
- cacheRead: 0,
3594
- cacheWrite: 0,
3595
- },
3596
- contextWindow: 131072,
3597
- maxTokens: 32768,
3598
- },
3599
- "accounts/fireworks/models/gpt-oss-20b": {
3600
- id: "accounts/fireworks/models/gpt-oss-20b",
3601
- name: "GPT OSS 20B",
3602
- api: "anthropic-messages",
3603
- provider: "fireworks",
3604
- baseUrl: "https://api.fireworks.ai/inference",
3605
- reasoning: true,
3606
- input: ["text"],
3607
- cost: {
3608
- input: 0.05,
3609
- output: 0.2,
3610
- cacheRead: 0,
3611
- cacheWrite: 0,
3612
- },
3613
- contextWindow: 131072,
3614
- maxTokens: 32768,
3615
- },
3616
- "accounts/fireworks/models/kimi-k2-instruct": {
3617
- id: "accounts/fireworks/models/kimi-k2-instruct",
3618
- name: "Kimi K2 Instruct",
3619
- api: "anthropic-messages",
3620
- provider: "fireworks",
3621
- baseUrl: "https://api.fireworks.ai/inference",
3622
- reasoning: false,
3623
- input: ["text"],
3624
- cost: {
3625
- input: 1,
3626
- output: 3,
3627
- cacheRead: 0,
3628
- cacheWrite: 0,
3629
- },
3630
- contextWindow: 128000,
3631
- maxTokens: 16384,
3632
- },
3633
- "accounts/fireworks/models/kimi-k2-thinking": {
3634
- id: "accounts/fireworks/models/kimi-k2-thinking",
3635
- name: "Kimi K2 Thinking",
3636
- api: "anthropic-messages",
3637
- provider: "fireworks",
3638
- baseUrl: "https://api.fireworks.ai/inference",
3639
- reasoning: true,
3640
- input: ["text"],
3641
- cost: {
3642
- input: 0.6,
3643
- output: 2.5,
3644
- cacheRead: 0.3,
3645
- cacheWrite: 0,
3646
- },
3647
- contextWindow: 256000,
3648
- maxTokens: 256000,
3649
- },
3650
- "accounts/fireworks/models/kimi-k2p5": {
3651
- id: "accounts/fireworks/models/kimi-k2p5",
3652
- name: "Kimi K2.5",
3653
- api: "anthropic-messages",
3654
- provider: "fireworks",
3655
- baseUrl: "https://api.fireworks.ai/inference",
3656
- reasoning: true,
3657
- input: ["text", "image"],
3658
- cost: {
3659
- input: 0.6,
3660
- output: 3,
3661
- cacheRead: 0.1,
3714
+ input: 0.6,
3715
+ output: 3,
3716
+ cacheRead: 0.1,
3662
3717
  cacheWrite: 0,
3663
3718
  },
3664
3719
  contextWindow: 256000,
@@ -3681,23 +3736,6 @@ export const MODELS = {
3681
3736
  contextWindow: 262000,
3682
3737
  maxTokens: 262000,
3683
3738
  },
3684
- "accounts/fireworks/models/minimax-m2p1": {
3685
- id: "accounts/fireworks/models/minimax-m2p1",
3686
- name: "MiniMax-M2.1",
3687
- api: "anthropic-messages",
3688
- provider: "fireworks",
3689
- baseUrl: "https://api.fireworks.ai/inference",
3690
- reasoning: true,
3691
- input: ["text"],
3692
- cost: {
3693
- input: 0.3,
3694
- output: 1.2,
3695
- cacheRead: 0.03,
3696
- cacheWrite: 0,
3697
- },
3698
- contextWindow: 200000,
3699
- maxTokens: 200000,
3700
- },
3701
3739
  "accounts/fireworks/models/minimax-m2p5": {
3702
3740
  id: "accounts/fireworks/models/minimax-m2p5",
3703
3741
  name: "MiniMax-M2.5",
@@ -3726,7 +3764,7 @@ export const MODELS = {
3726
3764
  cost: {
3727
3765
  input: 0.3,
3728
3766
  output: 1.2,
3729
- cacheRead: 0.03,
3767
+ cacheRead: 0.06,
3730
3768
  cacheWrite: 0,
3731
3769
  },
3732
3770
  contextWindow: 196608,
@@ -3749,22 +3787,39 @@ export const MODELS = {
3749
3787
  contextWindow: 128000,
3750
3788
  maxTokens: 8192,
3751
3789
  },
3752
- "accounts/fireworks/routers/kimi-k2p5-turbo": {
3753
- id: "accounts/fireworks/routers/kimi-k2p5-turbo",
3754
- name: "Kimi K2.5 Turbo",
3790
+ "accounts/fireworks/routers/glm-5p1-fast": {
3791
+ id: "accounts/fireworks/routers/glm-5p1-fast",
3792
+ name: "GLM 5.1 Fast",
3793
+ api: "anthropic-messages",
3794
+ provider: "fireworks",
3795
+ baseUrl: "https://api.fireworks.ai/inference",
3796
+ reasoning: true,
3797
+ input: ["text"],
3798
+ cost: {
3799
+ input: 2.8,
3800
+ output: 8.8,
3801
+ cacheRead: 0.52,
3802
+ cacheWrite: 0,
3803
+ },
3804
+ contextWindow: 202800,
3805
+ maxTokens: 131072,
3806
+ },
3807
+ "accounts/fireworks/routers/kimi-k2p6-turbo": {
3808
+ id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3809
+ name: "Kimi K2.6 Turbo",
3755
3810
  api: "anthropic-messages",
3756
3811
  provider: "fireworks",
3757
3812
  baseUrl: "https://api.fireworks.ai/inference",
3758
3813
  reasoning: true,
3759
3814
  input: ["text", "image"],
3760
3815
  cost: {
3761
- input: 0,
3762
- output: 0,
3763
- cacheRead: 0,
3816
+ input: 2,
3817
+ output: 8,
3818
+ cacheRead: 0.3,
3764
3819
  cacheWrite: 0,
3765
3820
  },
3766
- contextWindow: 256000,
3767
- maxTokens: 256000,
3821
+ contextWindow: 262000,
3822
+ maxTokens: 262000,
3768
3823
  },
3769
3824
  },
3770
3825
  "github-copilot": {
@@ -3784,8 +3839,8 @@ export const MODELS = {
3784
3839
  cacheRead: 0,
3785
3840
  cacheWrite: 0,
3786
3841
  },
3787
- contextWindow: 144000,
3788
- maxTokens: 32000,
3842
+ contextWindow: 200000,
3843
+ maxTokens: 64000,
3789
3844
  },
3790
3845
  "claude-opus-4.5": {
3791
3846
  id: "claude-opus-4.5",
@@ -3802,7 +3857,7 @@ export const MODELS = {
3802
3857
  cacheRead: 0,
3803
3858
  cacheWrite: 0,
3804
3859
  },
3805
- contextWindow: 160000,
3860
+ contextWindow: 200000,
3806
3861
  maxTokens: 32000,
3807
3862
  },
3808
3863
  "claude-opus-4.6": {
@@ -3822,7 +3877,7 @@ export const MODELS = {
3822
3877
  cacheWrite: 0,
3823
3878
  },
3824
3879
  contextWindow: 1000000,
3825
- maxTokens: 64000,
3880
+ maxTokens: 32000,
3826
3881
  },
3827
3882
  "claude-opus-4.7": {
3828
3883
  id: "claude-opus-4.7",
@@ -3840,7 +3895,25 @@ export const MODELS = {
3840
3895
  cacheRead: 0,
3841
3896
  cacheWrite: 0,
3842
3897
  },
3843
- contextWindow: 144000,
3898
+ contextWindow: 200000,
3899
+ maxTokens: 32000,
3900
+ },
3901
+ "claude-opus-4.8": {
3902
+ id: "claude-opus-4.8",
3903
+ name: "Claude Opus 4.8",
3904
+ api: "anthropic-messages",
3905
+ provider: "github-copilot",
3906
+ baseUrl: "https://api.individual.githubcopilot.com",
3907
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3908
+ reasoning: true,
3909
+ input: ["text", "image"],
3910
+ cost: {
3911
+ input: 0,
3912
+ output: 0,
3913
+ cacheRead: 0,
3914
+ cacheWrite: 0,
3915
+ },
3916
+ contextWindow: 200000,
3844
3917
  maxTokens: 64000,
3845
3918
  },
3846
3919
  "claude-sonnet-4.5": {
@@ -3859,7 +3932,7 @@ export const MODELS = {
3859
3932
  cacheRead: 0,
3860
3933
  cacheWrite: 0,
3861
3934
  },
3862
- contextWindow: 144000,
3935
+ contextWindow: 200000,
3863
3936
  maxTokens: 32000,
3864
3937
  },
3865
3938
  "claude-sonnet-4.6": {
@@ -3934,7 +4007,26 @@ export const MODELS = {
3934
4007
  cacheRead: 0,
3935
4008
  cacheWrite: 0,
3936
4009
  },
3937
- contextWindow: 128000,
4010
+ contextWindow: 200000,
4011
+ maxTokens: 64000,
4012
+ },
4013
+ "gemini-3.5-flash": {
4014
+ id: "gemini-3.5-flash",
4015
+ name: "Gemini 3.5 Flash",
4016
+ api: "openai-completions",
4017
+ provider: "github-copilot",
4018
+ baseUrl: "https://api.individual.githubcopilot.com",
4019
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4020
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4021
+ reasoning: true,
4022
+ input: ["text", "image"],
4023
+ cost: {
4024
+ input: 0,
4025
+ output: 0,
4026
+ cacheRead: 0,
4027
+ cacheWrite: 0,
4028
+ },
4029
+ contextWindow: 200000,
3938
4030
  maxTokens: 64000,
3939
4031
  },
3940
4032
  "gpt-4.1": {
@@ -4010,8 +4102,8 @@ export const MODELS = {
4010
4102
  cacheRead: 0,
4011
4103
  cacheWrite: 0,
4012
4104
  },
4013
- contextWindow: 264000,
4014
- maxTokens: 64000,
4105
+ contextWindow: 400000,
4106
+ maxTokens: 128000,
4015
4107
  },
4016
4108
  "gpt-5.2-codex": {
4017
4109
  id: "gpt-5.2-codex",
@@ -4129,57 +4221,6 @@ export const MODELS = {
4129
4221
  },
4130
4222
  },
4131
4223
  "google": {
4132
- "gemini-1.5-flash": {
4133
- id: "gemini-1.5-flash",
4134
- name: "Gemini 1.5 Flash",
4135
- api: "google-generative-ai",
4136
- provider: "google",
4137
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4138
- reasoning: false,
4139
- input: ["text", "image"],
4140
- cost: {
4141
- input: 0.075,
4142
- output: 0.3,
4143
- cacheRead: 0.01875,
4144
- cacheWrite: 0,
4145
- },
4146
- contextWindow: 1000000,
4147
- maxTokens: 8192,
4148
- },
4149
- "gemini-1.5-flash-8b": {
4150
- id: "gemini-1.5-flash-8b",
4151
- name: "Gemini 1.5 Flash-8B",
4152
- api: "google-generative-ai",
4153
- provider: "google",
4154
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4155
- reasoning: false,
4156
- input: ["text", "image"],
4157
- cost: {
4158
- input: 0.0375,
4159
- output: 0.15,
4160
- cacheRead: 0.01,
4161
- cacheWrite: 0,
4162
- },
4163
- contextWindow: 1000000,
4164
- maxTokens: 8192,
4165
- },
4166
- "gemini-1.5-pro": {
4167
- id: "gemini-1.5-pro",
4168
- name: "Gemini 1.5 Pro",
4169
- api: "google-generative-ai",
4170
- provider: "google",
4171
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4172
- reasoning: false,
4173
- input: ["text", "image"],
4174
- cost: {
4175
- input: 1.25,
4176
- output: 5,
4177
- cacheRead: 0.3125,
4178
- cacheWrite: 0,
4179
- },
4180
- contextWindow: 1000000,
4181
- maxTokens: 8192,
4182
- },
4183
4224
  "gemini-2.0-flash": {
4184
4225
  id: "gemini-2.0-flash",
4185
4226
  name: "Gemini 2.0 Flash",
@@ -4199,7 +4240,7 @@ export const MODELS = {
4199
4240
  },
4200
4241
  "gemini-2.0-flash-lite": {
4201
4242
  id: "gemini-2.0-flash-lite",
4202
- name: "Gemini 2.0 Flash Lite",
4243
+ name: "Gemini 2.0 Flash-Lite",
4203
4244
  api: "google-generative-ai",
4204
4245
  provider: "google",
4205
4246
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4233,7 +4274,7 @@ export const MODELS = {
4233
4274
  },
4234
4275
  "gemini-2.5-flash-lite": {
4235
4276
  id: "gemini-2.5-flash-lite",
4236
- name: "Gemini 2.5 Flash Lite",
4277
+ name: "Gemini 2.5 Flash-Lite",
4237
4278
  api: "google-generative-ai",
4238
4279
  provider: "google",
4239
4280
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4248,168 +4289,49 @@ export const MODELS = {
4248
4289
  contextWindow: 1048576,
4249
4290
  maxTokens: 65536,
4250
4291
  },
4251
- "gemini-2.5-flash-lite-preview-06-17": {
4252
- id: "gemini-2.5-flash-lite-preview-06-17",
4253
- name: "Gemini 2.5 Flash Lite Preview 06-17",
4292
+ "gemini-2.5-pro": {
4293
+ id: "gemini-2.5-pro",
4294
+ name: "Gemini 2.5 Pro",
4254
4295
  api: "google-generative-ai",
4255
4296
  provider: "google",
4256
4297
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4257
4298
  reasoning: true,
4258
4299
  input: ["text", "image"],
4259
4300
  cost: {
4260
- input: 0.1,
4261
- output: 0.4,
4262
- cacheRead: 0.025,
4301
+ input: 1.25,
4302
+ output: 10,
4303
+ cacheRead: 0.125,
4263
4304
  cacheWrite: 0,
4264
4305
  },
4265
4306
  contextWindow: 1048576,
4266
4307
  maxTokens: 65536,
4267
4308
  },
4268
- "gemini-2.5-flash-lite-preview-09-2025": {
4269
- id: "gemini-2.5-flash-lite-preview-09-2025",
4270
- name: "Gemini 2.5 Flash Lite Preview 09-25",
4309
+ "gemini-3-flash-preview": {
4310
+ id: "gemini-3-flash-preview",
4311
+ name: "Gemini 3 Flash Preview",
4271
4312
  api: "google-generative-ai",
4272
4313
  provider: "google",
4273
4314
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4274
4315
  reasoning: true,
4316
+ thinkingLevelMap: { "off": null },
4275
4317
  input: ["text", "image"],
4276
4318
  cost: {
4277
- input: 0.1,
4278
- output: 0.4,
4279
- cacheRead: 0.025,
4319
+ input: 0.5,
4320
+ output: 3,
4321
+ cacheRead: 0.05,
4280
4322
  cacheWrite: 0,
4281
4323
  },
4282
4324
  contextWindow: 1048576,
4283
4325
  maxTokens: 65536,
4284
4326
  },
4285
- "gemini-2.5-flash-preview-04-17": {
4286
- id: "gemini-2.5-flash-preview-04-17",
4287
- name: "Gemini 2.5 Flash Preview 04-17",
4327
+ "gemini-3-pro-preview": {
4328
+ id: "gemini-3-pro-preview",
4329
+ name: "Gemini 3 Pro Preview",
4288
4330
  api: "google-generative-ai",
4289
4331
  provider: "google",
4290
4332
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4291
4333
  reasoning: true,
4292
- input: ["text", "image"],
4293
- cost: {
4294
- input: 0.15,
4295
- output: 0.6,
4296
- cacheRead: 0.0375,
4297
- cacheWrite: 0,
4298
- },
4299
- contextWindow: 1048576,
4300
- maxTokens: 65536,
4301
- },
4302
- "gemini-2.5-flash-preview-05-20": {
4303
- id: "gemini-2.5-flash-preview-05-20",
4304
- name: "Gemini 2.5 Flash Preview 05-20",
4305
- api: "google-generative-ai",
4306
- provider: "google",
4307
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4308
- reasoning: true,
4309
- input: ["text", "image"],
4310
- cost: {
4311
- input: 0.15,
4312
- output: 0.6,
4313
- cacheRead: 0.0375,
4314
- cacheWrite: 0,
4315
- },
4316
- contextWindow: 1048576,
4317
- maxTokens: 65536,
4318
- },
4319
- "gemini-2.5-flash-preview-09-2025": {
4320
- id: "gemini-2.5-flash-preview-09-2025",
4321
- name: "Gemini 2.5 Flash Preview 09-25",
4322
- api: "google-generative-ai",
4323
- provider: "google",
4324
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4325
- reasoning: true,
4326
- input: ["text", "image"],
4327
- cost: {
4328
- input: 0.3,
4329
- output: 2.5,
4330
- cacheRead: 0.075,
4331
- cacheWrite: 0,
4332
- },
4333
- contextWindow: 1048576,
4334
- maxTokens: 65536,
4335
- },
4336
- "gemini-2.5-pro": {
4337
- id: "gemini-2.5-pro",
4338
- name: "Gemini 2.5 Pro",
4339
- api: "google-generative-ai",
4340
- provider: "google",
4341
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4342
- reasoning: true,
4343
- input: ["text", "image"],
4344
- cost: {
4345
- input: 1.25,
4346
- output: 10,
4347
- cacheRead: 0.125,
4348
- cacheWrite: 0,
4349
- },
4350
- contextWindow: 1048576,
4351
- maxTokens: 65536,
4352
- },
4353
- "gemini-2.5-pro-preview-05-06": {
4354
- id: "gemini-2.5-pro-preview-05-06",
4355
- name: "Gemini 2.5 Pro Preview 05-06",
4356
- api: "google-generative-ai",
4357
- provider: "google",
4358
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4359
- reasoning: true,
4360
- input: ["text", "image"],
4361
- cost: {
4362
- input: 1.25,
4363
- output: 10,
4364
- cacheRead: 0.31,
4365
- cacheWrite: 0,
4366
- },
4367
- contextWindow: 1048576,
4368
- maxTokens: 65536,
4369
- },
4370
- "gemini-2.5-pro-preview-06-05": {
4371
- id: "gemini-2.5-pro-preview-06-05",
4372
- name: "Gemini 2.5 Pro Preview 06-05",
4373
- api: "google-generative-ai",
4374
- provider: "google",
4375
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4376
- reasoning: true,
4377
- input: ["text", "image"],
4378
- cost: {
4379
- input: 1.25,
4380
- output: 10,
4381
- cacheRead: 0.31,
4382
- cacheWrite: 0,
4383
- },
4384
- contextWindow: 1048576,
4385
- maxTokens: 65536,
4386
- },
4387
- "gemini-3-flash-preview": {
4388
- id: "gemini-3-flash-preview",
4389
- name: "Gemini 3 Flash Preview",
4390
- api: "google-generative-ai",
4391
- provider: "google",
4392
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4393
- reasoning: true,
4394
- thinkingLevelMap: { "off": null },
4395
- input: ["text", "image"],
4396
- cost: {
4397
- input: 0.5,
4398
- output: 3,
4399
- cacheRead: 0.05,
4400
- cacheWrite: 0,
4401
- },
4402
- contextWindow: 1048576,
4403
- maxTokens: 65536,
4404
- },
4405
- "gemini-3-pro-preview": {
4406
- id: "gemini-3-pro-preview",
4407
- name: "Gemini 3 Pro Preview",
4408
- api: "google-generative-ai",
4409
- provider: "google",
4410
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4411
- reasoning: true,
4412
- thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4334
+ thinkingLevelMap: { "off": null, "minimal": null, "low": "LOW", "medium": null, "high": "HIGH" },
4413
4335
  input: ["text", "image"],
4414
4336
  cost: {
4415
4337
  input: 2,
@@ -4417,8 +4339,8 @@ export const MODELS = {
4417
4339
  cacheRead: 0.2,
4418
4340
  cacheWrite: 0,
4419
4341
  },
4420
- contextWindow: 1000000,
4421
- maxTokens: 64000,
4342
+ contextWindow: 1048576,
4343
+ maxTokens: 65536,
4422
4344
  },
4423
4345
  "gemini-3.1-flash-lite": {
4424
4346
  id: "gemini-3.1-flash-lite",
@@ -4492,6 +4414,24 @@ export const MODELS = {
4492
4414
  contextWindow: 1048576,
4493
4415
  maxTokens: 65536,
4494
4416
  },
4417
+ "gemini-3.5-flash": {
4418
+ id: "gemini-3.5-flash",
4419
+ name: "Gemini 3.5 Flash",
4420
+ api: "google-generative-ai",
4421
+ provider: "google",
4422
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4423
+ reasoning: true,
4424
+ thinkingLevelMap: { "off": null },
4425
+ input: ["text", "image"],
4426
+ cost: {
4427
+ input: 1.5,
4428
+ output: 9,
4429
+ cacheRead: 0.15,
4430
+ cacheWrite: 0,
4431
+ },
4432
+ contextWindow: 1048576,
4433
+ maxTokens: 65536,
4434
+ },
4495
4435
  "gemini-flash-latest": {
4496
4436
  id: "gemini-flash-latest",
4497
4437
  name: "Gemini Flash Latest",
@@ -4526,60 +4466,9 @@ export const MODELS = {
4526
4466
  contextWindow: 1048576,
4527
4467
  maxTokens: 65536,
4528
4468
  },
4529
- "gemini-live-2.5-flash": {
4530
- id: "gemini-live-2.5-flash",
4531
- name: "Gemini Live 2.5 Flash",
4532
- api: "google-generative-ai",
4533
- provider: "google",
4534
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4535
- reasoning: true,
4536
- input: ["text", "image"],
4537
- cost: {
4538
- input: 0.5,
4539
- output: 2,
4540
- cacheRead: 0,
4541
- cacheWrite: 0,
4542
- },
4543
- contextWindow: 128000,
4544
- maxTokens: 8000,
4545
- },
4546
- "gemini-live-2.5-flash-preview-native-audio": {
4547
- id: "gemini-live-2.5-flash-preview-native-audio",
4548
- name: "Gemini Live 2.5 Flash Preview Native Audio",
4549
- api: "google-generative-ai",
4550
- provider: "google",
4551
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4552
- reasoning: true,
4553
- input: ["text"],
4554
- cost: {
4555
- input: 0.5,
4556
- output: 2,
4557
- cacheRead: 0,
4558
- cacheWrite: 0,
4559
- },
4560
- contextWindow: 131072,
4561
- maxTokens: 65536,
4562
- },
4563
- "gemma-3-27b-it": {
4564
- id: "gemma-3-27b-it",
4565
- name: "Gemma 3 27B",
4566
- api: "google-generative-ai",
4567
- provider: "google",
4568
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4569
- reasoning: false,
4570
- input: ["text", "image"],
4571
- cost: {
4572
- input: 0,
4573
- output: 0,
4574
- cacheRead: 0,
4575
- cacheWrite: 0,
4576
- },
4577
- contextWindow: 131072,
4578
- maxTokens: 8192,
4579
- },
4580
4469
  "gemma-4-26b-a4b-it": {
4581
4470
  id: "gemma-4-26b-a4b-it",
4582
- name: "Gemma 4 26B",
4471
+ name: "Gemma 4 26B A4B IT",
4583
4472
  api: "google-generative-ai",
4584
4473
  provider: "google",
4585
4474
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4592,12 +4481,12 @@ export const MODELS = {
4592
4481
  cacheRead: 0,
4593
4482
  cacheWrite: 0,
4594
4483
  },
4595
- contextWindow: 256000,
4596
- maxTokens: 8192,
4484
+ contextWindow: 262144,
4485
+ maxTokens: 32768,
4597
4486
  },
4598
4487
  "gemma-4-31b-it": {
4599
4488
  id: "gemma-4-31b-it",
4600
- name: "Gemma 4 31B",
4489
+ name: "Gemma 4 31B IT",
4601
4490
  api: "google-generative-ai",
4602
4491
  provider: "google",
4603
4492
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4610,8 +4499,8 @@ export const MODELS = {
4610
4499
  cacheRead: 0,
4611
4500
  cacheWrite: 0,
4612
4501
  },
4613
- contextWindow: 256000,
4614
- maxTokens: 8192,
4502
+ contextWindow: 262144,
4503
+ maxTokens: 32768,
4615
4504
  },
4616
4505
  },
4617
4506
  "google-vertex": {
@@ -5057,7 +4946,7 @@ export const MODELS = {
5057
4946
  cost: {
5058
4947
  input: 1,
5059
4948
  output: 3,
5060
- cacheRead: 0,
4949
+ cacheRead: 0.5,
5061
4950
  cacheWrite: 0,
5062
4951
  },
5063
4952
  contextWindow: 262144,
@@ -5074,7 +4963,7 @@ export const MODELS = {
5074
4963
  cost: {
5075
4964
  input: 0.15,
5076
4965
  output: 0.6,
5077
- cacheRead: 0,
4966
+ cacheRead: 0.075,
5078
4967
  cacheWrite: 0,
5079
4968
  },
5080
4969
  contextWindow: 131072,
@@ -5091,7 +4980,7 @@ export const MODELS = {
5091
4980
  cost: {
5092
4981
  input: 0.075,
5093
4982
  output: 0.3,
5094
- cacheRead: 0,
4983
+ cacheRead: 0.0375,
5095
4984
  cacheWrite: 0,
5096
4985
  },
5097
4986
  contextWindow: 131072,
@@ -5377,9 +5266,9 @@ export const MODELS = {
5377
5266
  reasoning: true,
5378
5267
  input: ["text"],
5379
5268
  cost: {
5380
- input: 1.74,
5381
- output: 3.48,
5382
- cacheRead: 0.145,
5269
+ input: 0.435,
5270
+ output: 0.87,
5271
+ cacheRead: 0.003625,
5383
5272
  cacheWrite: 0,
5384
5273
  },
5385
5274
  contextWindow: 1048576,
@@ -6474,7 +6363,7 @@ export const MODELS = {
6474
6363
  cost: {
6475
6364
  input: 0.14,
6476
6365
  output: 0.28,
6477
- cacheRead: 0.028,
6366
+ cacheRead: 0.0028,
6478
6367
  cacheWrite: 0,
6479
6368
  },
6480
6369
  contextWindow: 1048576,
@@ -6491,9 +6380,9 @@ export const MODELS = {
6491
6380
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
6492
6381
  input: ["text"],
6493
6382
  cost: {
6494
- input: 1.74,
6495
- output: 3.48,
6496
- cacheRead: 0.145,
6383
+ input: 0.435,
6384
+ output: 0.87,
6385
+ cacheRead: 0.003625,
6497
6386
  cacheWrite: 0,
6498
6387
  },
6499
6388
  contextWindow: 1048576,
@@ -7362,7 +7251,7 @@ export const MODELS = {
7362
7251
  cost: {
7363
7252
  input: 0.1,
7364
7253
  output: 0.4,
7365
- cacheRead: 0.03,
7254
+ cacheRead: 0.025,
7366
7255
  cacheWrite: 0,
7367
7256
  },
7368
7257
  contextWindow: 1047576,
@@ -7447,7 +7336,7 @@ export const MODELS = {
7447
7336
  cost: {
7448
7337
  input: 0.15,
7449
7338
  output: 0.6,
7450
- cacheRead: 0.08,
7339
+ cacheRead: 0.075,
7451
7340
  cacheWrite: 0,
7452
7341
  },
7453
7342
  contextWindow: 128000,
@@ -7573,7 +7462,7 @@ export const MODELS = {
7573
7462
  cost: {
7574
7463
  input: 1.25,
7575
7464
  output: 10,
7576
- cacheRead: 0.13,
7465
+ cacheRead: 0.125,
7577
7466
  cacheWrite: 0,
7578
7467
  },
7579
7468
  contextWindow: 400000,
@@ -7998,7 +7887,7 @@ export const MODELS = {
7998
7887
  cost: {
7999
7888
  input: 1.1,
8000
7889
  output: 4.4,
8001
- cacheRead: 0.28,
7890
+ cacheRead: 0.275,
8002
7891
  cacheWrite: 0,
8003
7892
  },
8004
7893
  contextWindow: 200000,
@@ -8218,7 +8107,7 @@ export const MODELS = {
8218
8107
  cacheWrite: 0,
8219
8108
  },
8220
8109
  contextWindow: 200000,
8221
- maxTokens: 128000,
8110
+ maxTokens: 32000,
8222
8111
  },
8223
8112
  "claude-haiku-4-5": {
8224
8113
  id: "claude-haiku-4-5",
@@ -8307,6 +8196,23 @@ export const MODELS = {
8307
8196
  contextWindow: 1000000,
8308
8197
  maxTokens: 128000,
8309
8198
  },
8199
+ "claude-opus-4-8": {
8200
+ id: "claude-opus-4-8",
8201
+ name: "Claude Opus 4.8",
8202
+ api: "anthropic-messages",
8203
+ provider: "opencode",
8204
+ baseUrl: "https://opencode.ai/zen",
8205
+ reasoning: true,
8206
+ input: ["text", "image"],
8207
+ cost: {
8208
+ input: 5,
8209
+ output: 25,
8210
+ cacheRead: 0.5,
8211
+ cacheWrite: 6.25,
8212
+ },
8213
+ contextWindow: 1000000,
8214
+ maxTokens: 128000,
8215
+ },
8310
8216
  "claude-sonnet-4": {
8311
8217
  id: "claude-sonnet-4",
8312
8218
  name: "Claude Sonnet 4",
@@ -8374,8 +8280,8 @@ export const MODELS = {
8374
8280
  cacheRead: 0,
8375
8281
  cacheWrite: 0,
8376
8282
  },
8377
- contextWindow: 1000000,
8378
- maxTokens: 384000,
8283
+ contextWindow: 200000,
8284
+ maxTokens: 128000,
8379
8285
  },
8380
8286
  "gemini-3-flash": {
8381
8287
  id: "gemini-3-flash",
@@ -8413,6 +8319,24 @@ export const MODELS = {
8413
8319
  contextWindow: 1048576,
8414
8320
  maxTokens: 65536,
8415
8321
  },
8322
+ "gemini-3.5-flash": {
8323
+ id: "gemini-3.5-flash",
8324
+ name: "Gemini 3.5 Flash",
8325
+ api: "google-generative-ai",
8326
+ provider: "opencode",
8327
+ baseUrl: "https://opencode.ai/zen/v1",
8328
+ reasoning: true,
8329
+ thinkingLevelMap: { "off": null },
8330
+ input: ["text", "image"],
8331
+ cost: {
8332
+ input: 1.5,
8333
+ output: 9,
8334
+ cacheRead: 0.15,
8335
+ cacheWrite: 0,
8336
+ },
8337
+ contextWindow: 1048576,
8338
+ maxTokens: 65536,
8339
+ },
8416
8340
  "glm-5": {
8417
8341
  id: "glm-5",
8418
8342
  name: "GLM-5",
@@ -8735,6 +8659,23 @@ export const MODELS = {
8735
8659
  contextWindow: 1050000,
8736
8660
  maxTokens: 128000,
8737
8661
  },
8662
+ "grok-build-0.1": {
8663
+ id: "grok-build-0.1",
8664
+ name: "Grok Build 0.1",
8665
+ api: "openai-completions",
8666
+ provider: "opencode",
8667
+ baseUrl: "https://opencode.ai/zen/v1",
8668
+ reasoning: true,
8669
+ input: ["text", "image"],
8670
+ cost: {
8671
+ input: 1,
8672
+ output: 2,
8673
+ cacheRead: 0.2,
8674
+ cacheWrite: 0,
8675
+ },
8676
+ contextWindow: 256000,
8677
+ maxTokens: 256000,
8678
+ },
8738
8679
  "kimi-k2.5": {
8739
8680
  id: "kimi-k2.5",
8740
8681
  name: "Kimi K2.5",
@@ -8769,35 +8710,35 @@ export const MODELS = {
8769
8710
  contextWindow: 262144,
8770
8711
  maxTokens: 65536,
8771
8712
  },
8772
- "minimax-m2.5": {
8773
- id: "minimax-m2.5",
8774
- name: "MiniMax M2.5",
8713
+ "mimo-v2.5-free": {
8714
+ id: "mimo-v2.5-free",
8715
+ name: "MiMo V2.5 Free",
8775
8716
  api: "openai-completions",
8776
8717
  provider: "opencode",
8777
8718
  baseUrl: "https://opencode.ai/zen/v1",
8778
8719
  reasoning: true,
8779
- input: ["text"],
8720
+ input: ["text", "image"],
8780
8721
  cost: {
8781
- input: 0.3,
8782
- output: 1.2,
8783
- cacheRead: 0.06,
8722
+ input: 0,
8723
+ output: 0,
8724
+ cacheRead: 0,
8784
8725
  cacheWrite: 0,
8785
8726
  },
8786
- contextWindow: 204800,
8787
- maxTokens: 131072,
8727
+ contextWindow: 1000000,
8728
+ maxTokens: 128000,
8788
8729
  },
8789
- "minimax-m2.5-free": {
8790
- id: "minimax-m2.5-free",
8791
- name: "MiniMax M2.5 Free",
8792
- api: "anthropic-messages",
8730
+ "minimax-m2.5": {
8731
+ id: "minimax-m2.5",
8732
+ name: "MiniMax M2.5",
8733
+ api: "openai-completions",
8793
8734
  provider: "opencode",
8794
- baseUrl: "https://opencode.ai/zen",
8735
+ baseUrl: "https://opencode.ai/zen/v1",
8795
8736
  reasoning: true,
8796
8737
  input: ["text"],
8797
8738
  cost: {
8798
- input: 0,
8799
- output: 0,
8800
- cacheRead: 0,
8739
+ input: 0.3,
8740
+ output: 1.2,
8741
+ cacheRead: 0.06,
8801
8742
  cacheWrite: 0,
8802
8743
  },
8803
8744
  contextWindow: 204800,
@@ -8871,23 +8812,6 @@ export const MODELS = {
8871
8812
  contextWindow: 262144,
8872
8813
  maxTokens: 65536,
8873
8814
  },
8874
- "qwen3.6-plus-free": {
8875
- id: "qwen3.6-plus-free",
8876
- name: "Qwen3.6 Plus Free",
8877
- api: "anthropic-messages",
8878
- provider: "opencode",
8879
- baseUrl: "https://opencode.ai/zen",
8880
- reasoning: true,
8881
- input: ["text", "image"],
8882
- cost: {
8883
- input: 0,
8884
- output: 0,
8885
- cacheRead: 0,
8886
- cacheWrite: 0,
8887
- },
8888
- contextWindow: 262144,
8889
- maxTokens: 65536,
8890
- },
8891
8815
  },
8892
8816
  "opencode-go": {
8893
8817
  "deepseek-v4-flash": {
@@ -8968,6 +8892,7 @@ export const MODELS = {
8968
8892
  api: "openai-completions",
8969
8893
  provider: "opencode-go",
8970
8894
  baseUrl: "https://opencode.ai/zen/go/v1",
8895
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8971
8896
  reasoning: true,
8972
8897
  input: ["text", "image"],
8973
8898
  cost: {
@@ -8985,6 +8910,7 @@ export const MODELS = {
8985
8910
  api: "openai-completions",
8986
8911
  provider: "opencode-go",
8987
8912
  baseUrl: "https://opencode.ai/zen/go/v1",
8913
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8988
8914
  reasoning: true,
8989
8915
  input: ["text", "image"],
8990
8916
  cost: {
@@ -9005,9 +8931,9 @@ export const MODELS = {
9005
8931
  reasoning: true,
9006
8932
  input: ["text", "image"],
9007
8933
  cost: {
9008
- input: 0.4,
9009
- output: 2,
9010
- cacheRead: 0.08,
8934
+ input: 0.14,
8935
+ output: 0.28,
8936
+ cacheRead: 0.0028,
9011
8937
  cacheWrite: 0,
9012
8938
  },
9013
8939
  contextWindow: 1000000,
@@ -9022,9 +8948,9 @@ export const MODELS = {
9022
8948
  reasoning: true,
9023
8949
  input: ["text"],
9024
8950
  cost: {
9025
- input: 1,
9026
- output: 3,
9027
- cacheRead: 0.2,
8951
+ input: 1.74,
8952
+ output: 3.48,
8953
+ cacheRead: 0.0145,
9028
8954
  cacheWrite: 0,
9029
8955
  },
9030
8956
  contextWindow: 1048576,
@@ -9064,24 +8990,6 @@ export const MODELS = {
9064
8990
  contextWindow: 204800,
9065
8991
  maxTokens: 131072,
9066
8992
  },
9067
- "qwen3.5-plus": {
9068
- id: "qwen3.5-plus",
9069
- name: "Qwen3.5 Plus",
9070
- api: "openai-completions",
9071
- provider: "opencode-go",
9072
- baseUrl: "https://opencode.ai/zen/go/v1",
9073
- compat: { "thinkingFormat": "qwen" },
9074
- reasoning: true,
9075
- input: ["text", "image"],
9076
- cost: {
9077
- input: 0.2,
9078
- output: 1.2,
9079
- cacheRead: 0.02,
9080
- cacheWrite: 0.25,
9081
- },
9082
- contextWindow: 262144,
9083
- maxTokens: 65536,
9084
- },
9085
8993
  "qwen3.6-plus": {
9086
8994
  id: "qwen3.6-plus",
9087
8995
  name: "Qwen3.6 Plus",
@@ -9100,6 +9008,23 @@ export const MODELS = {
9100
9008
  contextWindow: 262144,
9101
9009
  maxTokens: 65536,
9102
9010
  },
9011
+ "qwen3.7-max": {
9012
+ id: "qwen3.7-max",
9013
+ name: "Qwen3.7 Max",
9014
+ api: "anthropic-messages",
9015
+ provider: "opencode-go",
9016
+ baseUrl: "https://opencode.ai/zen/go",
9017
+ reasoning: true,
9018
+ input: ["text"],
9019
+ cost: {
9020
+ input: 2.5,
9021
+ output: 7.5,
9022
+ cacheRead: 0.5,
9023
+ cacheWrite: 3.125,
9024
+ },
9025
+ contextWindow: 1000000,
9026
+ maxTokens: 65536,
9027
+ },
9103
9028
  },
9104
9029
  "openrouter": {
9105
9030
  "ai21/jamba-large-1.7": {
@@ -9119,23 +9044,6 @@ export const MODELS = {
9119
9044
  contextWindow: 256000,
9120
9045
  maxTokens: 4096,
9121
9046
  },
9122
- "alibaba/tongyi-deepresearch-30b-a3b": {
9123
- id: "alibaba/tongyi-deepresearch-30b-a3b",
9124
- name: "Tongyi DeepResearch 30B A3B",
9125
- api: "openai-completions",
9126
- provider: "openrouter",
9127
- baseUrl: "https://openrouter.ai/api/v1",
9128
- reasoning: true,
9129
- input: ["text"],
9130
- cost: {
9131
- input: 0.09,
9132
- output: 0.44999999999999996,
9133
- cacheRead: 0.09,
9134
- cacheWrite: 0,
9135
- },
9136
- contextWindow: 131072,
9137
- maxTokens: 131072,
9138
- },
9139
9047
  "amazon/nova-2-lite-v1": {
9140
9048
  id: "amazon/nova-2-lite-v1",
9141
9049
  name: "Amazon: Nova 2 Lite",
@@ -9395,6 +9303,40 @@ export const MODELS = {
9395
9303
  contextWindow: 1000000,
9396
9304
  maxTokens: 128000,
9397
9305
  },
9306
+ "anthropic/claude-opus-4.8": {
9307
+ id: "anthropic/claude-opus-4.8",
9308
+ name: "Anthropic: Claude Opus 4.8",
9309
+ api: "openai-completions",
9310
+ provider: "openrouter",
9311
+ baseUrl: "https://openrouter.ai/api/v1",
9312
+ reasoning: true,
9313
+ input: ["text", "image"],
9314
+ cost: {
9315
+ input: 5,
9316
+ output: 25,
9317
+ cacheRead: 0.5,
9318
+ cacheWrite: 6.25,
9319
+ },
9320
+ contextWindow: 1000000,
9321
+ maxTokens: 128000,
9322
+ },
9323
+ "anthropic/claude-opus-4.8-fast": {
9324
+ id: "anthropic/claude-opus-4.8-fast",
9325
+ name: "Anthropic: Claude Opus 4.8 (Fast)",
9326
+ api: "openai-completions",
9327
+ provider: "openrouter",
9328
+ baseUrl: "https://openrouter.ai/api/v1",
9329
+ reasoning: true,
9330
+ input: ["text", "image"],
9331
+ cost: {
9332
+ input: 10,
9333
+ output: 50,
9334
+ cacheRead: 1,
9335
+ cacheWrite: 12.5,
9336
+ },
9337
+ contextWindow: 1000000,
9338
+ maxTokens: 128000,
9339
+ },
9398
9340
  "anthropic/claude-sonnet-4": {
9399
9341
  id: "anthropic/claude-sonnet-4",
9400
9342
  name: "Anthropic: Claude Sonnet 4",
@@ -9446,23 +9388,6 @@ export const MODELS = {
9446
9388
  contextWindow: 1000000,
9447
9389
  maxTokens: 128000,
9448
9390
  },
9449
- "arcee-ai/trinity-large-preview": {
9450
- id: "arcee-ai/trinity-large-preview",
9451
- name: "Arcee AI: Trinity Large Preview",
9452
- api: "openai-completions",
9453
- provider: "openrouter",
9454
- baseUrl: "https://openrouter.ai/api/v1",
9455
- reasoning: false,
9456
- input: ["text"],
9457
- cost: {
9458
- input: 0.15,
9459
- output: 0.44999999999999996,
9460
- cacheRead: 0,
9461
- cacheWrite: 0,
9462
- },
9463
- contextWindow: 131000,
9464
- maxTokens: 4096,
9465
- },
9466
9391
  "arcee-ai/trinity-large-thinking": {
9467
9392
  id: "arcee-ai/trinity-large-thinking",
9468
9393
  name: "Arcee AI: Trinity Large Thinking",
@@ -9480,23 +9405,6 @@ export const MODELS = {
9480
9405
  contextWindow: 262144,
9481
9406
  maxTokens: 262144,
9482
9407
  },
9483
- "arcee-ai/trinity-large-thinking:free": {
9484
- id: "arcee-ai/trinity-large-thinking:free",
9485
- name: "Arcee AI: Trinity Large Thinking (free)",
9486
- api: "openai-completions",
9487
- provider: "openrouter",
9488
- baseUrl: "https://openrouter.ai/api/v1",
9489
- reasoning: true,
9490
- input: ["text"],
9491
- cost: {
9492
- input: 0,
9493
- output: 0,
9494
- cacheRead: 0,
9495
- cacheWrite: 0,
9496
- },
9497
- contextWindow: 262144,
9498
- maxTokens: 80000,
9499
- },
9500
9408
  "arcee-ai/trinity-mini": {
9501
9409
  id: "arcee-ai/trinity-mini",
9502
9410
  name: "Arcee AI: Trinity Mini",
@@ -9548,23 +9456,6 @@ export const MODELS = {
9548
9456
  contextWindow: 2000000,
9549
9457
  maxTokens: 30000,
9550
9458
  },
9551
- "baidu/cobuddy:free": {
9552
- id: "baidu/cobuddy:free",
9553
- name: "Baidu Qianfan: CoBuddy (free)",
9554
- api: "openai-completions",
9555
- provider: "openrouter",
9556
- baseUrl: "https://openrouter.ai/api/v1",
9557
- reasoning: true,
9558
- input: ["text"],
9559
- cost: {
9560
- input: 0,
9561
- output: 0,
9562
- cacheRead: 0,
9563
- cacheWrite: 0,
9564
- },
9565
- contextWindow: 131072,
9566
- maxTokens: 65536,
9567
- },
9568
9459
  "baidu/ernie-4.5-21b-a3b": {
9569
9460
  id: "baidu/ernie-4.5-21b-a3b",
9570
9461
  name: "Baidu: ERNIE 4.5 21B A3B",
@@ -9579,7 +9470,7 @@ export const MODELS = {
9579
9470
  cacheRead: 0,
9580
9471
  cacheWrite: 0,
9581
9472
  },
9582
- contextWindow: 120000,
9473
+ contextWindow: 131072,
9583
9474
  maxTokens: 8000,
9584
9475
  },
9585
9476
  "baidu/ernie-4.5-vl-28b-a3b": {
@@ -9596,7 +9487,7 @@ export const MODELS = {
9596
9487
  cacheRead: 0,
9597
9488
  cacheWrite: 0,
9598
9489
  },
9599
- contextWindow: 30000,
9490
+ contextWindow: 131072,
9600
9491
  maxTokens: 8000,
9601
9492
  },
9602
9493
  "bytedance-seed/seed-1.6": {
@@ -9710,13 +9601,13 @@ export const MODELS = {
9710
9601
  reasoning: false,
9711
9602
  input: ["text"],
9712
9603
  cost: {
9713
- input: 0.32,
9714
- output: 0.8899999999999999,
9604
+ input: 0.2288,
9605
+ output: 0.9144,
9715
9606
  cacheRead: 0,
9716
9607
  cacheWrite: 0,
9717
9608
  },
9718
- contextWindow: 163840,
9719
- maxTokens: 16384,
9609
+ contextWindow: 131072,
9610
+ maxTokens: 16000,
9720
9611
  },
9721
9612
  "deepseek/deepseek-chat-v3-0324": {
9722
9613
  id: "deepseek/deepseek-chat-v3-0324",
@@ -9766,7 +9657,7 @@ export const MODELS = {
9766
9657
  cacheRead: 0,
9767
9658
  cacheWrite: 0,
9768
9659
  },
9769
- contextWindow: 64000,
9660
+ contextWindow: 163840,
9770
9661
  maxTokens: 16000,
9771
9662
  },
9772
9663
  "deepseek/deepseek-r1-0528": {
@@ -9848,13 +9739,13 @@ export const MODELS = {
9848
9739
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
9849
9740
  input: ["text"],
9850
9741
  cost: {
9851
- input: 0.126,
9852
- output: 0.252,
9853
- cacheRead: 0.0252,
9742
+ input: 0.09999999999999999,
9743
+ output: 0.19999999999999998,
9744
+ cacheRead: 0.02,
9854
9745
  cacheWrite: 0,
9855
9746
  },
9856
9747
  contextWindow: 1048576,
9857
- maxTokens: 131072,
9748
+ maxTokens: 16384,
9858
9749
  },
9859
9750
  "deepseek/deepseek-v4-flash:free": {
9860
9751
  id: "deepseek/deepseek-v4-flash:free",
@@ -10129,6 +10020,23 @@ export const MODELS = {
10129
10020
  cacheRead: 0.19999999999999998,
10130
10021
  cacheWrite: 0.375,
10131
10022
  },
10023
+ contextWindow: 1048756,
10024
+ maxTokens: 65536,
10025
+ },
10026
+ "google/gemini-3.5-flash": {
10027
+ id: "google/gemini-3.5-flash",
10028
+ name: "Google: Gemini 3.5 Flash",
10029
+ api: "openai-completions",
10030
+ provider: "openrouter",
10031
+ baseUrl: "https://openrouter.ai/api/v1",
10032
+ reasoning: true,
10033
+ input: ["text", "image"],
10034
+ cost: {
10035
+ input: 1.5,
10036
+ output: 9,
10037
+ cacheRead: 0.15,
10038
+ cacheWrite: 0.08333333333333334,
10039
+ },
10132
10040
  contextWindow: 1048576,
10133
10041
  maxTokens: 65536,
10134
10042
  },
@@ -10277,9 +10185,9 @@ export const MODELS = {
10277
10185
  reasoning: false,
10278
10186
  input: ["text"],
10279
10187
  cost: {
10280
- input: 0.3,
10281
- output: 2.5,
10282
- cacheRead: 0.06,
10188
+ input: 0.075,
10189
+ output: 0.625,
10190
+ cacheRead: 0.015,
10283
10191
  cacheWrite: 0,
10284
10192
  },
10285
10193
  contextWindow: 262144,
@@ -10302,18 +10210,18 @@ export const MODELS = {
10302
10210
  contextWindow: 262144,
10303
10211
  maxTokens: 32768,
10304
10212
  },
10305
- "inclusionai/ring-2.6-1t:free": {
10306
- id: "inclusionai/ring-2.6-1t:free",
10307
- name: "inclusionAI: Ring-2.6-1T (free)",
10213
+ "inclusionai/ring-2.6-1t": {
10214
+ id: "inclusionai/ring-2.6-1t",
10215
+ name: "inclusionAI: Ring-2.6-1T",
10308
10216
  api: "openai-completions",
10309
10217
  provider: "openrouter",
10310
10218
  baseUrl: "https://openrouter.ai/api/v1",
10311
10219
  reasoning: true,
10312
10220
  input: ["text"],
10313
10221
  cost: {
10314
- input: 0,
10315
- output: 0,
10316
- cacheRead: 0,
10222
+ input: 0.075,
10223
+ output: 0.625,
10224
+ cacheRead: 0.015,
10317
10225
  cacheWrite: 0,
10318
10226
  },
10319
10227
  contextWindow: 262144,
@@ -10367,7 +10275,7 @@ export const MODELS = {
10367
10275
  cacheRead: 0,
10368
10276
  cacheWrite: 0,
10369
10277
  },
10370
- contextWindow: 16384,
10278
+ contextWindow: 131072,
10371
10279
  maxTokens: 16384,
10372
10280
  },
10373
10281
  "meta-llama/llama-3.3-70b-instruct": {
@@ -10401,7 +10309,7 @@ export const MODELS = {
10401
10309
  cacheRead: 0,
10402
10310
  cacheWrite: 0,
10403
10311
  },
10404
- contextWindow: 65536,
10312
+ contextWindow: 131072,
10405
10313
  maxTokens: 4096,
10406
10314
  },
10407
10315
  "meta-llama/llama-4-scout": {
@@ -10418,7 +10326,7 @@ export const MODELS = {
10418
10326
  cacheRead: 0,
10419
10327
  cacheWrite: 0,
10420
10328
  },
10421
- contextWindow: 327680,
10329
+ contextWindow: 10000000,
10422
10330
  maxTokens: 16384,
10423
10331
  },
10424
10332
  "minimax/minimax-m1": {
@@ -10452,7 +10360,7 @@ export const MODELS = {
10452
10360
  cacheRead: 0.03,
10453
10361
  cacheWrite: 0,
10454
10362
  },
10455
- contextWindow: 196608,
10363
+ contextWindow: 204800,
10456
10364
  maxTokens: 196608,
10457
10365
  },
10458
10366
  "minimax/minimax-m2.1": {
@@ -10469,7 +10377,7 @@ export const MODELS = {
10469
10377
  cacheRead: 0.03,
10470
10378
  cacheWrite: 0,
10471
10379
  },
10472
- contextWindow: 196608,
10380
+ contextWindow: 204800,
10473
10381
  maxTokens: 196608,
10474
10382
  },
10475
10383
  "minimax/minimax-m2.5": {
@@ -10486,7 +10394,7 @@ export const MODELS = {
10486
10394
  cacheRead: 0,
10487
10395
  cacheWrite: 0,
10488
10396
  },
10489
- contextWindow: 196608,
10397
+ contextWindow: 204800,
10490
10398
  maxTokens: 196608,
10491
10399
  },
10492
10400
  "minimax/minimax-m2.5:free": {
@@ -10503,7 +10411,7 @@ export const MODELS = {
10503
10411
  cacheRead: 0,
10504
10412
  cacheWrite: 0,
10505
10413
  },
10506
- contextWindow: 196608,
10414
+ contextWindow: 204800,
10507
10415
  maxTokens: 8192,
10508
10416
  },
10509
10417
  "minimax/minimax-m2.7": {
@@ -10520,7 +10428,7 @@ export const MODELS = {
10520
10428
  cacheRead: 0,
10521
10429
  cacheWrite: 0,
10522
10430
  },
10523
- contextWindow: 196608,
10431
+ contextWindow: 204800,
10524
10432
  maxTokens: 131072,
10525
10433
  },
10526
10434
  "mistralai/codestral-2508": {
@@ -10925,7 +10833,7 @@ export const MODELS = {
10925
10833
  cost: {
10926
10834
  input: 0.6,
10927
10835
  output: 2.5,
10928
- cacheRead: 0.15,
10836
+ cacheRead: 0,
10929
10837
  cacheWrite: 0,
10930
10838
  },
10931
10839
  contextWindow: 262144,
@@ -10962,9 +10870,26 @@ export const MODELS = {
10962
10870
  cacheRead: 0.25,
10963
10871
  cacheWrite: 0,
10964
10872
  },
10965
- contextWindow: 262142,
10873
+ contextWindow: 262144,
10966
10874
  maxTokens: 262142,
10967
10875
  },
10876
+ "moonshotai/kimi-k2.6:free": {
10877
+ id: "moonshotai/kimi-k2.6:free",
10878
+ name: "MoonshotAI: Kimi K2.6 (free)",
10879
+ api: "openai-completions",
10880
+ provider: "openrouter",
10881
+ baseUrl: "https://openrouter.ai/api/v1",
10882
+ reasoning: true,
10883
+ input: ["text", "image"],
10884
+ cost: {
10885
+ input: 0,
10886
+ output: 0,
10887
+ cacheRead: 0,
10888
+ cacheWrite: 0,
10889
+ },
10890
+ contextWindow: 262144,
10891
+ maxTokens: 4096,
10892
+ },
10968
10893
  "nex-agi/deepseek-v3.1-nex-n1": {
10969
10894
  id: "nex-agi/deepseek-v3.1-nex-n1",
10970
10895
  name: "Nex AGI: DeepSeek V3.1 Nex N1",
@@ -11064,7 +10989,7 @@ export const MODELS = {
11064
10989
  cacheRead: 0,
11065
10990
  cacheWrite: 0,
11066
10991
  },
11067
- contextWindow: 262144,
10992
+ contextWindow: 1000000,
11068
10993
  maxTokens: 4096,
11069
10994
  },
11070
10995
  "nvidia/nemotron-3-super-120b-a12b:free": {
@@ -11081,7 +11006,7 @@ export const MODELS = {
11081
11006
  cacheRead: 0,
11082
11007
  cacheWrite: 0,
11083
11008
  },
11084
- contextWindow: 262144,
11009
+ contextWindow: 1000000,
11085
11010
  maxTokens: 262144,
11086
11011
  },
11087
11012
  "nvidia/nemotron-nano-12b-v2-vl:free": {
@@ -11554,11 +11479,11 @@ export const MODELS = {
11554
11479
  cost: {
11555
11480
  input: 1.25,
11556
11481
  output: 10,
11557
- cacheRead: 0.125,
11482
+ cacheRead: 0.13,
11558
11483
  cacheWrite: 0,
11559
11484
  },
11560
11485
  contextWindow: 128000,
11561
- maxTokens: 16384,
11486
+ maxTokens: 32000,
11562
11487
  },
11563
11488
  "openai/gpt-5.1-codex": {
11564
11489
  id: "openai/gpt-5.1-codex",
@@ -11571,7 +11496,7 @@ export const MODELS = {
11571
11496
  cost: {
11572
11497
  input: 1.25,
11573
11498
  output: 10,
11574
- cacheRead: 0.125,
11499
+ cacheRead: 0.13,
11575
11500
  cacheWrite: 0,
11576
11501
  },
11577
11502
  contextWindow: 400000,
@@ -11605,11 +11530,11 @@ export const MODELS = {
11605
11530
  cost: {
11606
11531
  input: 0.25,
11607
11532
  output: 2,
11608
- cacheRead: 0.03,
11533
+ cacheRead: 0.024999999999999998,
11609
11534
  cacheWrite: 0,
11610
11535
  },
11611
11536
  contextWindow: 400000,
11612
- maxTokens: 128000,
11537
+ maxTokens: 100000,
11613
11538
  },
11614
11539
  "openai/gpt-5.2": {
11615
11540
  id: "openai/gpt-5.2",
@@ -11645,7 +11570,7 @@ export const MODELS = {
11645
11570
  cacheWrite: 0,
11646
11571
  },
11647
11572
  contextWindow: 128000,
11648
- maxTokens: 32000,
11573
+ maxTokens: 16384,
11649
11574
  },
11650
11575
  "openai/gpt-5.2-codex": {
11651
11576
  id: "openai/gpt-5.2-codex",
@@ -12181,8 +12106,8 @@ export const MODELS = {
12181
12106
  cacheRead: 0,
12182
12107
  cacheWrite: 0,
12183
12108
  },
12184
- contextWindow: 131072,
12185
- maxTokens: 8192,
12109
+ contextWindow: 262144,
12110
+ maxTokens: 32768,
12186
12111
  },
12187
12112
  "poolside/laguna-xs.2:free": {
12188
12113
  id: "poolside/laguna-xs.2:free",
@@ -12198,8 +12123,8 @@ export const MODELS = {
12198
12123
  cacheRead: 0,
12199
12124
  cacheWrite: 0,
12200
12125
  },
12201
- contextWindow: 131072,
12202
- maxTokens: 8192,
12126
+ contextWindow: 262144,
12127
+ maxTokens: 32768,
12203
12128
  },
12204
12129
  "prime-intellect/intellect-3": {
12205
12130
  id: "prime-intellect/intellect-3",
@@ -12232,7 +12157,7 @@ export const MODELS = {
12232
12157
  cacheRead: 0,
12233
12158
  cacheWrite: 0,
12234
12159
  },
12235
- contextWindow: 32768,
12160
+ contextWindow: 131072,
12236
12161
  maxTokens: 16384,
12237
12162
  },
12238
12163
  "qwen/qwen-2.5-7b-instruct": {
@@ -12249,7 +12174,7 @@ export const MODELS = {
12249
12174
  cacheRead: 0,
12250
12175
  cacheWrite: 0,
12251
12176
  },
12252
- contextWindow: 32768,
12177
+ contextWindow: 131072,
12253
12178
  maxTokens: 32768,
12254
12179
  },
12255
12180
  "qwen/qwen-plus": {
@@ -12281,7 +12206,7 @@ export const MODELS = {
12281
12206
  input: 0.26,
12282
12207
  output: 0.78,
12283
12208
  cacheRead: 0,
12284
- cacheWrite: 0.325,
12209
+ cacheWrite: 0,
12285
12210
  },
12286
12211
  contextWindow: 1000000,
12287
12212
  maxTokens: 32768,
@@ -12317,7 +12242,7 @@ export const MODELS = {
12317
12242
  cacheRead: 0,
12318
12243
  cacheWrite: 0,
12319
12244
  },
12320
- contextWindow: 40960,
12245
+ contextWindow: 131702,
12321
12246
  maxTokens: 40960,
12322
12247
  },
12323
12248
  "qwen/qwen3-235b-a22b": {
@@ -12368,7 +12293,7 @@ export const MODELS = {
12368
12293
  cacheRead: 0,
12369
12294
  cacheWrite: 0,
12370
12295
  },
12371
- contextWindow: 131072,
12296
+ contextWindow: 262144,
12372
12297
  maxTokens: 4096,
12373
12298
  },
12374
12299
  "qwen/qwen3-30b-a3b": {
@@ -12385,7 +12310,7 @@ export const MODELS = {
12385
12310
  cacheRead: 0,
12386
12311
  cacheWrite: 0,
12387
12312
  },
12388
- contextWindow: 40960,
12313
+ contextWindow: 131072,
12389
12314
  maxTokens: 20000,
12390
12315
  },
12391
12316
  "qwen/qwen3-30b-a3b-instruct-2507": {
@@ -12436,7 +12361,7 @@ export const MODELS = {
12436
12361
  cacheRead: 0,
12437
12362
  cacheWrite: 0,
12438
12363
  },
12439
- contextWindow: 40960,
12364
+ contextWindow: 131072,
12440
12365
  maxTokens: 16384,
12441
12366
  },
12442
12367
  "qwen/qwen3-8b": {
@@ -12453,7 +12378,7 @@ export const MODELS = {
12453
12378
  cacheRead: 0.049999999999999996,
12454
12379
  cacheWrite: 0,
12455
12380
  },
12456
- contextWindow: 40960,
12381
+ contextWindow: 131072,
12457
12382
  maxTokens: 8192,
12458
12383
  },
12459
12384
  "qwen/qwen3-coder": {
@@ -12470,7 +12395,7 @@ export const MODELS = {
12470
12395
  cacheRead: 0,
12471
12396
  cacheWrite: 0,
12472
12397
  },
12473
- contextWindow: 262144,
12398
+ contextWindow: 1048576,
12474
12399
  maxTokens: 65536,
12475
12400
  },
12476
12401
  "qwen/qwen3-coder-30b-a3b-instruct": {
@@ -12555,7 +12480,7 @@ export const MODELS = {
12555
12480
  cacheRead: 0,
12556
12481
  cacheWrite: 0,
12557
12482
  },
12558
- contextWindow: 262000,
12483
+ contextWindow: 1048576,
12559
12484
  maxTokens: 262000,
12560
12485
  },
12561
12486
  "qwen/qwen3-max": {
@@ -12640,7 +12565,7 @@ export const MODELS = {
12640
12565
  cacheRead: 0,
12641
12566
  cacheWrite: 0,
12642
12567
  },
12643
- contextWindow: 131072,
12568
+ contextWindow: 262144,
12644
12569
  maxTokens: 32768,
12645
12570
  },
12646
12571
  "qwen/qwen3-vl-235b-a22b-instruct": {
@@ -12691,7 +12616,7 @@ export const MODELS = {
12691
12616
  cacheRead: 0,
12692
12617
  cacheWrite: 0,
12693
12618
  },
12694
- contextWindow: 131072,
12619
+ contextWindow: 262144,
12695
12620
  maxTokens: 32768,
12696
12621
  },
12697
12622
  "qwen/qwen3-vl-30b-a3b-thinking": {
@@ -12725,7 +12650,7 @@ export const MODELS = {
12725
12650
  cacheRead: 0,
12726
12651
  cacheWrite: 0,
12727
12652
  },
12728
- contextWindow: 131072,
12653
+ contextWindow: 262144,
12729
12654
  maxTokens: 32768,
12730
12655
  },
12731
12656
  "qwen/qwen3-vl-8b-instruct": {
@@ -12742,7 +12667,7 @@ export const MODELS = {
12742
12667
  cacheRead: 0,
12743
12668
  cacheWrite: 0,
12744
12669
  },
12745
- contextWindow: 131072,
12670
+ contextWindow: 256000,
12746
12671
  maxTokens: 32768,
12747
12672
  },
12748
12673
  "qwen/qwen3-vl-8b-thinking": {
@@ -12759,7 +12684,7 @@ export const MODELS = {
12759
12684
  cacheRead: 0,
12760
12685
  cacheWrite: 0,
12761
12686
  },
12762
- contextWindow: 131072,
12687
+ contextWindow: 256000,
12763
12688
  maxTokens: 32768,
12764
12689
  },
12765
12690
  "qwen/qwen3.5-122b-a10b": {
@@ -12777,7 +12702,7 @@ export const MODELS = {
12777
12702
  cacheWrite: 0,
12778
12703
  },
12779
12704
  contextWindow: 262144,
12780
- maxTokens: 65536,
12705
+ maxTokens: 262144,
12781
12706
  },
12782
12707
  "qwen/qwen3.5-27b": {
12783
12708
  id: "qwen/qwen3.5-27b",
@@ -12805,13 +12730,13 @@ export const MODELS = {
12805
12730
  reasoning: true,
12806
12731
  input: ["text", "image"],
12807
12732
  cost: {
12808
- input: 0.14,
12733
+ input: 0.13899999999999998,
12809
12734
  output: 1,
12810
- cacheRead: 0.049999999999999996,
12735
+ cacheRead: 0,
12811
12736
  cacheWrite: 0,
12812
12737
  },
12813
12738
  contextWindow: 262144,
12814
- maxTokens: 81920,
12739
+ maxTokens: 4096,
12815
12740
  },
12816
12741
  "qwen/qwen3.5-397b-a17b": {
12817
12742
  id: "qwen/qwen3.5-397b-a17b",
@@ -12824,7 +12749,7 @@ export const MODELS = {
12824
12749
  cost: {
12825
12750
  input: 0.39,
12826
12751
  output: 2.34,
12827
- cacheRead: 0.195,
12752
+ cacheRead: 0,
12828
12753
  cacheWrite: 0,
12829
12754
  },
12830
12755
  contextWindow: 262144,
@@ -12859,7 +12784,7 @@ export const MODELS = {
12859
12784
  input: 0.065,
12860
12785
  output: 0.26,
12861
12786
  cacheRead: 0,
12862
- cacheWrite: 0.08125,
12787
+ cacheWrite: 0,
12863
12788
  },
12864
12789
  contextWindow: 1000000,
12865
12790
  maxTokens: 65536,
@@ -12876,7 +12801,7 @@ export const MODELS = {
12876
12801
  input: 0.26,
12877
12802
  output: 1.56,
12878
12803
  cacheRead: 0,
12879
- cacheWrite: 0.325,
12804
+ cacheWrite: 0,
12880
12805
  },
12881
12806
  contextWindow: 1000000,
12882
12807
  maxTokens: 65536,
@@ -12893,7 +12818,7 @@ export const MODELS = {
12893
12818
  input: 0.3,
12894
12819
  output: 1.7999999999999998,
12895
12820
  cacheRead: 0,
12896
- cacheWrite: 0,
12821
+ cacheWrite: 0.375,
12897
12822
  },
12898
12823
  contextWindow: 1000000,
12899
12824
  maxTokens: 65536,
@@ -12907,13 +12832,13 @@ export const MODELS = {
12907
12832
  reasoning: true,
12908
12833
  input: ["text", "image"],
12909
12834
  cost: {
12910
- input: 0.32,
12835
+ input: 0.29,
12911
12836
  output: 3.1999999999999997,
12912
12837
  cacheRead: 0,
12913
12838
  cacheWrite: 0,
12914
12839
  },
12915
12840
  contextWindow: 262144,
12916
- maxTokens: 81920,
12841
+ maxTokens: 262140,
12917
12842
  },
12918
12843
  "qwen/qwen3.6-35b-a3b": {
12919
12844
  id: "qwen/qwen3.6-35b-a3b",
@@ -12924,13 +12849,13 @@ export const MODELS = {
12924
12849
  reasoning: true,
12925
12850
  input: ["text", "image"],
12926
12851
  cost: {
12927
- input: 0.15,
12852
+ input: 0.14,
12928
12853
  output: 1,
12929
- cacheRead: 0.049999999999999996,
12854
+ cacheRead: 0,
12930
12855
  cacheWrite: 0,
12931
12856
  },
12932
12857
  contextWindow: 262144,
12933
- maxTokens: 262144,
12858
+ maxTokens: 262140,
12934
12859
  },
12935
12860
  "qwen/qwen3.6-flash": {
12936
12861
  id: "qwen/qwen3.6-flash",
@@ -12983,6 +12908,23 @@ export const MODELS = {
12983
12908
  contextWindow: 1000000,
12984
12909
  maxTokens: 65536,
12985
12910
  },
12911
+ "qwen/qwen3.7-max": {
12912
+ id: "qwen/qwen3.7-max",
12913
+ name: "Qwen: Qwen3.7 Max",
12914
+ api: "openai-completions",
12915
+ provider: "openrouter",
12916
+ baseUrl: "https://openrouter.ai/api/v1",
12917
+ reasoning: true,
12918
+ input: ["text"],
12919
+ cost: {
12920
+ input: 1.25,
12921
+ output: 3.75,
12922
+ cacheRead: 0.25,
12923
+ cacheWrite: 1.5625,
12924
+ },
12925
+ contextWindow: 1000000,
12926
+ maxTokens: 65536,
12927
+ },
12986
12928
  "rekaai/reka-edge": {
12987
12929
  id: "rekaai/reka-edge",
12988
12930
  name: "Reka Edge",
@@ -13060,13 +13002,30 @@ export const MODELS = {
13060
13002
  reasoning: true,
13061
13003
  input: ["text"],
13062
13004
  cost: {
13063
- input: 0.09999999999999999,
13005
+ input: 0.09,
13064
13006
  output: 0.3,
13065
- cacheRead: 0,
13007
+ cacheRead: 0.02,
13066
13008
  cacheWrite: 0,
13067
13009
  },
13068
13010
  contextWindow: 262144,
13069
- maxTokens: 65536,
13011
+ maxTokens: 16384,
13012
+ },
13013
+ "stepfun/step-3.7-flash": {
13014
+ id: "stepfun/step-3.7-flash",
13015
+ name: "StepFun: Step 3.7 Flash",
13016
+ api: "openai-completions",
13017
+ provider: "openrouter",
13018
+ baseUrl: "https://openrouter.ai/api/v1",
13019
+ reasoning: true,
13020
+ input: ["text", "image"],
13021
+ cost: {
13022
+ input: 0.19999999999999998,
13023
+ output: 1.15,
13024
+ cacheRead: 0.04,
13025
+ cacheWrite: 0,
13026
+ },
13027
+ contextWindow: 256000,
13028
+ maxTokens: 256000,
13070
13029
  },
13071
13030
  "tencent/hy3-preview": {
13072
13031
  id: "tencent/hy3-preview",
@@ -13077,13 +13036,13 @@ export const MODELS = {
13077
13036
  reasoning: true,
13078
13037
  input: ["text"],
13079
13038
  cost: {
13080
- input: 0.06599999999999999,
13081
- output: 0.26,
13082
- cacheRead: 0.029,
13039
+ input: 0.063,
13040
+ output: 0.21,
13041
+ cacheRead: 0.020999999999999998,
13083
13042
  cacheWrite: 0,
13084
13043
  },
13085
13044
  contextWindow: 262144,
13086
- maxTokens: 262144,
13045
+ maxTokens: 4096,
13087
13046
  },
13088
13047
  "thedrummer/rocinante-12b": {
13089
13048
  id: "thedrummer/rocinante-12b",
@@ -13136,125 +13095,6 @@ export const MODELS = {
13136
13095
  contextWindow: 128000,
13137
13096
  maxTokens: 4096,
13138
13097
  },
13139
- "x-ai/grok-3": {
13140
- id: "x-ai/grok-3",
13141
- name: "xAI: Grok 3",
13142
- api: "openai-completions",
13143
- provider: "openrouter",
13144
- baseUrl: "https://openrouter.ai/api/v1",
13145
- reasoning: false,
13146
- input: ["text"],
13147
- cost: {
13148
- input: 3,
13149
- output: 15,
13150
- cacheRead: 0.75,
13151
- cacheWrite: 0,
13152
- },
13153
- contextWindow: 131072,
13154
- maxTokens: 4096,
13155
- },
13156
- "x-ai/grok-3-beta": {
13157
- id: "x-ai/grok-3-beta",
13158
- name: "xAI: Grok 3 Beta",
13159
- api: "openai-completions",
13160
- provider: "openrouter",
13161
- baseUrl: "https://openrouter.ai/api/v1",
13162
- reasoning: false,
13163
- input: ["text"],
13164
- cost: {
13165
- input: 3,
13166
- output: 15,
13167
- cacheRead: 0.75,
13168
- cacheWrite: 0,
13169
- },
13170
- contextWindow: 131072,
13171
- maxTokens: 4096,
13172
- },
13173
- "x-ai/grok-3-mini": {
13174
- id: "x-ai/grok-3-mini",
13175
- name: "xAI: Grok 3 Mini",
13176
- api: "openai-completions",
13177
- provider: "openrouter",
13178
- baseUrl: "https://openrouter.ai/api/v1",
13179
- reasoning: true,
13180
- input: ["text"],
13181
- cost: {
13182
- input: 0.3,
13183
- output: 0.5,
13184
- cacheRead: 0.075,
13185
- cacheWrite: 0,
13186
- },
13187
- contextWindow: 131072,
13188
- maxTokens: 4096,
13189
- },
13190
- "x-ai/grok-3-mini-beta": {
13191
- id: "x-ai/grok-3-mini-beta",
13192
- name: "xAI: Grok 3 Mini Beta",
13193
- api: "openai-completions",
13194
- provider: "openrouter",
13195
- baseUrl: "https://openrouter.ai/api/v1",
13196
- reasoning: true,
13197
- input: ["text"],
13198
- cost: {
13199
- input: 0.3,
13200
- output: 0.5,
13201
- cacheRead: 0.075,
13202
- cacheWrite: 0,
13203
- },
13204
- contextWindow: 131072,
13205
- maxTokens: 4096,
13206
- },
13207
- "x-ai/grok-4": {
13208
- id: "x-ai/grok-4",
13209
- name: "xAI: Grok 4",
13210
- api: "openai-completions",
13211
- provider: "openrouter",
13212
- baseUrl: "https://openrouter.ai/api/v1",
13213
- reasoning: true,
13214
- input: ["text", "image"],
13215
- cost: {
13216
- input: 3,
13217
- output: 15,
13218
- cacheRead: 0.75,
13219
- cacheWrite: 0,
13220
- },
13221
- contextWindow: 256000,
13222
- maxTokens: 4096,
13223
- },
13224
- "x-ai/grok-4-fast": {
13225
- id: "x-ai/grok-4-fast",
13226
- name: "xAI: Grok 4 Fast",
13227
- api: "openai-completions",
13228
- provider: "openrouter",
13229
- baseUrl: "https://openrouter.ai/api/v1",
13230
- reasoning: true,
13231
- input: ["text", "image"],
13232
- cost: {
13233
- input: 0.19999999999999998,
13234
- output: 0.5,
13235
- cacheRead: 0.049999999999999996,
13236
- cacheWrite: 0,
13237
- },
13238
- contextWindow: 2000000,
13239
- maxTokens: 30000,
13240
- },
13241
- "x-ai/grok-4.1-fast": {
13242
- id: "x-ai/grok-4.1-fast",
13243
- name: "xAI: Grok 4.1 Fast",
13244
- api: "openai-completions",
13245
- provider: "openrouter",
13246
- baseUrl: "https://openrouter.ai/api/v1",
13247
- reasoning: true,
13248
- input: ["text", "image"],
13249
- cost: {
13250
- input: 0.19999999999999998,
13251
- output: 0.5,
13252
- cacheRead: 0.049999999999999996,
13253
- cacheWrite: 0,
13254
- },
13255
- contextWindow: 2000000,
13256
- maxTokens: 30000,
13257
- },
13258
13098
  "x-ai/grok-4.20": {
13259
13099
  id: "x-ai/grok-4.20",
13260
13100
  name: "xAI: Grok 4.20",
@@ -13289,22 +13129,22 @@ export const MODELS = {
13289
13129
  contextWindow: 1000000,
13290
13130
  maxTokens: 4096,
13291
13131
  },
13292
- "x-ai/grok-code-fast-1": {
13293
- id: "x-ai/grok-code-fast-1",
13294
- name: "xAI: Grok Code Fast 1",
13132
+ "x-ai/grok-build-0.1": {
13133
+ id: "x-ai/grok-build-0.1",
13134
+ name: "xAI: Grok Build 0.1",
13295
13135
  api: "openai-completions",
13296
13136
  provider: "openrouter",
13297
13137
  baseUrl: "https://openrouter.ai/api/v1",
13298
13138
  reasoning: true,
13299
- input: ["text"],
13139
+ input: ["text", "image"],
13300
13140
  cost: {
13301
- input: 0.19999999999999998,
13302
- output: 1.5,
13303
- cacheRead: 0.02,
13141
+ input: 1,
13142
+ output: 2,
13143
+ cacheRead: 0.19999999999999998,
13304
13144
  cacheWrite: 0,
13305
13145
  },
13306
13146
  contextWindow: 256000,
13307
- maxTokens: 10000,
13147
+ maxTokens: 4096,
13308
13148
  },
13309
13149
  "xiaomi/mimo-v2-flash": {
13310
13150
  id: "xiaomi/mimo-v2-flash",
@@ -13366,9 +13206,9 @@ export const MODELS = {
13366
13206
  reasoning: true,
13367
13207
  input: ["text", "image"],
13368
13208
  cost: {
13369
- input: 0.39999999999999997,
13370
- output: 2,
13371
- cacheRead: 0.08,
13209
+ input: 0.14,
13210
+ output: 0.28,
13211
+ cacheRead: 0.0028,
13372
13212
  cacheWrite: 0,
13373
13213
  },
13374
13214
  contextWindow: 1048576,
@@ -13383,13 +13223,13 @@ export const MODELS = {
13383
13223
  reasoning: true,
13384
13224
  input: ["text"],
13385
13225
  cost: {
13386
- input: 1,
13387
- output: 3,
13388
- cacheRead: 0.19999999999999998,
13226
+ input: 0.435,
13227
+ output: 0.87,
13228
+ cacheRead: 0.0036,
13389
13229
  cacheWrite: 0,
13390
13230
  },
13391
13231
  contextWindow: 1048576,
13392
- maxTokens: 16384,
13232
+ maxTokens: 131072,
13393
13233
  },
13394
13234
  "z-ai/glm-4-32b": {
13395
13235
  id: "z-ai/glm-4-32b",
@@ -13434,13 +13274,13 @@ export const MODELS = {
13434
13274
  reasoning: true,
13435
13275
  input: ["text"],
13436
13276
  cost: {
13437
- input: 0.13,
13277
+ input: 0.125,
13438
13278
  output: 0.85,
13439
- cacheRead: 0.024999999999999998,
13279
+ cacheRead: 0.06,
13440
13280
  cacheWrite: 0,
13441
13281
  },
13442
13282
  contextWindow: 131072,
13443
- maxTokens: 98304,
13283
+ maxTokens: 131070,
13444
13284
  },
13445
13285
  "z-ai/glm-4.5-air:free": {
13446
13286
  id: "z-ai/glm-4.5-air:free",
@@ -13672,9 +13512,9 @@ export const MODELS = {
13672
13512
  reasoning: true,
13673
13513
  input: ["text", "image"],
13674
13514
  cost: {
13675
- input: 0.5,
13676
- output: 3,
13677
- cacheRead: 0.049999999999999996,
13515
+ input: 1.5,
13516
+ output: 9,
13517
+ cacheRead: 0.15,
13678
13518
  cacheWrite: 0.08333333333333334,
13679
13519
  },
13680
13520
  contextWindow: 1048576,
@@ -13711,7 +13551,7 @@ export const MODELS = {
13711
13551
  cacheRead: 0.25,
13712
13552
  cacheWrite: 0,
13713
13553
  },
13714
- contextWindow: 262142,
13554
+ contextWindow: 262144,
13715
13555
  maxTokens: 262142,
13716
13556
  },
13717
13557
  "~openai/gpt-latest": {
@@ -13882,6 +13722,25 @@ export const MODELS = {
13882
13722
  contextWindow: 1000000,
13883
13723
  maxTokens: 500000,
13884
13724
  },
13725
+ "Qwen/Qwen3.7-Max": {
13726
+ id: "Qwen/Qwen3.7-Max",
13727
+ name: "Qwen3.7 Max",
13728
+ api: "openai-completions",
13729
+ provider: "together",
13730
+ baseUrl: "https://api.together.ai/v1",
13731
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13732
+ reasoning: true,
13733
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13734
+ input: ["text"],
13735
+ cost: {
13736
+ input: 2.5,
13737
+ output: 7.5,
13738
+ cacheRead: 0,
13739
+ cacheWrite: 0,
13740
+ },
13741
+ contextWindow: 1000000,
13742
+ maxTokens: 500000,
13743
+ },
13885
13744
  "deepseek-ai/DeepSeek-V3": {
13886
13745
  id: "deepseek-ai/DeepSeek-V3",
13887
13746
  name: "DeepSeek V3",
@@ -14378,6 +14237,23 @@ export const MODELS = {
14378
14237
  contextWindow: 1000000,
14379
14238
  maxTokens: 64000,
14380
14239
  },
14240
+ "alibaba/qwen3.7-max": {
14241
+ id: "alibaba/qwen3.7-max",
14242
+ name: "Qwen 3.7 Max",
14243
+ api: "anthropic-messages",
14244
+ provider: "vercel-ai-gateway",
14245
+ baseUrl: "https://ai-gateway.vercel.sh",
14246
+ reasoning: true,
14247
+ input: ["text", "image"],
14248
+ cost: {
14249
+ input: 1.25,
14250
+ output: 3.75,
14251
+ cacheRead: 0.25,
14252
+ cacheWrite: 1.5625,
14253
+ },
14254
+ contextWindow: 991000,
14255
+ maxTokens: 64000,
14256
+ },
14381
14257
  "anthropic/claude-3-haiku": {
14382
14258
  id: "anthropic/claude-3-haiku",
14383
14259
  name: "Claude 3 Haiku",
@@ -14516,6 +14392,23 @@ export const MODELS = {
14516
14392
  contextWindow: 1000000,
14517
14393
  maxTokens: 128000,
14518
14394
  },
14395
+ "anthropic/claude-opus-4.8": {
14396
+ id: "anthropic/claude-opus-4.8",
14397
+ name: "Claude Opus 4.8",
14398
+ api: "anthropic-messages",
14399
+ provider: "vercel-ai-gateway",
14400
+ baseUrl: "https://ai-gateway.vercel.sh",
14401
+ reasoning: true,
14402
+ input: ["text", "image"],
14403
+ cost: {
14404
+ input: 5,
14405
+ output: 25,
14406
+ cacheRead: 0.5,
14407
+ cacheWrite: 6.25,
14408
+ },
14409
+ contextWindow: 1000000,
14410
+ maxTokens: 128000,
14411
+ },
14519
14412
  "anthropic/claude-sonnet-4": {
14520
14413
  id: "anthropic/claude-sonnet-4",
14521
14414
  name: "Claude Sonnet 4",
@@ -14941,13 +14834,30 @@ export const MODELS = {
14941
14834
  contextWindow: 1000000,
14942
14835
  maxTokens: 64000,
14943
14836
  },
14944
- "google/gemma-4-26b-a4b-it": {
14945
- id: "google/gemma-4-26b-a4b-it",
14946
- name: "Gemma 4 26B A4B IT",
14837
+ "google/gemini-3.5-flash": {
14838
+ id: "google/gemini-3.5-flash",
14839
+ name: "Gemini 3.5 Flash",
14947
14840
  api: "anthropic-messages",
14948
14841
  provider: "vercel-ai-gateway",
14949
14842
  baseUrl: "https://ai-gateway.vercel.sh",
14950
- reasoning: false,
14843
+ reasoning: true,
14844
+ input: ["text", "image"],
14845
+ cost: {
14846
+ input: 1.5,
14847
+ output: 9,
14848
+ cacheRead: 0.15,
14849
+ cacheWrite: 0,
14850
+ },
14851
+ contextWindow: 1000000,
14852
+ maxTokens: 64000,
14853
+ },
14854
+ "google/gemma-4-26b-a4b-it": {
14855
+ id: "google/gemma-4-26b-a4b-it",
14856
+ name: "Gemma 4 26B A4B IT",
14857
+ api: "anthropic-messages",
14858
+ provider: "vercel-ai-gateway",
14859
+ baseUrl: "https://ai-gateway.vercel.sh",
14860
+ reasoning: false,
14951
14861
  input: ["text", "image"],
14952
14862
  cost: {
14953
14863
  input: 0.13,
@@ -15249,7 +15159,7 @@ export const MODELS = {
15249
15159
  },
15250
15160
  "minimax/minimax-m2.7": {
15251
15161
  id: "minimax/minimax-m2.7",
15252
- name: "Minimax M2.7",
15162
+ name: "MiniMax M2.7",
15253
15163
  api: "anthropic-messages",
15254
15164
  provider: "vercel-ai-gateway",
15255
15165
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -15400,6 +15310,23 @@ export const MODELS = {
15400
15310
  contextWindow: 128000,
15401
15311
  maxTokens: 64000,
15402
15312
  },
15313
+ "mistral/mistral-medium-3.5": {
15314
+ id: "mistral/mistral-medium-3.5",
15315
+ name: "Mistral Medium Latest",
15316
+ api: "anthropic-messages",
15317
+ provider: "vercel-ai-gateway",
15318
+ baseUrl: "https://ai-gateway.vercel.sh",
15319
+ reasoning: true,
15320
+ input: ["text"],
15321
+ cost: {
15322
+ input: 1.5,
15323
+ output: 7.5,
15324
+ cacheRead: 0,
15325
+ cacheWrite: 0,
15326
+ },
15327
+ contextWindow: 256000,
15328
+ maxTokens: 256000,
15329
+ },
15403
15330
  "mistral/mistral-small": {
15404
15331
  id: "mistral/mistral-small",
15405
15332
  name: "Mistral Small",
@@ -16262,125 +16189,6 @@ export const MODELS = {
16262
16189
  contextWindow: 200000,
16263
16190
  maxTokens: 8000,
16264
16191
  },
16265
- "xai/grok-3": {
16266
- id: "xai/grok-3",
16267
- name: "Grok 3 Beta",
16268
- api: "anthropic-messages",
16269
- provider: "vercel-ai-gateway",
16270
- baseUrl: "https://ai-gateway.vercel.sh",
16271
- reasoning: false,
16272
- input: ["text"],
16273
- cost: {
16274
- input: 3,
16275
- output: 15,
16276
- cacheRead: 0.75,
16277
- cacheWrite: 0,
16278
- },
16279
- contextWindow: 131072,
16280
- maxTokens: 131072,
16281
- },
16282
- "xai/grok-3-fast": {
16283
- id: "xai/grok-3-fast",
16284
- name: "Grok 3 Fast Beta",
16285
- api: "anthropic-messages",
16286
- provider: "vercel-ai-gateway",
16287
- baseUrl: "https://ai-gateway.vercel.sh",
16288
- reasoning: false,
16289
- input: ["text"],
16290
- cost: {
16291
- input: 5,
16292
- output: 25,
16293
- cacheRead: 1.25,
16294
- cacheWrite: 0,
16295
- },
16296
- contextWindow: 131072,
16297
- maxTokens: 131072,
16298
- },
16299
- "xai/grok-3-mini": {
16300
- id: "xai/grok-3-mini",
16301
- name: "Grok 3 Mini Beta",
16302
- api: "anthropic-messages",
16303
- provider: "vercel-ai-gateway",
16304
- baseUrl: "https://ai-gateway.vercel.sh",
16305
- reasoning: false,
16306
- input: ["text"],
16307
- cost: {
16308
- input: 0.3,
16309
- output: 0.5,
16310
- cacheRead: 0.075,
16311
- cacheWrite: 0,
16312
- },
16313
- contextWindow: 131072,
16314
- maxTokens: 131072,
16315
- },
16316
- "xai/grok-3-mini-fast": {
16317
- id: "xai/grok-3-mini-fast",
16318
- name: "Grok 3 Mini Fast Beta",
16319
- api: "anthropic-messages",
16320
- provider: "vercel-ai-gateway",
16321
- baseUrl: "https://ai-gateway.vercel.sh",
16322
- reasoning: false,
16323
- input: ["text"],
16324
- cost: {
16325
- input: 0.6,
16326
- output: 4,
16327
- cacheRead: 0,
16328
- cacheWrite: 0,
16329
- },
16330
- contextWindow: 131072,
16331
- maxTokens: 131072,
16332
- },
16333
- "xai/grok-4": {
16334
- id: "xai/grok-4",
16335
- name: "Grok 4",
16336
- api: "anthropic-messages",
16337
- provider: "vercel-ai-gateway",
16338
- baseUrl: "https://ai-gateway.vercel.sh",
16339
- reasoning: true,
16340
- input: ["text", "image"],
16341
- cost: {
16342
- input: 3,
16343
- output: 15,
16344
- cacheRead: 0.75,
16345
- cacheWrite: 0,
16346
- },
16347
- contextWindow: 256000,
16348
- maxTokens: 256000,
16349
- },
16350
- "xai/grok-4-fast-non-reasoning": {
16351
- id: "xai/grok-4-fast-non-reasoning",
16352
- name: "Grok 4 Fast Non-Reasoning",
16353
- api: "anthropic-messages",
16354
- provider: "vercel-ai-gateway",
16355
- baseUrl: "https://ai-gateway.vercel.sh",
16356
- reasoning: false,
16357
- input: ["text", "image"],
16358
- cost: {
16359
- input: 0.19999999999999998,
16360
- output: 0.5,
16361
- cacheRead: 0.049999999999999996,
16362
- cacheWrite: 0,
16363
- },
16364
- contextWindow: 2000000,
16365
- maxTokens: 256000,
16366
- },
16367
- "xai/grok-4-fast-reasoning": {
16368
- id: "xai/grok-4-fast-reasoning",
16369
- name: "Grok 4 Fast Reasoning",
16370
- api: "anthropic-messages",
16371
- provider: "vercel-ai-gateway",
16372
- baseUrl: "https://ai-gateway.vercel.sh",
16373
- reasoning: true,
16374
- input: ["text", "image"],
16375
- cost: {
16376
- input: 0.19999999999999998,
16377
- output: 0.5,
16378
- cacheRead: 0.049999999999999996,
16379
- cacheWrite: 0,
16380
- },
16381
- contextWindow: 2000000,
16382
- maxTokens: 256000,
16383
- },
16384
16192
  "xai/grok-4.1-fast-non-reasoning": {
16385
16193
  id: "xai/grok-4.1-fast-non-reasoning",
16386
16194
  name: "Grok 4.1 Fast Non-Reasoning",
@@ -16395,8 +16203,8 @@ export const MODELS = {
16395
16203
  cacheRead: 0.049999999999999996,
16396
16204
  cacheWrite: 0,
16397
16205
  },
16398
- contextWindow: 2000000,
16399
- maxTokens: 30000,
16206
+ contextWindow: 1000000,
16207
+ maxTokens: 1000000,
16400
16208
  },
16401
16209
  "xai/grok-4.1-fast-reasoning": {
16402
16210
  id: "xai/grok-4.1-fast-reasoning",
@@ -16412,8 +16220,8 @@ export const MODELS = {
16412
16220
  cacheRead: 0.049999999999999996,
16413
16221
  cacheWrite: 0,
16414
16222
  },
16415
- contextWindow: 2000000,
16416
- maxTokens: 30000,
16223
+ contextWindow: 1000000,
16224
+ maxTokens: 1000000,
16417
16225
  },
16418
16226
  "xai/grok-4.20-multi-agent": {
16419
16227
  id: "xai/grok-4.20-multi-agent",
@@ -16534,18 +16342,18 @@ export const MODELS = {
16534
16342
  contextWindow: 1000000,
16535
16343
  maxTokens: 1000000,
16536
16344
  },
16537
- "xai/grok-code-fast-1": {
16538
- id: "xai/grok-code-fast-1",
16539
- name: "Grok Code Fast 1",
16345
+ "xai/grok-build-0.1": {
16346
+ id: "xai/grok-build-0.1",
16347
+ name: "Grok Build 0.1",
16540
16348
  api: "anthropic-messages",
16541
16349
  provider: "vercel-ai-gateway",
16542
16350
  baseUrl: "https://ai-gateway.vercel.sh",
16543
16351
  reasoning: true,
16544
- input: ["text"],
16352
+ input: ["text", "image"],
16545
16353
  cost: {
16546
- input: 0.19999999999999998,
16547
- output: 1.5,
16548
- cacheRead: 0.02,
16354
+ input: 1,
16355
+ output: 2,
16356
+ cacheRead: 0.19999999999999998,
16549
16357
  cacheWrite: 0,
16550
16358
  },
16551
16359
  contextWindow: 256000,
@@ -16594,9 +16402,9 @@ export const MODELS = {
16594
16402
  reasoning: true,
16595
16403
  input: ["text", "image"],
16596
16404
  cost: {
16597
- input: 0.39999999999999997,
16598
- output: 2,
16599
- cacheRead: 0.08,
16405
+ input: 0.14,
16406
+ output: 0.28,
16407
+ cacheRead: 0.0028,
16600
16408
  cacheWrite: 0,
16601
16409
  },
16602
16410
  contextWindow: 1050000,
@@ -16611,9 +16419,9 @@ export const MODELS = {
16611
16419
  reasoning: true,
16612
16420
  input: ["text", "image"],
16613
16421
  cost: {
16614
- input: 1,
16615
- output: 3,
16616
- cacheRead: 0.19999999999999998,
16422
+ input: 0.435,
16423
+ output: 0.87,
16424
+ cacheRead: 0.0036,
16617
16425
  cacheWrite: 0,
16618
16426
  },
16619
16427
  contextWindow: 1050000,
@@ -16842,329 +16650,6 @@ export const MODELS = {
16842
16650
  },
16843
16651
  },
16844
16652
  "xai": {
16845
- "grok-2": {
16846
- id: "grok-2",
16847
- name: "Grok 2",
16848
- api: "openai-completions",
16849
- provider: "xai",
16850
- baseUrl: "https://api.x.ai/v1",
16851
- reasoning: false,
16852
- input: ["text"],
16853
- cost: {
16854
- input: 2,
16855
- output: 10,
16856
- cacheRead: 2,
16857
- cacheWrite: 0,
16858
- },
16859
- contextWindow: 131072,
16860
- maxTokens: 8192,
16861
- },
16862
- "grok-2-1212": {
16863
- id: "grok-2-1212",
16864
- name: "Grok 2 (1212)",
16865
- api: "openai-completions",
16866
- provider: "xai",
16867
- baseUrl: "https://api.x.ai/v1",
16868
- reasoning: false,
16869
- input: ["text"],
16870
- cost: {
16871
- input: 2,
16872
- output: 10,
16873
- cacheRead: 2,
16874
- cacheWrite: 0,
16875
- },
16876
- contextWindow: 131072,
16877
- maxTokens: 8192,
16878
- },
16879
- "grok-2-latest": {
16880
- id: "grok-2-latest",
16881
- name: "Grok 2 Latest",
16882
- api: "openai-completions",
16883
- provider: "xai",
16884
- baseUrl: "https://api.x.ai/v1",
16885
- reasoning: false,
16886
- input: ["text"],
16887
- cost: {
16888
- input: 2,
16889
- output: 10,
16890
- cacheRead: 2,
16891
- cacheWrite: 0,
16892
- },
16893
- contextWindow: 131072,
16894
- maxTokens: 8192,
16895
- },
16896
- "grok-2-vision": {
16897
- id: "grok-2-vision",
16898
- name: "Grok 2 Vision",
16899
- api: "openai-completions",
16900
- provider: "xai",
16901
- baseUrl: "https://api.x.ai/v1",
16902
- reasoning: false,
16903
- input: ["text", "image"],
16904
- cost: {
16905
- input: 2,
16906
- output: 10,
16907
- cacheRead: 2,
16908
- cacheWrite: 0,
16909
- },
16910
- contextWindow: 8192,
16911
- maxTokens: 4096,
16912
- },
16913
- "grok-2-vision-1212": {
16914
- id: "grok-2-vision-1212",
16915
- name: "Grok 2 Vision (1212)",
16916
- api: "openai-completions",
16917
- provider: "xai",
16918
- baseUrl: "https://api.x.ai/v1",
16919
- reasoning: false,
16920
- input: ["text", "image"],
16921
- cost: {
16922
- input: 2,
16923
- output: 10,
16924
- cacheRead: 2,
16925
- cacheWrite: 0,
16926
- },
16927
- contextWindow: 8192,
16928
- maxTokens: 4096,
16929
- },
16930
- "grok-2-vision-latest": {
16931
- id: "grok-2-vision-latest",
16932
- name: "Grok 2 Vision Latest",
16933
- api: "openai-completions",
16934
- provider: "xai",
16935
- baseUrl: "https://api.x.ai/v1",
16936
- reasoning: false,
16937
- input: ["text", "image"],
16938
- cost: {
16939
- input: 2,
16940
- output: 10,
16941
- cacheRead: 2,
16942
- cacheWrite: 0,
16943
- },
16944
- contextWindow: 8192,
16945
- maxTokens: 4096,
16946
- },
16947
- "grok-3": {
16948
- id: "grok-3",
16949
- name: "Grok 3",
16950
- api: "openai-completions",
16951
- provider: "xai",
16952
- baseUrl: "https://api.x.ai/v1",
16953
- reasoning: false,
16954
- input: ["text"],
16955
- cost: {
16956
- input: 3,
16957
- output: 15,
16958
- cacheRead: 0.75,
16959
- cacheWrite: 0,
16960
- },
16961
- contextWindow: 131072,
16962
- maxTokens: 8192,
16963
- },
16964
- "grok-3-fast": {
16965
- id: "grok-3-fast",
16966
- name: "Grok 3 Fast",
16967
- api: "openai-completions",
16968
- provider: "xai",
16969
- baseUrl: "https://api.x.ai/v1",
16970
- reasoning: false,
16971
- input: ["text"],
16972
- cost: {
16973
- input: 5,
16974
- output: 25,
16975
- cacheRead: 1.25,
16976
- cacheWrite: 0,
16977
- },
16978
- contextWindow: 131072,
16979
- maxTokens: 8192,
16980
- },
16981
- "grok-3-fast-latest": {
16982
- id: "grok-3-fast-latest",
16983
- name: "Grok 3 Fast Latest",
16984
- api: "openai-completions",
16985
- provider: "xai",
16986
- baseUrl: "https://api.x.ai/v1",
16987
- reasoning: false,
16988
- input: ["text"],
16989
- cost: {
16990
- input: 5,
16991
- output: 25,
16992
- cacheRead: 1.25,
16993
- cacheWrite: 0,
16994
- },
16995
- contextWindow: 131072,
16996
- maxTokens: 8192,
16997
- },
16998
- "grok-3-latest": {
16999
- id: "grok-3-latest",
17000
- name: "Grok 3 Latest",
17001
- api: "openai-completions",
17002
- provider: "xai",
17003
- baseUrl: "https://api.x.ai/v1",
17004
- reasoning: false,
17005
- input: ["text"],
17006
- cost: {
17007
- input: 3,
17008
- output: 15,
17009
- cacheRead: 0.75,
17010
- cacheWrite: 0,
17011
- },
17012
- contextWindow: 131072,
17013
- maxTokens: 8192,
17014
- },
17015
- "grok-3-mini": {
17016
- id: "grok-3-mini",
17017
- name: "Grok 3 Mini",
17018
- api: "openai-completions",
17019
- provider: "xai",
17020
- baseUrl: "https://api.x.ai/v1",
17021
- reasoning: true,
17022
- input: ["text"],
17023
- cost: {
17024
- input: 0.3,
17025
- output: 0.5,
17026
- cacheRead: 0.075,
17027
- cacheWrite: 0,
17028
- },
17029
- contextWindow: 131072,
17030
- maxTokens: 8192,
17031
- },
17032
- "grok-3-mini-fast": {
17033
- id: "grok-3-mini-fast",
17034
- name: "Grok 3 Mini Fast",
17035
- api: "openai-completions",
17036
- provider: "xai",
17037
- baseUrl: "https://api.x.ai/v1",
17038
- reasoning: true,
17039
- input: ["text"],
17040
- cost: {
17041
- input: 0.6,
17042
- output: 4,
17043
- cacheRead: 0.15,
17044
- cacheWrite: 0,
17045
- },
17046
- contextWindow: 131072,
17047
- maxTokens: 8192,
17048
- },
17049
- "grok-3-mini-fast-latest": {
17050
- id: "grok-3-mini-fast-latest",
17051
- name: "Grok 3 Mini Fast Latest",
17052
- api: "openai-completions",
17053
- provider: "xai",
17054
- baseUrl: "https://api.x.ai/v1",
17055
- reasoning: true,
17056
- input: ["text"],
17057
- cost: {
17058
- input: 0.6,
17059
- output: 4,
17060
- cacheRead: 0.15,
17061
- cacheWrite: 0,
17062
- },
17063
- contextWindow: 131072,
17064
- maxTokens: 8192,
17065
- },
17066
- "grok-3-mini-latest": {
17067
- id: "grok-3-mini-latest",
17068
- name: "Grok 3 Mini Latest",
17069
- api: "openai-completions",
17070
- provider: "xai",
17071
- baseUrl: "https://api.x.ai/v1",
17072
- reasoning: true,
17073
- input: ["text"],
17074
- cost: {
17075
- input: 0.3,
17076
- output: 0.5,
17077
- cacheRead: 0.075,
17078
- cacheWrite: 0,
17079
- },
17080
- contextWindow: 131072,
17081
- maxTokens: 8192,
17082
- },
17083
- "grok-4": {
17084
- id: "grok-4",
17085
- name: "Grok 4",
17086
- api: "openai-completions",
17087
- provider: "xai",
17088
- baseUrl: "https://api.x.ai/v1",
17089
- reasoning: true,
17090
- input: ["text"],
17091
- cost: {
17092
- input: 3,
17093
- output: 15,
17094
- cacheRead: 0.75,
17095
- cacheWrite: 0,
17096
- },
17097
- contextWindow: 256000,
17098
- maxTokens: 64000,
17099
- },
17100
- "grok-4-1-fast": {
17101
- id: "grok-4-1-fast",
17102
- name: "Grok 4.1 Fast",
17103
- api: "openai-completions",
17104
- provider: "xai",
17105
- baseUrl: "https://api.x.ai/v1",
17106
- reasoning: true,
17107
- input: ["text", "image"],
17108
- cost: {
17109
- input: 0.2,
17110
- output: 0.5,
17111
- cacheRead: 0.05,
17112
- cacheWrite: 0,
17113
- },
17114
- contextWindow: 2000000,
17115
- maxTokens: 30000,
17116
- },
17117
- "grok-4-1-fast-non-reasoning": {
17118
- id: "grok-4-1-fast-non-reasoning",
17119
- name: "Grok 4.1 Fast (Non-Reasoning)",
17120
- api: "openai-completions",
17121
- provider: "xai",
17122
- baseUrl: "https://api.x.ai/v1",
17123
- reasoning: false,
17124
- input: ["text", "image"],
17125
- cost: {
17126
- input: 0.2,
17127
- output: 0.5,
17128
- cacheRead: 0.05,
17129
- cacheWrite: 0,
17130
- },
17131
- contextWindow: 2000000,
17132
- maxTokens: 30000,
17133
- },
17134
- "grok-4-fast": {
17135
- id: "grok-4-fast",
17136
- name: "Grok 4 Fast",
17137
- api: "openai-completions",
17138
- provider: "xai",
17139
- baseUrl: "https://api.x.ai/v1",
17140
- reasoning: true,
17141
- input: ["text", "image"],
17142
- cost: {
17143
- input: 0.2,
17144
- output: 0.5,
17145
- cacheRead: 0.05,
17146
- cacheWrite: 0,
17147
- },
17148
- contextWindow: 2000000,
17149
- maxTokens: 30000,
17150
- },
17151
- "grok-4-fast-non-reasoning": {
17152
- id: "grok-4-fast-non-reasoning",
17153
- name: "Grok 4 Fast (Non-Reasoning)",
17154
- api: "openai-completions",
17155
- provider: "xai",
17156
- baseUrl: "https://api.x.ai/v1",
17157
- reasoning: false,
17158
- input: ["text", "image"],
17159
- cost: {
17160
- input: 0.2,
17161
- output: 0.5,
17162
- cacheRead: 0.05,
17163
- cacheWrite: 0,
17164
- },
17165
- contextWindow: 2000000,
17166
- maxTokens: 30000,
17167
- },
17168
16653
  "grok-4.20-0309-non-reasoning": {
17169
16654
  id: "grok-4.20-0309-non-reasoning",
17170
16655
  name: "Grok 4.20 (Non-Reasoning)",
@@ -17174,8 +16659,8 @@ export const MODELS = {
17174
16659
  reasoning: false,
17175
16660
  input: ["text", "image"],
17176
16661
  cost: {
17177
- input: 2,
17178
- output: 6,
16662
+ input: 1.25,
16663
+ output: 2.5,
17179
16664
  cacheRead: 0.2,
17180
16665
  cacheWrite: 0,
17181
16666
  },
@@ -17191,8 +16676,8 @@ export const MODELS = {
17191
16676
  reasoning: true,
17192
16677
  input: ["text", "image"],
17193
16678
  cost: {
17194
- input: 2,
17195
- output: 6,
16679
+ input: 1.25,
16680
+ output: 2.5,
17196
16681
  cacheRead: 0.2,
17197
16682
  cacheWrite: 0,
17198
16683
  },
@@ -17216,22 +16701,22 @@ export const MODELS = {
17216
16701
  contextWindow: 1000000,
17217
16702
  maxTokens: 30000,
17218
16703
  },
17219
- "grok-beta": {
17220
- id: "grok-beta",
17221
- name: "Grok Beta",
16704
+ "grok-build-0.1": {
16705
+ id: "grok-build-0.1",
16706
+ name: "Grok Build 0.1",
17222
16707
  api: "openai-completions",
17223
16708
  provider: "xai",
17224
16709
  baseUrl: "https://api.x.ai/v1",
17225
- reasoning: false,
17226
- input: ["text"],
16710
+ reasoning: true,
16711
+ input: ["text", "image"],
17227
16712
  cost: {
17228
- input: 5,
17229
- output: 15,
17230
- cacheRead: 5,
16713
+ input: 1,
16714
+ output: 2,
16715
+ cacheRead: 0.2,
17231
16716
  cacheWrite: 0,
17232
16717
  },
17233
- contextWindow: 131072,
17234
- maxTokens: 4096,
16718
+ contextWindow: 256000,
16719
+ maxTokens: 256000,
17235
16720
  },
17236
16721
  "grok-code-fast-1": {
17237
16722
  id: "grok-code-fast-1",
@@ -17239,7 +16724,7 @@ export const MODELS = {
17239
16724
  api: "openai-completions",
17240
16725
  provider: "xai",
17241
16726
  baseUrl: "https://api.x.ai/v1",
17242
- reasoning: true,
16727
+ reasoning: false,
17243
16728
  input: ["text"],
17244
16729
  cost: {
17245
16730
  input: 0.2,
@@ -17247,25 +16732,8 @@ export const MODELS = {
17247
16732
  cacheRead: 0.02,
17248
16733
  cacheWrite: 0,
17249
16734
  },
17250
- contextWindow: 256000,
17251
- maxTokens: 10000,
17252
- },
17253
- "grok-vision-beta": {
17254
- id: "grok-vision-beta",
17255
- name: "Grok Vision Beta",
17256
- api: "openai-completions",
17257
- provider: "xai",
17258
- baseUrl: "https://api.x.ai/v1",
17259
- reasoning: false,
17260
- input: ["text", "image"],
17261
- cost: {
17262
- input: 5,
17263
- output: 15,
17264
- cacheRead: 5,
17265
- cacheWrite: 0,
17266
- },
17267
- contextWindow: 8192,
17268
- maxTokens: 4096,
16735
+ contextWindow: 32768,
16736
+ maxTokens: 8192,
17269
16737
  },
17270
16738
  },
17271
16739
  "xiaomi": {