@earendil-works/pi-ai 0.75.3 → 0.75.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (147) hide show
  1. package/dist/api-registry.d.ts +1 -1
  2. package/dist/api-registry.d.ts.map +1 -1
  3. package/dist/api-registry.js.map +1 -1
  4. package/dist/bedrock-provider.d.ts +2 -2
  5. package/dist/bedrock-provider.d.ts.map +1 -1
  6. package/dist/bedrock-provider.js.map +1 -1
  7. package/dist/cli.d.ts.map +1 -1
  8. package/dist/cli.js +14 -0
  9. package/dist/cli.js.map +1 -1
  10. package/dist/env-api-keys.d.ts +1 -1
  11. package/dist/env-api-keys.d.ts.map +1 -1
  12. package/dist/env-api-keys.js +10 -2
  13. package/dist/env-api-keys.js.map +1 -1
  14. package/dist/image-models.d.ts +2 -2
  15. package/dist/image-models.d.ts.map +1 -1
  16. package/dist/image-models.generated.d.ts +15 -0
  17. package/dist/image-models.generated.d.ts.map +1 -1
  18. package/dist/image-models.generated.js +15 -0
  19. package/dist/image-models.generated.js.map +1 -1
  20. package/dist/image-models.js.map +1 -1
  21. package/dist/images-api-registry.d.ts +1 -1
  22. package/dist/images-api-registry.d.ts.map +1 -1
  23. package/dist/images-api-registry.js.map +1 -1
  24. package/dist/images.d.ts +2 -2
  25. package/dist/images.d.ts.map +1 -1
  26. package/dist/images.js.map +1 -1
  27. package/dist/index.d.ts +29 -29
  28. package/dist/index.d.ts.map +1 -1
  29. package/dist/index.js.map +1 -1
  30. package/dist/models.d.ts +2 -2
  31. package/dist/models.d.ts.map +1 -1
  32. package/dist/models.generated.d.ts +317 -509
  33. package/dist/models.generated.d.ts.map +1 -1
  34. package/dist/models.generated.js +400 -620
  35. package/dist/models.generated.js.map +1 -1
  36. package/dist/models.js.map +1 -1
  37. package/dist/oauth.d.ts +1 -1
  38. package/dist/oauth.d.ts.map +1 -1
  39. package/dist/oauth.js.map +1 -1
  40. package/dist/providers/amazon-bedrock.d.ts +1 -1
  41. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  42. package/dist/providers/amazon-bedrock.js +5 -2
  43. package/dist/providers/amazon-bedrock.js.map +1 -1
  44. package/dist/providers/anthropic.d.ts +23 -6
  45. package/dist/providers/anthropic.d.ts.map +1 -1
  46. package/dist/providers/anthropic.js +11 -23
  47. package/dist/providers/anthropic.js.map +1 -1
  48. package/dist/providers/azure-openai-responses.d.ts +1 -1
  49. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  50. package/dist/providers/azure-openai-responses.js +2 -1
  51. package/dist/providers/azure-openai-responses.js.map +1 -1
  52. package/dist/providers/cloudflare.d.ts +1 -1
  53. package/dist/providers/cloudflare.d.ts.map +1 -1
  54. package/dist/providers/cloudflare.js.map +1 -1
  55. package/dist/providers/faux.d.ts +1 -1
  56. package/dist/providers/faux.d.ts.map +1 -1
  57. package/dist/providers/faux.js.map +1 -1
  58. package/dist/providers/github-copilot-headers.d.ts +1 -1
  59. package/dist/providers/github-copilot-headers.d.ts.map +1 -1
  60. package/dist/providers/github-copilot-headers.js.map +1 -1
  61. package/dist/providers/google-shared.d.ts +1 -1
  62. package/dist/providers/google-shared.d.ts.map +1 -1
  63. package/dist/providers/google-shared.js.map +1 -1
  64. package/dist/providers/google-vertex.d.ts +2 -2
  65. package/dist/providers/google-vertex.d.ts.map +1 -1
  66. package/dist/providers/google-vertex.js.map +1 -1
  67. package/dist/providers/google.d.ts +2 -2
  68. package/dist/providers/google.d.ts.map +1 -1
  69. package/dist/providers/google.js.map +1 -1
  70. package/dist/providers/images/openrouter.d.ts +1 -1
  71. package/dist/providers/images/openrouter.d.ts.map +1 -1
  72. package/dist/providers/images/openrouter.js.map +1 -1
  73. package/dist/providers/images/register-builtins.d.ts +1 -1
  74. package/dist/providers/images/register-builtins.d.ts.map +1 -1
  75. package/dist/providers/images/register-builtins.js.map +1 -1
  76. package/dist/providers/mistral.d.ts +1 -1
  77. package/dist/providers/mistral.d.ts.map +1 -1
  78. package/dist/providers/mistral.js.map +1 -1
  79. package/dist/providers/openai-codex-responses.d.ts +1 -1
  80. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  81. package/dist/providers/openai-codex-responses.js +12 -3
  82. package/dist/providers/openai-codex-responses.js.map +1 -1
  83. package/dist/providers/openai-completions.d.ts +1 -1
  84. package/dist/providers/openai-completions.d.ts.map +1 -1
  85. package/dist/providers/openai-completions.js +2 -1
  86. package/dist/providers/openai-completions.js.map +1 -1
  87. package/dist/providers/openai-prompt-cache.d.ts +3 -0
  88. package/dist/providers/openai-prompt-cache.d.ts.map +1 -0
  89. package/dist/providers/openai-prompt-cache.js +10 -0
  90. package/dist/providers/openai-prompt-cache.js.map +1 -0
  91. package/dist/providers/openai-responses-shared.d.ts +2 -2
  92. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  93. package/dist/providers/openai-responses-shared.js.map +1 -1
  94. package/dist/providers/openai-responses.d.ts +1 -1
  95. package/dist/providers/openai-responses.d.ts.map +1 -1
  96. package/dist/providers/openai-responses.js +2 -1
  97. package/dist/providers/openai-responses.js.map +1 -1
  98. package/dist/providers/register-builtins.d.ts +10 -10
  99. package/dist/providers/register-builtins.d.ts.map +1 -1
  100. package/dist/providers/register-builtins.js +13 -2
  101. package/dist/providers/register-builtins.js.map +1 -1
  102. package/dist/providers/simple-options.d.ts +3 -3
  103. package/dist/providers/simple-options.d.ts.map +1 -1
  104. package/dist/providers/simple-options.js +6 -11
  105. package/dist/providers/simple-options.js.map +1 -1
  106. package/dist/providers/transform-messages.d.ts +1 -1
  107. package/dist/providers/transform-messages.d.ts.map +1 -1
  108. package/dist/providers/transform-messages.js.map +1 -1
  109. package/dist/stream.d.ts +3 -3
  110. package/dist/stream.d.ts.map +1 -1
  111. package/dist/stream.js.map +1 -1
  112. package/dist/types.d.ts +13 -3
  113. package/dist/types.d.ts.map +1 -1
  114. package/dist/types.js.map +1 -1
  115. package/dist/utils/event-stream.d.ts +3 -3
  116. package/dist/utils/event-stream.d.ts.map +1 -1
  117. package/dist/utils/event-stream.js +2 -2
  118. package/dist/utils/event-stream.js.map +1 -1
  119. package/dist/utils/oauth/anthropic.d.ts +1 -1
  120. package/dist/utils/oauth/anthropic.d.ts.map +1 -1
  121. package/dist/utils/oauth/anthropic.js.map +1 -1
  122. package/dist/utils/oauth/device-code.d.ts +19 -0
  123. package/dist/utils/oauth/device-code.d.ts.map +1 -0
  124. package/dist/utils/oauth/device-code.js +55 -0
  125. package/dist/utils/oauth/device-code.js.map +1 -0
  126. package/dist/utils/oauth/github-copilot.d.ts +3 -3
  127. package/dist/utils/oauth/github-copilot.d.ts.map +1 -1
  128. package/dist/utils/oauth/github-copilot.js +45 -69
  129. package/dist/utils/oauth/github-copilot.js.map +1 -1
  130. package/dist/utils/oauth/index.d.ts +6 -5
  131. package/dist/utils/oauth/index.d.ts.map +1 -1
  132. package/dist/utils/oauth/index.js +1 -0
  133. package/dist/utils/oauth/index.js.map +1 -1
  134. package/dist/utils/oauth/openai-codex.d.ts +1 -1
  135. package/dist/utils/oauth/openai-codex.d.ts.map +1 -1
  136. package/dist/utils/oauth/openai-codex.js +1 -1
  137. package/dist/utils/oauth/openai-codex.js.map +1 -1
  138. package/dist/utils/oauth/types.d.ts +9 -2
  139. package/dist/utils/oauth/types.d.ts.map +1 -1
  140. package/dist/utils/oauth/types.js.map +1 -1
  141. package/dist/utils/overflow.d.ts +1 -1
  142. package/dist/utils/overflow.d.ts.map +1 -1
  143. package/dist/utils/overflow.js.map +1 -1
  144. package/dist/utils/validation.d.ts +1 -1
  145. package/dist/utils/validation.d.ts.map +1 -1
  146. package/dist/utils/validation.js.map +1 -1
  147. package/package.json +15 -16
@@ -908,8 +908,8 @@ export const MODELS = {
908
908
  cacheRead: 0,
909
909
  cacheWrite: 0,
910
910
  },
911
- contextWindow: 256000,
912
- maxTokens: 256000,
911
+ contextWindow: 262143,
912
+ maxTokens: 16000,
913
913
  },
914
914
  "moonshotai.kimi-k2.5": {
915
915
  id: "moonshotai.kimi-k2.5",
@@ -925,8 +925,8 @@ export const MODELS = {
925
925
  cacheRead: 0,
926
926
  cacheWrite: 0,
927
927
  },
928
- contextWindow: 256000,
929
- maxTokens: 256000,
928
+ contextWindow: 262143,
929
+ maxTokens: 16000,
930
930
  },
931
931
  "nvidia.nemotron-nano-12b-v2": {
932
932
  id: "nvidia.nemotron-nano-12b-v2",
@@ -1720,6 +1720,7 @@ export const MODELS = {
1720
1720
  api: "anthropic-messages",
1721
1721
  provider: "anthropic",
1722
1722
  baseUrl: "https://api.anthropic.com",
1723
+ compat: { "forceAdaptiveThinking": true },
1723
1724
  reasoning: true,
1724
1725
  thinkingLevelMap: { "xhigh": "max" },
1725
1726
  input: ["text", "image"],
@@ -1738,6 +1739,7 @@ export const MODELS = {
1738
1739
  api: "anthropic-messages",
1739
1740
  provider: "anthropic",
1740
1741
  baseUrl: "https://api.anthropic.com",
1742
+ compat: { "forceAdaptiveThinking": true },
1741
1743
  reasoning: true,
1742
1744
  thinkingLevelMap: { "xhigh": "xhigh" },
1743
1745
  input: ["text", "image"],
@@ -1824,6 +1826,7 @@ export const MODELS = {
1824
1826
  api: "anthropic-messages",
1825
1827
  provider: "anthropic",
1826
1828
  baseUrl: "https://api.anthropic.com",
1829
+ compat: { "forceAdaptiveThinking": true },
1827
1830
  reasoning: true,
1828
1831
  input: ["text", "image"],
1829
1832
  cost: {
@@ -2823,6 +2826,7 @@ export const MODELS = {
2823
2826
  api: "anthropic-messages",
2824
2827
  provider: "cloudflare-ai-gateway",
2825
2828
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2829
+ compat: { "forceAdaptiveThinking": true },
2826
2830
  reasoning: true,
2827
2831
  thinkingLevelMap: { "xhigh": "max" },
2828
2832
  input: ["text", "image"],
@@ -2841,6 +2845,7 @@ export const MODELS = {
2841
2845
  api: "anthropic-messages",
2842
2846
  provider: "cloudflare-ai-gateway",
2843
2847
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2848
+ compat: { "forceAdaptiveThinking": true },
2844
2849
  reasoning: true,
2845
2850
  thinkingLevelMap: { "xhigh": "xhigh" },
2846
2851
  input: ["text", "image"],
@@ -2893,6 +2898,7 @@ export const MODELS = {
2893
2898
  api: "anthropic-messages",
2894
2899
  provider: "cloudflare-ai-gateway",
2895
2900
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2901
+ compat: { "forceAdaptiveThinking": true },
2896
2902
  reasoning: true,
2897
2903
  input: ["text", "image"],
2898
2904
  cost: {
@@ -3275,6 +3281,42 @@ export const MODELS = {
3275
3281
  contextWindow: 256000,
3276
3282
  maxTokens: 16384,
3277
3283
  },
3284
+ "@cf/ibm-granite/granite-4.0-h-micro": {
3285
+ id: "@cf/ibm-granite/granite-4.0-h-micro",
3286
+ name: "Granite 4.0 H Micro",
3287
+ api: "openai-completions",
3288
+ provider: "cloudflare-workers-ai",
3289
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3290
+ compat: { "sendSessionAffinityHeaders": true },
3291
+ reasoning: false,
3292
+ input: ["text"],
3293
+ cost: {
3294
+ input: 0.017,
3295
+ output: 0.112,
3296
+ cacheRead: 0,
3297
+ cacheWrite: 0,
3298
+ },
3299
+ contextWindow: 131000,
3300
+ maxTokens: 131000,
3301
+ },
3302
+ "@cf/meta/llama-3.3-70b-instruct-fp8-fast": {
3303
+ id: "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
3304
+ name: "Llama 3.3 70B Instruct fp8 Fast",
3305
+ api: "openai-completions",
3306
+ provider: "cloudflare-workers-ai",
3307
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3308
+ compat: { "sendSessionAffinityHeaders": true },
3309
+ reasoning: false,
3310
+ input: ["text"],
3311
+ cost: {
3312
+ input: 0.293,
3313
+ output: 2.253,
3314
+ cacheRead: 0,
3315
+ cacheWrite: 0,
3316
+ },
3317
+ contextWindow: 24000,
3318
+ maxTokens: 24000,
3319
+ },
3278
3320
  "@cf/meta/llama-4-scout-17b-16e-instruct": {
3279
3321
  id: "@cf/meta/llama-4-scout-17b-16e-instruct",
3280
3322
  name: "Llama 4 Scout 17B 16E Instruct",
@@ -3290,9 +3332,27 @@ export const MODELS = {
3290
3332
  cacheRead: 0,
3291
3333
  cacheWrite: 0,
3292
3334
  },
3293
- contextWindow: 128000,
3335
+ contextWindow: 131000,
3294
3336
  maxTokens: 16384,
3295
3337
  },
3338
+ "@cf/mistralai/mistral-small-3.1-24b-instruct": {
3339
+ id: "@cf/mistralai/mistral-small-3.1-24b-instruct",
3340
+ name: "Mistral Small 3.1 24B Instruct",
3341
+ api: "openai-completions",
3342
+ provider: "cloudflare-workers-ai",
3343
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3344
+ compat: { "sendSessionAffinityHeaders": true },
3345
+ reasoning: false,
3346
+ input: ["text"],
3347
+ cost: {
3348
+ input: 0.351,
3349
+ output: 0.555,
3350
+ cacheRead: 0,
3351
+ cacheWrite: 0,
3352
+ },
3353
+ contextWindow: 128000,
3354
+ maxTokens: 128000,
3355
+ },
3296
3356
  "@cf/moonshotai/kimi-k2.5": {
3297
3357
  id: "@cf/moonshotai/kimi-k2.5",
3298
3358
  name: "Kimi K2.5",
@@ -3326,7 +3386,7 @@ export const MODELS = {
3326
3386
  cacheRead: 0.16,
3327
3387
  cacheWrite: 0,
3328
3388
  },
3329
- contextWindow: 256000,
3389
+ contextWindow: 262144,
3330
3390
  maxTokens: 256000,
3331
3391
  },
3332
3392
  "@cf/nvidia/nemotron-3-120b-a12b": {
@@ -3383,6 +3443,24 @@ export const MODELS = {
3383
3443
  contextWindow: 128000,
3384
3444
  maxTokens: 16384,
3385
3445
  },
3446
+ "@cf/qwen/qwen3-30b-a3b-fp8": {
3447
+ id: "@cf/qwen/qwen3-30b-a3b-fp8",
3448
+ name: "Qwen3 30B A3b fp8",
3449
+ api: "openai-completions",
3450
+ provider: "cloudflare-workers-ai",
3451
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3452
+ compat: { "sendSessionAffinityHeaders": true },
3453
+ reasoning: true,
3454
+ input: ["text"],
3455
+ cost: {
3456
+ input: 0.0509,
3457
+ output: 0.335,
3458
+ cacheRead: 0,
3459
+ cacheWrite: 0,
3460
+ },
3461
+ contextWindow: 32768,
3462
+ maxTokens: 32768,
3463
+ },
3386
3464
  "@cf/zai-org/glm-4.7-flash": {
3387
3465
  id: "@cf/zai-org/glm-4.7-flash",
3388
3466
  name: "GLM-4.7-Flash",
@@ -3393,7 +3471,7 @@ export const MODELS = {
3393
3471
  reasoning: true,
3394
3472
  input: ["text"],
3395
3473
  cost: {
3396
- input: 0.06,
3474
+ input: 0.0605,
3397
3475
  output: 0.4,
3398
3476
  cacheRead: 0,
3399
3477
  cacheWrite: 0,
@@ -3443,27 +3521,9 @@ export const MODELS = {
3443
3521
  },
3444
3522
  },
3445
3523
  "fireworks": {
3446
- "accounts/fireworks/models/deepseek-v3p1": {
3447
- id: "accounts/fireworks/models/deepseek-v3p1",
3448
- name: "DeepSeek V3.1",
3449
- api: "anthropic-messages",
3450
- provider: "fireworks",
3451
- baseUrl: "https://api.fireworks.ai/inference",
3452
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3453
- reasoning: true,
3454
- input: ["text"],
3455
- cost: {
3456
- input: 0.56,
3457
- output: 1.68,
3458
- cacheRead: 0,
3459
- cacheWrite: 0,
3460
- },
3461
- contextWindow: 163840,
3462
- maxTokens: 163840,
3463
- },
3464
- "accounts/fireworks/models/deepseek-v3p2": {
3465
- id: "accounts/fireworks/models/deepseek-v3p2",
3466
- name: "DeepSeek V3.2",
3524
+ "accounts/fireworks/models/deepseek-v4-flash": {
3525
+ id: "accounts/fireworks/models/deepseek-v4-flash",
3526
+ name: "DeepSeek V4 Flash",
3467
3527
  api: "anthropic-messages",
3468
3528
  provider: "fireworks",
3469
3529
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3471,13 +3531,13 @@ export const MODELS = {
3471
3531
  reasoning: true,
3472
3532
  input: ["text"],
3473
3533
  cost: {
3474
- input: 0.56,
3475
- output: 1.68,
3476
- cacheRead: 0.28,
3534
+ input: 0.14,
3535
+ output: 0.28,
3536
+ cacheRead: 0.03,
3477
3537
  cacheWrite: 0,
3478
3538
  },
3479
- contextWindow: 160000,
3480
- maxTokens: 160000,
3539
+ contextWindow: 1000000,
3540
+ maxTokens: 384000,
3481
3541
  },
3482
3542
  "accounts/fireworks/models/deepseek-v4-pro": {
3483
3543
  id: "accounts/fireworks/models/deepseek-v4-pro",
@@ -3491,84 +3551,12 @@ export const MODELS = {
3491
3551
  cost: {
3492
3552
  input: 1.74,
3493
3553
  output: 3.48,
3494
- cacheRead: 0.15,
3554
+ cacheRead: 0.145,
3495
3555
  cacheWrite: 0,
3496
3556
  },
3497
3557
  contextWindow: 1000000,
3498
3558
  maxTokens: 384000,
3499
3559
  },
3500
- "accounts/fireworks/models/glm-4p5": {
3501
- id: "accounts/fireworks/models/glm-4p5",
3502
- name: "GLM 4.5",
3503
- api: "anthropic-messages",
3504
- provider: "fireworks",
3505
- baseUrl: "https://api.fireworks.ai/inference",
3506
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3507
- reasoning: true,
3508
- input: ["text"],
3509
- cost: {
3510
- input: 0.55,
3511
- output: 2.19,
3512
- cacheRead: 0,
3513
- cacheWrite: 0,
3514
- },
3515
- contextWindow: 131072,
3516
- maxTokens: 131072,
3517
- },
3518
- "accounts/fireworks/models/glm-4p5-air": {
3519
- id: "accounts/fireworks/models/glm-4p5-air",
3520
- name: "GLM 4.5 Air",
3521
- api: "anthropic-messages",
3522
- provider: "fireworks",
3523
- baseUrl: "https://api.fireworks.ai/inference",
3524
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3525
- reasoning: true,
3526
- input: ["text"],
3527
- cost: {
3528
- input: 0.22,
3529
- output: 0.88,
3530
- cacheRead: 0,
3531
- cacheWrite: 0,
3532
- },
3533
- contextWindow: 131072,
3534
- maxTokens: 131072,
3535
- },
3536
- "accounts/fireworks/models/glm-4p7": {
3537
- id: "accounts/fireworks/models/glm-4p7",
3538
- name: "GLM 4.7",
3539
- api: "anthropic-messages",
3540
- provider: "fireworks",
3541
- baseUrl: "https://api.fireworks.ai/inference",
3542
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3543
- reasoning: true,
3544
- input: ["text"],
3545
- cost: {
3546
- input: 0.6,
3547
- output: 2.2,
3548
- cacheRead: 0.3,
3549
- cacheWrite: 0,
3550
- },
3551
- contextWindow: 198000,
3552
- maxTokens: 198000,
3553
- },
3554
- "accounts/fireworks/models/glm-5": {
3555
- id: "accounts/fireworks/models/glm-5",
3556
- name: "GLM 5",
3557
- api: "anthropic-messages",
3558
- provider: "fireworks",
3559
- baseUrl: "https://api.fireworks.ai/inference",
3560
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3561
- reasoning: true,
3562
- input: ["text"],
3563
- cost: {
3564
- input: 1,
3565
- output: 3.2,
3566
- cacheRead: 0.5,
3567
- cacheWrite: 0,
3568
- },
3569
- contextWindow: 202752,
3570
- maxTokens: 131072,
3571
- },
3572
3560
  "accounts/fireworks/models/glm-5p1": {
3573
3561
  id: "accounts/fireworks/models/glm-5p1",
3574
3562
  name: "GLM 5.1",
@@ -3599,7 +3587,7 @@ export const MODELS = {
3599
3587
  cost: {
3600
3588
  input: 0.15,
3601
3589
  output: 0.6,
3602
- cacheRead: 0,
3590
+ cacheRead: 0.015,
3603
3591
  cacheWrite: 0,
3604
3592
  },
3605
3593
  contextWindow: 131072,
@@ -3615,50 +3603,14 @@ export const MODELS = {
3615
3603
  reasoning: true,
3616
3604
  input: ["text"],
3617
3605
  cost: {
3618
- input: 0.05,
3619
- output: 0.2,
3620
- cacheRead: 0,
3606
+ input: 0.07,
3607
+ output: 0.3,
3608
+ cacheRead: 0.035,
3621
3609
  cacheWrite: 0,
3622
3610
  },
3623
3611
  contextWindow: 131072,
3624
3612
  maxTokens: 32768,
3625
3613
  },
3626
- "accounts/fireworks/models/kimi-k2-instruct": {
3627
- id: "accounts/fireworks/models/kimi-k2-instruct",
3628
- name: "Kimi K2 Instruct",
3629
- api: "anthropic-messages",
3630
- provider: "fireworks",
3631
- baseUrl: "https://api.fireworks.ai/inference",
3632
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3633
- reasoning: false,
3634
- input: ["text"],
3635
- cost: {
3636
- input: 1,
3637
- output: 3,
3638
- cacheRead: 0,
3639
- cacheWrite: 0,
3640
- },
3641
- contextWindow: 128000,
3642
- maxTokens: 16384,
3643
- },
3644
- "accounts/fireworks/models/kimi-k2-thinking": {
3645
- id: "accounts/fireworks/models/kimi-k2-thinking",
3646
- name: "Kimi K2 Thinking",
3647
- api: "anthropic-messages",
3648
- provider: "fireworks",
3649
- baseUrl: "https://api.fireworks.ai/inference",
3650
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3651
- reasoning: true,
3652
- input: ["text"],
3653
- cost: {
3654
- input: 0.6,
3655
- output: 2.5,
3656
- cacheRead: 0.3,
3657
- cacheWrite: 0,
3658
- },
3659
- contextWindow: 256000,
3660
- maxTokens: 256000,
3661
- },
3662
3614
  "accounts/fireworks/models/kimi-k2p5": {
3663
3615
  id: "accounts/fireworks/models/kimi-k2p5",
3664
3616
  name: "Kimi K2.5",
@@ -3695,24 +3647,6 @@ export const MODELS = {
3695
3647
  contextWindow: 262000,
3696
3648
  maxTokens: 262000,
3697
3649
  },
3698
- "accounts/fireworks/models/minimax-m2p1": {
3699
- id: "accounts/fireworks/models/minimax-m2p1",
3700
- name: "MiniMax-M2.1",
3701
- api: "anthropic-messages",
3702
- provider: "fireworks",
3703
- baseUrl: "https://api.fireworks.ai/inference",
3704
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3705
- reasoning: true,
3706
- input: ["text"],
3707
- cost: {
3708
- input: 0.3,
3709
- output: 1.2,
3710
- cacheRead: 0.03,
3711
- cacheWrite: 0,
3712
- },
3713
- contextWindow: 200000,
3714
- maxTokens: 200000,
3715
- },
3716
3650
  "accounts/fireworks/models/minimax-m2p5": {
3717
3651
  id: "accounts/fireworks/models/minimax-m2p5",
3718
3652
  name: "MiniMax-M2.5",
@@ -3743,7 +3677,7 @@ export const MODELS = {
3743
3677
  cost: {
3744
3678
  input: 0.3,
3745
3679
  output: 1.2,
3746
- cacheRead: 0.03,
3680
+ cacheRead: 0.06,
3747
3681
  cacheWrite: 0,
3748
3682
  },
3749
3683
  contextWindow: 196608,
@@ -3767,9 +3701,27 @@ export const MODELS = {
3767
3701
  contextWindow: 128000,
3768
3702
  maxTokens: 8192,
3769
3703
  },
3770
- "accounts/fireworks/routers/kimi-k2p5-turbo": {
3771
- id: "accounts/fireworks/routers/kimi-k2p5-turbo",
3772
- name: "Kimi K2.5 Turbo",
3704
+ "accounts/fireworks/routers/glm-5p1-fast": {
3705
+ id: "accounts/fireworks/routers/glm-5p1-fast",
3706
+ name: "GLM 5.1 Fast",
3707
+ api: "anthropic-messages",
3708
+ provider: "fireworks",
3709
+ baseUrl: "https://api.fireworks.ai/inference",
3710
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3711
+ reasoning: true,
3712
+ input: ["text"],
3713
+ cost: {
3714
+ input: 2.8,
3715
+ output: 8.8,
3716
+ cacheRead: 0.52,
3717
+ cacheWrite: 0,
3718
+ },
3719
+ contextWindow: 202800,
3720
+ maxTokens: 131072,
3721
+ },
3722
+ "accounts/fireworks/routers/kimi-k2p6-turbo": {
3723
+ id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3724
+ name: "Kimi K2.6 Turbo",
3773
3725
  api: "anthropic-messages",
3774
3726
  provider: "fireworks",
3775
3727
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3777,13 +3729,13 @@ export const MODELS = {
3777
3729
  reasoning: true,
3778
3730
  input: ["text", "image"],
3779
3731
  cost: {
3780
- input: 0,
3781
- output: 0,
3782
- cacheRead: 0,
3732
+ input: 2,
3733
+ output: 8,
3734
+ cacheRead: 0.3,
3783
3735
  cacheWrite: 0,
3784
3736
  },
3785
- contextWindow: 256000,
3786
- maxTokens: 256000,
3737
+ contextWindow: 262000,
3738
+ maxTokens: 262000,
3787
3739
  },
3788
3740
  },
3789
3741
  "github-copilot": {
@@ -3831,6 +3783,7 @@ export const MODELS = {
3831
3783
  provider: "github-copilot",
3832
3784
  baseUrl: "https://api.individual.githubcopilot.com",
3833
3785
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3786
+ compat: { "forceAdaptiveThinking": true },
3834
3787
  reasoning: true,
3835
3788
  thinkingLevelMap: { "xhigh": "max" },
3836
3789
  input: ["text", "image"],
@@ -3850,6 +3803,7 @@ export const MODELS = {
3850
3803
  provider: "github-copilot",
3851
3804
  baseUrl: "https://api.individual.githubcopilot.com",
3852
3805
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3806
+ compat: { "forceAdaptiveThinking": true },
3853
3807
  reasoning: true,
3854
3808
  thinkingLevelMap: { "xhigh": "xhigh" },
3855
3809
  input: ["text", "image"],
@@ -3888,6 +3842,7 @@ export const MODELS = {
3888
3842
  provider: "github-copilot",
3889
3843
  baseUrl: "https://api.individual.githubcopilot.com",
3890
3844
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3845
+ compat: { "forceAdaptiveThinking": true },
3891
3846
  reasoning: true,
3892
3847
  input: ["text", "image"],
3893
3848
  cost: {
@@ -3956,6 +3911,25 @@ export const MODELS = {
3956
3911
  contextWindow: 128000,
3957
3912
  maxTokens: 64000,
3958
3913
  },
3914
+ "gemini-3.5-flash": {
3915
+ id: "gemini-3.5-flash",
3916
+ name: "Gemini 3.5 Flash",
3917
+ api: "openai-completions",
3918
+ provider: "github-copilot",
3919
+ baseUrl: "https://api.individual.githubcopilot.com",
3920
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3921
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3922
+ reasoning: true,
3923
+ input: ["text", "image"],
3924
+ cost: {
3925
+ input: 0,
3926
+ output: 0,
3927
+ cacheRead: 0,
3928
+ cacheWrite: 0,
3929
+ },
3930
+ contextWindow: 128000,
3931
+ maxTokens: 64000,
3932
+ },
3959
3933
  "gpt-4.1": {
3960
3934
  id: "gpt-4.1",
3961
3935
  name: "GPT-4.1",
@@ -4137,68 +4111,17 @@ export const MODELS = {
4137
4111
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4138
4112
  reasoning: true,
4139
4113
  input: ["text"],
4140
- cost: {
4141
- input: 0,
4142
- output: 0,
4143
- cacheRead: 0,
4144
- cacheWrite: 0,
4145
- },
4146
- contextWindow: 128000,
4147
- maxTokens: 64000,
4148
- },
4149
- },
4150
- "google": {
4151
- "gemini-1.5-flash": {
4152
- id: "gemini-1.5-flash",
4153
- name: "Gemini 1.5 Flash",
4154
- api: "google-generative-ai",
4155
- provider: "google",
4156
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4157
- reasoning: false,
4158
- input: ["text", "image"],
4159
- cost: {
4160
- input: 0.075,
4161
- output: 0.3,
4162
- cacheRead: 0.01875,
4163
- cacheWrite: 0,
4164
- },
4165
- contextWindow: 1000000,
4166
- maxTokens: 8192,
4167
- },
4168
- "gemini-1.5-flash-8b": {
4169
- id: "gemini-1.5-flash-8b",
4170
- name: "Gemini 1.5 Flash-8B",
4171
- api: "google-generative-ai",
4172
- provider: "google",
4173
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4174
- reasoning: false,
4175
- input: ["text", "image"],
4176
- cost: {
4177
- input: 0.0375,
4178
- output: 0.15,
4179
- cacheRead: 0.01,
4180
- cacheWrite: 0,
4181
- },
4182
- contextWindow: 1000000,
4183
- maxTokens: 8192,
4184
- },
4185
- "gemini-1.5-pro": {
4186
- id: "gemini-1.5-pro",
4187
- name: "Gemini 1.5 Pro",
4188
- api: "google-generative-ai",
4189
- provider: "google",
4190
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4191
- reasoning: false,
4192
- input: ["text", "image"],
4193
- cost: {
4194
- input: 1.25,
4195
- output: 5,
4196
- cacheRead: 0.3125,
4114
+ cost: {
4115
+ input: 0,
4116
+ output: 0,
4117
+ cacheRead: 0,
4197
4118
  cacheWrite: 0,
4198
4119
  },
4199
- contextWindow: 1000000,
4200
- maxTokens: 8192,
4120
+ contextWindow: 128000,
4121
+ maxTokens: 64000,
4201
4122
  },
4123
+ },
4124
+ "google": {
4202
4125
  "gemini-2.0-flash": {
4203
4126
  id: "gemini-2.0-flash",
4204
4127
  name: "Gemini 2.0 Flash",
@@ -4218,7 +4141,7 @@ export const MODELS = {
4218
4141
  },
4219
4142
  "gemini-2.0-flash-lite": {
4220
4143
  id: "gemini-2.0-flash-lite",
4221
- name: "Gemini 2.0 Flash Lite",
4144
+ name: "Gemini 2.0 Flash-Lite",
4222
4145
  api: "google-generative-ai",
4223
4146
  provider: "google",
4224
4147
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4252,7 +4175,7 @@ export const MODELS = {
4252
4175
  },
4253
4176
  "gemini-2.5-flash-lite": {
4254
4177
  id: "gemini-2.5-flash-lite",
4255
- name: "Gemini 2.5 Flash Lite",
4178
+ name: "Gemini 2.5 Flash-Lite",
4256
4179
  api: "google-generative-ai",
4257
4180
  provider: "google",
4258
4181
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4267,91 +4190,6 @@ export const MODELS = {
4267
4190
  contextWindow: 1048576,
4268
4191
  maxTokens: 65536,
4269
4192
  },
4270
- "gemini-2.5-flash-lite-preview-06-17": {
4271
- id: "gemini-2.5-flash-lite-preview-06-17",
4272
- name: "Gemini 2.5 Flash Lite Preview 06-17",
4273
- api: "google-generative-ai",
4274
- provider: "google",
4275
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4276
- reasoning: true,
4277
- input: ["text", "image"],
4278
- cost: {
4279
- input: 0.1,
4280
- output: 0.4,
4281
- cacheRead: 0.025,
4282
- cacheWrite: 0,
4283
- },
4284
- contextWindow: 1048576,
4285
- maxTokens: 65536,
4286
- },
4287
- "gemini-2.5-flash-lite-preview-09-2025": {
4288
- id: "gemini-2.5-flash-lite-preview-09-2025",
4289
- name: "Gemini 2.5 Flash Lite Preview 09-25",
4290
- api: "google-generative-ai",
4291
- provider: "google",
4292
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4293
- reasoning: true,
4294
- input: ["text", "image"],
4295
- cost: {
4296
- input: 0.1,
4297
- output: 0.4,
4298
- cacheRead: 0.025,
4299
- cacheWrite: 0,
4300
- },
4301
- contextWindow: 1048576,
4302
- maxTokens: 65536,
4303
- },
4304
- "gemini-2.5-flash-preview-04-17": {
4305
- id: "gemini-2.5-flash-preview-04-17",
4306
- name: "Gemini 2.5 Flash Preview 04-17",
4307
- api: "google-generative-ai",
4308
- provider: "google",
4309
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4310
- reasoning: true,
4311
- input: ["text", "image"],
4312
- cost: {
4313
- input: 0.15,
4314
- output: 0.6,
4315
- cacheRead: 0.0375,
4316
- cacheWrite: 0,
4317
- },
4318
- contextWindow: 1048576,
4319
- maxTokens: 65536,
4320
- },
4321
- "gemini-2.5-flash-preview-05-20": {
4322
- id: "gemini-2.5-flash-preview-05-20",
4323
- name: "Gemini 2.5 Flash Preview 05-20",
4324
- api: "google-generative-ai",
4325
- provider: "google",
4326
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4327
- reasoning: true,
4328
- input: ["text", "image"],
4329
- cost: {
4330
- input: 0.15,
4331
- output: 0.6,
4332
- cacheRead: 0.0375,
4333
- cacheWrite: 0,
4334
- },
4335
- contextWindow: 1048576,
4336
- maxTokens: 65536,
4337
- },
4338
- "gemini-2.5-flash-preview-09-2025": {
4339
- id: "gemini-2.5-flash-preview-09-2025",
4340
- name: "Gemini 2.5 Flash Preview 09-25",
4341
- api: "google-generative-ai",
4342
- provider: "google",
4343
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4344
- reasoning: true,
4345
- input: ["text", "image"],
4346
- cost: {
4347
- input: 0.3,
4348
- output: 2.5,
4349
- cacheRead: 0.075,
4350
- cacheWrite: 0,
4351
- },
4352
- contextWindow: 1048576,
4353
- maxTokens: 65536,
4354
- },
4355
4193
  "gemini-2.5-pro": {
4356
4194
  id: "gemini-2.5-pro",
4357
4195
  name: "Gemini 2.5 Pro",
@@ -4369,40 +4207,6 @@ export const MODELS = {
4369
4207
  contextWindow: 1048576,
4370
4208
  maxTokens: 65536,
4371
4209
  },
4372
- "gemini-2.5-pro-preview-05-06": {
4373
- id: "gemini-2.5-pro-preview-05-06",
4374
- name: "Gemini 2.5 Pro Preview 05-06",
4375
- api: "google-generative-ai",
4376
- provider: "google",
4377
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4378
- reasoning: true,
4379
- input: ["text", "image"],
4380
- cost: {
4381
- input: 1.25,
4382
- output: 10,
4383
- cacheRead: 0.31,
4384
- cacheWrite: 0,
4385
- },
4386
- contextWindow: 1048576,
4387
- maxTokens: 65536,
4388
- },
4389
- "gemini-2.5-pro-preview-06-05": {
4390
- id: "gemini-2.5-pro-preview-06-05",
4391
- name: "Gemini 2.5 Pro Preview 06-05",
4392
- api: "google-generative-ai",
4393
- provider: "google",
4394
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4395
- reasoning: true,
4396
- input: ["text", "image"],
4397
- cost: {
4398
- input: 1.25,
4399
- output: 10,
4400
- cacheRead: 0.31,
4401
- cacheWrite: 0,
4402
- },
4403
- contextWindow: 1048576,
4404
- maxTokens: 65536,
4405
- },
4406
4210
  "gemini-3-flash-preview": {
4407
4211
  id: "gemini-3-flash-preview",
4408
4212
  name: "Gemini 3 Flash Preview",
@@ -4436,8 +4240,8 @@ export const MODELS = {
4436
4240
  cacheRead: 0.2,
4437
4241
  cacheWrite: 0,
4438
4242
  },
4439
- contextWindow: 1000000,
4440
- maxTokens: 64000,
4243
+ contextWindow: 1048576,
4244
+ maxTokens: 65536,
4441
4245
  },
4442
4246
  "gemini-3.1-flash-lite": {
4443
4247
  id: "gemini-3.1-flash-lite",
@@ -4511,6 +4315,24 @@ export const MODELS = {
4511
4315
  contextWindow: 1048576,
4512
4316
  maxTokens: 65536,
4513
4317
  },
4318
+ "gemini-3.5-flash": {
4319
+ id: "gemini-3.5-flash",
4320
+ name: "Gemini 3.5 Flash",
4321
+ api: "google-generative-ai",
4322
+ provider: "google",
4323
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4324
+ reasoning: true,
4325
+ thinkingLevelMap: { "off": null },
4326
+ input: ["text", "image"],
4327
+ cost: {
4328
+ input: 1.5,
4329
+ output: 9,
4330
+ cacheRead: 0.15,
4331
+ cacheWrite: 0,
4332
+ },
4333
+ contextWindow: 1048576,
4334
+ maxTokens: 65536,
4335
+ },
4514
4336
  "gemini-flash-latest": {
4515
4337
  id: "gemini-flash-latest",
4516
4338
  name: "Gemini Flash Latest",
@@ -4545,60 +4367,9 @@ export const MODELS = {
4545
4367
  contextWindow: 1048576,
4546
4368
  maxTokens: 65536,
4547
4369
  },
4548
- "gemini-live-2.5-flash": {
4549
- id: "gemini-live-2.5-flash",
4550
- name: "Gemini Live 2.5 Flash",
4551
- api: "google-generative-ai",
4552
- provider: "google",
4553
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4554
- reasoning: true,
4555
- input: ["text", "image"],
4556
- cost: {
4557
- input: 0.5,
4558
- output: 2,
4559
- cacheRead: 0,
4560
- cacheWrite: 0,
4561
- },
4562
- contextWindow: 128000,
4563
- maxTokens: 8000,
4564
- },
4565
- "gemini-live-2.5-flash-preview-native-audio": {
4566
- id: "gemini-live-2.5-flash-preview-native-audio",
4567
- name: "Gemini Live 2.5 Flash Preview Native Audio",
4568
- api: "google-generative-ai",
4569
- provider: "google",
4570
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4571
- reasoning: true,
4572
- input: ["text"],
4573
- cost: {
4574
- input: 0.5,
4575
- output: 2,
4576
- cacheRead: 0,
4577
- cacheWrite: 0,
4578
- },
4579
- contextWindow: 131072,
4580
- maxTokens: 65536,
4581
- },
4582
- "gemma-3-27b-it": {
4583
- id: "gemma-3-27b-it",
4584
- name: "Gemma 3 27B",
4585
- api: "google-generative-ai",
4586
- provider: "google",
4587
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4588
- reasoning: false,
4589
- input: ["text", "image"],
4590
- cost: {
4591
- input: 0,
4592
- output: 0,
4593
- cacheRead: 0,
4594
- cacheWrite: 0,
4595
- },
4596
- contextWindow: 131072,
4597
- maxTokens: 8192,
4598
- },
4599
4370
  "gemma-4-26b-a4b-it": {
4600
4371
  id: "gemma-4-26b-a4b-it",
4601
- name: "Gemma 4 26B",
4372
+ name: "Gemma 4 26B A4B IT",
4602
4373
  api: "google-generative-ai",
4603
4374
  provider: "google",
4604
4375
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4611,12 +4382,12 @@ export const MODELS = {
4611
4382
  cacheRead: 0,
4612
4383
  cacheWrite: 0,
4613
4384
  },
4614
- contextWindow: 256000,
4615
- maxTokens: 8192,
4385
+ contextWindow: 262144,
4386
+ maxTokens: 32768,
4616
4387
  },
4617
4388
  "gemma-4-31b-it": {
4618
4389
  id: "gemma-4-31b-it",
4619
- name: "Gemma 4 31B",
4390
+ name: "Gemma 4 31B IT",
4620
4391
  api: "google-generative-ai",
4621
4392
  provider: "google",
4622
4393
  baseUrl: "https://generativelanguage.googleapis.com/v1beta",
@@ -4629,8 +4400,8 @@ export const MODELS = {
4629
4400
  cacheRead: 0,
4630
4401
  cacheWrite: 0,
4631
4402
  },
4632
- contextWindow: 256000,
4633
- maxTokens: 8192,
4403
+ contextWindow: 262144,
4404
+ maxTokens: 32768,
4634
4405
  },
4635
4406
  },
4636
4407
  "google-vertex": {
@@ -7336,6 +7107,7 @@ export const MODELS = {
7336
7107
  api: "anthropic-messages",
7337
7108
  provider: "opencode",
7338
7109
  baseUrl: "https://opencode.ai/zen",
7110
+ compat: { "forceAdaptiveThinking": true },
7339
7111
  reasoning: true,
7340
7112
  thinkingLevelMap: { "xhigh": "max" },
7341
7113
  input: ["text", "image"],
@@ -7354,6 +7126,7 @@ export const MODELS = {
7354
7126
  api: "anthropic-messages",
7355
7127
  provider: "opencode",
7356
7128
  baseUrl: "https://opencode.ai/zen",
7129
+ compat: { "forceAdaptiveThinking": true },
7357
7130
  reasoning: true,
7358
7131
  thinkingLevelMap: { "xhigh": "xhigh" },
7359
7132
  input: ["text", "image"],
@@ -7406,6 +7179,7 @@ export const MODELS = {
7406
7179
  api: "anthropic-messages",
7407
7180
  provider: "opencode",
7408
7181
  baseUrl: "https://opencode.ai/zen",
7182
+ compat: { "forceAdaptiveThinking": true },
7409
7183
  reasoning: true,
7410
7184
  input: ["text", "image"],
7411
7185
  cost: {
@@ -7472,6 +7246,24 @@ export const MODELS = {
7472
7246
  contextWindow: 1048576,
7473
7247
  maxTokens: 65536,
7474
7248
  },
7249
+ "gemini-3.5-flash": {
7250
+ id: "gemini-3.5-flash",
7251
+ name: "Gemini 3.5 Flash",
7252
+ api: "google-generative-ai",
7253
+ provider: "opencode",
7254
+ baseUrl: "https://opencode.ai/zen/v1",
7255
+ reasoning: true,
7256
+ thinkingLevelMap: { "off": null },
7257
+ input: ["text", "image"],
7258
+ cost: {
7259
+ input: 1.5,
7260
+ output: 9,
7261
+ cacheRead: 0.15,
7262
+ cacheWrite: 0,
7263
+ },
7264
+ contextWindow: 1048576,
7265
+ maxTokens: 65536,
7266
+ },
7475
7267
  "glm-5": {
7476
7268
  id: "glm-5",
7477
7269
  name: "GLM-5",
@@ -7794,6 +7586,23 @@ export const MODELS = {
7794
7586
  contextWindow: 1050000,
7795
7587
  maxTokens: 128000,
7796
7588
  },
7589
+ "grok-build-0.1": {
7590
+ id: "grok-build-0.1",
7591
+ name: "Grok Build 0.1",
7592
+ api: "openai-completions",
7593
+ provider: "opencode",
7594
+ baseUrl: "https://opencode.ai/zen/v1",
7595
+ reasoning: true,
7596
+ input: ["text", "image"],
7597
+ cost: {
7598
+ input: 1,
7599
+ output: 2,
7600
+ cacheRead: 0.2,
7601
+ cacheWrite: 0,
7602
+ },
7603
+ contextWindow: 256000,
7604
+ maxTokens: 256000,
7605
+ },
7797
7606
  "kimi-k2.5": {
7798
7607
  id: "kimi-k2.5",
7799
7608
  name: "Kimi K2.5",
@@ -7845,23 +7654,6 @@ export const MODELS = {
7845
7654
  contextWindow: 204800,
7846
7655
  maxTokens: 131072,
7847
7656
  },
7848
- "minimax-m2.5-free": {
7849
- id: "minimax-m2.5-free",
7850
- name: "MiniMax M2.5 Free",
7851
- api: "anthropic-messages",
7852
- provider: "opencode",
7853
- baseUrl: "https://opencode.ai/zen",
7854
- reasoning: true,
7855
- input: ["text"],
7856
- cost: {
7857
- input: 0,
7858
- output: 0,
7859
- cacheRead: 0,
7860
- cacheWrite: 0,
7861
- },
7862
- contextWindow: 204800,
7863
- maxTokens: 131072,
7864
- },
7865
7657
  "minimax-m2.7": {
7866
7658
  id: "minimax-m2.7",
7867
7659
  name: "MiniMax M2.7",
@@ -7930,23 +7722,6 @@ export const MODELS = {
7930
7722
  contextWindow: 262144,
7931
7723
  maxTokens: 65536,
7932
7724
  },
7933
- "qwen3.6-plus-free": {
7934
- id: "qwen3.6-plus-free",
7935
- name: "Qwen3.6 Plus Free",
7936
- api: "anthropic-messages",
7937
- provider: "opencode",
7938
- baseUrl: "https://opencode.ai/zen",
7939
- reasoning: true,
7940
- input: ["text", "image"],
7941
- cost: {
7942
- input: 0,
7943
- output: 0,
7944
- cacheRead: 0,
7945
- cacheWrite: 0,
7946
- },
7947
- contextWindow: 262144,
7948
- maxTokens: 65536,
7949
- },
7950
7725
  },
7951
7726
  "opencode-go": {
7952
7727
  "deepseek-v4-flash": {
@@ -8505,23 +8280,6 @@ export const MODELS = {
8505
8280
  contextWindow: 1000000,
8506
8281
  maxTokens: 128000,
8507
8282
  },
8508
- "arcee-ai/trinity-large-preview": {
8509
- id: "arcee-ai/trinity-large-preview",
8510
- name: "Arcee AI: Trinity Large Preview",
8511
- api: "openai-completions",
8512
- provider: "openrouter",
8513
- baseUrl: "https://openrouter.ai/api/v1",
8514
- reasoning: false,
8515
- input: ["text"],
8516
- cost: {
8517
- input: 0.15,
8518
- output: 0.44999999999999996,
8519
- cacheRead: 0,
8520
- cacheWrite: 0,
8521
- },
8522
- contextWindow: 131000,
8523
- maxTokens: 4096,
8524
- },
8525
8283
  "arcee-ai/trinity-large-thinking": {
8526
8284
  id: "arcee-ai/trinity-large-thinking",
8527
8285
  name: "Arcee AI: Trinity Large Thinking",
@@ -8907,13 +8665,13 @@ export const MODELS = {
8907
8665
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8908
8666
  input: ["text"],
8909
8667
  cost: {
8910
- input: 0.112,
8911
- output: 0.224,
8912
- cacheRead: 0.022,
8668
+ input: 0.09999999999999999,
8669
+ output: 0.19999999999999998,
8670
+ cacheRead: 0.02,
8913
8671
  cacheWrite: 0,
8914
8672
  },
8915
8673
  contextWindow: 1048576,
8916
- maxTokens: 4096,
8674
+ maxTokens: 16384,
8917
8675
  },
8918
8676
  "deepseek/deepseek-v4-flash:free": {
8919
8677
  id: "deepseek/deepseek-v4-flash:free",
@@ -8984,7 +8742,7 @@ export const MODELS = {
8984
8742
  cacheRead: 0.024999999999999998,
8985
8743
  cacheWrite: 0.08333333333333334,
8986
8744
  },
8987
- contextWindow: 1048576,
8745
+ contextWindow: 1000000,
8988
8746
  maxTokens: 8192,
8989
8747
  },
8990
8748
  "google/gemini-2.0-flash-lite-001": {
@@ -9191,6 +8949,23 @@ export const MODELS = {
9191
8949
  contextWindow: 1048756,
9192
8950
  maxTokens: 65536,
9193
8951
  },
8952
+ "google/gemini-3.5-flash": {
8953
+ id: "google/gemini-3.5-flash",
8954
+ name: "Google: Gemini 3.5 Flash",
8955
+ api: "openai-completions",
8956
+ provider: "openrouter",
8957
+ baseUrl: "https://openrouter.ai/api/v1",
8958
+ reasoning: true,
8959
+ input: ["text", "image"],
8960
+ cost: {
8961
+ input: 1.5,
8962
+ output: 9,
8963
+ cacheRead: 0.15,
8964
+ cacheWrite: 0.08333333333333334,
8965
+ },
8966
+ contextWindow: 1048576,
8967
+ maxTokens: 65536,
8968
+ },
9194
8969
  "google/gemma-3-12b-it": {
9195
8970
  id: "google/gemma-3-12b-it",
9196
8971
  name: "Google: Gemma 3 12B",
@@ -9337,9 +9112,9 @@ export const MODELS = {
9337
9112
  reasoning: false,
9338
9113
  input: ["text"],
9339
9114
  cost: {
9340
- input: 0.3,
9341
- output: 2.5,
9342
- cacheRead: 0.06,
9115
+ input: 0.075,
9116
+ output: 0.625,
9117
+ cacheRead: 0.015,
9343
9118
  cacheWrite: 0,
9344
9119
  },
9345
9120
  contextWindow: 262144,
@@ -11837,7 +11612,7 @@ export const MODELS = {
11837
11612
  cacheWrite: 0,
11838
11613
  },
11839
11614
  contextWindow: 262144,
11840
- maxTokens: 65536,
11615
+ maxTokens: 262144,
11841
11616
  },
11842
11617
  "qwen/qwen3.5-27b": {
11843
11618
  id: "qwen/qwen3.5-27b",
@@ -11865,13 +11640,13 @@ export const MODELS = {
11865
11640
  reasoning: true,
11866
11641
  input: ["text", "image"],
11867
11642
  cost: {
11868
- input: 0.14,
11643
+ input: 0.13899999999999998,
11869
11644
  output: 1,
11870
- cacheRead: 0.049999999999999996,
11645
+ cacheRead: 0,
11871
11646
  cacheWrite: 0,
11872
11647
  },
11873
11648
  contextWindow: 262144,
11874
- maxTokens: 81920,
11649
+ maxTokens: 4096,
11875
11650
  },
11876
11651
  "qwen/qwen3.5-397b-a17b": {
11877
11652
  id: "qwen/qwen3.5-397b-a17b",
@@ -11884,7 +11659,7 @@ export const MODELS = {
11884
11659
  cost: {
11885
11660
  input: 0.39,
11886
11661
  output: 2.34,
11887
- cacheRead: 0.195,
11662
+ cacheRead: 0,
11888
11663
  cacheWrite: 0,
11889
11664
  },
11890
11665
  contextWindow: 262144,
@@ -11967,13 +11742,13 @@ export const MODELS = {
11967
11742
  reasoning: true,
11968
11743
  input: ["text", "image"],
11969
11744
  cost: {
11970
- input: 0.32,
11745
+ input: 0.3,
11971
11746
  output: 3.1999999999999997,
11972
11747
  cacheRead: 0,
11973
11748
  cacheWrite: 0,
11974
11749
  },
11975
11750
  contextWindow: 262144,
11976
- maxTokens: 81920,
11751
+ maxTokens: 262144,
11977
11752
  },
11978
11753
  "qwen/qwen3.6-35b-a3b": {
11979
11754
  id: "qwen/qwen3.6-35b-a3b",
@@ -11986,11 +11761,11 @@ export const MODELS = {
11986
11761
  cost: {
11987
11762
  input: 0.15,
11988
11763
  output: 1,
11989
- cacheRead: 0.049999999999999996,
11764
+ cacheRead: 0,
11990
11765
  cacheWrite: 0,
11991
11766
  },
11992
11767
  contextWindow: 262144,
11993
- maxTokens: 262144,
11768
+ maxTokens: 262140,
11994
11769
  },
11995
11770
  "qwen/qwen3.6-flash": {
11996
11771
  id: "qwen/qwen3.6-flash",
@@ -12043,6 +11818,23 @@ export const MODELS = {
12043
11818
  contextWindow: 1000000,
12044
11819
  maxTokens: 65536,
12045
11820
  },
11821
+ "qwen/qwen3.7-max": {
11822
+ id: "qwen/qwen3.7-max",
11823
+ name: "Qwen: Qwen3.7 Max",
11824
+ api: "openai-completions",
11825
+ provider: "openrouter",
11826
+ baseUrl: "https://openrouter.ai/api/v1",
11827
+ reasoning: true,
11828
+ input: ["text"],
11829
+ cost: {
11830
+ input: 2.5,
11831
+ output: 7.5,
11832
+ cacheRead: 0,
11833
+ cacheWrite: 3.125,
11834
+ },
11835
+ contextWindow: 1000000,
11836
+ maxTokens: 65536,
11837
+ },
12046
11838
  "rekaai/reka-edge": {
12047
11839
  id: "rekaai/reka-edge",
12048
11840
  name: "Reka Edge",
@@ -12120,13 +11912,13 @@ export const MODELS = {
12120
11912
  reasoning: true,
12121
11913
  input: ["text"],
12122
11914
  cost: {
12123
- input: 0.09999999999999999,
11915
+ input: 0.09,
12124
11916
  output: 0.3,
12125
- cacheRead: 0,
11917
+ cacheRead: 0.02,
12126
11918
  cacheWrite: 0,
12127
11919
  },
12128
11920
  contextWindow: 262144,
12129
- maxTokens: 65536,
11921
+ maxTokens: 16384,
12130
11922
  },
12131
11923
  "tencent/hy3-preview": {
12132
11924
  id: "tencent/hy3-preview",
@@ -12230,6 +12022,23 @@ export const MODELS = {
12230
12022
  contextWindow: 1000000,
12231
12023
  maxTokens: 4096,
12232
12024
  },
12025
+ "x-ai/grok-build-0.1": {
12026
+ id: "x-ai/grok-build-0.1",
12027
+ name: "xAI: Grok Build 0.1",
12028
+ api: "openai-completions",
12029
+ provider: "openrouter",
12030
+ baseUrl: "https://openrouter.ai/api/v1",
12031
+ reasoning: true,
12032
+ input: ["text", "image"],
12033
+ cost: {
12034
+ input: 1,
12035
+ output: 2,
12036
+ cacheRead: 0.19999999999999998,
12037
+ cacheWrite: 0,
12038
+ },
12039
+ contextWindow: 256000,
12040
+ maxTokens: 4096,
12041
+ },
12233
12042
  "xiaomi/mimo-v2-flash": {
12234
12043
  id: "xiaomi/mimo-v2-flash",
12235
12044
  name: "Xiaomi: MiMo-V2-Flash",
@@ -12596,9 +12405,9 @@ export const MODELS = {
12596
12405
  reasoning: true,
12597
12406
  input: ["text", "image"],
12598
12407
  cost: {
12599
- input: 0.5,
12600
- output: 3,
12601
- cacheRead: 0.049999999999999996,
12408
+ input: 1.5,
12409
+ output: 9,
12410
+ cacheRead: 0.15,
12602
12411
  cacheWrite: 0.08333333333333334,
12603
12412
  },
12604
12413
  contextWindow: 1048576,
@@ -12806,6 +12615,25 @@ export const MODELS = {
12806
12615
  contextWindow: 1000000,
12807
12616
  maxTokens: 500000,
12808
12617
  },
12618
+ "Qwen/Qwen3.7-Max": {
12619
+ id: "Qwen/Qwen3.7-Max",
12620
+ name: "Qwen3.7 Max",
12621
+ api: "openai-completions",
12622
+ provider: "together",
12623
+ baseUrl: "https://api.together.ai/v1",
12624
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12625
+ reasoning: true,
12626
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12627
+ input: ["text"],
12628
+ cost: {
12629
+ input: 2.5,
12630
+ output: 7.5,
12631
+ cacheRead: 0,
12632
+ cacheWrite: 0,
12633
+ },
12634
+ contextWindow: 1000000,
12635
+ maxTokens: 500000,
12636
+ },
12809
12637
  "deepseek-ai/DeepSeek-V3": {
12810
12638
  id: "deepseek-ai/DeepSeek-V3",
12811
12639
  name: "DeepSeek V3",
@@ -13302,6 +13130,23 @@ export const MODELS = {
13302
13130
  contextWindow: 1000000,
13303
13131
  maxTokens: 64000,
13304
13132
  },
13133
+ "alibaba/qwen3.7-max": {
13134
+ id: "alibaba/qwen3.7-max",
13135
+ name: "Qwen 3.7 Max",
13136
+ api: "anthropic-messages",
13137
+ provider: "vercel-ai-gateway",
13138
+ baseUrl: "https://ai-gateway.vercel.sh",
13139
+ reasoning: true,
13140
+ input: ["text", "image"],
13141
+ cost: {
13142
+ input: 1.25,
13143
+ output: 3.75,
13144
+ cacheRead: 0.25,
13145
+ cacheWrite: 1.5625,
13146
+ },
13147
+ contextWindow: 991000,
13148
+ maxTokens: 64000,
13149
+ },
13305
13150
  "anthropic/claude-3-haiku": {
13306
13151
  id: "anthropic/claude-3-haiku",
13307
13152
  name: "Claude 3 Haiku",
@@ -13410,6 +13255,7 @@ export const MODELS = {
13410
13255
  api: "anthropic-messages",
13411
13256
  provider: "vercel-ai-gateway",
13412
13257
  baseUrl: "https://ai-gateway.vercel.sh",
13258
+ compat: { "forceAdaptiveThinking": true },
13413
13259
  reasoning: true,
13414
13260
  thinkingLevelMap: { "xhigh": "max" },
13415
13261
  input: ["text", "image"],
@@ -13428,6 +13274,7 @@ export const MODELS = {
13428
13274
  api: "anthropic-messages",
13429
13275
  provider: "vercel-ai-gateway",
13430
13276
  baseUrl: "https://ai-gateway.vercel.sh",
13277
+ compat: { "forceAdaptiveThinking": true },
13431
13278
  reasoning: true,
13432
13279
  thinkingLevelMap: { "xhigh": "xhigh" },
13433
13280
  input: ["text", "image"],
@@ -13480,6 +13327,7 @@ export const MODELS = {
13480
13327
  api: "anthropic-messages",
13481
13328
  provider: "vercel-ai-gateway",
13482
13329
  baseUrl: "https://ai-gateway.vercel.sh",
13330
+ compat: { "forceAdaptiveThinking": true },
13483
13331
  reasoning: true,
13484
13332
  input: ["text", "image"],
13485
13333
  cost: {
@@ -13865,6 +13713,23 @@ export const MODELS = {
13865
13713
  contextWindow: 1000000,
13866
13714
  maxTokens: 64000,
13867
13715
  },
13716
+ "google/gemini-3.5-flash": {
13717
+ id: "google/gemini-3.5-flash",
13718
+ name: "Gemini 3.5 Flash",
13719
+ api: "anthropic-messages",
13720
+ provider: "vercel-ai-gateway",
13721
+ baseUrl: "https://ai-gateway.vercel.sh",
13722
+ reasoning: true,
13723
+ input: ["text", "image"],
13724
+ cost: {
13725
+ input: 1.5,
13726
+ output: 9,
13727
+ cacheRead: 0.15,
13728
+ cacheWrite: 0,
13729
+ },
13730
+ contextWindow: 1000000,
13731
+ maxTokens: 64000,
13732
+ },
13868
13733
  "google/gemma-4-26b-a4b-it": {
13869
13734
  id: "google/gemma-4-26b-a4b-it",
13870
13735
  name: "Gemma 4 26B A4B IT",
@@ -14173,7 +14038,7 @@ export const MODELS = {
14173
14038
  },
14174
14039
  "minimax/minimax-m2.7": {
14175
14040
  id: "minimax/minimax-m2.7",
14176
- name: "Minimax M2.7",
14041
+ name: "MiniMax M2.7",
14177
14042
  api: "anthropic-messages",
14178
14043
  provider: "vercel-ai-gateway",
14179
14044
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -14324,6 +14189,23 @@ export const MODELS = {
14324
14189
  contextWindow: 128000,
14325
14190
  maxTokens: 64000,
14326
14191
  },
14192
+ "mistral/mistral-medium-3.5": {
14193
+ id: "mistral/mistral-medium-3.5",
14194
+ name: "Mistral Medium Latest",
14195
+ api: "anthropic-messages",
14196
+ provider: "vercel-ai-gateway",
14197
+ baseUrl: "https://ai-gateway.vercel.sh",
14198
+ reasoning: true,
14199
+ input: ["text"],
14200
+ cost: {
14201
+ input: 1.5,
14202
+ output: 7.5,
14203
+ cacheRead: 0,
14204
+ cacheWrite: 0,
14205
+ },
14206
+ contextWindow: 256000,
14207
+ maxTokens: 256000,
14208
+ },
14327
14209
  "mistral/mistral-small": {
14328
14210
  id: "mistral/mistral-small",
14329
14211
  name: "Mistral Small",
@@ -15339,6 +15221,23 @@ export const MODELS = {
15339
15221
  contextWindow: 1000000,
15340
15222
  maxTokens: 1000000,
15341
15223
  },
15224
+ "xai/grok-build-0.1": {
15225
+ id: "xai/grok-build-0.1",
15226
+ name: "Grok Build 0.1",
15227
+ api: "anthropic-messages",
15228
+ provider: "vercel-ai-gateway",
15229
+ baseUrl: "https://ai-gateway.vercel.sh",
15230
+ reasoning: true,
15231
+ input: ["text", "image"],
15232
+ cost: {
15233
+ input: 1,
15234
+ output: 2,
15235
+ cacheRead: 0.19999999999999998,
15236
+ cacheWrite: 0,
15237
+ },
15238
+ contextWindow: 256000,
15239
+ maxTokens: 256000,
15240
+ },
15342
15241
  "xiaomi/mimo-v2-flash": {
15343
15242
  id: "xiaomi/mimo-v2-flash",
15344
15243
  name: "MiMo V2 Flash",
@@ -15630,108 +15529,6 @@ export const MODELS = {
15630
15529
  },
15631
15530
  },
15632
15531
  "xai": {
15633
- "grok-2": {
15634
- id: "grok-2",
15635
- name: "Grok 2",
15636
- api: "openai-completions",
15637
- provider: "xai",
15638
- baseUrl: "https://api.x.ai/v1",
15639
- reasoning: false,
15640
- input: ["text"],
15641
- cost: {
15642
- input: 2,
15643
- output: 10,
15644
- cacheRead: 2,
15645
- cacheWrite: 0,
15646
- },
15647
- contextWindow: 131072,
15648
- maxTokens: 8192,
15649
- },
15650
- "grok-2-1212": {
15651
- id: "grok-2-1212",
15652
- name: "Grok 2 (1212)",
15653
- api: "openai-completions",
15654
- provider: "xai",
15655
- baseUrl: "https://api.x.ai/v1",
15656
- reasoning: false,
15657
- input: ["text"],
15658
- cost: {
15659
- input: 2,
15660
- output: 10,
15661
- cacheRead: 2,
15662
- cacheWrite: 0,
15663
- },
15664
- contextWindow: 131072,
15665
- maxTokens: 8192,
15666
- },
15667
- "grok-2-latest": {
15668
- id: "grok-2-latest",
15669
- name: "Grok 2 Latest",
15670
- api: "openai-completions",
15671
- provider: "xai",
15672
- baseUrl: "https://api.x.ai/v1",
15673
- reasoning: false,
15674
- input: ["text"],
15675
- cost: {
15676
- input: 2,
15677
- output: 10,
15678
- cacheRead: 2,
15679
- cacheWrite: 0,
15680
- },
15681
- contextWindow: 131072,
15682
- maxTokens: 8192,
15683
- },
15684
- "grok-2-vision": {
15685
- id: "grok-2-vision",
15686
- name: "Grok 2 Vision",
15687
- api: "openai-completions",
15688
- provider: "xai",
15689
- baseUrl: "https://api.x.ai/v1",
15690
- reasoning: false,
15691
- input: ["text", "image"],
15692
- cost: {
15693
- input: 2,
15694
- output: 10,
15695
- cacheRead: 2,
15696
- cacheWrite: 0,
15697
- },
15698
- contextWindow: 8192,
15699
- maxTokens: 4096,
15700
- },
15701
- "grok-2-vision-1212": {
15702
- id: "grok-2-vision-1212",
15703
- name: "Grok 2 Vision (1212)",
15704
- api: "openai-completions",
15705
- provider: "xai",
15706
- baseUrl: "https://api.x.ai/v1",
15707
- reasoning: false,
15708
- input: ["text", "image"],
15709
- cost: {
15710
- input: 2,
15711
- output: 10,
15712
- cacheRead: 2,
15713
- cacheWrite: 0,
15714
- },
15715
- contextWindow: 8192,
15716
- maxTokens: 4096,
15717
- },
15718
- "grok-2-vision-latest": {
15719
- id: "grok-2-vision-latest",
15720
- name: "Grok 2 Vision Latest",
15721
- api: "openai-completions",
15722
- provider: "xai",
15723
- baseUrl: "https://api.x.ai/v1",
15724
- reasoning: false,
15725
- input: ["text", "image"],
15726
- cost: {
15727
- input: 2,
15728
- output: 10,
15729
- cacheRead: 2,
15730
- cacheWrite: 0,
15731
- },
15732
- contextWindow: 8192,
15733
- maxTokens: 4096,
15734
- },
15735
15532
  "grok-3": {
15736
15533
  id: "grok-3",
15737
15534
  name: "Grok 3",
@@ -15775,8 +15572,8 @@ export const MODELS = {
15775
15572
  reasoning: false,
15776
15573
  input: ["text", "image"],
15777
15574
  cost: {
15778
- input: 2,
15779
- output: 6,
15575
+ input: 1.25,
15576
+ output: 2.5,
15780
15577
  cacheRead: 0.2,
15781
15578
  cacheWrite: 0,
15782
15579
  },
@@ -15792,8 +15589,8 @@ export const MODELS = {
15792
15589
  reasoning: true,
15793
15590
  input: ["text", "image"],
15794
15591
  cost: {
15795
- input: 2,
15796
- output: 6,
15592
+ input: 1.25,
15593
+ output: 2.5,
15797
15594
  cacheRead: 0.2,
15798
15595
  cacheWrite: 0,
15799
15596
  },
@@ -15817,22 +15614,22 @@ export const MODELS = {
15817
15614
  contextWindow: 1000000,
15818
15615
  maxTokens: 30000,
15819
15616
  },
15820
- "grok-beta": {
15821
- id: "grok-beta",
15822
- name: "Grok Beta",
15617
+ "grok-build-0.1": {
15618
+ id: "grok-build-0.1",
15619
+ name: "Grok Build 0.1",
15823
15620
  api: "openai-completions",
15824
15621
  provider: "xai",
15825
15622
  baseUrl: "https://api.x.ai/v1",
15826
- reasoning: false,
15827
- input: ["text"],
15623
+ reasoning: true,
15624
+ input: ["text", "image"],
15828
15625
  cost: {
15829
- input: 5,
15830
- output: 15,
15831
- cacheRead: 5,
15626
+ input: 1,
15627
+ output: 2,
15628
+ cacheRead: 0.2,
15832
15629
  cacheWrite: 0,
15833
15630
  },
15834
- contextWindow: 131072,
15835
- maxTokens: 4096,
15631
+ contextWindow: 256000,
15632
+ maxTokens: 256000,
15836
15633
  },
15837
15634
  "grok-code-fast-1": {
15838
15635
  id: "grok-code-fast-1",
@@ -15851,23 +15648,6 @@ export const MODELS = {
15851
15648
  contextWindow: 32768,
15852
15649
  maxTokens: 8192,
15853
15650
  },
15854
- "grok-vision-beta": {
15855
- id: "grok-vision-beta",
15856
- name: "Grok Vision Beta",
15857
- api: "openai-completions",
15858
- provider: "xai",
15859
- baseUrl: "https://api.x.ai/v1",
15860
- reasoning: false,
15861
- input: ["text", "image"],
15862
- cost: {
15863
- input: 5,
15864
- output: 15,
15865
- cacheRead: 5,
15866
- cacheWrite: 0,
15867
- },
15868
- contextWindow: 8192,
15869
- maxTokens: 4096,
15870
- },
15871
15651
  },
15872
15652
  "xiaomi": {
15873
15653
  "mimo-v2-flash": {