@caupulican/pi-ai 0.75.6 → 0.78.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (71) hide show
  1. package/README.md +1 -1
  2. package/dist/image-models.generated.d.ts.map +1 -1
  3. package/dist/image-models.generated.js +146 -146
  4. package/dist/image-models.generated.js.map +1 -1
  5. package/dist/models.generated.d.ts +399 -299
  6. package/dist/models.generated.d.ts.map +1 -1
  7. package/dist/models.generated.js +494 -455
  8. package/dist/models.generated.js.map +1 -1
  9. package/dist/providers/amazon-bedrock.d.ts +1 -1
  10. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  11. package/dist/providers/amazon-bedrock.js +38 -2
  12. package/dist/providers/amazon-bedrock.js.map +1 -1
  13. package/dist/providers/anthropic.d.ts.map +1 -1
  14. package/dist/providers/anthropic.js +21 -12
  15. package/dist/providers/anthropic.js.map +1 -1
  16. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  17. package/dist/providers/azure-openai-responses.js +6 -10
  18. package/dist/providers/azure-openai-responses.js.map +1 -1
  19. package/dist/providers/google-vertex.d.ts.map +1 -1
  20. package/dist/providers/google-vertex.js +1 -1
  21. package/dist/providers/google-vertex.js.map +1 -1
  22. package/dist/providers/google.d.ts.map +1 -1
  23. package/dist/providers/google.js +5 -3
  24. package/dist/providers/google.js.map +1 -1
  25. package/dist/providers/images/openrouter.d.ts.map +1 -1
  26. package/dist/providers/images/openrouter.js +3 -4
  27. package/dist/providers/images/openrouter.js.map +1 -1
  28. package/dist/providers/mistral.d.ts.map +1 -1
  29. package/dist/providers/mistral.js +2 -3
  30. package/dist/providers/mistral.js.map +1 -1
  31. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  32. package/dist/providers/openai-codex-responses.js +159 -78
  33. package/dist/providers/openai-codex-responses.js.map +1 -1
  34. package/dist/providers/openai-completions.d.ts.map +1 -1
  35. package/dist/providers/openai-completions.js +16 -11
  36. package/dist/providers/openai-completions.js.map +1 -1
  37. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  38. package/dist/providers/openai-responses-shared.js +4 -1
  39. package/dist/providers/openai-responses-shared.js.map +1 -1
  40. package/dist/providers/openai-responses.d.ts.map +1 -1
  41. package/dist/providers/openai-responses.js +6 -10
  42. package/dist/providers/openai-responses.js.map +1 -1
  43. package/dist/providers/simple-options.d.ts.map +1 -1
  44. package/dist/providers/simple-options.js +1 -0
  45. package/dist/providers/simple-options.js.map +1 -1
  46. package/dist/stream.d.ts.map +1 -1
  47. package/dist/stream.js +14 -2
  48. package/dist/stream.js.map +1 -1
  49. package/dist/types.d.ts +14 -4
  50. package/dist/types.d.ts.map +1 -1
  51. package/dist/types.js.map +1 -1
  52. package/dist/utils/abort-signals.d.ts +6 -0
  53. package/dist/utils/abort-signals.d.ts.map +1 -0
  54. package/dist/utils/abort-signals.js +34 -0
  55. package/dist/utils/abort-signals.js.map +1 -0
  56. package/dist/utils/oauth/device-code.d.ts +9 -7
  57. package/dist/utils/oauth/device-code.d.ts.map +1 -1
  58. package/dist/utils/oauth/device-code.js +8 -7
  59. package/dist/utils/oauth/device-code.js.map +1 -1
  60. package/dist/utils/oauth/github-copilot.d.ts.map +1 -1
  61. package/dist/utils/oauth/github-copilot.js +1 -1
  62. package/dist/utils/oauth/github-copilot.js.map +1 -1
  63. package/dist/utils/oauth/index.d.ts +1 -1
  64. package/dist/utils/oauth/index.d.ts.map +1 -1
  65. package/dist/utils/oauth/index.js +1 -1
  66. package/dist/utils/oauth/index.js.map +1 -1
  67. package/dist/utils/oauth/openai-codex.d.ts +10 -1
  68. package/dist/utils/oauth/openai-codex.d.ts.map +1 -1
  69. package/dist/utils/oauth/openai-codex.js +179 -79
  70. package/dist/utils/oauth/openai-codex.js.map +1 -1
  71. package/package.json +104 -91
@@ -157,6 +157,24 @@ export const MODELS = {
157
157
  contextWindow: 1000000,
158
158
  maxTokens: 128000,
159
159
  },
160
+ "anthropic.claude-opus-4-8": {
161
+ id: "anthropic.claude-opus-4-8",
162
+ name: "Claude Opus 4.8",
163
+ api: "bedrock-converse-stream",
164
+ provider: "amazon-bedrock",
165
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
166
+ reasoning: true,
167
+ thinkingLevelMap: { "xhigh": "xhigh" },
168
+ input: ["text", "image"],
169
+ cost: {
170
+ input: 5,
171
+ output: 25,
172
+ cacheRead: 0.5,
173
+ cacheWrite: 6.25,
174
+ },
175
+ contextWindow: 1000000,
176
+ maxTokens: 128000,
177
+ },
160
178
  "anthropic.claude-sonnet-4-5-20250929-v1:0": {
161
179
  id: "anthropic.claude-sonnet-4-5-20250929-v1:0",
162
180
  name: "Claude Sonnet 4.5",
@@ -226,6 +244,24 @@ export const MODELS = {
226
244
  contextWindow: 1000000,
227
245
  maxTokens: 128000,
228
246
  },
247
+ "au.anthropic.claude-opus-4-8": {
248
+ id: "au.anthropic.claude-opus-4-8",
249
+ name: "Claude Opus 4.8 (AU)",
250
+ api: "bedrock-converse-stream",
251
+ provider: "amazon-bedrock",
252
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
253
+ reasoning: true,
254
+ thinkingLevelMap: { "xhigh": "xhigh" },
255
+ input: ["text", "image"],
256
+ cost: {
257
+ input: 5,
258
+ output: 25,
259
+ cacheRead: 0.5,
260
+ cacheWrite: 6.25,
261
+ },
262
+ contextWindow: 1000000,
263
+ maxTokens: 128000,
264
+ },
229
265
  "au.anthropic.claude-sonnet-4-5-20250929-v1:0": {
230
266
  id: "au.anthropic.claude-sonnet-4-5-20250929-v1:0",
231
267
  name: "Claude Sonnet 4.5 (AU)",
@@ -381,6 +417,24 @@ export const MODELS = {
381
417
  contextWindow: 1000000,
382
418
  maxTokens: 128000,
383
419
  },
420
+ "eu.anthropic.claude-opus-4-8": {
421
+ id: "eu.anthropic.claude-opus-4-8",
422
+ name: "Claude Opus 4.8 (EU)",
423
+ api: "bedrock-converse-stream",
424
+ provider: "amazon-bedrock",
425
+ baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
426
+ reasoning: true,
427
+ thinkingLevelMap: { "xhigh": "xhigh" },
428
+ input: ["text", "image"],
429
+ cost: {
430
+ input: 5,
431
+ output: 25,
432
+ cacheRead: 0.5,
433
+ cacheWrite: 6.25,
434
+ },
435
+ contextWindow: 1000000,
436
+ maxTokens: 128000,
437
+ },
384
438
  "eu.anthropic.claude-sonnet-4-5-20250929-v1:0": {
385
439
  id: "eu.anthropic.claude-sonnet-4-5-20250929-v1:0",
386
440
  name: "Claude Sonnet 4.5 (EU)",
@@ -485,6 +539,24 @@ export const MODELS = {
485
539
  contextWindow: 1000000,
486
540
  maxTokens: 128000,
487
541
  },
542
+ "global.anthropic.claude-opus-4-8": {
543
+ id: "global.anthropic.claude-opus-4-8",
544
+ name: "Claude Opus 4.8 (Global)",
545
+ api: "bedrock-converse-stream",
546
+ provider: "amazon-bedrock",
547
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
548
+ reasoning: true,
549
+ thinkingLevelMap: { "xhigh": "xhigh" },
550
+ input: ["text", "image"],
551
+ cost: {
552
+ input: 5,
553
+ output: 25,
554
+ cacheRead: 0.5,
555
+ cacheWrite: 6.25,
556
+ },
557
+ contextWindow: 1000000,
558
+ maxTokens: 128000,
559
+ },
488
560
  "global.anthropic.claude-sonnet-4-5-20250929-v1:0": {
489
561
  id: "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
490
562
  name: "Claude Sonnet 4.5 (Global)",
@@ -571,6 +643,24 @@ export const MODELS = {
571
643
  contextWindow: 1000000,
572
644
  maxTokens: 128000,
573
645
  },
646
+ "jp.anthropic.claude-opus-4-8": {
647
+ id: "jp.anthropic.claude-opus-4-8",
648
+ name: "Claude Opus 4.8 (JP)",
649
+ api: "bedrock-converse-stream",
650
+ provider: "amazon-bedrock",
651
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
652
+ reasoning: true,
653
+ thinkingLevelMap: { "xhigh": "xhigh" },
654
+ input: ["text", "image"],
655
+ cost: {
656
+ input: 5,
657
+ output: 25,
658
+ cacheRead: 0.5,
659
+ cacheWrite: 6.25,
660
+ },
661
+ contextWindow: 1000000,
662
+ maxTokens: 128000,
663
+ },
574
664
  "jp.anthropic.claude-sonnet-4-5-20250929-v1:0": {
575
665
  id: "jp.anthropic.claude-sonnet-4-5-20250929-v1:0",
576
666
  name: "Claude Sonnet 4.5 (JP)",
@@ -1270,6 +1360,24 @@ export const MODELS = {
1270
1360
  contextWindow: 1000000,
1271
1361
  maxTokens: 128000,
1272
1362
  },
1363
+ "us.anthropic.claude-opus-4-8": {
1364
+ id: "us.anthropic.claude-opus-4-8",
1365
+ name: "Claude Opus 4.8 (US)",
1366
+ api: "bedrock-converse-stream",
1367
+ provider: "amazon-bedrock",
1368
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1369
+ reasoning: true,
1370
+ thinkingLevelMap: { "xhigh": "xhigh" },
1371
+ input: ["text", "image"],
1372
+ cost: {
1373
+ input: 5,
1374
+ output: 25,
1375
+ cacheRead: 0.5,
1376
+ cacheWrite: 6.25,
1377
+ },
1378
+ contextWindow: 1000000,
1379
+ maxTokens: 128000,
1380
+ },
1273
1381
  "us.anthropic.claude-sonnet-4-5-20250929-v1:0": {
1274
1382
  id: "us.anthropic.claude-sonnet-4-5-20250929-v1:0",
1275
1383
  name: "Claude Sonnet 4.5 (US)",
@@ -1752,6 +1860,25 @@ export const MODELS = {
1752
1860
  contextWindow: 1000000,
1753
1861
  maxTokens: 128000,
1754
1862
  },
1863
+ "claude-opus-4-8": {
1864
+ id: "claude-opus-4-8",
1865
+ name: "Claude Opus 4.8",
1866
+ api: "anthropic-messages",
1867
+ provider: "anthropic",
1868
+ baseUrl: "https://api.anthropic.com",
1869
+ compat: { "forceAdaptiveThinking": true },
1870
+ reasoning: true,
1871
+ thinkingLevelMap: { "xhigh": "xhigh" },
1872
+ input: ["text", "image"],
1873
+ cost: {
1874
+ input: 5,
1875
+ output: 25,
1876
+ cacheRead: 0.5,
1877
+ cacheWrite: 6.25,
1878
+ },
1879
+ contextWindow: 1000000,
1880
+ maxTokens: 128000,
1881
+ },
1755
1882
  "claude-sonnet-4-0": {
1756
1883
  id: "claude-sonnet-4-0",
1757
1884
  name: "Claude Sonnet 4 (latest)",
@@ -1919,7 +2046,7 @@ export const MODELS = {
1919
2046
  cost: {
1920
2047
  input: 0.1,
1921
2048
  output: 0.4,
1922
- cacheRead: 0.03,
2049
+ cacheRead: 0.025,
1923
2050
  cacheWrite: 0,
1924
2051
  },
1925
2052
  contextWindow: 1047576,
@@ -2004,7 +2131,7 @@ export const MODELS = {
2004
2131
  cost: {
2005
2132
  input: 0.15,
2006
2133
  output: 0.6,
2007
- cacheRead: 0.08,
2134
+ cacheRead: 0.075,
2008
2135
  cacheWrite: 0,
2009
2136
  },
2010
2137
  contextWindow: 128000,
@@ -2130,7 +2257,7 @@ export const MODELS = {
2130
2257
  cost: {
2131
2258
  input: 1.25,
2132
2259
  output: 10,
2133
- cacheRead: 0.13,
2260
+ cacheRead: 0.125,
2134
2261
  cacheWrite: 0,
2135
2262
  },
2136
2263
  contextWindow: 400000,
@@ -2431,7 +2558,7 @@ export const MODELS = {
2431
2558
  provider: "azure-openai-responses",
2432
2559
  baseUrl: "",
2433
2560
  reasoning: true,
2434
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
2561
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
2435
2562
  input: ["text", "image"],
2436
2563
  cost: {
2437
2564
  input: 30,
@@ -2555,7 +2682,7 @@ export const MODELS = {
2555
2682
  cost: {
2556
2683
  input: 1.1,
2557
2684
  output: 4.4,
2558
- cacheRead: 0.28,
2685
+ cacheRead: 0.275,
2559
2686
  cacheWrite: 0,
2560
2687
  },
2561
2688
  contextWindow: 200000,
@@ -2614,23 +2741,6 @@ export const MODELS = {
2614
2741
  contextWindow: 32000,
2615
2742
  maxTokens: 8000,
2616
2743
  },
2617
- "qwen-3-235b-a22b-instruct-2507": {
2618
- id: "qwen-3-235b-a22b-instruct-2507",
2619
- name: "Qwen 3 235B Instruct",
2620
- api: "openai-completions",
2621
- provider: "cerebras",
2622
- baseUrl: "https://api.cerebras.ai/v1",
2623
- reasoning: false,
2624
- input: ["text"],
2625
- cost: {
2626
- input: 0.6,
2627
- output: 1.2,
2628
- cacheRead: 0,
2629
- cacheWrite: 0,
2630
- },
2631
- contextWindow: 131000,
2632
- maxTokens: 32000,
2633
- },
2634
2744
  "zai-glm-4.7": {
2635
2745
  id: "zai-glm-4.7",
2636
2746
  name: "Z.AI GLM-4.7",
@@ -2858,6 +2968,25 @@ export const MODELS = {
2858
2968
  contextWindow: 1000000,
2859
2969
  maxTokens: 128000,
2860
2970
  },
2971
+ "claude-opus-4-8": {
2972
+ id: "claude-opus-4-8",
2973
+ name: "Claude Opus 4.8",
2974
+ api: "anthropic-messages",
2975
+ provider: "cloudflare-ai-gateway",
2976
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2977
+ compat: { "forceAdaptiveThinking": true },
2978
+ reasoning: true,
2979
+ thinkingLevelMap: { "xhigh": "xhigh" },
2980
+ input: ["text", "image"],
2981
+ cost: {
2982
+ input: 5,
2983
+ output: 25,
2984
+ cacheRead: 0.5,
2985
+ cacheWrite: 6.25,
2986
+ },
2987
+ contextWindow: 1000000,
2988
+ maxTokens: 128000,
2989
+ },
2861
2990
  "claude-sonnet-4": {
2862
2991
  id: "claude-sonnet-4",
2863
2992
  name: "Claude Sonnet 4 (latest)",
@@ -3755,8 +3884,8 @@ export const MODELS = {
3755
3884
  cacheRead: 0,
3756
3885
  cacheWrite: 0,
3757
3886
  },
3758
- contextWindow: 144000,
3759
- maxTokens: 32000,
3887
+ contextWindow: 200000,
3888
+ maxTokens: 64000,
3760
3889
  },
3761
3890
  "claude-opus-4.5": {
3762
3891
  id: "claude-opus-4.5",
@@ -3773,7 +3902,7 @@ export const MODELS = {
3773
3902
  cacheRead: 0,
3774
3903
  cacheWrite: 0,
3775
3904
  },
3776
- contextWindow: 160000,
3905
+ contextWindow: 200000,
3777
3906
  maxTokens: 32000,
3778
3907
  },
3779
3908
  "claude-opus-4.6": {
@@ -3794,7 +3923,7 @@ export const MODELS = {
3794
3923
  cacheWrite: 0,
3795
3924
  },
3796
3925
  contextWindow: 1000000,
3797
- maxTokens: 64000,
3926
+ maxTokens: 32000,
3798
3927
  },
3799
3928
  "claude-opus-4.7": {
3800
3929
  id: "claude-opus-4.7",
@@ -3813,7 +3942,27 @@ export const MODELS = {
3813
3942
  cacheRead: 0,
3814
3943
  cacheWrite: 0,
3815
3944
  },
3816
- contextWindow: 144000,
3945
+ contextWindow: 200000,
3946
+ maxTokens: 32000,
3947
+ },
3948
+ "claude-opus-4.8": {
3949
+ id: "claude-opus-4.8",
3950
+ name: "Claude Opus 4.8",
3951
+ api: "anthropic-messages",
3952
+ provider: "github-copilot",
3953
+ baseUrl: "https://api.individual.githubcopilot.com",
3954
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3955
+ compat: { "forceAdaptiveThinking": true },
3956
+ reasoning: true,
3957
+ thinkingLevelMap: { "xhigh": "xhigh" },
3958
+ input: ["text", "image"],
3959
+ cost: {
3960
+ input: 0,
3961
+ output: 0,
3962
+ cacheRead: 0,
3963
+ cacheWrite: 0,
3964
+ },
3965
+ contextWindow: 200000,
3817
3966
  maxTokens: 64000,
3818
3967
  },
3819
3968
  "claude-sonnet-4.5": {
@@ -3832,7 +3981,7 @@ export const MODELS = {
3832
3981
  cacheRead: 0,
3833
3982
  cacheWrite: 0,
3834
3983
  },
3835
- contextWindow: 144000,
3984
+ contextWindow: 200000,
3836
3985
  maxTokens: 32000,
3837
3986
  },
3838
3987
  "claude-sonnet-4.6": {
@@ -3908,7 +4057,7 @@ export const MODELS = {
3908
4057
  cacheRead: 0,
3909
4058
  cacheWrite: 0,
3910
4059
  },
3911
- contextWindow: 128000,
4060
+ contextWindow: 200000,
3912
4061
  maxTokens: 64000,
3913
4062
  },
3914
4063
  "gemini-3.5-flash": {
@@ -3927,7 +4076,7 @@ export const MODELS = {
3927
4076
  cacheRead: 0,
3928
4077
  cacheWrite: 0,
3929
4078
  },
3930
- contextWindow: 128000,
4079
+ contextWindow: 200000,
3931
4080
  maxTokens: 64000,
3932
4081
  },
3933
4082
  "gpt-4.1": {
@@ -4003,8 +4152,8 @@ export const MODELS = {
4003
4152
  cacheRead: 0,
4004
4153
  cacheWrite: 0,
4005
4154
  },
4006
- contextWindow: 264000,
4007
- maxTokens: 64000,
4155
+ contextWindow: 400000,
4156
+ maxTokens: 128000,
4008
4157
  },
4009
4158
  "gpt-5.2-codex": {
4010
4159
  id: "gpt-5.2-codex",
@@ -4847,7 +4996,7 @@ export const MODELS = {
4847
4996
  cost: {
4848
4997
  input: 1,
4849
4998
  output: 3,
4850
- cacheRead: 0,
4999
+ cacheRead: 0.5,
4851
5000
  cacheWrite: 0,
4852
5001
  },
4853
5002
  contextWindow: 262144,
@@ -4864,7 +5013,7 @@ export const MODELS = {
4864
5013
  cost: {
4865
5014
  input: 0.15,
4866
5015
  output: 0.6,
4867
- cacheRead: 0,
5016
+ cacheRead: 0.075,
4868
5017
  cacheWrite: 0,
4869
5018
  },
4870
5019
  contextWindow: 131072,
@@ -4881,7 +5030,7 @@ export const MODELS = {
4881
5030
  cost: {
4882
5031
  input: 0.075,
4883
5032
  output: 0.3,
4884
- cacheRead: 0,
5033
+ cacheRead: 0.0375,
4885
5034
  cacheWrite: 0,
4886
5035
  },
4887
5036
  contextWindow: 131072,
@@ -5167,9 +5316,9 @@ export const MODELS = {
5167
5316
  reasoning: true,
5168
5317
  input: ["text"],
5169
5318
  cost: {
5170
- input: 1.74,
5171
- output: 3.48,
5172
- cacheRead: 0.145,
5319
+ input: 0.435,
5320
+ output: 0.87,
5321
+ cacheRead: 0.003625,
5173
5322
  cacheWrite: 0,
5174
5323
  },
5175
5324
  contextWindow: 1048576,
@@ -6262,7 +6411,7 @@ export const MODELS = {
6262
6411
  cost: {
6263
6412
  input: 0.1,
6264
6413
  output: 0.4,
6265
- cacheRead: 0.03,
6414
+ cacheRead: 0.025,
6266
6415
  cacheWrite: 0,
6267
6416
  },
6268
6417
  contextWindow: 1047576,
@@ -6347,7 +6496,7 @@ export const MODELS = {
6347
6496
  cost: {
6348
6497
  input: 0.15,
6349
6498
  output: 0.6,
6350
- cacheRead: 0.08,
6499
+ cacheRead: 0.075,
6351
6500
  cacheWrite: 0,
6352
6501
  },
6353
6502
  contextWindow: 128000,
@@ -6473,7 +6622,7 @@ export const MODELS = {
6473
6622
  cost: {
6474
6623
  input: 1.25,
6475
6624
  output: 10,
6476
- cacheRead: 0.13,
6625
+ cacheRead: 0.125,
6477
6626
  cacheWrite: 0,
6478
6627
  },
6479
6628
  contextWindow: 400000,
@@ -6774,7 +6923,7 @@ export const MODELS = {
6774
6923
  provider: "openai",
6775
6924
  baseUrl: "https://api.openai.com/v1",
6776
6925
  reasoning: true,
6777
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
6926
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
6778
6927
  input: ["text", "image"],
6779
6928
  cost: {
6780
6929
  input: 30,
@@ -6898,7 +7047,7 @@ export const MODELS = {
6898
7047
  cost: {
6899
7048
  input: 1.1,
6900
7049
  output: 4.4,
6901
- cacheRead: 0.28,
7050
+ cacheRead: 0.275,
6902
7051
  cacheWrite: 0,
6903
7052
  },
6904
7053
  contextWindow: 200000,
@@ -7048,7 +7197,7 @@ export const MODELS = {
7048
7197
  cacheWrite: 0,
7049
7198
  },
7050
7199
  contextWindow: 200000,
7051
- maxTokens: 128000,
7200
+ maxTokens: 32000,
7052
7201
  },
7053
7202
  "claude-haiku-4-5": {
7054
7203
  id: "claude-haiku-4-5",
@@ -7139,6 +7288,25 @@ export const MODELS = {
7139
7288
  contextWindow: 1000000,
7140
7289
  maxTokens: 128000,
7141
7290
  },
7291
+ "claude-opus-4-8": {
7292
+ id: "claude-opus-4-8",
7293
+ name: "Claude Opus 4.8",
7294
+ api: "anthropic-messages",
7295
+ provider: "opencode",
7296
+ baseUrl: "https://opencode.ai/zen",
7297
+ compat: { "forceAdaptiveThinking": true },
7298
+ reasoning: true,
7299
+ thinkingLevelMap: { "xhigh": "xhigh" },
7300
+ input: ["text", "image"],
7301
+ cost: {
7302
+ input: 5,
7303
+ output: 25,
7304
+ cacheRead: 0.5,
7305
+ cacheWrite: 6.25,
7306
+ },
7307
+ contextWindow: 1000000,
7308
+ maxTokens: 128000,
7309
+ },
7142
7310
  "claude-sonnet-4": {
7143
7311
  id: "claude-sonnet-4",
7144
7312
  name: "Claude Sonnet 4",
@@ -7191,6 +7359,25 @@ export const MODELS = {
7191
7359
  contextWindow: 1000000,
7192
7360
  maxTokens: 64000,
7193
7361
  },
7362
+ "deepseek-v4-flash": {
7363
+ id: "deepseek-v4-flash",
7364
+ name: "DeepSeek V4 Flash",
7365
+ api: "openai-completions",
7366
+ provider: "opencode",
7367
+ baseUrl: "https://opencode.ai/zen/v1",
7368
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7369
+ reasoning: true,
7370
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7371
+ input: ["text"],
7372
+ cost: {
7373
+ input: 0.14,
7374
+ output: 0.28,
7375
+ cacheRead: 0.03,
7376
+ cacheWrite: 0,
7377
+ },
7378
+ contextWindow: 1000000,
7379
+ maxTokens: 384000,
7380
+ },
7194
7381
  "deepseek-v4-flash-free": {
7195
7382
  id: "deepseek-v4-flash-free",
7196
7383
  name: "DeepSeek V4 Flash Free",
@@ -7575,7 +7762,7 @@ export const MODELS = {
7575
7762
  provider: "opencode",
7576
7763
  baseUrl: "https://opencode.ai/zen/v1",
7577
7764
  reasoning: true,
7578
- thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
7765
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh", "minimal": null, "low": null },
7579
7766
  input: ["text", "image"],
7580
7767
  cost: {
7581
7768
  input: 30,
@@ -7592,7 +7779,9 @@ export const MODELS = {
7592
7779
  api: "openai-completions",
7593
7780
  provider: "opencode",
7594
7781
  baseUrl: "https://opencode.ai/zen/v1",
7782
+ compat: { "supportsReasoningEffort": false },
7595
7783
  reasoning: true,
7784
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
7596
7785
  input: ["text", "image"],
7597
7786
  cost: {
7598
7787
  input: 1,
@@ -7626,6 +7815,7 @@ export const MODELS = {
7626
7815
  api: "openai-completions",
7627
7816
  provider: "opencode",
7628
7817
  baseUrl: "https://opencode.ai/zen/v1",
7818
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
7629
7819
  reasoning: true,
7630
7820
  input: ["text", "image"],
7631
7821
  cost: {
@@ -7637,6 +7827,23 @@ export const MODELS = {
7637
7827
  contextWindow: 262144,
7638
7828
  maxTokens: 65536,
7639
7829
  },
7830
+ "mimo-v2.5-free": {
7831
+ id: "mimo-v2.5-free",
7832
+ name: "MiMo V2.5 Free",
7833
+ api: "openai-completions",
7834
+ provider: "opencode",
7835
+ baseUrl: "https://opencode.ai/zen/v1",
7836
+ reasoning: true,
7837
+ input: ["text", "image"],
7838
+ cost: {
7839
+ input: 0,
7840
+ output: 0,
7841
+ cacheRead: 0,
7842
+ cacheWrite: 0,
7843
+ },
7844
+ contextWindow: 200000,
7845
+ maxTokens: 32000,
7846
+ },
7640
7847
  "minimax-m2.5": {
7641
7848
  id: "minimax-m2.5",
7642
7849
  name: "MiniMax M2.5",
@@ -7819,7 +8026,9 @@ export const MODELS = {
7819
8026
  api: "openai-completions",
7820
8027
  provider: "opencode-go",
7821
8028
  baseUrl: "https://opencode.ai/zen/go/v1",
8029
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
7822
8030
  reasoning: true,
8031
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
7823
8032
  input: ["text", "image"],
7824
8033
  cost: {
7825
8034
  input: 0.95,
@@ -7839,9 +8048,9 @@ export const MODELS = {
7839
8048
  reasoning: true,
7840
8049
  input: ["text", "image"],
7841
8050
  cost: {
7842
- input: 0.4,
7843
- output: 2,
7844
- cacheRead: 0.08,
8051
+ input: 0.14,
8052
+ output: 0.28,
8053
+ cacheRead: 0.0028,
7845
8054
  cacheWrite: 0,
7846
8055
  },
7847
8056
  contextWindow: 1000000,
@@ -7856,9 +8065,9 @@ export const MODELS = {
7856
8065
  reasoning: true,
7857
8066
  input: ["text"],
7858
8067
  cost: {
7859
- input: 1,
7860
- output: 3,
7861
- cacheRead: 0.2,
8068
+ input: 1.74,
8069
+ output: 3.48,
8070
+ cacheRead: 0.0145,
7862
8071
  cacheWrite: 0,
7863
8072
  },
7864
8073
  contextWindow: 1048576,
@@ -7898,24 +8107,6 @@ export const MODELS = {
7898
8107
  contextWindow: 204800,
7899
8108
  maxTokens: 131072,
7900
8109
  },
7901
- "qwen3.5-plus": {
7902
- id: "qwen3.5-plus",
7903
- name: "Qwen3.5 Plus",
7904
- api: "openai-completions",
7905
- provider: "opencode-go",
7906
- baseUrl: "https://opencode.ai/zen/go/v1",
7907
- compat: { "thinkingFormat": "qwen" },
7908
- reasoning: true,
7909
- input: ["text", "image"],
7910
- cost: {
7911
- input: 0.2,
7912
- output: 1.2,
7913
- cacheRead: 0.02,
7914
- cacheWrite: 0.25,
7915
- },
7916
- contextWindow: 262144,
7917
- maxTokens: 65536,
7918
- },
7919
8110
  "qwen3.6-plus": {
7920
8111
  id: "qwen3.6-plus",
7921
8112
  name: "Qwen3.6 Plus",
@@ -7934,6 +8125,23 @@ export const MODELS = {
7934
8125
  contextWindow: 262144,
7935
8126
  maxTokens: 65536,
7936
8127
  },
8128
+ "qwen3.7-max": {
8129
+ id: "qwen3.7-max",
8130
+ name: "Qwen3.7 Max",
8131
+ api: "anthropic-messages",
8132
+ provider: "opencode-go",
8133
+ baseUrl: "https://opencode.ai/zen/go",
8134
+ reasoning: true,
8135
+ input: ["text"],
8136
+ cost: {
8137
+ input: 2.5,
8138
+ output: 7.5,
8139
+ cacheRead: 0.5,
8140
+ cacheWrite: 3.125,
8141
+ },
8142
+ contextWindow: 1000000,
8143
+ maxTokens: 65536,
8144
+ },
7937
8145
  },
7938
8146
  "openrouter": {
7939
8147
  "ai21/jamba-large-1.7": {
@@ -7953,23 +8161,6 @@ export const MODELS = {
7953
8161
  contextWindow: 256000,
7954
8162
  maxTokens: 4096,
7955
8163
  },
7956
- "alibaba/tongyi-deepresearch-30b-a3b": {
7957
- id: "alibaba/tongyi-deepresearch-30b-a3b",
7958
- name: "Tongyi DeepResearch 30B A3B",
7959
- api: "openai-completions",
7960
- provider: "openrouter",
7961
- baseUrl: "https://openrouter.ai/api/v1",
7962
- reasoning: true,
7963
- input: ["text"],
7964
- cost: {
7965
- input: 0.09,
7966
- output: 0.44999999999999996,
7967
- cacheRead: 0.09,
7968
- cacheWrite: 0,
7969
- },
7970
- contextWindow: 131072,
7971
- maxTokens: 131072,
7972
- },
7973
8164
  "amazon/nova-2-lite-v1": {
7974
8165
  id: "amazon/nova-2-lite-v1",
7975
8166
  name: "Amazon: Nova 2 Lite",
@@ -8229,6 +8420,42 @@ export const MODELS = {
8229
8420
  contextWindow: 1000000,
8230
8421
  maxTokens: 128000,
8231
8422
  },
8423
+ "anthropic/claude-opus-4.8": {
8424
+ id: "anthropic/claude-opus-4.8",
8425
+ name: "Anthropic: Claude Opus 4.8",
8426
+ api: "openai-completions",
8427
+ provider: "openrouter",
8428
+ baseUrl: "https://openrouter.ai/api/v1",
8429
+ reasoning: true,
8430
+ thinkingLevelMap: { "xhigh": "xhigh" },
8431
+ input: ["text", "image"],
8432
+ cost: {
8433
+ input: 5,
8434
+ output: 25,
8435
+ cacheRead: 0.5,
8436
+ cacheWrite: 6.25,
8437
+ },
8438
+ contextWindow: 1000000,
8439
+ maxTokens: 128000,
8440
+ },
8441
+ "anthropic/claude-opus-4.8-fast": {
8442
+ id: "anthropic/claude-opus-4.8-fast",
8443
+ name: "Anthropic: Claude Opus 4.8 (Fast)",
8444
+ api: "openai-completions",
8445
+ provider: "openrouter",
8446
+ baseUrl: "https://openrouter.ai/api/v1",
8447
+ reasoning: true,
8448
+ thinkingLevelMap: { "xhigh": "xhigh" },
8449
+ input: ["text", "image"],
8450
+ cost: {
8451
+ input: 10,
8452
+ output: 50,
8453
+ cacheRead: 1,
8454
+ cacheWrite: 12.5,
8455
+ },
8456
+ contextWindow: 1000000,
8457
+ maxTokens: 128000,
8458
+ },
8232
8459
  "anthropic/claude-sonnet-4": {
8233
8460
  id: "anthropic/claude-sonnet-4",
8234
8461
  name: "Anthropic: Claude Sonnet 4",
@@ -8297,23 +8524,6 @@ export const MODELS = {
8297
8524
  contextWindow: 262144,
8298
8525
  maxTokens: 262144,
8299
8526
  },
8300
- "arcee-ai/trinity-large-thinking:free": {
8301
- id: "arcee-ai/trinity-large-thinking:free",
8302
- name: "Arcee AI: Trinity Large Thinking (free)",
8303
- api: "openai-completions",
8304
- provider: "openrouter",
8305
- baseUrl: "https://openrouter.ai/api/v1",
8306
- reasoning: true,
8307
- input: ["text"],
8308
- cost: {
8309
- input: 0,
8310
- output: 0,
8311
- cacheRead: 0,
8312
- cacheWrite: 0,
8313
- },
8314
- contextWindow: 262144,
8315
- maxTokens: 80000,
8316
- },
8317
8527
  "arcee-ai/trinity-mini": {
8318
8528
  id: "arcee-ai/trinity-mini",
8319
8529
  name: "Arcee AI: Trinity Mini",
@@ -8365,40 +8575,6 @@ export const MODELS = {
8365
8575
  contextWindow: 2000000,
8366
8576
  maxTokens: 30000,
8367
8577
  },
8368
- "baidu/cobuddy:free": {
8369
- id: "baidu/cobuddy:free",
8370
- name: "Baidu Qianfan: CoBuddy (free)",
8371
- api: "openai-completions",
8372
- provider: "openrouter",
8373
- baseUrl: "https://openrouter.ai/api/v1",
8374
- reasoning: true,
8375
- input: ["text"],
8376
- cost: {
8377
- input: 0,
8378
- output: 0,
8379
- cacheRead: 0,
8380
- cacheWrite: 0,
8381
- },
8382
- contextWindow: 131072,
8383
- maxTokens: 65536,
8384
- },
8385
- "baidu/ernie-4.5-21b-a3b": {
8386
- id: "baidu/ernie-4.5-21b-a3b",
8387
- name: "Baidu: ERNIE 4.5 21B A3B",
8388
- api: "openai-completions",
8389
- provider: "openrouter",
8390
- baseUrl: "https://openrouter.ai/api/v1",
8391
- reasoning: false,
8392
- input: ["text"],
8393
- cost: {
8394
- input: 0.07,
8395
- output: 0.28,
8396
- cacheRead: 0,
8397
- cacheWrite: 0,
8398
- },
8399
- contextWindow: 131072,
8400
- maxTokens: 8000,
8401
- },
8402
8578
  "baidu/ernie-4.5-vl-28b-a3b": {
8403
8579
  id: "baidu/ernie-4.5-vl-28b-a3b",
8404
8580
  name: "Baidu: ERNIE 4.5 VL 28B A3B",
@@ -8527,13 +8703,13 @@ export const MODELS = {
8527
8703
  reasoning: false,
8528
8704
  input: ["text"],
8529
8705
  cost: {
8530
- input: 0.32,
8531
- output: 0.8899999999999999,
8706
+ input: 0.2288,
8707
+ output: 0.9144,
8532
8708
  cacheRead: 0,
8533
8709
  cacheWrite: 0,
8534
8710
  },
8535
- contextWindow: 163840,
8536
- maxTokens: 16384,
8711
+ contextWindow: 131072,
8712
+ maxTokens: 16000,
8537
8713
  },
8538
8714
  "deepseek/deepseek-chat-v3-0324": {
8539
8715
  id: "deepseek/deepseek-chat-v3-0324",
@@ -8660,37 +8836,18 @@ export const MODELS = {
8660
8836
  api: "openai-completions",
8661
8837
  provider: "openrouter",
8662
8838
  baseUrl: "https://openrouter.ai/api/v1",
8663
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8664
- reasoning: true,
8665
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8666
- input: ["text"],
8667
- cost: {
8668
- input: 0.09999999999999999,
8669
- output: 0.19999999999999998,
8670
- cacheRead: 0.02,
8671
- cacheWrite: 0,
8672
- },
8673
- contextWindow: 1048576,
8674
- maxTokens: 16384,
8675
- },
8676
- "deepseek/deepseek-v4-flash:free": {
8677
- id: "deepseek/deepseek-v4-flash:free",
8678
- name: "DeepSeek: DeepSeek V4 Flash (free)",
8679
- api: "openai-completions",
8680
- provider: "openrouter",
8681
- baseUrl: "https://openrouter.ai/api/v1",
8682
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8839
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8683
8840
  reasoning: true,
8684
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8841
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8685
8842
  input: ["text"],
8686
8843
  cost: {
8687
- input: 0,
8688
- output: 0,
8689
- cacheRead: 0,
8844
+ input: 0.0983,
8845
+ output: 0.1966,
8846
+ cacheRead: 0.019700000000000002,
8690
8847
  cacheWrite: 0,
8691
8848
  },
8692
8849
  contextWindow: 1048576,
8693
- maxTokens: 384000,
8850
+ maxTokens: 131072,
8694
8851
  },
8695
8852
  "deepseek/deepseek-v4-pro": {
8696
8853
  id: "deepseek/deepseek-v4-pro",
@@ -8698,9 +8855,9 @@ export const MODELS = {
8698
8855
  api: "openai-completions",
8699
8856
  provider: "openrouter",
8700
8857
  baseUrl: "https://openrouter.ai/api/v1",
8701
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8858
+ compat: { "requiresReasoningContentOnAssistantMessages": true },
8702
8859
  reasoning: true,
8703
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8860
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8704
8861
  input: ["text"],
8705
8862
  cost: {
8706
8863
  input: 0.435,
@@ -8742,7 +8899,7 @@ export const MODELS = {
8742
8899
  cacheRead: 0.024999999999999998,
8743
8900
  cacheWrite: 0.08333333333333334,
8744
8901
  },
8745
- contextWindow: 1000000,
8902
+ contextWindow: 1048576,
8746
8903
  maxTokens: 8192,
8747
8904
  },
8748
8905
  "google/gemini-2.0-flash-lite-001": {
@@ -9146,9 +9303,9 @@ export const MODELS = {
9146
9303
  reasoning: true,
9147
9304
  input: ["text"],
9148
9305
  cost: {
9149
- input: 0.075,
9150
- output: 0.625,
9151
- cacheRead: 0.015,
9306
+ input: 0.3,
9307
+ output: 2.5,
9308
+ cacheRead: 0.06,
9152
9309
  cacheWrite: 0,
9153
9310
  },
9154
9311
  contextWindow: 262144,
@@ -9239,6 +9396,23 @@ export const MODELS = {
9239
9396
  contextWindow: 131072,
9240
9397
  maxTokens: 4096,
9241
9398
  },
9399
+ "meta-llama/llama-4-maverick": {
9400
+ id: "meta-llama/llama-4-maverick",
9401
+ name: "Meta: Llama 4 Maverick",
9402
+ api: "openai-completions",
9403
+ provider: "openrouter",
9404
+ baseUrl: "https://openrouter.ai/api/v1",
9405
+ reasoning: false,
9406
+ input: ["text", "image"],
9407
+ cost: {
9408
+ input: 0.15,
9409
+ output: 0.6,
9410
+ cacheRead: 0,
9411
+ cacheWrite: 0,
9412
+ },
9413
+ contextWindow: 1048576,
9414
+ maxTokens: 16384,
9415
+ },
9242
9416
  "meta-llama/llama-4-scout": {
9243
9417
  id: "meta-llama/llama-4-scout",
9244
9418
  name: "Meta: Llama 4 Scout",
@@ -9324,23 +9498,6 @@ export const MODELS = {
9324
9498
  contextWindow: 204800,
9325
9499
  maxTokens: 196608,
9326
9500
  },
9327
- "minimax/minimax-m2.5:free": {
9328
- id: "minimax/minimax-m2.5:free",
9329
- name: "MiniMax: MiniMax M2.5 (free)",
9330
- api: "openai-completions",
9331
- provider: "openrouter",
9332
- baseUrl: "https://openrouter.ai/api/v1",
9333
- reasoning: true,
9334
- input: ["text"],
9335
- cost: {
9336
- input: 0,
9337
- output: 0,
9338
- cacheRead: 0,
9339
- cacheWrite: 0,
9340
- },
9341
- contextWindow: 204800,
9342
- maxTokens: 8192,
9343
- },
9344
9501
  "minimax/minimax-m2.7": {
9345
9502
  id: "minimax/minimax-m2.7",
9346
9503
  name: "MiniMax: MiniMax M2.7",
@@ -9350,13 +9507,13 @@ export const MODELS = {
9350
9507
  reasoning: true,
9351
9508
  input: ["text"],
9352
9509
  cost: {
9353
- input: 0.27899999999999997,
9510
+ input: 0.26,
9354
9511
  output: 1.2,
9355
9512
  cacheRead: 0,
9356
9513
  cacheWrite: 0,
9357
9514
  },
9358
9515
  contextWindow: 204800,
9359
- maxTokens: 131072,
9516
+ maxTokens: 4096,
9360
9517
  },
9361
9518
  "mistralai/codestral-2508": {
9362
9519
  id: "mistralai/codestral-2508",
@@ -9392,40 +9549,6 @@ export const MODELS = {
9392
9549
  contextWindow: 262144,
9393
9550
  maxTokens: 4096,
9394
9551
  },
9395
- "mistralai/devstral-medium": {
9396
- id: "mistralai/devstral-medium",
9397
- name: "Mistral: Devstral Medium",
9398
- api: "openai-completions",
9399
- provider: "openrouter",
9400
- baseUrl: "https://openrouter.ai/api/v1",
9401
- reasoning: false,
9402
- input: ["text"],
9403
- cost: {
9404
- input: 0.39999999999999997,
9405
- output: 2,
9406
- cacheRead: 0.04,
9407
- cacheWrite: 0,
9408
- },
9409
- contextWindow: 131072,
9410
- maxTokens: 4096,
9411
- },
9412
- "mistralai/devstral-small": {
9413
- id: "mistralai/devstral-small",
9414
- name: "Mistral: Devstral Small 1.1",
9415
- api: "openai-completions",
9416
- provider: "openrouter",
9417
- baseUrl: "https://openrouter.ai/api/v1",
9418
- reasoning: false,
9419
- input: ["text"],
9420
- cost: {
9421
- input: 0.09999999999999999,
9422
- output: 0.3,
9423
- cacheRead: 0.01,
9424
- cacheWrite: 0,
9425
- },
9426
- contextWindow: 131072,
9427
- maxTokens: 4096,
9428
- },
9429
9552
  "mistralai/ministral-14b-2512": {
9430
9553
  id: "mistralai/ministral-14b-2512",
9431
9554
  name: "Mistral: Ministral 3 14B 2512",
@@ -9511,23 +9634,6 @@ export const MODELS = {
9511
9634
  contextWindow: 131072,
9512
9635
  maxTokens: 4096,
9513
9636
  },
9514
- "mistralai/mistral-large-2411": {
9515
- id: "mistralai/mistral-large-2411",
9516
- name: "Mistral Large 2411",
9517
- api: "openai-completions",
9518
- provider: "openrouter",
9519
- baseUrl: "https://openrouter.ai/api/v1",
9520
- reasoning: false,
9521
- input: ["text"],
9522
- cost: {
9523
- input: 2,
9524
- output: 6,
9525
- cacheRead: 0.19999999999999998,
9526
- cacheWrite: 0,
9527
- },
9528
- contextWindow: 131072,
9529
- maxTokens: 4096,
9530
- },
9531
9637
  "mistralai/mistral-large-2512": {
9532
9638
  id: "mistralai/mistral-large-2512",
9533
9639
  name: "Mistral: Mistral Large 3 2512",
@@ -9681,23 +9787,6 @@ export const MODELS = {
9681
9787
  contextWindow: 65536,
9682
9788
  maxTokens: 4096,
9683
9789
  },
9684
- "mistralai/pixtral-large-2411": {
9685
- id: "mistralai/pixtral-large-2411",
9686
- name: "Mistral: Pixtral Large 2411",
9687
- api: "openai-completions",
9688
- provider: "openrouter",
9689
- baseUrl: "https://openrouter.ai/api/v1",
9690
- reasoning: false,
9691
- input: ["text", "image"],
9692
- cost: {
9693
- input: 2,
9694
- output: 6,
9695
- cacheRead: 0.19999999999999998,
9696
- cacheWrite: 0,
9697
- },
9698
- contextWindow: 131072,
9699
- maxTokens: 4096,
9700
- },
9701
9790
  "mistralai/voxtral-small-24b-2507": {
9702
9791
  id: "mistralai/voxtral-small-24b-2507",
9703
9792
  name: "Mistral: Voxtral Small 24B 2507",
@@ -9789,16 +9878,35 @@ export const MODELS = {
9789
9878
  api: "openai-completions",
9790
9879
  provider: "openrouter",
9791
9880
  baseUrl: "https://openrouter.ai/api/v1",
9881
+ compat: { "supportsDeveloperRole": false },
9792
9882
  reasoning: true,
9793
9883
  input: ["text", "image"],
9794
9884
  cost: {
9795
- input: 0.73,
9796
- output: 3.49,
9797
- cacheRead: 0.25,
9885
+ input: 0.684,
9886
+ output: 3.42,
9887
+ cacheRead: 0.144,
9798
9888
  cacheWrite: 0,
9799
9889
  },
9800
9890
  contextWindow: 262144,
9801
- maxTokens: 262142,
9891
+ maxTokens: 262144,
9892
+ },
9893
+ "moonshotai/kimi-k2.6:free": {
9894
+ id: "moonshotai/kimi-k2.6:free",
9895
+ name: "MoonshotAI: Kimi K2.6 (free)",
9896
+ api: "openai-completions",
9897
+ provider: "openrouter",
9898
+ baseUrl: "https://openrouter.ai/api/v1",
9899
+ compat: { "supportsDeveloperRole": false },
9900
+ reasoning: true,
9901
+ input: ["text", "image"],
9902
+ cost: {
9903
+ input: 0,
9904
+ output: 0,
9905
+ cacheRead: 0,
9906
+ cacheWrite: 0,
9907
+ },
9908
+ contextWindow: 262144,
9909
+ maxTokens: 4096,
9802
9910
  },
9803
9911
  "nex-agi/deepseek-v3.1-nex-n1": {
9804
9912
  id: "nex-agi/deepseek-v3.1-nex-n1",
@@ -10210,33 +10318,16 @@ export const MODELS = {
10210
10318
  },
10211
10319
  "openai/gpt-4o-2024-11-20": {
10212
10320
  id: "openai/gpt-4o-2024-11-20",
10213
- name: "OpenAI: GPT-4o (2024-11-20)",
10214
- api: "openai-completions",
10215
- provider: "openrouter",
10216
- baseUrl: "https://openrouter.ai/api/v1",
10217
- reasoning: false,
10218
- input: ["text", "image"],
10219
- cost: {
10220
- input: 2.5,
10221
- output: 10,
10222
- cacheRead: 1.25,
10223
- cacheWrite: 0,
10224
- },
10225
- contextWindow: 128000,
10226
- maxTokens: 16384,
10227
- },
10228
- "openai/gpt-4o-audio-preview": {
10229
- id: "openai/gpt-4o-audio-preview",
10230
- name: "OpenAI: GPT-4o Audio",
10321
+ name: "OpenAI: GPT-4o (2024-11-20)",
10231
10322
  api: "openai-completions",
10232
10323
  provider: "openrouter",
10233
10324
  baseUrl: "https://openrouter.ai/api/v1",
10234
10325
  reasoning: false,
10235
- input: ["text"],
10326
+ input: ["text", "image"],
10236
10327
  cost: {
10237
10328
  input: 2.5,
10238
10329
  output: 10,
10239
- cacheRead: 0,
10330
+ cacheRead: 1.25,
10240
10331
  cacheWrite: 0,
10241
10332
  },
10242
10333
  contextWindow: 128000,
@@ -10389,11 +10480,11 @@ export const MODELS = {
10389
10480
  cost: {
10390
10481
  input: 1.25,
10391
10482
  output: 10,
10392
- cacheRead: 0.125,
10483
+ cacheRead: 0.13,
10393
10484
  cacheWrite: 0,
10394
10485
  },
10395
10486
  contextWindow: 128000,
10396
- maxTokens: 16384,
10487
+ maxTokens: 32000,
10397
10488
  },
10398
10489
  "openai/gpt-5.1-codex": {
10399
10490
  id: "openai/gpt-5.1-codex",
@@ -10406,7 +10497,7 @@ export const MODELS = {
10406
10497
  cost: {
10407
10498
  input: 1.25,
10408
10499
  output: 10,
10409
- cacheRead: 0.125,
10500
+ cacheRead: 0.13,
10410
10501
  cacheWrite: 0,
10411
10502
  },
10412
10503
  contextWindow: 400000,
@@ -10440,11 +10531,11 @@ export const MODELS = {
10440
10531
  cost: {
10441
10532
  input: 0.25,
10442
10533
  output: 2,
10443
- cacheRead: 0.03,
10534
+ cacheRead: 0.024999999999999998,
10444
10535
  cacheWrite: 0,
10445
10536
  },
10446
10537
  contextWindow: 400000,
10447
- maxTokens: 128000,
10538
+ maxTokens: 100000,
10448
10539
  },
10449
10540
  "openai/gpt-5.2": {
10450
10541
  id: "openai/gpt-5.2",
@@ -10480,7 +10571,7 @@ export const MODELS = {
10480
10571
  cacheWrite: 0,
10481
10572
  },
10482
10573
  contextWindow: 128000,
10483
- maxTokens: 32000,
10574
+ maxTokens: 16384,
10484
10575
  },
10485
10576
  "openai/gpt-5.2-codex": {
10486
10577
  id: "openai/gpt-5.2-codex",
@@ -10651,7 +10742,7 @@ export const MODELS = {
10651
10742
  provider: "openrouter",
10652
10743
  baseUrl: "https://openrouter.ai/api/v1",
10653
10744
  reasoning: true,
10654
- thinkingLevelMap: { "xhigh": "xhigh" },
10745
+ thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
10655
10746
  input: ["text", "image"],
10656
10747
  cost: {
10657
10748
  input: 30,
@@ -10756,13 +10847,13 @@ export const MODELS = {
10756
10847
  reasoning: true,
10757
10848
  input: ["text"],
10758
10849
  cost: {
10759
- input: 0.03,
10850
+ input: 0.029,
10760
10851
  output: 0.14,
10761
10852
  cacheRead: 0,
10762
10853
  cacheWrite: 0,
10763
10854
  },
10764
10855
  contextWindow: 131072,
10765
- maxTokens: 131072,
10856
+ maxTokens: 4096,
10766
10857
  },
10767
10858
  "openai/gpt-oss-20b:free": {
10768
10859
  id: "openai/gpt-oss-20b:free",
@@ -11016,8 +11107,8 @@ export const MODELS = {
11016
11107
  cacheRead: 0,
11017
11108
  cacheWrite: 0,
11018
11109
  },
11019
- contextWindow: 131072,
11020
- maxTokens: 8192,
11110
+ contextWindow: 262144,
11111
+ maxTokens: 32768,
11021
11112
  },
11022
11113
  "poolside/laguna-xs.2:free": {
11023
11114
  id: "poolside/laguna-xs.2:free",
@@ -11033,8 +11124,8 @@ export const MODELS = {
11033
11124
  cacheRead: 0,
11034
11125
  cacheWrite: 0,
11035
11126
  },
11036
- contextWindow: 131072,
11037
- maxTokens: 8192,
11127
+ contextWindow: 262144,
11128
+ maxTokens: 32768,
11038
11129
  },
11039
11130
  "prime-intellect/intellect-3": {
11040
11131
  id: "prime-intellect/intellect-3",
@@ -11070,23 +11161,6 @@ export const MODELS = {
11070
11161
  contextWindow: 131072,
11071
11162
  maxTokens: 16384,
11072
11163
  },
11073
- "qwen/qwen-2.5-7b-instruct": {
11074
- id: "qwen/qwen-2.5-7b-instruct",
11075
- name: "Qwen: Qwen2.5 7B Instruct",
11076
- api: "openai-completions",
11077
- provider: "openrouter",
11078
- baseUrl: "https://openrouter.ai/api/v1",
11079
- reasoning: false,
11080
- input: ["text"],
11081
- cost: {
11082
- input: 0.04,
11083
- output: 0.09999999999999999,
11084
- cacheRead: 0,
11085
- cacheWrite: 0,
11086
- },
11087
- contextWindow: 131072,
11088
- maxTokens: 32768,
11089
- },
11090
11164
  "qwen/qwen-plus": {
11091
11165
  id: "qwen/qwen-plus",
11092
11166
  name: "Qwen: Qwen-Plus",
@@ -11116,7 +11190,7 @@ export const MODELS = {
11116
11190
  input: 0.26,
11117
11191
  output: 0.78,
11118
11192
  cacheRead: 0,
11119
- cacheWrite: 0.325,
11193
+ cacheWrite: 0,
11120
11194
  },
11121
11195
  contextWindow: 1000000,
11122
11196
  maxTokens: 32768,
@@ -11198,13 +11272,13 @@ export const MODELS = {
11198
11272
  reasoning: true,
11199
11273
  input: ["text"],
11200
11274
  cost: {
11201
- input: 0.14950000000000002,
11202
- output: 1.495,
11203
- cacheRead: 0,
11275
+ input: 0.09999999999999999,
11276
+ output: 0.09999999999999999,
11277
+ cacheRead: 0.09999999999999999,
11204
11278
  cacheWrite: 0,
11205
11279
  },
11206
11280
  contextWindow: 262144,
11207
- maxTokens: 4096,
11281
+ maxTokens: 262144,
11208
11282
  },
11209
11283
  "qwen/qwen3-30b-a3b": {
11210
11284
  id: "qwen/qwen3-30b-a3b",
@@ -11640,13 +11714,13 @@ export const MODELS = {
11640
11714
  reasoning: true,
11641
11715
  input: ["text", "image"],
11642
11716
  cost: {
11643
- input: 0.13899999999999998,
11717
+ input: 0.14,
11644
11718
  output: 1,
11645
- cacheRead: 0,
11719
+ cacheRead: 0.049999999999999996,
11646
11720
  cacheWrite: 0,
11647
11721
  },
11648
11722
  contextWindow: 262144,
11649
- maxTokens: 4096,
11723
+ maxTokens: 262144,
11650
11724
  },
11651
11725
  "qwen/qwen3.5-397b-a17b": {
11652
11726
  id: "qwen/qwen3.5-397b-a17b",
@@ -11694,7 +11768,7 @@ export const MODELS = {
11694
11768
  input: 0.065,
11695
11769
  output: 0.26,
11696
11770
  cacheRead: 0,
11697
- cacheWrite: 0.08125,
11771
+ cacheWrite: 0,
11698
11772
  },
11699
11773
  contextWindow: 1000000,
11700
11774
  maxTokens: 65536,
@@ -11711,7 +11785,7 @@ export const MODELS = {
11711
11785
  input: 0.26,
11712
11786
  output: 1.56,
11713
11787
  cacheRead: 0,
11714
- cacheWrite: 0.325,
11788
+ cacheWrite: 0,
11715
11789
  },
11716
11790
  contextWindow: 1000000,
11717
11791
  maxTokens: 65536,
@@ -11728,7 +11802,7 @@ export const MODELS = {
11728
11802
  input: 0.3,
11729
11803
  output: 1.7999999999999998,
11730
11804
  cacheRead: 0,
11731
- cacheWrite: 0,
11805
+ cacheWrite: 0.375,
11732
11806
  },
11733
11807
  contextWindow: 1000000,
11734
11808
  maxTokens: 65536,
@@ -11742,13 +11816,13 @@ export const MODELS = {
11742
11816
  reasoning: true,
11743
11817
  input: ["text", "image"],
11744
11818
  cost: {
11745
- input: 0.3,
11819
+ input: 0.29,
11746
11820
  output: 3.1999999999999997,
11747
11821
  cacheRead: 0,
11748
11822
  cacheWrite: 0,
11749
11823
  },
11750
11824
  contextWindow: 262144,
11751
- maxTokens: 262144,
11825
+ maxTokens: 262140,
11752
11826
  },
11753
11827
  "qwen/qwen3.6-35b-a3b": {
11754
11828
  id: "qwen/qwen3.6-35b-a3b",
@@ -11759,7 +11833,7 @@ export const MODELS = {
11759
11833
  reasoning: true,
11760
11834
  input: ["text", "image"],
11761
11835
  cost: {
11762
- input: 0.15,
11836
+ input: 0.14,
11763
11837
  output: 1,
11764
11838
  cacheRead: 0,
11765
11839
  cacheWrite: 0,
@@ -11827,10 +11901,10 @@ export const MODELS = {
11827
11901
  reasoning: true,
11828
11902
  input: ["text"],
11829
11903
  cost: {
11830
- input: 2.5,
11831
- output: 7.5,
11832
- cacheRead: 0,
11833
- cacheWrite: 3.125,
11904
+ input: 1.25,
11905
+ output: 3.75,
11906
+ cacheRead: 0.25,
11907
+ cacheWrite: 1.5625,
11834
11908
  },
11835
11909
  contextWindow: 1000000,
11836
11910
  maxTokens: 65536,
@@ -11920,6 +11994,23 @@ export const MODELS = {
11920
11994
  contextWindow: 262144,
11921
11995
  maxTokens: 16384,
11922
11996
  },
11997
+ "stepfun/step-3.7-flash": {
11998
+ id: "stepfun/step-3.7-flash",
11999
+ name: "StepFun: Step 3.7 Flash",
12000
+ api: "openai-completions",
12001
+ provider: "openrouter",
12002
+ baseUrl: "https://openrouter.ai/api/v1",
12003
+ reasoning: true,
12004
+ input: ["text", "image"],
12005
+ cost: {
12006
+ input: 0.19999999999999998,
12007
+ output: 1.15,
12008
+ cacheRead: 0.04,
12009
+ cacheWrite: 0,
12010
+ },
12011
+ contextWindow: 256000,
12012
+ maxTokens: 256000,
12013
+ },
11923
12014
  "tencent/hy3-preview": {
11924
12015
  id: "tencent/hy3-preview",
11925
12016
  name: "Tencent: Hy3 preview",
@@ -11929,13 +12020,13 @@ export const MODELS = {
11929
12020
  reasoning: true,
11930
12021
  input: ["text"],
11931
12022
  cost: {
11932
- input: 0.06599999999999999,
11933
- output: 0.26,
11934
- cacheRead: 0.029,
12023
+ input: 0.063,
12024
+ output: 0.21,
12025
+ cacheRead: 0.020999999999999998,
11935
12026
  cacheWrite: 0,
11936
12027
  },
11937
12028
  contextWindow: 262144,
11938
- maxTokens: 262144,
12029
+ maxTokens: 4096,
11939
12030
  },
11940
12031
  "thedrummer/rocinante-12b": {
11941
12032
  id: "thedrummer/rocinante-12b",
@@ -12056,40 +12147,6 @@ export const MODELS = {
12056
12147
  contextWindow: 262144,
12057
12148
  maxTokens: 65536,
12058
12149
  },
12059
- "xiaomi/mimo-v2-omni": {
12060
- id: "xiaomi/mimo-v2-omni",
12061
- name: "Xiaomi: MiMo-V2-Omni",
12062
- api: "openai-completions",
12063
- provider: "openrouter",
12064
- baseUrl: "https://openrouter.ai/api/v1",
12065
- reasoning: true,
12066
- input: ["text", "image"],
12067
- cost: {
12068
- input: 0.39999999999999997,
12069
- output: 2,
12070
- cacheRead: 0.08,
12071
- cacheWrite: 0,
12072
- },
12073
- contextWindow: 262144,
12074
- maxTokens: 65536,
12075
- },
12076
- "xiaomi/mimo-v2-pro": {
12077
- id: "xiaomi/mimo-v2-pro",
12078
- name: "Xiaomi: MiMo-V2-Pro",
12079
- api: "openai-completions",
12080
- provider: "openrouter",
12081
- baseUrl: "https://openrouter.ai/api/v1",
12082
- reasoning: true,
12083
- input: ["text"],
12084
- cost: {
12085
- input: 1,
12086
- output: 3,
12087
- cacheRead: 0.19999999999999998,
12088
- cacheWrite: 0,
12089
- },
12090
- contextWindow: 1048576,
12091
- maxTokens: 131072,
12092
- },
12093
12150
  "xiaomi/mimo-v2.5": {
12094
12151
  id: "xiaomi/mimo-v2.5",
12095
12152
  name: "Xiaomi: MiMo-V2.5",
@@ -12099,9 +12156,9 @@ export const MODELS = {
12099
12156
  reasoning: true,
12100
12157
  input: ["text", "image"],
12101
12158
  cost: {
12102
- input: 0.39999999999999997,
12103
- output: 2,
12104
- cacheRead: 0.08,
12159
+ input: 0.14,
12160
+ output: 0.28,
12161
+ cacheRead: 0.0028,
12105
12162
  cacheWrite: 0,
12106
12163
  },
12107
12164
  contextWindow: 1048576,
@@ -12116,13 +12173,13 @@ export const MODELS = {
12116
12173
  reasoning: true,
12117
12174
  input: ["text"],
12118
12175
  cost: {
12119
- input: 1,
12120
- output: 3,
12121
- cacheRead: 0.19999999999999998,
12176
+ input: 0.435,
12177
+ output: 0.87,
12178
+ cacheRead: 0.0036,
12122
12179
  cacheWrite: 0,
12123
12180
  },
12124
12181
  contextWindow: 1048576,
12125
- maxTokens: 16384,
12182
+ maxTokens: 131072,
12126
12183
  },
12127
12184
  "z-ai/glm-4-32b": {
12128
12185
  id: "z-ai/glm-4-32b",
@@ -12167,13 +12224,13 @@ export const MODELS = {
12167
12224
  reasoning: true,
12168
12225
  input: ["text"],
12169
12226
  cost: {
12170
- input: 0.13,
12227
+ input: 0.125,
12171
12228
  output: 0.85,
12172
- cacheRead: 0.024999999999999998,
12229
+ cacheRead: 0.06,
12173
12230
  cacheWrite: 0,
12174
12231
  },
12175
12232
  contextWindow: 131072,
12176
- maxTokens: 98304,
12233
+ maxTokens: 131070,
12177
12234
  },
12178
12235
  "z-ai/glm-4.5-air:free": {
12179
12236
  id: "z-ai/glm-4.5-air:free",
@@ -12439,13 +12496,13 @@ export const MODELS = {
12439
12496
  reasoning: true,
12440
12497
  input: ["text", "image"],
12441
12498
  cost: {
12442
- input: 0.73,
12443
- output: 3.49,
12444
- cacheRead: 0.25,
12499
+ input: 0.684,
12500
+ output: 3.42,
12501
+ cacheRead: 0.144,
12445
12502
  cacheWrite: 0,
12446
12503
  },
12447
12504
  contextWindow: 262144,
12448
- maxTokens: 262142,
12505
+ maxTokens: 262144,
12449
12506
  },
12450
12507
  "~openai/gpt-latest": {
12451
12508
  id: "~openai/gpt-latest",
@@ -12843,20 +12900,20 @@ export const MODELS = {
12843
12900
  },
12844
12901
  "alibaba/qwen-3-235b": {
12845
12902
  id: "alibaba/qwen-3-235b",
12846
- name: "Qwen3 235B A22b Instruct 2507",
12903
+ name: "Qwen3 235B A22B",
12847
12904
  api: "anthropic-messages",
12848
12905
  provider: "vercel-ai-gateway",
12849
12906
  baseUrl: "https://ai-gateway.vercel.sh",
12850
12907
  reasoning: false,
12851
12908
  input: ["text"],
12852
12909
  cost: {
12853
- input: 0.6,
12854
- output: 1.2,
12855
- cacheRead: 0.6,
12910
+ input: 0.22,
12911
+ output: 0.88,
12912
+ cacheRead: 0,
12856
12913
  cacheWrite: 0,
12857
12914
  },
12858
- contextWindow: 131000,
12859
- maxTokens: 40000,
12915
+ contextWindow: 262144,
12916
+ maxTokens: 16384,
12860
12917
  },
12861
12918
  "alibaba/qwen-3-30b": {
12862
12919
  id: "alibaba/qwen-3-30b",
@@ -13287,6 +13344,25 @@ export const MODELS = {
13287
13344
  contextWindow: 1000000,
13288
13345
  maxTokens: 128000,
13289
13346
  },
13347
+ "anthropic/claude-opus-4.8": {
13348
+ id: "anthropic/claude-opus-4.8",
13349
+ name: "Claude Opus 4.8",
13350
+ api: "anthropic-messages",
13351
+ provider: "vercel-ai-gateway",
13352
+ baseUrl: "https://ai-gateway.vercel.sh",
13353
+ compat: { "forceAdaptiveThinking": true },
13354
+ reasoning: true,
13355
+ thinkingLevelMap: { "xhigh": "xhigh" },
13356
+ input: ["text", "image"],
13357
+ cost: {
13358
+ input: 5,
13359
+ output: 25,
13360
+ cacheRead: 0.5,
13361
+ cacheWrite: 6.25,
13362
+ },
13363
+ contextWindow: 1000000,
13364
+ maxTokens: 128000,
13365
+ },
13290
13366
  "anthropic/claude-sonnet-4": {
13291
13367
  id: "anthropic/claude-sonnet-4",
13292
13368
  name: "Claude Sonnet 4",
@@ -13433,17 +13509,17 @@ export const MODELS = {
13433
13509
  reasoning: false,
13434
13510
  input: ["text"],
13435
13511
  cost: {
13436
- input: 0.77,
13437
- output: 0.77,
13438
- cacheRead: 0,
13512
+ input: 0.27,
13513
+ output: 1.12,
13514
+ cacheRead: 0.135,
13439
13515
  cacheWrite: 0,
13440
13516
  },
13441
13517
  contextWindow: 163840,
13442
- maxTokens: 16384,
13518
+ maxTokens: 163840,
13443
13519
  },
13444
13520
  "deepseek/deepseek-v3.1": {
13445
13521
  id: "deepseek/deepseek-v3.1",
13446
- name: "DeepSeek-V3.1",
13522
+ name: "DeepSeek V3.1",
13447
13523
  api: "anthropic-messages",
13448
13524
  provider: "vercel-ai-gateway",
13449
13525
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -14887,7 +14963,7 @@ export const MODELS = {
14887
14963
  provider: "vercel-ai-gateway",
14888
14964
  baseUrl: "https://ai-gateway.vercel.sh",
14889
14965
  reasoning: true,
14890
- thinkingLevelMap: { "xhigh": "xhigh" },
14966
+ thinkingLevelMap: { "xhigh": "xhigh", "off": null, "minimal": null, "low": null },
14891
14967
  input: ["text", "image"],
14892
14968
  cost: {
14893
14969
  input: 30,
@@ -15068,6 +15144,23 @@ export const MODELS = {
15068
15144
  contextWindow: 200000,
15069
15145
  maxTokens: 8000,
15070
15146
  },
15147
+ "stepfun/step-3.7-flash": {
15148
+ id: "stepfun/step-3.7-flash",
15149
+ name: "Step 3.7 Flash",
15150
+ api: "anthropic-messages",
15151
+ provider: "vercel-ai-gateway",
15152
+ baseUrl: "https://ai-gateway.vercel.sh",
15153
+ reasoning: true,
15154
+ input: ["text", "image"],
15155
+ cost: {
15156
+ input: 0.19999999999999998,
15157
+ output: 1.15,
15158
+ cacheRead: 0.04,
15159
+ cacheWrite: 0,
15160
+ },
15161
+ contextWindow: 256000,
15162
+ maxTokens: 256000,
15163
+ },
15071
15164
  "xai/grok-4.1-fast-non-reasoning": {
15072
15165
  id: "xai/grok-4.1-fast-non-reasoning",
15073
15166
  name: "Grok 4.1 Fast Non-Reasoning",
@@ -15281,9 +15374,9 @@ export const MODELS = {
15281
15374
  reasoning: true,
15282
15375
  input: ["text", "image"],
15283
15376
  cost: {
15284
- input: 0.39999999999999997,
15285
- output: 2,
15286
- cacheRead: 0.08,
15377
+ input: 0.14,
15378
+ output: 0.28,
15379
+ cacheRead: 0.0028,
15287
15380
  cacheWrite: 0,
15288
15381
  },
15289
15382
  contextWindow: 1050000,
@@ -15298,9 +15391,9 @@ export const MODELS = {
15298
15391
  reasoning: true,
15299
15392
  input: ["text", "image"],
15300
15393
  cost: {
15301
- input: 1,
15302
- output: 3,
15303
- cacheRead: 0.19999999999999998,
15394
+ input: 0.435,
15395
+ output: 0.87,
15396
+ cacheRead: 0.0036,
15304
15397
  cacheWrite: 0,
15305
15398
  },
15306
15399
  contextWindow: 1050000,
@@ -15742,24 +15835,6 @@ export const MODELS = {
15742
15835
  },
15743
15836
  },
15744
15837
  "xiaomi-token-plan-ams": {
15745
- "mimo-v2-flash": {
15746
- id: "mimo-v2-flash",
15747
- name: "MiMo-V2-Flash",
15748
- api: "openai-completions",
15749
- provider: "xiaomi-token-plan-ams",
15750
- baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
15751
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15752
- reasoning: true,
15753
- input: ["text"],
15754
- cost: {
15755
- input: 0.1,
15756
- output: 0.3,
15757
- cacheRead: 0.01,
15758
- cacheWrite: 0,
15759
- },
15760
- contextWindow: 262144,
15761
- maxTokens: 65536,
15762
- },
15763
15838
  "mimo-v2-omni": {
15764
15839
  id: "mimo-v2-omni",
15765
15840
  name: "MiMo-V2-Omni",
@@ -15834,24 +15909,6 @@ export const MODELS = {
15834
15909
  },
15835
15910
  },
15836
15911
  "xiaomi-token-plan-cn": {
15837
- "mimo-v2-flash": {
15838
- id: "mimo-v2-flash",
15839
- name: "MiMo-V2-Flash",
15840
- api: "openai-completions",
15841
- provider: "xiaomi-token-plan-cn",
15842
- baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
15843
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15844
- reasoning: true,
15845
- input: ["text"],
15846
- cost: {
15847
- input: 0.1,
15848
- output: 0.3,
15849
- cacheRead: 0.01,
15850
- cacheWrite: 0,
15851
- },
15852
- contextWindow: 262144,
15853
- maxTokens: 65536,
15854
- },
15855
15912
  "mimo-v2-omni": {
15856
15913
  id: "mimo-v2-omni",
15857
15914
  name: "MiMo-V2-Omni",
@@ -15926,24 +15983,6 @@ export const MODELS = {
15926
15983
  },
15927
15984
  },
15928
15985
  "xiaomi-token-plan-sgp": {
15929
- "mimo-v2-flash": {
15930
- id: "mimo-v2-flash",
15931
- name: "MiMo-V2-Flash",
15932
- api: "openai-completions",
15933
- provider: "xiaomi-token-plan-sgp",
15934
- baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
15935
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
15936
- reasoning: true,
15937
- input: ["text"],
15938
- cost: {
15939
- input: 0.1,
15940
- output: 0.3,
15941
- cacheRead: 0.01,
15942
- cacheWrite: 0,
15943
- },
15944
- contextWindow: 262144,
15945
- maxTokens: 65536,
15946
- },
15947
15986
  "mimo-v2-omni": {
15948
15987
  id: "mimo-v2-omni",
15949
15988
  name: "MiMo-V2-Omni",