@earendil-works/pi-ai 0.78.0 → 0.79.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (37) hide show
  1. package/README.md +12 -4
  2. package/dist/env-api-keys.d.ts.map +1 -1
  3. package/dist/env-api-keys.js +3 -0
  4. package/dist/env-api-keys.js.map +1 -1
  5. package/dist/image-models.generated.d.ts +45 -0
  6. package/dist/image-models.generated.d.ts.map +1 -1
  7. package/dist/image-models.generated.js +45 -0
  8. package/dist/image-models.generated.js.map +1 -1
  9. package/dist/models.generated.d.ts +1365 -401
  10. package/dist/models.generated.d.ts.map +1 -1
  11. package/dist/models.generated.js +1331 -639
  12. package/dist/models.generated.js.map +1 -1
  13. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  14. package/dist/providers/amazon-bedrock.js +46 -19
  15. package/dist/providers/amazon-bedrock.js.map +1 -1
  16. package/dist/providers/anthropic.d.ts.map +1 -1
  17. package/dist/providers/anthropic.js +5 -4
  18. package/dist/providers/anthropic.js.map +1 -1
  19. package/dist/providers/openai-completions.d.ts.map +1 -1
  20. package/dist/providers/openai-completions.js +33 -12
  21. package/dist/providers/openai-completions.js.map +1 -1
  22. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  23. package/dist/providers/openai-responses-shared.js +2 -1
  24. package/dist/providers/openai-responses-shared.js.map +1 -1
  25. package/dist/providers/openai-responses.d.ts.map +1 -1
  26. package/dist/providers/openai-responses.js +1 -0
  27. package/dist/providers/openai-responses.js.map +1 -1
  28. package/dist/types.d.ts +12 -4
  29. package/dist/types.d.ts.map +1 -1
  30. package/dist/types.js.map +1 -1
  31. package/dist/utils/oauth/github-copilot.d.ts.map +1 -1
  32. package/dist/utils/oauth/github-copilot.js +13 -1
  33. package/dist/utils/oauth/github-copilot.js.map +1 -1
  34. package/dist/utils/oauth/openai-codex.d.ts.map +1 -1
  35. package/dist/utils/oauth/openai-codex.js +4 -2
  36. package/dist/utils/oauth/openai-codex.js.map +1 -1
  37. package/package.json +1 -1
@@ -391,8 +391,8 @@ export const MODELS = {
391
391
  thinkingLevelMap: { "xhigh": "max" },
392
392
  input: ["text", "image"],
393
393
  cost: {
394
- input: 5,
395
- output: 25,
394
+ input: 5.5,
395
+ output: 27.5,
396
396
  cacheRead: 0.5,
397
397
  cacheWrite: 6.25,
398
398
  },
@@ -409,10 +409,10 @@ export const MODELS = {
409
409
  thinkingLevelMap: { "xhigh": "xhigh" },
410
410
  input: ["text", "image"],
411
411
  cost: {
412
- input: 5,
413
- output: 25,
414
- cacheRead: 0.5,
415
- cacheWrite: 6.25,
412
+ input: 5.5,
413
+ output: 27.5,
414
+ cacheRead: 0.55,
415
+ cacheWrite: 6.875,
416
416
  },
417
417
  contextWindow: 1000000,
418
418
  maxTokens: 128000,
@@ -427,10 +427,10 @@ export const MODELS = {
427
427
  thinkingLevelMap: { "xhigh": "xhigh" },
428
428
  input: ["text", "image"],
429
429
  cost: {
430
- input: 5,
431
- output: 25,
432
- cacheRead: 0.5,
433
- cacheWrite: 6.25,
430
+ input: 5.5,
431
+ output: 27.5,
432
+ cacheRead: 0.55,
433
+ cacheWrite: 6.875,
434
434
  },
435
435
  contextWindow: 1000000,
436
436
  maxTokens: 128000,
@@ -444,10 +444,10 @@ export const MODELS = {
444
444
  reasoning: true,
445
445
  input: ["text", "image"],
446
446
  cost: {
447
- input: 3,
448
- output: 15,
449
- cacheRead: 0.3,
450
- cacheWrite: 3.75,
447
+ input: 3.3,
448
+ output: 16.5,
449
+ cacheRead: 0.33,
450
+ cacheWrite: 4.125,
451
451
  },
452
452
  contextWindow: 200000,
453
453
  maxTokens: 64000,
@@ -461,10 +461,10 @@ export const MODELS = {
461
461
  reasoning: true,
462
462
  input: ["text", "image"],
463
463
  cost: {
464
- input: 3,
465
- output: 15,
466
- cacheRead: 0.3,
467
- cacheWrite: 3.75,
464
+ input: 3.3,
465
+ output: 16.5,
466
+ cacheRead: 0.33,
467
+ cacheWrite: 4.125,
468
468
  },
469
469
  contextWindow: 1000000,
470
470
  maxTokens: 64000,
@@ -1086,6 +1086,59 @@ export const MODELS = {
1086
1086
  contextWindow: 262144,
1087
1087
  maxTokens: 131072,
1088
1088
  },
1089
+ "openai.gpt-5.4": {
1090
+ id: "openai.gpt-5.4",
1091
+ name: "GPT-5.4",
1092
+ api: "bedrock-converse-stream",
1093
+ provider: "amazon-bedrock",
1094
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1095
+ reasoning: true,
1096
+ thinkingLevelMap: { "xhigh": "xhigh" },
1097
+ input: ["text", "image"],
1098
+ cost: {
1099
+ input: 2.75,
1100
+ output: 16.5,
1101
+ cacheRead: 0.275,
1102
+ cacheWrite: 0,
1103
+ },
1104
+ contextWindow: 272000,
1105
+ maxTokens: 128000,
1106
+ },
1107
+ "openai.gpt-5.5": {
1108
+ id: "openai.gpt-5.5",
1109
+ name: "GPT-5.5",
1110
+ api: "bedrock-converse-stream",
1111
+ provider: "amazon-bedrock",
1112
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1113
+ reasoning: true,
1114
+ thinkingLevelMap: { "xhigh": "xhigh" },
1115
+ input: ["text", "image"],
1116
+ cost: {
1117
+ input: 5.5,
1118
+ output: 33,
1119
+ cacheRead: 0.55,
1120
+ cacheWrite: 0,
1121
+ },
1122
+ contextWindow: 272000,
1123
+ maxTokens: 128000,
1124
+ },
1125
+ "openai.gpt-oss-120b": {
1126
+ id: "openai.gpt-oss-120b",
1127
+ name: "gpt-oss-120b",
1128
+ api: "bedrock-converse-stream",
1129
+ provider: "amazon-bedrock",
1130
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1131
+ reasoning: false,
1132
+ input: ["text"],
1133
+ cost: {
1134
+ input: 0.15,
1135
+ output: 0.6,
1136
+ cacheRead: 0,
1137
+ cacheWrite: 0,
1138
+ },
1139
+ contextWindow: 128000,
1140
+ maxTokens: 16384,
1141
+ },
1089
1142
  "openai.gpt-oss-120b-1:0": {
1090
1143
  id: "openai.gpt-oss-120b-1:0",
1091
1144
  name: "gpt-oss-120b",
@@ -1103,6 +1156,23 @@ export const MODELS = {
1103
1156
  contextWindow: 128000,
1104
1157
  maxTokens: 16384,
1105
1158
  },
1159
+ "openai.gpt-oss-20b": {
1160
+ id: "openai.gpt-oss-20b",
1161
+ name: "gpt-oss-20b",
1162
+ api: "bedrock-converse-stream",
1163
+ provider: "amazon-bedrock",
1164
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1165
+ reasoning: false,
1166
+ input: ["text"],
1167
+ cost: {
1168
+ input: 0.07,
1169
+ output: 0.3,
1170
+ cacheRead: 0,
1171
+ cacheWrite: 0,
1172
+ },
1173
+ contextWindow: 128000,
1174
+ maxTokens: 16384,
1175
+ },
1106
1176
  "openai.gpt-oss-20b-1:0": {
1107
1177
  id: "openai.gpt-oss-20b-1:0",
1108
1178
  name: "gpt-oss-20b",
@@ -1549,6 +1619,63 @@ export const MODELS = {
1549
1619
  maxTokens: 101376,
1550
1620
  },
1551
1621
  },
1622
+ "ant-ling": {
1623
+ "Ling-2.6-1T": {
1624
+ id: "Ling-2.6-1T",
1625
+ name: "Ling 2.6 1T",
1626
+ api: "openai-completions",
1627
+ provider: "ant-ling",
1628
+ baseUrl: "https://api.ant-ling.com/v1",
1629
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
1630
+ reasoning: false,
1631
+ input: ["text"],
1632
+ cost: {
1633
+ input: 0.06,
1634
+ output: 0.25,
1635
+ cacheRead: 0,
1636
+ cacheWrite: 0,
1637
+ },
1638
+ contextWindow: 262144,
1639
+ maxTokens: 65536,
1640
+ },
1641
+ "Ling-2.6-flash": {
1642
+ id: "Ling-2.6-flash",
1643
+ name: "Ling 2.6 Flash",
1644
+ api: "openai-completions",
1645
+ provider: "ant-ling",
1646
+ baseUrl: "https://api.ant-ling.com/v1",
1647
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
1648
+ reasoning: false,
1649
+ input: ["text"],
1650
+ cost: {
1651
+ input: 0.01,
1652
+ output: 0.02,
1653
+ cacheRead: 0,
1654
+ cacheWrite: 0,
1655
+ },
1656
+ contextWindow: 262144,
1657
+ maxTokens: 65536,
1658
+ },
1659
+ "Ring-2.6-1T": {
1660
+ id: "Ring-2.6-1T",
1661
+ name: "Ring 2.6 1T",
1662
+ api: "openai-completions",
1663
+ provider: "ant-ling",
1664
+ baseUrl: "https://api.ant-ling.com/v1",
1665
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "thinkingFormat": "ant-ling" },
1666
+ reasoning: true,
1667
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
1668
+ input: ["text"],
1669
+ cost: {
1670
+ input: 0.06,
1671
+ output: 0.25,
1672
+ cacheRead: 0,
1673
+ cacheWrite: 0,
1674
+ },
1675
+ contextWindow: 262144,
1676
+ maxTokens: 65536,
1677
+ },
1678
+ },
1552
1679
  "anthropic": {
1553
1680
  "claude-3-5-haiku-20241022": {
1554
1681
  id: "claude-3-5-haiku-20241022",
@@ -1847,7 +1974,7 @@ export const MODELS = {
1847
1974
  api: "anthropic-messages",
1848
1975
  provider: "anthropic",
1849
1976
  baseUrl: "https://api.anthropic.com",
1850
- compat: { "forceAdaptiveThinking": true },
1977
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1851
1978
  reasoning: true,
1852
1979
  thinkingLevelMap: { "xhigh": "xhigh" },
1853
1980
  input: ["text", "image"],
@@ -1866,7 +1993,7 @@ export const MODELS = {
1866
1993
  api: "anthropic-messages",
1867
1994
  provider: "anthropic",
1868
1995
  baseUrl: "https://api.anthropic.com",
1869
- compat: { "forceAdaptiveThinking": true },
1996
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1870
1997
  reasoning: true,
1871
1998
  thinkingLevelMap: { "xhigh": "xhigh" },
1872
1999
  input: ["text", "image"],
@@ -2955,7 +3082,26 @@ export const MODELS = {
2955
3082
  api: "anthropic-messages",
2956
3083
  provider: "cloudflare-ai-gateway",
2957
3084
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2958
- compat: { "forceAdaptiveThinking": true },
3085
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3086
+ reasoning: true,
3087
+ thinkingLevelMap: { "xhigh": "xhigh" },
3088
+ input: ["text", "image"],
3089
+ cost: {
3090
+ input: 5,
3091
+ output: 25,
3092
+ cacheRead: 0.5,
3093
+ cacheWrite: 6.25,
3094
+ },
3095
+ contextWindow: 1000000,
3096
+ maxTokens: 128000,
3097
+ },
3098
+ "claude-opus-4-8": {
3099
+ id: "claude-opus-4-8",
3100
+ name: "Claude Opus 4.8",
3101
+ api: "anthropic-messages",
3102
+ provider: "cloudflare-ai-gateway",
3103
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3104
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
2959
3105
  reasoning: true,
2960
3106
  thinkingLevelMap: { "xhigh": "xhigh" },
2961
3107
  input: ["text", "image"],
@@ -3463,24 +3609,6 @@ export const MODELS = {
3463
3609
  contextWindow: 128000,
3464
3610
  maxTokens: 128000,
3465
3611
  },
3466
- "@cf/moonshotai/kimi-k2.5": {
3467
- id: "@cf/moonshotai/kimi-k2.5",
3468
- name: "Kimi K2.5",
3469
- api: "openai-completions",
3470
- provider: "cloudflare-workers-ai",
3471
- baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3472
- compat: { "sendSessionAffinityHeaders": true },
3473
- reasoning: true,
3474
- input: ["text", "image"],
3475
- cost: {
3476
- input: 0.6,
3477
- output: 3,
3478
- cacheRead: 0.1,
3479
- cacheWrite: 0,
3480
- },
3481
- contextWindow: 256000,
3482
- maxTokens: 256000,
3483
- },
3484
3612
  "@cf/moonshotai/kimi-k2.6": {
3485
3613
  id: "@cf/moonshotai/kimi-k2.6",
3486
3614
  name: "Kimi K2.6",
@@ -3808,8 +3936,8 @@ export const MODELS = {
3808
3936
  cacheRead: 0.1,
3809
3937
  cacheWrite: 0,
3810
3938
  },
3811
- contextWindow: 128000,
3812
- maxTokens: 8192,
3939
+ contextWindow: 262144,
3940
+ maxTokens: 65536,
3813
3941
  },
3814
3942
  "accounts/fireworks/routers/glm-5p1-fast": {
3815
3943
  id: "accounts/fireworks/routers/glm-5p1-fast",
@@ -3829,6 +3957,24 @@ export const MODELS = {
3829
3957
  contextWindow: 202800,
3830
3958
  maxTokens: 131072,
3831
3959
  },
3960
+ "accounts/fireworks/routers/kimi-k2p6-fast": {
3961
+ id: "accounts/fireworks/routers/kimi-k2p6-fast",
3962
+ name: "Kimi K2.6 Fast",
3963
+ api: "anthropic-messages",
3964
+ provider: "fireworks",
3965
+ baseUrl: "https://api.fireworks.ai/inference",
3966
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3967
+ reasoning: true,
3968
+ input: ["text", "image"],
3969
+ cost: {
3970
+ input: 2,
3971
+ output: 8,
3972
+ cacheRead: 0.3,
3973
+ cacheWrite: 0,
3974
+ },
3975
+ contextWindow: 262000,
3976
+ maxTokens: 262000,
3977
+ },
3832
3978
  "accounts/fireworks/routers/kimi-k2p6-turbo": {
3833
3979
  id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3834
3980
  name: "Kimi K2.6 Turbo",
@@ -3851,7 +3997,7 @@ export const MODELS = {
3851
3997
  "github-copilot": {
3852
3998
  "claude-haiku-4.5": {
3853
3999
  id: "claude-haiku-4.5",
3854
- name: "Claude Haiku 4.5",
4000
+ name: "Claude Haiku 4.5 (latest)",
3855
4001
  api: "anthropic-messages",
3856
4002
  provider: "github-copilot",
3857
4003
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3860,17 +4006,17 @@ export const MODELS = {
3860
4006
  reasoning: true,
3861
4007
  input: ["text", "image"],
3862
4008
  cost: {
3863
- input: 0,
3864
- output: 0,
3865
- cacheRead: 0,
3866
- cacheWrite: 0,
4009
+ input: 1,
4010
+ output: 5,
4011
+ cacheRead: 0.1,
4012
+ cacheWrite: 1.25,
3867
4013
  },
3868
4014
  contextWindow: 200000,
3869
4015
  maxTokens: 64000,
3870
4016
  },
3871
4017
  "claude-opus-4.5": {
3872
4018
  id: "claude-opus-4.5",
3873
- name: "Claude Opus 4.5",
4019
+ name: "Claude Opus 4.5 (latest)",
3874
4020
  api: "anthropic-messages",
3875
4021
  provider: "github-copilot",
3876
4022
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3878,10 +4024,10 @@ export const MODELS = {
3878
4024
  reasoning: true,
3879
4025
  input: ["text", "image"],
3880
4026
  cost: {
3881
- input: 0,
3882
- output: 0,
3883
- cacheRead: 0,
3884
- cacheWrite: 0,
4027
+ input: 5,
4028
+ output: 25,
4029
+ cacheRead: 0.5,
4030
+ cacheWrite: 6.25,
3885
4031
  },
3886
4032
  contextWindow: 200000,
3887
4033
  maxTokens: 32000,
@@ -3898,10 +4044,10 @@ export const MODELS = {
3898
4044
  thinkingLevelMap: { "xhigh": "max" },
3899
4045
  input: ["text", "image"],
3900
4046
  cost: {
3901
- input: 0,
3902
- output: 0,
3903
- cacheRead: 0,
3904
- cacheWrite: 0,
4047
+ input: 5,
4048
+ output: 25,
4049
+ cacheRead: 0.5,
4050
+ cacheWrite: 6.25,
3905
4051
  },
3906
4052
  contextWindow: 1000000,
3907
4053
  maxTokens: 32000,
@@ -3913,15 +4059,15 @@ export const MODELS = {
3913
4059
  provider: "github-copilot",
3914
4060
  baseUrl: "https://api.individual.githubcopilot.com",
3915
4061
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3916
- compat: { "forceAdaptiveThinking": true },
4062
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3917
4063
  reasoning: true,
3918
4064
  thinkingLevelMap: { "xhigh": "xhigh" },
3919
4065
  input: ["text", "image"],
3920
4066
  cost: {
3921
- input: 0,
3922
- output: 0,
3923
- cacheRead: 0,
3924
- cacheWrite: 0,
4067
+ input: 5,
4068
+ output: 25,
4069
+ cacheRead: 0.5,
4070
+ cacheWrite: 6.25,
3925
4071
  },
3926
4072
  contextWindow: 200000,
3927
4073
  maxTokens: 32000,
@@ -3933,22 +4079,41 @@ export const MODELS = {
3933
4079
  provider: "github-copilot",
3934
4080
  baseUrl: "https://api.individual.githubcopilot.com",
3935
4081
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3936
- compat: { "forceAdaptiveThinking": true },
4082
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3937
4083
  reasoning: true,
3938
4084
  thinkingLevelMap: { "xhigh": "xhigh" },
3939
4085
  input: ["text", "image"],
3940
4086
  cost: {
3941
- input: 0,
3942
- output: 0,
3943
- cacheRead: 0,
3944
- cacheWrite: 0,
4087
+ input: 5,
4088
+ output: 25,
4089
+ cacheRead: 0.5,
4090
+ cacheWrite: 6.25,
3945
4091
  },
3946
4092
  contextWindow: 200000,
3947
4093
  maxTokens: 64000,
3948
4094
  },
4095
+ "claude-sonnet-4": {
4096
+ id: "claude-sonnet-4",
4097
+ name: "Claude Sonnet 4 (latest)",
4098
+ api: "anthropic-messages",
4099
+ provider: "github-copilot",
4100
+ baseUrl: "https://api.individual.githubcopilot.com",
4101
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4102
+ compat: { "supportsEagerToolInputStreaming": false },
4103
+ reasoning: true,
4104
+ input: ["text", "image"],
4105
+ cost: {
4106
+ input: 3,
4107
+ output: 15,
4108
+ cacheRead: 0.3,
4109
+ cacheWrite: 3.75,
4110
+ },
4111
+ contextWindow: 216000,
4112
+ maxTokens: 16000,
4113
+ },
3949
4114
  "claude-sonnet-4.5": {
3950
4115
  id: "claude-sonnet-4.5",
3951
- name: "Claude Sonnet 4.5",
4116
+ name: "Claude Sonnet 4.5 (latest)",
3952
4117
  api: "anthropic-messages",
3953
4118
  provider: "github-copilot",
3954
4119
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3957,10 +4122,10 @@ export const MODELS = {
3957
4122
  reasoning: true,
3958
4123
  input: ["text", "image"],
3959
4124
  cost: {
3960
- input: 0,
3961
- output: 0,
3962
- cacheRead: 0,
3963
- cacheWrite: 0,
4125
+ input: 3,
4126
+ output: 15,
4127
+ cacheRead: 0.3,
4128
+ cacheWrite: 3.75,
3964
4129
  },
3965
4130
  contextWindow: 200000,
3966
4131
  maxTokens: 32000,
@@ -3976,10 +4141,10 @@ export const MODELS = {
3976
4141
  reasoning: true,
3977
4142
  input: ["text", "image"],
3978
4143
  cost: {
3979
- input: 0,
3980
- output: 0,
3981
- cacheRead: 0,
3982
- cacheWrite: 0,
4144
+ input: 3,
4145
+ output: 15,
4146
+ cacheRead: 0.3,
4147
+ cacheWrite: 3.75,
3983
4148
  },
3984
4149
  contextWindow: 1000000,
3985
4150
  maxTokens: 32000,
@@ -3992,12 +4157,12 @@ export const MODELS = {
3992
4157
  baseUrl: "https://api.individual.githubcopilot.com",
3993
4158
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3994
4159
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3995
- reasoning: false,
4160
+ reasoning: true,
3996
4161
  input: ["text", "image"],
3997
4162
  cost: {
3998
- input: 0,
3999
- output: 0,
4000
- cacheRead: 0,
4163
+ input: 1.25,
4164
+ output: 10,
4165
+ cacheRead: 0.125,
4001
4166
  cacheWrite: 0,
4002
4167
  },
4003
4168
  contextWindow: 128000,
@@ -4005,7 +4170,7 @@ export const MODELS = {
4005
4170
  },
4006
4171
  "gemini-3-flash-preview": {
4007
4172
  id: "gemini-3-flash-preview",
4008
- name: "Gemini 3 Flash",
4173
+ name: "Gemini 3 Flash Preview",
4009
4174
  api: "openai-completions",
4010
4175
  provider: "github-copilot",
4011
4176
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4014,9 +4179,9 @@ export const MODELS = {
4014
4179
  reasoning: true,
4015
4180
  input: ["text", "image"],
4016
4181
  cost: {
4017
- input: 0,
4018
- output: 0,
4019
- cacheRead: 0,
4182
+ input: 0.5,
4183
+ output: 3,
4184
+ cacheRead: 0.05,
4020
4185
  cacheWrite: 0,
4021
4186
  },
4022
4187
  contextWindow: 128000,
@@ -4033,9 +4198,9 @@ export const MODELS = {
4033
4198
  reasoning: true,
4034
4199
  input: ["text", "image"],
4035
4200
  cost: {
4036
- input: 0,
4037
- output: 0,
4038
- cacheRead: 0,
4201
+ input: 2,
4202
+ output: 12,
4203
+ cacheRead: 0.2,
4039
4204
  cacheWrite: 0,
4040
4205
  },
4041
4206
  contextWindow: 200000,
@@ -4052,9 +4217,9 @@ export const MODELS = {
4052
4217
  reasoning: true,
4053
4218
  input: ["text", "image"],
4054
4219
  cost: {
4055
- input: 0,
4056
- output: 0,
4057
- cacheRead: 0,
4220
+ input: 1.5,
4221
+ output: 9,
4222
+ cacheRead: 0.15,
4058
4223
  cacheWrite: 0,
4059
4224
  },
4060
4225
  contextWindow: 200000,
@@ -4071,36 +4236,17 @@ export const MODELS = {
4071
4236
  reasoning: false,
4072
4237
  input: ["text", "image"],
4073
4238
  cost: {
4074
- input: 0,
4075
- output: 0,
4076
- cacheRead: 0,
4239
+ input: 2,
4240
+ output: 8,
4241
+ cacheRead: 0.5,
4077
4242
  cacheWrite: 0,
4078
4243
  },
4079
4244
  contextWindow: 128000,
4080
4245
  maxTokens: 16384,
4081
4246
  },
4082
- "gpt-4o": {
4083
- id: "gpt-4o",
4084
- name: "GPT-4o",
4085
- api: "openai-completions",
4086
- provider: "github-copilot",
4087
- baseUrl: "https://api.individual.githubcopilot.com",
4088
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4089
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4090
- reasoning: false,
4091
- input: ["text", "image"],
4092
- cost: {
4093
- input: 0,
4094
- output: 0,
4095
- cacheRead: 0,
4096
- cacheWrite: 0,
4097
- },
4098
- contextWindow: 128000,
4099
- maxTokens: 4096,
4100
- },
4101
4247
  "gpt-5-mini": {
4102
4248
  id: "gpt-5-mini",
4103
- name: "GPT-5-mini",
4249
+ name: "GPT-5 Mini",
4104
4250
  api: "openai-responses",
4105
4251
  provider: "github-copilot",
4106
4252
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4109,9 +4255,9 @@ export const MODELS = {
4109
4255
  thinkingLevelMap: { "off": null, "minimal": "low" },
4110
4256
  input: ["text", "image"],
4111
4257
  cost: {
4112
- input: 0,
4113
- output: 0,
4114
- cacheRead: 0,
4258
+ input: 0.25,
4259
+ output: 2,
4260
+ cacheRead: 0.025,
4115
4261
  cacheWrite: 0,
4116
4262
  },
4117
4263
  contextWindow: 264000,
@@ -4128,9 +4274,9 @@ export const MODELS = {
4128
4274
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4129
4275
  input: ["text", "image"],
4130
4276
  cost: {
4131
- input: 0,
4132
- output: 0,
4133
- cacheRead: 0,
4277
+ input: 1.75,
4278
+ output: 14,
4279
+ cacheRead: 0.175,
4134
4280
  cacheWrite: 0,
4135
4281
  },
4136
4282
  contextWindow: 400000,
@@ -4138,7 +4284,7 @@ export const MODELS = {
4138
4284
  },
4139
4285
  "gpt-5.2-codex": {
4140
4286
  id: "gpt-5.2-codex",
4141
- name: "GPT-5.2-Codex",
4287
+ name: "GPT-5.2 Codex",
4142
4288
  api: "openai-responses",
4143
4289
  provider: "github-copilot",
4144
4290
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4147,9 +4293,9 @@ export const MODELS = {
4147
4293
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4148
4294
  input: ["text", "image"],
4149
4295
  cost: {
4150
- input: 0,
4151
- output: 0,
4152
- cacheRead: 0,
4296
+ input: 1.75,
4297
+ output: 14,
4298
+ cacheRead: 0.175,
4153
4299
  cacheWrite: 0,
4154
4300
  },
4155
4301
  contextWindow: 400000,
@@ -4157,7 +4303,7 @@ export const MODELS = {
4157
4303
  },
4158
4304
  "gpt-5.3-codex": {
4159
4305
  id: "gpt-5.3-codex",
4160
- name: "GPT-5.3-Codex",
4306
+ name: "GPT-5.3 Codex",
4161
4307
  api: "openai-responses",
4162
4308
  provider: "github-copilot",
4163
4309
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4166,9 +4312,9 @@ export const MODELS = {
4166
4312
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4167
4313
  input: ["text", "image"],
4168
4314
  cost: {
4169
- input: 0,
4170
- output: 0,
4171
- cacheRead: 0,
4315
+ input: 1.75,
4316
+ output: 14,
4317
+ cacheRead: 0.175,
4172
4318
  cacheWrite: 0,
4173
4319
  },
4174
4320
  contextWindow: 400000,
@@ -4185,9 +4331,9 @@ export const MODELS = {
4185
4331
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4186
4332
  input: ["text", "image"],
4187
4333
  cost: {
4188
- input: 0,
4189
- output: 0,
4190
- cacheRead: 0,
4334
+ input: 2.5,
4335
+ output: 15,
4336
+ cacheRead: 0.25,
4191
4337
  cacheWrite: 0,
4192
4338
  },
4193
4339
  contextWindow: 400000,
@@ -4195,7 +4341,7 @@ export const MODELS = {
4195
4341
  },
4196
4342
  "gpt-5.4-mini": {
4197
4343
  id: "gpt-5.4-mini",
4198
- name: "GPT-5.4 Mini",
4344
+ name: "GPT-5.4 mini",
4199
4345
  api: "openai-responses",
4200
4346
  provider: "github-copilot",
4201
4347
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4204,9 +4350,28 @@ export const MODELS = {
4204
4350
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4205
4351
  input: ["text", "image"],
4206
4352
  cost: {
4207
- input: 0,
4208
- output: 0,
4209
- cacheRead: 0,
4353
+ input: 0.75,
4354
+ output: 4.5,
4355
+ cacheRead: 0.075,
4356
+ cacheWrite: 0,
4357
+ },
4358
+ contextWindow: 400000,
4359
+ maxTokens: 128000,
4360
+ },
4361
+ "gpt-5.4-nano": {
4362
+ id: "gpt-5.4-nano",
4363
+ name: "GPT-5.4 nano",
4364
+ api: "openai-responses",
4365
+ provider: "github-copilot",
4366
+ baseUrl: "https://api.individual.githubcopilot.com",
4367
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4368
+ reasoning: true,
4369
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4370
+ input: ["text", "image"],
4371
+ cost: {
4372
+ input: 0.2,
4373
+ output: 1.25,
4374
+ cacheRead: 0.02,
4210
4375
  cacheWrite: 0,
4211
4376
  },
4212
4377
  contextWindow: 400000,
@@ -4223,32 +4388,32 @@ export const MODELS = {
4223
4388
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4224
4389
  input: ["text", "image"],
4225
4390
  cost: {
4226
- input: 0,
4227
- output: 0,
4228
- cacheRead: 0,
4391
+ input: 5,
4392
+ output: 30,
4393
+ cacheRead: 0.5,
4229
4394
  cacheWrite: 0,
4230
4395
  },
4231
4396
  contextWindow: 400000,
4232
4397
  maxTokens: 128000,
4233
4398
  },
4234
- "grok-code-fast-1": {
4235
- id: "grok-code-fast-1",
4236
- name: "Grok Code Fast 1",
4399
+ "raptor-mini": {
4400
+ id: "raptor-mini",
4401
+ name: "Raptor mini",
4237
4402
  api: "openai-completions",
4238
4403
  provider: "github-copilot",
4239
4404
  baseUrl: "https://api.individual.githubcopilot.com",
4240
4405
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4241
4406
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4242
4407
  reasoning: true,
4243
- input: ["text"],
4408
+ input: ["text", "image"],
4244
4409
  cost: {
4245
- input: 0,
4246
- output: 0,
4247
- cacheRead: 0,
4410
+ input: 0.25,
4411
+ output: 2,
4412
+ cacheRead: 0.025,
4248
4413
  cacheWrite: 0,
4249
4414
  },
4250
- contextWindow: 128000,
4251
- maxTokens: 64000,
4415
+ contextWindow: 400000,
4416
+ maxTokens: 128000,
4252
4417
  },
4253
4418
  },
4254
4419
  "google": {
@@ -5541,6 +5706,23 @@ export const MODELS = {
5541
5706
  contextWindow: 204800,
5542
5707
  maxTokens: 131072,
5543
5708
  },
5709
+ "MiniMax-M3": {
5710
+ id: "MiniMax-M3",
5711
+ name: "MiniMax-M3",
5712
+ api: "anthropic-messages",
5713
+ provider: "minimax",
5714
+ baseUrl: "https://api.minimax.io/anthropic",
5715
+ reasoning: true,
5716
+ input: ["text", "image"],
5717
+ cost: {
5718
+ input: 0.6,
5719
+ output: 2.4,
5720
+ cacheRead: 0.12,
5721
+ cacheWrite: 0,
5722
+ },
5723
+ contextWindow: 512000,
5724
+ maxTokens: 128000,
5725
+ },
5544
5726
  },
5545
5727
  "minimax-cn": {
5546
5728
  "MiniMax-M2.7": {
@@ -5577,6 +5759,23 @@ export const MODELS = {
5577
5759
  contextWindow: 204800,
5578
5760
  maxTokens: 131072,
5579
5761
  },
5762
+ "MiniMax-M3": {
5763
+ id: "MiniMax-M3",
5764
+ name: "MiniMax-M3",
5765
+ api: "anthropic-messages",
5766
+ provider: "minimax-cn",
5767
+ baseUrl: "https://api.minimaxi.com/anthropic",
5768
+ reasoning: true,
5769
+ input: ["text", "image"],
5770
+ cost: {
5771
+ input: 0.6,
5772
+ output: 2.4,
5773
+ cacheRead: 0.12,
5774
+ cacheWrite: 0,
5775
+ },
5776
+ contextWindow: 512000,
5777
+ maxTokens: 128000,
5778
+ },
5580
5779
  },
5581
5780
  "mistral": {
5582
5781
  "codestral-latest": {
@@ -5613,6 +5812,23 @@ export const MODELS = {
5613
5812
  contextWindow: 262144,
5614
5813
  maxTokens: 262144,
5615
5814
  },
5815
+ "devstral-latest": {
5816
+ id: "devstral-latest",
5817
+ name: "Devstral 2",
5818
+ api: "mistral-conversations",
5819
+ provider: "mistral",
5820
+ baseUrl: "https://api.mistral.ai",
5821
+ reasoning: false,
5822
+ input: ["text"],
5823
+ cost: {
5824
+ input: 0.4,
5825
+ output: 2,
5826
+ cacheRead: 0,
5827
+ cacheWrite: 0,
5828
+ },
5829
+ contextWindow: 262144,
5830
+ maxTokens: 262144,
5831
+ },
5616
5832
  "devstral-medium-2507": {
5617
5833
  id: "devstral-medium-2507",
5618
5834
  name: "Devstral Medium",
@@ -5891,11 +6107,11 @@ export const MODELS = {
5891
6107
  api: "mistral-conversations",
5892
6108
  provider: "mistral",
5893
6109
  baseUrl: "https://api.mistral.ai",
5894
- reasoning: true,
6110
+ reasoning: false,
5895
6111
  input: ["text", "image"],
5896
6112
  cost: {
5897
- input: 1.5,
5898
- output: 7.5,
6113
+ input: 0.4,
6114
+ output: 2,
5899
6115
  cacheRead: 0,
5900
6116
  cacheWrite: 0,
5901
6117
  },
@@ -5987,6 +6203,23 @@ export const MODELS = {
5987
6203
  contextWindow: 8000,
5988
6204
  maxTokens: 8000,
5989
6205
  },
6206
+ "open-mistral-nemo": {
6207
+ id: "open-mistral-nemo",
6208
+ name: "Open Mistral Nemo",
6209
+ api: "mistral-conversations",
6210
+ provider: "mistral",
6211
+ baseUrl: "https://api.mistral.ai",
6212
+ reasoning: false,
6213
+ input: ["text"],
6214
+ cost: {
6215
+ input: 0.15,
6216
+ output: 0.15,
6217
+ cacheRead: 0,
6218
+ cacheWrite: 0,
6219
+ },
6220
+ contextWindow: 128000,
6221
+ maxTokens: 128000,
6222
+ },
5990
6223
  "open-mixtral-8x22b": {
5991
6224
  id: "open-mixtral-8x22b",
5992
6225
  name: "Mixtral 8x22B",
@@ -6312,56 +6545,457 @@ export const MODELS = {
6312
6545
  maxTokens: 262144,
6313
6546
  },
6314
6547
  },
6315
- "openai": {
6316
- "gpt-4": {
6317
- id: "gpt-4",
6318
- name: "GPT-4",
6319
- api: "openai-responses",
6320
- provider: "openai",
6321
- baseUrl: "https://api.openai.com/v1",
6548
+ "nvidia": {
6549
+ "meta/llama-3.1-70b-instruct": {
6550
+ id: "meta/llama-3.1-70b-instruct",
6551
+ name: "Llama 3.1 70b Instruct",
6552
+ api: "openai-completions",
6553
+ provider: "nvidia",
6554
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6555
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6556
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6322
6557
  reasoning: false,
6323
6558
  input: ["text"],
6324
6559
  cost: {
6325
- input: 30,
6326
- output: 60,
6560
+ input: 0,
6561
+ output: 0,
6327
6562
  cacheRead: 0,
6328
6563
  cacheWrite: 0,
6329
6564
  },
6330
- contextWindow: 8192,
6331
- maxTokens: 8192,
6565
+ contextWindow: 128000,
6566
+ maxTokens: 4096,
6332
6567
  },
6333
- "gpt-4-turbo": {
6334
- id: "gpt-4-turbo",
6335
- name: "GPT-4 Turbo",
6336
- api: "openai-responses",
6337
- provider: "openai",
6338
- baseUrl: "https://api.openai.com/v1",
6568
+ "meta/llama-3.1-8b-instruct": {
6569
+ id: "meta/llama-3.1-8b-instruct",
6570
+ name: "Llama 3.1 8B Instruct",
6571
+ api: "openai-completions",
6572
+ provider: "nvidia",
6573
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6574
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6575
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6576
+ reasoning: false,
6577
+ input: ["text"],
6578
+ cost: {
6579
+ input: 0,
6580
+ output: 0,
6581
+ cacheRead: 0,
6582
+ cacheWrite: 0,
6583
+ },
6584
+ contextWindow: 16000,
6585
+ maxTokens: 4096,
6586
+ },
6587
+ "meta/llama-3.2-11b-vision-instruct": {
6588
+ id: "meta/llama-3.2-11b-vision-instruct",
6589
+ name: "Llama 3.2 11b Vision Instruct",
6590
+ api: "openai-completions",
6591
+ provider: "nvidia",
6592
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6593
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6594
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6339
6595
  reasoning: false,
6340
6596
  input: ["text", "image"],
6341
6597
  cost: {
6342
- input: 10,
6343
- output: 30,
6598
+ input: 0,
6599
+ output: 0,
6344
6600
  cacheRead: 0,
6345
6601
  cacheWrite: 0,
6346
6602
  },
6347
6603
  contextWindow: 128000,
6348
6604
  maxTokens: 4096,
6349
6605
  },
6350
- "gpt-4.1": {
6351
- id: "gpt-4.1",
6352
- name: "GPT-4.1",
6353
- api: "openai-responses",
6354
- provider: "openai",
6355
- baseUrl: "https://api.openai.com/v1",
6606
+ "meta/llama-3.2-90b-vision-instruct": {
6607
+ id: "meta/llama-3.2-90b-vision-instruct",
6608
+ name: "Llama-3.2-90B-Vision-Instruct",
6609
+ api: "openai-completions",
6610
+ provider: "nvidia",
6611
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6612
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6613
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6356
6614
  reasoning: false,
6357
6615
  input: ["text", "image"],
6358
6616
  cost: {
6359
- input: 2,
6360
- output: 8,
6361
- cacheRead: 0.5,
6617
+ input: 0,
6618
+ output: 0,
6619
+ cacheRead: 0,
6362
6620
  cacheWrite: 0,
6363
6621
  },
6364
- contextWindow: 1047576,
6622
+ contextWindow: 128000,
6623
+ maxTokens: 8192,
6624
+ },
6625
+ "meta/llama-3.3-70b-instruct": {
6626
+ id: "meta/llama-3.3-70b-instruct",
6627
+ name: "Llama 3.3 70b Instruct",
6628
+ api: "openai-completions",
6629
+ provider: "nvidia",
6630
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6631
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6632
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6633
+ reasoning: false,
6634
+ input: ["text"],
6635
+ cost: {
6636
+ input: 0,
6637
+ output: 0,
6638
+ cacheRead: 0,
6639
+ cacheWrite: 0,
6640
+ },
6641
+ contextWindow: 128000,
6642
+ maxTokens: 4096,
6643
+ },
6644
+ "mistralai/mistral-large-3-675b-instruct-2512": {
6645
+ id: "mistralai/mistral-large-3-675b-instruct-2512",
6646
+ name: "Mistral Large 3 675B Instruct 2512",
6647
+ api: "openai-completions",
6648
+ provider: "nvidia",
6649
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6650
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6651
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6652
+ reasoning: false,
6653
+ input: ["text", "image"],
6654
+ cost: {
6655
+ input: 0,
6656
+ output: 0,
6657
+ cacheRead: 0,
6658
+ cacheWrite: 0,
6659
+ },
6660
+ contextWindow: 262144,
6661
+ maxTokens: 262144,
6662
+ },
6663
+ "mistralai/mistral-small-4-119b-2603": {
6664
+ id: "mistralai/mistral-small-4-119b-2603",
6665
+ name: "mistral-small-4-119b-2603",
6666
+ api: "openai-completions",
6667
+ provider: "nvidia",
6668
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6669
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6670
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6671
+ reasoning: false,
6672
+ input: ["text"],
6673
+ cost: {
6674
+ input: 0,
6675
+ output: 0,
6676
+ cacheRead: 0,
6677
+ cacheWrite: 0,
6678
+ },
6679
+ contextWindow: 128000,
6680
+ maxTokens: 8192,
6681
+ },
6682
+ "moonshotai/kimi-k2.6": {
6683
+ id: "moonshotai/kimi-k2.6",
6684
+ name: "Kimi K2.6",
6685
+ api: "openai-completions",
6686
+ provider: "nvidia",
6687
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6688
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6689
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6690
+ reasoning: true,
6691
+ input: ["text", "image"],
6692
+ cost: {
6693
+ input: 0,
6694
+ output: 0,
6695
+ cacheRead: 0,
6696
+ cacheWrite: 0,
6697
+ },
6698
+ contextWindow: 262144,
6699
+ maxTokens: 262144,
6700
+ },
6701
+ "nvidia/llama-3.3-nemotron-super-49b-v1": {
6702
+ id: "nvidia/llama-3.3-nemotron-super-49b-v1",
6703
+ name: "Llama 3.3 Nemotron Super 49B v1",
6704
+ api: "openai-completions",
6705
+ provider: "nvidia",
6706
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6707
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6708
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6709
+ reasoning: true,
6710
+ input: ["text"],
6711
+ cost: {
6712
+ input: 0,
6713
+ output: 0,
6714
+ cacheRead: 0,
6715
+ cacheWrite: 0,
6716
+ },
6717
+ contextWindow: 131072,
6718
+ maxTokens: 131072,
6719
+ },
6720
+ "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
6721
+ id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
6722
+ name: "Llama 3.3 Nemotron Super 49B v1.5",
6723
+ api: "openai-completions",
6724
+ provider: "nvidia",
6725
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6726
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6727
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6728
+ reasoning: true,
6729
+ input: ["text"],
6730
+ cost: {
6731
+ input: 0,
6732
+ output: 0,
6733
+ cacheRead: 0,
6734
+ cacheWrite: 0,
6735
+ },
6736
+ contextWindow: 131072,
6737
+ maxTokens: 131072,
6738
+ },
6739
+ "nvidia/nemotron-3-nano-30b-a3b": {
6740
+ id: "nvidia/nemotron-3-nano-30b-a3b",
6741
+ name: "nemotron-3-nano-30b-a3b",
6742
+ api: "openai-completions",
6743
+ provider: "nvidia",
6744
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6745
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6746
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6747
+ reasoning: true,
6748
+ input: ["text"],
6749
+ cost: {
6750
+ input: 0,
6751
+ output: 0,
6752
+ cacheRead: 0,
6753
+ cacheWrite: 0,
6754
+ },
6755
+ contextWindow: 131072,
6756
+ maxTokens: 131072,
6757
+ },
6758
+ "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning": {
6759
+ id: "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning",
6760
+ name: "Nemotron 3 Nano Omni",
6761
+ api: "openai-completions",
6762
+ provider: "nvidia",
6763
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6764
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6765
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6766
+ reasoning: true,
6767
+ input: ["text", "image"],
6768
+ cost: {
6769
+ input: 0,
6770
+ output: 0,
6771
+ cacheRead: 0,
6772
+ cacheWrite: 0,
6773
+ },
6774
+ contextWindow: 256000,
6775
+ maxTokens: 65536,
6776
+ },
6777
+ "nvidia/nemotron-3-super-120b-a12b": {
6778
+ id: "nvidia/nemotron-3-super-120b-a12b",
6779
+ name: "Nemotron 3 Super",
6780
+ api: "openai-completions",
6781
+ provider: "nvidia",
6782
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6783
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6784
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6785
+ reasoning: true,
6786
+ input: ["text"],
6787
+ cost: {
6788
+ input: 0.2,
6789
+ output: 0.8,
6790
+ cacheRead: 0,
6791
+ cacheWrite: 0,
6792
+ },
6793
+ contextWindow: 262144,
6794
+ maxTokens: 262144,
6795
+ },
6796
+ "nvidia/nemotron-3-ultra-550b-a55b": {
6797
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
6798
+ name: "Nemotron 3 Ultra 550B A55B",
6799
+ api: "openai-completions",
6800
+ provider: "nvidia",
6801
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6802
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6803
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6804
+ reasoning: true,
6805
+ input: ["text"],
6806
+ cost: {
6807
+ input: 0.5,
6808
+ output: 2.5,
6809
+ cacheRead: 0.15,
6810
+ cacheWrite: 0,
6811
+ },
6812
+ contextWindow: 1000000,
6813
+ maxTokens: 65536,
6814
+ },
6815
+ "nvidia/nvidia-nemotron-nano-9b-v2": {
6816
+ id: "nvidia/nvidia-nemotron-nano-9b-v2",
6817
+ name: "nvidia-nemotron-nano-9b-v2",
6818
+ api: "openai-completions",
6819
+ provider: "nvidia",
6820
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6821
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6822
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6823
+ reasoning: true,
6824
+ input: ["text"],
6825
+ cost: {
6826
+ input: 0,
6827
+ output: 0,
6828
+ cacheRead: 0,
6829
+ cacheWrite: 0,
6830
+ },
6831
+ contextWindow: 131072,
6832
+ maxTokens: 131072,
6833
+ },
6834
+ "openai/gpt-oss-20b": {
6835
+ id: "openai/gpt-oss-20b",
6836
+ name: "GPT OSS 20B",
6837
+ api: "openai-completions",
6838
+ provider: "nvidia",
6839
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6840
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6841
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6842
+ reasoning: true,
6843
+ input: ["text"],
6844
+ cost: {
6845
+ input: 0,
6846
+ output: 0,
6847
+ cacheRead: 0,
6848
+ cacheWrite: 0,
6849
+ },
6850
+ contextWindow: 131072,
6851
+ maxTokens: 32768,
6852
+ },
6853
+ "qwen/qwen3-coder-480b-a35b-instruct": {
6854
+ id: "qwen/qwen3-coder-480b-a35b-instruct",
6855
+ name: "Qwen3 Coder 480B A35B Instruct",
6856
+ api: "openai-completions",
6857
+ provider: "nvidia",
6858
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6859
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6860
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6861
+ reasoning: false,
6862
+ input: ["text"],
6863
+ cost: {
6864
+ input: 0,
6865
+ output: 0,
6866
+ cacheRead: 0,
6867
+ cacheWrite: 0,
6868
+ },
6869
+ contextWindow: 262144,
6870
+ maxTokens: 66536,
6871
+ },
6872
+ "qwen/qwen3.5-122b-a10b": {
6873
+ id: "qwen/qwen3.5-122b-a10b",
6874
+ name: "Qwen3.5 122B-A10B",
6875
+ api: "openai-completions",
6876
+ provider: "nvidia",
6877
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6878
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6879
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6880
+ reasoning: true,
6881
+ input: ["text", "image"],
6882
+ cost: {
6883
+ input: 0,
6884
+ output: 0,
6885
+ cacheRead: 0,
6886
+ cacheWrite: 0,
6887
+ },
6888
+ contextWindow: 262144,
6889
+ maxTokens: 65536,
6890
+ },
6891
+ "stepfun-ai/step-3.5-flash": {
6892
+ id: "stepfun-ai/step-3.5-flash",
6893
+ name: "Step 3.5 Flash",
6894
+ api: "openai-completions",
6895
+ provider: "nvidia",
6896
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6897
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6898
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6899
+ reasoning: true,
6900
+ input: ["text"],
6901
+ cost: {
6902
+ input: 0,
6903
+ output: 0,
6904
+ cacheRead: 0,
6905
+ cacheWrite: 0,
6906
+ },
6907
+ contextWindow: 256000,
6908
+ maxTokens: 16384,
6909
+ },
6910
+ "stepfun-ai/step-3.7-flash": {
6911
+ id: "stepfun-ai/step-3.7-flash",
6912
+ name: "Step 3.7 Flash",
6913
+ api: "openai-completions",
6914
+ provider: "nvidia",
6915
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6916
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6917
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6918
+ reasoning: true,
6919
+ input: ["text", "image"],
6920
+ cost: {
6921
+ input: 0,
6922
+ output: 0,
6923
+ cacheRead: 0,
6924
+ cacheWrite: 0,
6925
+ },
6926
+ contextWindow: 256000,
6927
+ maxTokens: 16384,
6928
+ },
6929
+ "z-ai/glm-5.1": {
6930
+ id: "z-ai/glm-5.1",
6931
+ name: "GLM-5.1",
6932
+ api: "openai-completions",
6933
+ provider: "nvidia",
6934
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6935
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6936
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6937
+ reasoning: true,
6938
+ input: ["text"],
6939
+ cost: {
6940
+ input: 0,
6941
+ output: 0,
6942
+ cacheRead: 0,
6943
+ cacheWrite: 0,
6944
+ },
6945
+ contextWindow: 131072,
6946
+ maxTokens: 131072,
6947
+ },
6948
+ },
6949
+ "openai": {
6950
+ "gpt-4": {
6951
+ id: "gpt-4",
6952
+ name: "GPT-4",
6953
+ api: "openai-responses",
6954
+ provider: "openai",
6955
+ baseUrl: "https://api.openai.com/v1",
6956
+ reasoning: false,
6957
+ input: ["text"],
6958
+ cost: {
6959
+ input: 30,
6960
+ output: 60,
6961
+ cacheRead: 0,
6962
+ cacheWrite: 0,
6963
+ },
6964
+ contextWindow: 8192,
6965
+ maxTokens: 8192,
6966
+ },
6967
+ "gpt-4-turbo": {
6968
+ id: "gpt-4-turbo",
6969
+ name: "GPT-4 Turbo",
6970
+ api: "openai-responses",
6971
+ provider: "openai",
6972
+ baseUrl: "https://api.openai.com/v1",
6973
+ reasoning: false,
6974
+ input: ["text", "image"],
6975
+ cost: {
6976
+ input: 10,
6977
+ output: 30,
6978
+ cacheRead: 0,
6979
+ cacheWrite: 0,
6980
+ },
6981
+ contextWindow: 128000,
6982
+ maxTokens: 4096,
6983
+ },
6984
+ "gpt-4.1": {
6985
+ id: "gpt-4.1",
6986
+ name: "GPT-4.1",
6987
+ api: "openai-responses",
6988
+ provider: "openai",
6989
+ baseUrl: "https://api.openai.com/v1",
6990
+ reasoning: false,
6991
+ input: ["text", "image"],
6992
+ cost: {
6993
+ input: 2,
6994
+ output: 8,
6995
+ cacheRead: 0.5,
6996
+ cacheWrite: 0,
6997
+ },
6998
+ contextWindow: 1047576,
6365
6999
  maxTokens: 32768,
6366
7000
  },
6367
7001
  "gpt-4.1-mini": {
@@ -6886,7 +7520,7 @@ export const MODELS = {
6886
7520
  provider: "openai",
6887
7521
  baseUrl: "https://api.openai.com/v1",
6888
7522
  reasoning: true,
6889
- thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7523
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh", "minimal": null },
6890
7524
  input: ["text", "image"],
6891
7525
  cost: {
6892
7526
  input: 5,
@@ -7033,62 +7667,26 @@ export const MODELS = {
7033
7667
  },
7034
7668
  contextWindow: 200000,
7035
7669
  maxTokens: 100000,
7036
- },
7037
- "o4-mini-deep-research": {
7038
- id: "o4-mini-deep-research",
7039
- name: "o4-mini-deep-research",
7040
- api: "openai-responses",
7041
- provider: "openai",
7042
- baseUrl: "https://api.openai.com/v1",
7043
- reasoning: true,
7044
- input: ["text", "image"],
7045
- cost: {
7046
- input: 2,
7047
- output: 8,
7048
- cacheRead: 0.5,
7049
- cacheWrite: 0,
7050
- },
7051
- contextWindow: 200000,
7052
- maxTokens: 100000,
7053
- },
7054
- },
7055
- "openai-codex": {
7056
- "gpt-5.2": {
7057
- id: "gpt-5.2",
7058
- name: "GPT-5.2",
7059
- api: "openai-codex-responses",
7060
- provider: "openai-codex",
7061
- baseUrl: "https://chatgpt.com/backend-api",
7062
- reasoning: true,
7063
- thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7064
- input: ["text", "image"],
7065
- cost: {
7066
- input: 1.75,
7067
- output: 14,
7068
- cacheRead: 0.175,
7069
- cacheWrite: 0,
7070
- },
7071
- contextWindow: 272000,
7072
- maxTokens: 128000,
7073
- },
7074
- "gpt-5.3-codex": {
7075
- id: "gpt-5.3-codex",
7076
- name: "GPT-5.3 Codex",
7077
- api: "openai-codex-responses",
7078
- provider: "openai-codex",
7079
- baseUrl: "https://chatgpt.com/backend-api",
7670
+ },
7671
+ "o4-mini-deep-research": {
7672
+ id: "o4-mini-deep-research",
7673
+ name: "o4-mini-deep-research",
7674
+ api: "openai-responses",
7675
+ provider: "openai",
7676
+ baseUrl: "https://api.openai.com/v1",
7080
7677
  reasoning: true,
7081
- thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7082
7678
  input: ["text", "image"],
7083
7679
  cost: {
7084
- input: 1.75,
7085
- output: 14,
7086
- cacheRead: 0.175,
7680
+ input: 2,
7681
+ output: 8,
7682
+ cacheRead: 0.5,
7087
7683
  cacheWrite: 0,
7088
7684
  },
7089
- contextWindow: 272000,
7090
- maxTokens: 128000,
7685
+ contextWindow: 200000,
7686
+ maxTokens: 100000,
7091
7687
  },
7688
+ },
7689
+ "openai-codex": {
7092
7690
  "gpt-5.3-codex-spark": {
7093
7691
  id: "gpt-5.3-codex-spark",
7094
7692
  name: "GPT-5.3 Codex Spark",
@@ -7256,7 +7854,7 @@ export const MODELS = {
7256
7854
  api: "anthropic-messages",
7257
7855
  provider: "opencode",
7258
7856
  baseUrl: "https://opencode.ai/zen",
7259
- compat: { "forceAdaptiveThinking": true },
7857
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7260
7858
  reasoning: true,
7261
7859
  thinkingLevelMap: { "xhigh": "xhigh" },
7262
7860
  input: ["text", "image"],
@@ -7275,7 +7873,7 @@ export const MODELS = {
7275
7873
  api: "anthropic-messages",
7276
7874
  provider: "opencode",
7277
7875
  baseUrl: "https://opencode.ai/zen",
7278
- compat: { "forceAdaptiveThinking": true },
7876
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7279
7877
  reasoning: true,
7280
7878
  thinkingLevelMap: { "xhigh": "xhigh" },
7281
7879
  input: ["text", "image"],
@@ -7340,6 +7938,25 @@ export const MODELS = {
7340
7938
  contextWindow: 1000000,
7341
7939
  maxTokens: 64000,
7342
7940
  },
7941
+ "deepseek-v4-flash": {
7942
+ id: "deepseek-v4-flash",
7943
+ name: "DeepSeek V4 Flash",
7944
+ api: "openai-completions",
7945
+ provider: "opencode",
7946
+ baseUrl: "https://opencode.ai/zen/v1",
7947
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7948
+ reasoning: true,
7949
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7950
+ input: ["text"],
7951
+ cost: {
7952
+ input: 0.14,
7953
+ output: 0.28,
7954
+ cacheRead: 0.03,
7955
+ cacheWrite: 0,
7956
+ },
7957
+ contextWindow: 1000000,
7958
+ maxTokens: 384000,
7959
+ },
7343
7960
  "deepseek-v4-flash-free": {
7344
7961
  id: "deepseek-v4-flash-free",
7345
7962
  name: "DeepSeek V4 Flash Free",
@@ -7803,8 +8420,8 @@ export const MODELS = {
7803
8420
  cacheRead: 0,
7804
8421
  cacheWrite: 0,
7805
8422
  },
7806
- contextWindow: 1000000,
7807
- maxTokens: 128000,
8423
+ contextWindow: 200000,
8424
+ maxTokens: 32000,
7808
8425
  },
7809
8426
  "minimax-m2.5": {
7810
8427
  id: "minimax-m2.5",
@@ -7840,9 +8457,9 @@ export const MODELS = {
7840
8457
  contextWindow: 204800,
7841
8458
  maxTokens: 131072,
7842
8459
  },
7843
- "nemotron-3-super-free": {
7844
- id: "nemotron-3-super-free",
7845
- name: "Nemotron 3 Super Free",
8460
+ "nemotron-3-ultra-free": {
8461
+ id: "nemotron-3-ultra-free",
8462
+ name: "Nemotron 3 Ultra Free",
7846
8463
  api: "openai-completions",
7847
8464
  provider: "opencode",
7848
8465
  baseUrl: "https://opencode.ai/zen/v1",
@@ -7854,7 +8471,7 @@ export const MODELS = {
7854
8471
  cacheRead: 0,
7855
8472
  cacheWrite: 0,
7856
8473
  },
7857
- contextWindow: 204800,
8474
+ contextWindow: 1000000,
7858
8475
  maxTokens: 128000,
7859
8476
  },
7860
8477
  "qwen3.5-plus": {
@@ -8069,6 +8686,23 @@ export const MODELS = {
8069
8686
  contextWindow: 204800,
8070
8687
  maxTokens: 131072,
8071
8688
  },
8689
+ "minimax-m3": {
8690
+ id: "minimax-m3",
8691
+ name: "MiniMax M3",
8692
+ api: "anthropic-messages",
8693
+ provider: "opencode-go",
8694
+ baseUrl: "https://opencode.ai/zen/go",
8695
+ reasoning: true,
8696
+ input: ["text", "image"],
8697
+ cost: {
8698
+ input: 0.3,
8699
+ output: 1.2,
8700
+ cacheRead: 0.06,
8701
+ cacheWrite: 0,
8702
+ },
8703
+ contextWindow: 512000,
8704
+ maxTokens: 131072,
8705
+ },
8072
8706
  "qwen3.6-plus": {
8073
8707
  id: "qwen3.6-plus",
8074
8708
  name: "Qwen3.6 Plus",
@@ -8084,7 +8718,7 @@ export const MODELS = {
8084
8718
  cacheRead: 0.05,
8085
8719
  cacheWrite: 0.625,
8086
8720
  },
8087
- contextWindow: 262144,
8721
+ contextWindow: 1000000,
8088
8722
  maxTokens: 65536,
8089
8723
  },
8090
8724
  "qwen3.7-max": {
@@ -8104,6 +8738,23 @@ export const MODELS = {
8104
8738
  contextWindow: 1000000,
8105
8739
  maxTokens: 65536,
8106
8740
  },
8741
+ "qwen3.7-plus": {
8742
+ id: "qwen3.7-plus",
8743
+ name: "Qwen3.7 Plus",
8744
+ api: "anthropic-messages",
8745
+ provider: "opencode-go",
8746
+ baseUrl: "https://opencode.ai/zen/go",
8747
+ reasoning: true,
8748
+ input: ["text", "image"],
8749
+ cost: {
8750
+ input: 0.4,
8751
+ output: 1.6,
8752
+ cacheRead: 0.04,
8753
+ cacheWrite: 0.5,
8754
+ },
8755
+ contextWindow: 1000000,
8756
+ maxTokens: 65536,
8757
+ },
8107
8758
  },
8108
8759
  "openrouter": {
8109
8760
  "ai21/jamba-large-1.7": {
@@ -8537,40 +9188,6 @@ export const MODELS = {
8537
9188
  contextWindow: 2000000,
8538
9189
  maxTokens: 30000,
8539
9190
  },
8540
- "baidu/ernie-4.5-21b-a3b": {
8541
- id: "baidu/ernie-4.5-21b-a3b",
8542
- name: "Baidu: ERNIE 4.5 21B A3B",
8543
- api: "openai-completions",
8544
- provider: "openrouter",
8545
- baseUrl: "https://openrouter.ai/api/v1",
8546
- reasoning: false,
8547
- input: ["text"],
8548
- cost: {
8549
- input: 0.07,
8550
- output: 0.28,
8551
- cacheRead: 0,
8552
- cacheWrite: 0,
8553
- },
8554
- contextWindow: 131072,
8555
- maxTokens: 8000,
8556
- },
8557
- "baidu/ernie-4.5-vl-28b-a3b": {
8558
- id: "baidu/ernie-4.5-vl-28b-a3b",
8559
- name: "Baidu: ERNIE 4.5 VL 28B A3B",
8560
- api: "openai-completions",
8561
- provider: "openrouter",
8562
- baseUrl: "https://openrouter.ai/api/v1",
8563
- reasoning: true,
8564
- input: ["text", "image"],
8565
- cost: {
8566
- input: 0.14,
8567
- output: 0.56,
8568
- cacheRead: 0,
8569
- cacheWrite: 0,
8570
- },
8571
- contextWindow: 131072,
8572
- maxTokens: 8000,
8573
- },
8574
9191
  "bytedance-seed/seed-1.6": {
8575
9192
  id: "bytedance-seed/seed-1.6",
8576
9193
  name: "ByteDance Seed: Seed 1.6",
@@ -8682,8 +9299,8 @@ export const MODELS = {
8682
9299
  reasoning: false,
8683
9300
  input: ["text"],
8684
9301
  cost: {
8685
- input: 0.2288,
8686
- output: 0.9144,
9302
+ input: 0.20020000000000002,
9303
+ output: 0.8000999999999999,
8687
9304
  cacheRead: 0,
8688
9305
  cacheWrite: 0,
8689
9306
  },
@@ -8784,13 +9401,13 @@ export const MODELS = {
8784
9401
  reasoning: true,
8785
9402
  input: ["text"],
8786
9403
  cost: {
8787
- input: 0.252,
8788
- output: 0.378,
8789
- cacheRead: 0.0252,
9404
+ input: 0.2288,
9405
+ output: 0.3432,
9406
+ cacheRead: 0,
8790
9407
  cacheWrite: 0,
8791
9408
  },
8792
9409
  contextWindow: 131072,
8793
- maxTokens: 65536,
9410
+ maxTokens: 64000,
8794
9411
  },
8795
9412
  "deepseek/deepseek-v3.2-exp": {
8796
9413
  id: "deepseek/deepseek-v3.2-exp",
@@ -8828,25 +9445,6 @@ export const MODELS = {
8828
9445
  contextWindow: 1048576,
8829
9446
  maxTokens: 131072,
8830
9447
  },
8831
- "deepseek/deepseek-v4-flash:free": {
8832
- id: "deepseek/deepseek-v4-flash:free",
8833
- name: "DeepSeek: DeepSeek V4 Flash (free)",
8834
- api: "openai-completions",
8835
- provider: "openrouter",
8836
- baseUrl: "https://openrouter.ai/api/v1",
8837
- compat: { "requiresReasoningContentOnAssistantMessages": true },
8838
- reasoning: true,
8839
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8840
- input: ["text"],
8841
- cost: {
8842
- input: 0,
8843
- output: 0,
8844
- cacheRead: 0,
8845
- cacheWrite: 0,
8846
- },
8847
- contextWindow: 1048576,
8848
- maxTokens: 384000,
8849
- },
8850
9448
  "deepseek/deepseek-v4-pro": {
8851
9449
  id: "deepseek/deepseek-v4-pro",
8852
9450
  name: "DeepSeek: DeepSeek V4 Pro",
@@ -8883,40 +9481,6 @@ export const MODELS = {
8883
9481
  contextWindow: 32768,
8884
9482
  maxTokens: 4096,
8885
9483
  },
8886
- "google/gemini-2.0-flash-001": {
8887
- id: "google/gemini-2.0-flash-001",
8888
- name: "Google: Gemini 2.0 Flash",
8889
- api: "openai-completions",
8890
- provider: "openrouter",
8891
- baseUrl: "https://openrouter.ai/api/v1",
8892
- reasoning: false,
8893
- input: ["text", "image"],
8894
- cost: {
8895
- input: 0.09999999999999999,
8896
- output: 0.39999999999999997,
8897
- cacheRead: 0.024999999999999998,
8898
- cacheWrite: 0.08333333333333334,
8899
- },
8900
- contextWindow: 1048576,
8901
- maxTokens: 8192,
8902
- },
8903
- "google/gemini-2.0-flash-lite-001": {
8904
- id: "google/gemini-2.0-flash-lite-001",
8905
- name: "Google: Gemini 2.0 Flash Lite",
8906
- api: "openai-completions",
8907
- provider: "openrouter",
8908
- baseUrl: "https://openrouter.ai/api/v1",
8909
- reasoning: false,
8910
- input: ["text", "image"],
8911
- cost: {
8912
- input: 0.075,
8913
- output: 0.3,
8914
- cacheRead: 0,
8915
- cacheWrite: 0,
8916
- },
8917
- contextWindow: 1048576,
8918
- maxTokens: 8192,
8919
- },
8920
9484
  "google/gemini-2.5-flash": {
8921
9485
  id: "google/gemini-2.5-flash",
8922
9486
  name: "Google: Gemini 2.5 Flash",
@@ -9130,8 +9694,8 @@ export const MODELS = {
9130
9694
  reasoning: false,
9131
9695
  input: ["text", "image"],
9132
9696
  cost: {
9133
- input: 0.04,
9134
- output: 0.13,
9697
+ input: 0.049999999999999996,
9698
+ output: 0.15,
9135
9699
  cacheRead: 0,
9136
9700
  cacheWrite: 0,
9137
9701
  },
@@ -9199,12 +9763,12 @@ export const MODELS = {
9199
9763
  input: ["text", "image"],
9200
9764
  cost: {
9201
9765
  input: 0.12,
9202
- output: 0.37,
9203
- cacheRead: 0,
9766
+ output: 0.36,
9767
+ cacheRead: 0.09,
9204
9768
  cacheWrite: 0,
9205
9769
  },
9206
9770
  contextWindow: 262144,
9207
- maxTokens: 16384,
9771
+ maxTokens: 8192,
9208
9772
  },
9209
9773
  "google/gemma-4-31b-it:free": {
9210
9774
  id: "google/gemma-4-31b-it:free",
@@ -9353,7 +9917,7 @@ export const MODELS = {
9353
9917
  input: ["text"],
9354
9918
  cost: {
9355
9919
  input: 0.02,
9356
- output: 0.049999999999999996,
9920
+ output: 0.03,
9357
9921
  cacheRead: 0,
9358
9922
  cacheWrite: 0,
9359
9923
  },
@@ -9394,6 +9958,23 @@ export const MODELS = {
9394
9958
  contextWindow: 131072,
9395
9959
  maxTokens: 4096,
9396
9960
  },
9961
+ "meta-llama/llama-4-maverick": {
9962
+ id: "meta-llama/llama-4-maverick",
9963
+ name: "Meta: Llama 4 Maverick",
9964
+ api: "openai-completions",
9965
+ provider: "openrouter",
9966
+ baseUrl: "https://openrouter.ai/api/v1",
9967
+ reasoning: false,
9968
+ input: ["text", "image"],
9969
+ cost: {
9970
+ input: 0.15,
9971
+ output: 0.6,
9972
+ cacheRead: 0,
9973
+ cacheWrite: 0,
9974
+ },
9975
+ contextWindow: 1048576,
9976
+ maxTokens: 16384,
9977
+ },
9397
9978
  "meta-llama/llama-4-scout": {
9398
9979
  id: "meta-llama/llama-4-scout",
9399
9980
  name: "Meta: Llama 4 Scout",
@@ -9403,7 +9984,7 @@ export const MODELS = {
9403
9984
  reasoning: false,
9404
9985
  input: ["text", "image"],
9405
9986
  cost: {
9406
- input: 0.08,
9987
+ input: 0.09999999999999999,
9407
9988
  output: 0.3,
9408
9989
  cacheRead: 0,
9409
9990
  cacheWrite: 0,
@@ -9479,39 +10060,39 @@ export const MODELS = {
9479
10060
  contextWindow: 204800,
9480
10061
  maxTokens: 196608,
9481
10062
  },
9482
- "minimax/minimax-m2.5:free": {
9483
- id: "minimax/minimax-m2.5:free",
9484
- name: "MiniMax: MiniMax M2.5 (free)",
10063
+ "minimax/minimax-m2.7": {
10064
+ id: "minimax/minimax-m2.7",
10065
+ name: "MiniMax: MiniMax M2.7",
9485
10066
  api: "openai-completions",
9486
10067
  provider: "openrouter",
9487
10068
  baseUrl: "https://openrouter.ai/api/v1",
9488
10069
  reasoning: true,
9489
10070
  input: ["text"],
9490
10071
  cost: {
9491
- input: 0,
9492
- output: 0,
10072
+ input: 0.27899999999999997,
10073
+ output: 1.2,
9493
10074
  cacheRead: 0,
9494
10075
  cacheWrite: 0,
9495
10076
  },
9496
10077
  contextWindow: 204800,
9497
- maxTokens: 8192,
10078
+ maxTokens: 196608,
9498
10079
  },
9499
- "minimax/minimax-m2.7": {
9500
- id: "minimax/minimax-m2.7",
9501
- name: "MiniMax: MiniMax M2.7",
10080
+ "minimax/minimax-m3": {
10081
+ id: "minimax/minimax-m3",
10082
+ name: "MiniMax: MiniMax M3",
9502
10083
  api: "openai-completions",
9503
10084
  provider: "openrouter",
9504
10085
  baseUrl: "https://openrouter.ai/api/v1",
9505
10086
  reasoning: true,
9506
- input: ["text"],
10087
+ input: ["text", "image"],
9507
10088
  cost: {
9508
- input: 0.27899999999999997,
10089
+ input: 0.3,
9509
10090
  output: 1.2,
9510
- cacheRead: 0,
10091
+ cacheRead: 0.06,
9511
10092
  cacheWrite: 0,
9512
10093
  },
9513
- contextWindow: 204800,
9514
- maxTokens: 131072,
10094
+ contextWindow: 1048576,
10095
+ maxTokens: 512000,
9515
10096
  },
9516
10097
  "mistralai/codestral-2508": {
9517
10098
  id: "mistralai/codestral-2508",
@@ -9547,40 +10128,6 @@ export const MODELS = {
9547
10128
  contextWindow: 262144,
9548
10129
  maxTokens: 4096,
9549
10130
  },
9550
- "mistralai/devstral-medium": {
9551
- id: "mistralai/devstral-medium",
9552
- name: "Mistral: Devstral Medium",
9553
- api: "openai-completions",
9554
- provider: "openrouter",
9555
- baseUrl: "https://openrouter.ai/api/v1",
9556
- reasoning: false,
9557
- input: ["text"],
9558
- cost: {
9559
- input: 0.39999999999999997,
9560
- output: 2,
9561
- cacheRead: 0.04,
9562
- cacheWrite: 0,
9563
- },
9564
- contextWindow: 131072,
9565
- maxTokens: 4096,
9566
- },
9567
- "mistralai/devstral-small": {
9568
- id: "mistralai/devstral-small",
9569
- name: "Mistral: Devstral Small 1.1",
9570
- api: "openai-completions",
9571
- provider: "openrouter",
9572
- baseUrl: "https://openrouter.ai/api/v1",
9573
- reasoning: false,
9574
- input: ["text"],
9575
- cost: {
9576
- input: 0.09999999999999999,
9577
- output: 0.3,
9578
- cacheRead: 0.01,
9579
- cacheWrite: 0,
9580
- },
9581
- contextWindow: 131072,
9582
- maxTokens: 4096,
9583
- },
9584
10131
  "mistralai/ministral-14b-2512": {
9585
10132
  id: "mistralai/ministral-14b-2512",
9586
10133
  name: "Mistral: Ministral 3 14B 2512",
@@ -9666,23 +10213,6 @@ export const MODELS = {
9666
10213
  contextWindow: 131072,
9667
10214
  maxTokens: 4096,
9668
10215
  },
9669
- "mistralai/mistral-large-2411": {
9670
- id: "mistralai/mistral-large-2411",
9671
- name: "Mistral Large 2411",
9672
- api: "openai-completions",
9673
- provider: "openrouter",
9674
- baseUrl: "https://openrouter.ai/api/v1",
9675
- reasoning: false,
9676
- input: ["text"],
9677
- cost: {
9678
- input: 2,
9679
- output: 6,
9680
- cacheRead: 0.19999999999999998,
9681
- cacheWrite: 0,
9682
- },
9683
- contextWindow: 131072,
9684
- maxTokens: 4096,
9685
- },
9686
10216
  "mistralai/mistral-large-2512": {
9687
10217
  id: "mistralai/mistral-large-2512",
9688
10218
  name: "Mistral: Mistral Large 3 2512",
@@ -9816,41 +10346,24 @@ export const MODELS = {
9816
10346
  cacheRead: 0,
9817
10347
  cacheWrite: 0,
9818
10348
  },
9819
- contextWindow: 128000,
9820
- maxTokens: 16384,
9821
- },
9822
- "mistralai/mixtral-8x22b-instruct": {
9823
- id: "mistralai/mixtral-8x22b-instruct",
9824
- name: "Mistral: Mixtral 8x22B Instruct",
9825
- api: "openai-completions",
9826
- provider: "openrouter",
9827
- baseUrl: "https://openrouter.ai/api/v1",
9828
- reasoning: false,
9829
- input: ["text"],
9830
- cost: {
9831
- input: 2,
9832
- output: 6,
9833
- cacheRead: 0.19999999999999998,
9834
- cacheWrite: 0,
9835
- },
9836
- contextWindow: 65536,
9837
- maxTokens: 4096,
10349
+ contextWindow: 128000,
10350
+ maxTokens: 16384,
9838
10351
  },
9839
- "mistralai/pixtral-large-2411": {
9840
- id: "mistralai/pixtral-large-2411",
9841
- name: "Mistral: Pixtral Large 2411",
10352
+ "mistralai/mixtral-8x22b-instruct": {
10353
+ id: "mistralai/mixtral-8x22b-instruct",
10354
+ name: "Mistral: Mixtral 8x22B Instruct",
9842
10355
  api: "openai-completions",
9843
10356
  provider: "openrouter",
9844
10357
  baseUrl: "https://openrouter.ai/api/v1",
9845
10358
  reasoning: false,
9846
- input: ["text", "image"],
10359
+ input: ["text"],
9847
10360
  cost: {
9848
10361
  input: 2,
9849
10362
  output: 6,
9850
10363
  cacheRead: 0.19999999999999998,
9851
10364
  cacheWrite: 0,
9852
10365
  },
9853
- contextWindow: 131072,
10366
+ contextWindow: 65536,
9854
10367
  maxTokens: 4096,
9855
10368
  },
9856
10369
  "mistralai/voxtral-small-24b-2507": {
@@ -9944,17 +10457,17 @@ export const MODELS = {
9944
10457
  api: "openai-completions",
9945
10458
  provider: "openrouter",
9946
10459
  baseUrl: "https://openrouter.ai/api/v1",
9947
- compat: { "supportsDeveloperRole": false },
10460
+ compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
9948
10461
  reasoning: true,
9949
10462
  input: ["text", "image"],
9950
10463
  cost: {
9951
- input: 0.684,
9952
- output: 3.42,
9953
- cacheRead: 0.144,
10464
+ input: 0.6799999999999999,
10465
+ output: 3.41,
10466
+ cacheRead: 0.33999999999999997,
9954
10467
  cacheWrite: 0,
9955
10468
  },
9956
10469
  contextWindow: 262144,
9957
- maxTokens: 262144,
10470
+ maxTokens: 262142,
9958
10471
  },
9959
10472
  "moonshotai/kimi-k2.6:free": {
9960
10473
  id: "moonshotai/kimi-k2.6:free",
@@ -9962,7 +10475,7 @@ export const MODELS = {
9962
10475
  api: "openai-completions",
9963
10476
  provider: "openrouter",
9964
10477
  baseUrl: "https://openrouter.ai/api/v1",
9965
- compat: { "supportsDeveloperRole": false },
10478
+ compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
9966
10479
  reasoning: true,
9967
10480
  input: ["text", "image"],
9968
10481
  cost: {
@@ -9974,23 +10487,6 @@ export const MODELS = {
9974
10487
  contextWindow: 262144,
9975
10488
  maxTokens: 4096,
9976
10489
  },
9977
- "nex-agi/deepseek-v3.1-nex-n1": {
9978
- id: "nex-agi/deepseek-v3.1-nex-n1",
9979
- name: "Nex AGI: DeepSeek V3.1 Nex N1",
9980
- api: "openai-completions",
9981
- provider: "openrouter",
9982
- baseUrl: "https://openrouter.ai/api/v1",
9983
- reasoning: false,
9984
- input: ["text"],
9985
- cost: {
9986
- input: 0.135,
9987
- output: 0.5,
9988
- cacheRead: 0,
9989
- cacheWrite: 0,
9990
- },
9991
- contextWindow: 131072,
9992
- maxTokens: 163840,
9993
- },
9994
10490
  "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
9995
10491
  id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
9996
10492
  name: "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5",
@@ -10000,7 +10496,7 @@ export const MODELS = {
10000
10496
  reasoning: true,
10001
10497
  input: ["text"],
10002
10498
  cost: {
10003
- input: 0.09999999999999999,
10499
+ input: 0.39999999999999997,
10004
10500
  output: 0.39999999999999997,
10005
10501
  cacheRead: 0,
10006
10502
  cacheWrite: 0,
@@ -10093,6 +10589,40 @@ export const MODELS = {
10093
10589
  contextWindow: 1000000,
10094
10590
  maxTokens: 262144,
10095
10591
  },
10592
+ "nvidia/nemotron-3-ultra-550b-a55b": {
10593
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
10594
+ name: "NVIDIA: Nemotron 3 Ultra",
10595
+ api: "openai-completions",
10596
+ provider: "openrouter",
10597
+ baseUrl: "https://openrouter.ai/api/v1",
10598
+ reasoning: true,
10599
+ input: ["text"],
10600
+ cost: {
10601
+ input: 0.5,
10602
+ output: 2.5,
10603
+ cacheRead: 0.15,
10604
+ cacheWrite: 0,
10605
+ },
10606
+ contextWindow: 1000000,
10607
+ maxTokens: 16384,
10608
+ },
10609
+ "nvidia/nemotron-3-ultra-550b-a55b:free": {
10610
+ id: "nvidia/nemotron-3-ultra-550b-a55b:free",
10611
+ name: "NVIDIA: Nemotron 3 Ultra (free)",
10612
+ api: "openai-completions",
10613
+ provider: "openrouter",
10614
+ baseUrl: "https://openrouter.ai/api/v1",
10615
+ reasoning: true,
10616
+ input: ["text"],
10617
+ cost: {
10618
+ input: 0,
10619
+ output: 0,
10620
+ cacheRead: 0,
10621
+ cacheWrite: 0,
10622
+ },
10623
+ contextWindow: 1000000,
10624
+ maxTokens: 65536,
10625
+ },
10096
10626
  "nvidia/nemotron-nano-12b-v2-vl:free": {
10097
10627
  id: "nvidia/nemotron-nano-12b-v2-vl:free",
10098
10628
  name: "NVIDIA: Nemotron Nano 12B 2 VL (free)",
@@ -10212,40 +10742,6 @@ export const MODELS = {
10212
10742
  contextWindow: 8191,
10213
10743
  maxTokens: 4096,
10214
10744
  },
10215
- "openai/gpt-4-0314": {
10216
- id: "openai/gpt-4-0314",
10217
- name: "OpenAI: GPT-4 (older v0314)",
10218
- api: "openai-completions",
10219
- provider: "openrouter",
10220
- baseUrl: "https://openrouter.ai/api/v1",
10221
- reasoning: false,
10222
- input: ["text"],
10223
- cost: {
10224
- input: 30,
10225
- output: 60,
10226
- cacheRead: 0,
10227
- cacheWrite: 0,
10228
- },
10229
- contextWindow: 8191,
10230
- maxTokens: 4096,
10231
- },
10232
- "openai/gpt-4-1106-preview": {
10233
- id: "openai/gpt-4-1106-preview",
10234
- name: "OpenAI: GPT-4 Turbo (older v1106)",
10235
- api: "openai-completions",
10236
- provider: "openrouter",
10237
- baseUrl: "https://openrouter.ai/api/v1",
10238
- reasoning: false,
10239
- input: ["text"],
10240
- cost: {
10241
- input: 10,
10242
- output: 30,
10243
- cacheRead: 0,
10244
- cacheWrite: 0,
10245
- },
10246
- contextWindow: 128000,
10247
- maxTokens: 4096,
10248
- },
10249
10745
  "openai/gpt-4-turbo": {
10250
10746
  id: "openai/gpt-4-turbo",
10251
10747
  name: "OpenAI: GPT-4 Turbo",
@@ -10913,13 +11409,13 @@ export const MODELS = {
10913
11409
  reasoning: true,
10914
11410
  input: ["text"],
10915
11411
  cost: {
10916
- input: 0.03,
11412
+ input: 0.029,
10917
11413
  output: 0.14,
10918
11414
  cacheRead: 0,
10919
11415
  cacheWrite: 0,
10920
11416
  },
10921
11417
  contextWindow: 131072,
10922
- maxTokens: 131072,
11418
+ maxTokens: 4096,
10923
11419
  },
10924
11420
  "openai/gpt-oss-20b:free": {
10925
11421
  id: "openai/gpt-oss-20b:free",
@@ -11227,23 +11723,6 @@ export const MODELS = {
11227
11723
  contextWindow: 131072,
11228
11724
  maxTokens: 16384,
11229
11725
  },
11230
- "qwen/qwen-2.5-7b-instruct": {
11231
- id: "qwen/qwen-2.5-7b-instruct",
11232
- name: "Qwen: Qwen2.5 7B Instruct",
11233
- api: "openai-completions",
11234
- provider: "openrouter",
11235
- baseUrl: "https://openrouter.ai/api/v1",
11236
- reasoning: false,
11237
- input: ["text"],
11238
- cost: {
11239
- input: 0.04,
11240
- output: 0.09999999999999999,
11241
- cacheRead: 0,
11242
- cacheWrite: 0,
11243
- },
11244
- contextWindow: 131072,
11245
- maxTokens: 32768,
11246
- },
11247
11726
  "qwen/qwen-plus": {
11248
11727
  id: "qwen/qwen-plus",
11249
11728
  name: "Qwen: Qwen-Plus",
@@ -11338,7 +11817,7 @@ export const MODELS = {
11338
11817
  reasoning: false,
11339
11818
  input: ["text"],
11340
11819
  cost: {
11341
- input: 0.071,
11820
+ input: 0.09,
11342
11821
  output: 0.09999999999999999,
11343
11822
  cacheRead: 0,
11344
11823
  cacheWrite: 0,
@@ -11355,13 +11834,13 @@ export const MODELS = {
11355
11834
  reasoning: true,
11356
11835
  input: ["text"],
11357
11836
  cost: {
11358
- input: 0.14950000000000002,
11359
- output: 1.495,
11360
- cacheRead: 0,
11837
+ input: 0.09999999999999999,
11838
+ output: 0.09999999999999999,
11839
+ cacheRead: 0.09999999999999999,
11361
11840
  cacheWrite: 0,
11362
11841
  },
11363
11842
  contextWindow: 262144,
11364
- maxTokens: 4096,
11843
+ maxTokens: 262144,
11365
11844
  },
11366
11845
  "qwen/qwen3-30b-a3b": {
11367
11846
  id: "qwen/qwen3-30b-a3b",
@@ -11372,13 +11851,13 @@ export const MODELS = {
11372
11851
  reasoning: true,
11373
11852
  input: ["text"],
11374
11853
  cost: {
11375
- input: 0.09,
11376
- output: 0.44999999999999996,
11854
+ input: 0.12,
11855
+ output: 0.5,
11377
11856
  cacheRead: 0,
11378
11857
  cacheWrite: 0,
11379
11858
  },
11380
11859
  contextWindow: 131072,
11381
- maxTokens: 20000,
11860
+ maxTokens: 16384,
11382
11861
  },
11383
11862
  "qwen/qwen3-30b-a3b-instruct-2507": {
11384
11863
  id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -11389,13 +11868,13 @@ export const MODELS = {
11389
11868
  reasoning: false,
11390
11869
  input: ["text"],
11391
11870
  cost: {
11392
- input: 0.09,
11393
- output: 0.3,
11871
+ input: 0.04815,
11872
+ output: 0.19305,
11394
11873
  cacheRead: 0,
11395
11874
  cacheWrite: 0,
11396
11875
  },
11397
- contextWindow: 262144,
11398
- maxTokens: 262144,
11876
+ contextWindow: 131072,
11877
+ maxTokens: 32000,
11399
11878
  },
11400
11879
  "qwen/qwen3-30b-a3b-thinking-2507": {
11401
11880
  id: "qwen/qwen3-30b-a3b-thinking-2507",
@@ -11797,13 +12276,13 @@ export const MODELS = {
11797
12276
  reasoning: true,
11798
12277
  input: ["text", "image"],
11799
12278
  cost: {
11800
- input: 0.13899999999999998,
12279
+ input: 0.14,
11801
12280
  output: 1,
11802
- cacheRead: 0,
12281
+ cacheRead: 0.049999999999999996,
11803
12282
  cacheWrite: 0,
11804
12283
  },
11805
12284
  contextWindow: 262144,
11806
- maxTokens: 4096,
12285
+ maxTokens: 262144,
11807
12286
  },
11808
12287
  "qwen/qwen3.5-397b-a17b": {
11809
12288
  id: "qwen/qwen3.5-397b-a17b",
@@ -11831,13 +12310,13 @@ export const MODELS = {
11831
12310
  reasoning: true,
11832
12311
  input: ["text", "image"],
11833
12312
  cost: {
11834
- input: 0.04,
12313
+ input: 0.09999999999999999,
11835
12314
  output: 0.15,
11836
12315
  cacheRead: 0,
11837
12316
  cacheWrite: 0,
11838
12317
  },
11839
12318
  contextWindow: 262144,
11840
- maxTokens: 81920,
12319
+ maxTokens: 262144,
11841
12320
  },
11842
12321
  "qwen/qwen3.5-flash-02-23": {
11843
12322
  id: "qwen/qwen3.5-flash-02-23",
@@ -11899,13 +12378,13 @@ export const MODELS = {
11899
12378
  reasoning: true,
11900
12379
  input: ["text", "image"],
11901
12380
  cost: {
11902
- input: 0.29,
11903
- output: 3.1999999999999997,
12381
+ input: 0.28900000000000003,
12382
+ output: 2.4,
11904
12383
  cacheRead: 0,
11905
12384
  cacheWrite: 0,
11906
12385
  },
11907
12386
  contextWindow: 262144,
11908
- maxTokens: 262140,
12387
+ maxTokens: 131072,
11909
12388
  },
11910
12389
  "qwen/qwen3.6-35b-a3b": {
11911
12390
  id: "qwen/qwen3.6-35b-a3b",
@@ -11992,6 +12471,23 @@ export const MODELS = {
11992
12471
  contextWindow: 1000000,
11993
12472
  maxTokens: 65536,
11994
12473
  },
12474
+ "qwen/qwen3.7-plus": {
12475
+ id: "qwen/qwen3.7-plus",
12476
+ name: "Qwen: Qwen3.7 Plus",
12477
+ api: "openai-completions",
12478
+ provider: "openrouter",
12479
+ baseUrl: "https://openrouter.ai/api/v1",
12480
+ reasoning: true,
12481
+ input: ["text", "image"],
12482
+ cost: {
12483
+ input: 0.39999999999999997,
12484
+ output: 1.5999999999999999,
12485
+ cacheRead: 0.08,
12486
+ cacheWrite: 0.5,
12487
+ },
12488
+ contextWindow: 1000000,
12489
+ maxTokens: 65536,
12490
+ },
11995
12491
  "rekaai/reka-edge": {
11996
12492
  id: "rekaai/reka-edge",
11997
12493
  name: "Reka Edge",
@@ -12026,23 +12522,6 @@ export const MODELS = {
12026
12522
  contextWindow: 256000,
12027
12523
  maxTokens: 128000,
12028
12524
  },
12029
- "sao10k/l3-euryale-70b": {
12030
- id: "sao10k/l3-euryale-70b",
12031
- name: "Sao10k: Llama 3 Euryale 70B v2.1",
12032
- api: "openai-completions",
12033
- provider: "openrouter",
12034
- baseUrl: "https://openrouter.ai/api/v1",
12035
- reasoning: false,
12036
- input: ["text"],
12037
- cost: {
12038
- input: 1.48,
12039
- output: 1.48,
12040
- cacheRead: 0,
12041
- cacheWrite: 0,
12042
- },
12043
- contextWindow: 8192,
12044
- maxTokens: 8192,
12045
- },
12046
12525
  "sao10k/l3.1-euryale-70b": {
12047
12526
  id: "sao10k/l3.1-euryale-70b",
12048
12527
  name: "Sao10K: Llama 3.1 Euryale 70B v2.2",
@@ -12230,40 +12709,6 @@ export const MODELS = {
12230
12709
  contextWindow: 262144,
12231
12710
  maxTokens: 65536,
12232
12711
  },
12233
- "xiaomi/mimo-v2-omni": {
12234
- id: "xiaomi/mimo-v2-omni",
12235
- name: "Xiaomi: MiMo-V2-Omni",
12236
- api: "openai-completions",
12237
- provider: "openrouter",
12238
- baseUrl: "https://openrouter.ai/api/v1",
12239
- reasoning: true,
12240
- input: ["text", "image"],
12241
- cost: {
12242
- input: 0.39999999999999997,
12243
- output: 2,
12244
- cacheRead: 0.08,
12245
- cacheWrite: 0,
12246
- },
12247
- contextWindow: 262144,
12248
- maxTokens: 65536,
12249
- },
12250
- "xiaomi/mimo-v2-pro": {
12251
- id: "xiaomi/mimo-v2-pro",
12252
- name: "Xiaomi: MiMo-V2-Pro",
12253
- api: "openai-completions",
12254
- provider: "openrouter",
12255
- baseUrl: "https://openrouter.ai/api/v1",
12256
- reasoning: true,
12257
- input: ["text"],
12258
- cost: {
12259
- input: 1,
12260
- output: 3,
12261
- cacheRead: 0.19999999999999998,
12262
- cacheWrite: 0,
12263
- },
12264
- contextWindow: 1048576,
12265
- maxTokens: 131072,
12266
- },
12267
12712
  "xiaomi/mimo-v2.5": {
12268
12713
  id: "xiaomi/mimo-v2.5",
12269
12714
  name: "Xiaomi: MiMo-V2.5",
@@ -12613,13 +13058,13 @@ export const MODELS = {
12613
13058
  reasoning: true,
12614
13059
  input: ["text", "image"],
12615
13060
  cost: {
12616
- input: 0.684,
12617
- output: 3.42,
12618
- cacheRead: 0.144,
13061
+ input: 0.6799999999999999,
13062
+ output: 3.41,
13063
+ cacheRead: 0.33999999999999997,
12619
13064
  cacheWrite: 0,
12620
13065
  },
12621
13066
  contextWindow: 262144,
12622
- maxTokens: 262144,
13067
+ maxTokens: 262142,
12623
13068
  },
12624
13069
  "~openai/gpt-latest": {
12625
13070
  id: "~openai/gpt-latest",
@@ -12810,7 +13255,7 @@ export const MODELS = {
12810
13255
  },
12811
13256
  "deepseek-ai/DeepSeek-V3": {
12812
13257
  id: "deepseek-ai/DeepSeek-V3",
12813
- name: "DeepSeek V3",
13258
+ name: "DeepSeek-V3",
12814
13259
  api: "openai-completions",
12815
13260
  provider: "together",
12816
13261
  baseUrl: "https://api.together.ai/v1",
@@ -12958,6 +13403,25 @@ export const MODELS = {
12958
13403
  contextWindow: 262144,
12959
13404
  maxTokens: 131000,
12960
13405
  },
13406
+ "nvidia/nemotron-3-ultra-550b-a55b": {
13407
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
13408
+ name: "Nemotron 3 Ultra 550B A55B",
13409
+ api: "openai-completions",
13410
+ provider: "together",
13411
+ baseUrl: "https://api.together.ai/v1",
13412
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13413
+ reasoning: true,
13414
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13415
+ input: ["text"],
13416
+ cost: {
13417
+ input: 0.6,
13418
+ output: 3.6,
13419
+ cacheRead: 0.2,
13420
+ cacheWrite: 0,
13421
+ },
13422
+ contextWindow: 512300,
13423
+ maxTokens: 512300,
13424
+ },
12961
13425
  "openai/gpt-oss-120b": {
12962
13426
  id: "openai/gpt-oss-120b",
12963
13427
  name: "GPT OSS 120B",
@@ -13021,7 +13485,7 @@ export const MODELS = {
13021
13485
  api: "anthropic-messages",
13022
13486
  provider: "vercel-ai-gateway",
13023
13487
  baseUrl: "https://ai-gateway.vercel.sh",
13024
- reasoning: false,
13488
+ reasoning: true,
13025
13489
  input: ["text"],
13026
13490
  cost: {
13027
13491
  input: 0.22,
@@ -13073,7 +13537,7 @@ export const MODELS = {
13073
13537
  provider: "vercel-ai-gateway",
13074
13538
  baseUrl: "https://ai-gateway.vercel.sh",
13075
13539
  reasoning: true,
13076
- input: ["text", "image"],
13540
+ input: ["text"],
13077
13541
  cost: {
13078
13542
  input: 1.3,
13079
13543
  output: 7.8,
@@ -13106,7 +13570,7 @@ export const MODELS = {
13106
13570
  api: "anthropic-messages",
13107
13571
  provider: "vercel-ai-gateway",
13108
13572
  baseUrl: "https://ai-gateway.vercel.sh",
13109
- reasoning: false,
13573
+ reasoning: true,
13110
13574
  input: ["text"],
13111
13575
  cost: {
13112
13576
  input: 1.5,
@@ -13140,7 +13604,7 @@ export const MODELS = {
13140
13604
  api: "anthropic-messages",
13141
13605
  provider: "vercel-ai-gateway",
13142
13606
  baseUrl: "https://ai-gateway.vercel.sh",
13143
- reasoning: false,
13607
+ reasoning: true,
13144
13608
  input: ["text"],
13145
13609
  cost: {
13146
13610
  input: 0.5,
@@ -13219,6 +13683,40 @@ export const MODELS = {
13219
13683
  contextWindow: 256000,
13220
13684
  maxTokens: 65536,
13221
13685
  },
13686
+ "alibaba/qwen3-next-80b-a3b-instruct": {
13687
+ id: "alibaba/qwen3-next-80b-a3b-instruct",
13688
+ name: "Qwen3 Next 80B A3B Instruct",
13689
+ api: "anthropic-messages",
13690
+ provider: "vercel-ai-gateway",
13691
+ baseUrl: "https://ai-gateway.vercel.sh",
13692
+ reasoning: false,
13693
+ input: ["text"],
13694
+ cost: {
13695
+ input: 0.15,
13696
+ output: 1.2,
13697
+ cacheRead: 0,
13698
+ cacheWrite: 0,
13699
+ },
13700
+ contextWindow: 131072,
13701
+ maxTokens: 32768,
13702
+ },
13703
+ "alibaba/qwen3-next-80b-a3b-thinking": {
13704
+ id: "alibaba/qwen3-next-80b-a3b-thinking",
13705
+ name: "Qwen3 Next 80B A3B Thinking",
13706
+ api: "anthropic-messages",
13707
+ provider: "vercel-ai-gateway",
13708
+ baseUrl: "https://ai-gateway.vercel.sh",
13709
+ reasoning: true,
13710
+ input: ["text"],
13711
+ cost: {
13712
+ input: 0.15,
13713
+ output: 1.2,
13714
+ cacheRead: 0,
13715
+ cacheWrite: 0,
13716
+ },
13717
+ contextWindow: 131072,
13718
+ maxTokens: 32768,
13719
+ },
13222
13720
  "alibaba/qwen3-vl-thinking": {
13223
13721
  id: "alibaba/qwen3-vl-thinking",
13224
13722
  name: "Qwen3 VL 235B A22B Thinking",
@@ -13311,14 +13809,31 @@ export const MODELS = {
13311
13809
  provider: "vercel-ai-gateway",
13312
13810
  baseUrl: "https://ai-gateway.vercel.sh",
13313
13811
  reasoning: true,
13314
- input: ["text", "image"],
13812
+ input: ["text"],
13315
13813
  cost: {
13316
13814
  input: 1.25,
13317
13815
  output: 3.75,
13318
13816
  cacheRead: 0.25,
13319
13817
  cacheWrite: 1.5625,
13320
13818
  },
13321
- contextWindow: 991000,
13819
+ contextWindow: 991000,
13820
+ maxTokens: 64000,
13821
+ },
13822
+ "alibaba/qwen3.7-plus": {
13823
+ id: "alibaba/qwen3.7-plus",
13824
+ name: "Qwen 3.7 Plus",
13825
+ api: "anthropic-messages",
13826
+ provider: "vercel-ai-gateway",
13827
+ baseUrl: "https://ai-gateway.vercel.sh",
13828
+ reasoning: true,
13829
+ input: ["text", "image"],
13830
+ cost: {
13831
+ input: 0.39999999999999997,
13832
+ output: 1.5999999999999999,
13833
+ cacheRead: 0.08,
13834
+ cacheWrite: 0.5,
13835
+ },
13836
+ contextWindow: 1000000,
13322
13837
  maxTokens: 64000,
13323
13838
  },
13324
13839
  "anthropic/claude-3-haiku": {
@@ -13448,7 +13963,7 @@ export const MODELS = {
13448
13963
  api: "anthropic-messages",
13449
13964
  provider: "vercel-ai-gateway",
13450
13965
  baseUrl: "https://ai-gateway.vercel.sh",
13451
- compat: { "forceAdaptiveThinking": true },
13966
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13452
13967
  reasoning: true,
13453
13968
  thinkingLevelMap: { "xhigh": "xhigh" },
13454
13969
  input: ["text", "image"],
@@ -13467,7 +13982,7 @@ export const MODELS = {
13467
13982
  api: "anthropic-messages",
13468
13983
  provider: "vercel-ai-gateway",
13469
13984
  baseUrl: "https://ai-gateway.vercel.sh",
13470
- compat: { "forceAdaptiveThinking": true },
13985
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13471
13986
  reasoning: true,
13472
13987
  thinkingLevelMap: { "xhigh": "xhigh" },
13473
13988
  input: ["text", "image"],
@@ -13626,17 +14141,17 @@ export const MODELS = {
13626
14141
  reasoning: false,
13627
14142
  input: ["text"],
13628
14143
  cost: {
13629
- input: 0.77,
13630
- output: 0.77,
13631
- cacheRead: 0,
14144
+ input: 0.27,
14145
+ output: 1.12,
14146
+ cacheRead: 0.135,
13632
14147
  cacheWrite: 0,
13633
14148
  },
13634
14149
  contextWindow: 163840,
13635
- maxTokens: 16384,
14150
+ maxTokens: 163840,
13636
14151
  },
13637
14152
  "deepseek/deepseek-v3.1": {
13638
14153
  id: "deepseek/deepseek-v3.1",
13639
- name: "DeepSeek-V3.1",
14154
+ name: "DeepSeek V3.1",
13640
14155
  api: "anthropic-messages",
13641
14156
  provider: "vercel-ai-gateway",
13642
14157
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -13674,8 +14189,8 @@ export const MODELS = {
13674
14189
  api: "anthropic-messages",
13675
14190
  provider: "vercel-ai-gateway",
13676
14191
  baseUrl: "https://ai-gateway.vercel.sh",
13677
- reasoning: false,
13678
- input: ["text"],
14192
+ reasoning: true,
14193
+ input: ["text", "image"],
13679
14194
  cost: {
13680
14195
  input: 0.28,
13681
14196
  output: 0.42,
@@ -13691,8 +14206,8 @@ export const MODELS = {
13691
14206
  api: "anthropic-messages",
13692
14207
  provider: "vercel-ai-gateway",
13693
14208
  baseUrl: "https://ai-gateway.vercel.sh",
13694
- reasoning: false,
13695
- input: ["text"],
14209
+ reasoning: true,
14210
+ input: ["text", "image"],
13696
14211
  cost: {
13697
14212
  input: 0.62,
13698
14213
  output: 1.85,
@@ -13709,7 +14224,7 @@ export const MODELS = {
13709
14224
  provider: "vercel-ai-gateway",
13710
14225
  baseUrl: "https://ai-gateway.vercel.sh",
13711
14226
  reasoning: true,
13712
- input: ["text"],
14227
+ input: ["text", "image"],
13713
14228
  cost: {
13714
14229
  input: 0.14,
13715
14230
  output: 0.28,
@@ -13736,40 +14251,6 @@ export const MODELS = {
13736
14251
  contextWindow: 1000000,
13737
14252
  maxTokens: 384000,
13738
14253
  },
13739
- "google/gemini-2.0-flash": {
13740
- id: "google/gemini-2.0-flash",
13741
- name: "Gemini 2.0 Flash",
13742
- api: "anthropic-messages",
13743
- provider: "vercel-ai-gateway",
13744
- baseUrl: "https://ai-gateway.vercel.sh",
13745
- reasoning: false,
13746
- input: ["text", "image"],
13747
- cost: {
13748
- input: 0.15,
13749
- output: 0.6,
13750
- cacheRead: 0.024999999999999998,
13751
- cacheWrite: 0,
13752
- },
13753
- contextWindow: 1048576,
13754
- maxTokens: 8192,
13755
- },
13756
- "google/gemini-2.0-flash-lite": {
13757
- id: "google/gemini-2.0-flash-lite",
13758
- name: "Gemini 2.0 Flash Lite",
13759
- api: "anthropic-messages",
13760
- provider: "vercel-ai-gateway",
13761
- baseUrl: "https://ai-gateway.vercel.sh",
13762
- reasoning: false,
13763
- input: ["text", "image"],
13764
- cost: {
13765
- input: 0.075,
13766
- output: 0.3,
13767
- cacheRead: 0.02,
13768
- cacheWrite: 0,
13769
- },
13770
- contextWindow: 1048576,
13771
- maxTokens: 8192,
13772
- },
13773
14254
  "google/gemini-2.5-flash": {
13774
14255
  id: "google/gemini-2.5-flash",
13775
14256
  name: "Gemini 2.5 Flash",
@@ -13929,12 +14410,12 @@ export const MODELS = {
13929
14410
  api: "anthropic-messages",
13930
14411
  provider: "vercel-ai-gateway",
13931
14412
  baseUrl: "https://ai-gateway.vercel.sh",
13932
- reasoning: false,
14413
+ reasoning: true,
13933
14414
  input: ["text", "image"],
13934
14415
  cost: {
13935
- input: 0.13,
13936
- output: 0.39999999999999997,
13937
- cacheRead: 0,
14416
+ input: 0.15,
14417
+ output: 0.6,
14418
+ cacheRead: 0.015,
13938
14419
  cacheWrite: 0,
13939
14420
  },
13940
14421
  contextWindow: 262144,
@@ -14236,7 +14717,7 @@ export const MODELS = {
14236
14717
  provider: "vercel-ai-gateway",
14237
14718
  baseUrl: "https://ai-gateway.vercel.sh",
14238
14719
  reasoning: true,
14239
- input: ["text", "image"],
14720
+ input: ["text"],
14240
14721
  cost: {
14241
14722
  input: 0.3,
14242
14723
  output: 1.2,
@@ -14253,7 +14734,7 @@ export const MODELS = {
14253
14734
  provider: "vercel-ai-gateway",
14254
14735
  baseUrl: "https://ai-gateway.vercel.sh",
14255
14736
  reasoning: true,
14256
- input: ["text", "image"],
14737
+ input: ["text"],
14257
14738
  cost: {
14258
14739
  input: 0.6,
14259
14740
  output: 2.4,
@@ -14263,6 +14744,23 @@ export const MODELS = {
14263
14744
  contextWindow: 204800,
14264
14745
  maxTokens: 131100,
14265
14746
  },
14747
+ "minimax/minimax-m3": {
14748
+ id: "minimax/minimax-m3",
14749
+ name: "MiniMax M3",
14750
+ api: "anthropic-messages",
14751
+ provider: "vercel-ai-gateway",
14752
+ baseUrl: "https://ai-gateway.vercel.sh",
14753
+ reasoning: true,
14754
+ input: ["text", "image"],
14755
+ cost: {
14756
+ input: 0.3,
14757
+ output: 1.2,
14758
+ cacheRead: 0.06,
14759
+ cacheWrite: 0,
14760
+ },
14761
+ contextWindow: 1000000,
14762
+ maxTokens: 1000000,
14763
+ },
14266
14764
  "mistral/codestral": {
14267
14765
  id: "mistral/codestral",
14268
14766
  name: "Mistral Codestral",
@@ -14399,6 +14897,23 @@ export const MODELS = {
14399
14897
  contextWindow: 256000,
14400
14898
  maxTokens: 256000,
14401
14899
  },
14900
+ "mistral/mistral-nemo": {
14901
+ id: "mistral/mistral-nemo",
14902
+ name: "Mistral Nemo 12B",
14903
+ api: "anthropic-messages",
14904
+ provider: "vercel-ai-gateway",
14905
+ baseUrl: "https://ai-gateway.vercel.sh",
14906
+ reasoning: false,
14907
+ input: ["text"],
14908
+ cost: {
14909
+ input: 0.02,
14910
+ output: 0.04,
14911
+ cacheRead: 0,
14912
+ cacheWrite: 0,
14913
+ },
14914
+ contextWindow: 131072,
14915
+ maxTokens: 131072,
14916
+ },
14402
14917
  "mistral/mistral-small": {
14403
14918
  id: "mistral/mistral-small",
14404
14919
  name: "Mistral Small",
@@ -14552,6 +15067,40 @@ export const MODELS = {
14552
15067
  contextWindow: 262000,
14553
15068
  maxTokens: 262000,
14554
15069
  },
15070
+ "nvidia/nemotron-3-super-120b-a12b": {
15071
+ id: "nvidia/nemotron-3-super-120b-a12b",
15072
+ name: "NVIDIA Nemotron 3 Super 120B A12B",
15073
+ api: "anthropic-messages",
15074
+ provider: "vercel-ai-gateway",
15075
+ baseUrl: "https://ai-gateway.vercel.sh",
15076
+ reasoning: true,
15077
+ input: ["text"],
15078
+ cost: {
15079
+ input: 0.15,
15080
+ output: 0.65,
15081
+ cacheRead: 0,
15082
+ cacheWrite: 0,
15083
+ },
15084
+ contextWindow: 256000,
15085
+ maxTokens: 32000,
15086
+ },
15087
+ "nvidia/nemotron-3-ultra-550b-a55b": {
15088
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
15089
+ name: "Nemotron 3 Ultra",
15090
+ api: "anthropic-messages",
15091
+ provider: "vercel-ai-gateway",
15092
+ baseUrl: "https://ai-gateway.vercel.sh",
15093
+ reasoning: true,
15094
+ input: ["text"],
15095
+ cost: {
15096
+ input: 0.6,
15097
+ output: 2.4,
15098
+ cacheRead: 0.12,
15099
+ cacheWrite: 0,
15100
+ },
15101
+ contextWindow: 1000000,
15102
+ maxTokens: 65000,
15103
+ },
14555
15104
  "nvidia/nemotron-nano-12b-v2-vl": {
14556
15105
  id: "nvidia/nemotron-nano-12b-v2-vl",
14557
15106
  name: "Nvidia Nemotron Nano 12B V2 VL",
@@ -14729,7 +15278,7 @@ export const MODELS = {
14729
15278
  provider: "vercel-ai-gateway",
14730
15279
  baseUrl: "https://ai-gateway.vercel.sh",
14731
15280
  reasoning: true,
14732
- input: ["text"],
15281
+ input: ["text", "image"],
14733
15282
  cost: {
14734
15283
  input: 1.25,
14735
15284
  output: 10,
@@ -15091,6 +15640,23 @@ export const MODELS = {
15091
15640
  contextWindow: 1000000,
15092
15641
  maxTokens: 128000,
15093
15642
  },
15643
+ "openai/gpt-oss-120b": {
15644
+ id: "openai/gpt-oss-120b",
15645
+ name: "GPT OSS 120B",
15646
+ api: "anthropic-messages",
15647
+ provider: "vercel-ai-gateway",
15648
+ baseUrl: "https://ai-gateway.vercel.sh",
15649
+ reasoning: true,
15650
+ input: ["text"],
15651
+ cost: {
15652
+ input: 0.35,
15653
+ output: 0.75,
15654
+ cacheRead: 0.25,
15655
+ cacheWrite: 0,
15656
+ },
15657
+ contextWindow: 131072,
15658
+ maxTokens: 131000,
15659
+ },
15094
15660
  "openai/gpt-oss-20b": {
15095
15661
  id: "openai/gpt-oss-20b",
15096
15662
  name: "GPT OSS 20B",
@@ -15261,6 +15827,40 @@ export const MODELS = {
15261
15827
  contextWindow: 200000,
15262
15828
  maxTokens: 8000,
15263
15829
  },
15830
+ "stepfun/step-3.5-flash": {
15831
+ id: "stepfun/step-3.5-flash",
15832
+ name: "StepFun 3.5 Flash",
15833
+ api: "anthropic-messages",
15834
+ provider: "vercel-ai-gateway",
15835
+ baseUrl: "https://ai-gateway.vercel.sh",
15836
+ reasoning: true,
15837
+ input: ["text"],
15838
+ cost: {
15839
+ input: 0.09,
15840
+ output: 0.3,
15841
+ cacheRead: 0,
15842
+ cacheWrite: 0.02,
15843
+ },
15844
+ contextWindow: 262114,
15845
+ maxTokens: 262114,
15846
+ },
15847
+ "stepfun/step-3.7-flash": {
15848
+ id: "stepfun/step-3.7-flash",
15849
+ name: "Step 3.7 Flash",
15850
+ api: "anthropic-messages",
15851
+ provider: "vercel-ai-gateway",
15852
+ baseUrl: "https://ai-gateway.vercel.sh",
15853
+ reasoning: true,
15854
+ input: ["text", "image"],
15855
+ cost: {
15856
+ input: 0.19999999999999998,
15857
+ output: 1.15,
15858
+ cacheRead: 0.04,
15859
+ cacheWrite: 0,
15860
+ },
15861
+ contextWindow: 256000,
15862
+ maxTokens: 256000,
15863
+ },
15264
15864
  "xai/grok-4.1-fast-non-reasoning": {
15265
15865
  id: "xai/grok-4.1-fast-non-reasoning",
15266
15866
  name: "Grok 4.1 Fast Non-Reasoning",
@@ -15539,7 +16139,7 @@ export const MODELS = {
15539
16139
  api: "anthropic-messages",
15540
16140
  provider: "vercel-ai-gateway",
15541
16141
  baseUrl: "https://ai-gateway.vercel.sh",
15542
- reasoning: false,
16142
+ reasoning: true,
15543
16143
  input: ["text", "image"],
15544
16144
  cost: {
15545
16145
  input: 0.6,
@@ -15693,7 +16293,7 @@ export const MODELS = {
15693
16293
  provider: "vercel-ai-gateway",
15694
16294
  baseUrl: "https://ai-gateway.vercel.sh",
15695
16295
  reasoning: true,
15696
- input: ["text"],
16296
+ input: ["text", "image"],
15697
16297
  cost: {
15698
16298
  input: 1.4,
15699
16299
  output: 4.4,
@@ -16248,5 +16848,97 @@ export const MODELS = {
16248
16848
  maxTokens: 131072,
16249
16849
  },
16250
16850
  },
16851
+ "zai-coding-cn": {
16852
+ "glm-4.5-air": {
16853
+ id: "glm-4.5-air",
16854
+ name: "GLM-4.5-Air",
16855
+ api: "openai-completions",
16856
+ provider: "zai-coding-cn",
16857
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16858
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
16859
+ reasoning: true,
16860
+ input: ["text"],
16861
+ cost: {
16862
+ input: 0,
16863
+ output: 0,
16864
+ cacheRead: 0,
16865
+ cacheWrite: 0,
16866
+ },
16867
+ contextWindow: 131072,
16868
+ maxTokens: 98304,
16869
+ },
16870
+ "glm-4.7": {
16871
+ id: "glm-4.7",
16872
+ name: "GLM-4.7",
16873
+ api: "openai-completions",
16874
+ provider: "zai-coding-cn",
16875
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16876
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16877
+ reasoning: true,
16878
+ input: ["text"],
16879
+ cost: {
16880
+ input: 0,
16881
+ output: 0,
16882
+ cacheRead: 0,
16883
+ cacheWrite: 0,
16884
+ },
16885
+ contextWindow: 204800,
16886
+ maxTokens: 131072,
16887
+ },
16888
+ "glm-5-turbo": {
16889
+ id: "glm-5-turbo",
16890
+ name: "GLM-5-Turbo",
16891
+ api: "openai-completions",
16892
+ provider: "zai-coding-cn",
16893
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16894
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16895
+ reasoning: true,
16896
+ input: ["text"],
16897
+ cost: {
16898
+ input: 0,
16899
+ output: 0,
16900
+ cacheRead: 0,
16901
+ cacheWrite: 0,
16902
+ },
16903
+ contextWindow: 200000,
16904
+ maxTokens: 131072,
16905
+ },
16906
+ "glm-5.1": {
16907
+ id: "glm-5.1",
16908
+ name: "GLM-5.1",
16909
+ api: "openai-completions",
16910
+ provider: "zai-coding-cn",
16911
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16912
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16913
+ reasoning: true,
16914
+ input: ["text"],
16915
+ cost: {
16916
+ input: 0,
16917
+ output: 0,
16918
+ cacheRead: 0,
16919
+ cacheWrite: 0,
16920
+ },
16921
+ contextWindow: 200000,
16922
+ maxTokens: 131072,
16923
+ },
16924
+ "glm-5v-turbo": {
16925
+ id: "glm-5v-turbo",
16926
+ name: "GLM-5V-Turbo",
16927
+ api: "openai-completions",
16928
+ provider: "zai-coding-cn",
16929
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16930
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16931
+ reasoning: true,
16932
+ input: ["text", "image"],
16933
+ cost: {
16934
+ input: 0,
16935
+ output: 0,
16936
+ cacheRead: 0,
16937
+ cacheWrite: 0,
16938
+ },
16939
+ contextWindow: 200000,
16940
+ maxTokens: 131072,
16941
+ },
16942
+ },
16251
16943
  };
16252
16944
  //# sourceMappingURL=models.generated.js.map