@earendil-works/pi-ai 0.78.0 → 0.79.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +12 -4
- package/dist/env-api-keys.d.ts.map +1 -1
- package/dist/env-api-keys.js +3 -0
- package/dist/env-api-keys.js.map +1 -1
- package/dist/image-models.generated.d.ts +45 -0
- package/dist/image-models.generated.d.ts.map +1 -1
- package/dist/image-models.generated.js +45 -0
- package/dist/image-models.generated.js.map +1 -1
- package/dist/models.generated.d.ts +1365 -401
- package/dist/models.generated.d.ts.map +1 -1
- package/dist/models.generated.js +1331 -639
- package/dist/models.generated.js.map +1 -1
- package/dist/providers/amazon-bedrock.d.ts.map +1 -1
- package/dist/providers/amazon-bedrock.js +46 -19
- package/dist/providers/amazon-bedrock.js.map +1 -1
- package/dist/providers/anthropic.d.ts.map +1 -1
- package/dist/providers/anthropic.js +5 -4
- package/dist/providers/anthropic.js.map +1 -1
- package/dist/providers/openai-completions.d.ts.map +1 -1
- package/dist/providers/openai-completions.js +33 -12
- package/dist/providers/openai-completions.js.map +1 -1
- package/dist/providers/openai-responses-shared.d.ts.map +1 -1
- package/dist/providers/openai-responses-shared.js +2 -1
- package/dist/providers/openai-responses-shared.js.map +1 -1
- package/dist/providers/openai-responses.d.ts.map +1 -1
- package/dist/providers/openai-responses.js +1 -0
- package/dist/providers/openai-responses.js.map +1 -1
- package/dist/types.d.ts +12 -4
- package/dist/types.d.ts.map +1 -1
- package/dist/types.js.map +1 -1
- package/dist/utils/oauth/github-copilot.d.ts.map +1 -1
- package/dist/utils/oauth/github-copilot.js +13 -1
- package/dist/utils/oauth/github-copilot.js.map +1 -1
- package/dist/utils/oauth/openai-codex.d.ts.map +1 -1
- package/dist/utils/oauth/openai-codex.js +4 -2
- package/dist/utils/oauth/openai-codex.js.map +1 -1
- package/package.json +1 -1
package/dist/models.generated.js
CHANGED
|
@@ -391,8 +391,8 @@ export const MODELS = {
|
|
|
391
391
|
thinkingLevelMap: { "xhigh": "max" },
|
|
392
392
|
input: ["text", "image"],
|
|
393
393
|
cost: {
|
|
394
|
-
input: 5,
|
|
395
|
-
output:
|
|
394
|
+
input: 5.5,
|
|
395
|
+
output: 27.5,
|
|
396
396
|
cacheRead: 0.5,
|
|
397
397
|
cacheWrite: 6.25,
|
|
398
398
|
},
|
|
@@ -409,10 +409,10 @@ export const MODELS = {
|
|
|
409
409
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
410
410
|
input: ["text", "image"],
|
|
411
411
|
cost: {
|
|
412
|
-
input: 5,
|
|
413
|
-
output:
|
|
414
|
-
cacheRead: 0.
|
|
415
|
-
cacheWrite: 6.
|
|
412
|
+
input: 5.5,
|
|
413
|
+
output: 27.5,
|
|
414
|
+
cacheRead: 0.55,
|
|
415
|
+
cacheWrite: 6.875,
|
|
416
416
|
},
|
|
417
417
|
contextWindow: 1000000,
|
|
418
418
|
maxTokens: 128000,
|
|
@@ -427,10 +427,10 @@ export const MODELS = {
|
|
|
427
427
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
428
428
|
input: ["text", "image"],
|
|
429
429
|
cost: {
|
|
430
|
-
input: 5,
|
|
431
|
-
output:
|
|
432
|
-
cacheRead: 0.
|
|
433
|
-
cacheWrite: 6.
|
|
430
|
+
input: 5.5,
|
|
431
|
+
output: 27.5,
|
|
432
|
+
cacheRead: 0.55,
|
|
433
|
+
cacheWrite: 6.875,
|
|
434
434
|
},
|
|
435
435
|
contextWindow: 1000000,
|
|
436
436
|
maxTokens: 128000,
|
|
@@ -444,10 +444,10 @@ export const MODELS = {
|
|
|
444
444
|
reasoning: true,
|
|
445
445
|
input: ["text", "image"],
|
|
446
446
|
cost: {
|
|
447
|
-
input: 3,
|
|
448
|
-
output:
|
|
449
|
-
cacheRead: 0.
|
|
450
|
-
cacheWrite:
|
|
447
|
+
input: 3.3,
|
|
448
|
+
output: 16.5,
|
|
449
|
+
cacheRead: 0.33,
|
|
450
|
+
cacheWrite: 4.125,
|
|
451
451
|
},
|
|
452
452
|
contextWindow: 200000,
|
|
453
453
|
maxTokens: 64000,
|
|
@@ -461,10 +461,10 @@ export const MODELS = {
|
|
|
461
461
|
reasoning: true,
|
|
462
462
|
input: ["text", "image"],
|
|
463
463
|
cost: {
|
|
464
|
-
input: 3,
|
|
465
|
-
output:
|
|
466
|
-
cacheRead: 0.
|
|
467
|
-
cacheWrite:
|
|
464
|
+
input: 3.3,
|
|
465
|
+
output: 16.5,
|
|
466
|
+
cacheRead: 0.33,
|
|
467
|
+
cacheWrite: 4.125,
|
|
468
468
|
},
|
|
469
469
|
contextWindow: 1000000,
|
|
470
470
|
maxTokens: 64000,
|
|
@@ -1086,6 +1086,59 @@ export const MODELS = {
|
|
|
1086
1086
|
contextWindow: 262144,
|
|
1087
1087
|
maxTokens: 131072,
|
|
1088
1088
|
},
|
|
1089
|
+
"openai.gpt-5.4": {
|
|
1090
|
+
id: "openai.gpt-5.4",
|
|
1091
|
+
name: "GPT-5.4",
|
|
1092
|
+
api: "bedrock-converse-stream",
|
|
1093
|
+
provider: "amazon-bedrock",
|
|
1094
|
+
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
1095
|
+
reasoning: true,
|
|
1096
|
+
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
1097
|
+
input: ["text", "image"],
|
|
1098
|
+
cost: {
|
|
1099
|
+
input: 2.75,
|
|
1100
|
+
output: 16.5,
|
|
1101
|
+
cacheRead: 0.275,
|
|
1102
|
+
cacheWrite: 0,
|
|
1103
|
+
},
|
|
1104
|
+
contextWindow: 272000,
|
|
1105
|
+
maxTokens: 128000,
|
|
1106
|
+
},
|
|
1107
|
+
"openai.gpt-5.5": {
|
|
1108
|
+
id: "openai.gpt-5.5",
|
|
1109
|
+
name: "GPT-5.5",
|
|
1110
|
+
api: "bedrock-converse-stream",
|
|
1111
|
+
provider: "amazon-bedrock",
|
|
1112
|
+
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
1113
|
+
reasoning: true,
|
|
1114
|
+
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
1115
|
+
input: ["text", "image"],
|
|
1116
|
+
cost: {
|
|
1117
|
+
input: 5.5,
|
|
1118
|
+
output: 33,
|
|
1119
|
+
cacheRead: 0.55,
|
|
1120
|
+
cacheWrite: 0,
|
|
1121
|
+
},
|
|
1122
|
+
contextWindow: 272000,
|
|
1123
|
+
maxTokens: 128000,
|
|
1124
|
+
},
|
|
1125
|
+
"openai.gpt-oss-120b": {
|
|
1126
|
+
id: "openai.gpt-oss-120b",
|
|
1127
|
+
name: "gpt-oss-120b",
|
|
1128
|
+
api: "bedrock-converse-stream",
|
|
1129
|
+
provider: "amazon-bedrock",
|
|
1130
|
+
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
1131
|
+
reasoning: false,
|
|
1132
|
+
input: ["text"],
|
|
1133
|
+
cost: {
|
|
1134
|
+
input: 0.15,
|
|
1135
|
+
output: 0.6,
|
|
1136
|
+
cacheRead: 0,
|
|
1137
|
+
cacheWrite: 0,
|
|
1138
|
+
},
|
|
1139
|
+
contextWindow: 128000,
|
|
1140
|
+
maxTokens: 16384,
|
|
1141
|
+
},
|
|
1089
1142
|
"openai.gpt-oss-120b-1:0": {
|
|
1090
1143
|
id: "openai.gpt-oss-120b-1:0",
|
|
1091
1144
|
name: "gpt-oss-120b",
|
|
@@ -1103,6 +1156,23 @@ export const MODELS = {
|
|
|
1103
1156
|
contextWindow: 128000,
|
|
1104
1157
|
maxTokens: 16384,
|
|
1105
1158
|
},
|
|
1159
|
+
"openai.gpt-oss-20b": {
|
|
1160
|
+
id: "openai.gpt-oss-20b",
|
|
1161
|
+
name: "gpt-oss-20b",
|
|
1162
|
+
api: "bedrock-converse-stream",
|
|
1163
|
+
provider: "amazon-bedrock",
|
|
1164
|
+
baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
|
|
1165
|
+
reasoning: false,
|
|
1166
|
+
input: ["text"],
|
|
1167
|
+
cost: {
|
|
1168
|
+
input: 0.07,
|
|
1169
|
+
output: 0.3,
|
|
1170
|
+
cacheRead: 0,
|
|
1171
|
+
cacheWrite: 0,
|
|
1172
|
+
},
|
|
1173
|
+
contextWindow: 128000,
|
|
1174
|
+
maxTokens: 16384,
|
|
1175
|
+
},
|
|
1106
1176
|
"openai.gpt-oss-20b-1:0": {
|
|
1107
1177
|
id: "openai.gpt-oss-20b-1:0",
|
|
1108
1178
|
name: "gpt-oss-20b",
|
|
@@ -1549,6 +1619,63 @@ export const MODELS = {
|
|
|
1549
1619
|
maxTokens: 101376,
|
|
1550
1620
|
},
|
|
1551
1621
|
},
|
|
1622
|
+
"ant-ling": {
|
|
1623
|
+
"Ling-2.6-1T": {
|
|
1624
|
+
id: "Ling-2.6-1T",
|
|
1625
|
+
name: "Ling 2.6 1T",
|
|
1626
|
+
api: "openai-completions",
|
|
1627
|
+
provider: "ant-ling",
|
|
1628
|
+
baseUrl: "https://api.ant-ling.com/v1",
|
|
1629
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
|
|
1630
|
+
reasoning: false,
|
|
1631
|
+
input: ["text"],
|
|
1632
|
+
cost: {
|
|
1633
|
+
input: 0.06,
|
|
1634
|
+
output: 0.25,
|
|
1635
|
+
cacheRead: 0,
|
|
1636
|
+
cacheWrite: 0,
|
|
1637
|
+
},
|
|
1638
|
+
contextWindow: 262144,
|
|
1639
|
+
maxTokens: 65536,
|
|
1640
|
+
},
|
|
1641
|
+
"Ling-2.6-flash": {
|
|
1642
|
+
id: "Ling-2.6-flash",
|
|
1643
|
+
name: "Ling 2.6 Flash",
|
|
1644
|
+
api: "openai-completions",
|
|
1645
|
+
provider: "ant-ling",
|
|
1646
|
+
baseUrl: "https://api.ant-ling.com/v1",
|
|
1647
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
|
|
1648
|
+
reasoning: false,
|
|
1649
|
+
input: ["text"],
|
|
1650
|
+
cost: {
|
|
1651
|
+
input: 0.01,
|
|
1652
|
+
output: 0.02,
|
|
1653
|
+
cacheRead: 0,
|
|
1654
|
+
cacheWrite: 0,
|
|
1655
|
+
},
|
|
1656
|
+
contextWindow: 262144,
|
|
1657
|
+
maxTokens: 65536,
|
|
1658
|
+
},
|
|
1659
|
+
"Ring-2.6-1T": {
|
|
1660
|
+
id: "Ring-2.6-1T",
|
|
1661
|
+
name: "Ring 2.6 1T",
|
|
1662
|
+
api: "openai-completions",
|
|
1663
|
+
provider: "ant-ling",
|
|
1664
|
+
baseUrl: "https://api.ant-ling.com/v1",
|
|
1665
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "thinkingFormat": "ant-ling" },
|
|
1666
|
+
reasoning: true,
|
|
1667
|
+
thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
|
|
1668
|
+
input: ["text"],
|
|
1669
|
+
cost: {
|
|
1670
|
+
input: 0.06,
|
|
1671
|
+
output: 0.25,
|
|
1672
|
+
cacheRead: 0,
|
|
1673
|
+
cacheWrite: 0,
|
|
1674
|
+
},
|
|
1675
|
+
contextWindow: 262144,
|
|
1676
|
+
maxTokens: 65536,
|
|
1677
|
+
},
|
|
1678
|
+
},
|
|
1552
1679
|
"anthropic": {
|
|
1553
1680
|
"claude-3-5-haiku-20241022": {
|
|
1554
1681
|
id: "claude-3-5-haiku-20241022",
|
|
@@ -1847,7 +1974,7 @@ export const MODELS = {
|
|
|
1847
1974
|
api: "anthropic-messages",
|
|
1848
1975
|
provider: "anthropic",
|
|
1849
1976
|
baseUrl: "https://api.anthropic.com",
|
|
1850
|
-
compat: { "forceAdaptiveThinking": true },
|
|
1977
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
1851
1978
|
reasoning: true,
|
|
1852
1979
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
1853
1980
|
input: ["text", "image"],
|
|
@@ -1866,7 +1993,7 @@ export const MODELS = {
|
|
|
1866
1993
|
api: "anthropic-messages",
|
|
1867
1994
|
provider: "anthropic",
|
|
1868
1995
|
baseUrl: "https://api.anthropic.com",
|
|
1869
|
-
compat: { "forceAdaptiveThinking": true },
|
|
1996
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
1870
1997
|
reasoning: true,
|
|
1871
1998
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
1872
1999
|
input: ["text", "image"],
|
|
@@ -2955,7 +3082,26 @@ export const MODELS = {
|
|
|
2955
3082
|
api: "anthropic-messages",
|
|
2956
3083
|
provider: "cloudflare-ai-gateway",
|
|
2957
3084
|
baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
|
|
2958
|
-
compat: { "forceAdaptiveThinking": true },
|
|
3085
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
3086
|
+
reasoning: true,
|
|
3087
|
+
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
3088
|
+
input: ["text", "image"],
|
|
3089
|
+
cost: {
|
|
3090
|
+
input: 5,
|
|
3091
|
+
output: 25,
|
|
3092
|
+
cacheRead: 0.5,
|
|
3093
|
+
cacheWrite: 6.25,
|
|
3094
|
+
},
|
|
3095
|
+
contextWindow: 1000000,
|
|
3096
|
+
maxTokens: 128000,
|
|
3097
|
+
},
|
|
3098
|
+
"claude-opus-4-8": {
|
|
3099
|
+
id: "claude-opus-4-8",
|
|
3100
|
+
name: "Claude Opus 4.8",
|
|
3101
|
+
api: "anthropic-messages",
|
|
3102
|
+
provider: "cloudflare-ai-gateway",
|
|
3103
|
+
baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
|
|
3104
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
2959
3105
|
reasoning: true,
|
|
2960
3106
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
2961
3107
|
input: ["text", "image"],
|
|
@@ -3463,24 +3609,6 @@ export const MODELS = {
|
|
|
3463
3609
|
contextWindow: 128000,
|
|
3464
3610
|
maxTokens: 128000,
|
|
3465
3611
|
},
|
|
3466
|
-
"@cf/moonshotai/kimi-k2.5": {
|
|
3467
|
-
id: "@cf/moonshotai/kimi-k2.5",
|
|
3468
|
-
name: "Kimi K2.5",
|
|
3469
|
-
api: "openai-completions",
|
|
3470
|
-
provider: "cloudflare-workers-ai",
|
|
3471
|
-
baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
|
|
3472
|
-
compat: { "sendSessionAffinityHeaders": true },
|
|
3473
|
-
reasoning: true,
|
|
3474
|
-
input: ["text", "image"],
|
|
3475
|
-
cost: {
|
|
3476
|
-
input: 0.6,
|
|
3477
|
-
output: 3,
|
|
3478
|
-
cacheRead: 0.1,
|
|
3479
|
-
cacheWrite: 0,
|
|
3480
|
-
},
|
|
3481
|
-
contextWindow: 256000,
|
|
3482
|
-
maxTokens: 256000,
|
|
3483
|
-
},
|
|
3484
3612
|
"@cf/moonshotai/kimi-k2.6": {
|
|
3485
3613
|
id: "@cf/moonshotai/kimi-k2.6",
|
|
3486
3614
|
name: "Kimi K2.6",
|
|
@@ -3808,8 +3936,8 @@ export const MODELS = {
|
|
|
3808
3936
|
cacheRead: 0.1,
|
|
3809
3937
|
cacheWrite: 0,
|
|
3810
3938
|
},
|
|
3811
|
-
contextWindow:
|
|
3812
|
-
maxTokens:
|
|
3939
|
+
contextWindow: 262144,
|
|
3940
|
+
maxTokens: 65536,
|
|
3813
3941
|
},
|
|
3814
3942
|
"accounts/fireworks/routers/glm-5p1-fast": {
|
|
3815
3943
|
id: "accounts/fireworks/routers/glm-5p1-fast",
|
|
@@ -3829,6 +3957,24 @@ export const MODELS = {
|
|
|
3829
3957
|
contextWindow: 202800,
|
|
3830
3958
|
maxTokens: 131072,
|
|
3831
3959
|
},
|
|
3960
|
+
"accounts/fireworks/routers/kimi-k2p6-fast": {
|
|
3961
|
+
id: "accounts/fireworks/routers/kimi-k2p6-fast",
|
|
3962
|
+
name: "Kimi K2.6 Fast",
|
|
3963
|
+
api: "anthropic-messages",
|
|
3964
|
+
provider: "fireworks",
|
|
3965
|
+
baseUrl: "https://api.fireworks.ai/inference",
|
|
3966
|
+
compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
|
|
3967
|
+
reasoning: true,
|
|
3968
|
+
input: ["text", "image"],
|
|
3969
|
+
cost: {
|
|
3970
|
+
input: 2,
|
|
3971
|
+
output: 8,
|
|
3972
|
+
cacheRead: 0.3,
|
|
3973
|
+
cacheWrite: 0,
|
|
3974
|
+
},
|
|
3975
|
+
contextWindow: 262000,
|
|
3976
|
+
maxTokens: 262000,
|
|
3977
|
+
},
|
|
3832
3978
|
"accounts/fireworks/routers/kimi-k2p6-turbo": {
|
|
3833
3979
|
id: "accounts/fireworks/routers/kimi-k2p6-turbo",
|
|
3834
3980
|
name: "Kimi K2.6 Turbo",
|
|
@@ -3851,7 +3997,7 @@ export const MODELS = {
|
|
|
3851
3997
|
"github-copilot": {
|
|
3852
3998
|
"claude-haiku-4.5": {
|
|
3853
3999
|
id: "claude-haiku-4.5",
|
|
3854
|
-
name: "Claude Haiku 4.5",
|
|
4000
|
+
name: "Claude Haiku 4.5 (latest)",
|
|
3855
4001
|
api: "anthropic-messages",
|
|
3856
4002
|
provider: "github-copilot",
|
|
3857
4003
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
@@ -3860,17 +4006,17 @@ export const MODELS = {
|
|
|
3860
4006
|
reasoning: true,
|
|
3861
4007
|
input: ["text", "image"],
|
|
3862
4008
|
cost: {
|
|
3863
|
-
input:
|
|
3864
|
-
output:
|
|
3865
|
-
cacheRead: 0,
|
|
3866
|
-
cacheWrite:
|
|
4009
|
+
input: 1,
|
|
4010
|
+
output: 5,
|
|
4011
|
+
cacheRead: 0.1,
|
|
4012
|
+
cacheWrite: 1.25,
|
|
3867
4013
|
},
|
|
3868
4014
|
contextWindow: 200000,
|
|
3869
4015
|
maxTokens: 64000,
|
|
3870
4016
|
},
|
|
3871
4017
|
"claude-opus-4.5": {
|
|
3872
4018
|
id: "claude-opus-4.5",
|
|
3873
|
-
name: "Claude Opus 4.5",
|
|
4019
|
+
name: "Claude Opus 4.5 (latest)",
|
|
3874
4020
|
api: "anthropic-messages",
|
|
3875
4021
|
provider: "github-copilot",
|
|
3876
4022
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
@@ -3878,10 +4024,10 @@ export const MODELS = {
|
|
|
3878
4024
|
reasoning: true,
|
|
3879
4025
|
input: ["text", "image"],
|
|
3880
4026
|
cost: {
|
|
3881
|
-
input:
|
|
3882
|
-
output:
|
|
3883
|
-
cacheRead: 0,
|
|
3884
|
-
cacheWrite:
|
|
4027
|
+
input: 5,
|
|
4028
|
+
output: 25,
|
|
4029
|
+
cacheRead: 0.5,
|
|
4030
|
+
cacheWrite: 6.25,
|
|
3885
4031
|
},
|
|
3886
4032
|
contextWindow: 200000,
|
|
3887
4033
|
maxTokens: 32000,
|
|
@@ -3898,10 +4044,10 @@ export const MODELS = {
|
|
|
3898
4044
|
thinkingLevelMap: { "xhigh": "max" },
|
|
3899
4045
|
input: ["text", "image"],
|
|
3900
4046
|
cost: {
|
|
3901
|
-
input:
|
|
3902
|
-
output:
|
|
3903
|
-
cacheRead: 0,
|
|
3904
|
-
cacheWrite:
|
|
4047
|
+
input: 5,
|
|
4048
|
+
output: 25,
|
|
4049
|
+
cacheRead: 0.5,
|
|
4050
|
+
cacheWrite: 6.25,
|
|
3905
4051
|
},
|
|
3906
4052
|
contextWindow: 1000000,
|
|
3907
4053
|
maxTokens: 32000,
|
|
@@ -3913,15 +4059,15 @@ export const MODELS = {
|
|
|
3913
4059
|
provider: "github-copilot",
|
|
3914
4060
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
3915
4061
|
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
3916
|
-
compat: { "forceAdaptiveThinking": true },
|
|
4062
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
3917
4063
|
reasoning: true,
|
|
3918
4064
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
3919
4065
|
input: ["text", "image"],
|
|
3920
4066
|
cost: {
|
|
3921
|
-
input:
|
|
3922
|
-
output:
|
|
3923
|
-
cacheRead: 0,
|
|
3924
|
-
cacheWrite:
|
|
4067
|
+
input: 5,
|
|
4068
|
+
output: 25,
|
|
4069
|
+
cacheRead: 0.5,
|
|
4070
|
+
cacheWrite: 6.25,
|
|
3925
4071
|
},
|
|
3926
4072
|
contextWindow: 200000,
|
|
3927
4073
|
maxTokens: 32000,
|
|
@@ -3933,22 +4079,41 @@ export const MODELS = {
|
|
|
3933
4079
|
provider: "github-copilot",
|
|
3934
4080
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
3935
4081
|
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
3936
|
-
compat: { "forceAdaptiveThinking": true },
|
|
4082
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
3937
4083
|
reasoning: true,
|
|
3938
4084
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
3939
4085
|
input: ["text", "image"],
|
|
3940
4086
|
cost: {
|
|
3941
|
-
input:
|
|
3942
|
-
output:
|
|
3943
|
-
cacheRead: 0,
|
|
3944
|
-
cacheWrite:
|
|
4087
|
+
input: 5,
|
|
4088
|
+
output: 25,
|
|
4089
|
+
cacheRead: 0.5,
|
|
4090
|
+
cacheWrite: 6.25,
|
|
3945
4091
|
},
|
|
3946
4092
|
contextWindow: 200000,
|
|
3947
4093
|
maxTokens: 64000,
|
|
3948
4094
|
},
|
|
4095
|
+
"claude-sonnet-4": {
|
|
4096
|
+
id: "claude-sonnet-4",
|
|
4097
|
+
name: "Claude Sonnet 4 (latest)",
|
|
4098
|
+
api: "anthropic-messages",
|
|
4099
|
+
provider: "github-copilot",
|
|
4100
|
+
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4101
|
+
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4102
|
+
compat: { "supportsEagerToolInputStreaming": false },
|
|
4103
|
+
reasoning: true,
|
|
4104
|
+
input: ["text", "image"],
|
|
4105
|
+
cost: {
|
|
4106
|
+
input: 3,
|
|
4107
|
+
output: 15,
|
|
4108
|
+
cacheRead: 0.3,
|
|
4109
|
+
cacheWrite: 3.75,
|
|
4110
|
+
},
|
|
4111
|
+
contextWindow: 216000,
|
|
4112
|
+
maxTokens: 16000,
|
|
4113
|
+
},
|
|
3949
4114
|
"claude-sonnet-4.5": {
|
|
3950
4115
|
id: "claude-sonnet-4.5",
|
|
3951
|
-
name: "Claude Sonnet 4.5",
|
|
4116
|
+
name: "Claude Sonnet 4.5 (latest)",
|
|
3952
4117
|
api: "anthropic-messages",
|
|
3953
4118
|
provider: "github-copilot",
|
|
3954
4119
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
@@ -3957,10 +4122,10 @@ export const MODELS = {
|
|
|
3957
4122
|
reasoning: true,
|
|
3958
4123
|
input: ["text", "image"],
|
|
3959
4124
|
cost: {
|
|
3960
|
-
input:
|
|
3961
|
-
output:
|
|
3962
|
-
cacheRead: 0,
|
|
3963
|
-
cacheWrite:
|
|
4125
|
+
input: 3,
|
|
4126
|
+
output: 15,
|
|
4127
|
+
cacheRead: 0.3,
|
|
4128
|
+
cacheWrite: 3.75,
|
|
3964
4129
|
},
|
|
3965
4130
|
contextWindow: 200000,
|
|
3966
4131
|
maxTokens: 32000,
|
|
@@ -3976,10 +4141,10 @@ export const MODELS = {
|
|
|
3976
4141
|
reasoning: true,
|
|
3977
4142
|
input: ["text", "image"],
|
|
3978
4143
|
cost: {
|
|
3979
|
-
input:
|
|
3980
|
-
output:
|
|
3981
|
-
cacheRead: 0,
|
|
3982
|
-
cacheWrite:
|
|
4144
|
+
input: 3,
|
|
4145
|
+
output: 15,
|
|
4146
|
+
cacheRead: 0.3,
|
|
4147
|
+
cacheWrite: 3.75,
|
|
3983
4148
|
},
|
|
3984
4149
|
contextWindow: 1000000,
|
|
3985
4150
|
maxTokens: 32000,
|
|
@@ -3992,12 +4157,12 @@ export const MODELS = {
|
|
|
3992
4157
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
3993
4158
|
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
3994
4159
|
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
|
|
3995
|
-
reasoning:
|
|
4160
|
+
reasoning: true,
|
|
3996
4161
|
input: ["text", "image"],
|
|
3997
4162
|
cost: {
|
|
3998
|
-
input:
|
|
3999
|
-
output:
|
|
4000
|
-
cacheRead: 0,
|
|
4163
|
+
input: 1.25,
|
|
4164
|
+
output: 10,
|
|
4165
|
+
cacheRead: 0.125,
|
|
4001
4166
|
cacheWrite: 0,
|
|
4002
4167
|
},
|
|
4003
4168
|
contextWindow: 128000,
|
|
@@ -4005,7 +4170,7 @@ export const MODELS = {
|
|
|
4005
4170
|
},
|
|
4006
4171
|
"gemini-3-flash-preview": {
|
|
4007
4172
|
id: "gemini-3-flash-preview",
|
|
4008
|
-
name: "Gemini 3 Flash",
|
|
4173
|
+
name: "Gemini 3 Flash Preview",
|
|
4009
4174
|
api: "openai-completions",
|
|
4010
4175
|
provider: "github-copilot",
|
|
4011
4176
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
@@ -4014,9 +4179,9 @@ export const MODELS = {
|
|
|
4014
4179
|
reasoning: true,
|
|
4015
4180
|
input: ["text", "image"],
|
|
4016
4181
|
cost: {
|
|
4017
|
-
input: 0,
|
|
4018
|
-
output:
|
|
4019
|
-
cacheRead: 0,
|
|
4182
|
+
input: 0.5,
|
|
4183
|
+
output: 3,
|
|
4184
|
+
cacheRead: 0.05,
|
|
4020
4185
|
cacheWrite: 0,
|
|
4021
4186
|
},
|
|
4022
4187
|
contextWindow: 128000,
|
|
@@ -4033,9 +4198,9 @@ export const MODELS = {
|
|
|
4033
4198
|
reasoning: true,
|
|
4034
4199
|
input: ["text", "image"],
|
|
4035
4200
|
cost: {
|
|
4036
|
-
input:
|
|
4037
|
-
output:
|
|
4038
|
-
cacheRead: 0,
|
|
4201
|
+
input: 2,
|
|
4202
|
+
output: 12,
|
|
4203
|
+
cacheRead: 0.2,
|
|
4039
4204
|
cacheWrite: 0,
|
|
4040
4205
|
},
|
|
4041
4206
|
contextWindow: 200000,
|
|
@@ -4052,9 +4217,9 @@ export const MODELS = {
|
|
|
4052
4217
|
reasoning: true,
|
|
4053
4218
|
input: ["text", "image"],
|
|
4054
4219
|
cost: {
|
|
4055
|
-
input:
|
|
4056
|
-
output:
|
|
4057
|
-
cacheRead: 0,
|
|
4220
|
+
input: 1.5,
|
|
4221
|
+
output: 9,
|
|
4222
|
+
cacheRead: 0.15,
|
|
4058
4223
|
cacheWrite: 0,
|
|
4059
4224
|
},
|
|
4060
4225
|
contextWindow: 200000,
|
|
@@ -4071,36 +4236,17 @@ export const MODELS = {
|
|
|
4071
4236
|
reasoning: false,
|
|
4072
4237
|
input: ["text", "image"],
|
|
4073
4238
|
cost: {
|
|
4074
|
-
input:
|
|
4075
|
-
output:
|
|
4076
|
-
cacheRead: 0,
|
|
4239
|
+
input: 2,
|
|
4240
|
+
output: 8,
|
|
4241
|
+
cacheRead: 0.5,
|
|
4077
4242
|
cacheWrite: 0,
|
|
4078
4243
|
},
|
|
4079
4244
|
contextWindow: 128000,
|
|
4080
4245
|
maxTokens: 16384,
|
|
4081
4246
|
},
|
|
4082
|
-
"gpt-4o": {
|
|
4083
|
-
id: "gpt-4o",
|
|
4084
|
-
name: "GPT-4o",
|
|
4085
|
-
api: "openai-completions",
|
|
4086
|
-
provider: "github-copilot",
|
|
4087
|
-
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4088
|
-
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4089
|
-
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
|
|
4090
|
-
reasoning: false,
|
|
4091
|
-
input: ["text", "image"],
|
|
4092
|
-
cost: {
|
|
4093
|
-
input: 0,
|
|
4094
|
-
output: 0,
|
|
4095
|
-
cacheRead: 0,
|
|
4096
|
-
cacheWrite: 0,
|
|
4097
|
-
},
|
|
4098
|
-
contextWindow: 128000,
|
|
4099
|
-
maxTokens: 4096,
|
|
4100
|
-
},
|
|
4101
4247
|
"gpt-5-mini": {
|
|
4102
4248
|
id: "gpt-5-mini",
|
|
4103
|
-
name: "GPT-5
|
|
4249
|
+
name: "GPT-5 Mini",
|
|
4104
4250
|
api: "openai-responses",
|
|
4105
4251
|
provider: "github-copilot",
|
|
4106
4252
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
@@ -4109,9 +4255,9 @@ export const MODELS = {
|
|
|
4109
4255
|
thinkingLevelMap: { "off": null, "minimal": "low" },
|
|
4110
4256
|
input: ["text", "image"],
|
|
4111
4257
|
cost: {
|
|
4112
|
-
input: 0,
|
|
4113
|
-
output:
|
|
4114
|
-
cacheRead: 0,
|
|
4258
|
+
input: 0.25,
|
|
4259
|
+
output: 2,
|
|
4260
|
+
cacheRead: 0.025,
|
|
4115
4261
|
cacheWrite: 0,
|
|
4116
4262
|
},
|
|
4117
4263
|
contextWindow: 264000,
|
|
@@ -4128,9 +4274,9 @@ export const MODELS = {
|
|
|
4128
4274
|
thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
|
|
4129
4275
|
input: ["text", "image"],
|
|
4130
4276
|
cost: {
|
|
4131
|
-
input:
|
|
4132
|
-
output:
|
|
4133
|
-
cacheRead: 0,
|
|
4277
|
+
input: 1.75,
|
|
4278
|
+
output: 14,
|
|
4279
|
+
cacheRead: 0.175,
|
|
4134
4280
|
cacheWrite: 0,
|
|
4135
4281
|
},
|
|
4136
4282
|
contextWindow: 400000,
|
|
@@ -4138,7 +4284,7 @@ export const MODELS = {
|
|
|
4138
4284
|
},
|
|
4139
4285
|
"gpt-5.2-codex": {
|
|
4140
4286
|
id: "gpt-5.2-codex",
|
|
4141
|
-
name: "GPT-5.2
|
|
4287
|
+
name: "GPT-5.2 Codex",
|
|
4142
4288
|
api: "openai-responses",
|
|
4143
4289
|
provider: "github-copilot",
|
|
4144
4290
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
@@ -4147,9 +4293,9 @@ export const MODELS = {
|
|
|
4147
4293
|
thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
|
|
4148
4294
|
input: ["text", "image"],
|
|
4149
4295
|
cost: {
|
|
4150
|
-
input:
|
|
4151
|
-
output:
|
|
4152
|
-
cacheRead: 0,
|
|
4296
|
+
input: 1.75,
|
|
4297
|
+
output: 14,
|
|
4298
|
+
cacheRead: 0.175,
|
|
4153
4299
|
cacheWrite: 0,
|
|
4154
4300
|
},
|
|
4155
4301
|
contextWindow: 400000,
|
|
@@ -4157,7 +4303,7 @@ export const MODELS = {
|
|
|
4157
4303
|
},
|
|
4158
4304
|
"gpt-5.3-codex": {
|
|
4159
4305
|
id: "gpt-5.3-codex",
|
|
4160
|
-
name: "GPT-5.3
|
|
4306
|
+
name: "GPT-5.3 Codex",
|
|
4161
4307
|
api: "openai-responses",
|
|
4162
4308
|
provider: "github-copilot",
|
|
4163
4309
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
@@ -4166,9 +4312,9 @@ export const MODELS = {
|
|
|
4166
4312
|
thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
|
|
4167
4313
|
input: ["text", "image"],
|
|
4168
4314
|
cost: {
|
|
4169
|
-
input:
|
|
4170
|
-
output:
|
|
4171
|
-
cacheRead: 0,
|
|
4315
|
+
input: 1.75,
|
|
4316
|
+
output: 14,
|
|
4317
|
+
cacheRead: 0.175,
|
|
4172
4318
|
cacheWrite: 0,
|
|
4173
4319
|
},
|
|
4174
4320
|
contextWindow: 400000,
|
|
@@ -4185,9 +4331,9 @@ export const MODELS = {
|
|
|
4185
4331
|
thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
|
|
4186
4332
|
input: ["text", "image"],
|
|
4187
4333
|
cost: {
|
|
4188
|
-
input:
|
|
4189
|
-
output:
|
|
4190
|
-
cacheRead: 0,
|
|
4334
|
+
input: 2.5,
|
|
4335
|
+
output: 15,
|
|
4336
|
+
cacheRead: 0.25,
|
|
4191
4337
|
cacheWrite: 0,
|
|
4192
4338
|
},
|
|
4193
4339
|
contextWindow: 400000,
|
|
@@ -4195,7 +4341,7 @@ export const MODELS = {
|
|
|
4195
4341
|
},
|
|
4196
4342
|
"gpt-5.4-mini": {
|
|
4197
4343
|
id: "gpt-5.4-mini",
|
|
4198
|
-
name: "GPT-5.4
|
|
4344
|
+
name: "GPT-5.4 mini",
|
|
4199
4345
|
api: "openai-responses",
|
|
4200
4346
|
provider: "github-copilot",
|
|
4201
4347
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
@@ -4204,9 +4350,28 @@ export const MODELS = {
|
|
|
4204
4350
|
thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
|
|
4205
4351
|
input: ["text", "image"],
|
|
4206
4352
|
cost: {
|
|
4207
|
-
input: 0,
|
|
4208
|
-
output:
|
|
4209
|
-
cacheRead: 0,
|
|
4353
|
+
input: 0.75,
|
|
4354
|
+
output: 4.5,
|
|
4355
|
+
cacheRead: 0.075,
|
|
4356
|
+
cacheWrite: 0,
|
|
4357
|
+
},
|
|
4358
|
+
contextWindow: 400000,
|
|
4359
|
+
maxTokens: 128000,
|
|
4360
|
+
},
|
|
4361
|
+
"gpt-5.4-nano": {
|
|
4362
|
+
id: "gpt-5.4-nano",
|
|
4363
|
+
name: "GPT-5.4 nano",
|
|
4364
|
+
api: "openai-responses",
|
|
4365
|
+
provider: "github-copilot",
|
|
4366
|
+
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4367
|
+
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4368
|
+
reasoning: true,
|
|
4369
|
+
thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
|
|
4370
|
+
input: ["text", "image"],
|
|
4371
|
+
cost: {
|
|
4372
|
+
input: 0.2,
|
|
4373
|
+
output: 1.25,
|
|
4374
|
+
cacheRead: 0.02,
|
|
4210
4375
|
cacheWrite: 0,
|
|
4211
4376
|
},
|
|
4212
4377
|
contextWindow: 400000,
|
|
@@ -4223,32 +4388,32 @@ export const MODELS = {
|
|
|
4223
4388
|
thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
|
|
4224
4389
|
input: ["text", "image"],
|
|
4225
4390
|
cost: {
|
|
4226
|
-
input:
|
|
4227
|
-
output:
|
|
4228
|
-
cacheRead: 0,
|
|
4391
|
+
input: 5,
|
|
4392
|
+
output: 30,
|
|
4393
|
+
cacheRead: 0.5,
|
|
4229
4394
|
cacheWrite: 0,
|
|
4230
4395
|
},
|
|
4231
4396
|
contextWindow: 400000,
|
|
4232
4397
|
maxTokens: 128000,
|
|
4233
4398
|
},
|
|
4234
|
-
"
|
|
4235
|
-
id: "
|
|
4236
|
-
name: "
|
|
4399
|
+
"raptor-mini": {
|
|
4400
|
+
id: "raptor-mini",
|
|
4401
|
+
name: "Raptor mini",
|
|
4237
4402
|
api: "openai-completions",
|
|
4238
4403
|
provider: "github-copilot",
|
|
4239
4404
|
baseUrl: "https://api.individual.githubcopilot.com",
|
|
4240
4405
|
headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
|
|
4241
4406
|
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
|
|
4242
4407
|
reasoning: true,
|
|
4243
|
-
input: ["text"],
|
|
4408
|
+
input: ["text", "image"],
|
|
4244
4409
|
cost: {
|
|
4245
|
-
input: 0,
|
|
4246
|
-
output:
|
|
4247
|
-
cacheRead: 0,
|
|
4410
|
+
input: 0.25,
|
|
4411
|
+
output: 2,
|
|
4412
|
+
cacheRead: 0.025,
|
|
4248
4413
|
cacheWrite: 0,
|
|
4249
4414
|
},
|
|
4250
|
-
contextWindow:
|
|
4251
|
-
maxTokens:
|
|
4415
|
+
contextWindow: 400000,
|
|
4416
|
+
maxTokens: 128000,
|
|
4252
4417
|
},
|
|
4253
4418
|
},
|
|
4254
4419
|
"google": {
|
|
@@ -5541,6 +5706,23 @@ export const MODELS = {
|
|
|
5541
5706
|
contextWindow: 204800,
|
|
5542
5707
|
maxTokens: 131072,
|
|
5543
5708
|
},
|
|
5709
|
+
"MiniMax-M3": {
|
|
5710
|
+
id: "MiniMax-M3",
|
|
5711
|
+
name: "MiniMax-M3",
|
|
5712
|
+
api: "anthropic-messages",
|
|
5713
|
+
provider: "minimax",
|
|
5714
|
+
baseUrl: "https://api.minimax.io/anthropic",
|
|
5715
|
+
reasoning: true,
|
|
5716
|
+
input: ["text", "image"],
|
|
5717
|
+
cost: {
|
|
5718
|
+
input: 0.6,
|
|
5719
|
+
output: 2.4,
|
|
5720
|
+
cacheRead: 0.12,
|
|
5721
|
+
cacheWrite: 0,
|
|
5722
|
+
},
|
|
5723
|
+
contextWindow: 512000,
|
|
5724
|
+
maxTokens: 128000,
|
|
5725
|
+
},
|
|
5544
5726
|
},
|
|
5545
5727
|
"minimax-cn": {
|
|
5546
5728
|
"MiniMax-M2.7": {
|
|
@@ -5577,6 +5759,23 @@ export const MODELS = {
|
|
|
5577
5759
|
contextWindow: 204800,
|
|
5578
5760
|
maxTokens: 131072,
|
|
5579
5761
|
},
|
|
5762
|
+
"MiniMax-M3": {
|
|
5763
|
+
id: "MiniMax-M3",
|
|
5764
|
+
name: "MiniMax-M3",
|
|
5765
|
+
api: "anthropic-messages",
|
|
5766
|
+
provider: "minimax-cn",
|
|
5767
|
+
baseUrl: "https://api.minimaxi.com/anthropic",
|
|
5768
|
+
reasoning: true,
|
|
5769
|
+
input: ["text", "image"],
|
|
5770
|
+
cost: {
|
|
5771
|
+
input: 0.6,
|
|
5772
|
+
output: 2.4,
|
|
5773
|
+
cacheRead: 0.12,
|
|
5774
|
+
cacheWrite: 0,
|
|
5775
|
+
},
|
|
5776
|
+
contextWindow: 512000,
|
|
5777
|
+
maxTokens: 128000,
|
|
5778
|
+
},
|
|
5580
5779
|
},
|
|
5581
5780
|
"mistral": {
|
|
5582
5781
|
"codestral-latest": {
|
|
@@ -5613,6 +5812,23 @@ export const MODELS = {
|
|
|
5613
5812
|
contextWindow: 262144,
|
|
5614
5813
|
maxTokens: 262144,
|
|
5615
5814
|
},
|
|
5815
|
+
"devstral-latest": {
|
|
5816
|
+
id: "devstral-latest",
|
|
5817
|
+
name: "Devstral 2",
|
|
5818
|
+
api: "mistral-conversations",
|
|
5819
|
+
provider: "mistral",
|
|
5820
|
+
baseUrl: "https://api.mistral.ai",
|
|
5821
|
+
reasoning: false,
|
|
5822
|
+
input: ["text"],
|
|
5823
|
+
cost: {
|
|
5824
|
+
input: 0.4,
|
|
5825
|
+
output: 2,
|
|
5826
|
+
cacheRead: 0,
|
|
5827
|
+
cacheWrite: 0,
|
|
5828
|
+
},
|
|
5829
|
+
contextWindow: 262144,
|
|
5830
|
+
maxTokens: 262144,
|
|
5831
|
+
},
|
|
5616
5832
|
"devstral-medium-2507": {
|
|
5617
5833
|
id: "devstral-medium-2507",
|
|
5618
5834
|
name: "Devstral Medium",
|
|
@@ -5891,11 +6107,11 @@ export const MODELS = {
|
|
|
5891
6107
|
api: "mistral-conversations",
|
|
5892
6108
|
provider: "mistral",
|
|
5893
6109
|
baseUrl: "https://api.mistral.ai",
|
|
5894
|
-
reasoning:
|
|
6110
|
+
reasoning: false,
|
|
5895
6111
|
input: ["text", "image"],
|
|
5896
6112
|
cost: {
|
|
5897
|
-
input:
|
|
5898
|
-
output:
|
|
6113
|
+
input: 0.4,
|
|
6114
|
+
output: 2,
|
|
5899
6115
|
cacheRead: 0,
|
|
5900
6116
|
cacheWrite: 0,
|
|
5901
6117
|
},
|
|
@@ -5987,6 +6203,23 @@ export const MODELS = {
|
|
|
5987
6203
|
contextWindow: 8000,
|
|
5988
6204
|
maxTokens: 8000,
|
|
5989
6205
|
},
|
|
6206
|
+
"open-mistral-nemo": {
|
|
6207
|
+
id: "open-mistral-nemo",
|
|
6208
|
+
name: "Open Mistral Nemo",
|
|
6209
|
+
api: "mistral-conversations",
|
|
6210
|
+
provider: "mistral",
|
|
6211
|
+
baseUrl: "https://api.mistral.ai",
|
|
6212
|
+
reasoning: false,
|
|
6213
|
+
input: ["text"],
|
|
6214
|
+
cost: {
|
|
6215
|
+
input: 0.15,
|
|
6216
|
+
output: 0.15,
|
|
6217
|
+
cacheRead: 0,
|
|
6218
|
+
cacheWrite: 0,
|
|
6219
|
+
},
|
|
6220
|
+
contextWindow: 128000,
|
|
6221
|
+
maxTokens: 128000,
|
|
6222
|
+
},
|
|
5990
6223
|
"open-mixtral-8x22b": {
|
|
5991
6224
|
id: "open-mixtral-8x22b",
|
|
5992
6225
|
name: "Mixtral 8x22B",
|
|
@@ -6312,56 +6545,457 @@ export const MODELS = {
|
|
|
6312
6545
|
maxTokens: 262144,
|
|
6313
6546
|
},
|
|
6314
6547
|
},
|
|
6315
|
-
"
|
|
6316
|
-
"
|
|
6317
|
-
id: "
|
|
6318
|
-
name: "
|
|
6319
|
-
api: "openai-
|
|
6320
|
-
provider: "
|
|
6321
|
-
baseUrl: "https://api.
|
|
6548
|
+
"nvidia": {
|
|
6549
|
+
"meta/llama-3.1-70b-instruct": {
|
|
6550
|
+
id: "meta/llama-3.1-70b-instruct",
|
|
6551
|
+
name: "Llama 3.1 70b Instruct",
|
|
6552
|
+
api: "openai-completions",
|
|
6553
|
+
provider: "nvidia",
|
|
6554
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6555
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6556
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6322
6557
|
reasoning: false,
|
|
6323
6558
|
input: ["text"],
|
|
6324
6559
|
cost: {
|
|
6325
|
-
input:
|
|
6326
|
-
output:
|
|
6560
|
+
input: 0,
|
|
6561
|
+
output: 0,
|
|
6327
6562
|
cacheRead: 0,
|
|
6328
6563
|
cacheWrite: 0,
|
|
6329
6564
|
},
|
|
6330
|
-
contextWindow:
|
|
6331
|
-
maxTokens:
|
|
6565
|
+
contextWindow: 128000,
|
|
6566
|
+
maxTokens: 4096,
|
|
6332
6567
|
},
|
|
6333
|
-
"
|
|
6334
|
-
id: "
|
|
6335
|
-
name: "
|
|
6336
|
-
api: "openai-
|
|
6337
|
-
provider: "
|
|
6338
|
-
baseUrl: "https://api.
|
|
6568
|
+
"meta/llama-3.1-8b-instruct": {
|
|
6569
|
+
id: "meta/llama-3.1-8b-instruct",
|
|
6570
|
+
name: "Llama 3.1 8B Instruct",
|
|
6571
|
+
api: "openai-completions",
|
|
6572
|
+
provider: "nvidia",
|
|
6573
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6574
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6575
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6576
|
+
reasoning: false,
|
|
6577
|
+
input: ["text"],
|
|
6578
|
+
cost: {
|
|
6579
|
+
input: 0,
|
|
6580
|
+
output: 0,
|
|
6581
|
+
cacheRead: 0,
|
|
6582
|
+
cacheWrite: 0,
|
|
6583
|
+
},
|
|
6584
|
+
contextWindow: 16000,
|
|
6585
|
+
maxTokens: 4096,
|
|
6586
|
+
},
|
|
6587
|
+
"meta/llama-3.2-11b-vision-instruct": {
|
|
6588
|
+
id: "meta/llama-3.2-11b-vision-instruct",
|
|
6589
|
+
name: "Llama 3.2 11b Vision Instruct",
|
|
6590
|
+
api: "openai-completions",
|
|
6591
|
+
provider: "nvidia",
|
|
6592
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6593
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6594
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6339
6595
|
reasoning: false,
|
|
6340
6596
|
input: ["text", "image"],
|
|
6341
6597
|
cost: {
|
|
6342
|
-
input:
|
|
6343
|
-
output:
|
|
6598
|
+
input: 0,
|
|
6599
|
+
output: 0,
|
|
6344
6600
|
cacheRead: 0,
|
|
6345
6601
|
cacheWrite: 0,
|
|
6346
6602
|
},
|
|
6347
6603
|
contextWindow: 128000,
|
|
6348
6604
|
maxTokens: 4096,
|
|
6349
6605
|
},
|
|
6350
|
-
"
|
|
6351
|
-
id: "
|
|
6352
|
-
name: "
|
|
6353
|
-
api: "openai-
|
|
6354
|
-
provider: "
|
|
6355
|
-
baseUrl: "https://api.
|
|
6606
|
+
"meta/llama-3.2-90b-vision-instruct": {
|
|
6607
|
+
id: "meta/llama-3.2-90b-vision-instruct",
|
|
6608
|
+
name: "Llama-3.2-90B-Vision-Instruct",
|
|
6609
|
+
api: "openai-completions",
|
|
6610
|
+
provider: "nvidia",
|
|
6611
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6612
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6613
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6356
6614
|
reasoning: false,
|
|
6357
6615
|
input: ["text", "image"],
|
|
6358
6616
|
cost: {
|
|
6359
|
-
input:
|
|
6360
|
-
output:
|
|
6361
|
-
cacheRead: 0
|
|
6617
|
+
input: 0,
|
|
6618
|
+
output: 0,
|
|
6619
|
+
cacheRead: 0,
|
|
6362
6620
|
cacheWrite: 0,
|
|
6363
6621
|
},
|
|
6364
|
-
contextWindow:
|
|
6622
|
+
contextWindow: 128000,
|
|
6623
|
+
maxTokens: 8192,
|
|
6624
|
+
},
|
|
6625
|
+
"meta/llama-3.3-70b-instruct": {
|
|
6626
|
+
id: "meta/llama-3.3-70b-instruct",
|
|
6627
|
+
name: "Llama 3.3 70b Instruct",
|
|
6628
|
+
api: "openai-completions",
|
|
6629
|
+
provider: "nvidia",
|
|
6630
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6631
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6632
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6633
|
+
reasoning: false,
|
|
6634
|
+
input: ["text"],
|
|
6635
|
+
cost: {
|
|
6636
|
+
input: 0,
|
|
6637
|
+
output: 0,
|
|
6638
|
+
cacheRead: 0,
|
|
6639
|
+
cacheWrite: 0,
|
|
6640
|
+
},
|
|
6641
|
+
contextWindow: 128000,
|
|
6642
|
+
maxTokens: 4096,
|
|
6643
|
+
},
|
|
6644
|
+
"mistralai/mistral-large-3-675b-instruct-2512": {
|
|
6645
|
+
id: "mistralai/mistral-large-3-675b-instruct-2512",
|
|
6646
|
+
name: "Mistral Large 3 675B Instruct 2512",
|
|
6647
|
+
api: "openai-completions",
|
|
6648
|
+
provider: "nvidia",
|
|
6649
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6650
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6651
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6652
|
+
reasoning: false,
|
|
6653
|
+
input: ["text", "image"],
|
|
6654
|
+
cost: {
|
|
6655
|
+
input: 0,
|
|
6656
|
+
output: 0,
|
|
6657
|
+
cacheRead: 0,
|
|
6658
|
+
cacheWrite: 0,
|
|
6659
|
+
},
|
|
6660
|
+
contextWindow: 262144,
|
|
6661
|
+
maxTokens: 262144,
|
|
6662
|
+
},
|
|
6663
|
+
"mistralai/mistral-small-4-119b-2603": {
|
|
6664
|
+
id: "mistralai/mistral-small-4-119b-2603",
|
|
6665
|
+
name: "mistral-small-4-119b-2603",
|
|
6666
|
+
api: "openai-completions",
|
|
6667
|
+
provider: "nvidia",
|
|
6668
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6669
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6670
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6671
|
+
reasoning: false,
|
|
6672
|
+
input: ["text"],
|
|
6673
|
+
cost: {
|
|
6674
|
+
input: 0,
|
|
6675
|
+
output: 0,
|
|
6676
|
+
cacheRead: 0,
|
|
6677
|
+
cacheWrite: 0,
|
|
6678
|
+
},
|
|
6679
|
+
contextWindow: 128000,
|
|
6680
|
+
maxTokens: 8192,
|
|
6681
|
+
},
|
|
6682
|
+
"moonshotai/kimi-k2.6": {
|
|
6683
|
+
id: "moonshotai/kimi-k2.6",
|
|
6684
|
+
name: "Kimi K2.6",
|
|
6685
|
+
api: "openai-completions",
|
|
6686
|
+
provider: "nvidia",
|
|
6687
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6688
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6689
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6690
|
+
reasoning: true,
|
|
6691
|
+
input: ["text", "image"],
|
|
6692
|
+
cost: {
|
|
6693
|
+
input: 0,
|
|
6694
|
+
output: 0,
|
|
6695
|
+
cacheRead: 0,
|
|
6696
|
+
cacheWrite: 0,
|
|
6697
|
+
},
|
|
6698
|
+
contextWindow: 262144,
|
|
6699
|
+
maxTokens: 262144,
|
|
6700
|
+
},
|
|
6701
|
+
"nvidia/llama-3.3-nemotron-super-49b-v1": {
|
|
6702
|
+
id: "nvidia/llama-3.3-nemotron-super-49b-v1",
|
|
6703
|
+
name: "Llama 3.3 Nemotron Super 49B v1",
|
|
6704
|
+
api: "openai-completions",
|
|
6705
|
+
provider: "nvidia",
|
|
6706
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6707
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6708
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6709
|
+
reasoning: true,
|
|
6710
|
+
input: ["text"],
|
|
6711
|
+
cost: {
|
|
6712
|
+
input: 0,
|
|
6713
|
+
output: 0,
|
|
6714
|
+
cacheRead: 0,
|
|
6715
|
+
cacheWrite: 0,
|
|
6716
|
+
},
|
|
6717
|
+
contextWindow: 131072,
|
|
6718
|
+
maxTokens: 131072,
|
|
6719
|
+
},
|
|
6720
|
+
"nvidia/llama-3.3-nemotron-super-49b-v1.5": {
|
|
6721
|
+
id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
|
|
6722
|
+
name: "Llama 3.3 Nemotron Super 49B v1.5",
|
|
6723
|
+
api: "openai-completions",
|
|
6724
|
+
provider: "nvidia",
|
|
6725
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6726
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6727
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6728
|
+
reasoning: true,
|
|
6729
|
+
input: ["text"],
|
|
6730
|
+
cost: {
|
|
6731
|
+
input: 0,
|
|
6732
|
+
output: 0,
|
|
6733
|
+
cacheRead: 0,
|
|
6734
|
+
cacheWrite: 0,
|
|
6735
|
+
},
|
|
6736
|
+
contextWindow: 131072,
|
|
6737
|
+
maxTokens: 131072,
|
|
6738
|
+
},
|
|
6739
|
+
"nvidia/nemotron-3-nano-30b-a3b": {
|
|
6740
|
+
id: "nvidia/nemotron-3-nano-30b-a3b",
|
|
6741
|
+
name: "nemotron-3-nano-30b-a3b",
|
|
6742
|
+
api: "openai-completions",
|
|
6743
|
+
provider: "nvidia",
|
|
6744
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6745
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6746
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6747
|
+
reasoning: true,
|
|
6748
|
+
input: ["text"],
|
|
6749
|
+
cost: {
|
|
6750
|
+
input: 0,
|
|
6751
|
+
output: 0,
|
|
6752
|
+
cacheRead: 0,
|
|
6753
|
+
cacheWrite: 0,
|
|
6754
|
+
},
|
|
6755
|
+
contextWindow: 131072,
|
|
6756
|
+
maxTokens: 131072,
|
|
6757
|
+
},
|
|
6758
|
+
"nvidia/nemotron-3-nano-omni-30b-a3b-reasoning": {
|
|
6759
|
+
id: "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning",
|
|
6760
|
+
name: "Nemotron 3 Nano Omni",
|
|
6761
|
+
api: "openai-completions",
|
|
6762
|
+
provider: "nvidia",
|
|
6763
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6764
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6765
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6766
|
+
reasoning: true,
|
|
6767
|
+
input: ["text", "image"],
|
|
6768
|
+
cost: {
|
|
6769
|
+
input: 0,
|
|
6770
|
+
output: 0,
|
|
6771
|
+
cacheRead: 0,
|
|
6772
|
+
cacheWrite: 0,
|
|
6773
|
+
},
|
|
6774
|
+
contextWindow: 256000,
|
|
6775
|
+
maxTokens: 65536,
|
|
6776
|
+
},
|
|
6777
|
+
"nvidia/nemotron-3-super-120b-a12b": {
|
|
6778
|
+
id: "nvidia/nemotron-3-super-120b-a12b",
|
|
6779
|
+
name: "Nemotron 3 Super",
|
|
6780
|
+
api: "openai-completions",
|
|
6781
|
+
provider: "nvidia",
|
|
6782
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6783
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6784
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6785
|
+
reasoning: true,
|
|
6786
|
+
input: ["text"],
|
|
6787
|
+
cost: {
|
|
6788
|
+
input: 0.2,
|
|
6789
|
+
output: 0.8,
|
|
6790
|
+
cacheRead: 0,
|
|
6791
|
+
cacheWrite: 0,
|
|
6792
|
+
},
|
|
6793
|
+
contextWindow: 262144,
|
|
6794
|
+
maxTokens: 262144,
|
|
6795
|
+
},
|
|
6796
|
+
"nvidia/nemotron-3-ultra-550b-a55b": {
|
|
6797
|
+
id: "nvidia/nemotron-3-ultra-550b-a55b",
|
|
6798
|
+
name: "Nemotron 3 Ultra 550B A55B",
|
|
6799
|
+
api: "openai-completions",
|
|
6800
|
+
provider: "nvidia",
|
|
6801
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6802
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6803
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6804
|
+
reasoning: true,
|
|
6805
|
+
input: ["text"],
|
|
6806
|
+
cost: {
|
|
6807
|
+
input: 0.5,
|
|
6808
|
+
output: 2.5,
|
|
6809
|
+
cacheRead: 0.15,
|
|
6810
|
+
cacheWrite: 0,
|
|
6811
|
+
},
|
|
6812
|
+
contextWindow: 1000000,
|
|
6813
|
+
maxTokens: 65536,
|
|
6814
|
+
},
|
|
6815
|
+
"nvidia/nvidia-nemotron-nano-9b-v2": {
|
|
6816
|
+
id: "nvidia/nvidia-nemotron-nano-9b-v2",
|
|
6817
|
+
name: "nvidia-nemotron-nano-9b-v2",
|
|
6818
|
+
api: "openai-completions",
|
|
6819
|
+
provider: "nvidia",
|
|
6820
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6821
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6822
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6823
|
+
reasoning: true,
|
|
6824
|
+
input: ["text"],
|
|
6825
|
+
cost: {
|
|
6826
|
+
input: 0,
|
|
6827
|
+
output: 0,
|
|
6828
|
+
cacheRead: 0,
|
|
6829
|
+
cacheWrite: 0,
|
|
6830
|
+
},
|
|
6831
|
+
contextWindow: 131072,
|
|
6832
|
+
maxTokens: 131072,
|
|
6833
|
+
},
|
|
6834
|
+
"openai/gpt-oss-20b": {
|
|
6835
|
+
id: "openai/gpt-oss-20b",
|
|
6836
|
+
name: "GPT OSS 20B",
|
|
6837
|
+
api: "openai-completions",
|
|
6838
|
+
provider: "nvidia",
|
|
6839
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6840
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6841
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6842
|
+
reasoning: true,
|
|
6843
|
+
input: ["text"],
|
|
6844
|
+
cost: {
|
|
6845
|
+
input: 0,
|
|
6846
|
+
output: 0,
|
|
6847
|
+
cacheRead: 0,
|
|
6848
|
+
cacheWrite: 0,
|
|
6849
|
+
},
|
|
6850
|
+
contextWindow: 131072,
|
|
6851
|
+
maxTokens: 32768,
|
|
6852
|
+
},
|
|
6853
|
+
"qwen/qwen3-coder-480b-a35b-instruct": {
|
|
6854
|
+
id: "qwen/qwen3-coder-480b-a35b-instruct",
|
|
6855
|
+
name: "Qwen3 Coder 480B A35B Instruct",
|
|
6856
|
+
api: "openai-completions",
|
|
6857
|
+
provider: "nvidia",
|
|
6858
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6859
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6860
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6861
|
+
reasoning: false,
|
|
6862
|
+
input: ["text"],
|
|
6863
|
+
cost: {
|
|
6864
|
+
input: 0,
|
|
6865
|
+
output: 0,
|
|
6866
|
+
cacheRead: 0,
|
|
6867
|
+
cacheWrite: 0,
|
|
6868
|
+
},
|
|
6869
|
+
contextWindow: 262144,
|
|
6870
|
+
maxTokens: 66536,
|
|
6871
|
+
},
|
|
6872
|
+
"qwen/qwen3.5-122b-a10b": {
|
|
6873
|
+
id: "qwen/qwen3.5-122b-a10b",
|
|
6874
|
+
name: "Qwen3.5 122B-A10B",
|
|
6875
|
+
api: "openai-completions",
|
|
6876
|
+
provider: "nvidia",
|
|
6877
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6878
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6879
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6880
|
+
reasoning: true,
|
|
6881
|
+
input: ["text", "image"],
|
|
6882
|
+
cost: {
|
|
6883
|
+
input: 0,
|
|
6884
|
+
output: 0,
|
|
6885
|
+
cacheRead: 0,
|
|
6886
|
+
cacheWrite: 0,
|
|
6887
|
+
},
|
|
6888
|
+
contextWindow: 262144,
|
|
6889
|
+
maxTokens: 65536,
|
|
6890
|
+
},
|
|
6891
|
+
"stepfun-ai/step-3.5-flash": {
|
|
6892
|
+
id: "stepfun-ai/step-3.5-flash",
|
|
6893
|
+
name: "Step 3.5 Flash",
|
|
6894
|
+
api: "openai-completions",
|
|
6895
|
+
provider: "nvidia",
|
|
6896
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6897
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6898
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6899
|
+
reasoning: true,
|
|
6900
|
+
input: ["text"],
|
|
6901
|
+
cost: {
|
|
6902
|
+
input: 0,
|
|
6903
|
+
output: 0,
|
|
6904
|
+
cacheRead: 0,
|
|
6905
|
+
cacheWrite: 0,
|
|
6906
|
+
},
|
|
6907
|
+
contextWindow: 256000,
|
|
6908
|
+
maxTokens: 16384,
|
|
6909
|
+
},
|
|
6910
|
+
"stepfun-ai/step-3.7-flash": {
|
|
6911
|
+
id: "stepfun-ai/step-3.7-flash",
|
|
6912
|
+
name: "Step 3.7 Flash",
|
|
6913
|
+
api: "openai-completions",
|
|
6914
|
+
provider: "nvidia",
|
|
6915
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6916
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6917
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6918
|
+
reasoning: true,
|
|
6919
|
+
input: ["text", "image"],
|
|
6920
|
+
cost: {
|
|
6921
|
+
input: 0,
|
|
6922
|
+
output: 0,
|
|
6923
|
+
cacheRead: 0,
|
|
6924
|
+
cacheWrite: 0,
|
|
6925
|
+
},
|
|
6926
|
+
contextWindow: 256000,
|
|
6927
|
+
maxTokens: 16384,
|
|
6928
|
+
},
|
|
6929
|
+
"z-ai/glm-5.1": {
|
|
6930
|
+
id: "z-ai/glm-5.1",
|
|
6931
|
+
name: "GLM-5.1",
|
|
6932
|
+
api: "openai-completions",
|
|
6933
|
+
provider: "nvidia",
|
|
6934
|
+
baseUrl: "https://integrate.api.nvidia.com/v1",
|
|
6935
|
+
headers: { "NVCF-POLL-SECONDS": "3600" },
|
|
6936
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
|
|
6937
|
+
reasoning: true,
|
|
6938
|
+
input: ["text"],
|
|
6939
|
+
cost: {
|
|
6940
|
+
input: 0,
|
|
6941
|
+
output: 0,
|
|
6942
|
+
cacheRead: 0,
|
|
6943
|
+
cacheWrite: 0,
|
|
6944
|
+
},
|
|
6945
|
+
contextWindow: 131072,
|
|
6946
|
+
maxTokens: 131072,
|
|
6947
|
+
},
|
|
6948
|
+
},
|
|
6949
|
+
"openai": {
|
|
6950
|
+
"gpt-4": {
|
|
6951
|
+
id: "gpt-4",
|
|
6952
|
+
name: "GPT-4",
|
|
6953
|
+
api: "openai-responses",
|
|
6954
|
+
provider: "openai",
|
|
6955
|
+
baseUrl: "https://api.openai.com/v1",
|
|
6956
|
+
reasoning: false,
|
|
6957
|
+
input: ["text"],
|
|
6958
|
+
cost: {
|
|
6959
|
+
input: 30,
|
|
6960
|
+
output: 60,
|
|
6961
|
+
cacheRead: 0,
|
|
6962
|
+
cacheWrite: 0,
|
|
6963
|
+
},
|
|
6964
|
+
contextWindow: 8192,
|
|
6965
|
+
maxTokens: 8192,
|
|
6966
|
+
},
|
|
6967
|
+
"gpt-4-turbo": {
|
|
6968
|
+
id: "gpt-4-turbo",
|
|
6969
|
+
name: "GPT-4 Turbo",
|
|
6970
|
+
api: "openai-responses",
|
|
6971
|
+
provider: "openai",
|
|
6972
|
+
baseUrl: "https://api.openai.com/v1",
|
|
6973
|
+
reasoning: false,
|
|
6974
|
+
input: ["text", "image"],
|
|
6975
|
+
cost: {
|
|
6976
|
+
input: 10,
|
|
6977
|
+
output: 30,
|
|
6978
|
+
cacheRead: 0,
|
|
6979
|
+
cacheWrite: 0,
|
|
6980
|
+
},
|
|
6981
|
+
contextWindow: 128000,
|
|
6982
|
+
maxTokens: 4096,
|
|
6983
|
+
},
|
|
6984
|
+
"gpt-4.1": {
|
|
6985
|
+
id: "gpt-4.1",
|
|
6986
|
+
name: "GPT-4.1",
|
|
6987
|
+
api: "openai-responses",
|
|
6988
|
+
provider: "openai",
|
|
6989
|
+
baseUrl: "https://api.openai.com/v1",
|
|
6990
|
+
reasoning: false,
|
|
6991
|
+
input: ["text", "image"],
|
|
6992
|
+
cost: {
|
|
6993
|
+
input: 2,
|
|
6994
|
+
output: 8,
|
|
6995
|
+
cacheRead: 0.5,
|
|
6996
|
+
cacheWrite: 0,
|
|
6997
|
+
},
|
|
6998
|
+
contextWindow: 1047576,
|
|
6365
6999
|
maxTokens: 32768,
|
|
6366
7000
|
},
|
|
6367
7001
|
"gpt-4.1-mini": {
|
|
@@ -6886,7 +7520,7 @@ export const MODELS = {
|
|
|
6886
7520
|
provider: "openai",
|
|
6887
7521
|
baseUrl: "https://api.openai.com/v1",
|
|
6888
7522
|
reasoning: true,
|
|
6889
|
-
thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
|
|
7523
|
+
thinkingLevelMap: { "off": "none", "xhigh": "xhigh", "minimal": null },
|
|
6890
7524
|
input: ["text", "image"],
|
|
6891
7525
|
cost: {
|
|
6892
7526
|
input: 5,
|
|
@@ -7033,62 +7667,26 @@ export const MODELS = {
|
|
|
7033
7667
|
},
|
|
7034
7668
|
contextWindow: 200000,
|
|
7035
7669
|
maxTokens: 100000,
|
|
7036
|
-
},
|
|
7037
|
-
"o4-mini-deep-research": {
|
|
7038
|
-
id: "o4-mini-deep-research",
|
|
7039
|
-
name: "o4-mini-deep-research",
|
|
7040
|
-
api: "openai-responses",
|
|
7041
|
-
provider: "openai",
|
|
7042
|
-
baseUrl: "https://api.openai.com/v1",
|
|
7043
|
-
reasoning: true,
|
|
7044
|
-
input: ["text", "image"],
|
|
7045
|
-
cost: {
|
|
7046
|
-
input: 2,
|
|
7047
|
-
output: 8,
|
|
7048
|
-
cacheRead: 0.5,
|
|
7049
|
-
cacheWrite: 0,
|
|
7050
|
-
},
|
|
7051
|
-
contextWindow: 200000,
|
|
7052
|
-
maxTokens: 100000,
|
|
7053
|
-
},
|
|
7054
|
-
},
|
|
7055
|
-
"openai-codex": {
|
|
7056
|
-
"gpt-5.2": {
|
|
7057
|
-
id: "gpt-5.2",
|
|
7058
|
-
name: "GPT-5.2",
|
|
7059
|
-
api: "openai-codex-responses",
|
|
7060
|
-
provider: "openai-codex",
|
|
7061
|
-
baseUrl: "https://chatgpt.com/backend-api",
|
|
7062
|
-
reasoning: true,
|
|
7063
|
-
thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
|
|
7064
|
-
input: ["text", "image"],
|
|
7065
|
-
cost: {
|
|
7066
|
-
input: 1.75,
|
|
7067
|
-
output: 14,
|
|
7068
|
-
cacheRead: 0.175,
|
|
7069
|
-
cacheWrite: 0,
|
|
7070
|
-
},
|
|
7071
|
-
contextWindow: 272000,
|
|
7072
|
-
maxTokens: 128000,
|
|
7073
|
-
},
|
|
7074
|
-
"gpt-5.3-codex": {
|
|
7075
|
-
id: "gpt-5.3-codex",
|
|
7076
|
-
name: "GPT-5.3 Codex",
|
|
7077
|
-
api: "openai-codex-responses",
|
|
7078
|
-
provider: "openai-codex",
|
|
7079
|
-
baseUrl: "https://chatgpt.com/backend-api",
|
|
7670
|
+
},
|
|
7671
|
+
"o4-mini-deep-research": {
|
|
7672
|
+
id: "o4-mini-deep-research",
|
|
7673
|
+
name: "o4-mini-deep-research",
|
|
7674
|
+
api: "openai-responses",
|
|
7675
|
+
provider: "openai",
|
|
7676
|
+
baseUrl: "https://api.openai.com/v1",
|
|
7080
7677
|
reasoning: true,
|
|
7081
|
-
thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
|
|
7082
7678
|
input: ["text", "image"],
|
|
7083
7679
|
cost: {
|
|
7084
|
-
input:
|
|
7085
|
-
output:
|
|
7086
|
-
cacheRead: 0.
|
|
7680
|
+
input: 2,
|
|
7681
|
+
output: 8,
|
|
7682
|
+
cacheRead: 0.5,
|
|
7087
7683
|
cacheWrite: 0,
|
|
7088
7684
|
},
|
|
7089
|
-
contextWindow:
|
|
7090
|
-
maxTokens:
|
|
7685
|
+
contextWindow: 200000,
|
|
7686
|
+
maxTokens: 100000,
|
|
7091
7687
|
},
|
|
7688
|
+
},
|
|
7689
|
+
"openai-codex": {
|
|
7092
7690
|
"gpt-5.3-codex-spark": {
|
|
7093
7691
|
id: "gpt-5.3-codex-spark",
|
|
7094
7692
|
name: "GPT-5.3 Codex Spark",
|
|
@@ -7256,7 +7854,7 @@ export const MODELS = {
|
|
|
7256
7854
|
api: "anthropic-messages",
|
|
7257
7855
|
provider: "opencode",
|
|
7258
7856
|
baseUrl: "https://opencode.ai/zen",
|
|
7259
|
-
compat: { "forceAdaptiveThinking": true },
|
|
7857
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
7260
7858
|
reasoning: true,
|
|
7261
7859
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
7262
7860
|
input: ["text", "image"],
|
|
@@ -7275,7 +7873,7 @@ export const MODELS = {
|
|
|
7275
7873
|
api: "anthropic-messages",
|
|
7276
7874
|
provider: "opencode",
|
|
7277
7875
|
baseUrl: "https://opencode.ai/zen",
|
|
7278
|
-
compat: { "forceAdaptiveThinking": true },
|
|
7876
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
7279
7877
|
reasoning: true,
|
|
7280
7878
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
7281
7879
|
input: ["text", "image"],
|
|
@@ -7340,6 +7938,25 @@ export const MODELS = {
|
|
|
7340
7938
|
contextWindow: 1000000,
|
|
7341
7939
|
maxTokens: 64000,
|
|
7342
7940
|
},
|
|
7941
|
+
"deepseek-v4-flash": {
|
|
7942
|
+
id: "deepseek-v4-flash",
|
|
7943
|
+
name: "DeepSeek V4 Flash",
|
|
7944
|
+
api: "openai-completions",
|
|
7945
|
+
provider: "opencode",
|
|
7946
|
+
baseUrl: "https://opencode.ai/zen/v1",
|
|
7947
|
+
compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
|
|
7948
|
+
reasoning: true,
|
|
7949
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
|
|
7950
|
+
input: ["text"],
|
|
7951
|
+
cost: {
|
|
7952
|
+
input: 0.14,
|
|
7953
|
+
output: 0.28,
|
|
7954
|
+
cacheRead: 0.03,
|
|
7955
|
+
cacheWrite: 0,
|
|
7956
|
+
},
|
|
7957
|
+
contextWindow: 1000000,
|
|
7958
|
+
maxTokens: 384000,
|
|
7959
|
+
},
|
|
7343
7960
|
"deepseek-v4-flash-free": {
|
|
7344
7961
|
id: "deepseek-v4-flash-free",
|
|
7345
7962
|
name: "DeepSeek V4 Flash Free",
|
|
@@ -7803,8 +8420,8 @@ export const MODELS = {
|
|
|
7803
8420
|
cacheRead: 0,
|
|
7804
8421
|
cacheWrite: 0,
|
|
7805
8422
|
},
|
|
7806
|
-
contextWindow:
|
|
7807
|
-
maxTokens:
|
|
8423
|
+
contextWindow: 200000,
|
|
8424
|
+
maxTokens: 32000,
|
|
7808
8425
|
},
|
|
7809
8426
|
"minimax-m2.5": {
|
|
7810
8427
|
id: "minimax-m2.5",
|
|
@@ -7840,9 +8457,9 @@ export const MODELS = {
|
|
|
7840
8457
|
contextWindow: 204800,
|
|
7841
8458
|
maxTokens: 131072,
|
|
7842
8459
|
},
|
|
7843
|
-
"nemotron-3-
|
|
7844
|
-
id: "nemotron-3-
|
|
7845
|
-
name: "Nemotron 3
|
|
8460
|
+
"nemotron-3-ultra-free": {
|
|
8461
|
+
id: "nemotron-3-ultra-free",
|
|
8462
|
+
name: "Nemotron 3 Ultra Free",
|
|
7846
8463
|
api: "openai-completions",
|
|
7847
8464
|
provider: "opencode",
|
|
7848
8465
|
baseUrl: "https://opencode.ai/zen/v1",
|
|
@@ -7854,7 +8471,7 @@ export const MODELS = {
|
|
|
7854
8471
|
cacheRead: 0,
|
|
7855
8472
|
cacheWrite: 0,
|
|
7856
8473
|
},
|
|
7857
|
-
contextWindow:
|
|
8474
|
+
contextWindow: 1000000,
|
|
7858
8475
|
maxTokens: 128000,
|
|
7859
8476
|
},
|
|
7860
8477
|
"qwen3.5-plus": {
|
|
@@ -8069,6 +8686,23 @@ export const MODELS = {
|
|
|
8069
8686
|
contextWindow: 204800,
|
|
8070
8687
|
maxTokens: 131072,
|
|
8071
8688
|
},
|
|
8689
|
+
"minimax-m3": {
|
|
8690
|
+
id: "minimax-m3",
|
|
8691
|
+
name: "MiniMax M3",
|
|
8692
|
+
api: "anthropic-messages",
|
|
8693
|
+
provider: "opencode-go",
|
|
8694
|
+
baseUrl: "https://opencode.ai/zen/go",
|
|
8695
|
+
reasoning: true,
|
|
8696
|
+
input: ["text", "image"],
|
|
8697
|
+
cost: {
|
|
8698
|
+
input: 0.3,
|
|
8699
|
+
output: 1.2,
|
|
8700
|
+
cacheRead: 0.06,
|
|
8701
|
+
cacheWrite: 0,
|
|
8702
|
+
},
|
|
8703
|
+
contextWindow: 512000,
|
|
8704
|
+
maxTokens: 131072,
|
|
8705
|
+
},
|
|
8072
8706
|
"qwen3.6-plus": {
|
|
8073
8707
|
id: "qwen3.6-plus",
|
|
8074
8708
|
name: "Qwen3.6 Plus",
|
|
@@ -8084,7 +8718,7 @@ export const MODELS = {
|
|
|
8084
8718
|
cacheRead: 0.05,
|
|
8085
8719
|
cacheWrite: 0.625,
|
|
8086
8720
|
},
|
|
8087
|
-
contextWindow:
|
|
8721
|
+
contextWindow: 1000000,
|
|
8088
8722
|
maxTokens: 65536,
|
|
8089
8723
|
},
|
|
8090
8724
|
"qwen3.7-max": {
|
|
@@ -8104,6 +8738,23 @@ export const MODELS = {
|
|
|
8104
8738
|
contextWindow: 1000000,
|
|
8105
8739
|
maxTokens: 65536,
|
|
8106
8740
|
},
|
|
8741
|
+
"qwen3.7-plus": {
|
|
8742
|
+
id: "qwen3.7-plus",
|
|
8743
|
+
name: "Qwen3.7 Plus",
|
|
8744
|
+
api: "anthropic-messages",
|
|
8745
|
+
provider: "opencode-go",
|
|
8746
|
+
baseUrl: "https://opencode.ai/zen/go",
|
|
8747
|
+
reasoning: true,
|
|
8748
|
+
input: ["text", "image"],
|
|
8749
|
+
cost: {
|
|
8750
|
+
input: 0.4,
|
|
8751
|
+
output: 1.6,
|
|
8752
|
+
cacheRead: 0.04,
|
|
8753
|
+
cacheWrite: 0.5,
|
|
8754
|
+
},
|
|
8755
|
+
contextWindow: 1000000,
|
|
8756
|
+
maxTokens: 65536,
|
|
8757
|
+
},
|
|
8107
8758
|
},
|
|
8108
8759
|
"openrouter": {
|
|
8109
8760
|
"ai21/jamba-large-1.7": {
|
|
@@ -8537,40 +9188,6 @@ export const MODELS = {
|
|
|
8537
9188
|
contextWindow: 2000000,
|
|
8538
9189
|
maxTokens: 30000,
|
|
8539
9190
|
},
|
|
8540
|
-
"baidu/ernie-4.5-21b-a3b": {
|
|
8541
|
-
id: "baidu/ernie-4.5-21b-a3b",
|
|
8542
|
-
name: "Baidu: ERNIE 4.5 21B A3B",
|
|
8543
|
-
api: "openai-completions",
|
|
8544
|
-
provider: "openrouter",
|
|
8545
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
8546
|
-
reasoning: false,
|
|
8547
|
-
input: ["text"],
|
|
8548
|
-
cost: {
|
|
8549
|
-
input: 0.07,
|
|
8550
|
-
output: 0.28,
|
|
8551
|
-
cacheRead: 0,
|
|
8552
|
-
cacheWrite: 0,
|
|
8553
|
-
},
|
|
8554
|
-
contextWindow: 131072,
|
|
8555
|
-
maxTokens: 8000,
|
|
8556
|
-
},
|
|
8557
|
-
"baidu/ernie-4.5-vl-28b-a3b": {
|
|
8558
|
-
id: "baidu/ernie-4.5-vl-28b-a3b",
|
|
8559
|
-
name: "Baidu: ERNIE 4.5 VL 28B A3B",
|
|
8560
|
-
api: "openai-completions",
|
|
8561
|
-
provider: "openrouter",
|
|
8562
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
8563
|
-
reasoning: true,
|
|
8564
|
-
input: ["text", "image"],
|
|
8565
|
-
cost: {
|
|
8566
|
-
input: 0.14,
|
|
8567
|
-
output: 0.56,
|
|
8568
|
-
cacheRead: 0,
|
|
8569
|
-
cacheWrite: 0,
|
|
8570
|
-
},
|
|
8571
|
-
contextWindow: 131072,
|
|
8572
|
-
maxTokens: 8000,
|
|
8573
|
-
},
|
|
8574
9191
|
"bytedance-seed/seed-1.6": {
|
|
8575
9192
|
id: "bytedance-seed/seed-1.6",
|
|
8576
9193
|
name: "ByteDance Seed: Seed 1.6",
|
|
@@ -8682,8 +9299,8 @@ export const MODELS = {
|
|
|
8682
9299
|
reasoning: false,
|
|
8683
9300
|
input: ["text"],
|
|
8684
9301
|
cost: {
|
|
8685
|
-
input: 0.
|
|
8686
|
-
output: 0.
|
|
9302
|
+
input: 0.20020000000000002,
|
|
9303
|
+
output: 0.8000999999999999,
|
|
8687
9304
|
cacheRead: 0,
|
|
8688
9305
|
cacheWrite: 0,
|
|
8689
9306
|
},
|
|
@@ -8784,13 +9401,13 @@ export const MODELS = {
|
|
|
8784
9401
|
reasoning: true,
|
|
8785
9402
|
input: ["text"],
|
|
8786
9403
|
cost: {
|
|
8787
|
-
input: 0.
|
|
8788
|
-
output: 0.
|
|
8789
|
-
cacheRead: 0
|
|
9404
|
+
input: 0.2288,
|
|
9405
|
+
output: 0.3432,
|
|
9406
|
+
cacheRead: 0,
|
|
8790
9407
|
cacheWrite: 0,
|
|
8791
9408
|
},
|
|
8792
9409
|
contextWindow: 131072,
|
|
8793
|
-
maxTokens:
|
|
9410
|
+
maxTokens: 64000,
|
|
8794
9411
|
},
|
|
8795
9412
|
"deepseek/deepseek-v3.2-exp": {
|
|
8796
9413
|
id: "deepseek/deepseek-v3.2-exp",
|
|
@@ -8828,25 +9445,6 @@ export const MODELS = {
|
|
|
8828
9445
|
contextWindow: 1048576,
|
|
8829
9446
|
maxTokens: 131072,
|
|
8830
9447
|
},
|
|
8831
|
-
"deepseek/deepseek-v4-flash:free": {
|
|
8832
|
-
id: "deepseek/deepseek-v4-flash:free",
|
|
8833
|
-
name: "DeepSeek: DeepSeek V4 Flash (free)",
|
|
8834
|
-
api: "openai-completions",
|
|
8835
|
-
provider: "openrouter",
|
|
8836
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
8837
|
-
compat: { "requiresReasoningContentOnAssistantMessages": true },
|
|
8838
|
-
reasoning: true,
|
|
8839
|
-
thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
|
|
8840
|
-
input: ["text"],
|
|
8841
|
-
cost: {
|
|
8842
|
-
input: 0,
|
|
8843
|
-
output: 0,
|
|
8844
|
-
cacheRead: 0,
|
|
8845
|
-
cacheWrite: 0,
|
|
8846
|
-
},
|
|
8847
|
-
contextWindow: 1048576,
|
|
8848
|
-
maxTokens: 384000,
|
|
8849
|
-
},
|
|
8850
9448
|
"deepseek/deepseek-v4-pro": {
|
|
8851
9449
|
id: "deepseek/deepseek-v4-pro",
|
|
8852
9450
|
name: "DeepSeek: DeepSeek V4 Pro",
|
|
@@ -8883,40 +9481,6 @@ export const MODELS = {
|
|
|
8883
9481
|
contextWindow: 32768,
|
|
8884
9482
|
maxTokens: 4096,
|
|
8885
9483
|
},
|
|
8886
|
-
"google/gemini-2.0-flash-001": {
|
|
8887
|
-
id: "google/gemini-2.0-flash-001",
|
|
8888
|
-
name: "Google: Gemini 2.0 Flash",
|
|
8889
|
-
api: "openai-completions",
|
|
8890
|
-
provider: "openrouter",
|
|
8891
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
8892
|
-
reasoning: false,
|
|
8893
|
-
input: ["text", "image"],
|
|
8894
|
-
cost: {
|
|
8895
|
-
input: 0.09999999999999999,
|
|
8896
|
-
output: 0.39999999999999997,
|
|
8897
|
-
cacheRead: 0.024999999999999998,
|
|
8898
|
-
cacheWrite: 0.08333333333333334,
|
|
8899
|
-
},
|
|
8900
|
-
contextWindow: 1048576,
|
|
8901
|
-
maxTokens: 8192,
|
|
8902
|
-
},
|
|
8903
|
-
"google/gemini-2.0-flash-lite-001": {
|
|
8904
|
-
id: "google/gemini-2.0-flash-lite-001",
|
|
8905
|
-
name: "Google: Gemini 2.0 Flash Lite",
|
|
8906
|
-
api: "openai-completions",
|
|
8907
|
-
provider: "openrouter",
|
|
8908
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
8909
|
-
reasoning: false,
|
|
8910
|
-
input: ["text", "image"],
|
|
8911
|
-
cost: {
|
|
8912
|
-
input: 0.075,
|
|
8913
|
-
output: 0.3,
|
|
8914
|
-
cacheRead: 0,
|
|
8915
|
-
cacheWrite: 0,
|
|
8916
|
-
},
|
|
8917
|
-
contextWindow: 1048576,
|
|
8918
|
-
maxTokens: 8192,
|
|
8919
|
-
},
|
|
8920
9484
|
"google/gemini-2.5-flash": {
|
|
8921
9485
|
id: "google/gemini-2.5-flash",
|
|
8922
9486
|
name: "Google: Gemini 2.5 Flash",
|
|
@@ -9130,8 +9694,8 @@ export const MODELS = {
|
|
|
9130
9694
|
reasoning: false,
|
|
9131
9695
|
input: ["text", "image"],
|
|
9132
9696
|
cost: {
|
|
9133
|
-
input: 0.
|
|
9134
|
-
output: 0.
|
|
9697
|
+
input: 0.049999999999999996,
|
|
9698
|
+
output: 0.15,
|
|
9135
9699
|
cacheRead: 0,
|
|
9136
9700
|
cacheWrite: 0,
|
|
9137
9701
|
},
|
|
@@ -9199,12 +9763,12 @@ export const MODELS = {
|
|
|
9199
9763
|
input: ["text", "image"],
|
|
9200
9764
|
cost: {
|
|
9201
9765
|
input: 0.12,
|
|
9202
|
-
output: 0.
|
|
9203
|
-
cacheRead: 0,
|
|
9766
|
+
output: 0.36,
|
|
9767
|
+
cacheRead: 0.09,
|
|
9204
9768
|
cacheWrite: 0,
|
|
9205
9769
|
},
|
|
9206
9770
|
contextWindow: 262144,
|
|
9207
|
-
maxTokens:
|
|
9771
|
+
maxTokens: 8192,
|
|
9208
9772
|
},
|
|
9209
9773
|
"google/gemma-4-31b-it:free": {
|
|
9210
9774
|
id: "google/gemma-4-31b-it:free",
|
|
@@ -9353,7 +9917,7 @@ export const MODELS = {
|
|
|
9353
9917
|
input: ["text"],
|
|
9354
9918
|
cost: {
|
|
9355
9919
|
input: 0.02,
|
|
9356
|
-
output: 0.
|
|
9920
|
+
output: 0.03,
|
|
9357
9921
|
cacheRead: 0,
|
|
9358
9922
|
cacheWrite: 0,
|
|
9359
9923
|
},
|
|
@@ -9394,6 +9958,23 @@ export const MODELS = {
|
|
|
9394
9958
|
contextWindow: 131072,
|
|
9395
9959
|
maxTokens: 4096,
|
|
9396
9960
|
},
|
|
9961
|
+
"meta-llama/llama-4-maverick": {
|
|
9962
|
+
id: "meta-llama/llama-4-maverick",
|
|
9963
|
+
name: "Meta: Llama 4 Maverick",
|
|
9964
|
+
api: "openai-completions",
|
|
9965
|
+
provider: "openrouter",
|
|
9966
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
9967
|
+
reasoning: false,
|
|
9968
|
+
input: ["text", "image"],
|
|
9969
|
+
cost: {
|
|
9970
|
+
input: 0.15,
|
|
9971
|
+
output: 0.6,
|
|
9972
|
+
cacheRead: 0,
|
|
9973
|
+
cacheWrite: 0,
|
|
9974
|
+
},
|
|
9975
|
+
contextWindow: 1048576,
|
|
9976
|
+
maxTokens: 16384,
|
|
9977
|
+
},
|
|
9397
9978
|
"meta-llama/llama-4-scout": {
|
|
9398
9979
|
id: "meta-llama/llama-4-scout",
|
|
9399
9980
|
name: "Meta: Llama 4 Scout",
|
|
@@ -9403,7 +9984,7 @@ export const MODELS = {
|
|
|
9403
9984
|
reasoning: false,
|
|
9404
9985
|
input: ["text", "image"],
|
|
9405
9986
|
cost: {
|
|
9406
|
-
input: 0.
|
|
9987
|
+
input: 0.09999999999999999,
|
|
9407
9988
|
output: 0.3,
|
|
9408
9989
|
cacheRead: 0,
|
|
9409
9990
|
cacheWrite: 0,
|
|
@@ -9479,39 +10060,39 @@ export const MODELS = {
|
|
|
9479
10060
|
contextWindow: 204800,
|
|
9480
10061
|
maxTokens: 196608,
|
|
9481
10062
|
},
|
|
9482
|
-
"minimax/minimax-m2.
|
|
9483
|
-
id: "minimax/minimax-m2.
|
|
9484
|
-
name: "MiniMax: MiniMax M2.
|
|
10063
|
+
"minimax/minimax-m2.7": {
|
|
10064
|
+
id: "minimax/minimax-m2.7",
|
|
10065
|
+
name: "MiniMax: MiniMax M2.7",
|
|
9485
10066
|
api: "openai-completions",
|
|
9486
10067
|
provider: "openrouter",
|
|
9487
10068
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
9488
10069
|
reasoning: true,
|
|
9489
10070
|
input: ["text"],
|
|
9490
10071
|
cost: {
|
|
9491
|
-
input: 0,
|
|
9492
|
-
output:
|
|
10072
|
+
input: 0.27899999999999997,
|
|
10073
|
+
output: 1.2,
|
|
9493
10074
|
cacheRead: 0,
|
|
9494
10075
|
cacheWrite: 0,
|
|
9495
10076
|
},
|
|
9496
10077
|
contextWindow: 204800,
|
|
9497
|
-
maxTokens:
|
|
10078
|
+
maxTokens: 196608,
|
|
9498
10079
|
},
|
|
9499
|
-
"minimax/minimax-
|
|
9500
|
-
id: "minimax/minimax-
|
|
9501
|
-
name: "MiniMax: MiniMax
|
|
10080
|
+
"minimax/minimax-m3": {
|
|
10081
|
+
id: "minimax/minimax-m3",
|
|
10082
|
+
name: "MiniMax: MiniMax M3",
|
|
9502
10083
|
api: "openai-completions",
|
|
9503
10084
|
provider: "openrouter",
|
|
9504
10085
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
9505
10086
|
reasoning: true,
|
|
9506
|
-
input: ["text"],
|
|
10087
|
+
input: ["text", "image"],
|
|
9507
10088
|
cost: {
|
|
9508
|
-
input: 0.
|
|
10089
|
+
input: 0.3,
|
|
9509
10090
|
output: 1.2,
|
|
9510
|
-
cacheRead: 0,
|
|
10091
|
+
cacheRead: 0.06,
|
|
9511
10092
|
cacheWrite: 0,
|
|
9512
10093
|
},
|
|
9513
|
-
contextWindow:
|
|
9514
|
-
maxTokens:
|
|
10094
|
+
contextWindow: 1048576,
|
|
10095
|
+
maxTokens: 512000,
|
|
9515
10096
|
},
|
|
9516
10097
|
"mistralai/codestral-2508": {
|
|
9517
10098
|
id: "mistralai/codestral-2508",
|
|
@@ -9547,40 +10128,6 @@ export const MODELS = {
|
|
|
9547
10128
|
contextWindow: 262144,
|
|
9548
10129
|
maxTokens: 4096,
|
|
9549
10130
|
},
|
|
9550
|
-
"mistralai/devstral-medium": {
|
|
9551
|
-
id: "mistralai/devstral-medium",
|
|
9552
|
-
name: "Mistral: Devstral Medium",
|
|
9553
|
-
api: "openai-completions",
|
|
9554
|
-
provider: "openrouter",
|
|
9555
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
9556
|
-
reasoning: false,
|
|
9557
|
-
input: ["text"],
|
|
9558
|
-
cost: {
|
|
9559
|
-
input: 0.39999999999999997,
|
|
9560
|
-
output: 2,
|
|
9561
|
-
cacheRead: 0.04,
|
|
9562
|
-
cacheWrite: 0,
|
|
9563
|
-
},
|
|
9564
|
-
contextWindow: 131072,
|
|
9565
|
-
maxTokens: 4096,
|
|
9566
|
-
},
|
|
9567
|
-
"mistralai/devstral-small": {
|
|
9568
|
-
id: "mistralai/devstral-small",
|
|
9569
|
-
name: "Mistral: Devstral Small 1.1",
|
|
9570
|
-
api: "openai-completions",
|
|
9571
|
-
provider: "openrouter",
|
|
9572
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
9573
|
-
reasoning: false,
|
|
9574
|
-
input: ["text"],
|
|
9575
|
-
cost: {
|
|
9576
|
-
input: 0.09999999999999999,
|
|
9577
|
-
output: 0.3,
|
|
9578
|
-
cacheRead: 0.01,
|
|
9579
|
-
cacheWrite: 0,
|
|
9580
|
-
},
|
|
9581
|
-
contextWindow: 131072,
|
|
9582
|
-
maxTokens: 4096,
|
|
9583
|
-
},
|
|
9584
10131
|
"mistralai/ministral-14b-2512": {
|
|
9585
10132
|
id: "mistralai/ministral-14b-2512",
|
|
9586
10133
|
name: "Mistral: Ministral 3 14B 2512",
|
|
@@ -9666,23 +10213,6 @@ export const MODELS = {
|
|
|
9666
10213
|
contextWindow: 131072,
|
|
9667
10214
|
maxTokens: 4096,
|
|
9668
10215
|
},
|
|
9669
|
-
"mistralai/mistral-large-2411": {
|
|
9670
|
-
id: "mistralai/mistral-large-2411",
|
|
9671
|
-
name: "Mistral Large 2411",
|
|
9672
|
-
api: "openai-completions",
|
|
9673
|
-
provider: "openrouter",
|
|
9674
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
9675
|
-
reasoning: false,
|
|
9676
|
-
input: ["text"],
|
|
9677
|
-
cost: {
|
|
9678
|
-
input: 2,
|
|
9679
|
-
output: 6,
|
|
9680
|
-
cacheRead: 0.19999999999999998,
|
|
9681
|
-
cacheWrite: 0,
|
|
9682
|
-
},
|
|
9683
|
-
contextWindow: 131072,
|
|
9684
|
-
maxTokens: 4096,
|
|
9685
|
-
},
|
|
9686
10216
|
"mistralai/mistral-large-2512": {
|
|
9687
10217
|
id: "mistralai/mistral-large-2512",
|
|
9688
10218
|
name: "Mistral: Mistral Large 3 2512",
|
|
@@ -9816,41 +10346,24 @@ export const MODELS = {
|
|
|
9816
10346
|
cacheRead: 0,
|
|
9817
10347
|
cacheWrite: 0,
|
|
9818
10348
|
},
|
|
9819
|
-
contextWindow: 128000,
|
|
9820
|
-
maxTokens: 16384,
|
|
9821
|
-
},
|
|
9822
|
-
"mistralai/mixtral-8x22b-instruct": {
|
|
9823
|
-
id: "mistralai/mixtral-8x22b-instruct",
|
|
9824
|
-
name: "Mistral: Mixtral 8x22B Instruct",
|
|
9825
|
-
api: "openai-completions",
|
|
9826
|
-
provider: "openrouter",
|
|
9827
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
9828
|
-
reasoning: false,
|
|
9829
|
-
input: ["text"],
|
|
9830
|
-
cost: {
|
|
9831
|
-
input: 2,
|
|
9832
|
-
output: 6,
|
|
9833
|
-
cacheRead: 0.19999999999999998,
|
|
9834
|
-
cacheWrite: 0,
|
|
9835
|
-
},
|
|
9836
|
-
contextWindow: 65536,
|
|
9837
|
-
maxTokens: 4096,
|
|
10349
|
+
contextWindow: 128000,
|
|
10350
|
+
maxTokens: 16384,
|
|
9838
10351
|
},
|
|
9839
|
-
"mistralai/
|
|
9840
|
-
id: "mistralai/
|
|
9841
|
-
name: "Mistral:
|
|
10352
|
+
"mistralai/mixtral-8x22b-instruct": {
|
|
10353
|
+
id: "mistralai/mixtral-8x22b-instruct",
|
|
10354
|
+
name: "Mistral: Mixtral 8x22B Instruct",
|
|
9842
10355
|
api: "openai-completions",
|
|
9843
10356
|
provider: "openrouter",
|
|
9844
10357
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
9845
10358
|
reasoning: false,
|
|
9846
|
-
input: ["text"
|
|
10359
|
+
input: ["text"],
|
|
9847
10360
|
cost: {
|
|
9848
10361
|
input: 2,
|
|
9849
10362
|
output: 6,
|
|
9850
10363
|
cacheRead: 0.19999999999999998,
|
|
9851
10364
|
cacheWrite: 0,
|
|
9852
10365
|
},
|
|
9853
|
-
contextWindow:
|
|
10366
|
+
contextWindow: 65536,
|
|
9854
10367
|
maxTokens: 4096,
|
|
9855
10368
|
},
|
|
9856
10369
|
"mistralai/voxtral-small-24b-2507": {
|
|
@@ -9944,17 +10457,17 @@ export const MODELS = {
|
|
|
9944
10457
|
api: "openai-completions",
|
|
9945
10458
|
provider: "openrouter",
|
|
9946
10459
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
9947
|
-
compat: { "supportsDeveloperRole": false },
|
|
10460
|
+
compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
|
|
9948
10461
|
reasoning: true,
|
|
9949
10462
|
input: ["text", "image"],
|
|
9950
10463
|
cost: {
|
|
9951
|
-
input: 0.
|
|
9952
|
-
output: 3.
|
|
9953
|
-
cacheRead: 0.
|
|
10464
|
+
input: 0.6799999999999999,
|
|
10465
|
+
output: 3.41,
|
|
10466
|
+
cacheRead: 0.33999999999999997,
|
|
9954
10467
|
cacheWrite: 0,
|
|
9955
10468
|
},
|
|
9956
10469
|
contextWindow: 262144,
|
|
9957
|
-
maxTokens:
|
|
10470
|
+
maxTokens: 262142,
|
|
9958
10471
|
},
|
|
9959
10472
|
"moonshotai/kimi-k2.6:free": {
|
|
9960
10473
|
id: "moonshotai/kimi-k2.6:free",
|
|
@@ -9962,7 +10475,7 @@ export const MODELS = {
|
|
|
9962
10475
|
api: "openai-completions",
|
|
9963
10476
|
provider: "openrouter",
|
|
9964
10477
|
baseUrl: "https://openrouter.ai/api/v1",
|
|
9965
|
-
compat: { "supportsDeveloperRole": false },
|
|
10478
|
+
compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
|
|
9966
10479
|
reasoning: true,
|
|
9967
10480
|
input: ["text", "image"],
|
|
9968
10481
|
cost: {
|
|
@@ -9974,23 +10487,6 @@ export const MODELS = {
|
|
|
9974
10487
|
contextWindow: 262144,
|
|
9975
10488
|
maxTokens: 4096,
|
|
9976
10489
|
},
|
|
9977
|
-
"nex-agi/deepseek-v3.1-nex-n1": {
|
|
9978
|
-
id: "nex-agi/deepseek-v3.1-nex-n1",
|
|
9979
|
-
name: "Nex AGI: DeepSeek V3.1 Nex N1",
|
|
9980
|
-
api: "openai-completions",
|
|
9981
|
-
provider: "openrouter",
|
|
9982
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
9983
|
-
reasoning: false,
|
|
9984
|
-
input: ["text"],
|
|
9985
|
-
cost: {
|
|
9986
|
-
input: 0.135,
|
|
9987
|
-
output: 0.5,
|
|
9988
|
-
cacheRead: 0,
|
|
9989
|
-
cacheWrite: 0,
|
|
9990
|
-
},
|
|
9991
|
-
contextWindow: 131072,
|
|
9992
|
-
maxTokens: 163840,
|
|
9993
|
-
},
|
|
9994
10490
|
"nvidia/llama-3.3-nemotron-super-49b-v1.5": {
|
|
9995
10491
|
id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
|
|
9996
10492
|
name: "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5",
|
|
@@ -10000,7 +10496,7 @@ export const MODELS = {
|
|
|
10000
10496
|
reasoning: true,
|
|
10001
10497
|
input: ["text"],
|
|
10002
10498
|
cost: {
|
|
10003
|
-
input: 0.
|
|
10499
|
+
input: 0.39999999999999997,
|
|
10004
10500
|
output: 0.39999999999999997,
|
|
10005
10501
|
cacheRead: 0,
|
|
10006
10502
|
cacheWrite: 0,
|
|
@@ -10093,6 +10589,40 @@ export const MODELS = {
|
|
|
10093
10589
|
contextWindow: 1000000,
|
|
10094
10590
|
maxTokens: 262144,
|
|
10095
10591
|
},
|
|
10592
|
+
"nvidia/nemotron-3-ultra-550b-a55b": {
|
|
10593
|
+
id: "nvidia/nemotron-3-ultra-550b-a55b",
|
|
10594
|
+
name: "NVIDIA: Nemotron 3 Ultra",
|
|
10595
|
+
api: "openai-completions",
|
|
10596
|
+
provider: "openrouter",
|
|
10597
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
10598
|
+
reasoning: true,
|
|
10599
|
+
input: ["text"],
|
|
10600
|
+
cost: {
|
|
10601
|
+
input: 0.5,
|
|
10602
|
+
output: 2.5,
|
|
10603
|
+
cacheRead: 0.15,
|
|
10604
|
+
cacheWrite: 0,
|
|
10605
|
+
},
|
|
10606
|
+
contextWindow: 1000000,
|
|
10607
|
+
maxTokens: 16384,
|
|
10608
|
+
},
|
|
10609
|
+
"nvidia/nemotron-3-ultra-550b-a55b:free": {
|
|
10610
|
+
id: "nvidia/nemotron-3-ultra-550b-a55b:free",
|
|
10611
|
+
name: "NVIDIA: Nemotron 3 Ultra (free)",
|
|
10612
|
+
api: "openai-completions",
|
|
10613
|
+
provider: "openrouter",
|
|
10614
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
10615
|
+
reasoning: true,
|
|
10616
|
+
input: ["text"],
|
|
10617
|
+
cost: {
|
|
10618
|
+
input: 0,
|
|
10619
|
+
output: 0,
|
|
10620
|
+
cacheRead: 0,
|
|
10621
|
+
cacheWrite: 0,
|
|
10622
|
+
},
|
|
10623
|
+
contextWindow: 1000000,
|
|
10624
|
+
maxTokens: 65536,
|
|
10625
|
+
},
|
|
10096
10626
|
"nvidia/nemotron-nano-12b-v2-vl:free": {
|
|
10097
10627
|
id: "nvidia/nemotron-nano-12b-v2-vl:free",
|
|
10098
10628
|
name: "NVIDIA: Nemotron Nano 12B 2 VL (free)",
|
|
@@ -10212,40 +10742,6 @@ export const MODELS = {
|
|
|
10212
10742
|
contextWindow: 8191,
|
|
10213
10743
|
maxTokens: 4096,
|
|
10214
10744
|
},
|
|
10215
|
-
"openai/gpt-4-0314": {
|
|
10216
|
-
id: "openai/gpt-4-0314",
|
|
10217
|
-
name: "OpenAI: GPT-4 (older v0314)",
|
|
10218
|
-
api: "openai-completions",
|
|
10219
|
-
provider: "openrouter",
|
|
10220
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
10221
|
-
reasoning: false,
|
|
10222
|
-
input: ["text"],
|
|
10223
|
-
cost: {
|
|
10224
|
-
input: 30,
|
|
10225
|
-
output: 60,
|
|
10226
|
-
cacheRead: 0,
|
|
10227
|
-
cacheWrite: 0,
|
|
10228
|
-
},
|
|
10229
|
-
contextWindow: 8191,
|
|
10230
|
-
maxTokens: 4096,
|
|
10231
|
-
},
|
|
10232
|
-
"openai/gpt-4-1106-preview": {
|
|
10233
|
-
id: "openai/gpt-4-1106-preview",
|
|
10234
|
-
name: "OpenAI: GPT-4 Turbo (older v1106)",
|
|
10235
|
-
api: "openai-completions",
|
|
10236
|
-
provider: "openrouter",
|
|
10237
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
10238
|
-
reasoning: false,
|
|
10239
|
-
input: ["text"],
|
|
10240
|
-
cost: {
|
|
10241
|
-
input: 10,
|
|
10242
|
-
output: 30,
|
|
10243
|
-
cacheRead: 0,
|
|
10244
|
-
cacheWrite: 0,
|
|
10245
|
-
},
|
|
10246
|
-
contextWindow: 128000,
|
|
10247
|
-
maxTokens: 4096,
|
|
10248
|
-
},
|
|
10249
10745
|
"openai/gpt-4-turbo": {
|
|
10250
10746
|
id: "openai/gpt-4-turbo",
|
|
10251
10747
|
name: "OpenAI: GPT-4 Turbo",
|
|
@@ -10913,13 +11409,13 @@ export const MODELS = {
|
|
|
10913
11409
|
reasoning: true,
|
|
10914
11410
|
input: ["text"],
|
|
10915
11411
|
cost: {
|
|
10916
|
-
input: 0.
|
|
11412
|
+
input: 0.029,
|
|
10917
11413
|
output: 0.14,
|
|
10918
11414
|
cacheRead: 0,
|
|
10919
11415
|
cacheWrite: 0,
|
|
10920
11416
|
},
|
|
10921
11417
|
contextWindow: 131072,
|
|
10922
|
-
maxTokens:
|
|
11418
|
+
maxTokens: 4096,
|
|
10923
11419
|
},
|
|
10924
11420
|
"openai/gpt-oss-20b:free": {
|
|
10925
11421
|
id: "openai/gpt-oss-20b:free",
|
|
@@ -11227,23 +11723,6 @@ export const MODELS = {
|
|
|
11227
11723
|
contextWindow: 131072,
|
|
11228
11724
|
maxTokens: 16384,
|
|
11229
11725
|
},
|
|
11230
|
-
"qwen/qwen-2.5-7b-instruct": {
|
|
11231
|
-
id: "qwen/qwen-2.5-7b-instruct",
|
|
11232
|
-
name: "Qwen: Qwen2.5 7B Instruct",
|
|
11233
|
-
api: "openai-completions",
|
|
11234
|
-
provider: "openrouter",
|
|
11235
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
11236
|
-
reasoning: false,
|
|
11237
|
-
input: ["text"],
|
|
11238
|
-
cost: {
|
|
11239
|
-
input: 0.04,
|
|
11240
|
-
output: 0.09999999999999999,
|
|
11241
|
-
cacheRead: 0,
|
|
11242
|
-
cacheWrite: 0,
|
|
11243
|
-
},
|
|
11244
|
-
contextWindow: 131072,
|
|
11245
|
-
maxTokens: 32768,
|
|
11246
|
-
},
|
|
11247
11726
|
"qwen/qwen-plus": {
|
|
11248
11727
|
id: "qwen/qwen-plus",
|
|
11249
11728
|
name: "Qwen: Qwen-Plus",
|
|
@@ -11338,7 +11817,7 @@ export const MODELS = {
|
|
|
11338
11817
|
reasoning: false,
|
|
11339
11818
|
input: ["text"],
|
|
11340
11819
|
cost: {
|
|
11341
|
-
input: 0.
|
|
11820
|
+
input: 0.09,
|
|
11342
11821
|
output: 0.09999999999999999,
|
|
11343
11822
|
cacheRead: 0,
|
|
11344
11823
|
cacheWrite: 0,
|
|
@@ -11355,13 +11834,13 @@ export const MODELS = {
|
|
|
11355
11834
|
reasoning: true,
|
|
11356
11835
|
input: ["text"],
|
|
11357
11836
|
cost: {
|
|
11358
|
-
input: 0.
|
|
11359
|
-
output:
|
|
11360
|
-
cacheRead: 0,
|
|
11837
|
+
input: 0.09999999999999999,
|
|
11838
|
+
output: 0.09999999999999999,
|
|
11839
|
+
cacheRead: 0.09999999999999999,
|
|
11361
11840
|
cacheWrite: 0,
|
|
11362
11841
|
},
|
|
11363
11842
|
contextWindow: 262144,
|
|
11364
|
-
maxTokens:
|
|
11843
|
+
maxTokens: 262144,
|
|
11365
11844
|
},
|
|
11366
11845
|
"qwen/qwen3-30b-a3b": {
|
|
11367
11846
|
id: "qwen/qwen3-30b-a3b",
|
|
@@ -11372,13 +11851,13 @@ export const MODELS = {
|
|
|
11372
11851
|
reasoning: true,
|
|
11373
11852
|
input: ["text"],
|
|
11374
11853
|
cost: {
|
|
11375
|
-
input: 0.
|
|
11376
|
-
output: 0.
|
|
11854
|
+
input: 0.12,
|
|
11855
|
+
output: 0.5,
|
|
11377
11856
|
cacheRead: 0,
|
|
11378
11857
|
cacheWrite: 0,
|
|
11379
11858
|
},
|
|
11380
11859
|
contextWindow: 131072,
|
|
11381
|
-
maxTokens:
|
|
11860
|
+
maxTokens: 16384,
|
|
11382
11861
|
},
|
|
11383
11862
|
"qwen/qwen3-30b-a3b-instruct-2507": {
|
|
11384
11863
|
id: "qwen/qwen3-30b-a3b-instruct-2507",
|
|
@@ -11389,13 +11868,13 @@ export const MODELS = {
|
|
|
11389
11868
|
reasoning: false,
|
|
11390
11869
|
input: ["text"],
|
|
11391
11870
|
cost: {
|
|
11392
|
-
input: 0.
|
|
11393
|
-
output: 0.
|
|
11871
|
+
input: 0.04815,
|
|
11872
|
+
output: 0.19305,
|
|
11394
11873
|
cacheRead: 0,
|
|
11395
11874
|
cacheWrite: 0,
|
|
11396
11875
|
},
|
|
11397
|
-
contextWindow:
|
|
11398
|
-
maxTokens:
|
|
11876
|
+
contextWindow: 131072,
|
|
11877
|
+
maxTokens: 32000,
|
|
11399
11878
|
},
|
|
11400
11879
|
"qwen/qwen3-30b-a3b-thinking-2507": {
|
|
11401
11880
|
id: "qwen/qwen3-30b-a3b-thinking-2507",
|
|
@@ -11797,13 +12276,13 @@ export const MODELS = {
|
|
|
11797
12276
|
reasoning: true,
|
|
11798
12277
|
input: ["text", "image"],
|
|
11799
12278
|
cost: {
|
|
11800
|
-
input: 0.
|
|
12279
|
+
input: 0.14,
|
|
11801
12280
|
output: 1,
|
|
11802
|
-
cacheRead: 0,
|
|
12281
|
+
cacheRead: 0.049999999999999996,
|
|
11803
12282
|
cacheWrite: 0,
|
|
11804
12283
|
},
|
|
11805
12284
|
contextWindow: 262144,
|
|
11806
|
-
maxTokens:
|
|
12285
|
+
maxTokens: 262144,
|
|
11807
12286
|
},
|
|
11808
12287
|
"qwen/qwen3.5-397b-a17b": {
|
|
11809
12288
|
id: "qwen/qwen3.5-397b-a17b",
|
|
@@ -11831,13 +12310,13 @@ export const MODELS = {
|
|
|
11831
12310
|
reasoning: true,
|
|
11832
12311
|
input: ["text", "image"],
|
|
11833
12312
|
cost: {
|
|
11834
|
-
input: 0.
|
|
12313
|
+
input: 0.09999999999999999,
|
|
11835
12314
|
output: 0.15,
|
|
11836
12315
|
cacheRead: 0,
|
|
11837
12316
|
cacheWrite: 0,
|
|
11838
12317
|
},
|
|
11839
12318
|
contextWindow: 262144,
|
|
11840
|
-
maxTokens:
|
|
12319
|
+
maxTokens: 262144,
|
|
11841
12320
|
},
|
|
11842
12321
|
"qwen/qwen3.5-flash-02-23": {
|
|
11843
12322
|
id: "qwen/qwen3.5-flash-02-23",
|
|
@@ -11899,13 +12378,13 @@ export const MODELS = {
|
|
|
11899
12378
|
reasoning: true,
|
|
11900
12379
|
input: ["text", "image"],
|
|
11901
12380
|
cost: {
|
|
11902
|
-
input: 0.
|
|
11903
|
-
output:
|
|
12381
|
+
input: 0.28900000000000003,
|
|
12382
|
+
output: 2.4,
|
|
11904
12383
|
cacheRead: 0,
|
|
11905
12384
|
cacheWrite: 0,
|
|
11906
12385
|
},
|
|
11907
12386
|
contextWindow: 262144,
|
|
11908
|
-
maxTokens:
|
|
12387
|
+
maxTokens: 131072,
|
|
11909
12388
|
},
|
|
11910
12389
|
"qwen/qwen3.6-35b-a3b": {
|
|
11911
12390
|
id: "qwen/qwen3.6-35b-a3b",
|
|
@@ -11992,6 +12471,23 @@ export const MODELS = {
|
|
|
11992
12471
|
contextWindow: 1000000,
|
|
11993
12472
|
maxTokens: 65536,
|
|
11994
12473
|
},
|
|
12474
|
+
"qwen/qwen3.7-plus": {
|
|
12475
|
+
id: "qwen/qwen3.7-plus",
|
|
12476
|
+
name: "Qwen: Qwen3.7 Plus",
|
|
12477
|
+
api: "openai-completions",
|
|
12478
|
+
provider: "openrouter",
|
|
12479
|
+
baseUrl: "https://openrouter.ai/api/v1",
|
|
12480
|
+
reasoning: true,
|
|
12481
|
+
input: ["text", "image"],
|
|
12482
|
+
cost: {
|
|
12483
|
+
input: 0.39999999999999997,
|
|
12484
|
+
output: 1.5999999999999999,
|
|
12485
|
+
cacheRead: 0.08,
|
|
12486
|
+
cacheWrite: 0.5,
|
|
12487
|
+
},
|
|
12488
|
+
contextWindow: 1000000,
|
|
12489
|
+
maxTokens: 65536,
|
|
12490
|
+
},
|
|
11995
12491
|
"rekaai/reka-edge": {
|
|
11996
12492
|
id: "rekaai/reka-edge",
|
|
11997
12493
|
name: "Reka Edge",
|
|
@@ -12026,23 +12522,6 @@ export const MODELS = {
|
|
|
12026
12522
|
contextWindow: 256000,
|
|
12027
12523
|
maxTokens: 128000,
|
|
12028
12524
|
},
|
|
12029
|
-
"sao10k/l3-euryale-70b": {
|
|
12030
|
-
id: "sao10k/l3-euryale-70b",
|
|
12031
|
-
name: "Sao10k: Llama 3 Euryale 70B v2.1",
|
|
12032
|
-
api: "openai-completions",
|
|
12033
|
-
provider: "openrouter",
|
|
12034
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12035
|
-
reasoning: false,
|
|
12036
|
-
input: ["text"],
|
|
12037
|
-
cost: {
|
|
12038
|
-
input: 1.48,
|
|
12039
|
-
output: 1.48,
|
|
12040
|
-
cacheRead: 0,
|
|
12041
|
-
cacheWrite: 0,
|
|
12042
|
-
},
|
|
12043
|
-
contextWindow: 8192,
|
|
12044
|
-
maxTokens: 8192,
|
|
12045
|
-
},
|
|
12046
12525
|
"sao10k/l3.1-euryale-70b": {
|
|
12047
12526
|
id: "sao10k/l3.1-euryale-70b",
|
|
12048
12527
|
name: "Sao10K: Llama 3.1 Euryale 70B v2.2",
|
|
@@ -12230,40 +12709,6 @@ export const MODELS = {
|
|
|
12230
12709
|
contextWindow: 262144,
|
|
12231
12710
|
maxTokens: 65536,
|
|
12232
12711
|
},
|
|
12233
|
-
"xiaomi/mimo-v2-omni": {
|
|
12234
|
-
id: "xiaomi/mimo-v2-omni",
|
|
12235
|
-
name: "Xiaomi: MiMo-V2-Omni",
|
|
12236
|
-
api: "openai-completions",
|
|
12237
|
-
provider: "openrouter",
|
|
12238
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12239
|
-
reasoning: true,
|
|
12240
|
-
input: ["text", "image"],
|
|
12241
|
-
cost: {
|
|
12242
|
-
input: 0.39999999999999997,
|
|
12243
|
-
output: 2,
|
|
12244
|
-
cacheRead: 0.08,
|
|
12245
|
-
cacheWrite: 0,
|
|
12246
|
-
},
|
|
12247
|
-
contextWindow: 262144,
|
|
12248
|
-
maxTokens: 65536,
|
|
12249
|
-
},
|
|
12250
|
-
"xiaomi/mimo-v2-pro": {
|
|
12251
|
-
id: "xiaomi/mimo-v2-pro",
|
|
12252
|
-
name: "Xiaomi: MiMo-V2-Pro",
|
|
12253
|
-
api: "openai-completions",
|
|
12254
|
-
provider: "openrouter",
|
|
12255
|
-
baseUrl: "https://openrouter.ai/api/v1",
|
|
12256
|
-
reasoning: true,
|
|
12257
|
-
input: ["text"],
|
|
12258
|
-
cost: {
|
|
12259
|
-
input: 1,
|
|
12260
|
-
output: 3,
|
|
12261
|
-
cacheRead: 0.19999999999999998,
|
|
12262
|
-
cacheWrite: 0,
|
|
12263
|
-
},
|
|
12264
|
-
contextWindow: 1048576,
|
|
12265
|
-
maxTokens: 131072,
|
|
12266
|
-
},
|
|
12267
12712
|
"xiaomi/mimo-v2.5": {
|
|
12268
12713
|
id: "xiaomi/mimo-v2.5",
|
|
12269
12714
|
name: "Xiaomi: MiMo-V2.5",
|
|
@@ -12613,13 +13058,13 @@ export const MODELS = {
|
|
|
12613
13058
|
reasoning: true,
|
|
12614
13059
|
input: ["text", "image"],
|
|
12615
13060
|
cost: {
|
|
12616
|
-
input: 0.
|
|
12617
|
-
output: 3.
|
|
12618
|
-
cacheRead: 0.
|
|
13061
|
+
input: 0.6799999999999999,
|
|
13062
|
+
output: 3.41,
|
|
13063
|
+
cacheRead: 0.33999999999999997,
|
|
12619
13064
|
cacheWrite: 0,
|
|
12620
13065
|
},
|
|
12621
13066
|
contextWindow: 262144,
|
|
12622
|
-
maxTokens:
|
|
13067
|
+
maxTokens: 262142,
|
|
12623
13068
|
},
|
|
12624
13069
|
"~openai/gpt-latest": {
|
|
12625
13070
|
id: "~openai/gpt-latest",
|
|
@@ -12810,7 +13255,7 @@ export const MODELS = {
|
|
|
12810
13255
|
},
|
|
12811
13256
|
"deepseek-ai/DeepSeek-V3": {
|
|
12812
13257
|
id: "deepseek-ai/DeepSeek-V3",
|
|
12813
|
-
name: "DeepSeek
|
|
13258
|
+
name: "DeepSeek-V3",
|
|
12814
13259
|
api: "openai-completions",
|
|
12815
13260
|
provider: "together",
|
|
12816
13261
|
baseUrl: "https://api.together.ai/v1",
|
|
@@ -12958,6 +13403,25 @@ export const MODELS = {
|
|
|
12958
13403
|
contextWindow: 262144,
|
|
12959
13404
|
maxTokens: 131000,
|
|
12960
13405
|
},
|
|
13406
|
+
"nvidia/nemotron-3-ultra-550b-a55b": {
|
|
13407
|
+
id: "nvidia/nemotron-3-ultra-550b-a55b",
|
|
13408
|
+
name: "Nemotron 3 Ultra 550B A55B",
|
|
13409
|
+
api: "openai-completions",
|
|
13410
|
+
provider: "together",
|
|
13411
|
+
baseUrl: "https://api.together.ai/v1",
|
|
13412
|
+
compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
|
|
13413
|
+
reasoning: true,
|
|
13414
|
+
thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
|
|
13415
|
+
input: ["text"],
|
|
13416
|
+
cost: {
|
|
13417
|
+
input: 0.6,
|
|
13418
|
+
output: 3.6,
|
|
13419
|
+
cacheRead: 0.2,
|
|
13420
|
+
cacheWrite: 0,
|
|
13421
|
+
},
|
|
13422
|
+
contextWindow: 512300,
|
|
13423
|
+
maxTokens: 512300,
|
|
13424
|
+
},
|
|
12961
13425
|
"openai/gpt-oss-120b": {
|
|
12962
13426
|
id: "openai/gpt-oss-120b",
|
|
12963
13427
|
name: "GPT OSS 120B",
|
|
@@ -13021,7 +13485,7 @@ export const MODELS = {
|
|
|
13021
13485
|
api: "anthropic-messages",
|
|
13022
13486
|
provider: "vercel-ai-gateway",
|
|
13023
13487
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13024
|
-
reasoning:
|
|
13488
|
+
reasoning: true,
|
|
13025
13489
|
input: ["text"],
|
|
13026
13490
|
cost: {
|
|
13027
13491
|
input: 0.22,
|
|
@@ -13073,7 +13537,7 @@ export const MODELS = {
|
|
|
13073
13537
|
provider: "vercel-ai-gateway",
|
|
13074
13538
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13075
13539
|
reasoning: true,
|
|
13076
|
-
input: ["text"
|
|
13540
|
+
input: ["text"],
|
|
13077
13541
|
cost: {
|
|
13078
13542
|
input: 1.3,
|
|
13079
13543
|
output: 7.8,
|
|
@@ -13106,7 +13570,7 @@ export const MODELS = {
|
|
|
13106
13570
|
api: "anthropic-messages",
|
|
13107
13571
|
provider: "vercel-ai-gateway",
|
|
13108
13572
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13109
|
-
reasoning:
|
|
13573
|
+
reasoning: true,
|
|
13110
13574
|
input: ["text"],
|
|
13111
13575
|
cost: {
|
|
13112
13576
|
input: 1.5,
|
|
@@ -13140,7 +13604,7 @@ export const MODELS = {
|
|
|
13140
13604
|
api: "anthropic-messages",
|
|
13141
13605
|
provider: "vercel-ai-gateway",
|
|
13142
13606
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13143
|
-
reasoning:
|
|
13607
|
+
reasoning: true,
|
|
13144
13608
|
input: ["text"],
|
|
13145
13609
|
cost: {
|
|
13146
13610
|
input: 0.5,
|
|
@@ -13219,6 +13683,40 @@ export const MODELS = {
|
|
|
13219
13683
|
contextWindow: 256000,
|
|
13220
13684
|
maxTokens: 65536,
|
|
13221
13685
|
},
|
|
13686
|
+
"alibaba/qwen3-next-80b-a3b-instruct": {
|
|
13687
|
+
id: "alibaba/qwen3-next-80b-a3b-instruct",
|
|
13688
|
+
name: "Qwen3 Next 80B A3B Instruct",
|
|
13689
|
+
api: "anthropic-messages",
|
|
13690
|
+
provider: "vercel-ai-gateway",
|
|
13691
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13692
|
+
reasoning: false,
|
|
13693
|
+
input: ["text"],
|
|
13694
|
+
cost: {
|
|
13695
|
+
input: 0.15,
|
|
13696
|
+
output: 1.2,
|
|
13697
|
+
cacheRead: 0,
|
|
13698
|
+
cacheWrite: 0,
|
|
13699
|
+
},
|
|
13700
|
+
contextWindow: 131072,
|
|
13701
|
+
maxTokens: 32768,
|
|
13702
|
+
},
|
|
13703
|
+
"alibaba/qwen3-next-80b-a3b-thinking": {
|
|
13704
|
+
id: "alibaba/qwen3-next-80b-a3b-thinking",
|
|
13705
|
+
name: "Qwen3 Next 80B A3B Thinking",
|
|
13706
|
+
api: "anthropic-messages",
|
|
13707
|
+
provider: "vercel-ai-gateway",
|
|
13708
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13709
|
+
reasoning: true,
|
|
13710
|
+
input: ["text"],
|
|
13711
|
+
cost: {
|
|
13712
|
+
input: 0.15,
|
|
13713
|
+
output: 1.2,
|
|
13714
|
+
cacheRead: 0,
|
|
13715
|
+
cacheWrite: 0,
|
|
13716
|
+
},
|
|
13717
|
+
contextWindow: 131072,
|
|
13718
|
+
maxTokens: 32768,
|
|
13719
|
+
},
|
|
13222
13720
|
"alibaba/qwen3-vl-thinking": {
|
|
13223
13721
|
id: "alibaba/qwen3-vl-thinking",
|
|
13224
13722
|
name: "Qwen3 VL 235B A22B Thinking",
|
|
@@ -13311,14 +13809,31 @@ export const MODELS = {
|
|
|
13311
13809
|
provider: "vercel-ai-gateway",
|
|
13312
13810
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13313
13811
|
reasoning: true,
|
|
13314
|
-
input: ["text"
|
|
13812
|
+
input: ["text"],
|
|
13315
13813
|
cost: {
|
|
13316
13814
|
input: 1.25,
|
|
13317
13815
|
output: 3.75,
|
|
13318
13816
|
cacheRead: 0.25,
|
|
13319
13817
|
cacheWrite: 1.5625,
|
|
13320
13818
|
},
|
|
13321
|
-
contextWindow: 991000,
|
|
13819
|
+
contextWindow: 991000,
|
|
13820
|
+
maxTokens: 64000,
|
|
13821
|
+
},
|
|
13822
|
+
"alibaba/qwen3.7-plus": {
|
|
13823
|
+
id: "alibaba/qwen3.7-plus",
|
|
13824
|
+
name: "Qwen 3.7 Plus",
|
|
13825
|
+
api: "anthropic-messages",
|
|
13826
|
+
provider: "vercel-ai-gateway",
|
|
13827
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13828
|
+
reasoning: true,
|
|
13829
|
+
input: ["text", "image"],
|
|
13830
|
+
cost: {
|
|
13831
|
+
input: 0.39999999999999997,
|
|
13832
|
+
output: 1.5999999999999999,
|
|
13833
|
+
cacheRead: 0.08,
|
|
13834
|
+
cacheWrite: 0.5,
|
|
13835
|
+
},
|
|
13836
|
+
contextWindow: 1000000,
|
|
13322
13837
|
maxTokens: 64000,
|
|
13323
13838
|
},
|
|
13324
13839
|
"anthropic/claude-3-haiku": {
|
|
@@ -13448,7 +13963,7 @@ export const MODELS = {
|
|
|
13448
13963
|
api: "anthropic-messages",
|
|
13449
13964
|
provider: "vercel-ai-gateway",
|
|
13450
13965
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13451
|
-
compat: { "forceAdaptiveThinking": true },
|
|
13966
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
13452
13967
|
reasoning: true,
|
|
13453
13968
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
13454
13969
|
input: ["text", "image"],
|
|
@@ -13467,7 +13982,7 @@ export const MODELS = {
|
|
|
13467
13982
|
api: "anthropic-messages",
|
|
13468
13983
|
provider: "vercel-ai-gateway",
|
|
13469
13984
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13470
|
-
compat: { "forceAdaptiveThinking": true },
|
|
13985
|
+
compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
|
|
13471
13986
|
reasoning: true,
|
|
13472
13987
|
thinkingLevelMap: { "xhigh": "xhigh" },
|
|
13473
13988
|
input: ["text", "image"],
|
|
@@ -13626,17 +14141,17 @@ export const MODELS = {
|
|
|
13626
14141
|
reasoning: false,
|
|
13627
14142
|
input: ["text"],
|
|
13628
14143
|
cost: {
|
|
13629
|
-
input: 0.
|
|
13630
|
-
output:
|
|
13631
|
-
cacheRead: 0,
|
|
14144
|
+
input: 0.27,
|
|
14145
|
+
output: 1.12,
|
|
14146
|
+
cacheRead: 0.135,
|
|
13632
14147
|
cacheWrite: 0,
|
|
13633
14148
|
},
|
|
13634
14149
|
contextWindow: 163840,
|
|
13635
|
-
maxTokens:
|
|
14150
|
+
maxTokens: 163840,
|
|
13636
14151
|
},
|
|
13637
14152
|
"deepseek/deepseek-v3.1": {
|
|
13638
14153
|
id: "deepseek/deepseek-v3.1",
|
|
13639
|
-
name: "DeepSeek
|
|
14154
|
+
name: "DeepSeek V3.1",
|
|
13640
14155
|
api: "anthropic-messages",
|
|
13641
14156
|
provider: "vercel-ai-gateway",
|
|
13642
14157
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
@@ -13674,8 +14189,8 @@ export const MODELS = {
|
|
|
13674
14189
|
api: "anthropic-messages",
|
|
13675
14190
|
provider: "vercel-ai-gateway",
|
|
13676
14191
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13677
|
-
reasoning:
|
|
13678
|
-
input: ["text"],
|
|
14192
|
+
reasoning: true,
|
|
14193
|
+
input: ["text", "image"],
|
|
13679
14194
|
cost: {
|
|
13680
14195
|
input: 0.28,
|
|
13681
14196
|
output: 0.42,
|
|
@@ -13691,8 +14206,8 @@ export const MODELS = {
|
|
|
13691
14206
|
api: "anthropic-messages",
|
|
13692
14207
|
provider: "vercel-ai-gateway",
|
|
13693
14208
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13694
|
-
reasoning:
|
|
13695
|
-
input: ["text"],
|
|
14209
|
+
reasoning: true,
|
|
14210
|
+
input: ["text", "image"],
|
|
13696
14211
|
cost: {
|
|
13697
14212
|
input: 0.62,
|
|
13698
14213
|
output: 1.85,
|
|
@@ -13709,7 +14224,7 @@ export const MODELS = {
|
|
|
13709
14224
|
provider: "vercel-ai-gateway",
|
|
13710
14225
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13711
14226
|
reasoning: true,
|
|
13712
|
-
input: ["text"],
|
|
14227
|
+
input: ["text", "image"],
|
|
13713
14228
|
cost: {
|
|
13714
14229
|
input: 0.14,
|
|
13715
14230
|
output: 0.28,
|
|
@@ -13736,40 +14251,6 @@ export const MODELS = {
|
|
|
13736
14251
|
contextWindow: 1000000,
|
|
13737
14252
|
maxTokens: 384000,
|
|
13738
14253
|
},
|
|
13739
|
-
"google/gemini-2.0-flash": {
|
|
13740
|
-
id: "google/gemini-2.0-flash",
|
|
13741
|
-
name: "Gemini 2.0 Flash",
|
|
13742
|
-
api: "anthropic-messages",
|
|
13743
|
-
provider: "vercel-ai-gateway",
|
|
13744
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13745
|
-
reasoning: false,
|
|
13746
|
-
input: ["text", "image"],
|
|
13747
|
-
cost: {
|
|
13748
|
-
input: 0.15,
|
|
13749
|
-
output: 0.6,
|
|
13750
|
-
cacheRead: 0.024999999999999998,
|
|
13751
|
-
cacheWrite: 0,
|
|
13752
|
-
},
|
|
13753
|
-
contextWindow: 1048576,
|
|
13754
|
-
maxTokens: 8192,
|
|
13755
|
-
},
|
|
13756
|
-
"google/gemini-2.0-flash-lite": {
|
|
13757
|
-
id: "google/gemini-2.0-flash-lite",
|
|
13758
|
-
name: "Gemini 2.0 Flash Lite",
|
|
13759
|
-
api: "anthropic-messages",
|
|
13760
|
-
provider: "vercel-ai-gateway",
|
|
13761
|
-
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13762
|
-
reasoning: false,
|
|
13763
|
-
input: ["text", "image"],
|
|
13764
|
-
cost: {
|
|
13765
|
-
input: 0.075,
|
|
13766
|
-
output: 0.3,
|
|
13767
|
-
cacheRead: 0.02,
|
|
13768
|
-
cacheWrite: 0,
|
|
13769
|
-
},
|
|
13770
|
-
contextWindow: 1048576,
|
|
13771
|
-
maxTokens: 8192,
|
|
13772
|
-
},
|
|
13773
14254
|
"google/gemini-2.5-flash": {
|
|
13774
14255
|
id: "google/gemini-2.5-flash",
|
|
13775
14256
|
name: "Gemini 2.5 Flash",
|
|
@@ -13929,12 +14410,12 @@ export const MODELS = {
|
|
|
13929
14410
|
api: "anthropic-messages",
|
|
13930
14411
|
provider: "vercel-ai-gateway",
|
|
13931
14412
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
13932
|
-
reasoning:
|
|
14413
|
+
reasoning: true,
|
|
13933
14414
|
input: ["text", "image"],
|
|
13934
14415
|
cost: {
|
|
13935
|
-
input: 0.
|
|
13936
|
-
output: 0.
|
|
13937
|
-
cacheRead: 0,
|
|
14416
|
+
input: 0.15,
|
|
14417
|
+
output: 0.6,
|
|
14418
|
+
cacheRead: 0.015,
|
|
13938
14419
|
cacheWrite: 0,
|
|
13939
14420
|
},
|
|
13940
14421
|
contextWindow: 262144,
|
|
@@ -14236,7 +14717,7 @@ export const MODELS = {
|
|
|
14236
14717
|
provider: "vercel-ai-gateway",
|
|
14237
14718
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
14238
14719
|
reasoning: true,
|
|
14239
|
-
input: ["text"
|
|
14720
|
+
input: ["text"],
|
|
14240
14721
|
cost: {
|
|
14241
14722
|
input: 0.3,
|
|
14242
14723
|
output: 1.2,
|
|
@@ -14253,7 +14734,7 @@ export const MODELS = {
|
|
|
14253
14734
|
provider: "vercel-ai-gateway",
|
|
14254
14735
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
14255
14736
|
reasoning: true,
|
|
14256
|
-
input: ["text"
|
|
14737
|
+
input: ["text"],
|
|
14257
14738
|
cost: {
|
|
14258
14739
|
input: 0.6,
|
|
14259
14740
|
output: 2.4,
|
|
@@ -14263,6 +14744,23 @@ export const MODELS = {
|
|
|
14263
14744
|
contextWindow: 204800,
|
|
14264
14745
|
maxTokens: 131100,
|
|
14265
14746
|
},
|
|
14747
|
+
"minimax/minimax-m3": {
|
|
14748
|
+
id: "minimax/minimax-m3",
|
|
14749
|
+
name: "MiniMax M3",
|
|
14750
|
+
api: "anthropic-messages",
|
|
14751
|
+
provider: "vercel-ai-gateway",
|
|
14752
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
14753
|
+
reasoning: true,
|
|
14754
|
+
input: ["text", "image"],
|
|
14755
|
+
cost: {
|
|
14756
|
+
input: 0.3,
|
|
14757
|
+
output: 1.2,
|
|
14758
|
+
cacheRead: 0.06,
|
|
14759
|
+
cacheWrite: 0,
|
|
14760
|
+
},
|
|
14761
|
+
contextWindow: 1000000,
|
|
14762
|
+
maxTokens: 1000000,
|
|
14763
|
+
},
|
|
14266
14764
|
"mistral/codestral": {
|
|
14267
14765
|
id: "mistral/codestral",
|
|
14268
14766
|
name: "Mistral Codestral",
|
|
@@ -14399,6 +14897,23 @@ export const MODELS = {
|
|
|
14399
14897
|
contextWindow: 256000,
|
|
14400
14898
|
maxTokens: 256000,
|
|
14401
14899
|
},
|
|
14900
|
+
"mistral/mistral-nemo": {
|
|
14901
|
+
id: "mistral/mistral-nemo",
|
|
14902
|
+
name: "Mistral Nemo 12B",
|
|
14903
|
+
api: "anthropic-messages",
|
|
14904
|
+
provider: "vercel-ai-gateway",
|
|
14905
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
14906
|
+
reasoning: false,
|
|
14907
|
+
input: ["text"],
|
|
14908
|
+
cost: {
|
|
14909
|
+
input: 0.02,
|
|
14910
|
+
output: 0.04,
|
|
14911
|
+
cacheRead: 0,
|
|
14912
|
+
cacheWrite: 0,
|
|
14913
|
+
},
|
|
14914
|
+
contextWindow: 131072,
|
|
14915
|
+
maxTokens: 131072,
|
|
14916
|
+
},
|
|
14402
14917
|
"mistral/mistral-small": {
|
|
14403
14918
|
id: "mistral/mistral-small",
|
|
14404
14919
|
name: "Mistral Small",
|
|
@@ -14552,6 +15067,40 @@ export const MODELS = {
|
|
|
14552
15067
|
contextWindow: 262000,
|
|
14553
15068
|
maxTokens: 262000,
|
|
14554
15069
|
},
|
|
15070
|
+
"nvidia/nemotron-3-super-120b-a12b": {
|
|
15071
|
+
id: "nvidia/nemotron-3-super-120b-a12b",
|
|
15072
|
+
name: "NVIDIA Nemotron 3 Super 120B A12B",
|
|
15073
|
+
api: "anthropic-messages",
|
|
15074
|
+
provider: "vercel-ai-gateway",
|
|
15075
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15076
|
+
reasoning: true,
|
|
15077
|
+
input: ["text"],
|
|
15078
|
+
cost: {
|
|
15079
|
+
input: 0.15,
|
|
15080
|
+
output: 0.65,
|
|
15081
|
+
cacheRead: 0,
|
|
15082
|
+
cacheWrite: 0,
|
|
15083
|
+
},
|
|
15084
|
+
contextWindow: 256000,
|
|
15085
|
+
maxTokens: 32000,
|
|
15086
|
+
},
|
|
15087
|
+
"nvidia/nemotron-3-ultra-550b-a55b": {
|
|
15088
|
+
id: "nvidia/nemotron-3-ultra-550b-a55b",
|
|
15089
|
+
name: "Nemotron 3 Ultra",
|
|
15090
|
+
api: "anthropic-messages",
|
|
15091
|
+
provider: "vercel-ai-gateway",
|
|
15092
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15093
|
+
reasoning: true,
|
|
15094
|
+
input: ["text"],
|
|
15095
|
+
cost: {
|
|
15096
|
+
input: 0.6,
|
|
15097
|
+
output: 2.4,
|
|
15098
|
+
cacheRead: 0.12,
|
|
15099
|
+
cacheWrite: 0,
|
|
15100
|
+
},
|
|
15101
|
+
contextWindow: 1000000,
|
|
15102
|
+
maxTokens: 65000,
|
|
15103
|
+
},
|
|
14555
15104
|
"nvidia/nemotron-nano-12b-v2-vl": {
|
|
14556
15105
|
id: "nvidia/nemotron-nano-12b-v2-vl",
|
|
14557
15106
|
name: "Nvidia Nemotron Nano 12B V2 VL",
|
|
@@ -14729,7 +15278,7 @@ export const MODELS = {
|
|
|
14729
15278
|
provider: "vercel-ai-gateway",
|
|
14730
15279
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
14731
15280
|
reasoning: true,
|
|
14732
|
-
input: ["text"],
|
|
15281
|
+
input: ["text", "image"],
|
|
14733
15282
|
cost: {
|
|
14734
15283
|
input: 1.25,
|
|
14735
15284
|
output: 10,
|
|
@@ -15091,6 +15640,23 @@ export const MODELS = {
|
|
|
15091
15640
|
contextWindow: 1000000,
|
|
15092
15641
|
maxTokens: 128000,
|
|
15093
15642
|
},
|
|
15643
|
+
"openai/gpt-oss-120b": {
|
|
15644
|
+
id: "openai/gpt-oss-120b",
|
|
15645
|
+
name: "GPT OSS 120B",
|
|
15646
|
+
api: "anthropic-messages",
|
|
15647
|
+
provider: "vercel-ai-gateway",
|
|
15648
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15649
|
+
reasoning: true,
|
|
15650
|
+
input: ["text"],
|
|
15651
|
+
cost: {
|
|
15652
|
+
input: 0.35,
|
|
15653
|
+
output: 0.75,
|
|
15654
|
+
cacheRead: 0.25,
|
|
15655
|
+
cacheWrite: 0,
|
|
15656
|
+
},
|
|
15657
|
+
contextWindow: 131072,
|
|
15658
|
+
maxTokens: 131000,
|
|
15659
|
+
},
|
|
15094
15660
|
"openai/gpt-oss-20b": {
|
|
15095
15661
|
id: "openai/gpt-oss-20b",
|
|
15096
15662
|
name: "GPT OSS 20B",
|
|
@@ -15261,6 +15827,40 @@ export const MODELS = {
|
|
|
15261
15827
|
contextWindow: 200000,
|
|
15262
15828
|
maxTokens: 8000,
|
|
15263
15829
|
},
|
|
15830
|
+
"stepfun/step-3.5-flash": {
|
|
15831
|
+
id: "stepfun/step-3.5-flash",
|
|
15832
|
+
name: "StepFun 3.5 Flash",
|
|
15833
|
+
api: "anthropic-messages",
|
|
15834
|
+
provider: "vercel-ai-gateway",
|
|
15835
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15836
|
+
reasoning: true,
|
|
15837
|
+
input: ["text"],
|
|
15838
|
+
cost: {
|
|
15839
|
+
input: 0.09,
|
|
15840
|
+
output: 0.3,
|
|
15841
|
+
cacheRead: 0,
|
|
15842
|
+
cacheWrite: 0.02,
|
|
15843
|
+
},
|
|
15844
|
+
contextWindow: 262114,
|
|
15845
|
+
maxTokens: 262114,
|
|
15846
|
+
},
|
|
15847
|
+
"stepfun/step-3.7-flash": {
|
|
15848
|
+
id: "stepfun/step-3.7-flash",
|
|
15849
|
+
name: "Step 3.7 Flash",
|
|
15850
|
+
api: "anthropic-messages",
|
|
15851
|
+
provider: "vercel-ai-gateway",
|
|
15852
|
+
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15853
|
+
reasoning: true,
|
|
15854
|
+
input: ["text", "image"],
|
|
15855
|
+
cost: {
|
|
15856
|
+
input: 0.19999999999999998,
|
|
15857
|
+
output: 1.15,
|
|
15858
|
+
cacheRead: 0.04,
|
|
15859
|
+
cacheWrite: 0,
|
|
15860
|
+
},
|
|
15861
|
+
contextWindow: 256000,
|
|
15862
|
+
maxTokens: 256000,
|
|
15863
|
+
},
|
|
15264
15864
|
"xai/grok-4.1-fast-non-reasoning": {
|
|
15265
15865
|
id: "xai/grok-4.1-fast-non-reasoning",
|
|
15266
15866
|
name: "Grok 4.1 Fast Non-Reasoning",
|
|
@@ -15539,7 +16139,7 @@ export const MODELS = {
|
|
|
15539
16139
|
api: "anthropic-messages",
|
|
15540
16140
|
provider: "vercel-ai-gateway",
|
|
15541
16141
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15542
|
-
reasoning:
|
|
16142
|
+
reasoning: true,
|
|
15543
16143
|
input: ["text", "image"],
|
|
15544
16144
|
cost: {
|
|
15545
16145
|
input: 0.6,
|
|
@@ -15693,7 +16293,7 @@ export const MODELS = {
|
|
|
15693
16293
|
provider: "vercel-ai-gateway",
|
|
15694
16294
|
baseUrl: "https://ai-gateway.vercel.sh",
|
|
15695
16295
|
reasoning: true,
|
|
15696
|
-
input: ["text"],
|
|
16296
|
+
input: ["text", "image"],
|
|
15697
16297
|
cost: {
|
|
15698
16298
|
input: 1.4,
|
|
15699
16299
|
output: 4.4,
|
|
@@ -16248,5 +16848,97 @@ export const MODELS = {
|
|
|
16248
16848
|
maxTokens: 131072,
|
|
16249
16849
|
},
|
|
16250
16850
|
},
|
|
16851
|
+
"zai-coding-cn": {
|
|
16852
|
+
"glm-4.5-air": {
|
|
16853
|
+
id: "glm-4.5-air",
|
|
16854
|
+
name: "GLM-4.5-Air",
|
|
16855
|
+
api: "openai-completions",
|
|
16856
|
+
provider: "zai-coding-cn",
|
|
16857
|
+
baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
|
|
16858
|
+
compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
|
|
16859
|
+
reasoning: true,
|
|
16860
|
+
input: ["text"],
|
|
16861
|
+
cost: {
|
|
16862
|
+
input: 0,
|
|
16863
|
+
output: 0,
|
|
16864
|
+
cacheRead: 0,
|
|
16865
|
+
cacheWrite: 0,
|
|
16866
|
+
},
|
|
16867
|
+
contextWindow: 131072,
|
|
16868
|
+
maxTokens: 98304,
|
|
16869
|
+
},
|
|
16870
|
+
"glm-4.7": {
|
|
16871
|
+
id: "glm-4.7",
|
|
16872
|
+
name: "GLM-4.7",
|
|
16873
|
+
api: "openai-completions",
|
|
16874
|
+
provider: "zai-coding-cn",
|
|
16875
|
+
baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
|
|
16876
|
+
compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
|
|
16877
|
+
reasoning: true,
|
|
16878
|
+
input: ["text"],
|
|
16879
|
+
cost: {
|
|
16880
|
+
input: 0,
|
|
16881
|
+
output: 0,
|
|
16882
|
+
cacheRead: 0,
|
|
16883
|
+
cacheWrite: 0,
|
|
16884
|
+
},
|
|
16885
|
+
contextWindow: 204800,
|
|
16886
|
+
maxTokens: 131072,
|
|
16887
|
+
},
|
|
16888
|
+
"glm-5-turbo": {
|
|
16889
|
+
id: "glm-5-turbo",
|
|
16890
|
+
name: "GLM-5-Turbo",
|
|
16891
|
+
api: "openai-completions",
|
|
16892
|
+
provider: "zai-coding-cn",
|
|
16893
|
+
baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
|
|
16894
|
+
compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
|
|
16895
|
+
reasoning: true,
|
|
16896
|
+
input: ["text"],
|
|
16897
|
+
cost: {
|
|
16898
|
+
input: 0,
|
|
16899
|
+
output: 0,
|
|
16900
|
+
cacheRead: 0,
|
|
16901
|
+
cacheWrite: 0,
|
|
16902
|
+
},
|
|
16903
|
+
contextWindow: 200000,
|
|
16904
|
+
maxTokens: 131072,
|
|
16905
|
+
},
|
|
16906
|
+
"glm-5.1": {
|
|
16907
|
+
id: "glm-5.1",
|
|
16908
|
+
name: "GLM-5.1",
|
|
16909
|
+
api: "openai-completions",
|
|
16910
|
+
provider: "zai-coding-cn",
|
|
16911
|
+
baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
|
|
16912
|
+
compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
|
|
16913
|
+
reasoning: true,
|
|
16914
|
+
input: ["text"],
|
|
16915
|
+
cost: {
|
|
16916
|
+
input: 0,
|
|
16917
|
+
output: 0,
|
|
16918
|
+
cacheRead: 0,
|
|
16919
|
+
cacheWrite: 0,
|
|
16920
|
+
},
|
|
16921
|
+
contextWindow: 200000,
|
|
16922
|
+
maxTokens: 131072,
|
|
16923
|
+
},
|
|
16924
|
+
"glm-5v-turbo": {
|
|
16925
|
+
id: "glm-5v-turbo",
|
|
16926
|
+
name: "GLM-5V-Turbo",
|
|
16927
|
+
api: "openai-completions",
|
|
16928
|
+
provider: "zai-coding-cn",
|
|
16929
|
+
baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
|
|
16930
|
+
compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
|
|
16931
|
+
reasoning: true,
|
|
16932
|
+
input: ["text", "image"],
|
|
16933
|
+
cost: {
|
|
16934
|
+
input: 0,
|
|
16935
|
+
output: 0,
|
|
16936
|
+
cacheRead: 0,
|
|
16937
|
+
cacheWrite: 0,
|
|
16938
|
+
},
|
|
16939
|
+
contextWindow: 200000,
|
|
16940
|
+
maxTokens: 131072,
|
|
16941
|
+
},
|
|
16942
|
+
},
|
|
16251
16943
|
};
|
|
16252
16944
|
//# sourceMappingURL=models.generated.js.map
|