@earendil-works/pi-ai 0.78.0 → 0.78.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -391,8 +391,8 @@ export const MODELS = {
391
391
  thinkingLevelMap: { "xhigh": "max" },
392
392
  input: ["text", "image"],
393
393
  cost: {
394
- input: 5,
395
- output: 25,
394
+ input: 5.5,
395
+ output: 27.5,
396
396
  cacheRead: 0.5,
397
397
  cacheWrite: 6.25,
398
398
  },
@@ -409,10 +409,10 @@ export const MODELS = {
409
409
  thinkingLevelMap: { "xhigh": "xhigh" },
410
410
  input: ["text", "image"],
411
411
  cost: {
412
- input: 5,
413
- output: 25,
414
- cacheRead: 0.5,
415
- cacheWrite: 6.25,
412
+ input: 5.5,
413
+ output: 27.5,
414
+ cacheRead: 0.55,
415
+ cacheWrite: 6.875,
416
416
  },
417
417
  contextWindow: 1000000,
418
418
  maxTokens: 128000,
@@ -427,10 +427,10 @@ export const MODELS = {
427
427
  thinkingLevelMap: { "xhigh": "xhigh" },
428
428
  input: ["text", "image"],
429
429
  cost: {
430
- input: 5,
431
- output: 25,
432
- cacheRead: 0.5,
433
- cacheWrite: 6.25,
430
+ input: 5.5,
431
+ output: 27.5,
432
+ cacheRead: 0.55,
433
+ cacheWrite: 6.875,
434
434
  },
435
435
  contextWindow: 1000000,
436
436
  maxTokens: 128000,
@@ -444,10 +444,10 @@ export const MODELS = {
444
444
  reasoning: true,
445
445
  input: ["text", "image"],
446
446
  cost: {
447
- input: 3,
448
- output: 15,
449
- cacheRead: 0.3,
450
- cacheWrite: 3.75,
447
+ input: 3.3,
448
+ output: 16.5,
449
+ cacheRead: 0.33,
450
+ cacheWrite: 4.125,
451
451
  },
452
452
  contextWindow: 200000,
453
453
  maxTokens: 64000,
@@ -461,10 +461,10 @@ export const MODELS = {
461
461
  reasoning: true,
462
462
  input: ["text", "image"],
463
463
  cost: {
464
- input: 3,
465
- output: 15,
466
- cacheRead: 0.3,
467
- cacheWrite: 3.75,
464
+ input: 3.3,
465
+ output: 16.5,
466
+ cacheRead: 0.33,
467
+ cacheWrite: 4.125,
468
468
  },
469
469
  contextWindow: 1000000,
470
470
  maxTokens: 64000,
@@ -1549,6 +1549,63 @@ export const MODELS = {
1549
1549
  maxTokens: 101376,
1550
1550
  },
1551
1551
  },
1552
+ "ant-ling": {
1553
+ "Ling-2.6-1T": {
1554
+ id: "Ling-2.6-1T",
1555
+ name: "Ling 2.6 1T",
1556
+ api: "openai-completions",
1557
+ provider: "ant-ling",
1558
+ baseUrl: "https://api.ant-ling.com/v1",
1559
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
1560
+ reasoning: false,
1561
+ input: ["text"],
1562
+ cost: {
1563
+ input: 0.06,
1564
+ output: 0.25,
1565
+ cacheRead: 0,
1566
+ cacheWrite: 0,
1567
+ },
1568
+ contextWindow: 262144,
1569
+ maxTokens: 65536,
1570
+ },
1571
+ "Ling-2.6-flash": {
1572
+ id: "Ling-2.6-flash",
1573
+ name: "Ling 2.6 Flash",
1574
+ api: "openai-completions",
1575
+ provider: "ant-ling",
1576
+ baseUrl: "https://api.ant-ling.com/v1",
1577
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false },
1578
+ reasoning: false,
1579
+ input: ["text"],
1580
+ cost: {
1581
+ input: 0.01,
1582
+ output: 0.02,
1583
+ cacheRead: 0,
1584
+ cacheWrite: 0,
1585
+ },
1586
+ contextWindow: 262144,
1587
+ maxTokens: 65536,
1588
+ },
1589
+ "Ring-2.6-1T": {
1590
+ id: "Ring-2.6-1T",
1591
+ name: "Ring 2.6 1T",
1592
+ api: "openai-completions",
1593
+ provider: "ant-ling",
1594
+ baseUrl: "https://api.ant-ling.com/v1",
1595
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsLongCacheRetention": false, "thinkingFormat": "ant-ling" },
1596
+ reasoning: true,
1597
+ thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
1598
+ input: ["text"],
1599
+ cost: {
1600
+ input: 0.06,
1601
+ output: 0.25,
1602
+ cacheRead: 0,
1603
+ cacheWrite: 0,
1604
+ },
1605
+ contextWindow: 262144,
1606
+ maxTokens: 65536,
1607
+ },
1608
+ },
1552
1609
  "anthropic": {
1553
1610
  "claude-3-5-haiku-20241022": {
1554
1611
  id: "claude-3-5-haiku-20241022",
@@ -1847,7 +1904,7 @@ export const MODELS = {
1847
1904
  api: "anthropic-messages",
1848
1905
  provider: "anthropic",
1849
1906
  baseUrl: "https://api.anthropic.com",
1850
- compat: { "forceAdaptiveThinking": true },
1907
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1851
1908
  reasoning: true,
1852
1909
  thinkingLevelMap: { "xhigh": "xhigh" },
1853
1910
  input: ["text", "image"],
@@ -1866,7 +1923,7 @@ export const MODELS = {
1866
1923
  api: "anthropic-messages",
1867
1924
  provider: "anthropic",
1868
1925
  baseUrl: "https://api.anthropic.com",
1869
- compat: { "forceAdaptiveThinking": true },
1926
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
1870
1927
  reasoning: true,
1871
1928
  thinkingLevelMap: { "xhigh": "xhigh" },
1872
1929
  input: ["text", "image"],
@@ -2955,7 +3012,26 @@ export const MODELS = {
2955
3012
  api: "anthropic-messages",
2956
3013
  provider: "cloudflare-ai-gateway",
2957
3014
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
2958
- compat: { "forceAdaptiveThinking": true },
3015
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3016
+ reasoning: true,
3017
+ thinkingLevelMap: { "xhigh": "xhigh" },
3018
+ input: ["text", "image"],
3019
+ cost: {
3020
+ input: 5,
3021
+ output: 25,
3022
+ cacheRead: 0.5,
3023
+ cacheWrite: 6.25,
3024
+ },
3025
+ contextWindow: 1000000,
3026
+ maxTokens: 128000,
3027
+ },
3028
+ "claude-opus-4-8": {
3029
+ id: "claude-opus-4-8",
3030
+ name: "Claude Opus 4.8",
3031
+ api: "anthropic-messages",
3032
+ provider: "cloudflare-ai-gateway",
3033
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3034
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
2959
3035
  reasoning: true,
2960
3036
  thinkingLevelMap: { "xhigh": "xhigh" },
2961
3037
  input: ["text", "image"],
@@ -3463,24 +3539,6 @@ export const MODELS = {
3463
3539
  contextWindow: 128000,
3464
3540
  maxTokens: 128000,
3465
3541
  },
3466
- "@cf/moonshotai/kimi-k2.5": {
3467
- id: "@cf/moonshotai/kimi-k2.5",
3468
- name: "Kimi K2.5",
3469
- api: "openai-completions",
3470
- provider: "cloudflare-workers-ai",
3471
- baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3472
- compat: { "sendSessionAffinityHeaders": true },
3473
- reasoning: true,
3474
- input: ["text", "image"],
3475
- cost: {
3476
- input: 0.6,
3477
- output: 3,
3478
- cacheRead: 0.1,
3479
- cacheWrite: 0,
3480
- },
3481
- contextWindow: 256000,
3482
- maxTokens: 256000,
3483
- },
3484
3542
  "@cf/moonshotai/kimi-k2.6": {
3485
3543
  id: "@cf/moonshotai/kimi-k2.6",
3486
3544
  name: "Kimi K2.6",
@@ -3808,8 +3866,8 @@ export const MODELS = {
3808
3866
  cacheRead: 0.1,
3809
3867
  cacheWrite: 0,
3810
3868
  },
3811
- contextWindow: 128000,
3812
- maxTokens: 8192,
3869
+ contextWindow: 262144,
3870
+ maxTokens: 65536,
3813
3871
  },
3814
3872
  "accounts/fireworks/routers/glm-5p1-fast": {
3815
3873
  id: "accounts/fireworks/routers/glm-5p1-fast",
@@ -3851,7 +3909,7 @@ export const MODELS = {
3851
3909
  "github-copilot": {
3852
3910
  "claude-haiku-4.5": {
3853
3911
  id: "claude-haiku-4.5",
3854
- name: "Claude Haiku 4.5",
3912
+ name: "Claude Haiku 4.5 (latest)",
3855
3913
  api: "anthropic-messages",
3856
3914
  provider: "github-copilot",
3857
3915
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3860,17 +3918,17 @@ export const MODELS = {
3860
3918
  reasoning: true,
3861
3919
  input: ["text", "image"],
3862
3920
  cost: {
3863
- input: 0,
3864
- output: 0,
3865
- cacheRead: 0,
3866
- cacheWrite: 0,
3921
+ input: 1,
3922
+ output: 5,
3923
+ cacheRead: 0.1,
3924
+ cacheWrite: 1.25,
3867
3925
  },
3868
3926
  contextWindow: 200000,
3869
3927
  maxTokens: 64000,
3870
3928
  },
3871
3929
  "claude-opus-4.5": {
3872
3930
  id: "claude-opus-4.5",
3873
- name: "Claude Opus 4.5",
3931
+ name: "Claude Opus 4.5 (latest)",
3874
3932
  api: "anthropic-messages",
3875
3933
  provider: "github-copilot",
3876
3934
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3878,10 +3936,10 @@ export const MODELS = {
3878
3936
  reasoning: true,
3879
3937
  input: ["text", "image"],
3880
3938
  cost: {
3881
- input: 0,
3882
- output: 0,
3883
- cacheRead: 0,
3884
- cacheWrite: 0,
3939
+ input: 5,
3940
+ output: 25,
3941
+ cacheRead: 0.5,
3942
+ cacheWrite: 6.25,
3885
3943
  },
3886
3944
  contextWindow: 200000,
3887
3945
  maxTokens: 32000,
@@ -3898,10 +3956,10 @@ export const MODELS = {
3898
3956
  thinkingLevelMap: { "xhigh": "max" },
3899
3957
  input: ["text", "image"],
3900
3958
  cost: {
3901
- input: 0,
3902
- output: 0,
3903
- cacheRead: 0,
3904
- cacheWrite: 0,
3959
+ input: 5,
3960
+ output: 25,
3961
+ cacheRead: 0.5,
3962
+ cacheWrite: 6.25,
3905
3963
  },
3906
3964
  contextWindow: 1000000,
3907
3965
  maxTokens: 32000,
@@ -3913,15 +3971,15 @@ export const MODELS = {
3913
3971
  provider: "github-copilot",
3914
3972
  baseUrl: "https://api.individual.githubcopilot.com",
3915
3973
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3916
- compat: { "forceAdaptiveThinking": true },
3974
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3917
3975
  reasoning: true,
3918
3976
  thinkingLevelMap: { "xhigh": "xhigh" },
3919
3977
  input: ["text", "image"],
3920
3978
  cost: {
3921
- input: 0,
3922
- output: 0,
3923
- cacheRead: 0,
3924
- cacheWrite: 0,
3979
+ input: 5,
3980
+ output: 25,
3981
+ cacheRead: 0.5,
3982
+ cacheWrite: 6.25,
3925
3983
  },
3926
3984
  contextWindow: 200000,
3927
3985
  maxTokens: 32000,
@@ -3933,22 +3991,41 @@ export const MODELS = {
3933
3991
  provider: "github-copilot",
3934
3992
  baseUrl: "https://api.individual.githubcopilot.com",
3935
3993
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3936
- compat: { "forceAdaptiveThinking": true },
3994
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
3937
3995
  reasoning: true,
3938
3996
  thinkingLevelMap: { "xhigh": "xhigh" },
3939
3997
  input: ["text", "image"],
3940
3998
  cost: {
3941
- input: 0,
3942
- output: 0,
3943
- cacheRead: 0,
3944
- cacheWrite: 0,
3999
+ input: 5,
4000
+ output: 25,
4001
+ cacheRead: 0.5,
4002
+ cacheWrite: 6.25,
3945
4003
  },
3946
4004
  contextWindow: 200000,
3947
4005
  maxTokens: 64000,
3948
4006
  },
4007
+ "claude-sonnet-4": {
4008
+ id: "claude-sonnet-4",
4009
+ name: "Claude Sonnet 4 (latest)",
4010
+ api: "anthropic-messages",
4011
+ provider: "github-copilot",
4012
+ baseUrl: "https://api.individual.githubcopilot.com",
4013
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4014
+ compat: { "supportsEagerToolInputStreaming": false },
4015
+ reasoning: true,
4016
+ input: ["text", "image"],
4017
+ cost: {
4018
+ input: 3,
4019
+ output: 15,
4020
+ cacheRead: 0.3,
4021
+ cacheWrite: 3.75,
4022
+ },
4023
+ contextWindow: 216000,
4024
+ maxTokens: 16000,
4025
+ },
3949
4026
  "claude-sonnet-4.5": {
3950
4027
  id: "claude-sonnet-4.5",
3951
- name: "Claude Sonnet 4.5",
4028
+ name: "Claude Sonnet 4.5 (latest)",
3952
4029
  api: "anthropic-messages",
3953
4030
  provider: "github-copilot",
3954
4031
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -3957,10 +4034,10 @@ export const MODELS = {
3957
4034
  reasoning: true,
3958
4035
  input: ["text", "image"],
3959
4036
  cost: {
3960
- input: 0,
3961
- output: 0,
3962
- cacheRead: 0,
3963
- cacheWrite: 0,
4037
+ input: 3,
4038
+ output: 15,
4039
+ cacheRead: 0.3,
4040
+ cacheWrite: 3.75,
3964
4041
  },
3965
4042
  contextWindow: 200000,
3966
4043
  maxTokens: 32000,
@@ -3976,10 +4053,10 @@ export const MODELS = {
3976
4053
  reasoning: true,
3977
4054
  input: ["text", "image"],
3978
4055
  cost: {
3979
- input: 0,
3980
- output: 0,
3981
- cacheRead: 0,
3982
- cacheWrite: 0,
4056
+ input: 3,
4057
+ output: 15,
4058
+ cacheRead: 0.3,
4059
+ cacheWrite: 3.75,
3983
4060
  },
3984
4061
  contextWindow: 1000000,
3985
4062
  maxTokens: 32000,
@@ -3992,12 +4069,12 @@ export const MODELS = {
3992
4069
  baseUrl: "https://api.individual.githubcopilot.com",
3993
4070
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3994
4071
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
3995
- reasoning: false,
4072
+ reasoning: true,
3996
4073
  input: ["text", "image"],
3997
4074
  cost: {
3998
- input: 0,
3999
- output: 0,
4000
- cacheRead: 0,
4075
+ input: 1.25,
4076
+ output: 10,
4077
+ cacheRead: 0.125,
4001
4078
  cacheWrite: 0,
4002
4079
  },
4003
4080
  contextWindow: 128000,
@@ -4005,7 +4082,7 @@ export const MODELS = {
4005
4082
  },
4006
4083
  "gemini-3-flash-preview": {
4007
4084
  id: "gemini-3-flash-preview",
4008
- name: "Gemini 3 Flash",
4085
+ name: "Gemini 3 Flash Preview",
4009
4086
  api: "openai-completions",
4010
4087
  provider: "github-copilot",
4011
4088
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4014,9 +4091,9 @@ export const MODELS = {
4014
4091
  reasoning: true,
4015
4092
  input: ["text", "image"],
4016
4093
  cost: {
4017
- input: 0,
4018
- output: 0,
4019
- cacheRead: 0,
4094
+ input: 0.5,
4095
+ output: 3,
4096
+ cacheRead: 0.05,
4020
4097
  cacheWrite: 0,
4021
4098
  },
4022
4099
  contextWindow: 128000,
@@ -4033,9 +4110,9 @@ export const MODELS = {
4033
4110
  reasoning: true,
4034
4111
  input: ["text", "image"],
4035
4112
  cost: {
4036
- input: 0,
4037
- output: 0,
4038
- cacheRead: 0,
4113
+ input: 2,
4114
+ output: 12,
4115
+ cacheRead: 0.2,
4039
4116
  cacheWrite: 0,
4040
4117
  },
4041
4118
  contextWindow: 200000,
@@ -4052,9 +4129,9 @@ export const MODELS = {
4052
4129
  reasoning: true,
4053
4130
  input: ["text", "image"],
4054
4131
  cost: {
4055
- input: 0,
4056
- output: 0,
4057
- cacheRead: 0,
4132
+ input: 1.5,
4133
+ output: 9,
4134
+ cacheRead: 0.15,
4058
4135
  cacheWrite: 0,
4059
4136
  },
4060
4137
  contextWindow: 200000,
@@ -4071,36 +4148,17 @@ export const MODELS = {
4071
4148
  reasoning: false,
4072
4149
  input: ["text", "image"],
4073
4150
  cost: {
4074
- input: 0,
4075
- output: 0,
4076
- cacheRead: 0,
4151
+ input: 2,
4152
+ output: 8,
4153
+ cacheRead: 0.5,
4077
4154
  cacheWrite: 0,
4078
4155
  },
4079
4156
  contextWindow: 128000,
4080
4157
  maxTokens: 16384,
4081
4158
  },
4082
- "gpt-4o": {
4083
- id: "gpt-4o",
4084
- name: "GPT-4o",
4085
- api: "openai-completions",
4086
- provider: "github-copilot",
4087
- baseUrl: "https://api.individual.githubcopilot.com",
4088
- headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4089
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4090
- reasoning: false,
4091
- input: ["text", "image"],
4092
- cost: {
4093
- input: 0,
4094
- output: 0,
4095
- cacheRead: 0,
4096
- cacheWrite: 0,
4097
- },
4098
- contextWindow: 128000,
4099
- maxTokens: 4096,
4100
- },
4101
4159
  "gpt-5-mini": {
4102
4160
  id: "gpt-5-mini",
4103
- name: "GPT-5-mini",
4161
+ name: "GPT-5 Mini",
4104
4162
  api: "openai-responses",
4105
4163
  provider: "github-copilot",
4106
4164
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4109,9 +4167,9 @@ export const MODELS = {
4109
4167
  thinkingLevelMap: { "off": null, "minimal": "low" },
4110
4168
  input: ["text", "image"],
4111
4169
  cost: {
4112
- input: 0,
4113
- output: 0,
4114
- cacheRead: 0,
4170
+ input: 0.25,
4171
+ output: 2,
4172
+ cacheRead: 0.025,
4115
4173
  cacheWrite: 0,
4116
4174
  },
4117
4175
  contextWindow: 264000,
@@ -4128,9 +4186,9 @@ export const MODELS = {
4128
4186
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4129
4187
  input: ["text", "image"],
4130
4188
  cost: {
4131
- input: 0,
4132
- output: 0,
4133
- cacheRead: 0,
4189
+ input: 1.75,
4190
+ output: 14,
4191
+ cacheRead: 0.175,
4134
4192
  cacheWrite: 0,
4135
4193
  },
4136
4194
  contextWindow: 400000,
@@ -4138,7 +4196,7 @@ export const MODELS = {
4138
4196
  },
4139
4197
  "gpt-5.2-codex": {
4140
4198
  id: "gpt-5.2-codex",
4141
- name: "GPT-5.2-Codex",
4199
+ name: "GPT-5.2 Codex",
4142
4200
  api: "openai-responses",
4143
4201
  provider: "github-copilot",
4144
4202
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4147,9 +4205,9 @@ export const MODELS = {
4147
4205
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4148
4206
  input: ["text", "image"],
4149
4207
  cost: {
4150
- input: 0,
4151
- output: 0,
4152
- cacheRead: 0,
4208
+ input: 1.75,
4209
+ output: 14,
4210
+ cacheRead: 0.175,
4153
4211
  cacheWrite: 0,
4154
4212
  },
4155
4213
  contextWindow: 400000,
@@ -4157,7 +4215,7 @@ export const MODELS = {
4157
4215
  },
4158
4216
  "gpt-5.3-codex": {
4159
4217
  id: "gpt-5.3-codex",
4160
- name: "GPT-5.3-Codex",
4218
+ name: "GPT-5.3 Codex",
4161
4219
  api: "openai-responses",
4162
4220
  provider: "github-copilot",
4163
4221
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4166,9 +4224,9 @@ export const MODELS = {
4166
4224
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4167
4225
  input: ["text", "image"],
4168
4226
  cost: {
4169
- input: 0,
4170
- output: 0,
4171
- cacheRead: 0,
4227
+ input: 1.75,
4228
+ output: 14,
4229
+ cacheRead: 0.175,
4172
4230
  cacheWrite: 0,
4173
4231
  },
4174
4232
  contextWindow: 400000,
@@ -4185,9 +4243,9 @@ export const MODELS = {
4185
4243
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4186
4244
  input: ["text", "image"],
4187
4245
  cost: {
4188
- input: 0,
4189
- output: 0,
4190
- cacheRead: 0,
4246
+ input: 2.5,
4247
+ output: 15,
4248
+ cacheRead: 0.25,
4191
4249
  cacheWrite: 0,
4192
4250
  },
4193
4251
  contextWindow: 400000,
@@ -4195,7 +4253,7 @@ export const MODELS = {
4195
4253
  },
4196
4254
  "gpt-5.4-mini": {
4197
4255
  id: "gpt-5.4-mini",
4198
- name: "GPT-5.4 Mini",
4256
+ name: "GPT-5.4 mini",
4199
4257
  api: "openai-responses",
4200
4258
  provider: "github-copilot",
4201
4259
  baseUrl: "https://api.individual.githubcopilot.com",
@@ -4204,9 +4262,28 @@ export const MODELS = {
4204
4262
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4205
4263
  input: ["text", "image"],
4206
4264
  cost: {
4207
- input: 0,
4208
- output: 0,
4209
- cacheRead: 0,
4265
+ input: 0.75,
4266
+ output: 4.5,
4267
+ cacheRead: 0.075,
4268
+ cacheWrite: 0,
4269
+ },
4270
+ contextWindow: 400000,
4271
+ maxTokens: 128000,
4272
+ },
4273
+ "gpt-5.4-nano": {
4274
+ id: "gpt-5.4-nano",
4275
+ name: "GPT-5.4 nano",
4276
+ api: "openai-responses",
4277
+ provider: "github-copilot",
4278
+ baseUrl: "https://api.individual.githubcopilot.com",
4279
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4280
+ reasoning: true,
4281
+ thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4282
+ input: ["text", "image"],
4283
+ cost: {
4284
+ input: 0.2,
4285
+ output: 1.25,
4286
+ cacheRead: 0.02,
4210
4287
  cacheWrite: 0,
4211
4288
  },
4212
4289
  contextWindow: 400000,
@@ -4223,32 +4300,32 @@ export const MODELS = {
4223
4300
  thinkingLevelMap: { "off": null, "minimal": "low", "xhigh": "xhigh" },
4224
4301
  input: ["text", "image"],
4225
4302
  cost: {
4226
- input: 0,
4227
- output: 0,
4228
- cacheRead: 0,
4303
+ input: 5,
4304
+ output: 30,
4305
+ cacheRead: 0.5,
4229
4306
  cacheWrite: 0,
4230
4307
  },
4231
4308
  contextWindow: 400000,
4232
4309
  maxTokens: 128000,
4233
4310
  },
4234
- "grok-code-fast-1": {
4235
- id: "grok-code-fast-1",
4236
- name: "Grok Code Fast 1",
4311
+ "raptor-mini": {
4312
+ id: "raptor-mini",
4313
+ name: "Raptor mini",
4237
4314
  api: "openai-completions",
4238
4315
  provider: "github-copilot",
4239
4316
  baseUrl: "https://api.individual.githubcopilot.com",
4240
4317
  headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4241
4318
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4242
4319
  reasoning: true,
4243
- input: ["text"],
4320
+ input: ["text", "image"],
4244
4321
  cost: {
4245
- input: 0,
4246
- output: 0,
4247
- cacheRead: 0,
4322
+ input: 0.25,
4323
+ output: 2,
4324
+ cacheRead: 0.025,
4248
4325
  cacheWrite: 0,
4249
4326
  },
4250
- contextWindow: 128000,
4251
- maxTokens: 64000,
4327
+ contextWindow: 400000,
4328
+ maxTokens: 128000,
4252
4329
  },
4253
4330
  },
4254
4331
  "google": {
@@ -5541,6 +5618,23 @@ export const MODELS = {
5541
5618
  contextWindow: 204800,
5542
5619
  maxTokens: 131072,
5543
5620
  },
5621
+ "MiniMax-M3": {
5622
+ id: "MiniMax-M3",
5623
+ name: "MiniMax-M3",
5624
+ api: "anthropic-messages",
5625
+ provider: "minimax",
5626
+ baseUrl: "https://api.minimax.io/anthropic",
5627
+ reasoning: true,
5628
+ input: ["text", "image"],
5629
+ cost: {
5630
+ input: 0.6,
5631
+ output: 2.4,
5632
+ cacheRead: 0.12,
5633
+ cacheWrite: 0,
5634
+ },
5635
+ contextWindow: 512000,
5636
+ maxTokens: 128000,
5637
+ },
5544
5638
  },
5545
5639
  "minimax-cn": {
5546
5640
  "MiniMax-M2.7": {
@@ -5577,6 +5671,23 @@ export const MODELS = {
5577
5671
  contextWindow: 204800,
5578
5672
  maxTokens: 131072,
5579
5673
  },
5674
+ "MiniMax-M3": {
5675
+ id: "MiniMax-M3",
5676
+ name: "MiniMax-M3",
5677
+ api: "anthropic-messages",
5678
+ provider: "minimax-cn",
5679
+ baseUrl: "https://api.minimaxi.com/anthropic",
5680
+ reasoning: true,
5681
+ input: ["text", "image"],
5682
+ cost: {
5683
+ input: 0.6,
5684
+ output: 2.4,
5685
+ cacheRead: 0.12,
5686
+ cacheWrite: 0,
5687
+ },
5688
+ contextWindow: 512000,
5689
+ maxTokens: 128000,
5690
+ },
5580
5691
  },
5581
5692
  "mistral": {
5582
5693
  "codestral-latest": {
@@ -5613,6 +5724,23 @@ export const MODELS = {
5613
5724
  contextWindow: 262144,
5614
5725
  maxTokens: 262144,
5615
5726
  },
5727
+ "devstral-latest": {
5728
+ id: "devstral-latest",
5729
+ name: "Devstral 2",
5730
+ api: "mistral-conversations",
5731
+ provider: "mistral",
5732
+ baseUrl: "https://api.mistral.ai",
5733
+ reasoning: false,
5734
+ input: ["text"],
5735
+ cost: {
5736
+ input: 0.4,
5737
+ output: 2,
5738
+ cacheRead: 0,
5739
+ cacheWrite: 0,
5740
+ },
5741
+ contextWindow: 262144,
5742
+ maxTokens: 262144,
5743
+ },
5616
5744
  "devstral-medium-2507": {
5617
5745
  id: "devstral-medium-2507",
5618
5746
  name: "Devstral Medium",
@@ -5987,6 +6115,23 @@ export const MODELS = {
5987
6115
  contextWindow: 8000,
5988
6116
  maxTokens: 8000,
5989
6117
  },
6118
+ "open-mistral-nemo": {
6119
+ id: "open-mistral-nemo",
6120
+ name: "Open Mistral Nemo",
6121
+ api: "mistral-conversations",
6122
+ provider: "mistral",
6123
+ baseUrl: "https://api.mistral.ai",
6124
+ reasoning: false,
6125
+ input: ["text"],
6126
+ cost: {
6127
+ input: 0.15,
6128
+ output: 0.15,
6129
+ cacheRead: 0,
6130
+ cacheWrite: 0,
6131
+ },
6132
+ contextWindow: 128000,
6133
+ maxTokens: 128000,
6134
+ },
5990
6135
  "open-mixtral-8x22b": {
5991
6136
  id: "open-mixtral-8x22b",
5992
6137
  name: "Mixtral 8x22B",
@@ -6231,85 +6376,467 @@ export const MODELS = {
6231
6376
  reasoning: true,
6232
6377
  input: ["text"],
6233
6378
  cost: {
6234
- input: 0.6,
6235
- output: 2.5,
6236
- cacheRead: 0.15,
6379
+ input: 0.6,
6380
+ output: 2.5,
6381
+ cacheRead: 0.15,
6382
+ cacheWrite: 0,
6383
+ },
6384
+ contextWindow: 262144,
6385
+ maxTokens: 262144,
6386
+ },
6387
+ "kimi-k2-thinking-turbo": {
6388
+ id: "kimi-k2-thinking-turbo",
6389
+ name: "Kimi K2 Thinking Turbo",
6390
+ api: "openai-completions",
6391
+ provider: "moonshotai-cn",
6392
+ baseUrl: "https://api.moonshot.cn/v1",
6393
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6394
+ reasoning: true,
6395
+ input: ["text"],
6396
+ cost: {
6397
+ input: 1.15,
6398
+ output: 8,
6399
+ cacheRead: 0.15,
6400
+ cacheWrite: 0,
6401
+ },
6402
+ contextWindow: 262144,
6403
+ maxTokens: 262144,
6404
+ },
6405
+ "kimi-k2-turbo-preview": {
6406
+ id: "kimi-k2-turbo-preview",
6407
+ name: "Kimi K2 Turbo",
6408
+ api: "openai-completions",
6409
+ provider: "moonshotai-cn",
6410
+ baseUrl: "https://api.moonshot.cn/v1",
6411
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6412
+ reasoning: false,
6413
+ input: ["text"],
6414
+ cost: {
6415
+ input: 2.4,
6416
+ output: 10,
6417
+ cacheRead: 0.6,
6418
+ cacheWrite: 0,
6419
+ },
6420
+ contextWindow: 262144,
6421
+ maxTokens: 262144,
6422
+ },
6423
+ "kimi-k2.5": {
6424
+ id: "kimi-k2.5",
6425
+ name: "Kimi K2.5",
6426
+ api: "openai-completions",
6427
+ provider: "moonshotai-cn",
6428
+ baseUrl: "https://api.moonshot.cn/v1",
6429
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6430
+ reasoning: true,
6431
+ input: ["text", "image"],
6432
+ cost: {
6433
+ input: 0.6,
6434
+ output: 3,
6435
+ cacheRead: 0.1,
6436
+ cacheWrite: 0,
6437
+ },
6438
+ contextWindow: 262144,
6439
+ maxTokens: 262144,
6440
+ },
6441
+ "kimi-k2.6": {
6442
+ id: "kimi-k2.6",
6443
+ name: "Kimi K2.6",
6444
+ api: "openai-completions",
6445
+ provider: "moonshotai-cn",
6446
+ baseUrl: "https://api.moonshot.cn/v1",
6447
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6448
+ reasoning: true,
6449
+ input: ["text", "image"],
6450
+ cost: {
6451
+ input: 0.95,
6452
+ output: 4,
6453
+ cacheRead: 0.16,
6454
+ cacheWrite: 0,
6455
+ },
6456
+ contextWindow: 262144,
6457
+ maxTokens: 262144,
6458
+ },
6459
+ },
6460
+ "nvidia": {
6461
+ "meta/llama-3.1-70b-instruct": {
6462
+ id: "meta/llama-3.1-70b-instruct",
6463
+ name: "Llama 3.1 70b Instruct",
6464
+ api: "openai-completions",
6465
+ provider: "nvidia",
6466
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6467
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6468
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6469
+ reasoning: false,
6470
+ input: ["text"],
6471
+ cost: {
6472
+ input: 0,
6473
+ output: 0,
6474
+ cacheRead: 0,
6475
+ cacheWrite: 0,
6476
+ },
6477
+ contextWindow: 128000,
6478
+ maxTokens: 4096,
6479
+ },
6480
+ "meta/llama-3.1-8b-instruct": {
6481
+ id: "meta/llama-3.1-8b-instruct",
6482
+ name: "Llama 3.1 8B Instruct",
6483
+ api: "openai-completions",
6484
+ provider: "nvidia",
6485
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6486
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6487
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6488
+ reasoning: false,
6489
+ input: ["text"],
6490
+ cost: {
6491
+ input: 0,
6492
+ output: 0,
6493
+ cacheRead: 0,
6494
+ cacheWrite: 0,
6495
+ },
6496
+ contextWindow: 16000,
6497
+ maxTokens: 4096,
6498
+ },
6499
+ "meta/llama-3.2-11b-vision-instruct": {
6500
+ id: "meta/llama-3.2-11b-vision-instruct",
6501
+ name: "Llama 3.2 11b Vision Instruct",
6502
+ api: "openai-completions",
6503
+ provider: "nvidia",
6504
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6505
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6506
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6507
+ reasoning: false,
6508
+ input: ["text", "image"],
6509
+ cost: {
6510
+ input: 0,
6511
+ output: 0,
6512
+ cacheRead: 0,
6513
+ cacheWrite: 0,
6514
+ },
6515
+ contextWindow: 128000,
6516
+ maxTokens: 4096,
6517
+ },
6518
+ "meta/llama-3.2-90b-vision-instruct": {
6519
+ id: "meta/llama-3.2-90b-vision-instruct",
6520
+ name: "Llama-3.2-90B-Vision-Instruct",
6521
+ api: "openai-completions",
6522
+ provider: "nvidia",
6523
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6524
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6525
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6526
+ reasoning: false,
6527
+ input: ["text", "image"],
6528
+ cost: {
6529
+ input: 0,
6530
+ output: 0,
6531
+ cacheRead: 0,
6532
+ cacheWrite: 0,
6533
+ },
6534
+ contextWindow: 128000,
6535
+ maxTokens: 8192,
6536
+ },
6537
+ "meta/llama-3.3-70b-instruct": {
6538
+ id: "meta/llama-3.3-70b-instruct",
6539
+ name: "Llama 3.3 70b Instruct",
6540
+ api: "openai-completions",
6541
+ provider: "nvidia",
6542
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6543
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6544
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6545
+ reasoning: false,
6546
+ input: ["text"],
6547
+ cost: {
6548
+ input: 0,
6549
+ output: 0,
6550
+ cacheRead: 0,
6551
+ cacheWrite: 0,
6552
+ },
6553
+ contextWindow: 128000,
6554
+ maxTokens: 4096,
6555
+ },
6556
+ "mistralai/mistral-large-3-675b-instruct-2512": {
6557
+ id: "mistralai/mistral-large-3-675b-instruct-2512",
6558
+ name: "Mistral Large 3 675B Instruct 2512",
6559
+ api: "openai-completions",
6560
+ provider: "nvidia",
6561
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6562
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6563
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6564
+ reasoning: false,
6565
+ input: ["text", "image"],
6566
+ cost: {
6567
+ input: 0,
6568
+ output: 0,
6569
+ cacheRead: 0,
6570
+ cacheWrite: 0,
6571
+ },
6572
+ contextWindow: 262144,
6573
+ maxTokens: 262144,
6574
+ },
6575
+ "mistralai/mistral-small-4-119b-2603": {
6576
+ id: "mistralai/mistral-small-4-119b-2603",
6577
+ name: "mistral-small-4-119b-2603",
6578
+ api: "openai-completions",
6579
+ provider: "nvidia",
6580
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6581
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6582
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6583
+ reasoning: false,
6584
+ input: ["text"],
6585
+ cost: {
6586
+ input: 0,
6587
+ output: 0,
6588
+ cacheRead: 0,
6589
+ cacheWrite: 0,
6590
+ },
6591
+ contextWindow: 128000,
6592
+ maxTokens: 8192,
6593
+ },
6594
+ "moonshotai/kimi-k2.6": {
6595
+ id: "moonshotai/kimi-k2.6",
6596
+ name: "Kimi K2.6",
6597
+ api: "openai-completions",
6598
+ provider: "nvidia",
6599
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6600
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6601
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6602
+ reasoning: true,
6603
+ input: ["text", "image"],
6604
+ cost: {
6605
+ input: 0,
6606
+ output: 0,
6607
+ cacheRead: 0,
6608
+ cacheWrite: 0,
6609
+ },
6610
+ contextWindow: 262144,
6611
+ maxTokens: 262144,
6612
+ },
6613
+ "nvidia/llama-3.3-nemotron-super-49b-v1": {
6614
+ id: "nvidia/llama-3.3-nemotron-super-49b-v1",
6615
+ name: "Llama 3.3 Nemotron Super 49B v1",
6616
+ api: "openai-completions",
6617
+ provider: "nvidia",
6618
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6619
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6620
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6621
+ reasoning: true,
6622
+ input: ["text"],
6623
+ cost: {
6624
+ input: 0,
6625
+ output: 0,
6626
+ cacheRead: 0,
6627
+ cacheWrite: 0,
6628
+ },
6629
+ contextWindow: 131072,
6630
+ maxTokens: 131072,
6631
+ },
6632
+ "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
6633
+ id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
6634
+ name: "Llama 3.3 Nemotron Super 49B v1.5",
6635
+ api: "openai-completions",
6636
+ provider: "nvidia",
6637
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6638
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6639
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6640
+ reasoning: true,
6641
+ input: ["text"],
6642
+ cost: {
6643
+ input: 0,
6644
+ output: 0,
6645
+ cacheRead: 0,
6646
+ cacheWrite: 0,
6647
+ },
6648
+ contextWindow: 131072,
6649
+ maxTokens: 131072,
6650
+ },
6651
+ "nvidia/nemotron-3-nano-30b-a3b": {
6652
+ id: "nvidia/nemotron-3-nano-30b-a3b",
6653
+ name: "nemotron-3-nano-30b-a3b",
6654
+ api: "openai-completions",
6655
+ provider: "nvidia",
6656
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6657
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6658
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6659
+ reasoning: true,
6660
+ input: ["text"],
6661
+ cost: {
6662
+ input: 0,
6663
+ output: 0,
6664
+ cacheRead: 0,
6665
+ cacheWrite: 0,
6666
+ },
6667
+ contextWindow: 131072,
6668
+ maxTokens: 131072,
6669
+ },
6670
+ "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning": {
6671
+ id: "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning",
6672
+ name: "Nemotron 3 Nano Omni",
6673
+ api: "openai-completions",
6674
+ provider: "nvidia",
6675
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6676
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6677
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6678
+ reasoning: true,
6679
+ input: ["text", "image"],
6680
+ cost: {
6681
+ input: 0,
6682
+ output: 0,
6683
+ cacheRead: 0,
6684
+ cacheWrite: 0,
6685
+ },
6686
+ contextWindow: 256000,
6687
+ maxTokens: 65536,
6688
+ },
6689
+ "nvidia/nemotron-3-super-120b-a12b": {
6690
+ id: "nvidia/nemotron-3-super-120b-a12b",
6691
+ name: "Nemotron 3 Super",
6692
+ api: "openai-completions",
6693
+ provider: "nvidia",
6694
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6695
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6696
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6697
+ reasoning: true,
6698
+ input: ["text"],
6699
+ cost: {
6700
+ input: 0.2,
6701
+ output: 0.8,
6702
+ cacheRead: 0,
6703
+ cacheWrite: 0,
6704
+ },
6705
+ contextWindow: 262144,
6706
+ maxTokens: 262144,
6707
+ },
6708
+ "nvidia/nvidia-nemotron-nano-9b-v2": {
6709
+ id: "nvidia/nvidia-nemotron-nano-9b-v2",
6710
+ name: "nvidia-nemotron-nano-9b-v2",
6711
+ api: "openai-completions",
6712
+ provider: "nvidia",
6713
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6714
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6715
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6716
+ reasoning: true,
6717
+ input: ["text"],
6718
+ cost: {
6719
+ input: 0,
6720
+ output: 0,
6721
+ cacheRead: 0,
6722
+ cacheWrite: 0,
6723
+ },
6724
+ contextWindow: 131072,
6725
+ maxTokens: 131072,
6726
+ },
6727
+ "openai/gpt-oss-20b": {
6728
+ id: "openai/gpt-oss-20b",
6729
+ name: "GPT OSS 20B",
6730
+ api: "openai-completions",
6731
+ provider: "nvidia",
6732
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6733
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6734
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6735
+ reasoning: true,
6736
+ input: ["text"],
6737
+ cost: {
6738
+ input: 0,
6739
+ output: 0,
6740
+ cacheRead: 0,
6741
+ cacheWrite: 0,
6742
+ },
6743
+ contextWindow: 131072,
6744
+ maxTokens: 32768,
6745
+ },
6746
+ "qwen/qwen3-coder-480b-a35b-instruct": {
6747
+ id: "qwen/qwen3-coder-480b-a35b-instruct",
6748
+ name: "Qwen3 Coder 480B A35B Instruct",
6749
+ api: "openai-completions",
6750
+ provider: "nvidia",
6751
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6752
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6753
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6754
+ reasoning: false,
6755
+ input: ["text"],
6756
+ cost: {
6757
+ input: 0,
6758
+ output: 0,
6759
+ cacheRead: 0,
6237
6760
  cacheWrite: 0,
6238
6761
  },
6239
6762
  contextWindow: 262144,
6240
- maxTokens: 262144,
6763
+ maxTokens: 66536,
6241
6764
  },
6242
- "kimi-k2-thinking-turbo": {
6243
- id: "kimi-k2-thinking-turbo",
6244
- name: "Kimi K2 Thinking Turbo",
6765
+ "qwen/qwen3.5-122b-a10b": {
6766
+ id: "qwen/qwen3.5-122b-a10b",
6767
+ name: "Qwen3.5 122B-A10B",
6245
6768
  api: "openai-completions",
6246
- provider: "moonshotai-cn",
6247
- baseUrl: "https://api.moonshot.cn/v1",
6248
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6769
+ provider: "nvidia",
6770
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6771
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6772
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6249
6773
  reasoning: true,
6250
- input: ["text"],
6774
+ input: ["text", "image"],
6251
6775
  cost: {
6252
- input: 1.15,
6253
- output: 8,
6254
- cacheRead: 0.15,
6776
+ input: 0,
6777
+ output: 0,
6778
+ cacheRead: 0,
6255
6779
  cacheWrite: 0,
6256
6780
  },
6257
6781
  contextWindow: 262144,
6258
- maxTokens: 262144,
6782
+ maxTokens: 65536,
6259
6783
  },
6260
- "kimi-k2-turbo-preview": {
6261
- id: "kimi-k2-turbo-preview",
6262
- name: "Kimi K2 Turbo",
6784
+ "stepfun-ai/step-3.5-flash": {
6785
+ id: "stepfun-ai/step-3.5-flash",
6786
+ name: "Step 3.5 Flash",
6263
6787
  api: "openai-completions",
6264
- provider: "moonshotai-cn",
6265
- baseUrl: "https://api.moonshot.cn/v1",
6266
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6267
- reasoning: false,
6788
+ provider: "nvidia",
6789
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6790
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6791
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6792
+ reasoning: true,
6268
6793
  input: ["text"],
6269
6794
  cost: {
6270
- input: 2.4,
6271
- output: 10,
6272
- cacheRead: 0.6,
6795
+ input: 0,
6796
+ output: 0,
6797
+ cacheRead: 0,
6273
6798
  cacheWrite: 0,
6274
6799
  },
6275
- contextWindow: 262144,
6276
- maxTokens: 262144,
6800
+ contextWindow: 256000,
6801
+ maxTokens: 16384,
6277
6802
  },
6278
- "kimi-k2.5": {
6279
- id: "kimi-k2.5",
6280
- name: "Kimi K2.5",
6803
+ "stepfun-ai/step-3.7-flash": {
6804
+ id: "stepfun-ai/step-3.7-flash",
6805
+ name: "Step 3.7 Flash",
6281
6806
  api: "openai-completions",
6282
- provider: "moonshotai-cn",
6283
- baseUrl: "https://api.moonshot.cn/v1",
6284
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6807
+ provider: "nvidia",
6808
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6809
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6810
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6285
6811
  reasoning: true,
6286
6812
  input: ["text", "image"],
6287
6813
  cost: {
6288
- input: 0.6,
6289
- output: 3,
6290
- cacheRead: 0.1,
6814
+ input: 0,
6815
+ output: 0,
6816
+ cacheRead: 0,
6291
6817
  cacheWrite: 0,
6292
6818
  },
6293
- contextWindow: 262144,
6294
- maxTokens: 262144,
6819
+ contextWindow: 256000,
6820
+ maxTokens: 16384,
6295
6821
  },
6296
- "kimi-k2.6": {
6297
- id: "kimi-k2.6",
6298
- name: "Kimi K2.6",
6822
+ "z-ai/glm-5.1": {
6823
+ id: "z-ai/glm-5.1",
6824
+ name: "GLM-5.1",
6299
6825
  api: "openai-completions",
6300
- provider: "moonshotai-cn",
6301
- baseUrl: "https://api.moonshot.cn/v1",
6302
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6826
+ provider: "nvidia",
6827
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6828
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6829
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6303
6830
  reasoning: true,
6304
- input: ["text", "image"],
6831
+ input: ["text"],
6305
6832
  cost: {
6306
- input: 0.95,
6307
- output: 4,
6308
- cacheRead: 0.16,
6833
+ input: 0,
6834
+ output: 0,
6835
+ cacheRead: 0,
6309
6836
  cacheWrite: 0,
6310
6837
  },
6311
- contextWindow: 262144,
6312
- maxTokens: 262144,
6838
+ contextWindow: 131072,
6839
+ maxTokens: 131072,
6313
6840
  },
6314
6841
  },
6315
6842
  "openai": {
@@ -6886,7 +7413,7 @@ export const MODELS = {
6886
7413
  provider: "openai",
6887
7414
  baseUrl: "https://api.openai.com/v1",
6888
7415
  reasoning: true,
6889
- thinkingLevelMap: { "off": "none", "xhigh": "xhigh" },
7416
+ thinkingLevelMap: { "off": "none", "xhigh": "xhigh", "minimal": null },
6890
7417
  input: ["text", "image"],
6891
7418
  cost: {
6892
7419
  input: 5,
@@ -7053,42 +7580,6 @@ export const MODELS = {
7053
7580
  },
7054
7581
  },
7055
7582
  "openai-codex": {
7056
- "gpt-5.2": {
7057
- id: "gpt-5.2",
7058
- name: "GPT-5.2",
7059
- api: "openai-codex-responses",
7060
- provider: "openai-codex",
7061
- baseUrl: "https://chatgpt.com/backend-api",
7062
- reasoning: true,
7063
- thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7064
- input: ["text", "image"],
7065
- cost: {
7066
- input: 1.75,
7067
- output: 14,
7068
- cacheRead: 0.175,
7069
- cacheWrite: 0,
7070
- },
7071
- contextWindow: 272000,
7072
- maxTokens: 128000,
7073
- },
7074
- "gpt-5.3-codex": {
7075
- id: "gpt-5.3-codex",
7076
- name: "GPT-5.3 Codex",
7077
- api: "openai-codex-responses",
7078
- provider: "openai-codex",
7079
- baseUrl: "https://chatgpt.com/backend-api",
7080
- reasoning: true,
7081
- thinkingLevelMap: { "xhigh": "xhigh", "minimal": "low" },
7082
- input: ["text", "image"],
7083
- cost: {
7084
- input: 1.75,
7085
- output: 14,
7086
- cacheRead: 0.175,
7087
- cacheWrite: 0,
7088
- },
7089
- contextWindow: 272000,
7090
- maxTokens: 128000,
7091
- },
7092
7583
  "gpt-5.3-codex-spark": {
7093
7584
  id: "gpt-5.3-codex-spark",
7094
7585
  name: "GPT-5.3 Codex Spark",
@@ -7256,7 +7747,7 @@ export const MODELS = {
7256
7747
  api: "anthropic-messages",
7257
7748
  provider: "opencode",
7258
7749
  baseUrl: "https://opencode.ai/zen",
7259
- compat: { "forceAdaptiveThinking": true },
7750
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7260
7751
  reasoning: true,
7261
7752
  thinkingLevelMap: { "xhigh": "xhigh" },
7262
7753
  input: ["text", "image"],
@@ -7275,7 +7766,7 @@ export const MODELS = {
7275
7766
  api: "anthropic-messages",
7276
7767
  provider: "opencode",
7277
7768
  baseUrl: "https://opencode.ai/zen",
7278
- compat: { "forceAdaptiveThinking": true },
7769
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
7279
7770
  reasoning: true,
7280
7771
  thinkingLevelMap: { "xhigh": "xhigh" },
7281
7772
  input: ["text", "image"],
@@ -7340,6 +7831,25 @@ export const MODELS = {
7340
7831
  contextWindow: 1000000,
7341
7832
  maxTokens: 64000,
7342
7833
  },
7834
+ "deepseek-v4-flash": {
7835
+ id: "deepseek-v4-flash",
7836
+ name: "DeepSeek V4 Flash",
7837
+ api: "openai-completions",
7838
+ provider: "opencode",
7839
+ baseUrl: "https://opencode.ai/zen/v1",
7840
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7841
+ reasoning: true,
7842
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7843
+ input: ["text"],
7844
+ cost: {
7845
+ input: 0.14,
7846
+ output: 0.28,
7847
+ cacheRead: 0.03,
7848
+ cacheWrite: 0,
7849
+ },
7850
+ contextWindow: 1000000,
7851
+ maxTokens: 384000,
7852
+ },
7343
7853
  "deepseek-v4-flash-free": {
7344
7854
  id: "deepseek-v4-flash-free",
7345
7855
  name: "DeepSeek V4 Flash Free",
@@ -7803,8 +8313,8 @@ export const MODELS = {
7803
8313
  cacheRead: 0,
7804
8314
  cacheWrite: 0,
7805
8315
  },
7806
- contextWindow: 1000000,
7807
- maxTokens: 128000,
8316
+ contextWindow: 200000,
8317
+ maxTokens: 32000,
7808
8318
  },
7809
8319
  "minimax-m2.5": {
7810
8320
  id: "minimax-m2.5",
@@ -7840,9 +8350,26 @@ export const MODELS = {
7840
8350
  contextWindow: 204800,
7841
8351
  maxTokens: 131072,
7842
8352
  },
7843
- "nemotron-3-super-free": {
7844
- id: "nemotron-3-super-free",
7845
- name: "Nemotron 3 Super Free",
8353
+ "minimax-m3-free": {
8354
+ id: "minimax-m3-free",
8355
+ name: "MiniMax M3 Free",
8356
+ api: "anthropic-messages",
8357
+ provider: "opencode",
8358
+ baseUrl: "https://opencode.ai/zen",
8359
+ reasoning: true,
8360
+ input: ["text", "image"],
8361
+ cost: {
8362
+ input: 0,
8363
+ output: 0,
8364
+ cacheRead: 0,
8365
+ cacheWrite: 0,
8366
+ },
8367
+ contextWindow: 200000,
8368
+ maxTokens: 32000,
8369
+ },
8370
+ "nemotron-3-ultra-free": {
8371
+ id: "nemotron-3-ultra-free",
8372
+ name: "Nemotron 3 Ultra Free",
7846
8373
  api: "openai-completions",
7847
8374
  provider: "opencode",
7848
8375
  baseUrl: "https://opencode.ai/zen/v1",
@@ -7854,7 +8381,7 @@ export const MODELS = {
7854
8381
  cacheRead: 0,
7855
8382
  cacheWrite: 0,
7856
8383
  },
7857
- contextWindow: 204800,
8384
+ contextWindow: 1000000,
7858
8385
  maxTokens: 128000,
7859
8386
  },
7860
8387
  "qwen3.5-plus": {
@@ -8069,6 +8596,23 @@ export const MODELS = {
8069
8596
  contextWindow: 204800,
8070
8597
  maxTokens: 131072,
8071
8598
  },
8599
+ "minimax-m3": {
8600
+ id: "minimax-m3",
8601
+ name: "MiniMax M3",
8602
+ api: "anthropic-messages",
8603
+ provider: "opencode-go",
8604
+ baseUrl: "https://opencode.ai/zen/go",
8605
+ reasoning: true,
8606
+ input: ["text", "image"],
8607
+ cost: {
8608
+ input: 0.6,
8609
+ output: 2.4,
8610
+ cacheRead: 0.12,
8611
+ cacheWrite: 0,
8612
+ },
8613
+ contextWindow: 512000,
8614
+ maxTokens: 131072,
8615
+ },
8072
8616
  "qwen3.6-plus": {
8073
8617
  id: "qwen3.6-plus",
8074
8618
  name: "Qwen3.6 Plus",
@@ -8104,6 +8648,23 @@ export const MODELS = {
8104
8648
  contextWindow: 1000000,
8105
8649
  maxTokens: 65536,
8106
8650
  },
8651
+ "qwen3.7-plus": {
8652
+ id: "qwen3.7-plus",
8653
+ name: "Qwen3.7 Plus",
8654
+ api: "anthropic-messages",
8655
+ provider: "opencode-go",
8656
+ baseUrl: "https://opencode.ai/zen/go",
8657
+ reasoning: true,
8658
+ input: ["text", "image"],
8659
+ cost: {
8660
+ input: 0.4,
8661
+ output: 1.6,
8662
+ cacheRead: 0.04,
8663
+ cacheWrite: 0.5,
8664
+ },
8665
+ contextWindow: 262144,
8666
+ maxTokens: 65536,
8667
+ },
8107
8668
  },
8108
8669
  "openrouter": {
8109
8670
  "ai21/jamba-large-1.7": {
@@ -8537,23 +9098,6 @@ export const MODELS = {
8537
9098
  contextWindow: 2000000,
8538
9099
  maxTokens: 30000,
8539
9100
  },
8540
- "baidu/ernie-4.5-21b-a3b": {
8541
- id: "baidu/ernie-4.5-21b-a3b",
8542
- name: "Baidu: ERNIE 4.5 21B A3B",
8543
- api: "openai-completions",
8544
- provider: "openrouter",
8545
- baseUrl: "https://openrouter.ai/api/v1",
8546
- reasoning: false,
8547
- input: ["text"],
8548
- cost: {
8549
- input: 0.07,
8550
- output: 0.28,
8551
- cacheRead: 0,
8552
- cacheWrite: 0,
8553
- },
8554
- contextWindow: 131072,
8555
- maxTokens: 8000,
8556
- },
8557
9101
  "baidu/ernie-4.5-vl-28b-a3b": {
8558
9102
  id: "baidu/ernie-4.5-vl-28b-a3b",
8559
9103
  name: "Baidu: ERNIE 4.5 VL 28B A3B",
@@ -8682,8 +9226,8 @@ export const MODELS = {
8682
9226
  reasoning: false,
8683
9227
  input: ["text"],
8684
9228
  cost: {
8685
- input: 0.2288,
8686
- output: 0.9144,
9229
+ input: 0.20020000000000002,
9230
+ output: 0.8000999999999999,
8687
9231
  cacheRead: 0,
8688
9232
  cacheWrite: 0,
8689
9233
  },
@@ -8784,13 +9328,13 @@ export const MODELS = {
8784
9328
  reasoning: true,
8785
9329
  input: ["text"],
8786
9330
  cost: {
8787
- input: 0.252,
8788
- output: 0.378,
8789
- cacheRead: 0.0252,
9331
+ input: 0.2288,
9332
+ output: 0.3432,
9333
+ cacheRead: 0,
8790
9334
  cacheWrite: 0,
8791
9335
  },
8792
9336
  contextWindow: 131072,
8793
- maxTokens: 65536,
9337
+ maxTokens: 64000,
8794
9338
  },
8795
9339
  "deepseek/deepseek-v3.2-exp": {
8796
9340
  id: "deepseek/deepseek-v3.2-exp",
@@ -8828,25 +9372,6 @@ export const MODELS = {
8828
9372
  contextWindow: 1048576,
8829
9373
  maxTokens: 131072,
8830
9374
  },
8831
- "deepseek/deepseek-v4-flash:free": {
8832
- id: "deepseek/deepseek-v4-flash:free",
8833
- name: "DeepSeek: DeepSeek V4 Flash (free)",
8834
- api: "openai-completions",
8835
- provider: "openrouter",
8836
- baseUrl: "https://openrouter.ai/api/v1",
8837
- compat: { "requiresReasoningContentOnAssistantMessages": true },
8838
- reasoning: true,
8839
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
8840
- input: ["text"],
8841
- cost: {
8842
- input: 0,
8843
- output: 0,
8844
- cacheRead: 0,
8845
- cacheWrite: 0,
8846
- },
8847
- contextWindow: 1048576,
8848
- maxTokens: 384000,
8849
- },
8850
9375
  "deepseek/deepseek-v4-pro": {
8851
9376
  id: "deepseek/deepseek-v4-pro",
8852
9377
  name: "DeepSeek: DeepSeek V4 Pro",
@@ -8875,47 +9400,13 @@ export const MODELS = {
8875
9400
  reasoning: false,
8876
9401
  input: ["text"],
8877
9402
  cost: {
8878
- input: 0.15,
8879
- output: 0.15,
8880
- cacheRead: 0,
8881
- cacheWrite: 0,
8882
- },
8883
- contextWindow: 32768,
8884
- maxTokens: 4096,
8885
- },
8886
- "google/gemini-2.0-flash-001": {
8887
- id: "google/gemini-2.0-flash-001",
8888
- name: "Google: Gemini 2.0 Flash",
8889
- api: "openai-completions",
8890
- provider: "openrouter",
8891
- baseUrl: "https://openrouter.ai/api/v1",
8892
- reasoning: false,
8893
- input: ["text", "image"],
8894
- cost: {
8895
- input: 0.09999999999999999,
8896
- output: 0.39999999999999997,
8897
- cacheRead: 0.024999999999999998,
8898
- cacheWrite: 0.08333333333333334,
8899
- },
8900
- contextWindow: 1048576,
8901
- maxTokens: 8192,
8902
- },
8903
- "google/gemini-2.0-flash-lite-001": {
8904
- id: "google/gemini-2.0-flash-lite-001",
8905
- name: "Google: Gemini 2.0 Flash Lite",
8906
- api: "openai-completions",
8907
- provider: "openrouter",
8908
- baseUrl: "https://openrouter.ai/api/v1",
8909
- reasoning: false,
8910
- input: ["text", "image"],
8911
- cost: {
8912
- input: 0.075,
8913
- output: 0.3,
9403
+ input: 0.15,
9404
+ output: 0.15,
8914
9405
  cacheRead: 0,
8915
9406
  cacheWrite: 0,
8916
9407
  },
8917
- contextWindow: 1048576,
8918
- maxTokens: 8192,
9408
+ contextWindow: 32768,
9409
+ maxTokens: 4096,
8919
9410
  },
8920
9411
  "google/gemini-2.5-flash": {
8921
9412
  id: "google/gemini-2.5-flash",
@@ -9394,6 +9885,23 @@ export const MODELS = {
9394
9885
  contextWindow: 131072,
9395
9886
  maxTokens: 4096,
9396
9887
  },
9888
+ "meta-llama/llama-4-maverick": {
9889
+ id: "meta-llama/llama-4-maverick",
9890
+ name: "Meta: Llama 4 Maverick",
9891
+ api: "openai-completions",
9892
+ provider: "openrouter",
9893
+ baseUrl: "https://openrouter.ai/api/v1",
9894
+ reasoning: false,
9895
+ input: ["text", "image"],
9896
+ cost: {
9897
+ input: 0.15,
9898
+ output: 0.6,
9899
+ cacheRead: 0,
9900
+ cacheWrite: 0,
9901
+ },
9902
+ contextWindow: 1048576,
9903
+ maxTokens: 16384,
9904
+ },
9397
9905
  "meta-llama/llama-4-scout": {
9398
9906
  id: "meta-llama/llama-4-scout",
9399
9907
  name: "Meta: Llama 4 Scout",
@@ -9479,39 +9987,39 @@ export const MODELS = {
9479
9987
  contextWindow: 204800,
9480
9988
  maxTokens: 196608,
9481
9989
  },
9482
- "minimax/minimax-m2.5:free": {
9483
- id: "minimax/minimax-m2.5:free",
9484
- name: "MiniMax: MiniMax M2.5 (free)",
9990
+ "minimax/minimax-m2.7": {
9991
+ id: "minimax/minimax-m2.7",
9992
+ name: "MiniMax: MiniMax M2.7",
9485
9993
  api: "openai-completions",
9486
9994
  provider: "openrouter",
9487
9995
  baseUrl: "https://openrouter.ai/api/v1",
9488
9996
  reasoning: true,
9489
9997
  input: ["text"],
9490
9998
  cost: {
9491
- input: 0,
9492
- output: 0,
9999
+ input: 0.27899999999999997,
10000
+ output: 1.2,
9493
10001
  cacheRead: 0,
9494
10002
  cacheWrite: 0,
9495
10003
  },
9496
10004
  contextWindow: 204800,
9497
- maxTokens: 8192,
10005
+ maxTokens: 131072,
9498
10006
  },
9499
- "minimax/minimax-m2.7": {
9500
- id: "minimax/minimax-m2.7",
9501
- name: "MiniMax: MiniMax M2.7",
10007
+ "minimax/minimax-m3": {
10008
+ id: "minimax/minimax-m3",
10009
+ name: "MiniMax: MiniMax M3",
9502
10010
  api: "openai-completions",
9503
10011
  provider: "openrouter",
9504
10012
  baseUrl: "https://openrouter.ai/api/v1",
9505
10013
  reasoning: true,
9506
- input: ["text"],
10014
+ input: ["text", "image"],
9507
10015
  cost: {
9508
- input: 0.27899999999999997,
10016
+ input: 0.3,
9509
10017
  output: 1.2,
9510
- cacheRead: 0,
10018
+ cacheRead: 0.06,
9511
10019
  cacheWrite: 0,
9512
10020
  },
9513
- contextWindow: 204800,
9514
- maxTokens: 131072,
10021
+ contextWindow: 1048576,
10022
+ maxTokens: 512000,
9515
10023
  },
9516
10024
  "mistralai/codestral-2508": {
9517
10025
  id: "mistralai/codestral-2508",
@@ -9547,40 +10055,6 @@ export const MODELS = {
9547
10055
  contextWindow: 262144,
9548
10056
  maxTokens: 4096,
9549
10057
  },
9550
- "mistralai/devstral-medium": {
9551
- id: "mistralai/devstral-medium",
9552
- name: "Mistral: Devstral Medium",
9553
- api: "openai-completions",
9554
- provider: "openrouter",
9555
- baseUrl: "https://openrouter.ai/api/v1",
9556
- reasoning: false,
9557
- input: ["text"],
9558
- cost: {
9559
- input: 0.39999999999999997,
9560
- output: 2,
9561
- cacheRead: 0.04,
9562
- cacheWrite: 0,
9563
- },
9564
- contextWindow: 131072,
9565
- maxTokens: 4096,
9566
- },
9567
- "mistralai/devstral-small": {
9568
- id: "mistralai/devstral-small",
9569
- name: "Mistral: Devstral Small 1.1",
9570
- api: "openai-completions",
9571
- provider: "openrouter",
9572
- baseUrl: "https://openrouter.ai/api/v1",
9573
- reasoning: false,
9574
- input: ["text"],
9575
- cost: {
9576
- input: 0.09999999999999999,
9577
- output: 0.3,
9578
- cacheRead: 0.01,
9579
- cacheWrite: 0,
9580
- },
9581
- contextWindow: 131072,
9582
- maxTokens: 4096,
9583
- },
9584
10058
  "mistralai/ministral-14b-2512": {
9585
10059
  id: "mistralai/ministral-14b-2512",
9586
10060
  name: "Mistral: Ministral 3 14B 2512",
@@ -9666,23 +10140,6 @@ export const MODELS = {
9666
10140
  contextWindow: 131072,
9667
10141
  maxTokens: 4096,
9668
10142
  },
9669
- "mistralai/mistral-large-2411": {
9670
- id: "mistralai/mistral-large-2411",
9671
- name: "Mistral Large 2411",
9672
- api: "openai-completions",
9673
- provider: "openrouter",
9674
- baseUrl: "https://openrouter.ai/api/v1",
9675
- reasoning: false,
9676
- input: ["text"],
9677
- cost: {
9678
- input: 2,
9679
- output: 6,
9680
- cacheRead: 0.19999999999999998,
9681
- cacheWrite: 0,
9682
- },
9683
- contextWindow: 131072,
9684
- maxTokens: 4096,
9685
- },
9686
10143
  "mistralai/mistral-large-2512": {
9687
10144
  id: "mistralai/mistral-large-2512",
9688
10145
  name: "Mistral: Mistral Large 3 2512",
@@ -9836,23 +10293,6 @@ export const MODELS = {
9836
10293
  contextWindow: 65536,
9837
10294
  maxTokens: 4096,
9838
10295
  },
9839
- "mistralai/pixtral-large-2411": {
9840
- id: "mistralai/pixtral-large-2411",
9841
- name: "Mistral: Pixtral Large 2411",
9842
- api: "openai-completions",
9843
- provider: "openrouter",
9844
- baseUrl: "https://openrouter.ai/api/v1",
9845
- reasoning: false,
9846
- input: ["text", "image"],
9847
- cost: {
9848
- input: 2,
9849
- output: 6,
9850
- cacheRead: 0.19999999999999998,
9851
- cacheWrite: 0,
9852
- },
9853
- contextWindow: 131072,
9854
- maxTokens: 4096,
9855
- },
9856
10296
  "mistralai/voxtral-small-24b-2507": {
9857
10297
  id: "mistralai/voxtral-small-24b-2507",
9858
10298
  name: "Mistral: Voxtral Small 24B 2507",
@@ -9944,7 +10384,7 @@ export const MODELS = {
9944
10384
  api: "openai-completions",
9945
10385
  provider: "openrouter",
9946
10386
  baseUrl: "https://openrouter.ai/api/v1",
9947
- compat: { "supportsDeveloperRole": false },
10387
+ compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
9948
10388
  reasoning: true,
9949
10389
  input: ["text", "image"],
9950
10390
  cost: {
@@ -9962,7 +10402,7 @@ export const MODELS = {
9962
10402
  api: "openai-completions",
9963
10403
  provider: "openrouter",
9964
10404
  baseUrl: "https://openrouter.ai/api/v1",
9965
- compat: { "supportsDeveloperRole": false },
10405
+ compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
9966
10406
  reasoning: true,
9967
10407
  input: ["text", "image"],
9968
10408
  cost: {
@@ -10093,6 +10533,40 @@ export const MODELS = {
10093
10533
  contextWindow: 1000000,
10094
10534
  maxTokens: 262144,
10095
10535
  },
10536
+ "nvidia/nemotron-3-ultra-550b-a55b": {
10537
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
10538
+ name: "NVIDIA: Nemotron 3 Ultra",
10539
+ api: "openai-completions",
10540
+ provider: "openrouter",
10541
+ baseUrl: "https://openrouter.ai/api/v1",
10542
+ reasoning: true,
10543
+ input: ["text"],
10544
+ cost: {
10545
+ input: 0.5,
10546
+ output: 2.5,
10547
+ cacheRead: 0.15,
10548
+ cacheWrite: 0,
10549
+ },
10550
+ contextWindow: 1000000,
10551
+ maxTokens: 16384,
10552
+ },
10553
+ "nvidia/nemotron-3-ultra-550b-a55b:free": {
10554
+ id: "nvidia/nemotron-3-ultra-550b-a55b:free",
10555
+ name: "NVIDIA: Nemotron 3 Ultra (free)",
10556
+ api: "openai-completions",
10557
+ provider: "openrouter",
10558
+ baseUrl: "https://openrouter.ai/api/v1",
10559
+ reasoning: true,
10560
+ input: ["text"],
10561
+ cost: {
10562
+ input: 0,
10563
+ output: 0,
10564
+ cacheRead: 0,
10565
+ cacheWrite: 0,
10566
+ },
10567
+ contextWindow: 1000000,
10568
+ maxTokens: 65536,
10569
+ },
10096
10570
  "nvidia/nemotron-nano-12b-v2-vl:free": {
10097
10571
  id: "nvidia/nemotron-nano-12b-v2-vl:free",
10098
10572
  name: "NVIDIA: Nemotron Nano 12B 2 VL (free)",
@@ -10212,23 +10686,6 @@ export const MODELS = {
10212
10686
  contextWindow: 8191,
10213
10687
  maxTokens: 4096,
10214
10688
  },
10215
- "openai/gpt-4-0314": {
10216
- id: "openai/gpt-4-0314",
10217
- name: "OpenAI: GPT-4 (older v0314)",
10218
- api: "openai-completions",
10219
- provider: "openrouter",
10220
- baseUrl: "https://openrouter.ai/api/v1",
10221
- reasoning: false,
10222
- input: ["text"],
10223
- cost: {
10224
- input: 30,
10225
- output: 60,
10226
- cacheRead: 0,
10227
- cacheWrite: 0,
10228
- },
10229
- contextWindow: 8191,
10230
- maxTokens: 4096,
10231
- },
10232
10689
  "openai/gpt-4-1106-preview": {
10233
10690
  id: "openai/gpt-4-1106-preview",
10234
10691
  name: "OpenAI: GPT-4 Turbo (older v1106)",
@@ -10913,13 +11370,13 @@ export const MODELS = {
10913
11370
  reasoning: true,
10914
11371
  input: ["text"],
10915
11372
  cost: {
10916
- input: 0.03,
11373
+ input: 0.029,
10917
11374
  output: 0.14,
10918
11375
  cacheRead: 0,
10919
11376
  cacheWrite: 0,
10920
11377
  },
10921
11378
  contextWindow: 131072,
10922
- maxTokens: 131072,
11379
+ maxTokens: 4096,
10923
11380
  },
10924
11381
  "openai/gpt-oss-20b:free": {
10925
11382
  id: "openai/gpt-oss-20b:free",
@@ -11227,23 +11684,6 @@ export const MODELS = {
11227
11684
  contextWindow: 131072,
11228
11685
  maxTokens: 16384,
11229
11686
  },
11230
- "qwen/qwen-2.5-7b-instruct": {
11231
- id: "qwen/qwen-2.5-7b-instruct",
11232
- name: "Qwen: Qwen2.5 7B Instruct",
11233
- api: "openai-completions",
11234
- provider: "openrouter",
11235
- baseUrl: "https://openrouter.ai/api/v1",
11236
- reasoning: false,
11237
- input: ["text"],
11238
- cost: {
11239
- input: 0.04,
11240
- output: 0.09999999999999999,
11241
- cacheRead: 0,
11242
- cacheWrite: 0,
11243
- },
11244
- contextWindow: 131072,
11245
- maxTokens: 32768,
11246
- },
11247
11687
  "qwen/qwen-plus": {
11248
11688
  id: "qwen/qwen-plus",
11249
11689
  name: "Qwen: Qwen-Plus",
@@ -11355,13 +11795,13 @@ export const MODELS = {
11355
11795
  reasoning: true,
11356
11796
  input: ["text"],
11357
11797
  cost: {
11358
- input: 0.14950000000000002,
11359
- output: 1.495,
11360
- cacheRead: 0,
11798
+ input: 0.09999999999999999,
11799
+ output: 0.09999999999999999,
11800
+ cacheRead: 0.09999999999999999,
11361
11801
  cacheWrite: 0,
11362
11802
  },
11363
11803
  contextWindow: 262144,
11364
- maxTokens: 4096,
11804
+ maxTokens: 262144,
11365
11805
  },
11366
11806
  "qwen/qwen3-30b-a3b": {
11367
11807
  id: "qwen/qwen3-30b-a3b",
@@ -11389,13 +11829,13 @@ export const MODELS = {
11389
11829
  reasoning: false,
11390
11830
  input: ["text"],
11391
11831
  cost: {
11392
- input: 0.09,
11393
- output: 0.3,
11832
+ input: 0.04815,
11833
+ output: 0.19305,
11394
11834
  cacheRead: 0,
11395
11835
  cacheWrite: 0,
11396
11836
  },
11397
- contextWindow: 262144,
11398
- maxTokens: 262144,
11837
+ contextWindow: 131072,
11838
+ maxTokens: 32000,
11399
11839
  },
11400
11840
  "qwen/qwen3-30b-a3b-thinking-2507": {
11401
11841
  id: "qwen/qwen3-30b-a3b-thinking-2507",
@@ -11797,13 +12237,13 @@ export const MODELS = {
11797
12237
  reasoning: true,
11798
12238
  input: ["text", "image"],
11799
12239
  cost: {
11800
- input: 0.13899999999999998,
12240
+ input: 0.14,
11801
12241
  output: 1,
11802
- cacheRead: 0,
12242
+ cacheRead: 0.049999999999999996,
11803
12243
  cacheWrite: 0,
11804
12244
  },
11805
12245
  contextWindow: 262144,
11806
- maxTokens: 4096,
12246
+ maxTokens: 262144,
11807
12247
  },
11808
12248
  "qwen/qwen3.5-397b-a17b": {
11809
12249
  id: "qwen/qwen3.5-397b-a17b",
@@ -11992,6 +12432,23 @@ export const MODELS = {
11992
12432
  contextWindow: 1000000,
11993
12433
  maxTokens: 65536,
11994
12434
  },
12435
+ "qwen/qwen3.7-plus": {
12436
+ id: "qwen/qwen3.7-plus",
12437
+ name: "Qwen: Qwen3.7 Plus",
12438
+ api: "openai-completions",
12439
+ provider: "openrouter",
12440
+ baseUrl: "https://openrouter.ai/api/v1",
12441
+ reasoning: true,
12442
+ input: ["text", "image"],
12443
+ cost: {
12444
+ input: 0.39999999999999997,
12445
+ output: 1.5999999999999999,
12446
+ cacheRead: 0.08,
12447
+ cacheWrite: 0.5,
12448
+ },
12449
+ contextWindow: 1000000,
12450
+ maxTokens: 65536,
12451
+ },
11995
12452
  "rekaai/reka-edge": {
11996
12453
  id: "rekaai/reka-edge",
11997
12454
  name: "Reka Edge",
@@ -12230,40 +12687,6 @@ export const MODELS = {
12230
12687
  contextWindow: 262144,
12231
12688
  maxTokens: 65536,
12232
12689
  },
12233
- "xiaomi/mimo-v2-omni": {
12234
- id: "xiaomi/mimo-v2-omni",
12235
- name: "Xiaomi: MiMo-V2-Omni",
12236
- api: "openai-completions",
12237
- provider: "openrouter",
12238
- baseUrl: "https://openrouter.ai/api/v1",
12239
- reasoning: true,
12240
- input: ["text", "image"],
12241
- cost: {
12242
- input: 0.39999999999999997,
12243
- output: 2,
12244
- cacheRead: 0.08,
12245
- cacheWrite: 0,
12246
- },
12247
- contextWindow: 262144,
12248
- maxTokens: 65536,
12249
- },
12250
- "xiaomi/mimo-v2-pro": {
12251
- id: "xiaomi/mimo-v2-pro",
12252
- name: "Xiaomi: MiMo-V2-Pro",
12253
- api: "openai-completions",
12254
- provider: "openrouter",
12255
- baseUrl: "https://openrouter.ai/api/v1",
12256
- reasoning: true,
12257
- input: ["text"],
12258
- cost: {
12259
- input: 1,
12260
- output: 3,
12261
- cacheRead: 0.19999999999999998,
12262
- cacheWrite: 0,
12263
- },
12264
- contextWindow: 1048576,
12265
- maxTokens: 131072,
12266
- },
12267
12690
  "xiaomi/mimo-v2.5": {
12268
12691
  id: "xiaomi/mimo-v2.5",
12269
12692
  name: "Xiaomi: MiMo-V2.5",
@@ -13021,7 +13444,7 @@ export const MODELS = {
13021
13444
  api: "anthropic-messages",
13022
13445
  provider: "vercel-ai-gateway",
13023
13446
  baseUrl: "https://ai-gateway.vercel.sh",
13024
- reasoning: false,
13447
+ reasoning: true,
13025
13448
  input: ["text"],
13026
13449
  cost: {
13027
13450
  input: 0.22,
@@ -13073,7 +13496,7 @@ export const MODELS = {
13073
13496
  provider: "vercel-ai-gateway",
13074
13497
  baseUrl: "https://ai-gateway.vercel.sh",
13075
13498
  reasoning: true,
13076
- input: ["text", "image"],
13499
+ input: ["text"],
13077
13500
  cost: {
13078
13501
  input: 1.3,
13079
13502
  output: 7.8,
@@ -13106,7 +13529,7 @@ export const MODELS = {
13106
13529
  api: "anthropic-messages",
13107
13530
  provider: "vercel-ai-gateway",
13108
13531
  baseUrl: "https://ai-gateway.vercel.sh",
13109
- reasoning: false,
13532
+ reasoning: true,
13110
13533
  input: ["text"],
13111
13534
  cost: {
13112
13535
  input: 1.5,
@@ -13140,7 +13563,7 @@ export const MODELS = {
13140
13563
  api: "anthropic-messages",
13141
13564
  provider: "vercel-ai-gateway",
13142
13565
  baseUrl: "https://ai-gateway.vercel.sh",
13143
- reasoning: false,
13566
+ reasoning: true,
13144
13567
  input: ["text"],
13145
13568
  cost: {
13146
13569
  input: 0.5,
@@ -13202,22 +13625,56 @@ export const MODELS = {
13202
13625
  contextWindow: 262144,
13203
13626
  maxTokens: 32768,
13204
13627
  },
13205
- "alibaba/qwen3-max-thinking": {
13206
- id: "alibaba/qwen3-max-thinking",
13207
- name: "Qwen 3 Max Thinking",
13628
+ "alibaba/qwen3-max-thinking": {
13629
+ id: "alibaba/qwen3-max-thinking",
13630
+ name: "Qwen 3 Max Thinking",
13631
+ api: "anthropic-messages",
13632
+ provider: "vercel-ai-gateway",
13633
+ baseUrl: "https://ai-gateway.vercel.sh",
13634
+ reasoning: true,
13635
+ input: ["text"],
13636
+ cost: {
13637
+ input: 1.2,
13638
+ output: 6,
13639
+ cacheRead: 0.24,
13640
+ cacheWrite: 0,
13641
+ },
13642
+ contextWindow: 256000,
13643
+ maxTokens: 65536,
13644
+ },
13645
+ "alibaba/qwen3-next-80b-a3b-instruct": {
13646
+ id: "alibaba/qwen3-next-80b-a3b-instruct",
13647
+ name: "Qwen3 Next 80B A3B Instruct",
13648
+ api: "anthropic-messages",
13649
+ provider: "vercel-ai-gateway",
13650
+ baseUrl: "https://ai-gateway.vercel.sh",
13651
+ reasoning: false,
13652
+ input: ["text"],
13653
+ cost: {
13654
+ input: 0.15,
13655
+ output: 1.2,
13656
+ cacheRead: 0,
13657
+ cacheWrite: 0,
13658
+ },
13659
+ contextWindow: 131072,
13660
+ maxTokens: 32768,
13661
+ },
13662
+ "alibaba/qwen3-next-80b-a3b-thinking": {
13663
+ id: "alibaba/qwen3-next-80b-a3b-thinking",
13664
+ name: "Qwen3 Next 80B A3B Thinking",
13208
13665
  api: "anthropic-messages",
13209
13666
  provider: "vercel-ai-gateway",
13210
13667
  baseUrl: "https://ai-gateway.vercel.sh",
13211
13668
  reasoning: true,
13212
13669
  input: ["text"],
13213
13670
  cost: {
13214
- input: 1.2,
13215
- output: 6,
13216
- cacheRead: 0.24,
13671
+ input: 0.15,
13672
+ output: 1.2,
13673
+ cacheRead: 0,
13217
13674
  cacheWrite: 0,
13218
13675
  },
13219
- contextWindow: 256000,
13220
- maxTokens: 65536,
13676
+ contextWindow: 131072,
13677
+ maxTokens: 32768,
13221
13678
  },
13222
13679
  "alibaba/qwen3-vl-thinking": {
13223
13680
  id: "alibaba/qwen3-vl-thinking",
@@ -13311,7 +13768,7 @@ export const MODELS = {
13311
13768
  provider: "vercel-ai-gateway",
13312
13769
  baseUrl: "https://ai-gateway.vercel.sh",
13313
13770
  reasoning: true,
13314
- input: ["text", "image"],
13771
+ input: ["text"],
13315
13772
  cost: {
13316
13773
  input: 1.25,
13317
13774
  output: 3.75,
@@ -13321,6 +13778,23 @@ export const MODELS = {
13321
13778
  contextWindow: 991000,
13322
13779
  maxTokens: 64000,
13323
13780
  },
13781
+ "alibaba/qwen3.7-plus": {
13782
+ id: "alibaba/qwen3.7-plus",
13783
+ name: "Qwen 3.7 Plus",
13784
+ api: "anthropic-messages",
13785
+ provider: "vercel-ai-gateway",
13786
+ baseUrl: "https://ai-gateway.vercel.sh",
13787
+ reasoning: true,
13788
+ input: ["text", "image"],
13789
+ cost: {
13790
+ input: 0.39999999999999997,
13791
+ output: 1.5999999999999999,
13792
+ cacheRead: 0.08,
13793
+ cacheWrite: 0.5,
13794
+ },
13795
+ contextWindow: 1000000,
13796
+ maxTokens: 64000,
13797
+ },
13324
13798
  "anthropic/claude-3-haiku": {
13325
13799
  id: "anthropic/claude-3-haiku",
13326
13800
  name: "Claude 3 Haiku",
@@ -13448,7 +13922,7 @@ export const MODELS = {
13448
13922
  api: "anthropic-messages",
13449
13923
  provider: "vercel-ai-gateway",
13450
13924
  baseUrl: "https://ai-gateway.vercel.sh",
13451
- compat: { "forceAdaptiveThinking": true },
13925
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13452
13926
  reasoning: true,
13453
13927
  thinkingLevelMap: { "xhigh": "xhigh" },
13454
13928
  input: ["text", "image"],
@@ -13467,7 +13941,7 @@ export const MODELS = {
13467
13941
  api: "anthropic-messages",
13468
13942
  provider: "vercel-ai-gateway",
13469
13943
  baseUrl: "https://ai-gateway.vercel.sh",
13470
- compat: { "forceAdaptiveThinking": true },
13944
+ compat: { "forceAdaptiveThinking": true, "supportsTemperature": false },
13471
13945
  reasoning: true,
13472
13946
  thinkingLevelMap: { "xhigh": "xhigh" },
13473
13947
  input: ["text", "image"],
@@ -13626,17 +14100,17 @@ export const MODELS = {
13626
14100
  reasoning: false,
13627
14101
  input: ["text"],
13628
14102
  cost: {
13629
- input: 0.77,
13630
- output: 0.77,
13631
- cacheRead: 0,
14103
+ input: 0.27,
14104
+ output: 1.12,
14105
+ cacheRead: 0.135,
13632
14106
  cacheWrite: 0,
13633
14107
  },
13634
14108
  contextWindow: 163840,
13635
- maxTokens: 16384,
14109
+ maxTokens: 163840,
13636
14110
  },
13637
14111
  "deepseek/deepseek-v3.1": {
13638
14112
  id: "deepseek/deepseek-v3.1",
13639
- name: "DeepSeek-V3.1",
14113
+ name: "DeepSeek V3.1",
13640
14114
  api: "anthropic-messages",
13641
14115
  provider: "vercel-ai-gateway",
13642
14116
  baseUrl: "https://ai-gateway.vercel.sh",
@@ -13674,8 +14148,8 @@ export const MODELS = {
13674
14148
  api: "anthropic-messages",
13675
14149
  provider: "vercel-ai-gateway",
13676
14150
  baseUrl: "https://ai-gateway.vercel.sh",
13677
- reasoning: false,
13678
- input: ["text"],
14151
+ reasoning: true,
14152
+ input: ["text", "image"],
13679
14153
  cost: {
13680
14154
  input: 0.28,
13681
14155
  output: 0.42,
@@ -13691,8 +14165,8 @@ export const MODELS = {
13691
14165
  api: "anthropic-messages",
13692
14166
  provider: "vercel-ai-gateway",
13693
14167
  baseUrl: "https://ai-gateway.vercel.sh",
13694
- reasoning: false,
13695
- input: ["text"],
14168
+ reasoning: true,
14169
+ input: ["text", "image"],
13696
14170
  cost: {
13697
14171
  input: 0.62,
13698
14172
  output: 1.85,
@@ -13709,7 +14183,7 @@ export const MODELS = {
13709
14183
  provider: "vercel-ai-gateway",
13710
14184
  baseUrl: "https://ai-gateway.vercel.sh",
13711
14185
  reasoning: true,
13712
- input: ["text"],
14186
+ input: ["text", "image"],
13713
14187
  cost: {
13714
14188
  input: 0.14,
13715
14189
  output: 0.28,
@@ -13929,12 +14403,12 @@ export const MODELS = {
13929
14403
  api: "anthropic-messages",
13930
14404
  provider: "vercel-ai-gateway",
13931
14405
  baseUrl: "https://ai-gateway.vercel.sh",
13932
- reasoning: false,
14406
+ reasoning: true,
13933
14407
  input: ["text", "image"],
13934
14408
  cost: {
13935
- input: 0.13,
13936
- output: 0.39999999999999997,
13937
- cacheRead: 0,
14409
+ input: 0.15,
14410
+ output: 0.6,
14411
+ cacheRead: 0.015,
13938
14412
  cacheWrite: 0,
13939
14413
  },
13940
14414
  contextWindow: 262144,
@@ -14236,7 +14710,7 @@ export const MODELS = {
14236
14710
  provider: "vercel-ai-gateway",
14237
14711
  baseUrl: "https://ai-gateway.vercel.sh",
14238
14712
  reasoning: true,
14239
- input: ["text", "image"],
14713
+ input: ["text"],
14240
14714
  cost: {
14241
14715
  input: 0.3,
14242
14716
  output: 1.2,
@@ -14253,7 +14727,7 @@ export const MODELS = {
14253
14727
  provider: "vercel-ai-gateway",
14254
14728
  baseUrl: "https://ai-gateway.vercel.sh",
14255
14729
  reasoning: true,
14256
- input: ["text", "image"],
14730
+ input: ["text"],
14257
14731
  cost: {
14258
14732
  input: 0.6,
14259
14733
  output: 2.4,
@@ -14263,6 +14737,23 @@ export const MODELS = {
14263
14737
  contextWindow: 204800,
14264
14738
  maxTokens: 131100,
14265
14739
  },
14740
+ "minimax/minimax-m3": {
14741
+ id: "minimax/minimax-m3",
14742
+ name: "MiniMax M3",
14743
+ api: "anthropic-messages",
14744
+ provider: "vercel-ai-gateway",
14745
+ baseUrl: "https://ai-gateway.vercel.sh",
14746
+ reasoning: true,
14747
+ input: ["text", "image"],
14748
+ cost: {
14749
+ input: 0.3,
14750
+ output: 1.2,
14751
+ cacheRead: 0.06,
14752
+ cacheWrite: 0,
14753
+ },
14754
+ contextWindow: 1000000,
14755
+ maxTokens: 1000000,
14756
+ },
14266
14757
  "mistral/codestral": {
14267
14758
  id: "mistral/codestral",
14268
14759
  name: "Mistral Codestral",
@@ -14399,6 +14890,23 @@ export const MODELS = {
14399
14890
  contextWindow: 256000,
14400
14891
  maxTokens: 256000,
14401
14892
  },
14893
+ "mistral/mistral-nemo": {
14894
+ id: "mistral/mistral-nemo",
14895
+ name: "Mistral Nemo 12B",
14896
+ api: "anthropic-messages",
14897
+ provider: "vercel-ai-gateway",
14898
+ baseUrl: "https://ai-gateway.vercel.sh",
14899
+ reasoning: false,
14900
+ input: ["text"],
14901
+ cost: {
14902
+ input: 0.02,
14903
+ output: 0.04,
14904
+ cacheRead: 0,
14905
+ cacheWrite: 0,
14906
+ },
14907
+ contextWindow: 131072,
14908
+ maxTokens: 131072,
14909
+ },
14402
14910
  "mistral/mistral-small": {
14403
14911
  id: "mistral/mistral-small",
14404
14912
  name: "Mistral Small",
@@ -14552,6 +15060,40 @@ export const MODELS = {
14552
15060
  contextWindow: 262000,
14553
15061
  maxTokens: 262000,
14554
15062
  },
15063
+ "nvidia/nemotron-3-super-120b-a12b": {
15064
+ id: "nvidia/nemotron-3-super-120b-a12b",
15065
+ name: "NVIDIA Nemotron 3 Super 120B A12B",
15066
+ api: "anthropic-messages",
15067
+ provider: "vercel-ai-gateway",
15068
+ baseUrl: "https://ai-gateway.vercel.sh",
15069
+ reasoning: true,
15070
+ input: ["text"],
15071
+ cost: {
15072
+ input: 0.15,
15073
+ output: 0.65,
15074
+ cacheRead: 0,
15075
+ cacheWrite: 0,
15076
+ },
15077
+ contextWindow: 256000,
15078
+ maxTokens: 32000,
15079
+ },
15080
+ "nvidia/nemotron-3-ultra-550b-a55b": {
15081
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
15082
+ name: "Nemotron 3 Ultra",
15083
+ api: "anthropic-messages",
15084
+ provider: "vercel-ai-gateway",
15085
+ baseUrl: "https://ai-gateway.vercel.sh",
15086
+ reasoning: true,
15087
+ input: ["text"],
15088
+ cost: {
15089
+ input: 0.5,
15090
+ output: 2.5,
15091
+ cacheRead: 0.15,
15092
+ cacheWrite: 0,
15093
+ },
15094
+ contextWindow: 262144,
15095
+ maxTokens: 65000,
15096
+ },
14555
15097
  "nvidia/nemotron-nano-12b-v2-vl": {
14556
15098
  id: "nvidia/nemotron-nano-12b-v2-vl",
14557
15099
  name: "Nvidia Nemotron Nano 12B V2 VL",
@@ -14729,7 +15271,7 @@ export const MODELS = {
14729
15271
  provider: "vercel-ai-gateway",
14730
15272
  baseUrl: "https://ai-gateway.vercel.sh",
14731
15273
  reasoning: true,
14732
- input: ["text"],
15274
+ input: ["text", "image"],
14733
15275
  cost: {
14734
15276
  input: 1.25,
14735
15277
  output: 10,
@@ -15091,6 +15633,23 @@ export const MODELS = {
15091
15633
  contextWindow: 1000000,
15092
15634
  maxTokens: 128000,
15093
15635
  },
15636
+ "openai/gpt-oss-120b": {
15637
+ id: "openai/gpt-oss-120b",
15638
+ name: "GPT OSS 120B",
15639
+ api: "anthropic-messages",
15640
+ provider: "vercel-ai-gateway",
15641
+ baseUrl: "https://ai-gateway.vercel.sh",
15642
+ reasoning: true,
15643
+ input: ["text"],
15644
+ cost: {
15645
+ input: 0.35,
15646
+ output: 0.75,
15647
+ cacheRead: 0.25,
15648
+ cacheWrite: 0,
15649
+ },
15650
+ contextWindow: 131072,
15651
+ maxTokens: 131000,
15652
+ },
15094
15653
  "openai/gpt-oss-20b": {
15095
15654
  id: "openai/gpt-oss-20b",
15096
15655
  name: "GPT OSS 20B",
@@ -15261,6 +15820,40 @@ export const MODELS = {
15261
15820
  contextWindow: 200000,
15262
15821
  maxTokens: 8000,
15263
15822
  },
15823
+ "stepfun/step-3.5-flash": {
15824
+ id: "stepfun/step-3.5-flash",
15825
+ name: "StepFun 3.5 Flash",
15826
+ api: "anthropic-messages",
15827
+ provider: "vercel-ai-gateway",
15828
+ baseUrl: "https://ai-gateway.vercel.sh",
15829
+ reasoning: true,
15830
+ input: ["text"],
15831
+ cost: {
15832
+ input: 0.09,
15833
+ output: 0.3,
15834
+ cacheRead: 0,
15835
+ cacheWrite: 0.02,
15836
+ },
15837
+ contextWindow: 262114,
15838
+ maxTokens: 262114,
15839
+ },
15840
+ "stepfun/step-3.7-flash": {
15841
+ id: "stepfun/step-3.7-flash",
15842
+ name: "Step 3.7 Flash",
15843
+ api: "anthropic-messages",
15844
+ provider: "vercel-ai-gateway",
15845
+ baseUrl: "https://ai-gateway.vercel.sh",
15846
+ reasoning: true,
15847
+ input: ["text", "image"],
15848
+ cost: {
15849
+ input: 0.19999999999999998,
15850
+ output: 1.15,
15851
+ cacheRead: 0.04,
15852
+ cacheWrite: 0,
15853
+ },
15854
+ contextWindow: 256000,
15855
+ maxTokens: 256000,
15856
+ },
15264
15857
  "xai/grok-4.1-fast-non-reasoning": {
15265
15858
  id: "xai/grok-4.1-fast-non-reasoning",
15266
15859
  name: "Grok 4.1 Fast Non-Reasoning",
@@ -15539,7 +16132,7 @@ export const MODELS = {
15539
16132
  api: "anthropic-messages",
15540
16133
  provider: "vercel-ai-gateway",
15541
16134
  baseUrl: "https://ai-gateway.vercel.sh",
15542
- reasoning: false,
16135
+ reasoning: true,
15543
16136
  input: ["text", "image"],
15544
16137
  cost: {
15545
16138
  input: 0.6,
@@ -15693,7 +16286,7 @@ export const MODELS = {
15693
16286
  provider: "vercel-ai-gateway",
15694
16287
  baseUrl: "https://ai-gateway.vercel.sh",
15695
16288
  reasoning: true,
15696
- input: ["text"],
16289
+ input: ["text", "image"],
15697
16290
  cost: {
15698
16291
  input: 1.4,
15699
16292
  output: 4.4,
@@ -16248,5 +16841,97 @@ export const MODELS = {
16248
16841
  maxTokens: 131072,
16249
16842
  },
16250
16843
  },
16844
+ "zai-coding-cn": {
16845
+ "glm-4.5-air": {
16846
+ id: "glm-4.5-air",
16847
+ name: "GLM-4.5-Air",
16848
+ api: "openai-completions",
16849
+ provider: "zai-coding-cn",
16850
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16851
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
16852
+ reasoning: true,
16853
+ input: ["text"],
16854
+ cost: {
16855
+ input: 0,
16856
+ output: 0,
16857
+ cacheRead: 0,
16858
+ cacheWrite: 0,
16859
+ },
16860
+ contextWindow: 131072,
16861
+ maxTokens: 98304,
16862
+ },
16863
+ "glm-4.7": {
16864
+ id: "glm-4.7",
16865
+ name: "GLM-4.7",
16866
+ api: "openai-completions",
16867
+ provider: "zai-coding-cn",
16868
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16869
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16870
+ reasoning: true,
16871
+ input: ["text"],
16872
+ cost: {
16873
+ input: 0,
16874
+ output: 0,
16875
+ cacheRead: 0,
16876
+ cacheWrite: 0,
16877
+ },
16878
+ contextWindow: 204800,
16879
+ maxTokens: 131072,
16880
+ },
16881
+ "glm-5-turbo": {
16882
+ id: "glm-5-turbo",
16883
+ name: "GLM-5-Turbo",
16884
+ api: "openai-completions",
16885
+ provider: "zai-coding-cn",
16886
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16887
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16888
+ reasoning: true,
16889
+ input: ["text"],
16890
+ cost: {
16891
+ input: 0,
16892
+ output: 0,
16893
+ cacheRead: 0,
16894
+ cacheWrite: 0,
16895
+ },
16896
+ contextWindow: 200000,
16897
+ maxTokens: 131072,
16898
+ },
16899
+ "glm-5.1": {
16900
+ id: "glm-5.1",
16901
+ name: "GLM-5.1",
16902
+ api: "openai-completions",
16903
+ provider: "zai-coding-cn",
16904
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16905
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16906
+ reasoning: true,
16907
+ input: ["text"],
16908
+ cost: {
16909
+ input: 0,
16910
+ output: 0,
16911
+ cacheRead: 0,
16912
+ cacheWrite: 0,
16913
+ },
16914
+ contextWindow: 200000,
16915
+ maxTokens: 131072,
16916
+ },
16917
+ "glm-5v-turbo": {
16918
+ id: "glm-5v-turbo",
16919
+ name: "GLM-5V-Turbo",
16920
+ api: "openai-completions",
16921
+ provider: "zai-coding-cn",
16922
+ baseUrl: "https://open.bigmodel.cn/api/coding/paas/v4",
16923
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
16924
+ reasoning: true,
16925
+ input: ["text", "image"],
16926
+ cost: {
16927
+ input: 0,
16928
+ output: 0,
16929
+ cacheRead: 0,
16930
+ cacheWrite: 0,
16931
+ },
16932
+ contextWindow: 200000,
16933
+ maxTokens: 131072,
16934
+ },
16935
+ },
16251
16936
  };
16252
16937
  //# sourceMappingURL=models.generated.js.map