@hyperspaceng/neural-ai 0.63.0 → 0.64.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -815,8 +815,8 @@ export const MODELS = {
815
815
  cacheRead: 0,
816
816
  cacheWrite: 0,
817
817
  },
818
- contextWindow: 1000000,
819
- maxTokens: 131072,
818
+ contextWindow: 196608,
819
+ maxTokens: 98304,
820
820
  },
821
821
  "mistral.devstral-2-123b": {
822
822
  id: "mistral.devstral-2-123b",
@@ -1056,6 +1056,23 @@ export const MODELS = {
1056
1056
  contextWindow: 128000,
1057
1057
  maxTokens: 4096,
1058
1058
  },
1059
+ "nvidia.nemotron-super-3-120b": {
1060
+ id: "nvidia.nemotron-super-3-120b",
1061
+ name: "NVIDIA Nemotron 3 Super 120B A12B",
1062
+ api: "bedrock-converse-stream",
1063
+ provider: "amazon-bedrock",
1064
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1065
+ reasoning: true,
1066
+ input: ["text"],
1067
+ cost: {
1068
+ input: 0.15,
1069
+ output: 0.65,
1070
+ cacheRead: 0,
1071
+ cacheWrite: 0,
1072
+ },
1073
+ contextWindow: 262144,
1074
+ maxTokens: 131072,
1075
+ },
1059
1076
  "openai.gpt-oss-120b-1:0": {
1060
1077
  id: "openai.gpt-oss-120b-1:0",
1061
1078
  name: "gpt-oss-120b",
@@ -1444,8 +1461,8 @@ export const MODELS = {
1444
1461
  cacheRead: 0,
1445
1462
  cacheWrite: 0,
1446
1463
  },
1447
- contextWindow: 200000,
1448
- maxTokens: 131072,
1464
+ contextWindow: 202752,
1465
+ maxTokens: 101376,
1449
1466
  },
1450
1467
  },
1451
1468
  "anthropic": {
@@ -2284,6 +2301,23 @@ export const MODELS = {
2284
2301
  contextWindow: 400000,
2285
2302
  maxTokens: 128000,
2286
2303
  },
2304
+ "gpt-5.3-chat-latest": {
2305
+ id: "gpt-5.3-chat-latest",
2306
+ name: "GPT-5.3 Chat (latest)",
2307
+ api: "azure-openai-responses",
2308
+ provider: "azure-openai-responses",
2309
+ baseUrl: "",
2310
+ reasoning: false,
2311
+ input: ["text", "image"],
2312
+ cost: {
2313
+ input: 1.75,
2314
+ output: 14,
2315
+ cacheRead: 0.175,
2316
+ cacheWrite: 0,
2317
+ },
2318
+ contextWindow: 128000,
2319
+ maxTokens: 16384,
2320
+ },
2287
2321
  "gpt-5.3-codex": {
2288
2322
  id: "gpt-5.3-codex",
2289
2323
  name: "GPT-5.3 Codex",
@@ -3443,6 +3477,23 @@ export const MODELS = {
3443
3477
  contextWindow: 131072,
3444
3478
  maxTokens: 65536,
3445
3479
  },
3480
+ "gemma-3-27b-it": {
3481
+ id: "gemma-3-27b-it",
3482
+ name: "Gemma 3 27B",
3483
+ api: "google-generative-ai",
3484
+ provider: "google",
3485
+ baseUrl: "https://generativelanguage.googleapis.com/v1beta",
3486
+ reasoning: false,
3487
+ input: ["text", "image"],
3488
+ cost: {
3489
+ input: 0,
3490
+ output: 0,
3491
+ cacheRead: 0,
3492
+ cacheWrite: 0,
3493
+ },
3494
+ contextWindow: 131072,
3495
+ maxTokens: 8192,
3496
+ },
3446
3497
  },
3447
3498
  "google-antigravity": {
3448
3499
  "claude-opus-4-5-thinking": {
@@ -3908,6 +3959,23 @@ export const MODELS = {
3908
3959
  contextWindow: 1048576,
3909
3960
  maxTokens: 65536,
3910
3961
  },
3962
+ "gemini-3.1-pro-preview-customtools": {
3963
+ id: "gemini-3.1-pro-preview-customtools",
3964
+ name: "Gemini 3.1 Pro Preview Custom Tools (Vertex)",
3965
+ api: "google-vertex",
3966
+ provider: "google-vertex",
3967
+ baseUrl: "https://{location}-aiplatform.googleapis.com",
3968
+ reasoning: true,
3969
+ input: ["text", "image"],
3970
+ cost: {
3971
+ input: 2,
3972
+ output: 12,
3973
+ cacheRead: 0.2,
3974
+ cacheWrite: 0,
3975
+ },
3976
+ contextWindow: 1048576,
3977
+ maxTokens: 65536,
3978
+ },
3911
3979
  },
3912
3980
  "groq": {
3913
3981
  "deepseek-r1-distill-llama-70b": {
@@ -3944,6 +4012,40 @@ export const MODELS = {
3944
4012
  contextWindow: 8192,
3945
4013
  maxTokens: 8192,
3946
4014
  },
4015
+ "groq/compound": {
4016
+ id: "groq/compound",
4017
+ name: "Compound",
4018
+ api: "openai-completions",
4019
+ provider: "groq",
4020
+ baseUrl: "https://api.groq.com/openai/v1",
4021
+ reasoning: true,
4022
+ input: ["text"],
4023
+ cost: {
4024
+ input: 0,
4025
+ output: 0,
4026
+ cacheRead: 0,
4027
+ cacheWrite: 0,
4028
+ },
4029
+ contextWindow: 131072,
4030
+ maxTokens: 8192,
4031
+ },
4032
+ "groq/compound-mini": {
4033
+ id: "groq/compound-mini",
4034
+ name: "Compound Mini",
4035
+ api: "openai-completions",
4036
+ provider: "groq",
4037
+ baseUrl: "https://api.groq.com/openai/v1",
4038
+ reasoning: true,
4039
+ input: ["text"],
4040
+ cost: {
4041
+ input: 0,
4042
+ output: 0,
4043
+ cacheRead: 0,
4044
+ cacheWrite: 0,
4045
+ },
4046
+ contextWindow: 131072,
4047
+ maxTokens: 8192,
4048
+ },
3947
4049
  "llama-3.1-8b-instant": {
3948
4050
  id: "llama-3.1-8b-instant",
3949
4051
  name: "Llama 3.1 8B Instant",
@@ -4131,6 +4233,23 @@ export const MODELS = {
4131
4233
  contextWindow: 131072,
4132
4234
  maxTokens: 65536,
4133
4235
  },
4236
+ "openai/gpt-oss-safeguard-20b": {
4237
+ id: "openai/gpt-oss-safeguard-20b",
4238
+ name: "Safety GPT OSS 20B",
4239
+ api: "openai-completions",
4240
+ provider: "groq",
4241
+ baseUrl: "https://api.groq.com/openai/v1",
4242
+ reasoning: true,
4243
+ input: ["text"],
4244
+ cost: {
4245
+ input: 0.075,
4246
+ output: 0.3,
4247
+ cacheRead: 0.037,
4248
+ cacheWrite: 0,
4249
+ },
4250
+ contextWindow: 131072,
4251
+ maxTokens: 65536,
4252
+ },
4134
4253
  "qwen-qwq-32b": {
4135
4254
  id: "qwen-qwq-32b",
4136
4255
  name: "Qwen QwQ 32B",
@@ -4163,7 +4282,7 @@ export const MODELS = {
4163
4282
  cacheWrite: 0,
4164
4283
  },
4165
4284
  contextWindow: 131072,
4166
- maxTokens: 16384,
4285
+ maxTokens: 40960,
4167
4286
  },
4168
4287
  },
4169
4288
  "huggingface": {
@@ -4529,91 +4648,6 @@ export const MODELS = {
4529
4648
  },
4530
4649
  },
4531
4650
  "minimax": {
4532
- "MiniMax-M2": {
4533
- id: "MiniMax-M2",
4534
- name: "MiniMax-M2",
4535
- api: "anthropic-messages",
4536
- provider: "minimax",
4537
- baseUrl: "https://api.minimax.io/anthropic",
4538
- reasoning: true,
4539
- input: ["text"],
4540
- cost: {
4541
- input: 0.3,
4542
- output: 1.2,
4543
- cacheRead: 0,
4544
- cacheWrite: 0,
4545
- },
4546
- contextWindow: 204800,
4547
- maxTokens: 131072,
4548
- },
4549
- "MiniMax-M2.1": {
4550
- id: "MiniMax-M2.1",
4551
- name: "MiniMax-M2.1",
4552
- api: "anthropic-messages",
4553
- provider: "minimax",
4554
- baseUrl: "https://api.minimax.io/anthropic",
4555
- reasoning: true,
4556
- input: ["text"],
4557
- cost: {
4558
- input: 0.3,
4559
- output: 1.2,
4560
- cacheRead: 0,
4561
- cacheWrite: 0,
4562
- },
4563
- contextWindow: 204800,
4564
- maxTokens: 131072,
4565
- },
4566
- "MiniMax-M2.1-highspeed": {
4567
- id: "MiniMax-M2.1-highspeed",
4568
- name: "MiniMax-M2.1-highspeed",
4569
- api: "anthropic-messages",
4570
- provider: "minimax",
4571
- baseUrl: "https://api.minimax.io/anthropic",
4572
- reasoning: true,
4573
- input: ["text"],
4574
- cost: {
4575
- input: 0.6,
4576
- output: 2.4,
4577
- cacheRead: 0,
4578
- cacheWrite: 0,
4579
- },
4580
- contextWindow: 204800,
4581
- maxTokens: 131072,
4582
- },
4583
- "MiniMax-M2.5": {
4584
- id: "MiniMax-M2.5",
4585
- name: "MiniMax-M2.5",
4586
- api: "anthropic-messages",
4587
- provider: "minimax",
4588
- baseUrl: "https://api.minimax.io/anthropic",
4589
- reasoning: true,
4590
- input: ["text"],
4591
- cost: {
4592
- input: 0.3,
4593
- output: 1.2,
4594
- cacheRead: 0.03,
4595
- cacheWrite: 0.375,
4596
- },
4597
- contextWindow: 204800,
4598
- maxTokens: 131072,
4599
- },
4600
- "MiniMax-M2.5-highspeed": {
4601
- id: "MiniMax-M2.5-highspeed",
4602
- name: "MiniMax-M2.5-highspeed",
4603
- api: "anthropic-messages",
4604
- provider: "minimax",
4605
- baseUrl: "https://api.minimax.io/anthropic",
4606
- reasoning: true,
4607
- input: ["text"],
4608
- cost: {
4609
- input: 0.6,
4610
- output: 2.4,
4611
- cacheRead: 0.06,
4612
- cacheWrite: 0.375,
4613
- },
4614
- contextWindow: 204800,
4615
- maxTokens: 131072,
4616
- },
4617
4651
  "MiniMax-M2.7": {
4618
4652
  id: "MiniMax-M2.7",
4619
4653
  name: "MiniMax-M2.7",
@@ -4650,91 +4684,6 @@ export const MODELS = {
4650
4684
  },
4651
4685
  },
4652
4686
  "minimax-cn": {
4653
- "MiniMax-M2": {
4654
- id: "MiniMax-M2",
4655
- name: "MiniMax-M2",
4656
- api: "anthropic-messages",
4657
- provider: "minimax-cn",
4658
- baseUrl: "https://api.minimaxi.com/anthropic",
4659
- reasoning: true,
4660
- input: ["text"],
4661
- cost: {
4662
- input: 0.3,
4663
- output: 1.2,
4664
- cacheRead: 0,
4665
- cacheWrite: 0,
4666
- },
4667
- contextWindow: 204800,
4668
- maxTokens: 131072,
4669
- },
4670
- "MiniMax-M2.1": {
4671
- id: "MiniMax-M2.1",
4672
- name: "MiniMax-M2.1",
4673
- api: "anthropic-messages",
4674
- provider: "minimax-cn",
4675
- baseUrl: "https://api.minimaxi.com/anthropic",
4676
- reasoning: true,
4677
- input: ["text"],
4678
- cost: {
4679
- input: 0.3,
4680
- output: 1.2,
4681
- cacheRead: 0,
4682
- cacheWrite: 0,
4683
- },
4684
- contextWindow: 204800,
4685
- maxTokens: 131072,
4686
- },
4687
- "MiniMax-M2.1-highspeed": {
4688
- id: "MiniMax-M2.1-highspeed",
4689
- name: "MiniMax-M2.1-highspeed",
4690
- api: "anthropic-messages",
4691
- provider: "minimax-cn",
4692
- baseUrl: "https://api.minimaxi.com/anthropic",
4693
- reasoning: true,
4694
- input: ["text"],
4695
- cost: {
4696
- input: 0.6,
4697
- output: 2.4,
4698
- cacheRead: 0,
4699
- cacheWrite: 0,
4700
- },
4701
- contextWindow: 204800,
4702
- maxTokens: 131072,
4703
- },
4704
- "MiniMax-M2.5": {
4705
- id: "MiniMax-M2.5",
4706
- name: "MiniMax-M2.5",
4707
- api: "anthropic-messages",
4708
- provider: "minimax-cn",
4709
- baseUrl: "https://api.minimaxi.com/anthropic",
4710
- reasoning: true,
4711
- input: ["text"],
4712
- cost: {
4713
- input: 0.3,
4714
- output: 1.2,
4715
- cacheRead: 0.03,
4716
- cacheWrite: 0.375,
4717
- },
4718
- contextWindow: 204800,
4719
- maxTokens: 131072,
4720
- },
4721
- "MiniMax-M2.5-highspeed": {
4722
- id: "MiniMax-M2.5-highspeed",
4723
- name: "MiniMax-M2.5-highspeed",
4724
- api: "anthropic-messages",
4725
- provider: "minimax-cn",
4726
- baseUrl: "https://api.minimaxi.com/anthropic",
4727
- reasoning: true,
4728
- input: ["text"],
4729
- cost: {
4730
- input: 0.6,
4731
- output: 2.4,
4732
- cacheRead: 0.06,
4733
- cacheWrite: 0.375,
4734
- },
4735
- contextWindow: 204800,
4736
- maxTokens: 131072,
4737
- },
4738
4687
  "MiniMax-M2.7": {
4739
4688
  id: "MiniMax-M2.7",
4740
4689
  name: "MiniMax-M2.7",
@@ -5094,22 +5043,39 @@ export const MODELS = {
5094
5043
  contextWindow: 128000,
5095
5044
  maxTokens: 16384,
5096
5045
  },
5046
+ "mistral-small-2603": {
5047
+ id: "mistral-small-2603",
5048
+ name: "Mistral Small 4",
5049
+ api: "mistral-conversations",
5050
+ provider: "mistral",
5051
+ baseUrl: "https://api.mistral.ai",
5052
+ reasoning: true,
5053
+ input: ["text", "image"],
5054
+ cost: {
5055
+ input: 0.15,
5056
+ output: 0.6,
5057
+ cacheRead: 0,
5058
+ cacheWrite: 0,
5059
+ },
5060
+ contextWindow: 256000,
5061
+ maxTokens: 256000,
5062
+ },
5097
5063
  "mistral-small-latest": {
5098
5064
  id: "mistral-small-latest",
5099
5065
  name: "Mistral Small (latest)",
5100
5066
  api: "mistral-conversations",
5101
5067
  provider: "mistral",
5102
5068
  baseUrl: "https://api.mistral.ai",
5103
- reasoning: false,
5069
+ reasoning: true,
5104
5070
  input: ["text", "image"],
5105
5071
  cost: {
5106
- input: 0.1,
5107
- output: 0.3,
5072
+ input: 0.15,
5073
+ output: 0.6,
5108
5074
  cacheRead: 0,
5109
5075
  cacheWrite: 0,
5110
5076
  },
5111
- contextWindow: 128000,
5112
- maxTokens: 16384,
5077
+ contextWindow: 256000,
5078
+ maxTokens: 256000,
5113
5079
  },
5114
5080
  "open-mistral-7b": {
5115
5081
  id: "open-mistral-7b",
@@ -5640,6 +5606,23 @@ export const MODELS = {
5640
5606
  contextWindow: 400000,
5641
5607
  maxTokens: 128000,
5642
5608
  },
5609
+ "gpt-5.3-chat-latest": {
5610
+ id: "gpt-5.3-chat-latest",
5611
+ name: "GPT-5.3 Chat (latest)",
5612
+ api: "openai-responses",
5613
+ provider: "openai",
5614
+ baseUrl: "https://api.openai.com/v1",
5615
+ reasoning: false,
5616
+ input: ["text", "image"],
5617
+ cost: {
5618
+ input: 1.75,
5619
+ output: 14,
5620
+ cacheRead: 0.175,
5621
+ cacheWrite: 0,
5622
+ },
5623
+ contextWindow: 128000,
5624
+ maxTokens: 16384,
5625
+ },
5643
5626
  "gpt-5.3-codex": {
5644
5627
  id: "gpt-5.3-codex",
5645
5628
  name: "GPT-5.3 Codex",
@@ -6559,12 +6542,29 @@ export const MODELS = {
6559
6542
  cacheRead: 0,
6560
6543
  cacheWrite: 0,
6561
6544
  },
6562
- contextWindow: 204800,
6563
- maxTokens: 131072,
6545
+ contextWindow: 204800,
6546
+ maxTokens: 131072,
6547
+ },
6548
+ "nemotron-3-super-free": {
6549
+ id: "nemotron-3-super-free",
6550
+ name: "Nemotron 3 Super Free",
6551
+ api: "openai-completions",
6552
+ provider: "opencode",
6553
+ baseUrl: "https://opencode.ai/zen/v1",
6554
+ reasoning: true,
6555
+ input: ["text"],
6556
+ cost: {
6557
+ input: 0,
6558
+ output: 0,
6559
+ cacheRead: 0,
6560
+ cacheWrite: 0,
6561
+ },
6562
+ contextWindow: 1000000,
6563
+ maxTokens: 128000,
6564
6564
  },
6565
- "nemotron-3-super-free": {
6566
- id: "nemotron-3-super-free",
6567
- name: "Nemotron 3 Super Free",
6565
+ "qwen3.6-plus-free": {
6566
+ id: "qwen3.6-plus-free",
6567
+ name: "Qwen3.6 Plus Free",
6568
6568
  api: "openai-completions",
6569
6569
  provider: "opencode",
6570
6570
  baseUrl: "https://opencode.ai/zen/v1",
@@ -6576,8 +6576,8 @@ export const MODELS = {
6576
6576
  cacheRead: 0,
6577
6577
  cacheWrite: 0,
6578
6578
  },
6579
- contextWindow: 1000000,
6580
- maxTokens: 128000,
6579
+ contextWindow: 1048576,
6580
+ maxTokens: 64000,
6581
6581
  },
6582
6582
  },
6583
6583
  "opencode-go": {
@@ -7535,23 +7535,6 @@ export const MODELS = {
7535
7535
  contextWindow: 1048576,
7536
7536
  maxTokens: 65536,
7537
7537
  },
7538
- "google/gemini-3-pro-preview": {
7539
- id: "google/gemini-3-pro-preview",
7540
- name: "Google: Gemini 3 Pro Preview",
7541
- api: "openai-completions",
7542
- provider: "openrouter",
7543
- baseUrl: "https://openrouter.ai/api/v1",
7544
- reasoning: true,
7545
- input: ["text", "image"],
7546
- cost: {
7547
- input: 2,
7548
- output: 12,
7549
- cacheRead: 0.19999999999999998,
7550
- cacheWrite: 0.375,
7551
- },
7552
- contextWindow: 1048576,
7553
- maxTokens: 65536,
7554
- },
7555
7538
  "google/gemini-3.1-flash-lite-preview": {
7556
7539
  id: "google/gemini-3.1-flash-lite-preview",
7557
7540
  name: "Google: Gemini 3.1 Flash Lite Preview",
@@ -7654,22 +7637,22 @@ export const MODELS = {
7654
7637
  contextWindow: 128000,
7655
7638
  maxTokens: 32000,
7656
7639
  },
7657
- "kwaipilot/kat-coder-pro": {
7658
- id: "kwaipilot/kat-coder-pro",
7659
- name: "Kwaipilot: KAT-Coder-Pro V1",
7640
+ "kwaipilot/kat-coder-pro-v2": {
7641
+ id: "kwaipilot/kat-coder-pro-v2",
7642
+ name: "Kwaipilot: KAT-Coder-Pro V2",
7660
7643
  api: "openai-completions",
7661
7644
  provider: "openrouter",
7662
7645
  baseUrl: "https://openrouter.ai/api/v1",
7663
7646
  reasoning: false,
7664
7647
  input: ["text"],
7665
7648
  cost: {
7666
- input: 0.207,
7667
- output: 0.828,
7668
- cacheRead: 0.0414,
7649
+ input: 0.3,
7650
+ output: 1.2,
7651
+ cacheRead: 0.06,
7669
7652
  cacheWrite: 0,
7670
7653
  },
7671
7654
  contextWindow: 256000,
7672
- maxTokens: 128000,
7655
+ maxTokens: 80000,
7673
7656
  },
7674
7657
  "meituan/longcat-flash-chat": {
7675
7658
  id: "meituan/longcat-flash-chat",
@@ -7867,9 +7850,9 @@ export const MODELS = {
7867
7850
  reasoning: true,
7868
7851
  input: ["text"],
7869
7852
  cost: {
7870
- input: 0.19999999999999998,
7871
- output: 1.17,
7872
- cacheRead: 0.09999999999999999,
7853
+ input: 0.19,
7854
+ output: 1.15,
7855
+ cacheRead: 0.095,
7873
7856
  cacheWrite: 0,
7874
7857
  },
7875
7858
  contextWindow: 196608,
@@ -8198,23 +8181,6 @@ export const MODELS = {
8198
8181
  contextWindow: 262144,
8199
8182
  maxTokens: 4096,
8200
8183
  },
8201
- "mistralai/mistral-small-3.1-24b-instruct:free": {
8202
- id: "mistralai/mistral-small-3.1-24b-instruct:free",
8203
- name: "Mistral: Mistral Small 3.1 24B (free)",
8204
- api: "openai-completions",
8205
- provider: "openrouter",
8206
- baseUrl: "https://openrouter.ai/api/v1",
8207
- reasoning: false,
8208
- input: ["text", "image"],
8209
- cost: {
8210
- input: 0,
8211
- output: 0,
8212
- cacheRead: 0,
8213
- cacheWrite: 0,
8214
- },
8215
- contextWindow: 128000,
8216
- maxTokens: 4096,
8217
- },
8218
8184
  "mistralai/mistral-small-3.2-24b-instruct": {
8219
8185
  id: "mistralai/mistral-small-3.2-24b-instruct",
8220
8186
  name: "Mistral: Mistral Small 3.2 24B",
@@ -8326,13 +8292,13 @@ export const MODELS = {
8326
8292
  reasoning: false,
8327
8293
  input: ["text"],
8328
8294
  cost: {
8329
- input: 0.55,
8330
- output: 2.2,
8295
+ input: 0.5700000000000001,
8296
+ output: 2.3,
8331
8297
  cacheRead: 0,
8332
8298
  cacheWrite: 0,
8333
8299
  },
8334
- contextWindow: 131000,
8335
- maxTokens: 4096,
8300
+ contextWindow: 131072,
8301
+ maxTokens: 131072,
8336
8302
  },
8337
8303
  "moonshotai/kimi-k2-0905": {
8338
8304
  id: "moonshotai/kimi-k2-0905",
@@ -8394,8 +8360,8 @@ export const MODELS = {
8394
8360
  reasoning: false,
8395
8361
  input: ["text"],
8396
8362
  cost: {
8397
- input: 0.27,
8398
- output: 1,
8363
+ input: 0.135,
8364
+ output: 0.5,
8399
8365
  cacheRead: 0,
8400
8366
  cacheWrite: 0,
8401
8367
  },
@@ -8481,7 +8447,7 @@ export const MODELS = {
8481
8447
  cost: {
8482
8448
  input: 0.09999999999999999,
8483
8449
  output: 0.5,
8484
- cacheRead: 0.04,
8450
+ cacheRead: 0.09999999999999999,
8485
8451
  cacheWrite: 0,
8486
8452
  },
8487
8453
  contextWindow: 262144,
@@ -9573,7 +9539,7 @@ export const MODELS = {
9573
9539
  cacheWrite: 0,
9574
9540
  },
9575
9541
  contextWindow: 32768,
9576
- maxTokens: 4096,
9542
+ maxTokens: 32768,
9577
9543
  },
9578
9544
  "qwen/qwen-max": {
9579
9545
  id: "qwen/qwen-max",
@@ -9813,23 +9779,6 @@ export const MODELS = {
9813
9779
  contextWindow: 40960,
9814
9780
  maxTokens: 40960,
9815
9781
  },
9816
- "qwen/qwen3-4b:free": {
9817
- id: "qwen/qwen3-4b:free",
9818
- name: "Qwen: Qwen3 4B (free)",
9819
- api: "openai-completions",
9820
- provider: "openrouter",
9821
- baseUrl: "https://openrouter.ai/api/v1",
9822
- reasoning: true,
9823
- input: ["text"],
9824
- cost: {
9825
- input: 0,
9826
- output: 0,
9827
- cacheRead: 0,
9828
- cacheWrite: 0,
9829
- },
9830
- contextWindow: 40960,
9831
- maxTokens: 4096,
9832
- },
9833
9782
  "qwen/qwen3-8b": {
9834
9783
  id: "qwen/qwen3-8b",
9835
9784
  name: "Qwen: Qwen3 8B",
@@ -10236,7 +10185,7 @@ export const MODELS = {
10236
10185
  cacheWrite: 0,
10237
10186
  },
10238
10187
  contextWindow: 256000,
10239
- maxTokens: 4096,
10188
+ maxTokens: 65536,
10240
10189
  },
10241
10190
  "qwen/qwen3.5-flash-02-23": {
10242
10191
  id: "qwen/qwen3.5-flash-02-23",
@@ -10272,6 +10221,23 @@ export const MODELS = {
10272
10221
  contextWindow: 1000000,
10273
10222
  maxTokens: 65536,
10274
10223
  },
10224
+ "qwen/qwen3.6-plus-preview:free": {
10225
+ id: "qwen/qwen3.6-plus-preview:free",
10226
+ name: "Qwen: Qwen3.6 Plus Preview (free)",
10227
+ api: "openai-completions",
10228
+ provider: "openrouter",
10229
+ baseUrl: "https://openrouter.ai/api/v1",
10230
+ reasoning: true,
10231
+ input: ["text"],
10232
+ cost: {
10233
+ input: 0,
10234
+ output: 0,
10235
+ cacheRead: 0,
10236
+ cacheWrite: 0,
10237
+ },
10238
+ contextWindow: 1000000,
10239
+ maxTokens: 65536,
10240
+ },
10275
10241
  "qwen/qwq-32b": {
10276
10242
  id: "qwen/qwq-32b",
10277
10243
  name: "Qwen: QwQ 32B",
@@ -10289,6 +10255,23 @@ export const MODELS = {
10289
10255
  contextWindow: 131072,
10290
10256
  maxTokens: 131072,
10291
10257
  },
10258
+ "reka/reka-edge": {
10259
+ id: "reka/reka-edge",
10260
+ name: "Reka Edge",
10261
+ api: "openai-completions",
10262
+ provider: "openrouter",
10263
+ baseUrl: "https://openrouter.ai/api/v1",
10264
+ reasoning: false,
10265
+ input: ["text", "image"],
10266
+ cost: {
10267
+ input: 0.09999999999999999,
10268
+ output: 0.09999999999999999,
10269
+ cacheRead: 0,
10270
+ cacheWrite: 0,
10271
+ },
10272
+ contextWindow: 16384,
10273
+ maxTokens: 16384,
10274
+ },
10292
10275
  "relace/relace-search": {
10293
10276
  id: "relace/relace-search",
10294
10277
  name: "Relace: Relace Search",
@@ -10351,11 +10334,11 @@ export const MODELS = {
10351
10334
  cost: {
10352
10335
  input: 0.09999999999999999,
10353
10336
  output: 0.3,
10354
- cacheRead: 0.02,
10337
+ cacheRead: 0,
10355
10338
  cacheWrite: 0,
10356
10339
  },
10357
- contextWindow: 256000,
10358
- maxTokens: 256000,
10340
+ contextWindow: 262144,
10341
+ maxTokens: 65536,
10359
10342
  },
10360
10343
  "stepfun/step-3.5-flash:free": {
10361
10344
  id: "stepfun/step-3.5-flash:free",
@@ -10861,12 +10844,12 @@ export const MODELS = {
10861
10844
  reasoning: false,
10862
10845
  input: ["text"],
10863
10846
  cost: {
10864
- input: 0.071,
10865
- output: 0.463,
10866
- cacheRead: 0,
10847
+ input: 0.22,
10848
+ output: 0.88,
10849
+ cacheRead: 0.11,
10867
10850
  cacheWrite: 0,
10868
10851
  },
10869
- contextWindow: 40960,
10852
+ contextWindow: 32768,
10870
10853
  maxTokens: 16384,
10871
10854
  },
10872
10855
  "alibaba/qwen-3-30b": {
@@ -10895,13 +10878,13 @@ export const MODELS = {
10895
10878
  reasoning: true,
10896
10879
  input: ["text"],
10897
10880
  cost: {
10898
- input: 0.29,
10899
- output: 0.59,
10900
- cacheRead: 0.145,
10881
+ input: 0.16,
10882
+ output: 0.64,
10883
+ cacheRead: 0,
10901
10884
  cacheWrite: 0,
10902
10885
  },
10903
- contextWindow: 131072,
10904
- maxTokens: 40960,
10886
+ contextWindow: 128000,
10887
+ maxTokens: 8192,
10905
10888
  },
10906
10889
  "alibaba/qwen3-235b-a22b-thinking": {
10907
10890
  id: "alibaba/qwen3-235b-a22b-thinking",
@@ -10929,13 +10912,13 @@ export const MODELS = {
10929
10912
  reasoning: false,
10930
10913
  input: ["text"],
10931
10914
  cost: {
10932
- input: 0.39999999999999997,
10933
- output: 1.5999999999999999,
10934
- cacheRead: 0.022,
10915
+ input: 1.5,
10916
+ output: 7.5,
10917
+ cacheRead: 0.3,
10935
10918
  cacheWrite: 0,
10936
10919
  },
10937
10920
  contextWindow: 262144,
10938
- maxTokens: 66536,
10921
+ maxTokens: 65536,
10939
10922
  },
10940
10923
  "alibaba/qwen3-coder-30b-a3b": {
10941
10924
  id: "alibaba/qwen3-coder-30b-a3b",
@@ -11405,13 +11388,13 @@ export const MODELS = {
11405
11388
  reasoning: true,
11406
11389
  input: ["text"],
11407
11390
  cost: {
11408
- input: 0.5,
11409
- output: 1.5,
11410
- cacheRead: 0,
11391
+ input: 0.56,
11392
+ output: 1.68,
11393
+ cacheRead: 0.28,
11411
11394
  cacheWrite: 0,
11412
11395
  },
11413
11396
  contextWindow: 163840,
11414
- maxTokens: 16384,
11397
+ maxTokens: 8192,
11415
11398
  },
11416
11399
  "deepseek/deepseek-v3.1-terminus": {
11417
11400
  id: "deepseek/deepseek-v3.1-terminus",
@@ -11651,6 +11634,23 @@ export const MODELS = {
11651
11634
  contextWindow: 32000,
11652
11635
  maxTokens: 16384,
11653
11636
  },
11637
+ "kwaipilot/kat-coder-pro-v2": {
11638
+ id: "kwaipilot/kat-coder-pro-v2",
11639
+ name: "Kat Coder Pro V2",
11640
+ api: "anthropic-messages",
11641
+ provider: "vercel-ai-gateway",
11642
+ baseUrl: "https://ai-gateway.vercel.sh",
11643
+ reasoning: true,
11644
+ input: ["text"],
11645
+ cost: {
11646
+ input: 0.3,
11647
+ output: 1.2,
11648
+ cacheRead: 0.06,
11649
+ cacheWrite: 0,
11650
+ },
11651
+ contextWindow: 256000,
11652
+ maxTokens: 256000,
11653
+ },
11654
11654
  "meituan/longcat-flash-chat": {
11655
11655
  id: "meituan/longcat-flash-chat",
11656
11656
  name: "LongCat Flash Chat",
@@ -11666,7 +11666,7 @@ export const MODELS = {
11666
11666
  cacheWrite: 0,
11667
11667
  },
11668
11668
  contextWindow: 128000,
11669
- maxTokens: 100000,
11669
+ maxTokens: 8192,
11670
11670
  },
11671
11671
  "meituan/longcat-flash-thinking": {
11672
11672
  id: "meituan/longcat-flash-thinking",
@@ -11711,13 +11711,13 @@ export const MODELS = {
11711
11711
  reasoning: false,
11712
11712
  input: ["text"],
11713
11713
  cost: {
11714
- input: 0.09999999999999999,
11715
- output: 0.09999999999999999,
11716
- cacheRead: 0.09999999999999999,
11714
+ input: 0.22,
11715
+ output: 0.22,
11716
+ cacheRead: 0,
11717
11717
  cacheWrite: 0,
11718
11718
  },
11719
11719
  contextWindow: 128000,
11720
- maxTokens: 16384,
11720
+ maxTokens: 8192,
11721
11721
  },
11722
11722
  "meta/llama-3.2-11b": {
11723
11723
  id: "meta/llama-3.2-11b",
@@ -11779,12 +11779,12 @@ export const MODELS = {
11779
11779
  reasoning: false,
11780
11780
  input: ["text", "image"],
11781
11781
  cost: {
11782
- input: 0.24,
11783
- output: 0.9700000000000001,
11782
+ input: 0.35,
11783
+ output: 1.15,
11784
11784
  cacheRead: 0,
11785
11785
  cacheWrite: 0,
11786
11786
  },
11787
- contextWindow: 128000,
11787
+ contextWindow: 524288,
11788
11788
  maxTokens: 8192,
11789
11789
  },
11790
11790
  "meta/llama-4-scout": {
@@ -12688,6 +12688,23 @@ export const MODELS = {
12688
12688
  contextWindow: 1050000,
12689
12689
  maxTokens: 128000,
12690
12690
  },
12691
+ "openai/gpt-oss-120b": {
12692
+ id: "openai/gpt-oss-120b",
12693
+ name: "gpt-oss-120b",
12694
+ api: "anthropic-messages",
12695
+ provider: "vercel-ai-gateway",
12696
+ baseUrl: "https://ai-gateway.vercel.sh",
12697
+ reasoning: true,
12698
+ input: ["text"],
12699
+ cost: {
12700
+ input: 0.15,
12701
+ output: 0.6,
12702
+ cacheRead: 0,
12703
+ cacheWrite: 0,
12704
+ },
12705
+ contextWindow: 128000,
12706
+ maxTokens: 8192,
12707
+ },
12691
12708
  "openai/gpt-oss-20b": {
12692
12709
  id: "openai/gpt-oss-20b",
12693
12710
  name: "gpt-oss-20b",
@@ -12833,8 +12850,8 @@ export const MODELS = {
12833
12850
  reasoning: false,
12834
12851
  input: ["text", "image"],
12835
12852
  cost: {
12836
- input: 1,
12837
- output: 1,
12853
+ input: 0,
12854
+ output: 0,
12838
12855
  cacheRead: 0,
12839
12856
  cacheWrite: 0,
12840
12857
  },
@@ -12850,8 +12867,8 @@ export const MODELS = {
12850
12867
  reasoning: false,
12851
12868
  input: ["text", "image"],
12852
12869
  cost: {
12853
- input: 3,
12854
- output: 15,
12870
+ input: 0,
12871
+ output: 0,
12855
12872
  cacheRead: 0,
12856
12873
  cacheWrite: 0,
12857
12874
  },
@@ -13045,6 +13062,23 @@ export const MODELS = {
13045
13062
  contextWindow: 2000000,
13046
13063
  maxTokens: 30000,
13047
13064
  },
13065
+ "xai/grok-4.20-multi-agent": {
13066
+ id: "xai/grok-4.20-multi-agent",
13067
+ name: "Grok 4.20 Multi-Agent",
13068
+ api: "anthropic-messages",
13069
+ provider: "vercel-ai-gateway",
13070
+ baseUrl: "https://ai-gateway.vercel.sh",
13071
+ reasoning: true,
13072
+ input: ["text"],
13073
+ cost: {
13074
+ input: 2,
13075
+ output: 6,
13076
+ cacheRead: 0.19999999999999998,
13077
+ cacheWrite: 0,
13078
+ },
13079
+ contextWindow: 2000000,
13080
+ maxTokens: 2000000,
13081
+ },
13048
13082
  "xai/grok-4.20-multi-agent-beta": {
13049
13083
  id: "xai/grok-4.20-multi-agent-beta",
13050
13084
  name: "Grok 4.20 Multi Agent Beta",
@@ -13062,6 +13096,23 @@ export const MODELS = {
13062
13096
  contextWindow: 2000000,
13063
13097
  maxTokens: 2000000,
13064
13098
  },
13099
+ "xai/grok-4.20-non-reasoning": {
13100
+ id: "xai/grok-4.20-non-reasoning",
13101
+ name: "Grok 4.20 Non-Reasoning",
13102
+ api: "anthropic-messages",
13103
+ provider: "vercel-ai-gateway",
13104
+ baseUrl: "https://ai-gateway.vercel.sh",
13105
+ reasoning: false,
13106
+ input: ["text", "image"],
13107
+ cost: {
13108
+ input: 2,
13109
+ output: 6,
13110
+ cacheRead: 0.19999999999999998,
13111
+ cacheWrite: 0,
13112
+ },
13113
+ contextWindow: 2000000,
13114
+ maxTokens: 2000000,
13115
+ },
13065
13116
  "xai/grok-4.20-non-reasoning-beta": {
13066
13117
  id: "xai/grok-4.20-non-reasoning-beta",
13067
13118
  name: "Grok 4.20 Beta Non-Reasoning",
@@ -13079,6 +13130,23 @@ export const MODELS = {
13079
13130
  contextWindow: 2000000,
13080
13131
  maxTokens: 2000000,
13081
13132
  },
13133
+ "xai/grok-4.20-reasoning": {
13134
+ id: "xai/grok-4.20-reasoning",
13135
+ name: "Grok 4.20 Reasoning",
13136
+ api: "anthropic-messages",
13137
+ provider: "vercel-ai-gateway",
13138
+ baseUrl: "https://ai-gateway.vercel.sh",
13139
+ reasoning: true,
13140
+ input: ["text", "image"],
13141
+ cost: {
13142
+ input: 2,
13143
+ output: 6,
13144
+ cacheRead: 0.19999999999999998,
13145
+ cacheWrite: 0,
13146
+ },
13147
+ contextWindow: 2000000,
13148
+ maxTokens: 2000000,
13149
+ },
13082
13150
  "xai/grok-4.20-reasoning-beta": {
13083
13151
  id: "xai/grok-4.20-reasoning-beta",
13084
13152
  name: "Grok 4.20 Beta Reasoning",
@@ -13122,9 +13190,9 @@ export const MODELS = {
13122
13190
  reasoning: true,
13123
13191
  input: ["text"],
13124
13192
  cost: {
13125
- input: 0.09999999999999999,
13126
- output: 0.3,
13127
- cacheRead: 0.02,
13193
+ input: 0.09,
13194
+ output: 0.29,
13195
+ cacheRead: 0.045,
13128
13196
  cacheWrite: 0,
13129
13197
  },
13130
13198
  contextWindow: 262144,
@@ -13260,7 +13328,7 @@ export const MODELS = {
13260
13328
  cost: {
13261
13329
  input: 0.6,
13262
13330
  output: 2.2,
13263
- cacheRead: 0,
13331
+ cacheRead: 0.11,
13264
13332
  cacheWrite: 0,
13265
13333
  },
13266
13334
  contextWindow: 200000,
@@ -13890,6 +13958,24 @@ export const MODELS = {
13890
13958
  contextWindow: 200000,
13891
13959
  maxTokens: 131072,
13892
13960
  },
13961
+ "glm-4.7-flashx": {
13962
+ id: "glm-4.7-flashx",
13963
+ name: "GLM-4.7-FlashX",
13964
+ api: "openai-completions",
13965
+ provider: "zai",
13966
+ baseUrl: "https://api.z.ai/api/coding/paas/v4",
13967
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
13968
+ reasoning: true,
13969
+ input: ["text"],
13970
+ cost: {
13971
+ input: 0.07,
13972
+ output: 0.4,
13973
+ cacheRead: 0.01,
13974
+ cacheWrite: 0,
13975
+ },
13976
+ contextWindow: 200000,
13977
+ maxTokens: 131072,
13978
+ },
13893
13979
  "glm-5": {
13894
13980
  id: "glm-5",
13895
13981
  name: "GLM-5",