@avadisabelle/ava-pi-ai 0.65.0 → 0.65.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -325,6 +325,40 @@ export const MODELS = {
325
325
  contextWindow: 1000000,
326
326
  maxTokens: 64000,
327
327
  },
328
+ "au.anthropic.claude-opus-4-6-v1": {
329
+ id: "au.anthropic.claude-opus-4-6-v1",
330
+ name: "AU Anthropic Claude Opus 4.6",
331
+ api: "bedrock-converse-stream",
332
+ provider: "amazon-bedrock",
333
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
334
+ reasoning: true,
335
+ input: ["text", "image"],
336
+ cost: {
337
+ input: 16.5,
338
+ output: 82.5,
339
+ cacheRead: 0.5,
340
+ cacheWrite: 6.25,
341
+ },
342
+ contextWindow: 1000000,
343
+ maxTokens: 128000,
344
+ },
345
+ "au.anthropic.claude-sonnet-4-6": {
346
+ id: "au.anthropic.claude-sonnet-4-6",
347
+ name: "AU Anthropic Claude Sonnet 4.6",
348
+ api: "bedrock-converse-stream",
349
+ provider: "amazon-bedrock",
350
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
351
+ reasoning: true,
352
+ input: ["text", "image"],
353
+ cost: {
354
+ input: 3.3,
355
+ output: 16.5,
356
+ cacheRead: 0.33,
357
+ cacheWrite: 4.125,
358
+ },
359
+ contextWindow: 1000000,
360
+ maxTokens: 128000,
361
+ },
328
362
  "deepseek.r1-v1:0": {
329
363
  id: "deepseek.r1-v1:0",
330
364
  name: "DeepSeek-R1",
@@ -2488,6 +2522,40 @@ export const MODELS = {
2488
2522
  contextWindow: 1050000,
2489
2523
  maxTokens: 128000,
2490
2524
  },
2525
+ "gpt-5.5": {
2526
+ id: "gpt-5.5",
2527
+ name: "GPT-5.5",
2528
+ api: "azure-openai-responses",
2529
+ provider: "azure-openai-responses",
2530
+ baseUrl: "",
2531
+ reasoning: true,
2532
+ input: ["text", "image"],
2533
+ cost: {
2534
+ input: 5,
2535
+ output: 30,
2536
+ cacheRead: 0.5,
2537
+ cacheWrite: 0,
2538
+ },
2539
+ contextWindow: 1050000,
2540
+ maxTokens: 128000,
2541
+ },
2542
+ "gpt-5.5-pro": {
2543
+ id: "gpt-5.5-pro",
2544
+ name: "GPT-5.5 Pro",
2545
+ api: "azure-openai-responses",
2546
+ provider: "azure-openai-responses",
2547
+ baseUrl: "",
2548
+ reasoning: true,
2549
+ input: ["text", "image"],
2550
+ cost: {
2551
+ input: 30,
2552
+ output: 180,
2553
+ cacheRead: 0,
2554
+ cacheWrite: 0,
2555
+ },
2556
+ contextWindow: 1050000,
2557
+ maxTokens: 128000,
2558
+ },
2491
2559
  "o1": {
2492
2560
  id: "o1",
2493
2561
  name: "o1",
@@ -3134,6 +3202,24 @@ export const MODELS = {
3134
3202
  contextWindow: 400000,
3135
3203
  maxTokens: 128000,
3136
3204
  },
3205
+ "gpt-5.5": {
3206
+ id: "gpt-5.5",
3207
+ name: "GPT-5.5",
3208
+ api: "openai-responses",
3209
+ provider: "github-copilot",
3210
+ baseUrl: "https://api.individual.githubcopilot.com",
3211
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3212
+ reasoning: true,
3213
+ input: ["text", "image"],
3214
+ cost: {
3215
+ input: 0,
3216
+ output: 0,
3217
+ cacheRead: 0,
3218
+ cacheWrite: 0,
3219
+ },
3220
+ contextWindow: 400000,
3221
+ maxTokens: 128000,
3222
+ },
3137
3223
  "grok-code-fast-1": {
3138
3224
  id: "grok-code-fast-1",
3139
3225
  name: "Grok Code Fast 1",
@@ -3251,7 +3337,7 @@ export const MODELS = {
3251
3337
  cost: {
3252
3338
  input: 0.3,
3253
3339
  output: 2.5,
3254
- cacheRead: 0.075,
3340
+ cacheRead: 0.03,
3255
3341
  cacheWrite: 0,
3256
3342
  },
3257
3343
  contextWindow: 1048576,
@@ -3370,7 +3456,7 @@ export const MODELS = {
3370
3456
  cost: {
3371
3457
  input: 1.25,
3372
3458
  output: 10,
3373
- cacheRead: 0.31,
3459
+ cacheRead: 0.125,
3374
3460
  cacheWrite: 0,
3375
3461
  },
3376
3462
  contextWindow: 1048576,
@@ -3580,8 +3666,8 @@ export const MODELS = {
3580
3666
  contextWindow: 131072,
3581
3667
  maxTokens: 8192,
3582
3668
  },
3583
- "gemma-4-26b-it": {
3584
- id: "gemma-4-26b-it",
3669
+ "gemma-4-26b-a4b-it": {
3670
+ id: "gemma-4-26b-a4b-it",
3585
3671
  name: "Gemma 4 26B",
3586
3672
  api: "google-generative-ai",
3587
3673
  provider: "google",
@@ -4622,6 +4708,24 @@ export const MODELS = {
4622
4708
  contextWindow: 163840,
4623
4709
  maxTokens: 65536,
4624
4710
  },
4711
+ "deepseek-ai/DeepSeek-V4-Pro": {
4712
+ id: "deepseek-ai/DeepSeek-V4-Pro",
4713
+ name: "DeepSeek V4 Pro",
4714
+ api: "openai-completions",
4715
+ provider: "huggingface",
4716
+ baseUrl: "https://router.huggingface.co/v1",
4717
+ compat: { "supportsDeveloperRole": false },
4718
+ reasoning: true,
4719
+ input: ["text"],
4720
+ cost: {
4721
+ input: 1.74,
4722
+ output: 3.48,
4723
+ cacheRead: 0.145,
4724
+ cacheWrite: 0,
4725
+ },
4726
+ contextWindow: 1048576,
4727
+ maxTokens: 393216,
4728
+ },
4625
4729
  "moonshotai/Kimi-K2-Instruct": {
4626
4730
  id: "moonshotai/Kimi-K2-Instruct",
4627
4731
  name: "Kimi-K2-Instruct",
@@ -4694,6 +4798,24 @@ export const MODELS = {
4694
4798
  contextWindow: 262144,
4695
4799
  maxTokens: 262144,
4696
4800
  },
4801
+ "moonshotai/Kimi-K2.6": {
4802
+ id: "moonshotai/Kimi-K2.6",
4803
+ name: "Kimi-K2.6",
4804
+ api: "openai-completions",
4805
+ provider: "huggingface",
4806
+ baseUrl: "https://router.huggingface.co/v1",
4807
+ compat: { "supportsDeveloperRole": false },
4808
+ reasoning: true,
4809
+ input: ["text", "image"],
4810
+ cost: {
4811
+ input: 0.95,
4812
+ output: 4,
4813
+ cacheRead: 0.16,
4814
+ cacheWrite: 0,
4815
+ },
4816
+ contextWindow: 262144,
4817
+ maxTokens: 262144,
4818
+ },
4697
4819
  "zai-org/GLM-4.7": {
4698
4820
  id: "zai-org/GLM-4.7",
4699
4821
  name: "GLM-4.7",
@@ -4768,6 +4890,23 @@ export const MODELS = {
4768
4890
  },
4769
4891
  },
4770
4892
  "kimi-coding": {
4893
+ "k2p6": {
4894
+ id: "k2p6",
4895
+ name: "Kimi K2.6",
4896
+ api: "anthropic-messages",
4897
+ provider: "kimi-coding",
4898
+ baseUrl: "https://api.kimi.com/coding",
4899
+ reasoning: true,
4900
+ input: ["text", "image"],
4901
+ cost: {
4902
+ input: 0,
4903
+ output: 0,
4904
+ cacheRead: 0,
4905
+ cacheWrite: 0,
4906
+ },
4907
+ contextWindow: 262144,
4908
+ maxTokens: 32768,
4909
+ },
4771
4910
  "kimi-for-coding": {
4772
4911
  id: "kimi-for-coding",
4773
4912
  name: "Kimi For Coding",
@@ -5148,22 +5287,39 @@ export const MODELS = {
5148
5287
  contextWindow: 262144,
5149
5288
  maxTokens: 262144,
5150
5289
  },
5290
+ "mistral-medium-2604": {
5291
+ id: "mistral-medium-2604",
5292
+ name: "Mistral Medium 3.5",
5293
+ api: "mistral-conversations",
5294
+ provider: "mistral",
5295
+ baseUrl: "https://api.mistral.ai",
5296
+ reasoning: true,
5297
+ input: ["text", "image"],
5298
+ cost: {
5299
+ input: 1.5,
5300
+ output: 7.5,
5301
+ cacheRead: 0,
5302
+ cacheWrite: 0,
5303
+ },
5304
+ contextWindow: 262144,
5305
+ maxTokens: 262144,
5306
+ },
5151
5307
  "mistral-medium-latest": {
5152
5308
  id: "mistral-medium-latest",
5153
5309
  name: "Mistral Medium (latest)",
5154
5310
  api: "mistral-conversations",
5155
5311
  provider: "mistral",
5156
5312
  baseUrl: "https://api.mistral.ai",
5157
- reasoning: false,
5313
+ reasoning: true,
5158
5314
  input: ["text", "image"],
5159
5315
  cost: {
5160
- input: 0.4,
5161
- output: 2,
5316
+ input: 1.5,
5317
+ output: 7.5,
5162
5318
  cacheRead: 0,
5163
5319
  cacheWrite: 0,
5164
5320
  },
5165
- contextWindow: 128000,
5166
- maxTokens: 16384,
5321
+ contextWindow: 262144,
5322
+ maxTokens: 262144,
5167
5323
  },
5168
5324
  "mistral-nemo": {
5169
5325
  id: "mistral-nemo",
@@ -5864,6 +6020,40 @@ export const MODELS = {
5864
6020
  contextWindow: 1050000,
5865
6021
  maxTokens: 128000,
5866
6022
  },
6023
+ "gpt-5.5": {
6024
+ id: "gpt-5.5",
6025
+ name: "GPT-5.5",
6026
+ api: "openai-responses",
6027
+ provider: "openai",
6028
+ baseUrl: "https://api.openai.com/v1",
6029
+ reasoning: true,
6030
+ input: ["text", "image"],
6031
+ cost: {
6032
+ input: 5,
6033
+ output: 30,
6034
+ cacheRead: 0.5,
6035
+ cacheWrite: 0,
6036
+ },
6037
+ contextWindow: 1050000,
6038
+ maxTokens: 128000,
6039
+ },
6040
+ "gpt-5.5-pro": {
6041
+ id: "gpt-5.5-pro",
6042
+ name: "GPT-5.5 Pro",
6043
+ api: "openai-responses",
6044
+ provider: "openai",
6045
+ baseUrl: "https://api.openai.com/v1",
6046
+ reasoning: true,
6047
+ input: ["text", "image"],
6048
+ cost: {
6049
+ input: 30,
6050
+ output: 180,
6051
+ cacheRead: 0,
6052
+ cacheWrite: 0,
6053
+ },
6054
+ contextWindow: 1050000,
6055
+ maxTokens: 128000,
6056
+ },
5867
6057
  "o1": {
5868
6058
  id: "o1",
5869
6059
  name: "o1",
@@ -6174,23 +6364,6 @@ export const MODELS = {
6174
6364
  contextWindow: 200000,
6175
6365
  maxTokens: 128000,
6176
6366
  },
6177
- "claude-3-5-haiku": {
6178
- id: "claude-3-5-haiku",
6179
- name: "Claude Haiku 3.5",
6180
- api: "anthropic-messages",
6181
- provider: "opencode",
6182
- baseUrl: "https://opencode.ai/zen",
6183
- reasoning: false,
6184
- input: ["text", "image"],
6185
- cost: {
6186
- input: 0.8,
6187
- output: 4,
6188
- cacheRead: 0.08,
6189
- cacheWrite: 1,
6190
- },
6191
- contextWindow: 200000,
6192
- maxTokens: 8192,
6193
- },
6194
6367
  "claude-haiku-4-5": {
6195
6368
  id: "claude-haiku-4-5",
6196
6369
  name: "Claude Haiku 4.5",
@@ -6633,6 +6806,57 @@ export const MODELS = {
6633
6806
  contextWindow: 1050000,
6634
6807
  maxTokens: 128000,
6635
6808
  },
6809
+ "gpt-5.5": {
6810
+ id: "gpt-5.5",
6811
+ name: "GPT-5.5",
6812
+ api: "openai-responses",
6813
+ provider: "opencode",
6814
+ baseUrl: "https://opencode.ai/zen/v1",
6815
+ reasoning: true,
6816
+ input: ["text", "image"],
6817
+ cost: {
6818
+ input: 5,
6819
+ output: 30,
6820
+ cacheRead: 0.5,
6821
+ cacheWrite: 0,
6822
+ },
6823
+ contextWindow: 1050000,
6824
+ maxTokens: 128000,
6825
+ },
6826
+ "gpt-5.5-pro": {
6827
+ id: "gpt-5.5-pro",
6828
+ name: "GPT-5.5 Pro",
6829
+ api: "openai-responses",
6830
+ provider: "opencode",
6831
+ baseUrl: "https://opencode.ai/zen/v1",
6832
+ reasoning: true,
6833
+ input: ["text", "image"],
6834
+ cost: {
6835
+ input: 30,
6836
+ output: 180,
6837
+ cacheRead: 30,
6838
+ cacheWrite: 0,
6839
+ },
6840
+ contextWindow: 1050000,
6841
+ maxTokens: 128000,
6842
+ },
6843
+ "hy3-preview-free": {
6844
+ id: "hy3-preview-free",
6845
+ name: "Hy3 preview Free",
6846
+ api: "openai-completions",
6847
+ provider: "opencode",
6848
+ baseUrl: "https://opencode.ai/zen/v1",
6849
+ reasoning: true,
6850
+ input: ["text"],
6851
+ cost: {
6852
+ input: 0,
6853
+ output: 0,
6854
+ cacheRead: 0,
6855
+ cacheWrite: 0,
6856
+ },
6857
+ contextWindow: 256000,
6858
+ maxTokens: 64000,
6859
+ },
6636
6860
  "kimi-k2.5": {
6637
6861
  id: "kimi-k2.5",
6638
6862
  name: "Kimi K2.5",
@@ -6650,6 +6874,23 @@ export const MODELS = {
6650
6874
  contextWindow: 262144,
6651
6875
  maxTokens: 65536,
6652
6876
  },
6877
+ "kimi-k2.6": {
6878
+ id: "kimi-k2.6",
6879
+ name: "Kimi K2.6",
6880
+ api: "openai-completions",
6881
+ provider: "opencode",
6882
+ baseUrl: "https://opencode.ai/zen/v1",
6883
+ reasoning: true,
6884
+ input: ["text", "image"],
6885
+ cost: {
6886
+ input: 0.95,
6887
+ output: 4,
6888
+ cacheRead: 0.16,
6889
+ cacheWrite: 0,
6890
+ },
6891
+ contextWindow: 262144,
6892
+ maxTokens: 65536,
6893
+ },
6653
6894
  "minimax-m2.5": {
6654
6895
  id: "minimax-m2.5",
6655
6896
  name: "MiniMax M2.5",
@@ -6684,6 +6925,23 @@ export const MODELS = {
6684
6925
  contextWindow: 204800,
6685
6926
  maxTokens: 131072,
6686
6927
  },
6928
+ "minimax-m2.7": {
6929
+ id: "minimax-m2.7",
6930
+ name: "MiniMax M2.7",
6931
+ api: "openai-completions",
6932
+ provider: "opencode",
6933
+ baseUrl: "https://opencode.ai/zen/v1",
6934
+ reasoning: true,
6935
+ input: ["text"],
6936
+ cost: {
6937
+ input: 0.3,
6938
+ output: 1.2,
6939
+ cacheRead: 0.06,
6940
+ cacheWrite: 0,
6941
+ },
6942
+ contextWindow: 204800,
6943
+ maxTokens: 131072,
6944
+ },
6687
6945
  "nemotron-3-super-free": {
6688
6946
  id: "nemotron-3-super-free",
6689
6947
  name: "Nemotron 3 Super Free",
@@ -6704,9 +6962,9 @@ export const MODELS = {
6704
6962
  "qwen3.5-plus": {
6705
6963
  id: "qwen3.5-plus",
6706
6964
  name: "Qwen3.5 Plus",
6707
- api: "openai-completions",
6965
+ api: "anthropic-messages",
6708
6966
  provider: "opencode",
6709
- baseUrl: "https://opencode.ai/zen/v1",
6967
+ baseUrl: "https://opencode.ai/zen",
6710
6968
  reasoning: true,
6711
6969
  input: ["text", "image"],
6712
6970
  cost: {
@@ -6721,9 +6979,9 @@ export const MODELS = {
6721
6979
  "qwen3.6-plus": {
6722
6980
  id: "qwen3.6-plus",
6723
6981
  name: "Qwen3.6 Plus",
6724
- api: "openai-completions",
6982
+ api: "anthropic-messages",
6725
6983
  provider: "opencode",
6726
- baseUrl: "https://opencode.ai/zen/v1",
6984
+ baseUrl: "https://opencode.ai/zen",
6727
6985
  reasoning: true,
6728
6986
  input: ["text", "image"],
6729
6987
  cost: {
@@ -6737,7 +6995,41 @@ export const MODELS = {
6737
6995
  },
6738
6996
  },
6739
6997
  "opencode-go": {
6740
- "glm-5": {
6998
+ "deepseek-v4-flash": {
6999
+ id: "deepseek-v4-flash",
7000
+ name: "DeepSeek V4 Flash",
7001
+ api: "openai-completions",
7002
+ provider: "opencode-go",
7003
+ baseUrl: "https://opencode.ai/zen/go/v1",
7004
+ reasoning: true,
7005
+ input: ["text"],
7006
+ cost: {
7007
+ input: 0.14,
7008
+ output: 0.28,
7009
+ cacheRead: 0.0028,
7010
+ cacheWrite: 0,
7011
+ },
7012
+ contextWindow: 1000000,
7013
+ maxTokens: 384000,
7014
+ },
7015
+ "deepseek-v4-pro": {
7016
+ id: "deepseek-v4-pro",
7017
+ name: "DeepSeek V4 Pro",
7018
+ api: "openai-completions",
7019
+ provider: "opencode-go",
7020
+ baseUrl: "https://opencode.ai/zen/go/v1",
7021
+ reasoning: true,
7022
+ input: ["text"],
7023
+ cost: {
7024
+ input: 1.74,
7025
+ output: 3.48,
7026
+ cacheRead: 0.0145,
7027
+ cacheWrite: 0,
7028
+ },
7029
+ contextWindow: 1000000,
7030
+ maxTokens: 384000,
7031
+ },
7032
+ "glm-5": {
6741
7033
  id: "glm-5",
6742
7034
  name: "GLM-5",
6743
7035
  api: "openai-completions",
@@ -6751,8 +7043,8 @@ export const MODELS = {
6751
7043
  cacheRead: 0.2,
6752
7044
  cacheWrite: 0,
6753
7045
  },
6754
- contextWindow: 204800,
6755
- maxTokens: 131072,
7046
+ contextWindow: 202752,
7047
+ maxTokens: 32768,
6756
7048
  },
6757
7049
  "glm-5.1": {
6758
7050
  id: "glm-5.1",
@@ -6768,8 +7060,8 @@ export const MODELS = {
6768
7060
  cacheRead: 0.26,
6769
7061
  cacheWrite: 0,
6770
7062
  },
6771
- contextWindow: 204800,
6772
- maxTokens: 131072,
7063
+ contextWindow: 202752,
7064
+ maxTokens: 32768,
6773
7065
  },
6774
7066
  "kimi-k2.5": {
6775
7067
  id: "kimi-k2.5",
@@ -6788,6 +7080,23 @@ export const MODELS = {
6788
7080
  contextWindow: 262144,
6789
7081
  maxTokens: 65536,
6790
7082
  },
7083
+ "kimi-k2.6": {
7084
+ id: "kimi-k2.6",
7085
+ name: "Kimi K2.6 (3x limits)",
7086
+ api: "openai-completions",
7087
+ provider: "opencode-go",
7088
+ baseUrl: "https://opencode.ai/zen/go/v1",
7089
+ reasoning: true,
7090
+ input: ["text", "image"],
7091
+ cost: {
7092
+ input: 0.32,
7093
+ output: 1.34,
7094
+ cacheRead: 0.054,
7095
+ cacheWrite: 0,
7096
+ },
7097
+ contextWindow: 262144,
7098
+ maxTokens: 65536,
7099
+ },
6791
7100
  "mimo-v2-omni": {
6792
7101
  id: "mimo-v2-omni",
6793
7102
  name: "MiMo V2 Omni",
@@ -6803,7 +7112,7 @@ export const MODELS = {
6803
7112
  cacheWrite: 0,
6804
7113
  },
6805
7114
  contextWindow: 262144,
6806
- maxTokens: 64000,
7115
+ maxTokens: 128000,
6807
7116
  },
6808
7117
  "mimo-v2-pro": {
6809
7118
  id: "mimo-v2-pro",
@@ -6820,7 +7129,41 @@ export const MODELS = {
6820
7129
  cacheWrite: 0,
6821
7130
  },
6822
7131
  contextWindow: 1048576,
6823
- maxTokens: 64000,
7132
+ maxTokens: 128000,
7133
+ },
7134
+ "mimo-v2.5": {
7135
+ id: "mimo-v2.5",
7136
+ name: "MiMo V2.5",
7137
+ api: "openai-completions",
7138
+ provider: "opencode-go",
7139
+ baseUrl: "https://opencode.ai/zen/go/v1",
7140
+ reasoning: true,
7141
+ input: ["text", "image"],
7142
+ cost: {
7143
+ input: 0.4,
7144
+ output: 2,
7145
+ cacheRead: 0.08,
7146
+ cacheWrite: 0,
7147
+ },
7148
+ contextWindow: 1000000,
7149
+ maxTokens: 128000,
7150
+ },
7151
+ "mimo-v2.5-pro": {
7152
+ id: "mimo-v2.5-pro",
7153
+ name: "MiMo V2.5 Pro",
7154
+ api: "openai-completions",
7155
+ provider: "opencode-go",
7156
+ baseUrl: "https://opencode.ai/zen/go/v1",
7157
+ reasoning: true,
7158
+ input: ["text"],
7159
+ cost: {
7160
+ input: 1,
7161
+ output: 3,
7162
+ cacheRead: 0.2,
7163
+ cacheWrite: 0,
7164
+ },
7165
+ contextWindow: 1048576,
7166
+ maxTokens: 128000,
6824
7167
  },
6825
7168
  "minimax-m2.5": {
6826
7169
  id: "minimax-m2.5",
@@ -6859,9 +7202,9 @@ export const MODELS = {
6859
7202
  "qwen3.5-plus": {
6860
7203
  id: "qwen3.5-plus",
6861
7204
  name: "Qwen3.5 Plus",
6862
- api: "openai-completions",
7205
+ api: "anthropic-messages",
6863
7206
  provider: "opencode-go",
6864
- baseUrl: "https://opencode.ai/zen/go/v1",
7207
+ baseUrl: "https://opencode.ai/zen/go",
6865
7208
  reasoning: true,
6866
7209
  input: ["text", "image"],
6867
7210
  cost: {
@@ -6876,9 +7219,9 @@ export const MODELS = {
6876
7219
  "qwen3.6-plus": {
6877
7220
  id: "qwen3.6-plus",
6878
7221
  name: "Qwen3.6 Plus",
6879
- api: "openai-completions",
7222
+ api: "anthropic-messages",
6880
7223
  provider: "opencode-go",
6881
- baseUrl: "https://opencode.ai/zen/go/v1",
7224
+ baseUrl: "https://opencode.ai/zen/go",
6882
7225
  reasoning: true,
6883
7226
  input: ["text", "image"],
6884
7227
  cost: {
@@ -6941,7 +7284,7 @@ export const MODELS = {
6941
7284
  cacheWrite: 0,
6942
7285
  },
6943
7286
  contextWindow: 65536,
6944
- maxTokens: 4096,
7287
+ maxTokens: 16384,
6945
7288
  },
6946
7289
  "amazon/nova-2-lite-v1": {
6947
7290
  id: "amazon/nova-2-lite-v1",
@@ -7266,17 +7609,17 @@ export const MODELS = {
7266
7609
  contextWindow: 1000000,
7267
7610
  maxTokens: 128000,
7268
7611
  },
7269
- "arcee-ai/trinity-large-preview:free": {
7270
- id: "arcee-ai/trinity-large-preview:free",
7271
- name: "Arcee AI: Trinity Large Preview (free)",
7612
+ "arcee-ai/trinity-large-preview": {
7613
+ id: "arcee-ai/trinity-large-preview",
7614
+ name: "Arcee AI: Trinity Large Preview",
7272
7615
  api: "openai-completions",
7273
7616
  provider: "openrouter",
7274
7617
  baseUrl: "https://openrouter.ai/api/v1",
7275
7618
  reasoning: false,
7276
7619
  input: ["text"],
7277
7620
  cost: {
7278
- input: 0,
7279
- output: 0,
7621
+ input: 0.15,
7622
+ output: 0.44999999999999996,
7280
7623
  cacheRead: 0,
7281
7624
  cacheWrite: 0,
7282
7625
  },
@@ -7502,7 +7845,7 @@ export const MODELS = {
7502
7845
  cacheWrite: 0,
7503
7846
  },
7504
7847
  contextWindow: 163840,
7505
- maxTokens: 163840,
7848
+ maxTokens: 16384,
7506
7849
  },
7507
7850
  "deepseek/deepseek-chat-v3-0324": {
7508
7851
  id: "deepseek/deepseek-chat-v3-0324",
@@ -7519,7 +7862,7 @@ export const MODELS = {
7519
7862
  cacheWrite: 0,
7520
7863
  },
7521
7864
  contextWindow: 163840,
7522
- maxTokens: 4096,
7865
+ maxTokens: 16384,
7523
7866
  },
7524
7867
  "deepseek/deepseek-chat-v3.1": {
7525
7868
  id: "deepseek/deepseek-chat-v3.1",
@@ -7570,7 +7913,7 @@ export const MODELS = {
7570
7913
  cacheWrite: 0,
7571
7914
  },
7572
7915
  contextWindow: 163840,
7573
- maxTokens: 4096,
7916
+ maxTokens: 32768,
7574
7917
  },
7575
7918
  "deepseek/deepseek-v3.1-terminus": {
7576
7919
  id: "deepseek/deepseek-v3.1-terminus",
@@ -7581,13 +7924,13 @@ export const MODELS = {
7581
7924
  reasoning: true,
7582
7925
  input: ["text"],
7583
7926
  cost: {
7584
- input: 0.21,
7585
- output: 0.7899999999999999,
7586
- cacheRead: 0.1300000002,
7927
+ input: 0.27,
7928
+ output: 0.95,
7929
+ cacheRead: 0.13,
7587
7930
  cacheWrite: 0,
7588
7931
  },
7589
7932
  contextWindow: 163840,
7590
- maxTokens: 4096,
7933
+ maxTokens: 32768,
7591
7934
  },
7592
7935
  "deepseek/deepseek-v3.2": {
7593
7936
  id: "deepseek/deepseek-v3.2",
@@ -7598,13 +7941,13 @@ export const MODELS = {
7598
7941
  reasoning: true,
7599
7942
  input: ["text"],
7600
7943
  cost: {
7601
- input: 0.25899999999999995,
7602
- output: 0.42,
7603
- cacheRead: 0.135,
7944
+ input: 0.252,
7945
+ output: 0.378,
7946
+ cacheRead: 0.0252,
7604
7947
  cacheWrite: 0,
7605
7948
  },
7606
- contextWindow: 163840,
7607
- maxTokens: 163840,
7949
+ contextWindow: 131072,
7950
+ maxTokens: 65536,
7608
7951
  },
7609
7952
  "deepseek/deepseek-v3.2-exp": {
7610
7953
  id: "deepseek/deepseek-v3.2-exp",
@@ -7623,6 +7966,40 @@ export const MODELS = {
7623
7966
  contextWindow: 163840,
7624
7967
  maxTokens: 65536,
7625
7968
  },
7969
+ "deepseek/deepseek-v4-flash": {
7970
+ id: "deepseek/deepseek-v4-flash",
7971
+ name: "DeepSeek: DeepSeek V4 Flash",
7972
+ api: "openai-completions",
7973
+ provider: "openrouter",
7974
+ baseUrl: "https://openrouter.ai/api/v1",
7975
+ reasoning: true,
7976
+ input: ["text"],
7977
+ cost: {
7978
+ input: 0.14,
7979
+ output: 0.28,
7980
+ cacheRead: 0.0028,
7981
+ cacheWrite: 0,
7982
+ },
7983
+ contextWindow: 1048576,
7984
+ maxTokens: 384000,
7985
+ },
7986
+ "deepseek/deepseek-v4-pro": {
7987
+ id: "deepseek/deepseek-v4-pro",
7988
+ name: "DeepSeek: DeepSeek V4 Pro",
7989
+ api: "openai-completions",
7990
+ provider: "openrouter",
7991
+ baseUrl: "https://openrouter.ai/api/v1",
7992
+ reasoning: true,
7993
+ input: ["text"],
7994
+ cost: {
7995
+ input: 0.435,
7996
+ output: 0.87,
7997
+ cacheRead: 0.003625,
7998
+ cacheWrite: 0,
7999
+ },
8000
+ contextWindow: 1048576,
8001
+ maxTokens: 384000,
8002
+ },
7626
8003
  "essentialai/rnj-1-instruct": {
7627
8004
  id: "essentialai/rnj-1-instruct",
7628
8005
  name: "EssentialAI: Rnj 1 Instruct",
@@ -7844,6 +8221,40 @@ export const MODELS = {
7844
8221
  contextWindow: 1048576,
7845
8222
  maxTokens: 65536,
7846
8223
  },
8224
+ "google/gemma-3-12b-it": {
8225
+ id: "google/gemma-3-12b-it",
8226
+ name: "Google: Gemma 3 12B",
8227
+ api: "openai-completions",
8228
+ provider: "openrouter",
8229
+ baseUrl: "https://openrouter.ai/api/v1",
8230
+ reasoning: false,
8231
+ input: ["text", "image"],
8232
+ cost: {
8233
+ input: 0.04,
8234
+ output: 0.13,
8235
+ cacheRead: 0,
8236
+ cacheWrite: 0,
8237
+ },
8238
+ contextWindow: 131072,
8239
+ maxTokens: 16384,
8240
+ },
8241
+ "google/gemma-3-27b-it": {
8242
+ id: "google/gemma-3-27b-it",
8243
+ name: "Google: Gemma 3 27B",
8244
+ api: "openai-completions",
8245
+ provider: "openrouter",
8246
+ baseUrl: "https://openrouter.ai/api/v1",
8247
+ reasoning: false,
8248
+ input: ["text", "image"],
8249
+ cost: {
8250
+ input: 0.08,
8251
+ output: 0.16,
8252
+ cacheRead: 0,
8253
+ cacheWrite: 0,
8254
+ },
8255
+ contextWindow: 131072,
8256
+ maxTokens: 16384,
8257
+ },
7847
8258
  "google/gemma-4-26b-a4b-it": {
7848
8259
  id: "google/gemma-4-26b-a4b-it",
7849
8260
  name: "Google: Gemma 4 26B A4B ",
@@ -7853,9 +8264,9 @@ export const MODELS = {
7853
8264
  reasoning: true,
7854
8265
  input: ["text", "image"],
7855
8266
  cost: {
7856
- input: 0.08,
7857
- output: 0.35,
7858
- cacheRead: 0.01,
8267
+ input: 0.06,
8268
+ output: 0.33,
8269
+ cacheRead: 0,
7859
8270
  cacheWrite: 0,
7860
8271
  },
7861
8272
  contextWindow: 262144,
@@ -7889,11 +8300,11 @@ export const MODELS = {
7889
8300
  cost: {
7890
8301
  input: 0.13,
7891
8302
  output: 0.38,
7892
- cacheRead: 0.019999999499999997,
8303
+ cacheRead: 0,
7893
8304
  cacheWrite: 0,
7894
8305
  },
7895
8306
  contextWindow: 262144,
7896
- maxTokens: 4096,
8307
+ maxTokens: 16384,
7897
8308
  },
7898
8309
  "google/gemma-4-31b-it:free": {
7899
8310
  id: "google/gemma-4-31b-it:free",
@@ -7912,6 +8323,23 @@ export const MODELS = {
7912
8323
  contextWindow: 262144,
7913
8324
  maxTokens: 32768,
7914
8325
  },
8326
+ "ibm-granite/granite-4.1-8b": {
8327
+ id: "ibm-granite/granite-4.1-8b",
8328
+ name: "IBM: Granite 4.1 8B",
8329
+ api: "openai-completions",
8330
+ provider: "openrouter",
8331
+ baseUrl: "https://openrouter.ai/api/v1",
8332
+ reasoning: false,
8333
+ input: ["text"],
8334
+ cost: {
8335
+ input: 0.049999999999999996,
8336
+ output: 0.09999999999999999,
8337
+ cacheRead: 0.049999999999999996,
8338
+ cacheWrite: 0,
8339
+ },
8340
+ contextWindow: 131072,
8341
+ maxTokens: 131072,
8342
+ },
7915
8343
  "inception/mercury-2": {
7916
8344
  id: "inception/mercury-2",
7917
8345
  name: "Inception: Mercury 2",
@@ -7929,6 +8357,40 @@ export const MODELS = {
7929
8357
  contextWindow: 128000,
7930
8358
  maxTokens: 50000,
7931
8359
  },
8360
+ "inclusionai/ling-2.6-1t:free": {
8361
+ id: "inclusionai/ling-2.6-1t:free",
8362
+ name: "inclusionAI: Ling-2.6-1T (free)",
8363
+ api: "openai-completions",
8364
+ provider: "openrouter",
8365
+ baseUrl: "https://openrouter.ai/api/v1",
8366
+ reasoning: false,
8367
+ input: ["text"],
8368
+ cost: {
8369
+ input: 0,
8370
+ output: 0,
8371
+ cacheRead: 0,
8372
+ cacheWrite: 0,
8373
+ },
8374
+ contextWindow: 262144,
8375
+ maxTokens: 32768,
8376
+ },
8377
+ "inclusionai/ling-2.6-flash": {
8378
+ id: "inclusionai/ling-2.6-flash",
8379
+ name: "inclusionAI: Ling-2.6-flash",
8380
+ api: "openai-completions",
8381
+ provider: "openrouter",
8382
+ baseUrl: "https://openrouter.ai/api/v1",
8383
+ reasoning: false,
8384
+ input: ["text"],
8385
+ cost: {
8386
+ input: 0.08,
8387
+ output: 0.24,
8388
+ cacheRead: 0.016,
8389
+ cacheWrite: 0,
8390
+ },
8391
+ contextWindow: 262144,
8392
+ maxTokens: 32768,
8393
+ },
7932
8394
  "kwaipilot/kat-coder-pro-v2": {
7933
8395
  id: "kwaipilot/kat-coder-pro-v2",
7934
8396
  name: "Kwaipilot: KAT-Coder-Pro V2",
@@ -7978,7 +8440,7 @@ export const MODELS = {
7978
8440
  cacheWrite: 0,
7979
8441
  },
7980
8442
  contextWindow: 131072,
7981
- maxTokens: 4096,
8443
+ maxTokens: 16384,
7982
8444
  },
7983
8445
  "meta-llama/llama-3.1-8b-instruct": {
7984
8446
  id: "meta-llama/llama-3.1-8b-instruct",
@@ -8006,13 +8468,13 @@ export const MODELS = {
8006
8468
  reasoning: false,
8007
8469
  input: ["text"],
8008
8470
  cost: {
8009
- input: 0.12,
8010
- output: 0.38,
8471
+ input: 0.09999999999999999,
8472
+ output: 0.32,
8011
8473
  cacheRead: 0,
8012
8474
  cacheWrite: 0,
8013
8475
  },
8014
8476
  contextWindow: 131072,
8015
- maxTokens: 131072,
8477
+ maxTokens: 16384,
8016
8478
  },
8017
8479
  "meta-llama/llama-3.3-70b-instruct:free": {
8018
8480
  id: "meta-llama/llama-3.3-70b-instruct:free",
@@ -8108,13 +8570,13 @@ export const MODELS = {
8108
8570
  reasoning: true,
8109
8571
  input: ["text"],
8110
8572
  cost: {
8111
- input: 0.118,
8112
- output: 0.9900000000000001,
8113
- cacheRead: 0.059,
8573
+ input: 0.15,
8574
+ output: 1.15,
8575
+ cacheRead: 0.03,
8114
8576
  cacheWrite: 0,
8115
8577
  },
8116
8578
  contextWindow: 196608,
8117
- maxTokens: 65536,
8579
+ maxTokens: 131072,
8118
8580
  },
8119
8581
  "minimax/minimax-m2.5:free": {
8120
8582
  id: "minimax/minimax-m2.5:free",
@@ -8381,12 +8843,12 @@ export const MODELS = {
8381
8843
  input: ["text"],
8382
8844
  cost: {
8383
8845
  input: 0.02,
8384
- output: 0.04,
8846
+ output: 0.03,
8385
8847
  cacheRead: 0,
8386
8848
  cacheWrite: 0,
8387
8849
  },
8388
8850
  contextWindow: 131072,
8389
- maxTokens: 16384,
8851
+ maxTokens: 4096,
8390
8852
  },
8391
8853
  "mistralai/mistral-saba": {
8392
8854
  id: "mistralai/mistral-saba",
@@ -8437,24 +8899,7 @@ export const MODELS = {
8437
8899
  cacheWrite: 0,
8438
8900
  },
8439
8901
  contextWindow: 128000,
8440
- maxTokens: 4096,
8441
- },
8442
- "mistralai/mistral-small-creative": {
8443
- id: "mistralai/mistral-small-creative",
8444
- name: "Mistral: Mistral Small Creative",
8445
- api: "openai-completions",
8446
- provider: "openrouter",
8447
- baseUrl: "https://openrouter.ai/api/v1",
8448
- reasoning: false,
8449
- input: ["text"],
8450
- cost: {
8451
- input: 0.09999999999999999,
8452
- output: 0.3,
8453
- cacheRead: 0.01,
8454
- cacheWrite: 0,
8455
- },
8456
- contextWindow: 32768,
8457
- maxTokens: 4096,
8902
+ maxTokens: 16384,
8458
8903
  },
8459
8904
  "mistralai/mixtral-8x22b-instruct": {
8460
8905
  id: "mistralai/mixtral-8x22b-instruct",
@@ -8592,6 +9037,23 @@ export const MODELS = {
8592
9037
  contextWindow: 262144,
8593
9038
  maxTokens: 4096,
8594
9039
  },
9040
+ "moonshotai/kimi-k2.6": {
9041
+ id: "moonshotai/kimi-k2.6",
9042
+ name: "MoonshotAI: Kimi K2.6",
9043
+ api: "openai-completions",
9044
+ provider: "openrouter",
9045
+ baseUrl: "https://openrouter.ai/api/v1",
9046
+ reasoning: true,
9047
+ input: ["text", "image"],
9048
+ cost: {
9049
+ input: 0.74,
9050
+ output: 3.49,
9051
+ cacheRead: 0.14,
9052
+ cacheWrite: 0,
9053
+ },
9054
+ contextWindow: 262142,
9055
+ maxTokens: 262142,
9056
+ },
8595
9057
  "nex-agi/deepseek-v3.1-nex-n1": {
8596
9058
  id: "nex-agi/deepseek-v3.1-nex-n1",
8597
9059
  name: "Nex AGI: DeepSeek V3.1 Nex N1",
@@ -8641,7 +9103,7 @@ export const MODELS = {
8641
9103
  cacheWrite: 0,
8642
9104
  },
8643
9105
  contextWindow: 131072,
8644
- maxTokens: 4096,
9106
+ maxTokens: 16384,
8645
9107
  },
8646
9108
  "nvidia/nemotron-3-nano-30b-a3b": {
8647
9109
  id: "nvidia/nemotron-3-nano-30b-a3b",
@@ -8658,7 +9120,7 @@ export const MODELS = {
8658
9120
  cacheWrite: 0,
8659
9121
  },
8660
9122
  contextWindow: 262144,
8661
- maxTokens: 4096,
9123
+ maxTokens: 228000,
8662
9124
  },
8663
9125
  "nvidia/nemotron-3-nano-30b-a3b:free": {
8664
9126
  id: "nvidia/nemotron-3-nano-30b-a3b:free",
@@ -8677,16 +9139,33 @@ export const MODELS = {
8677
9139
  contextWindow: 256000,
8678
9140
  maxTokens: 4096,
8679
9141
  },
8680
- "nvidia/nemotron-3-super-120b-a12b": {
8681
- id: "nvidia/nemotron-3-super-120b-a12b",
8682
- name: "NVIDIA: Nemotron 3 Super",
9142
+ "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free": {
9143
+ id: "nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free",
9144
+ name: "NVIDIA: Nemotron 3 Nano Omni (free)",
8683
9145
  api: "openai-completions",
8684
9146
  provider: "openrouter",
8685
9147
  baseUrl: "https://openrouter.ai/api/v1",
8686
9148
  reasoning: true,
8687
- input: ["text"],
9149
+ input: ["text", "image"],
8688
9150
  cost: {
8689
- input: 0.09,
9151
+ input: 0,
9152
+ output: 0,
9153
+ cacheRead: 0,
9154
+ cacheWrite: 0,
9155
+ },
9156
+ contextWindow: 256000,
9157
+ maxTokens: 65536,
9158
+ },
9159
+ "nvidia/nemotron-3-super-120b-a12b": {
9160
+ id: "nvidia/nemotron-3-super-120b-a12b",
9161
+ name: "NVIDIA: Nemotron 3 Super",
9162
+ api: "openai-completions",
9163
+ provider: "openrouter",
9164
+ baseUrl: "https://openrouter.ai/api/v1",
9165
+ reasoning: true,
9166
+ input: ["text"],
9167
+ cost: {
9168
+ input: 0.09,
8690
9169
  output: 0.44999999999999996,
8691
9170
  cacheRead: 0,
8692
9171
  cacheWrite: 0,
@@ -8743,7 +9222,7 @@ export const MODELS = {
8743
9222
  cacheWrite: 0,
8744
9223
  },
8745
9224
  contextWindow: 131072,
8746
- maxTokens: 4096,
9225
+ maxTokens: 16384,
8747
9226
  },
8748
9227
  "nvidia/nemotron-nano-9b-v2:free": {
8749
9228
  id: "nvidia/nemotron-nano-9b-v2:free",
@@ -9102,40 +9581,6 @@ export const MODELS = {
9102
9581
  contextWindow: 400000,
9103
9582
  maxTokens: 128000,
9104
9583
  },
9105
- "openai/gpt-5-image": {
9106
- id: "openai/gpt-5-image",
9107
- name: "OpenAI: GPT-5 Image",
9108
- api: "openai-completions",
9109
- provider: "openrouter",
9110
- baseUrl: "https://openrouter.ai/api/v1",
9111
- reasoning: true,
9112
- input: ["text", "image"],
9113
- cost: {
9114
- input: 10,
9115
- output: 10,
9116
- cacheRead: 1.25,
9117
- cacheWrite: 0,
9118
- },
9119
- contextWindow: 400000,
9120
- maxTokens: 128000,
9121
- },
9122
- "openai/gpt-5-image-mini": {
9123
- id: "openai/gpt-5-image-mini",
9124
- name: "OpenAI: GPT-5 Image Mini",
9125
- api: "openai-completions",
9126
- provider: "openrouter",
9127
- baseUrl: "https://openrouter.ai/api/v1",
9128
- reasoning: true,
9129
- input: ["text", "image"],
9130
- cost: {
9131
- input: 2.5,
9132
- output: 2,
9133
- cacheRead: 0.25,
9134
- cacheWrite: 0,
9135
- },
9136
- contextWindow: 400000,
9137
- maxTokens: 128000,
9138
- },
9139
9584
  "openai/gpt-5-mini": {
9140
9585
  id: "openai/gpt-5-mini",
9141
9586
  name: "OpenAI: GPT-5 Mini",
@@ -9442,6 +9887,40 @@ export const MODELS = {
9442
9887
  contextWindow: 1050000,
9443
9888
  maxTokens: 128000,
9444
9889
  },
9890
+ "openai/gpt-5.5": {
9891
+ id: "openai/gpt-5.5",
9892
+ name: "OpenAI: GPT-5.5",
9893
+ api: "openai-completions",
9894
+ provider: "openrouter",
9895
+ baseUrl: "https://openrouter.ai/api/v1",
9896
+ reasoning: true,
9897
+ input: ["text", "image"],
9898
+ cost: {
9899
+ input: 5,
9900
+ output: 30,
9901
+ cacheRead: 0.5,
9902
+ cacheWrite: 0,
9903
+ },
9904
+ contextWindow: 1050000,
9905
+ maxTokens: 128000,
9906
+ },
9907
+ "openai/gpt-5.5-pro": {
9908
+ id: "openai/gpt-5.5-pro",
9909
+ name: "OpenAI: GPT-5.5 Pro",
9910
+ api: "openai-completions",
9911
+ provider: "openrouter",
9912
+ baseUrl: "https://openrouter.ai/api/v1",
9913
+ reasoning: true,
9914
+ input: ["text", "image"],
9915
+ cost: {
9916
+ input: 30,
9917
+ output: 180,
9918
+ cacheRead: 0,
9919
+ cacheWrite: 0,
9920
+ },
9921
+ contextWindow: 1050000,
9922
+ maxTokens: 128000,
9923
+ },
9445
9924
  "openai/gpt-audio": {
9446
9925
  id: "openai/gpt-audio",
9447
9926
  name: "OpenAI: GPT Audio",
@@ -9486,7 +9965,7 @@ export const MODELS = {
9486
9965
  input: ["text"],
9487
9966
  cost: {
9488
9967
  input: 0.039,
9489
- output: 0.19,
9968
+ output: 0.18,
9490
9969
  cacheRead: 0,
9491
9970
  cacheWrite: 0,
9492
9971
  },
@@ -9525,7 +10004,7 @@ export const MODELS = {
9525
10004
  cacheWrite: 0,
9526
10005
  },
9527
10006
  contextWindow: 131072,
9528
- maxTokens: 4096,
10007
+ maxTokens: 131072,
9529
10008
  },
9530
10009
  "openai/gpt-oss-20b:free": {
9531
10010
  id: "openai/gpt-oss-20b:free",
@@ -9731,9 +10210,26 @@ export const MODELS = {
9731
10210
  contextWindow: 2000000,
9732
10211
  maxTokens: 4096,
9733
10212
  },
9734
- "openrouter/elephant-alpha": {
9735
- id: "openrouter/elephant-alpha",
9736
- name: "Elephant",
10213
+ "openrouter/free": {
10214
+ id: "openrouter/free",
10215
+ name: "Free Models Router",
10216
+ api: "openai-completions",
10217
+ provider: "openrouter",
10218
+ baseUrl: "https://openrouter.ai/api/v1",
10219
+ reasoning: true,
10220
+ input: ["text", "image"],
10221
+ cost: {
10222
+ input: 0,
10223
+ output: 0,
10224
+ cacheRead: 0,
10225
+ cacheWrite: 0,
10226
+ },
10227
+ contextWindow: 200000,
10228
+ maxTokens: 4096,
10229
+ },
10230
+ "openrouter/owl-alpha": {
10231
+ id: "openrouter/owl-alpha",
10232
+ name: "Owl Alpha",
9737
10233
  api: "openai-completions",
9738
10234
  provider: "openrouter",
9739
10235
  baseUrl: "https://openrouter.ai/api/v1",
@@ -9745,25 +10241,42 @@ export const MODELS = {
9745
10241
  cacheRead: 0,
9746
10242
  cacheWrite: 0,
9747
10243
  },
9748
- contextWindow: 262144,
9749
- maxTokens: 32768,
10244
+ contextWindow: 1048756,
10245
+ maxTokens: 262144,
9750
10246
  },
9751
- "openrouter/free": {
9752
- id: "openrouter/free",
9753
- name: "Free Models Router",
10247
+ "poolside/laguna-m.1:free": {
10248
+ id: "poolside/laguna-m.1:free",
10249
+ name: "Poolside: Laguna M.1 (free)",
9754
10250
  api: "openai-completions",
9755
10251
  provider: "openrouter",
9756
10252
  baseUrl: "https://openrouter.ai/api/v1",
9757
10253
  reasoning: true,
9758
- input: ["text", "image"],
10254
+ input: ["text"],
9759
10255
  cost: {
9760
10256
  input: 0,
9761
10257
  output: 0,
9762
10258
  cacheRead: 0,
9763
10259
  cacheWrite: 0,
9764
10260
  },
9765
- contextWindow: 200000,
9766
- maxTokens: 4096,
10261
+ contextWindow: 131072,
10262
+ maxTokens: 8192,
10263
+ },
10264
+ "poolside/laguna-xs.2:free": {
10265
+ id: "poolside/laguna-xs.2:free",
10266
+ name: "Poolside: Laguna XS.2 (free)",
10267
+ api: "openai-completions",
10268
+ provider: "openrouter",
10269
+ baseUrl: "https://openrouter.ai/api/v1",
10270
+ reasoning: true,
10271
+ input: ["text"],
10272
+ cost: {
10273
+ input: 0,
10274
+ output: 0,
10275
+ cacheRead: 0,
10276
+ cacheWrite: 0,
10277
+ },
10278
+ contextWindow: 131072,
10279
+ maxTokens: 8192,
9767
10280
  },
9768
10281
  "prime-intellect/intellect-3": {
9769
10282
  id: "prime-intellect/intellect-3",
@@ -9791,8 +10304,8 @@ export const MODELS = {
9791
10304
  reasoning: false,
9792
10305
  input: ["text"],
9793
10306
  cost: {
9794
- input: 0.12,
9795
- output: 0.39,
10307
+ input: 0.36,
10308
+ output: 0.39999999999999997,
9796
10309
  cacheRead: 0,
9797
10310
  cacheWrite: 0,
9798
10311
  },
@@ -9967,7 +10480,7 @@ export const MODELS = {
9967
10480
  cacheWrite: 0,
9968
10481
  },
9969
10482
  contextWindow: 262144,
9970
- maxTokens: 4096,
10483
+ maxTokens: 16384,
9971
10484
  },
9972
10485
  "qwen/qwen3-235b-a22b-thinking-2507": {
9973
10486
  id: "qwen/qwen3-235b-a22b-thinking-2507",
@@ -9978,13 +10491,13 @@ export const MODELS = {
9978
10491
  reasoning: true,
9979
10492
  input: ["text"],
9980
10493
  cost: {
9981
- input: 0.13,
9982
- output: 0.6,
10494
+ input: 0.14950000000000002,
10495
+ output: 1.495,
9983
10496
  cacheRead: 0,
9984
10497
  cacheWrite: 0,
9985
10498
  },
9986
- contextWindow: 262144,
9987
- maxTokens: 262144,
10499
+ contextWindow: 131072,
10500
+ maxTokens: 4096,
9988
10501
  },
9989
10502
  "qwen/qwen3-30b-a3b": {
9990
10503
  id: "qwen/qwen3-30b-a3b",
@@ -9995,13 +10508,13 @@ export const MODELS = {
9995
10508
  reasoning: true,
9996
10509
  input: ["text"],
9997
10510
  cost: {
9998
- input: 0.08,
9999
- output: 0.28,
10511
+ input: 0.09,
10512
+ output: 0.44999999999999996,
10000
10513
  cacheRead: 0,
10001
10514
  cacheWrite: 0,
10002
10515
  },
10003
10516
  contextWindow: 40960,
10004
- maxTokens: 40960,
10517
+ maxTokens: 20000,
10005
10518
  },
10006
10519
  "qwen/qwen3-30b-a3b-instruct-2507": {
10007
10520
  id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -10081,12 +10594,12 @@ export const MODELS = {
10081
10594
  input: ["text"],
10082
10595
  cost: {
10083
10596
  input: 0.22,
10084
- output: 1,
10085
- cacheRead: 0.022,
10597
+ output: 1.7999999999999998,
10598
+ cacheRead: 0,
10086
10599
  cacheWrite: 0,
10087
10600
  },
10088
10601
  contextWindow: 262144,
10089
- maxTokens: 4096,
10602
+ maxTokens: 65536,
10090
10603
  },
10091
10604
  "qwen/qwen3-coder-30b-a3b-instruct": {
10092
10605
  id: "qwen/qwen3-coder-30b-a3b-instruct",
@@ -10131,9 +10644,9 @@ export const MODELS = {
10131
10644
  reasoning: false,
10132
10645
  input: ["text"],
10133
10646
  cost: {
10134
- input: 0.15,
10647
+ input: 0.12,
10135
10648
  output: 0.7999999999999999,
10136
- cacheRead: 0.12,
10649
+ cacheRead: 0.07,
10137
10650
  cacheWrite: 0,
10138
10651
  },
10139
10652
  contextWindow: 262144,
@@ -10222,7 +10735,7 @@ export const MODELS = {
10222
10735
  cacheWrite: 0,
10223
10736
  },
10224
10737
  contextWindow: 262144,
10225
- maxTokens: 4096,
10738
+ maxTokens: 16384,
10226
10739
  },
10227
10740
  "qwen/qwen3-next-80b-a3b-instruct:free": {
10228
10741
  id: "qwen/qwen3-next-80b-a3b-instruct:free",
@@ -10273,7 +10786,7 @@ export const MODELS = {
10273
10786
  cacheWrite: 0,
10274
10787
  },
10275
10788
  contextWindow: 262144,
10276
- maxTokens: 4096,
10789
+ maxTokens: 16384,
10277
10790
  },
10278
10791
  "qwen/qwen3-vl-235b-a22b-thinking": {
10279
10792
  id: "qwen/qwen3-vl-235b-a22b-thinking",
@@ -10496,39 +11009,90 @@ export const MODELS = {
10496
11009
  contextWindow: 1000000,
10497
11010
  maxTokens: 65536,
10498
11011
  },
10499
- "qwen/qwen3.6-plus": {
10500
- id: "qwen/qwen3.6-plus",
10501
- name: "Qwen: Qwen3.6 Plus",
11012
+ "qwen/qwen3.5-plus-20260420": {
11013
+ id: "qwen/qwen3.5-plus-20260420",
11014
+ name: "Qwen: Qwen3.5 Plus 2026-04-20",
10502
11015
  api: "openai-completions",
10503
11016
  provider: "openrouter",
10504
11017
  baseUrl: "https://openrouter.ai/api/v1",
10505
11018
  reasoning: true,
10506
11019
  input: ["text", "image"],
10507
11020
  cost: {
10508
- input: 0.325,
10509
- output: 1.95,
11021
+ input: 0.39999999999999997,
11022
+ output: 2.4,
10510
11023
  cacheRead: 0,
10511
- cacheWrite: 0.40625,
11024
+ cacheWrite: 0,
10512
11025
  },
10513
11026
  contextWindow: 1000000,
10514
11027
  maxTokens: 65536,
10515
11028
  },
10516
- "qwen/qwq-32b": {
10517
- id: "qwen/qwq-32b",
10518
- name: "Qwen: QwQ 32B",
11029
+ "qwen/qwen3.6-27b": {
11030
+ id: "qwen/qwen3.6-27b",
11031
+ name: "Qwen: Qwen3.6 27B",
10519
11032
  api: "openai-completions",
10520
11033
  provider: "openrouter",
10521
11034
  baseUrl: "https://openrouter.ai/api/v1",
10522
11035
  reasoning: true,
10523
- input: ["text"],
11036
+ input: ["text", "image"],
10524
11037
  cost: {
10525
- input: 0.15,
10526
- output: 0.58,
11038
+ input: 0.32,
11039
+ output: 3.1999999999999997,
10527
11040
  cacheRead: 0,
10528
11041
  cacheWrite: 0,
10529
11042
  },
10530
- contextWindow: 131072,
10531
- maxTokens: 131072,
11043
+ contextWindow: 262144,
11044
+ maxTokens: 81920,
11045
+ },
11046
+ "qwen/qwen3.6-flash": {
11047
+ id: "qwen/qwen3.6-flash",
11048
+ name: "Qwen: Qwen3.6 Flash",
11049
+ api: "openai-completions",
11050
+ provider: "openrouter",
11051
+ baseUrl: "https://openrouter.ai/api/v1",
11052
+ reasoning: true,
11053
+ input: ["text", "image"],
11054
+ cost: {
11055
+ input: 0.25,
11056
+ output: 1.5,
11057
+ cacheRead: 0,
11058
+ cacheWrite: 0.3125,
11059
+ },
11060
+ contextWindow: 1000000,
11061
+ maxTokens: 65536,
11062
+ },
11063
+ "qwen/qwen3.6-max-preview": {
11064
+ id: "qwen/qwen3.6-max-preview",
11065
+ name: "Qwen: Qwen3.6 Max Preview",
11066
+ api: "openai-completions",
11067
+ provider: "openrouter",
11068
+ baseUrl: "https://openrouter.ai/api/v1",
11069
+ reasoning: true,
11070
+ input: ["text"],
11071
+ cost: {
11072
+ input: 1.04,
11073
+ output: 6.24,
11074
+ cacheRead: 0,
11075
+ cacheWrite: 1.3,
11076
+ },
11077
+ contextWindow: 262144,
11078
+ maxTokens: 65536,
11079
+ },
11080
+ "qwen/qwen3.6-plus": {
11081
+ id: "qwen/qwen3.6-plus",
11082
+ name: "Qwen: Qwen3.6 Plus",
11083
+ api: "openai-completions",
11084
+ provider: "openrouter",
11085
+ baseUrl: "https://openrouter.ai/api/v1",
11086
+ reasoning: true,
11087
+ input: ["text", "image"],
11088
+ cost: {
11089
+ input: 0.325,
11090
+ output: 1.95,
11091
+ cacheRead: 0,
11092
+ cacheWrite: 0.40625,
11093
+ },
11094
+ contextWindow: 1000000,
11095
+ maxTokens: 65536,
10532
11096
  },
10533
11097
  "rekaai/reka-edge": {
10534
11098
  id: "rekaai/reka-edge",
@@ -10615,6 +11179,23 @@ export const MODELS = {
10615
11179
  contextWindow: 262144,
10616
11180
  maxTokens: 65536,
10617
11181
  },
11182
+ "tencent/hy3-preview:free": {
11183
+ id: "tencent/hy3-preview:free",
11184
+ name: "Tencent: Hy3 preview (free)",
11185
+ api: "openai-completions",
11186
+ provider: "openrouter",
11187
+ baseUrl: "https://openrouter.ai/api/v1",
11188
+ reasoning: true,
11189
+ input: ["text"],
11190
+ cost: {
11191
+ input: 0,
11192
+ output: 0,
11193
+ cacheRead: 0,
11194
+ cacheWrite: 0,
11195
+ },
11196
+ contextWindow: 262144,
11197
+ maxTokens: 262144,
11198
+ },
10618
11199
  "thedrummer/rocinante-12b": {
10619
11200
  id: "thedrummer/rocinante-12b",
10620
11201
  name: "TheDrummer: Rocinante 12B",
@@ -10811,14 +11392,31 @@ export const MODELS = {
10811
11392
  reasoning: true,
10812
11393
  input: ["text", "image"],
10813
11394
  cost: {
10814
- input: 2,
10815
- output: 6,
11395
+ input: 1.25,
11396
+ output: 2.5,
10816
11397
  cacheRead: 0.19999999999999998,
10817
11398
  cacheWrite: 0,
10818
11399
  },
10819
11400
  contextWindow: 2000000,
10820
11401
  maxTokens: 4096,
10821
11402
  },
11403
+ "x-ai/grok-4.3": {
11404
+ id: "x-ai/grok-4.3",
11405
+ name: "xAI: Grok 4.3",
11406
+ api: "openai-completions",
11407
+ provider: "openrouter",
11408
+ baseUrl: "https://openrouter.ai/api/v1",
11409
+ reasoning: true,
11410
+ input: ["text", "image"],
11411
+ cost: {
11412
+ input: 1.25,
11413
+ output: 2.5,
11414
+ cacheRead: 0.19999999999999998,
11415
+ cacheWrite: 0,
11416
+ },
11417
+ contextWindow: 1000000,
11418
+ maxTokens: 4096,
11419
+ },
10822
11420
  "x-ai/grok-code-fast-1": {
10823
11421
  id: "x-ai/grok-code-fast-1",
10824
11422
  name: "xAI: Grok Code Fast 1",
@@ -10887,6 +11485,40 @@ export const MODELS = {
10887
11485
  contextWindow: 1048576,
10888
11486
  maxTokens: 131072,
10889
11487
  },
11488
+ "xiaomi/mimo-v2.5": {
11489
+ id: "xiaomi/mimo-v2.5",
11490
+ name: "Xiaomi: MiMo-V2.5",
11491
+ api: "openai-completions",
11492
+ provider: "openrouter",
11493
+ baseUrl: "https://openrouter.ai/api/v1",
11494
+ reasoning: true,
11495
+ input: ["text", "image"],
11496
+ cost: {
11497
+ input: 0.39999999999999997,
11498
+ output: 2,
11499
+ cacheRead: 0.08,
11500
+ cacheWrite: 0,
11501
+ },
11502
+ contextWindow: 1048576,
11503
+ maxTokens: 131072,
11504
+ },
11505
+ "xiaomi/mimo-v2.5-pro": {
11506
+ id: "xiaomi/mimo-v2.5-pro",
11507
+ name: "Xiaomi: MiMo-V2.5-Pro",
11508
+ api: "openai-completions",
11509
+ provider: "openrouter",
11510
+ baseUrl: "https://openrouter.ai/api/v1",
11511
+ reasoning: true,
11512
+ input: ["text"],
11513
+ cost: {
11514
+ input: 1,
11515
+ output: 3,
11516
+ cacheRead: 0.19999999999999998,
11517
+ cacheWrite: 0,
11518
+ },
11519
+ contextWindow: 1048576,
11520
+ maxTokens: 131072,
11521
+ },
10890
11522
  "z-ai/glm-4-32b": {
10891
11523
  id: "z-ai/glm-4-32b",
10892
11524
  name: "Z.ai: GLM 4 32B ",
@@ -11000,11 +11632,11 @@ export const MODELS = {
11000
11632
  cost: {
11001
11633
  input: 0.3,
11002
11634
  output: 0.8999999999999999,
11003
- cacheRead: 0,
11635
+ cacheRead: 0.049999999999999996,
11004
11636
  cacheWrite: 0,
11005
11637
  },
11006
11638
  contextWindow: 131072,
11007
- maxTokens: 131072,
11639
+ maxTokens: 24000,
11008
11640
  },
11009
11641
  "z-ai/glm-4.7": {
11010
11642
  id: "z-ai/glm-4.7",
@@ -11015,13 +11647,13 @@ export const MODELS = {
11015
11647
  reasoning: true,
11016
11648
  input: ["text"],
11017
11649
  cost: {
11018
- input: 0.39,
11019
- output: 1.75,
11020
- cacheRead: 0.195,
11650
+ input: 0.38,
11651
+ output: 1.74,
11652
+ cacheRead: 0,
11021
11653
  cacheWrite: 0,
11022
11654
  },
11023
11655
  contextWindow: 202752,
11024
- maxTokens: 65535,
11656
+ maxTokens: 4096,
11025
11657
  },
11026
11658
  "z-ai/glm-4.7-flash": {
11027
11659
  id: "z-ai/glm-4.7-flash",
@@ -11034,11 +11666,11 @@ export const MODELS = {
11034
11666
  cost: {
11035
11667
  input: 0.06,
11036
11668
  output: 0.39999999999999997,
11037
- cacheRead: 0.0100000002,
11669
+ cacheRead: 0.01,
11038
11670
  cacheWrite: 0,
11039
11671
  },
11040
11672
  contextWindow: 202752,
11041
- maxTokens: 4096,
11673
+ maxTokens: 16384,
11042
11674
  },
11043
11675
  "z-ai/glm-5": {
11044
11676
  id: "z-ai/glm-5",
@@ -11054,8 +11686,8 @@ export const MODELS = {
11054
11686
  cacheRead: 0.119,
11055
11687
  cacheWrite: 0,
11056
11688
  },
11057
- contextWindow: 80000,
11058
- maxTokens: 131072,
11689
+ contextWindow: 202752,
11690
+ maxTokens: 16384,
11059
11691
  },
11060
11692
  "z-ai/glm-5-turbo": {
11061
11693
  id: "z-ai/glm-5-turbo",
@@ -11083,9 +11715,9 @@ export const MODELS = {
11083
11715
  reasoning: true,
11084
11716
  input: ["text"],
11085
11717
  cost: {
11086
- input: 0.95,
11087
- output: 3.15,
11088
- cacheRead: 0.475,
11718
+ input: 1.0499999999999998,
11719
+ output: 3.5,
11720
+ cacheRead: 0.5249999999999999,
11089
11721
  cacheWrite: 0,
11090
11722
  },
11091
11723
  contextWindow: 202752,
@@ -11108,6 +11740,142 @@ export const MODELS = {
11108
11740
  contextWindow: 202752,
11109
11741
  maxTokens: 131072,
11110
11742
  },
11743
+ "~anthropic/claude-haiku-latest": {
11744
+ id: "~anthropic/claude-haiku-latest",
11745
+ name: "Anthropic Claude Haiku Latest",
11746
+ api: "openai-completions",
11747
+ provider: "openrouter",
11748
+ baseUrl: "https://openrouter.ai/api/v1",
11749
+ reasoning: true,
11750
+ input: ["text", "image"],
11751
+ cost: {
11752
+ input: 1,
11753
+ output: 5,
11754
+ cacheRead: 0.09999999999999999,
11755
+ cacheWrite: 1.25,
11756
+ },
11757
+ contextWindow: 200000,
11758
+ maxTokens: 64000,
11759
+ },
11760
+ "~anthropic/claude-opus-latest": {
11761
+ id: "~anthropic/claude-opus-latest",
11762
+ name: "Anthropic: Claude Opus Latest",
11763
+ api: "openai-completions",
11764
+ provider: "openrouter",
11765
+ baseUrl: "https://openrouter.ai/api/v1",
11766
+ reasoning: true,
11767
+ input: ["text", "image"],
11768
+ cost: {
11769
+ input: 5,
11770
+ output: 25,
11771
+ cacheRead: 0.5,
11772
+ cacheWrite: 6.25,
11773
+ },
11774
+ contextWindow: 1000000,
11775
+ maxTokens: 128000,
11776
+ },
11777
+ "~anthropic/claude-sonnet-latest": {
11778
+ id: "~anthropic/claude-sonnet-latest",
11779
+ name: "Anthropic Claude Sonnet Latest",
11780
+ api: "openai-completions",
11781
+ provider: "openrouter",
11782
+ baseUrl: "https://openrouter.ai/api/v1",
11783
+ reasoning: true,
11784
+ input: ["text", "image"],
11785
+ cost: {
11786
+ input: 3,
11787
+ output: 15,
11788
+ cacheRead: 0.3,
11789
+ cacheWrite: 3.75,
11790
+ },
11791
+ contextWindow: 1000000,
11792
+ maxTokens: 128000,
11793
+ },
11794
+ "~google/gemini-flash-latest": {
11795
+ id: "~google/gemini-flash-latest",
11796
+ name: "Google Gemini Flash Latest",
11797
+ api: "openai-completions",
11798
+ provider: "openrouter",
11799
+ baseUrl: "https://openrouter.ai/api/v1",
11800
+ reasoning: true,
11801
+ input: ["text", "image"],
11802
+ cost: {
11803
+ input: 0.5,
11804
+ output: 3,
11805
+ cacheRead: 0.049999999999999996,
11806
+ cacheWrite: 0.08333333333333334,
11807
+ },
11808
+ contextWindow: 1048576,
11809
+ maxTokens: 65536,
11810
+ },
11811
+ "~google/gemini-pro-latest": {
11812
+ id: "~google/gemini-pro-latest",
11813
+ name: "Google Gemini Pro Latest",
11814
+ api: "openai-completions",
11815
+ provider: "openrouter",
11816
+ baseUrl: "https://openrouter.ai/api/v1",
11817
+ reasoning: true,
11818
+ input: ["text", "image"],
11819
+ cost: {
11820
+ input: 2,
11821
+ output: 12,
11822
+ cacheRead: 0.19999999999999998,
11823
+ cacheWrite: 0.375,
11824
+ },
11825
+ contextWindow: 1048576,
11826
+ maxTokens: 65536,
11827
+ },
11828
+ "~moonshotai/kimi-latest": {
11829
+ id: "~moonshotai/kimi-latest",
11830
+ name: "MoonshotAI Kimi Latest",
11831
+ api: "openai-completions",
11832
+ provider: "openrouter",
11833
+ baseUrl: "https://openrouter.ai/api/v1",
11834
+ reasoning: true,
11835
+ input: ["text", "image"],
11836
+ cost: {
11837
+ input: 0.74,
11838
+ output: 3.49,
11839
+ cacheRead: 0.14,
11840
+ cacheWrite: 0,
11841
+ },
11842
+ contextWindow: 262142,
11843
+ maxTokens: 262142,
11844
+ },
11845
+ "~openai/gpt-latest": {
11846
+ id: "~openai/gpt-latest",
11847
+ name: "OpenAI GPT Latest",
11848
+ api: "openai-completions",
11849
+ provider: "openrouter",
11850
+ baseUrl: "https://openrouter.ai/api/v1",
11851
+ reasoning: true,
11852
+ input: ["text", "image"],
11853
+ cost: {
11854
+ input: 5,
11855
+ output: 30,
11856
+ cacheRead: 0.5,
11857
+ cacheWrite: 0,
11858
+ },
11859
+ contextWindow: 1050000,
11860
+ maxTokens: 128000,
11861
+ },
11862
+ "~openai/gpt-mini-latest": {
11863
+ id: "~openai/gpt-mini-latest",
11864
+ name: "OpenAI GPT Mini Latest",
11865
+ api: "openai-completions",
11866
+ provider: "openrouter",
11867
+ baseUrl: "https://openrouter.ai/api/v1",
11868
+ reasoning: true,
11869
+ input: ["text", "image"],
11870
+ cost: {
11871
+ input: 0.75,
11872
+ output: 4.5,
11873
+ cacheRead: 0.075,
11874
+ cacheWrite: 0,
11875
+ },
11876
+ contextWindow: 400000,
11877
+ maxTokens: 128000,
11878
+ },
11111
11879
  },
11112
11880
  "vercel-ai-gateway": {
11113
11881
  "alibaba/qwen-3-14b": {
@@ -11178,22 +11946,39 @@ export const MODELS = {
11178
11946
  contextWindow: 128000,
11179
11947
  maxTokens: 8192,
11180
11948
  },
11949
+ "alibaba/qwen-3.6-max-preview": {
11950
+ id: "alibaba/qwen-3.6-max-preview",
11951
+ name: "Qwen 3.6 Max Preview",
11952
+ api: "anthropic-messages",
11953
+ provider: "vercel-ai-gateway",
11954
+ baseUrl: "https://ai-gateway.vercel.sh",
11955
+ reasoning: true,
11956
+ input: ["text", "image"],
11957
+ cost: {
11958
+ input: 1.3,
11959
+ output: 7.8,
11960
+ cacheRead: 0.26,
11961
+ cacheWrite: 1.625,
11962
+ },
11963
+ contextWindow: 240000,
11964
+ maxTokens: 64000,
11965
+ },
11181
11966
  "alibaba/qwen3-235b-a22b-thinking": {
11182
11967
  id: "alibaba/qwen3-235b-a22b-thinking",
11183
- name: "Qwen3 235B A22B Thinking 2507",
11968
+ name: "Qwen3 VL 235B A22B Thinking",
11184
11969
  api: "anthropic-messages",
11185
11970
  provider: "vercel-ai-gateway",
11186
11971
  baseUrl: "https://ai-gateway.vercel.sh",
11187
11972
  reasoning: true,
11188
11973
  input: ["text", "image"],
11189
11974
  cost: {
11190
- input: 0.22999999999999998,
11191
- output: 2.3,
11192
- cacheRead: 0.19999999999999998,
11975
+ input: 0.39999999999999997,
11976
+ output: 4,
11977
+ cacheRead: 0,
11193
11978
  cacheWrite: 0,
11194
11979
  },
11195
- contextWindow: 262114,
11196
- maxTokens: 262114,
11980
+ contextWindow: 131072,
11981
+ maxTokens: 32768,
11197
11982
  },
11198
11983
  "alibaba/qwen3-coder": {
11199
11984
  id: "alibaba/qwen3-coder",
@@ -11365,6 +12150,23 @@ export const MODELS = {
11365
12150
  contextWindow: 1000000,
11366
12151
  maxTokens: 64000,
11367
12152
  },
12153
+ "alibaba/qwen3.6-27b": {
12154
+ id: "alibaba/qwen3.6-27b",
12155
+ name: "Qwen 3.6 27B",
12156
+ api: "anthropic-messages",
12157
+ provider: "vercel-ai-gateway",
12158
+ baseUrl: "https://ai-gateway.vercel.sh",
12159
+ reasoning: true,
12160
+ input: ["text", "image"],
12161
+ cost: {
12162
+ input: 0.6,
12163
+ output: 3.5999999999999996,
12164
+ cacheRead: 0,
12165
+ cacheWrite: 0,
12166
+ },
12167
+ contextWindow: 256000,
12168
+ maxTokens: 256000,
12169
+ },
11368
12170
  "alibaba/qwen3.6-plus": {
11369
12171
  id: "alibaba/qwen3.6-plus",
11370
12172
  name: "Qwen 3.6 Plus",
@@ -11377,7 +12179,7 @@ export const MODELS = {
11377
12179
  input: 0.5,
11378
12180
  output: 3,
11379
12181
  cacheRead: 0.09999999999999999,
11380
- cacheWrite: 0,
12182
+ cacheWrite: 0.625,
11381
12183
  },
11382
12184
  contextWindow: 1000000,
11383
12185
  maxTokens: 64000,
@@ -11745,16 +12547,50 @@ export const MODELS = {
11745
12547
  api: "anthropic-messages",
11746
12548
  provider: "vercel-ai-gateway",
11747
12549
  baseUrl: "https://ai-gateway.vercel.sh",
12550
+ reasoning: false,
12551
+ input: ["text"],
12552
+ cost: {
12553
+ input: 0.62,
12554
+ output: 1.85,
12555
+ cacheRead: 0,
12556
+ cacheWrite: 0,
12557
+ },
12558
+ contextWindow: 128000,
12559
+ maxTokens: 8000,
12560
+ },
12561
+ "deepseek/deepseek-v4-flash": {
12562
+ id: "deepseek/deepseek-v4-flash",
12563
+ name: "DeepSeek V4 Flash",
12564
+ api: "anthropic-messages",
12565
+ provider: "vercel-ai-gateway",
12566
+ baseUrl: "https://ai-gateway.vercel.sh",
12567
+ reasoning: true,
12568
+ input: ["text"],
12569
+ cost: {
12570
+ input: 0.14,
12571
+ output: 0.28,
12572
+ cacheRead: 0.0028,
12573
+ cacheWrite: 0,
12574
+ },
12575
+ contextWindow: 1000000,
12576
+ maxTokens: 384000,
12577
+ },
12578
+ "deepseek/deepseek-v4-pro": {
12579
+ id: "deepseek/deepseek-v4-pro",
12580
+ name: "DeepSeek V4 Pro",
12581
+ api: "anthropic-messages",
12582
+ provider: "vercel-ai-gateway",
12583
+ baseUrl: "https://ai-gateway.vercel.sh",
11748
12584
  reasoning: true,
11749
12585
  input: ["text"],
11750
12586
  cost: {
11751
- input: 0.28,
11752
- output: 0.42,
11753
- cacheRead: 0.028,
12587
+ input: 0.435,
12588
+ output: 0.87,
12589
+ cacheRead: 0.0036,
11754
12590
  cacheWrite: 0,
11755
12591
  },
11756
- contextWindow: 128000,
11757
- maxTokens: 64000,
12592
+ contextWindow: 1000000,
12593
+ maxTokens: 384000,
11758
12594
  },
11759
12595
  "google/gemini-2.0-flash": {
11760
12596
  id: "google/gemini-2.0-flash",
@@ -12521,6 +13357,23 @@ export const MODELS = {
12521
13357
  contextWindow: 262114,
12522
13358
  maxTokens: 262114,
12523
13359
  },
13360
+ "moonshotai/kimi-k2.6": {
13361
+ id: "moonshotai/kimi-k2.6",
13362
+ name: "Kimi K2.6",
13363
+ api: "anthropic-messages",
13364
+ provider: "vercel-ai-gateway",
13365
+ baseUrl: "https://ai-gateway.vercel.sh",
13366
+ reasoning: true,
13367
+ input: ["text", "image"],
13368
+ cost: {
13369
+ input: 0.95,
13370
+ output: 4,
13371
+ cacheRead: 0.16,
13372
+ cacheWrite: 0,
13373
+ },
13374
+ contextWindow: 262000,
13375
+ maxTokens: 262000,
13376
+ },
12524
13377
  "nvidia/nemotron-nano-12b-v2-vl": {
12525
13378
  id: "nvidia/nemotron-nano-12b-v2-vl",
12526
13379
  name: "Nvidia Nemotron Nano 12B V2 VL",
@@ -13014,6 +13867,40 @@ export const MODELS = {
13014
13867
  contextWindow: 1050000,
13015
13868
  maxTokens: 128000,
13016
13869
  },
13870
+ "openai/gpt-5.5": {
13871
+ id: "openai/gpt-5.5",
13872
+ name: "GPT 5.5",
13873
+ api: "anthropic-messages",
13874
+ provider: "vercel-ai-gateway",
13875
+ baseUrl: "https://ai-gateway.vercel.sh",
13876
+ reasoning: true,
13877
+ input: ["text", "image"],
13878
+ cost: {
13879
+ input: 5,
13880
+ output: 30,
13881
+ cacheRead: 0.5,
13882
+ cacheWrite: 0,
13883
+ },
13884
+ contextWindow: 1000000,
13885
+ maxTokens: 128000,
13886
+ },
13887
+ "openai/gpt-5.5-pro": {
13888
+ id: "openai/gpt-5.5-pro",
13889
+ name: "GPT 5.5 Pro",
13890
+ api: "anthropic-messages",
13891
+ provider: "vercel-ai-gateway",
13892
+ baseUrl: "https://ai-gateway.vercel.sh",
13893
+ reasoning: true,
13894
+ input: ["text", "image"],
13895
+ cost: {
13896
+ input: 30,
13897
+ output: 180,
13898
+ cacheRead: 0,
13899
+ cacheWrite: 0,
13900
+ },
13901
+ contextWindow: 1000000,
13902
+ maxTokens: 128000,
13903
+ },
13017
13904
  "openai/gpt-oss-20b": {
13018
13905
  id: "openai/gpt-oss-20b",
13019
13906
  name: "GPT OSS 120B",
@@ -13184,23 +14071,6 @@ export const MODELS = {
13184
14071
  contextWindow: 200000,
13185
14072
  maxTokens: 8000,
13186
14073
  },
13187
- "prime-intellect/intellect-3": {
13188
- id: "prime-intellect/intellect-3",
13189
- name: "INTELLECT 3",
13190
- api: "anthropic-messages",
13191
- provider: "vercel-ai-gateway",
13192
- baseUrl: "https://ai-gateway.vercel.sh",
13193
- reasoning: true,
13194
- input: ["text"],
13195
- cost: {
13196
- input: 0.19999999999999998,
13197
- output: 1.1,
13198
- cacheRead: 0,
13199
- cacheWrite: 0,
13200
- },
13201
- contextWindow: 131072,
13202
- maxTokens: 131072,
13203
- },
13204
14074
  "xai/grok-3": {
13205
14075
  id: "xai/grok-3",
13206
14076
  name: "Grok 3 Beta",
@@ -13456,6 +14326,23 @@ export const MODELS = {
13456
14326
  contextWindow: 2000000,
13457
14327
  maxTokens: 2000000,
13458
14328
  },
14329
+ "xai/grok-4.3": {
14330
+ id: "xai/grok-4.3",
14331
+ name: "Grok 4.3",
14332
+ api: "anthropic-messages",
14333
+ provider: "vercel-ai-gateway",
14334
+ baseUrl: "https://ai-gateway.vercel.sh",
14335
+ reasoning: true,
14336
+ input: ["text", "image"],
14337
+ cost: {
14338
+ input: 1.25,
14339
+ output: 2.5,
14340
+ cacheRead: 0.19999999999999998,
14341
+ cacheWrite: 0,
14342
+ },
14343
+ contextWindow: 1000000,
14344
+ maxTokens: 1000000,
14345
+ },
13459
14346
  "xai/grok-code-fast-1": {
13460
14347
  id: "xai/grok-code-fast-1",
13461
14348
  name: "Grok Code Fast 1",
@@ -13482,9 +14369,9 @@ export const MODELS = {
13482
14369
  reasoning: true,
13483
14370
  input: ["text"],
13484
14371
  cost: {
13485
- input: 0.09,
13486
- output: 0.29,
13487
- cacheRead: 0.045,
14372
+ input: 0.09999999999999999,
14373
+ output: 0.3,
14374
+ cacheRead: 0.01,
13488
14375
  cacheWrite: 0,
13489
14376
  },
13490
14377
  contextWindow: 262144,
@@ -13507,6 +14394,40 @@ export const MODELS = {
13507
14394
  contextWindow: 1000000,
13508
14395
  maxTokens: 128000,
13509
14396
  },
14397
+ "xiaomi/mimo-v2.5": {
14398
+ id: "xiaomi/mimo-v2.5",
14399
+ name: "MiMo M2.5",
14400
+ api: "anthropic-messages",
14401
+ provider: "vercel-ai-gateway",
14402
+ baseUrl: "https://ai-gateway.vercel.sh",
14403
+ reasoning: true,
14404
+ input: ["text", "image"],
14405
+ cost: {
14406
+ input: 0.39999999999999997,
14407
+ output: 2,
14408
+ cacheRead: 0.08,
14409
+ cacheWrite: 0,
14410
+ },
14411
+ contextWindow: 1050000,
14412
+ maxTokens: 131100,
14413
+ },
14414
+ "xiaomi/mimo-v2.5-pro": {
14415
+ id: "xiaomi/mimo-v2.5-pro",
14416
+ name: "MiMo V2.5 Pro",
14417
+ api: "anthropic-messages",
14418
+ provider: "vercel-ai-gateway",
14419
+ baseUrl: "https://ai-gateway.vercel.sh",
14420
+ reasoning: true,
14421
+ input: ["text", "image"],
14422
+ cost: {
14423
+ input: 1,
14424
+ output: 3,
14425
+ cacheRead: 0.19999999999999998,
14426
+ cacheWrite: 0,
14427
+ },
14428
+ contextWindow: 1050000,
14429
+ maxTokens: 131000,
14430
+ },
13510
14431
  "zai/glm-4.5": {
13511
14432
  id: "zai/glm-4.5",
13512
14433
  name: "GLM-4.5",
@@ -13701,15 +14622,15 @@ export const MODELS = {
13701
14622
  provider: "vercel-ai-gateway",
13702
14623
  baseUrl: "https://ai-gateway.vercel.sh",
13703
14624
  reasoning: true,
13704
- input: ["text", "image"],
14625
+ input: ["text"],
13705
14626
  cost: {
13706
14627
  input: 1.4,
13707
14628
  output: 4.4,
13708
14629
  cacheRead: 0.26,
13709
14630
  cacheWrite: 0,
13710
14631
  },
13711
- contextWindow: 202752,
13712
- maxTokens: 202752,
14632
+ contextWindow: 202800,
14633
+ maxTokens: 64000,
13713
14634
  },
13714
14635
  "zai/glm-5v-turbo": {
13715
14636
  id: "zai/glm-5v-turbo",
@@ -14087,6 +15008,23 @@ export const MODELS = {
14087
15008
  contextWindow: 2000000,
14088
15009
  maxTokens: 30000,
14089
15010
  },
15011
+ "grok-4.3": {
15012
+ id: "grok-4.3",
15013
+ name: "Grok 4.3",
15014
+ api: "openai-completions",
15015
+ provider: "xai",
15016
+ baseUrl: "https://api.x.ai/v1",
15017
+ reasoning: true,
15018
+ input: ["text", "image"],
15019
+ cost: {
15020
+ input: 1.25,
15021
+ output: 2.5,
15022
+ cacheRead: 0.2,
15023
+ cacheWrite: 0,
15024
+ },
15025
+ contextWindow: 1000000,
15026
+ maxTokens: 30000,
15027
+ },
14090
15028
  "grok-beta": {
14091
15029
  id: "grok-beta",
14092
15030
  name: "Grok Beta",
@@ -14140,24 +15078,6 @@ export const MODELS = {
14140
15078
  },
14141
15079
  },
14142
15080
  "zai": {
14143
- "glm-4.5": {
14144
- id: "glm-4.5",
14145
- name: "GLM-4.5",
14146
- api: "openai-completions",
14147
- provider: "zai",
14148
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14149
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14150
- reasoning: true,
14151
- input: ["text"],
14152
- cost: {
14153
- input: 0,
14154
- output: 0,
14155
- cacheRead: 0,
14156
- cacheWrite: 0,
14157
- },
14158
- contextWindow: 131072,
14159
- maxTokens: 98304,
14160
- },
14161
15081
  "glm-4.5-air": {
14162
15082
  id: "glm-4.5-air",
14163
15083
  name: "GLM-4.5-Air",
@@ -14176,78 +15096,6 @@ export const MODELS = {
14176
15096
  contextWindow: 131072,
14177
15097
  maxTokens: 98304,
14178
15098
  },
14179
- "glm-4.5-flash": {
14180
- id: "glm-4.5-flash",
14181
- name: "GLM-4.5-Flash",
14182
- api: "openai-completions",
14183
- provider: "zai",
14184
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14185
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14186
- reasoning: true,
14187
- input: ["text"],
14188
- cost: {
14189
- input: 0,
14190
- output: 0,
14191
- cacheRead: 0,
14192
- cacheWrite: 0,
14193
- },
14194
- contextWindow: 131072,
14195
- maxTokens: 98304,
14196
- },
14197
- "glm-4.5v": {
14198
- id: "glm-4.5v",
14199
- name: "GLM-4.5V",
14200
- api: "openai-completions",
14201
- provider: "zai",
14202
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14203
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14204
- reasoning: true,
14205
- input: ["text", "image"],
14206
- cost: {
14207
- input: 0,
14208
- output: 0,
14209
- cacheRead: 0,
14210
- cacheWrite: 0,
14211
- },
14212
- contextWindow: 64000,
14213
- maxTokens: 16384,
14214
- },
14215
- "glm-4.6": {
14216
- id: "glm-4.6",
14217
- name: "GLM-4.6",
14218
- api: "openai-completions",
14219
- provider: "zai",
14220
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14221
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
14222
- reasoning: true,
14223
- input: ["text"],
14224
- cost: {
14225
- input: 0,
14226
- output: 0,
14227
- cacheRead: 0,
14228
- cacheWrite: 0,
14229
- },
14230
- contextWindow: 204800,
14231
- maxTokens: 131072,
14232
- },
14233
- "glm-4.6v": {
14234
- id: "glm-4.6v",
14235
- name: "GLM-4.6V",
14236
- api: "openai-completions",
14237
- provider: "zai",
14238
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14239
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
14240
- reasoning: true,
14241
- input: ["text", "image"],
14242
- cost: {
14243
- input: 0,
14244
- output: 0,
14245
- cacheRead: 0,
14246
- cacheWrite: 0,
14247
- },
14248
- contextWindow: 128000,
14249
- maxTokens: 32768,
14250
- },
14251
15099
  "glm-4.7": {
14252
15100
  id: "glm-4.7",
14253
15101
  name: "GLM-4.7",
@@ -14266,60 +15114,6 @@ export const MODELS = {
14266
15114
  contextWindow: 204800,
14267
15115
  maxTokens: 131072,
14268
15116
  },
14269
- "glm-4.7-flash": {
14270
- id: "glm-4.7-flash",
14271
- name: "GLM-4.7-Flash",
14272
- api: "openai-completions",
14273
- provider: "zai",
14274
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14275
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
14276
- reasoning: true,
14277
- input: ["text"],
14278
- cost: {
14279
- input: 0,
14280
- output: 0,
14281
- cacheRead: 0,
14282
- cacheWrite: 0,
14283
- },
14284
- contextWindow: 200000,
14285
- maxTokens: 131072,
14286
- },
14287
- "glm-4.7-flashx": {
14288
- id: "glm-4.7-flashx",
14289
- name: "GLM-4.7-FlashX",
14290
- api: "openai-completions",
14291
- provider: "zai",
14292
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14293
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
14294
- reasoning: true,
14295
- input: ["text"],
14296
- cost: {
14297
- input: 0.07,
14298
- output: 0.4,
14299
- cacheRead: 0.01,
14300
- cacheWrite: 0,
14301
- },
14302
- contextWindow: 200000,
14303
- maxTokens: 131072,
14304
- },
14305
- "glm-5": {
14306
- id: "glm-5",
14307
- name: "GLM-5",
14308
- api: "openai-completions",
14309
- provider: "zai",
14310
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14311
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
14312
- reasoning: true,
14313
- input: ["text"],
14314
- cost: {
14315
- input: 0,
14316
- output: 0,
14317
- cacheRead: 0,
14318
- cacheWrite: 0,
14319
- },
14320
- contextWindow: 204800,
14321
- maxTokens: 131072,
14322
- },
14323
15117
  "glm-5-turbo": {
14324
15118
  id: "glm-5-turbo",
14325
15119
  name: "GLM-5-Turbo",
@@ -14358,7 +15152,7 @@ export const MODELS = {
14358
15152
  },
14359
15153
  "glm-5v-turbo": {
14360
15154
  id: "glm-5v-turbo",
14361
- name: "glm-5v-turbo",
15155
+ name: "GLM-5V-Turbo",
14362
15156
  api: "openai-completions",
14363
15157
  provider: "zai",
14364
15158
  baseUrl: "https://api.z.ai/api/coding/paas/v4",