@avadisabelle/ava-pi-ai 0.64.9 → 0.65.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (79) hide show
  1. package/README.md +86 -0
  2. package/dist/cli.d.ts.map +1 -1
  3. package/dist/cli.js +1 -1
  4. package/dist/cli.js.map +1 -1
  5. package/dist/index.d.ts +3 -1
  6. package/dist/index.d.ts.map +1 -1
  7. package/dist/index.js +1 -0
  8. package/dist/index.js.map +1 -1
  9. package/dist/models.d.ts +1 -1
  10. package/dist/models.d.ts.map +1 -1
  11. package/dist/models.generated.d.ts +860 -422
  12. package/dist/models.generated.d.ts.map +1 -1
  13. package/dist/models.generated.js +966 -513
  14. package/dist/models.generated.js.map +1 -1
  15. package/dist/models.js +5 -2
  16. package/dist/models.js.map +1 -1
  17. package/dist/providers/amazon-bedrock.d.ts +23 -0
  18. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  19. package/dist/providers/amazon-bedrock.js +138 -33
  20. package/dist/providers/amazon-bedrock.js.map +1 -1
  21. package/dist/providers/anthropic.d.ts +16 -2
  22. package/dist/providers/anthropic.d.ts.map +1 -1
  23. package/dist/providers/anthropic.js +63 -26
  24. package/dist/providers/anthropic.js.map +1 -1
  25. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  26. package/dist/providers/azure-openai-responses.js +14 -15
  27. package/dist/providers/azure-openai-responses.js.map +1 -1
  28. package/dist/providers/faux.d.ts +56 -0
  29. package/dist/providers/faux.d.ts.map +1 -0
  30. package/dist/providers/faux.js +368 -0
  31. package/dist/providers/faux.js.map +1 -0
  32. package/dist/providers/google-gemini-cli.d.ts.map +1 -1
  33. package/dist/providers/google-gemini-cli.js +20 -1
  34. package/dist/providers/google-gemini-cli.js.map +1 -1
  35. package/dist/providers/google-shared.d.ts.map +1 -1
  36. package/dist/providers/google-shared.js +28 -1
  37. package/dist/providers/google-shared.js.map +1 -1
  38. package/dist/providers/google-vertex.d.ts.map +1 -1
  39. package/dist/providers/google-vertex.js +20 -2
  40. package/dist/providers/google-vertex.js.map +1 -1
  41. package/dist/providers/google.d.ts.map +1 -1
  42. package/dist/providers/google.js +45 -4
  43. package/dist/providers/google.js.map +1 -1
  44. package/dist/providers/mistral.d.ts +3 -0
  45. package/dist/providers/mistral.d.ts.map +1 -1
  46. package/dist/providers/mistral.js +37 -4
  47. package/dist/providers/mistral.js.map +1 -1
  48. package/dist/providers/openai-codex-responses.d.ts +2 -0
  49. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  50. package/dist/providers/openai-codex-responses.js +49 -12
  51. package/dist/providers/openai-codex-responses.js.map +1 -1
  52. package/dist/providers/openai-completions.d.ts.map +1 -1
  53. package/dist/providers/openai-completions.js +48 -14
  54. package/dist/providers/openai-completions.js.map +1 -1
  55. package/dist/providers/openai-responses-shared.d.ts +1 -0
  56. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  57. package/dist/providers/openai-responses-shared.js +39 -10
  58. package/dist/providers/openai-responses-shared.js.map +1 -1
  59. package/dist/providers/openai-responses.d.ts.map +1 -1
  60. package/dist/providers/openai-responses.js +23 -18
  61. package/dist/providers/openai-responses.js.map +1 -1
  62. package/dist/providers/simple-options.d.ts.map +1 -1
  63. package/dist/providers/simple-options.js +4 -1
  64. package/dist/providers/simple-options.js.map +1 -1
  65. package/dist/providers/transform-messages.d.ts.map +1 -1
  66. package/dist/providers/transform-messages.js +20 -32
  67. package/dist/providers/transform-messages.js.map +1 -1
  68. package/dist/types.d.ts +82 -4
  69. package/dist/types.d.ts.map +1 -1
  70. package/dist/types.js.map +1 -1
  71. package/dist/utils/headers.d.ts +2 -0
  72. package/dist/utils/headers.d.ts.map +1 -0
  73. package/dist/utils/headers.js +8 -0
  74. package/dist/utils/headers.js.map +1 -0
  75. package/dist/utils/overflow.d.ts +4 -3
  76. package/dist/utils/overflow.d.ts.map +1 -1
  77. package/dist/utils/overflow.js +28 -13
  78. package/dist/utils/overflow.js.map +1 -1
  79. package/package.json +4 -4
@@ -325,6 +325,40 @@ export const MODELS = {
325
325
  contextWindow: 1000000,
326
326
  maxTokens: 64000,
327
327
  },
328
+ "au.anthropic.claude-opus-4-6-v1": {
329
+ id: "au.anthropic.claude-opus-4-6-v1",
330
+ name: "AU Anthropic Claude Opus 4.6",
331
+ api: "bedrock-converse-stream",
332
+ provider: "amazon-bedrock",
333
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
334
+ reasoning: true,
335
+ input: ["text", "image"],
336
+ cost: {
337
+ input: 16.5,
338
+ output: 82.5,
339
+ cacheRead: 0.5,
340
+ cacheWrite: 6.25,
341
+ },
342
+ contextWindow: 1000000,
343
+ maxTokens: 128000,
344
+ },
345
+ "au.anthropic.claude-sonnet-4-6": {
346
+ id: "au.anthropic.claude-sonnet-4-6",
347
+ name: "AU Anthropic Claude Sonnet 4.6",
348
+ api: "bedrock-converse-stream",
349
+ provider: "amazon-bedrock",
350
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
351
+ reasoning: true,
352
+ input: ["text", "image"],
353
+ cost: {
354
+ input: 3.3,
355
+ output: 16.5,
356
+ cacheRead: 0.33,
357
+ cacheWrite: 4.125,
358
+ },
359
+ contextWindow: 1000000,
360
+ maxTokens: 128000,
361
+ },
328
362
  "deepseek.r1-v1:0": {
329
363
  id: "deepseek.r1-v1:0",
330
364
  name: "DeepSeek-R1",
@@ -2488,6 +2522,23 @@ export const MODELS = {
2488
2522
  contextWindow: 1050000,
2489
2523
  maxTokens: 128000,
2490
2524
  },
2525
+ "gpt-5.5": {
2526
+ id: "gpt-5.5",
2527
+ name: "GPT-5.5",
2528
+ api: "azure-openai-responses",
2529
+ provider: "azure-openai-responses",
2530
+ baseUrl: "",
2531
+ reasoning: true,
2532
+ input: ["text", "image"],
2533
+ cost: {
2534
+ input: 5,
2535
+ output: 30,
2536
+ cacheRead: 0.5,
2537
+ cacheWrite: 0,
2538
+ },
2539
+ contextWindow: 1050000,
2540
+ maxTokens: 128000,
2541
+ },
2491
2542
  "o1": {
2492
2543
  id: "o1",
2493
2544
  name: "o1",
@@ -3134,6 +3185,24 @@ export const MODELS = {
3134
3185
  contextWindow: 400000,
3135
3186
  maxTokens: 128000,
3136
3187
  },
3188
+ "gpt-5.5": {
3189
+ id: "gpt-5.5",
3190
+ name: "GPT-5.5",
3191
+ api: "openai-responses",
3192
+ provider: "github-copilot",
3193
+ baseUrl: "https://api.individual.githubcopilot.com",
3194
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
3195
+ reasoning: true,
3196
+ input: ["text", "image"],
3197
+ cost: {
3198
+ input: 0,
3199
+ output: 0,
3200
+ cacheRead: 0,
3201
+ cacheWrite: 0,
3202
+ },
3203
+ contextWindow: 400000,
3204
+ maxTokens: 128000,
3205
+ },
3137
3206
  "grok-code-fast-1": {
3138
3207
  id: "grok-code-fast-1",
3139
3208
  name: "Grok Code Fast 1",
@@ -3251,7 +3320,7 @@ export const MODELS = {
3251
3320
  cost: {
3252
3321
  input: 0.3,
3253
3322
  output: 2.5,
3254
- cacheRead: 0.075,
3323
+ cacheRead: 0.03,
3255
3324
  cacheWrite: 0,
3256
3325
  },
3257
3326
  contextWindow: 1048576,
@@ -3370,7 +3439,7 @@ export const MODELS = {
3370
3439
  cost: {
3371
3440
  input: 1.25,
3372
3441
  output: 10,
3373
- cacheRead: 0.31,
3442
+ cacheRead: 0.125,
3374
3443
  cacheWrite: 0,
3375
3444
  },
3376
3445
  contextWindow: 1048576,
@@ -3580,8 +3649,8 @@ export const MODELS = {
3580
3649
  contextWindow: 131072,
3581
3650
  maxTokens: 8192,
3582
3651
  },
3583
- "gemma-4-26b-it": {
3584
- id: "gemma-4-26b-it",
3652
+ "gemma-4-26b-a4b-it": {
3653
+ id: "gemma-4-26b-a4b-it",
3585
3654
  name: "Gemma 4 26B",
3586
3655
  api: "google-generative-ai",
3587
3656
  provider: "google",
@@ -4079,6 +4148,23 @@ export const MODELS = {
4079
4148
  contextWindow: 1048576,
4080
4149
  maxTokens: 65536,
4081
4150
  },
4151
+ "gemini-3.1-pro-preview-customtools": {
4152
+ id: "gemini-3.1-pro-preview-customtools",
4153
+ name: "Gemini 3.1 Pro Preview Custom Tools (Vertex)",
4154
+ api: "google-vertex",
4155
+ provider: "google-vertex",
4156
+ baseUrl: "https://{location}-aiplatform.googleapis.com",
4157
+ reasoning: true,
4158
+ input: ["text", "image"],
4159
+ cost: {
4160
+ input: 2,
4161
+ output: 12,
4162
+ cacheRead: 0.2,
4163
+ cacheWrite: 0,
4164
+ },
4165
+ contextWindow: 1048576,
4166
+ maxTokens: 65536,
4167
+ },
4082
4168
  },
4083
4169
  "groq": {
4084
4170
  "deepseek-r1-distill-llama-70b": {
@@ -4605,6 +4691,24 @@ export const MODELS = {
4605
4691
  contextWindow: 163840,
4606
4692
  maxTokens: 65536,
4607
4693
  },
4694
+ "deepseek-ai/DeepSeek-V4-Pro": {
4695
+ id: "deepseek-ai/DeepSeek-V4-Pro",
4696
+ name: "DeepSeek V4 Pro",
4697
+ api: "openai-completions",
4698
+ provider: "huggingface",
4699
+ baseUrl: "https://router.huggingface.co/v1",
4700
+ compat: { "supportsDeveloperRole": false },
4701
+ reasoning: true,
4702
+ input: ["text"],
4703
+ cost: {
4704
+ input: 1.74,
4705
+ output: 3.48,
4706
+ cacheRead: 0.145,
4707
+ cacheWrite: 0,
4708
+ },
4709
+ contextWindow: 1048576,
4710
+ maxTokens: 393216,
4711
+ },
4608
4712
  "moonshotai/Kimi-K2-Instruct": {
4609
4713
  id: "moonshotai/Kimi-K2-Instruct",
4610
4714
  name: "Kimi-K2-Instruct",
@@ -4677,6 +4781,24 @@ export const MODELS = {
4677
4781
  contextWindow: 262144,
4678
4782
  maxTokens: 262144,
4679
4783
  },
4784
+ "moonshotai/Kimi-K2.6": {
4785
+ id: "moonshotai/Kimi-K2.6",
4786
+ name: "Kimi-K2.6",
4787
+ api: "openai-completions",
4788
+ provider: "huggingface",
4789
+ baseUrl: "https://router.huggingface.co/v1",
4790
+ compat: { "supportsDeveloperRole": false },
4791
+ reasoning: true,
4792
+ input: ["text", "image"],
4793
+ cost: {
4794
+ input: 0.95,
4795
+ output: 4,
4796
+ cacheRead: 0.16,
4797
+ cacheWrite: 0,
4798
+ },
4799
+ contextWindow: 262144,
4800
+ maxTokens: 262144,
4801
+ },
4680
4802
  "zai-org/GLM-4.7": {
4681
4803
  id: "zai-org/GLM-4.7",
4682
4804
  name: "GLM-4.7",
@@ -4751,9 +4873,9 @@ export const MODELS = {
4751
4873
  },
4752
4874
  },
4753
4875
  "kimi-coding": {
4754
- "k2p5": {
4755
- id: "k2p5",
4756
- name: "Kimi K2.5",
4876
+ "k2p6": {
4877
+ id: "k2p6",
4878
+ name: "Kimi K2.6",
4757
4879
  api: "anthropic-messages",
4758
4880
  provider: "kimi-coding",
4759
4881
  baseUrl: "https://api.kimi.com/coding",
@@ -4768,14 +4890,14 @@ export const MODELS = {
4768
4890
  contextWindow: 262144,
4769
4891
  maxTokens: 32768,
4770
4892
  },
4771
- "kimi-k2-thinking": {
4772
- id: "kimi-k2-thinking",
4773
- name: "Kimi K2 Thinking",
4893
+ "kimi-for-coding": {
4894
+ id: "kimi-for-coding",
4895
+ name: "Kimi For Coding",
4774
4896
  api: "anthropic-messages",
4775
4897
  provider: "kimi-coding",
4776
4898
  baseUrl: "https://api.kimi.com/coding",
4777
4899
  reasoning: true,
4778
- input: ["text"],
4900
+ input: ["text", "image"],
4779
4901
  cost: {
4780
4902
  input: 0,
4781
4903
  output: 0,
@@ -4785,93 +4907,25 @@ export const MODELS = {
4785
4907
  contextWindow: 262144,
4786
4908
  maxTokens: 32768,
4787
4909
  },
4788
- },
4789
- "minimax": {
4790
- "MiniMax-M2": {
4791
- id: "MiniMax-M2",
4792
- name: "MiniMax-M2",
4793
- api: "anthropic-messages",
4794
- provider: "minimax",
4795
- baseUrl: "https://api.minimax.io/anthropic",
4796
- reasoning: true,
4797
- input: ["text"],
4798
- cost: {
4799
- input: 0.3,
4800
- output: 1.2,
4801
- cacheRead: 0,
4802
- cacheWrite: 0,
4803
- },
4804
- contextWindow: 204800,
4805
- maxTokens: 131072,
4806
- },
4807
- "MiniMax-M2.1": {
4808
- id: "MiniMax-M2.1",
4809
- name: "MiniMax-M2.1",
4810
- api: "anthropic-messages",
4811
- provider: "minimax",
4812
- baseUrl: "https://api.minimax.io/anthropic",
4813
- reasoning: true,
4814
- input: ["text"],
4815
- cost: {
4816
- input: 0.3,
4817
- output: 1.2,
4818
- cacheRead: 0,
4819
- cacheWrite: 0,
4820
- },
4821
- contextWindow: 204800,
4822
- maxTokens: 131072,
4823
- },
4824
- "MiniMax-M2.1-highspeed": {
4825
- id: "MiniMax-M2.1-highspeed",
4826
- name: "MiniMax-M2.1-highspeed",
4910
+ "kimi-k2-thinking": {
4911
+ id: "kimi-k2-thinking",
4912
+ name: "Kimi K2 Thinking",
4827
4913
  api: "anthropic-messages",
4828
- provider: "minimax",
4829
- baseUrl: "https://api.minimax.io/anthropic",
4914
+ provider: "kimi-coding",
4915
+ baseUrl: "https://api.kimi.com/coding",
4830
4916
  reasoning: true,
4831
4917
  input: ["text"],
4832
4918
  cost: {
4833
- input: 0.6,
4834
- output: 2.4,
4919
+ input: 0,
4920
+ output: 0,
4835
4921
  cacheRead: 0,
4836
4922
  cacheWrite: 0,
4837
4923
  },
4838
- contextWindow: 204800,
4839
- maxTokens: 131072,
4840
- },
4841
- "MiniMax-M2.5": {
4842
- id: "MiniMax-M2.5",
4843
- name: "MiniMax-M2.5",
4844
- api: "anthropic-messages",
4845
- provider: "minimax",
4846
- baseUrl: "https://api.minimax.io/anthropic",
4847
- reasoning: true,
4848
- input: ["text"],
4849
- cost: {
4850
- input: 0.3,
4851
- output: 1.2,
4852
- cacheRead: 0.03,
4853
- cacheWrite: 0.375,
4854
- },
4855
- contextWindow: 204800,
4856
- maxTokens: 131072,
4857
- },
4858
- "MiniMax-M2.5-highspeed": {
4859
- id: "MiniMax-M2.5-highspeed",
4860
- name: "MiniMax-M2.5-highspeed",
4861
- api: "anthropic-messages",
4862
- provider: "minimax",
4863
- baseUrl: "https://api.minimax.io/anthropic",
4864
- reasoning: true,
4865
- input: ["text"],
4866
- cost: {
4867
- input: 0.6,
4868
- output: 2.4,
4869
- cacheRead: 0.06,
4870
- cacheWrite: 0.375,
4871
- },
4872
- contextWindow: 204800,
4873
- maxTokens: 131072,
4924
+ contextWindow: 262144,
4925
+ maxTokens: 32768,
4874
4926
  },
4927
+ },
4928
+ "minimax": {
4875
4929
  "MiniMax-M2.7": {
4876
4930
  id: "MiniMax-M2.7",
4877
4931
  name: "MiniMax-M2.7",
@@ -4908,91 +4962,6 @@ export const MODELS = {
4908
4962
  },
4909
4963
  },
4910
4964
  "minimax-cn": {
4911
- "MiniMax-M2": {
4912
- id: "MiniMax-M2",
4913
- name: "MiniMax-M2",
4914
- api: "anthropic-messages",
4915
- provider: "minimax-cn",
4916
- baseUrl: "https://api.minimaxi.com/anthropic",
4917
- reasoning: true,
4918
- input: ["text"],
4919
- cost: {
4920
- input: 0.3,
4921
- output: 1.2,
4922
- cacheRead: 0,
4923
- cacheWrite: 0,
4924
- },
4925
- contextWindow: 204800,
4926
- maxTokens: 131072,
4927
- },
4928
- "MiniMax-M2.1": {
4929
- id: "MiniMax-M2.1",
4930
- name: "MiniMax-M2.1",
4931
- api: "anthropic-messages",
4932
- provider: "minimax-cn",
4933
- baseUrl: "https://api.minimaxi.com/anthropic",
4934
- reasoning: true,
4935
- input: ["text"],
4936
- cost: {
4937
- input: 0.3,
4938
- output: 1.2,
4939
- cacheRead: 0,
4940
- cacheWrite: 0,
4941
- },
4942
- contextWindow: 204800,
4943
- maxTokens: 131072,
4944
- },
4945
- "MiniMax-M2.1-highspeed": {
4946
- id: "MiniMax-M2.1-highspeed",
4947
- name: "MiniMax-M2.1-highspeed",
4948
- api: "anthropic-messages",
4949
- provider: "minimax-cn",
4950
- baseUrl: "https://api.minimaxi.com/anthropic",
4951
- reasoning: true,
4952
- input: ["text"],
4953
- cost: {
4954
- input: 0.6,
4955
- output: 2.4,
4956
- cacheRead: 0,
4957
- cacheWrite: 0,
4958
- },
4959
- contextWindow: 204800,
4960
- maxTokens: 131072,
4961
- },
4962
- "MiniMax-M2.5": {
4963
- id: "MiniMax-M2.5",
4964
- name: "MiniMax-M2.5",
4965
- api: "anthropic-messages",
4966
- provider: "minimax-cn",
4967
- baseUrl: "https://api.minimaxi.com/anthropic",
4968
- reasoning: true,
4969
- input: ["text"],
4970
- cost: {
4971
- input: 0.3,
4972
- output: 1.2,
4973
- cacheRead: 0.03,
4974
- cacheWrite: 0.375,
4975
- },
4976
- contextWindow: 204800,
4977
- maxTokens: 131072,
4978
- },
4979
- "MiniMax-M2.5-highspeed": {
4980
- id: "MiniMax-M2.5-highspeed",
4981
- name: "MiniMax-M2.5-highspeed",
4982
- api: "anthropic-messages",
4983
- provider: "minimax-cn",
4984
- baseUrl: "https://api.minimaxi.com/anthropic",
4985
- reasoning: true,
4986
- input: ["text"],
4987
- cost: {
4988
- input: 0.6,
4989
- output: 2.4,
4990
- cacheRead: 0.06,
4991
- cacheWrite: 0.375,
4992
- },
4993
- contextWindow: 204800,
4994
- maxTokens: 131072,
4995
- },
4996
4965
  "MiniMax-M2.7": {
4997
4966
  id: "MiniMax-M2.7",
4998
4967
  name: "MiniMax-M2.7",
@@ -6017,17 +5986,34 @@ export const MODELS = {
6017
5986
  contextWindow: 1050000,
6018
5987
  maxTokens: 128000,
6019
5988
  },
6020
- "o1": {
6021
- id: "o1",
6022
- name: "o1",
5989
+ "gpt-5.5": {
5990
+ id: "gpt-5.5",
5991
+ name: "GPT-5.5",
6023
5992
  api: "openai-responses",
6024
5993
  provider: "openai",
6025
5994
  baseUrl: "https://api.openai.com/v1",
6026
5995
  reasoning: true,
6027
5996
  input: ["text", "image"],
6028
5997
  cost: {
6029
- input: 15,
6030
- output: 60,
5998
+ input: 5,
5999
+ output: 30,
6000
+ cacheRead: 0.5,
6001
+ cacheWrite: 0,
6002
+ },
6003
+ contextWindow: 1050000,
6004
+ maxTokens: 128000,
6005
+ },
6006
+ "o1": {
6007
+ id: "o1",
6008
+ name: "o1",
6009
+ api: "openai-responses",
6010
+ provider: "openai",
6011
+ baseUrl: "https://api.openai.com/v1",
6012
+ reasoning: true,
6013
+ input: ["text", "image"],
6014
+ cost: {
6015
+ input: 15,
6016
+ output: 60,
6031
6017
  cacheRead: 7.5,
6032
6018
  cacheWrite: 0,
6033
6019
  },
@@ -6327,23 +6313,6 @@ export const MODELS = {
6327
6313
  contextWindow: 200000,
6328
6314
  maxTokens: 128000,
6329
6315
  },
6330
- "claude-3-5-haiku": {
6331
- id: "claude-3-5-haiku",
6332
- name: "Claude Haiku 3.5",
6333
- api: "anthropic-messages",
6334
- provider: "opencode",
6335
- baseUrl: "https://opencode.ai/zen",
6336
- reasoning: false,
6337
- input: ["text", "image"],
6338
- cost: {
6339
- input: 0.8,
6340
- output: 4,
6341
- cacheRead: 0.08,
6342
- cacheWrite: 1,
6343
- },
6344
- contextWindow: 200000,
6345
- maxTokens: 8192,
6346
- },
6347
6316
  "claude-haiku-4-5": {
6348
6317
  id: "claude-haiku-4-5",
6349
6318
  name: "Claude Haiku 4.5",
@@ -6786,6 +6755,57 @@ export const MODELS = {
6786
6755
  contextWindow: 1050000,
6787
6756
  maxTokens: 128000,
6788
6757
  },
6758
+ "gpt-5.5": {
6759
+ id: "gpt-5.5",
6760
+ name: "GPT-5.5",
6761
+ api: "openai-responses",
6762
+ provider: "opencode",
6763
+ baseUrl: "https://opencode.ai/zen/v1",
6764
+ reasoning: true,
6765
+ input: ["text", "image"],
6766
+ cost: {
6767
+ input: 5,
6768
+ output: 30,
6769
+ cacheRead: 0.5,
6770
+ cacheWrite: 0,
6771
+ },
6772
+ contextWindow: 1050000,
6773
+ maxTokens: 128000,
6774
+ },
6775
+ "gpt-5.5-pro": {
6776
+ id: "gpt-5.5-pro",
6777
+ name: "GPT-5.5 Pro",
6778
+ api: "openai-responses",
6779
+ provider: "opencode",
6780
+ baseUrl: "https://opencode.ai/zen/v1",
6781
+ reasoning: true,
6782
+ input: ["text", "image"],
6783
+ cost: {
6784
+ input: 30,
6785
+ output: 180,
6786
+ cacheRead: 30,
6787
+ cacheWrite: 0,
6788
+ },
6789
+ contextWindow: 1050000,
6790
+ maxTokens: 128000,
6791
+ },
6792
+ "hy3-preview-free": {
6793
+ id: "hy3-preview-free",
6794
+ name: "Hy3 preview Free",
6795
+ api: "openai-completions",
6796
+ provider: "opencode",
6797
+ baseUrl: "https://opencode.ai/zen/v1",
6798
+ reasoning: true,
6799
+ input: ["text"],
6800
+ cost: {
6801
+ input: 0,
6802
+ output: 0,
6803
+ cacheRead: 0,
6804
+ cacheWrite: 0,
6805
+ },
6806
+ contextWindow: 256000,
6807
+ maxTokens: 64000,
6808
+ },
6789
6809
  "kimi-k2.5": {
6790
6810
  id: "kimi-k2.5",
6791
6811
  name: "Kimi K2.5",
@@ -6803,6 +6823,40 @@ export const MODELS = {
6803
6823
  contextWindow: 262144,
6804
6824
  maxTokens: 65536,
6805
6825
  },
6826
+ "kimi-k2.6": {
6827
+ id: "kimi-k2.6",
6828
+ name: "Kimi K2.6",
6829
+ api: "openai-completions",
6830
+ provider: "opencode",
6831
+ baseUrl: "https://opencode.ai/zen/v1",
6832
+ reasoning: true,
6833
+ input: ["text", "image"],
6834
+ cost: {
6835
+ input: 0.95,
6836
+ output: 4,
6837
+ cacheRead: 0.16,
6838
+ cacheWrite: 0,
6839
+ },
6840
+ contextWindow: 262144,
6841
+ maxTokens: 65536,
6842
+ },
6843
+ "ling-2.6-flash-free": {
6844
+ id: "ling-2.6-flash-free",
6845
+ name: "Ling 2.6 Flash Free",
6846
+ api: "openai-completions",
6847
+ provider: "opencode",
6848
+ baseUrl: "https://opencode.ai/zen/v1",
6849
+ reasoning: false,
6850
+ input: ["text"],
6851
+ cost: {
6852
+ input: 0,
6853
+ output: 0,
6854
+ cacheRead: 0,
6855
+ cacheWrite: 0,
6856
+ },
6857
+ contextWindow: 262100,
6858
+ maxTokens: 32800,
6859
+ },
6806
6860
  "minimax-m2.5": {
6807
6861
  id: "minimax-m2.5",
6808
6862
  name: "MiniMax M2.5",
@@ -6837,6 +6891,23 @@ export const MODELS = {
6837
6891
  contextWindow: 204800,
6838
6892
  maxTokens: 131072,
6839
6893
  },
6894
+ "minimax-m2.7": {
6895
+ id: "minimax-m2.7",
6896
+ name: "MiniMax M2.7",
6897
+ api: "openai-completions",
6898
+ provider: "opencode",
6899
+ baseUrl: "https://opencode.ai/zen/v1",
6900
+ reasoning: true,
6901
+ input: ["text"],
6902
+ cost: {
6903
+ input: 0.3,
6904
+ output: 1.2,
6905
+ cacheRead: 0.06,
6906
+ cacheWrite: 0,
6907
+ },
6908
+ contextWindow: 204800,
6909
+ maxTokens: 131072,
6910
+ },
6840
6911
  "nemotron-3-super-free": {
6841
6912
  id: "nemotron-3-super-free",
6842
6913
  name: "Nemotron 3 Super Free",
@@ -6857,9 +6928,9 @@ export const MODELS = {
6857
6928
  "qwen3.5-plus": {
6858
6929
  id: "qwen3.5-plus",
6859
6930
  name: "Qwen3.5 Plus",
6860
- api: "openai-completions",
6931
+ api: "anthropic-messages",
6861
6932
  provider: "opencode",
6862
- baseUrl: "https://opencode.ai/zen/v1",
6933
+ baseUrl: "https://opencode.ai/zen",
6863
6934
  reasoning: true,
6864
6935
  input: ["text", "image"],
6865
6936
  cost: {
@@ -6874,9 +6945,9 @@ export const MODELS = {
6874
6945
  "qwen3.6-plus": {
6875
6946
  id: "qwen3.6-plus",
6876
6947
  name: "Qwen3.6 Plus",
6877
- api: "openai-completions",
6948
+ api: "anthropic-messages",
6878
6949
  provider: "opencode",
6879
- baseUrl: "https://opencode.ai/zen/v1",
6950
+ baseUrl: "https://opencode.ai/zen",
6880
6951
  reasoning: true,
6881
6952
  input: ["text", "image"],
6882
6953
  cost: {
@@ -6890,6 +6961,40 @@ export const MODELS = {
6890
6961
  },
6891
6962
  },
6892
6963
  "opencode-go": {
6964
+ "deepseek-v4-flash": {
6965
+ id: "deepseek-v4-flash",
6966
+ name: "DeepSeek V4 Flash",
6967
+ api: "openai-completions",
6968
+ provider: "opencode-go",
6969
+ baseUrl: "https://opencode.ai/zen/go/v1",
6970
+ reasoning: true,
6971
+ input: ["text"],
6972
+ cost: {
6973
+ input: 0.14,
6974
+ output: 0.28,
6975
+ cacheRead: 0.0028,
6976
+ cacheWrite: 0,
6977
+ },
6978
+ contextWindow: 1000000,
6979
+ maxTokens: 384000,
6980
+ },
6981
+ "deepseek-v4-pro": {
6982
+ id: "deepseek-v4-pro",
6983
+ name: "DeepSeek V4 Pro",
6984
+ api: "openai-completions",
6985
+ provider: "opencode-go",
6986
+ baseUrl: "https://opencode.ai/zen/go/v1",
6987
+ reasoning: true,
6988
+ input: ["text"],
6989
+ cost: {
6990
+ input: 1.74,
6991
+ output: 3.48,
6992
+ cacheRead: 0.0145,
6993
+ cacheWrite: 0,
6994
+ },
6995
+ contextWindow: 1000000,
6996
+ maxTokens: 384000,
6997
+ },
6893
6998
  "glm-5": {
6894
6999
  id: "glm-5",
6895
7000
  name: "GLM-5",
@@ -6941,6 +7046,23 @@ export const MODELS = {
6941
7046
  contextWindow: 262144,
6942
7047
  maxTokens: 65536,
6943
7048
  },
7049
+ "kimi-k2.6": {
7050
+ id: "kimi-k2.6",
7051
+ name: "Kimi K2.6 (3x limits)",
7052
+ api: "openai-completions",
7053
+ provider: "opencode-go",
7054
+ baseUrl: "https://opencode.ai/zen/go/v1",
7055
+ reasoning: true,
7056
+ input: ["text", "image"],
7057
+ cost: {
7058
+ input: 0.32,
7059
+ output: 1.34,
7060
+ cacheRead: 0.054,
7061
+ cacheWrite: 0,
7062
+ },
7063
+ contextWindow: 262144,
7064
+ maxTokens: 65536,
7065
+ },
6944
7066
  "mimo-v2-omni": {
6945
7067
  id: "mimo-v2-omni",
6946
7068
  name: "MiMo V2 Omni",
@@ -6956,7 +7078,7 @@ export const MODELS = {
6956
7078
  cacheWrite: 0,
6957
7079
  },
6958
7080
  contextWindow: 262144,
6959
- maxTokens: 64000,
7081
+ maxTokens: 128000,
6960
7082
  },
6961
7083
  "mimo-v2-pro": {
6962
7084
  id: "mimo-v2-pro",
@@ -6973,7 +7095,41 @@ export const MODELS = {
6973
7095
  cacheWrite: 0,
6974
7096
  },
6975
7097
  contextWindow: 1048576,
6976
- maxTokens: 64000,
7098
+ maxTokens: 128000,
7099
+ },
7100
+ "mimo-v2.5": {
7101
+ id: "mimo-v2.5",
7102
+ name: "MiMo V2.5",
7103
+ api: "openai-completions",
7104
+ provider: "opencode-go",
7105
+ baseUrl: "https://opencode.ai/zen/go/v1",
7106
+ reasoning: true,
7107
+ input: ["text", "image"],
7108
+ cost: {
7109
+ input: 0.4,
7110
+ output: 2,
7111
+ cacheRead: 0.08,
7112
+ cacheWrite: 0,
7113
+ },
7114
+ contextWindow: 1000000,
7115
+ maxTokens: 128000,
7116
+ },
7117
+ "mimo-v2.5-pro": {
7118
+ id: "mimo-v2.5-pro",
7119
+ name: "MiMo V2.5 Pro",
7120
+ api: "openai-completions",
7121
+ provider: "opencode-go",
7122
+ baseUrl: "https://opencode.ai/zen/go/v1",
7123
+ reasoning: true,
7124
+ input: ["text"],
7125
+ cost: {
7126
+ input: 1,
7127
+ output: 3,
7128
+ cacheRead: 0.2,
7129
+ cacheWrite: 0,
7130
+ },
7131
+ contextWindow: 1048576,
7132
+ maxTokens: 128000,
6977
7133
  },
6978
7134
  "minimax-m2.5": {
6979
7135
  id: "minimax-m2.5",
@@ -7012,9 +7168,9 @@ export const MODELS = {
7012
7168
  "qwen3.5-plus": {
7013
7169
  id: "qwen3.5-plus",
7014
7170
  name: "Qwen3.5 Plus",
7015
- api: "openai-completions",
7171
+ api: "anthropic-messages",
7016
7172
  provider: "opencode-go",
7017
- baseUrl: "https://opencode.ai/zen/go/v1",
7173
+ baseUrl: "https://opencode.ai/zen/go",
7018
7174
  reasoning: true,
7019
7175
  input: ["text", "image"],
7020
7176
  cost: {
@@ -7029,9 +7185,9 @@ export const MODELS = {
7029
7185
  "qwen3.6-plus": {
7030
7186
  id: "qwen3.6-plus",
7031
7187
  name: "Qwen3.6 Plus",
7032
- api: "openai-completions",
7188
+ api: "anthropic-messages",
7033
7189
  provider: "opencode-go",
7034
- baseUrl: "https://opencode.ai/zen/go/v1",
7190
+ baseUrl: "https://opencode.ai/zen/go",
7035
7191
  reasoning: true,
7036
7192
  input: ["text", "image"],
7037
7193
  cost: {
@@ -7094,7 +7250,7 @@ export const MODELS = {
7094
7250
  cacheWrite: 0,
7095
7251
  },
7096
7252
  contextWindow: 65536,
7097
- maxTokens: 4096,
7253
+ maxTokens: 16384,
7098
7254
  },
7099
7255
  "amazon/nova-2-lite-v1": {
7100
7256
  id: "amazon/nova-2-lite-v1",
@@ -7419,17 +7575,17 @@ export const MODELS = {
7419
7575
  contextWindow: 1000000,
7420
7576
  maxTokens: 128000,
7421
7577
  },
7422
- "arcee-ai/trinity-large-preview:free": {
7423
- id: "arcee-ai/trinity-large-preview:free",
7424
- name: "Arcee AI: Trinity Large Preview (free)",
7578
+ "arcee-ai/trinity-large-preview": {
7579
+ id: "arcee-ai/trinity-large-preview",
7580
+ name: "Arcee AI: Trinity Large Preview",
7425
7581
  api: "openai-completions",
7426
7582
  provider: "openrouter",
7427
7583
  baseUrl: "https://openrouter.ai/api/v1",
7428
7584
  reasoning: false,
7429
7585
  input: ["text"],
7430
7586
  cost: {
7431
- input: 0,
7432
- output: 0,
7587
+ input: 0.15,
7588
+ output: 0.44999999999999996,
7433
7589
  cacheRead: 0,
7434
7590
  cacheWrite: 0,
7435
7591
  },
@@ -7655,7 +7811,7 @@ export const MODELS = {
7655
7811
  cacheWrite: 0,
7656
7812
  },
7657
7813
  contextWindow: 163840,
7658
- maxTokens: 163840,
7814
+ maxTokens: 16384,
7659
7815
  },
7660
7816
  "deepseek/deepseek-chat-v3-0324": {
7661
7817
  id: "deepseek/deepseek-chat-v3-0324",
@@ -7672,7 +7828,7 @@ export const MODELS = {
7672
7828
  cacheWrite: 0,
7673
7829
  },
7674
7830
  contextWindow: 163840,
7675
- maxTokens: 4096,
7831
+ maxTokens: 16384,
7676
7832
  },
7677
7833
  "deepseek/deepseek-chat-v3.1": {
7678
7834
  id: "deepseek/deepseek-chat-v3.1",
@@ -7723,7 +7879,7 @@ export const MODELS = {
7723
7879
  cacheWrite: 0,
7724
7880
  },
7725
7881
  contextWindow: 163840,
7726
- maxTokens: 4096,
7882
+ maxTokens: 32768,
7727
7883
  },
7728
7884
  "deepseek/deepseek-v3.1-terminus": {
7729
7885
  id: "deepseek/deepseek-v3.1-terminus",
@@ -7736,11 +7892,11 @@ export const MODELS = {
7736
7892
  cost: {
7737
7893
  input: 0.21,
7738
7894
  output: 0.7899999999999999,
7739
- cacheRead: 0.1300000002,
7895
+ cacheRead: 0.13,
7740
7896
  cacheWrite: 0,
7741
7897
  },
7742
7898
  contextWindow: 163840,
7743
- maxTokens: 4096,
7899
+ maxTokens: 32768,
7744
7900
  },
7745
7901
  "deepseek/deepseek-v3.2": {
7746
7902
  id: "deepseek/deepseek-v3.2",
@@ -7751,13 +7907,13 @@ export const MODELS = {
7751
7907
  reasoning: true,
7752
7908
  input: ["text"],
7753
7909
  cost: {
7754
- input: 0.25899999999999995,
7755
- output: 0.42,
7756
- cacheRead: 0.135,
7910
+ input: 0.252,
7911
+ output: 0.378,
7912
+ cacheRead: 0.0252,
7757
7913
  cacheWrite: 0,
7758
7914
  },
7759
- contextWindow: 163840,
7760
- maxTokens: 163840,
7915
+ contextWindow: 131072,
7916
+ maxTokens: 65536,
7761
7917
  },
7762
7918
  "deepseek/deepseek-v3.2-exp": {
7763
7919
  id: "deepseek/deepseek-v3.2-exp",
@@ -7776,6 +7932,40 @@ export const MODELS = {
7776
7932
  contextWindow: 163840,
7777
7933
  maxTokens: 65536,
7778
7934
  },
7935
+ "deepseek/deepseek-v4-flash": {
7936
+ id: "deepseek/deepseek-v4-flash",
7937
+ name: "DeepSeek: DeepSeek V4 Flash",
7938
+ api: "openai-completions",
7939
+ provider: "openrouter",
7940
+ baseUrl: "https://openrouter.ai/api/v1",
7941
+ reasoning: true,
7942
+ input: ["text"],
7943
+ cost: {
7944
+ input: 0.14,
7945
+ output: 0.28,
7946
+ cacheRead: 0.0028,
7947
+ cacheWrite: 0,
7948
+ },
7949
+ contextWindow: 1048576,
7950
+ maxTokens: 384000,
7951
+ },
7952
+ "deepseek/deepseek-v4-pro": {
7953
+ id: "deepseek/deepseek-v4-pro",
7954
+ name: "DeepSeek: DeepSeek V4 Pro",
7955
+ api: "openai-completions",
7956
+ provider: "openrouter",
7957
+ baseUrl: "https://openrouter.ai/api/v1",
7958
+ reasoning: true,
7959
+ input: ["text"],
7960
+ cost: {
7961
+ input: 0.435,
7962
+ output: 0.87,
7963
+ cacheRead: 0.003625,
7964
+ cacheWrite: 0,
7965
+ },
7966
+ contextWindow: 1048576,
7967
+ maxTokens: 384000,
7968
+ },
7779
7969
  "essentialai/rnj-1-instruct": {
7780
7970
  id: "essentialai/rnj-1-instruct",
7781
7971
  name: "EssentialAI: Rnj 1 Instruct",
@@ -7997,20 +8187,54 @@ export const MODELS = {
7997
8187
  contextWindow: 1048576,
7998
8188
  maxTokens: 65536,
7999
8189
  },
8000
- "google/gemma-4-26b-a4b-it": {
8001
- id: "google/gemma-4-26b-a4b-it",
8002
- name: "Google: Gemma 4 26B A4B ",
8190
+ "google/gemma-3-12b-it": {
8191
+ id: "google/gemma-3-12b-it",
8192
+ name: "Google: Gemma 3 12B",
8003
8193
  api: "openai-completions",
8004
8194
  provider: "openrouter",
8005
8195
  baseUrl: "https://openrouter.ai/api/v1",
8006
- reasoning: true,
8196
+ reasoning: false,
8007
8197
  input: ["text", "image"],
8008
8198
  cost: {
8009
- input: 0.08,
8010
- output: 0.35,
8011
- cacheRead: 0.01,
8012
- cacheWrite: 0,
8013
- },
8199
+ input: 0.04,
8200
+ output: 0.13,
8201
+ cacheRead: 0,
8202
+ cacheWrite: 0,
8203
+ },
8204
+ contextWindow: 131072,
8205
+ maxTokens: 16384,
8206
+ },
8207
+ "google/gemma-3-27b-it": {
8208
+ id: "google/gemma-3-27b-it",
8209
+ name: "Google: Gemma 3 27B",
8210
+ api: "openai-completions",
8211
+ provider: "openrouter",
8212
+ baseUrl: "https://openrouter.ai/api/v1",
8213
+ reasoning: false,
8214
+ input: ["text", "image"],
8215
+ cost: {
8216
+ input: 0.08,
8217
+ output: 0.16,
8218
+ cacheRead: 0,
8219
+ cacheWrite: 0,
8220
+ },
8221
+ contextWindow: 131072,
8222
+ maxTokens: 16384,
8223
+ },
8224
+ "google/gemma-4-26b-a4b-it": {
8225
+ id: "google/gemma-4-26b-a4b-it",
8226
+ name: "Google: Gemma 4 26B A4B ",
8227
+ api: "openai-completions",
8228
+ provider: "openrouter",
8229
+ baseUrl: "https://openrouter.ai/api/v1",
8230
+ reasoning: true,
8231
+ input: ["text", "image"],
8232
+ cost: {
8233
+ input: 0.06,
8234
+ output: 0.33,
8235
+ cacheRead: 0,
8236
+ cacheWrite: 0,
8237
+ },
8014
8238
  contextWindow: 262144,
8015
8239
  maxTokens: 4096,
8016
8240
  },
@@ -8042,11 +8266,11 @@ export const MODELS = {
8042
8266
  cost: {
8043
8267
  input: 0.13,
8044
8268
  output: 0.38,
8045
- cacheRead: 0.019999999499999997,
8269
+ cacheRead: 0,
8046
8270
  cacheWrite: 0,
8047
8271
  },
8048
8272
  contextWindow: 262144,
8049
- maxTokens: 4096,
8273
+ maxTokens: 16384,
8050
8274
  },
8051
8275
  "google/gemma-4-31b-it:free": {
8052
8276
  id: "google/gemma-4-31b-it:free",
@@ -8082,6 +8306,40 @@ export const MODELS = {
8082
8306
  contextWindow: 128000,
8083
8307
  maxTokens: 50000,
8084
8308
  },
8309
+ "inclusionai/ling-2.6-1t:free": {
8310
+ id: "inclusionai/ling-2.6-1t:free",
8311
+ name: "inclusionAI: Ling-2.6-1T (free)",
8312
+ api: "openai-completions",
8313
+ provider: "openrouter",
8314
+ baseUrl: "https://openrouter.ai/api/v1",
8315
+ reasoning: false,
8316
+ input: ["text"],
8317
+ cost: {
8318
+ input: 0,
8319
+ output: 0,
8320
+ cacheRead: 0,
8321
+ cacheWrite: 0,
8322
+ },
8323
+ contextWindow: 262144,
8324
+ maxTokens: 32768,
8325
+ },
8326
+ "inclusionai/ling-2.6-flash:free": {
8327
+ id: "inclusionai/ling-2.6-flash:free",
8328
+ name: "inclusionAI: Ling-2.6-flash (free)",
8329
+ api: "openai-completions",
8330
+ provider: "openrouter",
8331
+ baseUrl: "https://openrouter.ai/api/v1",
8332
+ reasoning: false,
8333
+ input: ["text"],
8334
+ cost: {
8335
+ input: 0,
8336
+ output: 0,
8337
+ cacheRead: 0,
8338
+ cacheWrite: 0,
8339
+ },
8340
+ contextWindow: 262144,
8341
+ maxTokens: 32768,
8342
+ },
8085
8343
  "kwaipilot/kat-coder-pro-v2": {
8086
8344
  id: "kwaipilot/kat-coder-pro-v2",
8087
8345
  name: "Kwaipilot: KAT-Coder-Pro V2",
@@ -8131,7 +8389,7 @@ export const MODELS = {
8131
8389
  cacheWrite: 0,
8132
8390
  },
8133
8391
  contextWindow: 131072,
8134
- maxTokens: 4096,
8392
+ maxTokens: 16384,
8135
8393
  },
8136
8394
  "meta-llama/llama-3.1-8b-instruct": {
8137
8395
  id: "meta-llama/llama-3.1-8b-instruct",
@@ -8159,13 +8417,13 @@ export const MODELS = {
8159
8417
  reasoning: false,
8160
8418
  input: ["text"],
8161
8419
  cost: {
8162
- input: 0.12,
8163
- output: 0.38,
8420
+ input: 0.09999999999999999,
8421
+ output: 0.32,
8164
8422
  cacheRead: 0,
8165
8423
  cacheWrite: 0,
8166
8424
  },
8167
8425
  contextWindow: 131072,
8168
- maxTokens: 131072,
8426
+ maxTokens: 16384,
8169
8427
  },
8170
8428
  "meta-llama/llama-3.3-70b-instruct:free": {
8171
8429
  id: "meta-llama/llama-3.3-70b-instruct:free",
@@ -8261,13 +8519,13 @@ export const MODELS = {
8261
8519
  reasoning: true,
8262
8520
  input: ["text"],
8263
8521
  cost: {
8264
- input: 0.118,
8265
- output: 0.9900000000000001,
8266
- cacheRead: 0.059,
8522
+ input: 0.15,
8523
+ output: 1.15,
8524
+ cacheRead: 0.03,
8267
8525
  cacheWrite: 0,
8268
8526
  },
8269
8527
  contextWindow: 196608,
8270
- maxTokens: 65536,
8528
+ maxTokens: 131072,
8271
8529
  },
8272
8530
  "minimax/minimax-m2.5:free": {
8273
8531
  id: "minimax/minimax-m2.5:free",
@@ -8590,7 +8848,7 @@ export const MODELS = {
8590
8848
  cacheWrite: 0,
8591
8849
  },
8592
8850
  contextWindow: 128000,
8593
- maxTokens: 4096,
8851
+ maxTokens: 16384,
8594
8852
  },
8595
8853
  "mistralai/mistral-small-creative": {
8596
8854
  id: "mistralai/mistral-small-creative",
@@ -8745,6 +9003,23 @@ export const MODELS = {
8745
9003
  contextWindow: 262144,
8746
9004
  maxTokens: 4096,
8747
9005
  },
9006
+ "moonshotai/kimi-k2.6": {
9007
+ id: "moonshotai/kimi-k2.6",
9008
+ name: "MoonshotAI: Kimi K2.6",
9009
+ api: "openai-completions",
9010
+ provider: "openrouter",
9011
+ baseUrl: "https://openrouter.ai/api/v1",
9012
+ reasoning: true,
9013
+ input: ["text", "image"],
9014
+ cost: {
9015
+ input: 0.7448,
9016
+ output: 4.655,
9017
+ cacheRead: 0.1463,
9018
+ cacheWrite: 0,
9019
+ },
9020
+ contextWindow: 256000,
9021
+ maxTokens: 65536,
9022
+ },
8748
9023
  "nex-agi/deepseek-v3.1-nex-n1": {
8749
9024
  id: "nex-agi/deepseek-v3.1-nex-n1",
8750
9025
  name: "Nex AGI: DeepSeek V3.1 Nex N1",
@@ -8794,7 +9069,7 @@ export const MODELS = {
8794
9069
  cacheWrite: 0,
8795
9070
  },
8796
9071
  contextWindow: 131072,
8797
- maxTokens: 4096,
9072
+ maxTokens: 16384,
8798
9073
  },
8799
9074
  "nvidia/nemotron-3-nano-30b-a3b": {
8800
9075
  id: "nvidia/nemotron-3-nano-30b-a3b",
@@ -8811,7 +9086,7 @@ export const MODELS = {
8811
9086
  cacheWrite: 0,
8812
9087
  },
8813
9088
  contextWindow: 262144,
8814
- maxTokens: 4096,
9089
+ maxTokens: 228000,
8815
9090
  },
8816
9091
  "nvidia/nemotron-3-nano-30b-a3b:free": {
8817
9092
  id: "nvidia/nemotron-3-nano-30b-a3b:free",
@@ -8896,7 +9171,7 @@ export const MODELS = {
8896
9171
  cacheWrite: 0,
8897
9172
  },
8898
9173
  contextWindow: 131072,
8899
- maxTokens: 4096,
9174
+ maxTokens: 16384,
8900
9175
  },
8901
9176
  "nvidia/nemotron-nano-9b-v2:free": {
8902
9177
  id: "nvidia/nemotron-nano-9b-v2:free",
@@ -9255,40 +9530,6 @@ export const MODELS = {
9255
9530
  contextWindow: 400000,
9256
9531
  maxTokens: 128000,
9257
9532
  },
9258
- "openai/gpt-5-image": {
9259
- id: "openai/gpt-5-image",
9260
- name: "OpenAI: GPT-5 Image",
9261
- api: "openai-completions",
9262
- provider: "openrouter",
9263
- baseUrl: "https://openrouter.ai/api/v1",
9264
- reasoning: true,
9265
- input: ["text", "image"],
9266
- cost: {
9267
- input: 10,
9268
- output: 10,
9269
- cacheRead: 1.25,
9270
- cacheWrite: 0,
9271
- },
9272
- contextWindow: 400000,
9273
- maxTokens: 128000,
9274
- },
9275
- "openai/gpt-5-image-mini": {
9276
- id: "openai/gpt-5-image-mini",
9277
- name: "OpenAI: GPT-5 Image Mini",
9278
- api: "openai-completions",
9279
- provider: "openrouter",
9280
- baseUrl: "https://openrouter.ai/api/v1",
9281
- reasoning: true,
9282
- input: ["text", "image"],
9283
- cost: {
9284
- input: 2.5,
9285
- output: 2,
9286
- cacheRead: 0.25,
9287
- cacheWrite: 0,
9288
- },
9289
- contextWindow: 400000,
9290
- maxTokens: 128000,
9291
- },
9292
9533
  "openai/gpt-5-mini": {
9293
9534
  id: "openai/gpt-5-mini",
9294
9535
  name: "OpenAI: GPT-5 Mini",
@@ -9595,6 +9836,40 @@ export const MODELS = {
9595
9836
  contextWindow: 1050000,
9596
9837
  maxTokens: 128000,
9597
9838
  },
9839
+ "openai/gpt-5.5": {
9840
+ id: "openai/gpt-5.5",
9841
+ name: "OpenAI: GPT-5.5",
9842
+ api: "openai-completions",
9843
+ provider: "openrouter",
9844
+ baseUrl: "https://openrouter.ai/api/v1",
9845
+ reasoning: true,
9846
+ input: ["text", "image"],
9847
+ cost: {
9848
+ input: 5,
9849
+ output: 30,
9850
+ cacheRead: 0.5,
9851
+ cacheWrite: 0,
9852
+ },
9853
+ contextWindow: 1050000,
9854
+ maxTokens: 128000,
9855
+ },
9856
+ "openai/gpt-5.5-pro": {
9857
+ id: "openai/gpt-5.5-pro",
9858
+ name: "OpenAI: GPT-5.5 Pro",
9859
+ api: "openai-completions",
9860
+ provider: "openrouter",
9861
+ baseUrl: "https://openrouter.ai/api/v1",
9862
+ reasoning: true,
9863
+ input: ["text", "image"],
9864
+ cost: {
9865
+ input: 30,
9866
+ output: 180,
9867
+ cacheRead: 0,
9868
+ cacheWrite: 0,
9869
+ },
9870
+ contextWindow: 1050000,
9871
+ maxTokens: 128000,
9872
+ },
9598
9873
  "openai/gpt-audio": {
9599
9874
  id: "openai/gpt-audio",
9600
9875
  name: "OpenAI: GPT Audio",
@@ -9644,7 +9919,7 @@ export const MODELS = {
9644
9919
  cacheWrite: 0,
9645
9920
  },
9646
9921
  contextWindow: 131072,
9647
- maxTokens: 4096,
9922
+ maxTokens: 131072,
9648
9923
  },
9649
9924
  "openai/gpt-oss-120b:free": {
9650
9925
  id: "openai/gpt-oss-120b:free",
@@ -9678,7 +9953,7 @@ export const MODELS = {
9678
9953
  cacheWrite: 0,
9679
9954
  },
9680
9955
  contextWindow: 131072,
9681
- maxTokens: 4096,
9956
+ maxTokens: 131072,
9682
9957
  },
9683
9958
  "openai/gpt-oss-20b:free": {
9684
9959
  id: "openai/gpt-oss-20b:free",
@@ -9884,23 +10159,6 @@ export const MODELS = {
9884
10159
  contextWindow: 2000000,
9885
10160
  maxTokens: 4096,
9886
10161
  },
9887
- "openrouter/elephant-alpha": {
9888
- id: "openrouter/elephant-alpha",
9889
- name: "Elephant",
9890
- api: "openai-completions",
9891
- provider: "openrouter",
9892
- baseUrl: "https://openrouter.ai/api/v1",
9893
- reasoning: false,
9894
- input: ["text"],
9895
- cost: {
9896
- input: 0,
9897
- output: 0,
9898
- cacheRead: 0,
9899
- cacheWrite: 0,
9900
- },
9901
- contextWindow: 262144,
9902
- maxTokens: 32768,
9903
- },
9904
10162
  "openrouter/free": {
9905
10163
  id: "openrouter/free",
9906
10164
  name: "Free Models Router",
@@ -9944,8 +10202,8 @@ export const MODELS = {
9944
10202
  reasoning: false,
9945
10203
  input: ["text"],
9946
10204
  cost: {
9947
- input: 0.12,
9948
- output: 0.39,
10205
+ input: 0.36,
10206
+ output: 0.39999999999999997,
9949
10207
  cacheRead: 0,
9950
10208
  cacheWrite: 0,
9951
10209
  },
@@ -10120,7 +10378,7 @@ export const MODELS = {
10120
10378
  cacheWrite: 0,
10121
10379
  },
10122
10380
  contextWindow: 262144,
10123
- maxTokens: 4096,
10381
+ maxTokens: 16384,
10124
10382
  },
10125
10383
  "qwen/qwen3-235b-a22b-thinking-2507": {
10126
10384
  id: "qwen/qwen3-235b-a22b-thinking-2507",
@@ -10131,13 +10389,13 @@ export const MODELS = {
10131
10389
  reasoning: true,
10132
10390
  input: ["text"],
10133
10391
  cost: {
10134
- input: 0.13,
10135
- output: 0.6,
10392
+ input: 0.14950000000000002,
10393
+ output: 1.495,
10136
10394
  cacheRead: 0,
10137
10395
  cacheWrite: 0,
10138
10396
  },
10139
- contextWindow: 262144,
10140
- maxTokens: 262144,
10397
+ contextWindow: 131072,
10398
+ maxTokens: 4096,
10141
10399
  },
10142
10400
  "qwen/qwen3-30b-a3b": {
10143
10401
  id: "qwen/qwen3-30b-a3b",
@@ -10154,7 +10412,7 @@ export const MODELS = {
10154
10412
  cacheWrite: 0,
10155
10413
  },
10156
10414
  contextWindow: 40960,
10157
- maxTokens: 40960,
10415
+ maxTokens: 16384,
10158
10416
  },
10159
10417
  "qwen/qwen3-30b-a3b-instruct-2507": {
10160
10418
  id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -10234,12 +10492,12 @@ export const MODELS = {
10234
10492
  input: ["text"],
10235
10493
  cost: {
10236
10494
  input: 0.22,
10237
- output: 1,
10238
- cacheRead: 0.022,
10495
+ output: 1.7999999999999998,
10496
+ cacheRead: 0,
10239
10497
  cacheWrite: 0,
10240
10498
  },
10241
10499
  contextWindow: 262144,
10242
- maxTokens: 4096,
10500
+ maxTokens: 65536,
10243
10501
  },
10244
10502
  "qwen/qwen3-coder-30b-a3b-instruct": {
10245
10503
  id: "qwen/qwen3-coder-30b-a3b-instruct",
@@ -10284,9 +10542,9 @@ export const MODELS = {
10284
10542
  reasoning: false,
10285
10543
  input: ["text"],
10286
10544
  cost: {
10287
- input: 0.15,
10545
+ input: 0.14,
10288
10546
  output: 0.7999999999999999,
10289
- cacheRead: 0.12,
10547
+ cacheRead: 0.09,
10290
10548
  cacheWrite: 0,
10291
10549
  },
10292
10550
  contextWindow: 262144,
@@ -10375,7 +10633,7 @@ export const MODELS = {
10375
10633
  cacheWrite: 0,
10376
10634
  },
10377
10635
  contextWindow: 262144,
10378
- maxTokens: 4096,
10636
+ maxTokens: 16384,
10379
10637
  },
10380
10638
  "qwen/qwen3-next-80b-a3b-instruct:free": {
10381
10639
  id: "qwen/qwen3-next-80b-a3b-instruct:free",
@@ -10426,7 +10684,7 @@ export const MODELS = {
10426
10684
  cacheWrite: 0,
10427
10685
  },
10428
10686
  contextWindow: 262144,
10429
- maxTokens: 4096,
10687
+ maxTokens: 16384,
10430
10688
  },
10431
10689
  "qwen/qwen3-vl-235b-a22b-thinking": {
10432
10690
  id: "qwen/qwen3-vl-235b-a22b-thinking",
@@ -10649,6 +10907,74 @@ export const MODELS = {
10649
10907
  contextWindow: 1000000,
10650
10908
  maxTokens: 65536,
10651
10909
  },
10910
+ "qwen/qwen3.5-plus-20260420": {
10911
+ id: "qwen/qwen3.5-plus-20260420",
10912
+ name: "Qwen: Qwen3.5 Plus 2026-04-20",
10913
+ api: "openai-completions",
10914
+ provider: "openrouter",
10915
+ baseUrl: "https://openrouter.ai/api/v1",
10916
+ reasoning: true,
10917
+ input: ["text", "image"],
10918
+ cost: {
10919
+ input: 0.39999999999999997,
10920
+ output: 2.4,
10921
+ cacheRead: 0,
10922
+ cacheWrite: 0,
10923
+ },
10924
+ contextWindow: 1000000,
10925
+ maxTokens: 65536,
10926
+ },
10927
+ "qwen/qwen3.6-27b": {
10928
+ id: "qwen/qwen3.6-27b",
10929
+ name: "Qwen: Qwen3.6 27B",
10930
+ api: "openai-completions",
10931
+ provider: "openrouter",
10932
+ baseUrl: "https://openrouter.ai/api/v1",
10933
+ reasoning: true,
10934
+ input: ["text", "image"],
10935
+ cost: {
10936
+ input: 0.5,
10937
+ output: 2,
10938
+ cacheRead: 0.25,
10939
+ cacheWrite: 0,
10940
+ },
10941
+ contextWindow: 262144,
10942
+ maxTokens: 65536,
10943
+ },
10944
+ "qwen/qwen3.6-flash": {
10945
+ id: "qwen/qwen3.6-flash",
10946
+ name: "Qwen: Qwen3.6 Flash",
10947
+ api: "openai-completions",
10948
+ provider: "openrouter",
10949
+ baseUrl: "https://openrouter.ai/api/v1",
10950
+ reasoning: true,
10951
+ input: ["text", "image"],
10952
+ cost: {
10953
+ input: 0.25,
10954
+ output: 1.5,
10955
+ cacheRead: 0,
10956
+ cacheWrite: 0.3125,
10957
+ },
10958
+ contextWindow: 1000000,
10959
+ maxTokens: 65536,
10960
+ },
10961
+ "qwen/qwen3.6-max-preview": {
10962
+ id: "qwen/qwen3.6-max-preview",
10963
+ name: "Qwen: Qwen3.6 Max Preview",
10964
+ api: "openai-completions",
10965
+ provider: "openrouter",
10966
+ baseUrl: "https://openrouter.ai/api/v1",
10967
+ reasoning: true,
10968
+ input: ["text"],
10969
+ cost: {
10970
+ input: 1.3,
10971
+ output: 7.8,
10972
+ cacheRead: 0,
10973
+ cacheWrite: 1.625,
10974
+ },
10975
+ contextWindow: 262144,
10976
+ maxTokens: 65536,
10977
+ },
10652
10978
  "qwen/qwen3.6-plus": {
10653
10979
  id: "qwen/qwen3.6-plus",
10654
10980
  name: "Qwen: Qwen3.6 Plus",
@@ -10768,6 +11094,23 @@ export const MODELS = {
10768
11094
  contextWindow: 262144,
10769
11095
  maxTokens: 65536,
10770
11096
  },
11097
+ "tencent/hy3-preview:free": {
11098
+ id: "tencent/hy3-preview:free",
11099
+ name: "Tencent: Hy3 preview (free)",
11100
+ api: "openai-completions",
11101
+ provider: "openrouter",
11102
+ baseUrl: "https://openrouter.ai/api/v1",
11103
+ reasoning: true,
11104
+ input: ["text"],
11105
+ cost: {
11106
+ input: 0,
11107
+ output: 0,
11108
+ cacheRead: 0,
11109
+ cacheWrite: 0,
11110
+ },
11111
+ contextWindow: 262144,
11112
+ maxTokens: 262144,
11113
+ },
10771
11114
  "thedrummer/rocinante-12b": {
10772
11115
  id: "thedrummer/rocinante-12b",
10773
11116
  name: "TheDrummer: Rocinante 12B",
@@ -11040,6 +11383,40 @@ export const MODELS = {
11040
11383
  contextWindow: 1048576,
11041
11384
  maxTokens: 131072,
11042
11385
  },
11386
+ "xiaomi/mimo-v2.5": {
11387
+ id: "xiaomi/mimo-v2.5",
11388
+ name: "Xiaomi: MiMo-V2.5",
11389
+ api: "openai-completions",
11390
+ provider: "openrouter",
11391
+ baseUrl: "https://openrouter.ai/api/v1",
11392
+ reasoning: true,
11393
+ input: ["text", "image"],
11394
+ cost: {
11395
+ input: 0.39999999999999997,
11396
+ output: 2,
11397
+ cacheRead: 0.08,
11398
+ cacheWrite: 0,
11399
+ },
11400
+ contextWindow: 1048576,
11401
+ maxTokens: 131072,
11402
+ },
11403
+ "xiaomi/mimo-v2.5-pro": {
11404
+ id: "xiaomi/mimo-v2.5-pro",
11405
+ name: "Xiaomi: MiMo-V2.5-Pro",
11406
+ api: "openai-completions",
11407
+ provider: "openrouter",
11408
+ baseUrl: "https://openrouter.ai/api/v1",
11409
+ reasoning: true,
11410
+ input: ["text"],
11411
+ cost: {
11412
+ input: 1,
11413
+ output: 3,
11414
+ cacheRead: 0.19999999999999998,
11415
+ cacheWrite: 0,
11416
+ },
11417
+ contextWindow: 1048576,
11418
+ maxTokens: 131072,
11419
+ },
11043
11420
  "z-ai/glm-4-32b": {
11044
11421
  id: "z-ai/glm-4-32b",
11045
11422
  name: "Z.ai: GLM 4 32B ",
@@ -11153,11 +11530,11 @@ export const MODELS = {
11153
11530
  cost: {
11154
11531
  input: 0.3,
11155
11532
  output: 0.8999999999999999,
11156
- cacheRead: 0,
11533
+ cacheRead: 0.049999999999999996,
11157
11534
  cacheWrite: 0,
11158
11535
  },
11159
11536
  contextWindow: 131072,
11160
- maxTokens: 131072,
11537
+ maxTokens: 24000,
11161
11538
  },
11162
11539
  "z-ai/glm-4.7": {
11163
11540
  id: "z-ai/glm-4.7",
@@ -11168,13 +11545,13 @@ export const MODELS = {
11168
11545
  reasoning: true,
11169
11546
  input: ["text"],
11170
11547
  cost: {
11171
- input: 0.39,
11172
- output: 1.75,
11173
- cacheRead: 0.195,
11548
+ input: 0.38,
11549
+ output: 1.74,
11550
+ cacheRead: 0,
11174
11551
  cacheWrite: 0,
11175
11552
  },
11176
11553
  contextWindow: 202752,
11177
- maxTokens: 65535,
11554
+ maxTokens: 4096,
11178
11555
  },
11179
11556
  "z-ai/glm-4.7-flash": {
11180
11557
  id: "z-ai/glm-4.7-flash",
@@ -11187,11 +11564,11 @@ export const MODELS = {
11187
11564
  cost: {
11188
11565
  input: 0.06,
11189
11566
  output: 0.39999999999999997,
11190
- cacheRead: 0.0100000002,
11567
+ cacheRead: 0.01,
11191
11568
  cacheWrite: 0,
11192
11569
  },
11193
11570
  contextWindow: 202752,
11194
- maxTokens: 4096,
11571
+ maxTokens: 16384,
11195
11572
  },
11196
11573
  "z-ai/glm-5": {
11197
11574
  id: "z-ai/glm-5",
@@ -11207,8 +11584,8 @@ export const MODELS = {
11207
11584
  cacheRead: 0.119,
11208
11585
  cacheWrite: 0,
11209
11586
  },
11210
- contextWindow: 80000,
11211
- maxTokens: 131072,
11587
+ contextWindow: 202752,
11588
+ maxTokens: 16384,
11212
11589
  },
11213
11590
  "z-ai/glm-5-turbo": {
11214
11591
  id: "z-ai/glm-5-turbo",
@@ -11236,30 +11613,166 @@ export const MODELS = {
11236
11613
  reasoning: true,
11237
11614
  input: ["text"],
11238
11615
  cost: {
11239
- input: 0.95,
11240
- output: 3.15,
11241
- cacheRead: 0.475,
11616
+ input: 1.0499999999999998,
11617
+ output: 3.5,
11618
+ cacheRead: 0.5249999999999999,
11242
11619
  cacheWrite: 0,
11243
11620
  },
11244
11621
  contextWindow: 202752,
11245
11622
  maxTokens: 65535,
11246
11623
  },
11247
- "z-ai/glm-5v-turbo": {
11248
- id: "z-ai/glm-5v-turbo",
11249
- name: "Z.ai: GLM 5V Turbo",
11624
+ "z-ai/glm-5v-turbo": {
11625
+ id: "z-ai/glm-5v-turbo",
11626
+ name: "Z.ai: GLM 5V Turbo",
11627
+ api: "openai-completions",
11628
+ provider: "openrouter",
11629
+ baseUrl: "https://openrouter.ai/api/v1",
11630
+ reasoning: true,
11631
+ input: ["text", "image"],
11632
+ cost: {
11633
+ input: 1.2,
11634
+ output: 4,
11635
+ cacheRead: 0.24,
11636
+ cacheWrite: 0,
11637
+ },
11638
+ contextWindow: 202752,
11639
+ maxTokens: 131072,
11640
+ },
11641
+ "~anthropic/claude-haiku-latest": {
11642
+ id: "~anthropic/claude-haiku-latest",
11643
+ name: "Anthropic Claude Haiku Latest",
11644
+ api: "openai-completions",
11645
+ provider: "openrouter",
11646
+ baseUrl: "https://openrouter.ai/api/v1",
11647
+ reasoning: true,
11648
+ input: ["text", "image"],
11649
+ cost: {
11650
+ input: 1,
11651
+ output: 5,
11652
+ cacheRead: 0.09999999999999999,
11653
+ cacheWrite: 1.25,
11654
+ },
11655
+ contextWindow: 200000,
11656
+ maxTokens: 64000,
11657
+ },
11658
+ "~anthropic/claude-opus-latest": {
11659
+ id: "~anthropic/claude-opus-latest",
11660
+ name: "Anthropic: Claude Opus Latest",
11661
+ api: "openai-completions",
11662
+ provider: "openrouter",
11663
+ baseUrl: "https://openrouter.ai/api/v1",
11664
+ reasoning: true,
11665
+ input: ["text", "image"],
11666
+ cost: {
11667
+ input: 5,
11668
+ output: 25,
11669
+ cacheRead: 0.5,
11670
+ cacheWrite: 6.25,
11671
+ },
11672
+ contextWindow: 1000000,
11673
+ maxTokens: 128000,
11674
+ },
11675
+ "~anthropic/claude-sonnet-latest": {
11676
+ id: "~anthropic/claude-sonnet-latest",
11677
+ name: "Anthropic Claude Sonnet Latest",
11678
+ api: "openai-completions",
11679
+ provider: "openrouter",
11680
+ baseUrl: "https://openrouter.ai/api/v1",
11681
+ reasoning: true,
11682
+ input: ["text", "image"],
11683
+ cost: {
11684
+ input: 3,
11685
+ output: 15,
11686
+ cacheRead: 0.3,
11687
+ cacheWrite: 3.75,
11688
+ },
11689
+ contextWindow: 1000000,
11690
+ maxTokens: 128000,
11691
+ },
11692
+ "~google/gemini-flash-latest": {
11693
+ id: "~google/gemini-flash-latest",
11694
+ name: "Google Gemini Flash Latest",
11695
+ api: "openai-completions",
11696
+ provider: "openrouter",
11697
+ baseUrl: "https://openrouter.ai/api/v1",
11698
+ reasoning: true,
11699
+ input: ["text", "image"],
11700
+ cost: {
11701
+ input: 0.5,
11702
+ output: 3,
11703
+ cacheRead: 0.049999999999999996,
11704
+ cacheWrite: 0.08333333333333334,
11705
+ },
11706
+ contextWindow: 1048576,
11707
+ maxTokens: 65536,
11708
+ },
11709
+ "~google/gemini-pro-latest": {
11710
+ id: "~google/gemini-pro-latest",
11711
+ name: "Google Gemini Pro Latest",
11712
+ api: "openai-completions",
11713
+ provider: "openrouter",
11714
+ baseUrl: "https://openrouter.ai/api/v1",
11715
+ reasoning: true,
11716
+ input: ["text", "image"],
11717
+ cost: {
11718
+ input: 2,
11719
+ output: 12,
11720
+ cacheRead: 0.19999999999999998,
11721
+ cacheWrite: 0.375,
11722
+ },
11723
+ contextWindow: 1048576,
11724
+ maxTokens: 65536,
11725
+ },
11726
+ "~moonshotai/kimi-latest": {
11727
+ id: "~moonshotai/kimi-latest",
11728
+ name: "MoonshotAI Kimi Latest",
11729
+ api: "openai-completions",
11730
+ provider: "openrouter",
11731
+ baseUrl: "https://openrouter.ai/api/v1",
11732
+ reasoning: true,
11733
+ input: ["text", "image"],
11734
+ cost: {
11735
+ input: 0.7448,
11736
+ output: 4.655,
11737
+ cacheRead: 0.1463,
11738
+ cacheWrite: 0,
11739
+ },
11740
+ contextWindow: 256000,
11741
+ maxTokens: 65536,
11742
+ },
11743
+ "~openai/gpt-latest": {
11744
+ id: "~openai/gpt-latest",
11745
+ name: "OpenAI GPT Latest",
11746
+ api: "openai-completions",
11747
+ provider: "openrouter",
11748
+ baseUrl: "https://openrouter.ai/api/v1",
11749
+ reasoning: true,
11750
+ input: ["text", "image"],
11751
+ cost: {
11752
+ input: 5,
11753
+ output: 30,
11754
+ cacheRead: 0.5,
11755
+ cacheWrite: 0,
11756
+ },
11757
+ contextWindow: 1050000,
11758
+ maxTokens: 128000,
11759
+ },
11760
+ "~openai/gpt-mini-latest": {
11761
+ id: "~openai/gpt-mini-latest",
11762
+ name: "OpenAI GPT Mini Latest",
11250
11763
  api: "openai-completions",
11251
11764
  provider: "openrouter",
11252
11765
  baseUrl: "https://openrouter.ai/api/v1",
11253
11766
  reasoning: true,
11254
11767
  input: ["text", "image"],
11255
11768
  cost: {
11256
- input: 1.2,
11257
- output: 4,
11258
- cacheRead: 0.24,
11769
+ input: 0.75,
11770
+ output: 4.5,
11771
+ cacheRead: 0.075,
11259
11772
  cacheWrite: 0,
11260
11773
  },
11261
- contextWindow: 202752,
11262
- maxTokens: 131072,
11774
+ contextWindow: 400000,
11775
+ maxTokens: 128000,
11263
11776
  },
11264
11777
  },
11265
11778
  "vercel-ai-gateway": {
@@ -11331,6 +11844,23 @@ export const MODELS = {
11331
11844
  contextWindow: 128000,
11332
11845
  maxTokens: 8192,
11333
11846
  },
11847
+ "alibaba/qwen-3.6-max-preview": {
11848
+ id: "alibaba/qwen-3.6-max-preview",
11849
+ name: "Qwen 3.6 Max Preview",
11850
+ api: "anthropic-messages",
11851
+ provider: "vercel-ai-gateway",
11852
+ baseUrl: "https://ai-gateway.vercel.sh",
11853
+ reasoning: true,
11854
+ input: ["text", "image"],
11855
+ cost: {
11856
+ input: 1.3,
11857
+ output: 7.8,
11858
+ cacheRead: 0.26,
11859
+ cacheWrite: 1.625,
11860
+ },
11861
+ contextWindow: 240000,
11862
+ maxTokens: 64000,
11863
+ },
11334
11864
  "alibaba/qwen3-235b-a22b-thinking": {
11335
11865
  id: "alibaba/qwen3-235b-a22b-thinking",
11336
11866
  name: "Qwen3 235B A22B Thinking 2507",
@@ -11530,7 +12060,7 @@ export const MODELS = {
11530
12060
  input: 0.5,
11531
12061
  output: 3,
11532
12062
  cacheRead: 0.09999999999999999,
11533
- cacheWrite: 0,
12063
+ cacheWrite: 0.625,
11534
12064
  },
11535
12065
  contextWindow: 1000000,
11536
12066
  maxTokens: 64000,
@@ -11909,6 +12439,40 @@ export const MODELS = {
11909
12439
  contextWindow: 128000,
11910
12440
  maxTokens: 64000,
11911
12441
  },
12442
+ "deepseek/deepseek-v4-flash": {
12443
+ id: "deepseek/deepseek-v4-flash",
12444
+ name: "DeepSeek V4 Flash",
12445
+ api: "anthropic-messages",
12446
+ provider: "vercel-ai-gateway",
12447
+ baseUrl: "https://ai-gateway.vercel.sh",
12448
+ reasoning: true,
12449
+ input: ["text"],
12450
+ cost: {
12451
+ input: 0.14,
12452
+ output: 0.28,
12453
+ cacheRead: 0.028,
12454
+ cacheWrite: 0,
12455
+ },
12456
+ contextWindow: 1000000,
12457
+ maxTokens: 384000,
12458
+ },
12459
+ "deepseek/deepseek-v4-pro": {
12460
+ id: "deepseek/deepseek-v4-pro",
12461
+ name: "DeepSeek V4 Pro",
12462
+ api: "anthropic-messages",
12463
+ provider: "vercel-ai-gateway",
12464
+ baseUrl: "https://ai-gateway.vercel.sh",
12465
+ reasoning: true,
12466
+ input: ["text"],
12467
+ cost: {
12468
+ input: 0.435,
12469
+ output: 0.87,
12470
+ cacheRead: 0.0036,
12471
+ cacheWrite: 0,
12472
+ },
12473
+ contextWindow: 1000000,
12474
+ maxTokens: 384000,
12475
+ },
11912
12476
  "google/gemini-2.0-flash": {
11913
12477
  id: "google/gemini-2.0-flash",
11914
12478
  name: "Gemini 2.0 Flash",
@@ -12674,6 +13238,23 @@ export const MODELS = {
12674
13238
  contextWindow: 262114,
12675
13239
  maxTokens: 262114,
12676
13240
  },
13241
+ "moonshotai/kimi-k2.6": {
13242
+ id: "moonshotai/kimi-k2.6",
13243
+ name: "Kimi K2.6",
13244
+ api: "anthropic-messages",
13245
+ provider: "vercel-ai-gateway",
13246
+ baseUrl: "https://ai-gateway.vercel.sh",
13247
+ reasoning: true,
13248
+ input: ["text", "image"],
13249
+ cost: {
13250
+ input: 0.95,
13251
+ output: 4,
13252
+ cacheRead: 0.16,
13253
+ cacheWrite: 0,
13254
+ },
13255
+ contextWindow: 262000,
13256
+ maxTokens: 262000,
13257
+ },
12677
13258
  "nvidia/nemotron-nano-12b-v2-vl": {
12678
13259
  id: "nvidia/nemotron-nano-12b-v2-vl",
12679
13260
  name: "Nvidia Nemotron Nano 12B V2 VL",
@@ -13167,6 +13748,40 @@ export const MODELS = {
13167
13748
  contextWindow: 1050000,
13168
13749
  maxTokens: 128000,
13169
13750
  },
13751
+ "openai/gpt-5.5": {
13752
+ id: "openai/gpt-5.5",
13753
+ name: "GPT 5.5",
13754
+ api: "anthropic-messages",
13755
+ provider: "vercel-ai-gateway",
13756
+ baseUrl: "https://ai-gateway.vercel.sh",
13757
+ reasoning: true,
13758
+ input: ["text", "image"],
13759
+ cost: {
13760
+ input: 5,
13761
+ output: 30,
13762
+ cacheRead: 0.5,
13763
+ cacheWrite: 0,
13764
+ },
13765
+ contextWindow: 1000000,
13766
+ maxTokens: 128000,
13767
+ },
13768
+ "openai/gpt-5.5-pro": {
13769
+ id: "openai/gpt-5.5-pro",
13770
+ name: "GPT 5.5 Pro",
13771
+ api: "anthropic-messages",
13772
+ provider: "vercel-ai-gateway",
13773
+ baseUrl: "https://ai-gateway.vercel.sh",
13774
+ reasoning: true,
13775
+ input: ["text", "image"],
13776
+ cost: {
13777
+ input: 30,
13778
+ output: 180,
13779
+ cacheRead: 0,
13780
+ cacheWrite: 0,
13781
+ },
13782
+ contextWindow: 1000000,
13783
+ maxTokens: 128000,
13784
+ },
13170
13785
  "openai/gpt-oss-20b": {
13171
13786
  id: "openai/gpt-oss-20b",
13172
13787
  name: "GPT OSS 120B",
@@ -13635,9 +14250,9 @@ export const MODELS = {
13635
14250
  reasoning: true,
13636
14251
  input: ["text"],
13637
14252
  cost: {
13638
- input: 0.09,
13639
- output: 0.29,
13640
- cacheRead: 0.045,
14253
+ input: 0.09999999999999999,
14254
+ output: 0.3,
14255
+ cacheRead: 0.01,
13641
14256
  cacheWrite: 0,
13642
14257
  },
13643
14258
  contextWindow: 262144,
@@ -13854,15 +14469,15 @@ export const MODELS = {
13854
14469
  provider: "vercel-ai-gateway",
13855
14470
  baseUrl: "https://ai-gateway.vercel.sh",
13856
14471
  reasoning: true,
13857
- input: ["text", "image"],
14472
+ input: ["text"],
13858
14473
  cost: {
13859
14474
  input: 1.4,
13860
14475
  output: 4.4,
13861
14476
  cacheRead: 0.26,
13862
14477
  cacheWrite: 0,
13863
14478
  },
13864
- contextWindow: 202752,
13865
- maxTokens: 202752,
14479
+ contextWindow: 202800,
14480
+ maxTokens: 64000,
13866
14481
  },
13867
14482
  "zai/glm-5v-turbo": {
13868
14483
  id: "zai/glm-5v-turbo",
@@ -14293,24 +14908,6 @@ export const MODELS = {
14293
14908
  },
14294
14909
  },
14295
14910
  "zai": {
14296
- "glm-4.5": {
14297
- id: "glm-4.5",
14298
- name: "GLM-4.5",
14299
- api: "openai-completions",
14300
- provider: "zai",
14301
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14302
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14303
- reasoning: true,
14304
- input: ["text"],
14305
- cost: {
14306
- input: 0.6,
14307
- output: 2.2,
14308
- cacheRead: 0.11,
14309
- cacheWrite: 0,
14310
- },
14311
- contextWindow: 131072,
14312
- maxTokens: 98304,
14313
- },
14314
14911
  "glm-4.5-air": {
14315
14912
  id: "glm-4.5-air",
14316
14913
  name: "GLM-4.5-Air",
@@ -14320,24 +14917,6 @@ export const MODELS = {
14320
14917
  compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14321
14918
  reasoning: true,
14322
14919
  input: ["text"],
14323
- cost: {
14324
- input: 0.2,
14325
- output: 1.1,
14326
- cacheRead: 0.03,
14327
- cacheWrite: 0,
14328
- },
14329
- contextWindow: 131072,
14330
- maxTokens: 98304,
14331
- },
14332
- "glm-4.5-flash": {
14333
- id: "glm-4.5-flash",
14334
- name: "GLM-4.5-Flash",
14335
- api: "openai-completions",
14336
- provider: "zai",
14337
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14338
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14339
- reasoning: true,
14340
- input: ["text"],
14341
14920
  cost: {
14342
14921
  input: 0,
14343
14922
  output: 0,
@@ -14347,85 +14926,13 @@ export const MODELS = {
14347
14926
  contextWindow: 131072,
14348
14927
  maxTokens: 98304,
14349
14928
  },
14350
- "glm-4.5v": {
14351
- id: "glm-4.5v",
14352
- name: "GLM-4.5V",
14353
- api: "openai-completions",
14354
- provider: "zai",
14355
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14356
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14357
- reasoning: true,
14358
- input: ["text", "image"],
14359
- cost: {
14360
- input: 0.6,
14361
- output: 1.8,
14362
- cacheRead: 0,
14363
- cacheWrite: 0,
14364
- },
14365
- contextWindow: 64000,
14366
- maxTokens: 16384,
14367
- },
14368
- "glm-4.6": {
14369
- id: "glm-4.6",
14370
- name: "GLM-4.6",
14371
- api: "openai-completions",
14372
- provider: "zai",
14373
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14374
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14375
- reasoning: true,
14376
- input: ["text"],
14377
- cost: {
14378
- input: 0.6,
14379
- output: 2.2,
14380
- cacheRead: 0.11,
14381
- cacheWrite: 0,
14382
- },
14383
- contextWindow: 204800,
14384
- maxTokens: 131072,
14385
- },
14386
- "glm-4.6v": {
14387
- id: "glm-4.6v",
14388
- name: "GLM-4.6V",
14389
- api: "openai-completions",
14390
- provider: "zai",
14391
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14392
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14393
- reasoning: true,
14394
- input: ["text", "image"],
14395
- cost: {
14396
- input: 0.3,
14397
- output: 0.9,
14398
- cacheRead: 0,
14399
- cacheWrite: 0,
14400
- },
14401
- contextWindow: 128000,
14402
- maxTokens: 32768,
14403
- },
14404
14929
  "glm-4.7": {
14405
14930
  id: "glm-4.7",
14406
14931
  name: "GLM-4.7",
14407
14932
  api: "openai-completions",
14408
14933
  provider: "zai",
14409
14934
  baseUrl: "https://api.z.ai/api/coding/paas/v4",
14410
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14411
- reasoning: true,
14412
- input: ["text"],
14413
- cost: {
14414
- input: 0.6,
14415
- output: 2.2,
14416
- cacheRead: 0.11,
14417
- cacheWrite: 0,
14418
- },
14419
- contextWindow: 204800,
14420
- maxTokens: 131072,
14421
- },
14422
- "glm-4.7-flash": {
14423
- id: "glm-4.7-flash",
14424
- name: "GLM-4.7-Flash",
14425
- api: "openai-completions",
14426
- provider: "zai",
14427
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14428
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14935
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
14429
14936
  reasoning: true,
14430
14937
  input: ["text"],
14431
14938
  cost: {
@@ -14434,42 +14941,6 @@ export const MODELS = {
14434
14941
  cacheRead: 0,
14435
14942
  cacheWrite: 0,
14436
14943
  },
14437
- contextWindow: 200000,
14438
- maxTokens: 131072,
14439
- },
14440
- "glm-4.7-flashx": {
14441
- id: "glm-4.7-flashx",
14442
- name: "GLM-4.7-FlashX",
14443
- api: "openai-completions",
14444
- provider: "zai",
14445
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14446
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14447
- reasoning: true,
14448
- input: ["text"],
14449
- cost: {
14450
- input: 0.07,
14451
- output: 0.4,
14452
- cacheRead: 0.01,
14453
- cacheWrite: 0,
14454
- },
14455
- contextWindow: 200000,
14456
- maxTokens: 131072,
14457
- },
14458
- "glm-5": {
14459
- id: "glm-5",
14460
- name: "GLM-5",
14461
- api: "openai-completions",
14462
- provider: "zai",
14463
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14464
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14465
- reasoning: true,
14466
- input: ["text"],
14467
- cost: {
14468
- input: 1,
14469
- output: 3.2,
14470
- cacheRead: 0.2,
14471
- cacheWrite: 0,
14472
- },
14473
14944
  contextWindow: 204800,
14474
14945
  maxTokens: 131072,
14475
14946
  },
@@ -14479,13 +14950,13 @@ export const MODELS = {
14479
14950
  api: "openai-completions",
14480
14951
  provider: "zai",
14481
14952
  baseUrl: "https://api.z.ai/api/coding/paas/v4",
14482
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14953
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
14483
14954
  reasoning: true,
14484
14955
  input: ["text"],
14485
14956
  cost: {
14486
- input: 1.2,
14487
- output: 4,
14488
- cacheRead: 0.24,
14957
+ input: 0,
14958
+ output: 0,
14959
+ cacheRead: 0,
14489
14960
  cacheWrite: 0,
14490
14961
  },
14491
14962
  contextWindow: 200000,
@@ -14497,31 +14968,13 @@ export const MODELS = {
14497
14968
  api: "openai-completions",
14498
14969
  provider: "zai",
14499
14970
  baseUrl: "https://api.z.ai/api/coding/paas/v4",
14500
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14971
+ compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai", "zaiToolStream": true },
14501
14972
  reasoning: true,
14502
14973
  input: ["text"],
14503
14974
  cost: {
14504
- input: 1.4,
14505
- output: 4.4,
14506
- cacheRead: 0.26,
14507
- cacheWrite: 0,
14508
- },
14509
- contextWindow: 200000,
14510
- maxTokens: 131072,
14511
- },
14512
- "glm-5v-turbo": {
14513
- id: "glm-5v-turbo",
14514
- name: "glm-5v-turbo",
14515
- api: "openai-completions",
14516
- provider: "zai",
14517
- baseUrl: "https://api.z.ai/api/coding/paas/v4",
14518
- compat: { "supportsDeveloperRole": false, "thinkingFormat": "zai" },
14519
- reasoning: true,
14520
- input: ["text", "image"],
14521
- cost: {
14522
- input: 1.2,
14523
- output: 4,
14524
- cacheRead: 0.24,
14975
+ input: 0,
14976
+ output: 0,
14977
+ cacheRead: 0,
14525
14978
  cacheWrite: 0,
14526
14979
  },
14527
14980
  contextWindow: 200000,