@earendil-works/pi-ai 0.79.1 → 0.79.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -354,7 +354,7 @@ export const MODELS = {
354
354
  provider: "amazon-bedrock",
355
355
  baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
356
356
  reasoning: true,
357
- thinkingLevelMap: { "xhigh": "xhigh" },
357
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
358
358
  input: ["text", "image"],
359
359
  cost: {
360
360
  input: 11,
@@ -494,7 +494,7 @@ export const MODELS = {
494
494
  provider: "amazon-bedrock",
495
495
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
496
496
  reasoning: true,
497
- thinkingLevelMap: { "xhigh": "xhigh" },
497
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
498
498
  input: ["text", "image"],
499
499
  cost: {
500
500
  input: 10,
@@ -1386,7 +1386,7 @@ export const MODELS = {
1386
1386
  provider: "amazon-bedrock",
1387
1387
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1388
1388
  reasoning: true,
1389
- thinkingLevelMap: { "xhigh": "xhigh" },
1389
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
1390
1390
  input: ["text", "image"],
1391
1391
  cost: {
1392
1392
  input: 10,
@@ -1875,7 +1875,7 @@ export const MODELS = {
1875
1875
  baseUrl: "https://api.anthropic.com",
1876
1876
  compat: { "forceAdaptiveThinking": true },
1877
1877
  reasoning: true,
1878
- thinkingLevelMap: { "xhigh": "xhigh" },
1878
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
1879
1879
  input: ["text", "image"],
1880
1880
  cost: {
1881
1881
  input: 10,
@@ -2916,30 +2916,13 @@ export const MODELS = {
2916
2916
  reasoning: true,
2917
2917
  input: ["text"],
2918
2918
  cost: {
2919
- input: 0.25,
2920
- output: 0.69,
2919
+ input: 0.35,
2920
+ output: 0.75,
2921
2921
  cacheRead: 0,
2922
2922
  cacheWrite: 0,
2923
2923
  },
2924
2924
  contextWindow: 131072,
2925
- maxTokens: 32768,
2926
- },
2927
- "llama3.1-8b": {
2928
- id: "llama3.1-8b",
2929
- name: "Llama 3.1 8B",
2930
- api: "openai-completions",
2931
- provider: "cerebras",
2932
- baseUrl: "https://api.cerebras.ai/v1",
2933
- reasoning: false,
2934
- input: ["text"],
2935
- cost: {
2936
- input: 0.1,
2937
- output: 0.1,
2938
- cacheRead: 0,
2939
- cacheWrite: 0,
2940
- },
2941
- contextWindow: 32000,
2942
- maxTokens: 8000,
2925
+ maxTokens: 40960,
2943
2926
  },
2944
2927
  "zai-glm-4.7": {
2945
2928
  id: "zai-glm-4.7",
@@ -2947,7 +2930,7 @@ export const MODELS = {
2947
2930
  api: "openai-completions",
2948
2931
  provider: "cerebras",
2949
2932
  baseUrl: "https://api.cerebras.ai/v1",
2950
- reasoning: false,
2933
+ reasoning: true,
2951
2934
  input: ["text"],
2952
2935
  cost: {
2953
2936
  input: 2.25,
@@ -2956,7 +2939,7 @@ export const MODELS = {
2956
2939
  cacheWrite: 0,
2957
2940
  },
2958
2941
  contextWindow: 131072,
2959
- maxTokens: 40000,
2942
+ maxTokens: 40960,
2960
2943
  },
2961
2944
  },
2962
2945
  "cloudflare-ai-gateway": {
@@ -3070,7 +3053,7 @@ export const MODELS = {
3070
3053
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3071
3054
  compat: { "forceAdaptiveThinking": true },
3072
3055
  reasoning: true,
3073
- thinkingLevelMap: { "xhigh": "xhigh" },
3056
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
3074
3057
  input: ["text", "image"],
3075
3058
  cost: {
3076
3059
  input: 10,
@@ -3719,6 +3702,24 @@ export const MODELS = {
3719
3702
  contextWindow: 262144,
3720
3703
  maxTokens: 256000,
3721
3704
  },
3705
+ "@cf/moonshotai/kimi-k2.7-code": {
3706
+ id: "@cf/moonshotai/kimi-k2.7-code",
3707
+ name: "Kimi K2.7 Code",
3708
+ api: "openai-completions",
3709
+ provider: "cloudflare-workers-ai",
3710
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3711
+ compat: { "sendSessionAffinityHeaders": true },
3712
+ reasoning: true,
3713
+ input: ["text", "image"],
3714
+ cost: {
3715
+ input: 0.95,
3716
+ output: 4,
3717
+ cacheRead: 0.19,
3718
+ cacheWrite: 0,
3719
+ },
3720
+ contextWindow: 262144,
3721
+ maxTokens: 262144,
3722
+ },
3722
3723
  "@cf/nvidia/nemotron-3-120b-a12b": {
3723
3724
  id: "@cf/nvidia/nemotron-3-120b-a12b",
3724
3725
  name: "Nemotron 3 Super 120B",
@@ -4087,6 +4088,25 @@ export const MODELS = {
4087
4088
  },
4088
4089
  },
4089
4090
  "github-copilot": {
4091
+ "claude-fable-5": {
4092
+ id: "claude-fable-5",
4093
+ name: "Claude Fable 5",
4094
+ api: "openai-completions",
4095
+ provider: "github-copilot",
4096
+ baseUrl: "https://api.individual.githubcopilot.com",
4097
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4098
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4099
+ reasoning: true,
4100
+ input: ["text", "image"],
4101
+ cost: {
4102
+ input: 10,
4103
+ output: 50,
4104
+ cacheRead: 1,
4105
+ cacheWrite: 12.5,
4106
+ },
4107
+ contextWindow: 1000000,
4108
+ maxTokens: 128000,
4109
+ },
4090
4110
  "claude-haiku-4.5": {
4091
4111
  id: "claude-haiku-4.5",
4092
4112
  name: "Claude Haiku 4.5 (latest)",
@@ -5019,77 +5039,9 @@ export const MODELS = {
5019
5039
  },
5020
5040
  },
5021
5041
  "groq": {
5022
- "deepseek-r1-distill-llama-70b": {
5023
- id: "deepseek-r1-distill-llama-70b",
5024
- name: "DeepSeek R1 Distill Llama 70B",
5025
- api: "openai-completions",
5026
- provider: "groq",
5027
- baseUrl: "https://api.groq.com/openai/v1",
5028
- reasoning: true,
5029
- input: ["text"],
5030
- cost: {
5031
- input: 0.75,
5032
- output: 0.99,
5033
- cacheRead: 0,
5034
- cacheWrite: 0,
5035
- },
5036
- contextWindow: 131072,
5037
- maxTokens: 8192,
5038
- },
5039
- "gemma2-9b-it": {
5040
- id: "gemma2-9b-it",
5041
- name: "Gemma 2 9B",
5042
- api: "openai-completions",
5043
- provider: "groq",
5044
- baseUrl: "https://api.groq.com/openai/v1",
5045
- reasoning: false,
5046
- input: ["text"],
5047
- cost: {
5048
- input: 0.2,
5049
- output: 0.2,
5050
- cacheRead: 0,
5051
- cacheWrite: 0,
5052
- },
5053
- contextWindow: 8192,
5054
- maxTokens: 8192,
5055
- },
5056
- "groq/compound": {
5057
- id: "groq/compound",
5058
- name: "Compound",
5059
- api: "openai-completions",
5060
- provider: "groq",
5061
- baseUrl: "https://api.groq.com/openai/v1",
5062
- reasoning: true,
5063
- input: ["text"],
5064
- cost: {
5065
- input: 0,
5066
- output: 0,
5067
- cacheRead: 0,
5068
- cacheWrite: 0,
5069
- },
5070
- contextWindow: 131072,
5071
- maxTokens: 8192,
5072
- },
5073
- "groq/compound-mini": {
5074
- id: "groq/compound-mini",
5075
- name: "Compound Mini",
5076
- api: "openai-completions",
5077
- provider: "groq",
5078
- baseUrl: "https://api.groq.com/openai/v1",
5079
- reasoning: true,
5080
- input: ["text"],
5081
- cost: {
5082
- input: 0,
5083
- output: 0,
5084
- cacheRead: 0,
5085
- cacheWrite: 0,
5086
- },
5087
- contextWindow: 131072,
5088
- maxTokens: 8192,
5089
- },
5090
5042
  "llama-3.1-8b-instant": {
5091
5043
  id: "llama-3.1-8b-instant",
5092
- name: "Llama 3.1 8B Instant",
5044
+ name: "Llama 3.1 8B",
5093
5045
  api: "openai-completions",
5094
5046
  provider: "groq",
5095
5047
  baseUrl: "https://api.groq.com/openai/v1",
@@ -5106,7 +5058,7 @@ export const MODELS = {
5106
5058
  },
5107
5059
  "llama-3.3-70b-versatile": {
5108
5060
  id: "llama-3.3-70b-versatile",
5109
- name: "Llama 3.3 70B Versatile",
5061
+ name: "Llama 3.3 70B",
5110
5062
  api: "openai-completions",
5111
5063
  provider: "groq",
5112
5064
  baseUrl: "https://api.groq.com/openai/v1",
@@ -5121,60 +5073,9 @@ export const MODELS = {
5121
5073
  contextWindow: 131072,
5122
5074
  maxTokens: 32768,
5123
5075
  },
5124
- "llama3-70b-8192": {
5125
- id: "llama3-70b-8192",
5126
- name: "Llama 3 70B",
5127
- api: "openai-completions",
5128
- provider: "groq",
5129
- baseUrl: "https://api.groq.com/openai/v1",
5130
- reasoning: false,
5131
- input: ["text"],
5132
- cost: {
5133
- input: 0.59,
5134
- output: 0.79,
5135
- cacheRead: 0,
5136
- cacheWrite: 0,
5137
- },
5138
- contextWindow: 8192,
5139
- maxTokens: 8192,
5140
- },
5141
- "llama3-8b-8192": {
5142
- id: "llama3-8b-8192",
5143
- name: "Llama 3 8B",
5144
- api: "openai-completions",
5145
- provider: "groq",
5146
- baseUrl: "https://api.groq.com/openai/v1",
5147
- reasoning: false,
5148
- input: ["text"],
5149
- cost: {
5150
- input: 0.05,
5151
- output: 0.08,
5152
- cacheRead: 0,
5153
- cacheWrite: 0,
5154
- },
5155
- contextWindow: 8192,
5156
- maxTokens: 8192,
5157
- },
5158
- "meta-llama/llama-4-maverick-17b-128e-instruct": {
5159
- id: "meta-llama/llama-4-maverick-17b-128e-instruct",
5160
- name: "Llama 4 Maverick 17B",
5161
- api: "openai-completions",
5162
- provider: "groq",
5163
- baseUrl: "https://api.groq.com/openai/v1",
5164
- reasoning: false,
5165
- input: ["text", "image"],
5166
- cost: {
5167
- input: 0.2,
5168
- output: 0.6,
5169
- cacheRead: 0,
5170
- cacheWrite: 0,
5171
- },
5172
- contextWindow: 131072,
5173
- maxTokens: 8192,
5174
- },
5175
5076
  "meta-llama/llama-4-scout-17b-16e-instruct": {
5176
5077
  id: "meta-llama/llama-4-scout-17b-16e-instruct",
5177
- name: "Llama 4 Scout 17B",
5078
+ name: "Llama 4 Scout 17B 16E",
5178
5079
  api: "openai-completions",
5179
5080
  provider: "groq",
5180
5081
  baseUrl: "https://api.groq.com/openai/v1",
@@ -5189,57 +5090,6 @@ export const MODELS = {
5189
5090
  contextWindow: 131072,
5190
5091
  maxTokens: 8192,
5191
5092
  },
5192
- "mistral-saba-24b": {
5193
- id: "mistral-saba-24b",
5194
- name: "Mistral Saba 24B",
5195
- api: "openai-completions",
5196
- provider: "groq",
5197
- baseUrl: "https://api.groq.com/openai/v1",
5198
- reasoning: false,
5199
- input: ["text"],
5200
- cost: {
5201
- input: 0.79,
5202
- output: 0.79,
5203
- cacheRead: 0,
5204
- cacheWrite: 0,
5205
- },
5206
- contextWindow: 32768,
5207
- maxTokens: 32768,
5208
- },
5209
- "moonshotai/kimi-k2-instruct": {
5210
- id: "moonshotai/kimi-k2-instruct",
5211
- name: "Kimi K2 Instruct",
5212
- api: "openai-completions",
5213
- provider: "groq",
5214
- baseUrl: "https://api.groq.com/openai/v1",
5215
- reasoning: false,
5216
- input: ["text"],
5217
- cost: {
5218
- input: 1,
5219
- output: 3,
5220
- cacheRead: 0,
5221
- cacheWrite: 0,
5222
- },
5223
- contextWindow: 131072,
5224
- maxTokens: 16384,
5225
- },
5226
- "moonshotai/kimi-k2-instruct-0905": {
5227
- id: "moonshotai/kimi-k2-instruct-0905",
5228
- name: "Kimi K2 Instruct 0905",
5229
- api: "openai-completions",
5230
- provider: "groq",
5231
- baseUrl: "https://api.groq.com/openai/v1",
5232
- reasoning: false,
5233
- input: ["text"],
5234
- cost: {
5235
- input: 1,
5236
- output: 3,
5237
- cacheRead: 0.5,
5238
- cacheWrite: 0,
5239
- },
5240
- contextWindow: 262144,
5241
- maxTokens: 16384,
5242
- },
5243
5093
  "openai/gpt-oss-120b": {
5244
5094
  id: "openai/gpt-oss-120b",
5245
5095
  name: "GPT OSS 120B",
@@ -5291,26 +5141,9 @@ export const MODELS = {
5291
5141
  contextWindow: 131072,
5292
5142
  maxTokens: 65536,
5293
5143
  },
5294
- "qwen-qwq-32b": {
5295
- id: "qwen-qwq-32b",
5296
- name: "Qwen QwQ 32B",
5297
- api: "openai-completions",
5298
- provider: "groq",
5299
- baseUrl: "https://api.groq.com/openai/v1",
5300
- reasoning: true,
5301
- input: ["text"],
5302
- cost: {
5303
- input: 0.29,
5304
- output: 0.39,
5305
- cacheRead: 0,
5306
- cacheWrite: 0,
5307
- },
5308
- contextWindow: 131072,
5309
- maxTokens: 16384,
5310
- },
5311
5144
  "qwen/qwen3-32b": {
5312
5145
  id: "qwen/qwen3-32b",
5313
- name: "Qwen3 32B",
5146
+ name: "Qwen3-32B",
5314
5147
  api: "openai-completions",
5315
5148
  provider: "groq",
5316
5149
  baseUrl: "https://api.groq.com/openai/v1",
@@ -5726,6 +5559,24 @@ export const MODELS = {
5726
5559
  },
5727
5560
  },
5728
5561
  "kimi-coding": {
5562
+ "k2p7": {
5563
+ id: "k2p7",
5564
+ name: "Kimi K2.7 Code",
5565
+ api: "anthropic-messages",
5566
+ provider: "kimi-coding",
5567
+ baseUrl: "https://api.kimi.com/coding",
5568
+ headers: { "User-Agent": "KimiCLI/1.5" },
5569
+ reasoning: true,
5570
+ input: ["text", "image"],
5571
+ cost: {
5572
+ input: 0,
5573
+ output: 0,
5574
+ cacheRead: 0,
5575
+ cacheWrite: 0,
5576
+ },
5577
+ contextWindow: 262144,
5578
+ maxTokens: 32768,
5579
+ },
5729
5580
  "kimi-for-coding": {
5730
5581
  id: "kimi-for-coding",
5731
5582
  name: "Kimi For Coding",
@@ -6508,6 +6359,24 @@ export const MODELS = {
6508
6359
  contextWindow: 262144,
6509
6360
  maxTokens: 262144,
6510
6361
  },
6362
+ "kimi-k2.7-code": {
6363
+ id: "kimi-k2.7-code",
6364
+ name: "Kimi K2.7 Code",
6365
+ api: "openai-completions",
6366
+ provider: "moonshotai",
6367
+ baseUrl: "https://api.moonshot.ai/v1",
6368
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6369
+ reasoning: true,
6370
+ input: ["text", "image"],
6371
+ cost: {
6372
+ input: 0.95,
6373
+ output: 4,
6374
+ cacheRead: 0.19,
6375
+ cacheWrite: 0,
6376
+ },
6377
+ contextWindow: 262144,
6378
+ maxTokens: 262144,
6379
+ },
6511
6380
  },
6512
6381
  "moonshotai-cn": {
6513
6382
  "kimi-k2-0711-preview": {
@@ -6760,8 +6629,8 @@ export const MODELS = {
6760
6629
  baseUrl: "https://integrate.api.nvidia.com/v1",
6761
6630
  headers: { "NVCF-POLL-SECONDS": "3600" },
6762
6631
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6763
- reasoning: false,
6764
- input: ["text"],
6632
+ reasoning: true,
6633
+ input: ["text", "image"],
6765
6634
  cost: {
6766
6635
  input: 0,
6767
6636
  output: 0,
@@ -6790,44 +6659,6 @@ export const MODELS = {
6790
6659
  contextWindow: 262144,
6791
6660
  maxTokens: 262144,
6792
6661
  },
6793
- "nvidia/llama-3.3-nemotron-super-49b-v1": {
6794
- id: "nvidia/llama-3.3-nemotron-super-49b-v1",
6795
- name: "Llama 3.3 Nemotron Super 49B v1",
6796
- api: "openai-completions",
6797
- provider: "nvidia",
6798
- baseUrl: "https://integrate.api.nvidia.com/v1",
6799
- headers: { "NVCF-POLL-SECONDS": "3600" },
6800
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6801
- reasoning: true,
6802
- input: ["text"],
6803
- cost: {
6804
- input: 0,
6805
- output: 0,
6806
- cacheRead: 0,
6807
- cacheWrite: 0,
6808
- },
6809
- contextWindow: 131072,
6810
- maxTokens: 131072,
6811
- },
6812
- "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
6813
- id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
6814
- name: "Llama 3.3 Nemotron Super 49B v1.5",
6815
- api: "openai-completions",
6816
- provider: "nvidia",
6817
- baseUrl: "https://integrate.api.nvidia.com/v1",
6818
- headers: { "NVCF-POLL-SECONDS": "3600" },
6819
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6820
- reasoning: true,
6821
- input: ["text"],
6822
- cost: {
6823
- input: 0,
6824
- output: 0,
6825
- cacheRead: 0,
6826
- cacheWrite: 0,
6827
- },
6828
- contextWindow: 131072,
6829
- maxTokens: 131072,
6830
- },
6831
6662
  "nvidia/nemotron-3-nano-30b-a3b": {
6832
6663
  id: "nvidia/nemotron-3-nano-30b-a3b",
6833
6664
  name: "nemotron-3-nano-30b-a3b",
@@ -6923,9 +6754,9 @@ export const MODELS = {
6923
6754
  contextWindow: 131072,
6924
6755
  maxTokens: 131072,
6925
6756
  },
6926
- "openai/gpt-oss-20b": {
6927
- id: "openai/gpt-oss-20b",
6928
- name: "GPT OSS 20B",
6757
+ "openai/gpt-oss-120b": {
6758
+ id: "openai/gpt-oss-120b",
6759
+ name: "GPT-OSS-120B",
6929
6760
  api: "openai-completions",
6930
6761
  provider: "nvidia",
6931
6762
  baseUrl: "https://integrate.api.nvidia.com/v1",
@@ -6939,18 +6770,18 @@ export const MODELS = {
6939
6770
  cacheRead: 0,
6940
6771
  cacheWrite: 0,
6941
6772
  },
6942
- contextWindow: 131072,
6943
- maxTokens: 32768,
6773
+ contextWindow: 128000,
6774
+ maxTokens: 8192,
6944
6775
  },
6945
- "qwen/qwen3-coder-480b-a35b-instruct": {
6946
- id: "qwen/qwen3-coder-480b-a35b-instruct",
6947
- name: "Qwen3 Coder 480B A35B Instruct",
6776
+ "openai/gpt-oss-20b": {
6777
+ id: "openai/gpt-oss-20b",
6778
+ name: "GPT OSS 20B",
6948
6779
  api: "openai-completions",
6949
6780
  provider: "nvidia",
6950
6781
  baseUrl: "https://integrate.api.nvidia.com/v1",
6951
6782
  headers: { "NVCF-POLL-SECONDS": "3600" },
6952
6783
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6953
- reasoning: false,
6784
+ reasoning: true,
6954
6785
  input: ["text"],
6955
6786
  cost: {
6956
6787
  input: 0,
@@ -6958,8 +6789,8 @@ export const MODELS = {
6958
6789
  cacheRead: 0,
6959
6790
  cacheWrite: 0,
6960
6791
  },
6961
- contextWindow: 262144,
6962
- maxTokens: 66536,
6792
+ contextWindow: 131072,
6793
+ maxTokens: 32768,
6963
6794
  },
6964
6795
  "qwen/qwen3.5-122b-a10b": {
6965
6796
  id: "qwen/qwen3.5-122b-a10b",
@@ -7548,7 +7379,7 @@ export const MODELS = {
7548
7379
  cacheRead: 0.25,
7549
7380
  cacheWrite: 0,
7550
7381
  },
7551
- contextWindow: 272000,
7382
+ contextWindow: 1050000,
7552
7383
  maxTokens: 128000,
7553
7384
  },
7554
7385
  "gpt-5.4-mini": {
@@ -7620,7 +7451,7 @@ export const MODELS = {
7620
7451
  cacheRead: 0.5,
7621
7452
  cacheWrite: 0,
7622
7453
  },
7623
- contextWindow: 272000,
7454
+ contextWindow: 1050000,
7624
7455
  maxTokens: 128000,
7625
7456
  },
7626
7457
  "gpt-5.5-pro": {
@@ -7812,7 +7643,7 @@ export const MODELS = {
7812
7643
  cacheRead: 0.25,
7813
7644
  cacheWrite: 0,
7814
7645
  },
7815
- contextWindow: 272000,
7646
+ contextWindow: 1000000,
7816
7647
  maxTokens: 128000,
7817
7648
  },
7818
7649
  "gpt-5.4-mini": {
@@ -7830,7 +7661,7 @@ export const MODELS = {
7830
7661
  cacheRead: 0.075,
7831
7662
  cacheWrite: 0,
7832
7663
  },
7833
- contextWindow: 272000,
7664
+ contextWindow: 400000,
7834
7665
  maxTokens: 128000,
7835
7666
  },
7836
7667
  "gpt-5.5": {
@@ -7848,7 +7679,7 @@ export const MODELS = {
7848
7679
  cacheRead: 0.5,
7849
7680
  cacheWrite: 0,
7850
7681
  },
7851
- contextWindow: 272000,
7682
+ contextWindow: 400000,
7852
7683
  maxTokens: 128000,
7853
7684
  },
7854
7685
  },
@@ -7879,7 +7710,7 @@ export const MODELS = {
7879
7710
  baseUrl: "https://opencode.ai/zen",
7880
7711
  compat: { "forceAdaptiveThinking": true },
7881
7712
  reasoning: true,
7882
- thinkingLevelMap: { "xhigh": "xhigh" },
7713
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
7883
7714
  input: ["text", "image"],
7884
7715
  cost: {
7885
7716
  input: 10,
@@ -8063,7 +7894,7 @@ export const MODELS = {
8063
7894
  cost: {
8064
7895
  input: 0.14,
8065
7896
  output: 0.28,
8066
- cacheRead: 0.03,
7897
+ cacheRead: 0.028,
8067
7898
  cacheWrite: 0,
8068
7899
  },
8069
7900
  contextWindow: 1000000,
@@ -8088,6 +7919,25 @@ export const MODELS = {
8088
7919
  contextWindow: 200000,
8089
7920
  maxTokens: 128000,
8090
7921
  },
7922
+ "deepseek-v4-pro": {
7923
+ id: "deepseek-v4-pro",
7924
+ name: "DeepSeek V4 Pro",
7925
+ api: "openai-completions",
7926
+ provider: "opencode",
7927
+ baseUrl: "https://opencode.ai/zen/v1",
7928
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7929
+ reasoning: true,
7930
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7931
+ input: ["text"],
7932
+ cost: {
7933
+ input: 1.74,
7934
+ output: 3.84,
7935
+ cacheRead: 0.145,
7936
+ cacheWrite: 0,
7937
+ },
7938
+ contextWindow: 1000000,
7939
+ maxTokens: 384000,
7940
+ },
8091
7941
  "gemini-3-flash": {
8092
7942
  id: "gemini-3-flash",
8093
7943
  name: "Gemini 3 Flash",
@@ -8721,42 +8571,42 @@ export const MODELS = {
8721
8571
  contextWindow: 202752,
8722
8572
  maxTokens: 32768,
8723
8573
  },
8724
- "kimi-k2.5": {
8725
- id: "kimi-k2.5",
8726
- name: "Kimi K2.5",
8574
+ "kimi-k2.6": {
8575
+ id: "kimi-k2.6",
8576
+ name: "Kimi K2.6",
8727
8577
  api: "openai-completions",
8728
8578
  provider: "opencode-go",
8729
8579
  baseUrl: "https://opencode.ai/zen/go/v1",
8730
- compat: { "maxTokensField": "max_tokens" },
8580
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8731
8581
  reasoning: true,
8582
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
8732
8583
  input: ["text", "image"],
8733
8584
  cost: {
8734
- input: 0.6,
8735
- output: 3,
8736
- cacheRead: 0.1,
8585
+ input: 0.95,
8586
+ output: 4,
8587
+ cacheRead: 0.16,
8737
8588
  cacheWrite: 0,
8738
8589
  },
8739
8590
  contextWindow: 262144,
8740
8591
  maxTokens: 65536,
8741
8592
  },
8742
- "kimi-k2.6": {
8743
- id: "kimi-k2.6",
8744
- name: "Kimi K2.6",
8593
+ "kimi-k2.7-code": {
8594
+ id: "kimi-k2.7-code",
8595
+ name: "Kimi K2.7 Code",
8745
8596
  api: "openai-completions",
8746
8597
  provider: "opencode-go",
8747
8598
  baseUrl: "https://opencode.ai/zen/go/v1",
8748
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8599
+ compat: { "maxTokensField": "max_tokens" },
8749
8600
  reasoning: true,
8750
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
8751
8601
  input: ["text", "image"],
8752
8602
  cost: {
8753
8603
  input: 0.95,
8754
8604
  output: 4,
8755
- cacheRead: 0.16,
8605
+ cacheRead: 0.19,
8756
8606
  cacheWrite: 0,
8757
8607
  },
8758
8608
  contextWindow: 262144,
8759
- maxTokens: 65536,
8609
+ maxTokens: 262144,
8760
8610
  },
8761
8611
  "mimo-v2.5": {
8762
8612
  id: "mimo-v2.5",
@@ -8794,23 +8644,6 @@ export const MODELS = {
8794
8644
  contextWindow: 1048576,
8795
8645
  maxTokens: 128000,
8796
8646
  },
8797
- "minimax-m2.5": {
8798
- id: "minimax-m2.5",
8799
- name: "MiniMax M2.5",
8800
- api: "anthropic-messages",
8801
- provider: "opencode-go",
8802
- baseUrl: "https://opencode.ai/zen/go",
8803
- reasoning: true,
8804
- input: ["text"],
8805
- cost: {
8806
- input: 0.3,
8807
- output: 1.2,
8808
- cacheRead: 0.03,
8809
- cacheWrite: 0,
8810
- },
8811
- contextWindow: 204800,
8812
- maxTokens: 65536,
8813
- },
8814
8647
  "minimax-m2.7": {
8815
8648
  id: "minimax-m2.7",
8816
8649
  name: "MiniMax M2.7",
@@ -8831,16 +8664,16 @@ export const MODELS = {
8831
8664
  },
8832
8665
  "minimax-m3": {
8833
8666
  id: "minimax-m3",
8834
- name: "MiniMax M3",
8667
+ name: "MiniMax M3 (3x usage)",
8835
8668
  api: "anthropic-messages",
8836
8669
  provider: "opencode-go",
8837
8670
  baseUrl: "https://opencode.ai/zen/go",
8838
8671
  reasoning: true,
8839
8672
  input: ["text", "image"],
8840
8673
  cost: {
8841
- input: 0.3,
8842
- output: 1.2,
8843
- cacheRead: 0.06,
8674
+ input: 0.1,
8675
+ output: 0.4,
8676
+ cacheRead: 0.02,
8844
8677
  cacheWrite: 0,
8845
8678
  },
8846
8679
  contextWindow: 512000,
@@ -8994,8 +8827,8 @@ export const MODELS = {
8994
8827
  reasoning: false,
8995
8828
  input: ["text", "image"],
8996
8829
  cost: {
8997
- input: 0.7999999999999999,
8998
- output: 3.1999999999999997,
8830
+ input: 0.8,
8831
+ output: 3.2,
8999
8832
  cacheRead: 0,
9000
8833
  cacheWrite: 0,
9001
8834
  },
@@ -9028,7 +8861,7 @@ export const MODELS = {
9028
8861
  reasoning: false,
9029
8862
  input: ["text", "image"],
9030
8863
  cost: {
9031
- input: 0.7999999999999999,
8864
+ input: 0.8,
9032
8865
  output: 4,
9033
8866
  cacheRead: 0.08,
9034
8867
  cacheWrite: 1,
@@ -9064,7 +8897,7 @@ export const MODELS = {
9064
8897
  cost: {
9065
8898
  input: 1,
9066
8899
  output: 5,
9067
- cacheRead: 0.09999999999999999,
8900
+ cacheRead: 0.1,
9068
8901
  cacheWrite: 1.25,
9069
8902
  },
9070
8903
  contextWindow: 200000,
@@ -9408,8 +9241,8 @@ export const MODELS = {
9408
9241
  reasoning: true,
9409
9242
  input: ["text", "image"],
9410
9243
  cost: {
9411
- input: 0.09999999999999999,
9412
- output: 0.39999999999999997,
9244
+ input: 0.1,
9245
+ output: 0.4,
9413
9246
  cacheRead: 0,
9414
9247
  cacheWrite: 0,
9415
9248
  },
@@ -9459,8 +9292,8 @@ export const MODELS = {
9459
9292
  reasoning: false,
9460
9293
  input: ["text"],
9461
9294
  cost: {
9462
- input: 0.20020000000000002,
9463
- output: 0.8000999999999999,
9295
+ input: 0.2002,
9296
+ output: 0.8001,
9464
9297
  cacheRead: 0,
9465
9298
  cacheWrite: 0,
9466
9299
  },
@@ -9476,7 +9309,7 @@ export const MODELS = {
9476
9309
  reasoning: false,
9477
9310
  input: ["text"],
9478
9311
  cost: {
9479
- input: 0.19999999999999998,
9312
+ input: 0.2,
9480
9313
  output: 0.77,
9481
9314
  cacheRead: 0.135,
9482
9315
  cacheWrite: 0,
@@ -9494,7 +9327,7 @@ export const MODELS = {
9494
9327
  input: ["text"],
9495
9328
  cost: {
9496
9329
  input: 0.21,
9497
- output: 0.7899999999999999,
9330
+ output: 0.79,
9498
9331
  cacheRead: 0.13,
9499
9332
  cacheWrite: 0,
9500
9333
  },
@@ -9528,7 +9361,7 @@ export const MODELS = {
9528
9361
  input: ["text"],
9529
9362
  cost: {
9530
9363
  input: 0.5,
9531
- output: 2.1500000000000004,
9364
+ output: 2.15,
9532
9365
  cacheRead: 0.35,
9533
9366
  cacheWrite: 0,
9534
9367
  },
@@ -9597,13 +9430,13 @@ export const MODELS = {
9597
9430
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
9598
9431
  input: ["text"],
9599
9432
  cost: {
9600
- input: 0.0983,
9601
- output: 0.1966,
9602
- cacheRead: 0.019700000000000002,
9433
+ input: 0.098,
9434
+ output: 0.196,
9435
+ cacheRead: 0.02,
9603
9436
  cacheWrite: 0,
9604
9437
  },
9605
9438
  contextWindow: 1048576,
9606
- maxTokens: 131072,
9439
+ maxTokens: 4096,
9607
9440
  },
9608
9441
  "deepseek/deepseek-v4-pro": {
9609
9442
  id: "deepseek/deepseek-v4-pro",
@@ -9653,7 +9486,7 @@ export const MODELS = {
9653
9486
  input: 0.3,
9654
9487
  output: 2.5,
9655
9488
  cacheRead: 0.03,
9656
- cacheWrite: 0.08333333333333334,
9489
+ cacheWrite: 0.083333,
9657
9490
  },
9658
9491
  contextWindow: 1048576,
9659
9492
  maxTokens: 65535,
@@ -9667,10 +9500,10 @@ export const MODELS = {
9667
9500
  reasoning: true,
9668
9501
  input: ["text", "image"],
9669
9502
  cost: {
9670
- input: 0.09999999999999999,
9671
- output: 0.39999999999999997,
9503
+ input: 0.1,
9504
+ output: 0.4,
9672
9505
  cacheRead: 0.01,
9673
- cacheWrite: 0.08333333333333334,
9506
+ cacheWrite: 0.083333,
9674
9507
  },
9675
9508
  contextWindow: 1048576,
9676
9509
  maxTokens: 65535,
@@ -9684,10 +9517,10 @@ export const MODELS = {
9684
9517
  reasoning: true,
9685
9518
  input: ["text", "image"],
9686
9519
  cost: {
9687
- input: 0.09999999999999999,
9688
- output: 0.39999999999999997,
9520
+ input: 0.1,
9521
+ output: 0.4,
9689
9522
  cacheRead: 0.01,
9690
- cacheWrite: 0.08333333333333334,
9523
+ cacheWrite: 0.083333,
9691
9524
  },
9692
9525
  contextWindow: 1048576,
9693
9526
  maxTokens: 65535,
@@ -9754,8 +9587,8 @@ export const MODELS = {
9754
9587
  cost: {
9755
9588
  input: 0.5,
9756
9589
  output: 3,
9757
- cacheRead: 0.049999999999999996,
9758
- cacheWrite: 0.08333333333333334,
9590
+ cacheRead: 0.05,
9591
+ cacheWrite: 0.083333,
9759
9592
  },
9760
9593
  contextWindow: 1048576,
9761
9594
  maxTokens: 65536,
@@ -9771,8 +9604,8 @@ export const MODELS = {
9771
9604
  cost: {
9772
9605
  input: 0.25,
9773
9606
  output: 1.5,
9774
- cacheRead: 0.024999999999999998,
9775
- cacheWrite: 0.08333333333333334,
9607
+ cacheRead: 0.025,
9608
+ cacheWrite: 0.083333,
9776
9609
  },
9777
9610
  contextWindow: 1048576,
9778
9611
  maxTokens: 65536,
@@ -9788,8 +9621,8 @@ export const MODELS = {
9788
9621
  cost: {
9789
9622
  input: 0.25,
9790
9623
  output: 1.5,
9791
- cacheRead: 0.024999999999999998,
9792
- cacheWrite: 0.08333333333333334,
9624
+ cacheRead: 0.025,
9625
+ cacheWrite: 0.083333,
9793
9626
  },
9794
9627
  contextWindow: 1048576,
9795
9628
  maxTokens: 65536,
@@ -9805,7 +9638,7 @@ export const MODELS = {
9805
9638
  cost: {
9806
9639
  input: 2,
9807
9640
  output: 12,
9808
- cacheRead: 0.19999999999999998,
9641
+ cacheRead: 0.2,
9809
9642
  cacheWrite: 0.375,
9810
9643
  },
9811
9644
  contextWindow: 1048576,
@@ -9822,7 +9655,7 @@ export const MODELS = {
9822
9655
  cost: {
9823
9656
  input: 2,
9824
9657
  output: 12,
9825
- cacheRead: 0.19999999999999998,
9658
+ cacheRead: 0.2,
9826
9659
  cacheWrite: 0.375,
9827
9660
  },
9828
9661
  contextWindow: 1048756,
@@ -9840,7 +9673,7 @@ export const MODELS = {
9840
9673
  input: 1.5,
9841
9674
  output: 9,
9842
9675
  cacheRead: 0.15,
9843
- cacheWrite: 0.08333333333333334,
9676
+ cacheWrite: 0.083333,
9844
9677
  },
9845
9678
  contextWindow: 1048576,
9846
9679
  maxTokens: 65536,
@@ -9854,7 +9687,7 @@ export const MODELS = {
9854
9687
  reasoning: false,
9855
9688
  input: ["text", "image"],
9856
9689
  cost: {
9857
- input: 0.049999999999999996,
9690
+ input: 0.05,
9858
9691
  output: 0.15,
9859
9692
  cacheRead: 0,
9860
9693
  cacheWrite: 0,
@@ -9923,12 +9756,12 @@ export const MODELS = {
9923
9756
  input: ["text", "image"],
9924
9757
  cost: {
9925
9758
  input: 0.12,
9926
- output: 0.36,
9759
+ output: 0.35,
9927
9760
  cacheRead: 0.09,
9928
9761
  cacheWrite: 0,
9929
9762
  },
9930
9763
  contextWindow: 262144,
9931
- maxTokens: 8192,
9764
+ maxTokens: 262144,
9932
9765
  },
9933
9766
  "google/gemma-4-31b-it:free": {
9934
9767
  id: "google/gemma-4-31b-it:free",
@@ -9956,9 +9789,9 @@ export const MODELS = {
9956
9789
  reasoning: false,
9957
9790
  input: ["text"],
9958
9791
  cost: {
9959
- input: 0.049999999999999996,
9960
- output: 0.09999999999999999,
9961
- cacheRead: 0.049999999999999996,
9792
+ input: 0.05,
9793
+ output: 0.1,
9794
+ cacheRead: 0.05,
9962
9795
  cacheWrite: 0,
9963
9796
  },
9964
9797
  contextWindow: 131072,
@@ -9976,7 +9809,7 @@ export const MODELS = {
9976
9809
  cost: {
9977
9810
  input: 0.25,
9978
9811
  output: 0.75,
9979
- cacheRead: 0.024999999999999998,
9812
+ cacheRead: 0.025,
9980
9813
  cacheWrite: 0,
9981
9814
  },
9982
9815
  contextWindow: 128000,
@@ -10059,8 +9892,8 @@ export const MODELS = {
10059
9892
  reasoning: false,
10060
9893
  input: ["text"],
10061
9894
  cost: {
10062
- input: 0.39999999999999997,
10063
- output: 0.39999999999999997,
9895
+ input: 0.4,
9896
+ output: 0.4,
10064
9897
  cacheRead: 0,
10065
9898
  cacheWrite: 0,
10066
9899
  },
@@ -10093,7 +9926,7 @@ export const MODELS = {
10093
9926
  reasoning: false,
10094
9927
  input: ["text"],
10095
9928
  cost: {
10096
- input: 0.09999999999999999,
9929
+ input: 0.1,
10097
9930
  output: 0.32,
10098
9931
  cacheRead: 0,
10099
9932
  cacheWrite: 0,
@@ -10144,7 +9977,7 @@ export const MODELS = {
10144
9977
  reasoning: false,
10145
9978
  input: ["text", "image"],
10146
9979
  cost: {
10147
- input: 0.09999999999999999,
9980
+ input: 0.1,
10148
9981
  output: 0.3,
10149
9982
  cacheRead: 0,
10150
9983
  cacheWrite: 0,
@@ -10161,7 +9994,7 @@ export const MODELS = {
10161
9994
  reasoning: true,
10162
9995
  input: ["text"],
10163
9996
  cost: {
10164
- input: 0.39999999999999997,
9997
+ input: 0.4,
10165
9998
  output: 2.2,
10166
9999
  cacheRead: 0,
10167
10000
  cacheWrite: 0,
@@ -10213,8 +10046,8 @@ export const MODELS = {
10213
10046
  input: ["text"],
10214
10047
  cost: {
10215
10048
  input: 0.15,
10216
- output: 0.8999999999999999,
10217
- cacheRead: 0.049999999999999996,
10049
+ output: 0.9,
10050
+ cacheRead: 0.05,
10218
10051
  cacheWrite: 0,
10219
10052
  },
10220
10053
  contextWindow: 204800,
@@ -10229,9 +10062,9 @@ export const MODELS = {
10229
10062
  reasoning: true,
10230
10063
  input: ["text"],
10231
10064
  cost: {
10232
- input: 0.27,
10233
- output: 1.08,
10234
- cacheRead: 0.054,
10065
+ input: 0.25,
10066
+ output: 1,
10067
+ cacheRead: 0.05,
10235
10068
  cacheWrite: 0,
10236
10069
  },
10237
10070
  contextWindow: 204800,
@@ -10264,7 +10097,7 @@ export const MODELS = {
10264
10097
  input: ["text"],
10265
10098
  cost: {
10266
10099
  input: 0.3,
10267
- output: 0.8999999999999999,
10100
+ output: 0.9,
10268
10101
  cacheRead: 0.03,
10269
10102
  cacheWrite: 0,
10270
10103
  },
@@ -10280,7 +10113,7 @@ export const MODELS = {
10280
10113
  reasoning: false,
10281
10114
  input: ["text"],
10282
10115
  cost: {
10283
- input: 0.39999999999999997,
10116
+ input: 0.4,
10284
10117
  output: 2,
10285
10118
  cacheRead: 0.04,
10286
10119
  cacheWrite: 0,
@@ -10297,8 +10130,8 @@ export const MODELS = {
10297
10130
  reasoning: false,
10298
10131
  input: ["text", "image"],
10299
10132
  cost: {
10300
- input: 0.19999999999999998,
10301
- output: 0.19999999999999998,
10133
+ input: 0.2,
10134
+ output: 0.2,
10302
10135
  cacheRead: 0.02,
10303
10136
  cacheWrite: 0,
10304
10137
  },
@@ -10314,8 +10147,8 @@ export const MODELS = {
10314
10147
  reasoning: false,
10315
10148
  input: ["text", "image"],
10316
10149
  cost: {
10317
- input: 0.09999999999999999,
10318
- output: 0.09999999999999999,
10150
+ input: 0.1,
10151
+ output: 0.1,
10319
10152
  cacheRead: 0.01,
10320
10153
  cacheWrite: 0,
10321
10154
  },
@@ -10350,7 +10183,7 @@ export const MODELS = {
10350
10183
  cost: {
10351
10184
  input: 2,
10352
10185
  output: 6,
10353
- cacheRead: 0.19999999999999998,
10186
+ cacheRead: 0.2,
10354
10187
  cacheWrite: 0,
10355
10188
  },
10356
10189
  contextWindow: 128000,
@@ -10367,7 +10200,7 @@ export const MODELS = {
10367
10200
  cost: {
10368
10201
  input: 2,
10369
10202
  output: 6,
10370
- cacheRead: 0.19999999999999998,
10203
+ cacheRead: 0.2,
10371
10204
  cacheWrite: 0,
10372
10205
  },
10373
10206
  contextWindow: 131072,
@@ -10384,7 +10217,7 @@ export const MODELS = {
10384
10217
  cost: {
10385
10218
  input: 0.5,
10386
10219
  output: 1.5,
10387
- cacheRead: 0.049999999999999996,
10220
+ cacheRead: 0.05,
10388
10221
  cacheWrite: 0,
10389
10222
  },
10390
10223
  contextWindow: 262144,
@@ -10399,7 +10232,7 @@ export const MODELS = {
10399
10232
  reasoning: false,
10400
10233
  input: ["text", "image"],
10401
10234
  cost: {
10402
- input: 0.39999999999999997,
10235
+ input: 0.4,
10403
10236
  output: 2,
10404
10237
  cacheRead: 0.04,
10405
10238
  cacheWrite: 0,
@@ -10433,7 +10266,7 @@ export const MODELS = {
10433
10266
  reasoning: false,
10434
10267
  input: ["text", "image"],
10435
10268
  cost: {
10436
- input: 0.39999999999999997,
10269
+ input: 0.4,
10437
10270
  output: 2,
10438
10271
  cacheRead: 0.04,
10439
10272
  cacheWrite: 0,
@@ -10467,7 +10300,7 @@ export const MODELS = {
10467
10300
  reasoning: false,
10468
10301
  input: ["text"],
10469
10302
  cost: {
10470
- input: 0.19999999999999998,
10303
+ input: 0.2,
10471
10304
  output: 0.6,
10472
10305
  cacheRead: 0.02,
10473
10306
  cacheWrite: 0,
@@ -10502,7 +10335,7 @@ export const MODELS = {
10502
10335
  input: ["text", "image"],
10503
10336
  cost: {
10504
10337
  input: 0.075,
10505
- output: 0.19999999999999998,
10338
+ output: 0.2,
10506
10339
  cacheRead: 0,
10507
10340
  cacheWrite: 0,
10508
10341
  },
@@ -10520,7 +10353,7 @@ export const MODELS = {
10520
10353
  cost: {
10521
10354
  input: 2,
10522
10355
  output: 6,
10523
- cacheRead: 0.19999999999999998,
10356
+ cacheRead: 0.2,
10524
10357
  cacheWrite: 0,
10525
10358
  },
10526
10359
  contextWindow: 65536,
@@ -10535,7 +10368,7 @@ export const MODELS = {
10535
10368
  reasoning: false,
10536
10369
  input: ["text"],
10537
10370
  cost: {
10538
- input: 0.09999999999999999,
10371
+ input: 0.1,
10539
10372
  output: 0.3,
10540
10373
  cacheRead: 0.01,
10541
10374
  cacheWrite: 0,
@@ -10552,7 +10385,7 @@ export const MODELS = {
10552
10385
  reasoning: false,
10553
10386
  input: ["text"],
10554
10387
  cost: {
10555
- input: 0.5700000000000001,
10388
+ input: 0.57,
10556
10389
  output: 2.3,
10557
10390
  cacheRead: 0,
10558
10391
  cacheWrite: 0,
@@ -10621,27 +10454,26 @@ export const MODELS = {
10621
10454
  reasoning: true,
10622
10455
  input: ["text", "image"],
10623
10456
  cost: {
10624
- input: 0.6799999999999999,
10457
+ input: 0.68,
10625
10458
  output: 3.41,
10626
- cacheRead: 0.33999999999999997,
10459
+ cacheRead: 0.34,
10627
10460
  cacheWrite: 0,
10628
10461
  },
10629
10462
  contextWindow: 262144,
10630
10463
  maxTokens: 262142,
10631
10464
  },
10632
- "moonshotai/kimi-k2.6:free": {
10633
- id: "moonshotai/kimi-k2.6:free",
10634
- name: "MoonshotAI: Kimi K2.6 (free)",
10465
+ "moonshotai/kimi-k2.7-code": {
10466
+ id: "moonshotai/kimi-k2.7-code",
10467
+ name: "MoonshotAI: Kimi K2.7 Code",
10635
10468
  api: "openai-completions",
10636
10469
  provider: "openrouter",
10637
10470
  baseUrl: "https://openrouter.ai/api/v1",
10638
- compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
10639
10471
  reasoning: true,
10640
10472
  input: ["text", "image"],
10641
10473
  cost: {
10642
- input: 0,
10643
- output: 0,
10644
- cacheRead: 0,
10474
+ input: 0.95,
10475
+ output: 4,
10476
+ cacheRead: 0.19,
10645
10477
  cacheWrite: 0,
10646
10478
  },
10647
10479
  contextWindow: 262144,
@@ -10673,8 +10505,8 @@ export const MODELS = {
10673
10505
  reasoning: true,
10674
10506
  input: ["text"],
10675
10507
  cost: {
10676
- input: 0.39999999999999997,
10677
- output: 0.39999999999999997,
10508
+ input: 0.4,
10509
+ output: 0.4,
10678
10510
  cacheRead: 0,
10679
10511
  cacheWrite: 0,
10680
10512
  },
@@ -10690,8 +10522,8 @@ export const MODELS = {
10690
10522
  reasoning: true,
10691
10523
  input: ["text"],
10692
10524
  cost: {
10693
- input: 0.049999999999999996,
10694
- output: 0.19999999999999998,
10525
+ input: 0.05,
10526
+ output: 0.2,
10695
10527
  cacheRead: 0,
10696
10528
  cacheWrite: 0,
10697
10529
  },
@@ -10742,7 +10574,7 @@ export const MODELS = {
10742
10574
  input: ["text"],
10743
10575
  cost: {
10744
10576
  input: 0.09,
10745
- output: 0.44999999999999996,
10577
+ output: 0.45,
10746
10578
  cacheRead: 0,
10747
10579
  cacheWrite: 0,
10748
10580
  },
@@ -10817,23 +10649,6 @@ export const MODELS = {
10817
10649
  contextWindow: 128000,
10818
10650
  maxTokens: 128000,
10819
10651
  },
10820
- "nvidia/nemotron-nano-9b-v2": {
10821
- id: "nvidia/nemotron-nano-9b-v2",
10822
- name: "NVIDIA: Nemotron Nano 9B V2",
10823
- api: "openai-completions",
10824
- provider: "openrouter",
10825
- baseUrl: "https://openrouter.ai/api/v1",
10826
- reasoning: true,
10827
- input: ["text"],
10828
- cost: {
10829
- input: 0.04,
10830
- output: 0.16,
10831
- cacheRead: 0,
10832
- cacheWrite: 0,
10833
- },
10834
- contextWindow: 131072,
10835
- maxTokens: 16384,
10836
- },
10837
10652
  "nvidia/nemotron-nano-9b-v2:free": {
10838
10653
  id: "nvidia/nemotron-nano-9b-v2:free",
10839
10654
  name: "NVIDIA: Nemotron Nano 9B V2 (free)",
@@ -10979,9 +10794,9 @@ export const MODELS = {
10979
10794
  reasoning: false,
10980
10795
  input: ["text", "image"],
10981
10796
  cost: {
10982
- input: 0.39999999999999997,
10983
- output: 1.5999999999999999,
10984
- cacheRead: 0.09999999999999999,
10797
+ input: 0.4,
10798
+ output: 1.6,
10799
+ cacheRead: 0.1,
10985
10800
  cacheWrite: 0,
10986
10801
  },
10987
10802
  contextWindow: 1047576,
@@ -10996,9 +10811,9 @@ export const MODELS = {
10996
10811
  reasoning: false,
10997
10812
  input: ["text", "image"],
10998
10813
  cost: {
10999
- input: 0.09999999999999999,
11000
- output: 0.39999999999999997,
11001
- cacheRead: 0.024999999999999998,
10814
+ input: 0.1,
10815
+ output: 0.4,
10816
+ cacheRead: 0.025,
11002
10817
  cacheWrite: 0,
11003
10818
  },
11004
10819
  contextWindow: 1047576,
@@ -11151,7 +10966,7 @@ export const MODELS = {
11151
10966
  cost: {
11152
10967
  input: 0.25,
11153
10968
  output: 2,
11154
- cacheRead: 0.024999999999999998,
10969
+ cacheRead: 0.025,
11155
10970
  cacheWrite: 0,
11156
10971
  },
11157
10972
  contextWindow: 400000,
@@ -11166,8 +10981,8 @@ export const MODELS = {
11166
10981
  reasoning: true,
11167
10982
  input: ["text", "image"],
11168
10983
  cost: {
11169
- input: 0.049999999999999996,
11170
- output: 0.39999999999999997,
10984
+ input: 0.05,
10985
+ output: 0.4,
11171
10986
  cacheRead: 0.01,
11172
10987
  cacheWrite: 0,
11173
10988
  },
@@ -11270,7 +11085,7 @@ export const MODELS = {
11270
11085
  cost: {
11271
11086
  input: 0.25,
11272
11087
  output: 2,
11273
- cacheRead: 0.024999999999999998,
11088
+ cacheRead: 0.025,
11274
11089
  cacheWrite: 0,
11275
11090
  },
11276
11091
  contextWindow: 400000,
@@ -11430,7 +11245,7 @@ export const MODELS = {
11430
11245
  thinkingLevelMap: { "xhigh": "xhigh" },
11431
11246
  input: ["text", "image"],
11432
11247
  cost: {
11433
- input: 0.19999999999999998,
11248
+ input: 0.2,
11434
11249
  output: 1.25,
11435
11250
  cacheRead: 0.02,
11436
11251
  cacheWrite: 0,
@@ -11875,7 +11690,7 @@ export const MODELS = {
11875
11690
  reasoning: true,
11876
11691
  input: ["text"],
11877
11692
  cost: {
11878
- input: 0.19999999999999998,
11693
+ input: 0.2,
11879
11694
  output: 1.1,
11880
11695
  cacheRead: 0,
11881
11696
  cacheWrite: 0,
@@ -11893,7 +11708,7 @@ export const MODELS = {
11893
11708
  input: ["text"],
11894
11709
  cost: {
11895
11710
  input: 0.36,
11896
- output: 0.39999999999999997,
11711
+ output: 0.4,
11897
11712
  cacheRead: 0,
11898
11713
  cacheWrite: 0,
11899
11714
  },
@@ -11911,7 +11726,7 @@ export const MODELS = {
11911
11726
  cost: {
11912
11727
  input: 0.26,
11913
11728
  output: 0.78,
11914
- cacheRead: 0.052000000000000005,
11729
+ cacheRead: 0.052,
11915
11730
  cacheWrite: 0.325,
11916
11731
  },
11917
11732
  contextWindow: 1000000,
@@ -11960,7 +11775,7 @@ export const MODELS = {
11960
11775
  reasoning: true,
11961
11776
  input: ["text"],
11962
11777
  cost: {
11963
- input: 0.09999999999999999,
11778
+ input: 0.1,
11964
11779
  output: 0.24,
11965
11780
  cacheRead: 0,
11966
11781
  cacheWrite: 0,
@@ -11977,8 +11792,8 @@ export const MODELS = {
11977
11792
  reasoning: true,
11978
11793
  input: ["text"],
11979
11794
  cost: {
11980
- input: 0.45499999999999996,
11981
- output: 1.8199999999999998,
11795
+ input: 0.455,
11796
+ output: 1.82,
11982
11797
  cacheRead: 0,
11983
11798
  cacheWrite: 0,
11984
11799
  },
@@ -11995,7 +11810,7 @@ export const MODELS = {
11995
11810
  input: ["text"],
11996
11811
  cost: {
11997
11812
  input: 0.09,
11998
- output: 0.09999999999999999,
11813
+ output: 0.1,
11999
11814
  cacheRead: 0,
12000
11815
  cacheWrite: 0,
12001
11816
  },
@@ -12011,9 +11826,9 @@ export const MODELS = {
12011
11826
  reasoning: true,
12012
11827
  input: ["text"],
12013
11828
  cost: {
12014
- input: 0.09999999999999999,
12015
- output: 0.09999999999999999,
12016
- cacheRead: 0.09999999999999999,
11829
+ input: 0.1,
11830
+ output: 0.1,
11831
+ cacheRead: 0.1,
12017
11832
  cacheWrite: 0,
12018
11833
  },
12019
11834
  contextWindow: 262144,
@@ -12063,7 +11878,7 @@ export const MODELS = {
12063
11878
  input: ["text"],
12064
11879
  cost: {
12065
11880
  input: 0.08,
12066
- output: 0.39999999999999997,
11881
+ output: 0.4,
12067
11882
  cacheRead: 0.08,
12068
11883
  cacheWrite: 0,
12069
11884
  },
@@ -12096,9 +11911,9 @@ export const MODELS = {
12096
11911
  reasoning: true,
12097
11912
  input: ["text"],
12098
11913
  cost: {
12099
- input: 0.049999999999999996,
12100
- output: 0.39999999999999997,
12101
- cacheRead: 0.049999999999999996,
11914
+ input: 0.05,
11915
+ output: 0.4,
11916
+ cacheRead: 0.05,
12102
11917
  cacheWrite: 0,
12103
11918
  },
12104
11919
  contextWindow: 131072,
@@ -12114,7 +11929,7 @@ export const MODELS = {
12114
11929
  input: ["text"],
12115
11930
  cost: {
12116
11931
  input: 0.22,
12117
- output: 1.7999999999999998,
11932
+ output: 1.8,
12118
11933
  cacheRead: 0,
12119
11934
  cacheWrite: 0,
12120
11935
  },
@@ -12165,7 +11980,7 @@ export const MODELS = {
12165
11980
  input: ["text"],
12166
11981
  cost: {
12167
11982
  input: 0.11,
12168
- output: 0.7999999999999999,
11983
+ output: 0.8,
12169
11984
  cacheRead: 0.07,
12170
11985
  cacheWrite: 0,
12171
11986
  },
@@ -12300,7 +12115,7 @@ export const MODELS = {
12300
12115
  reasoning: false,
12301
12116
  input: ["text", "image"],
12302
12117
  cost: {
12303
- input: 0.19999999999999998,
12118
+ input: 0.2,
12304
12119
  output: 0.88,
12305
12120
  cacheRead: 0.11,
12306
12121
  cacheWrite: 0,
@@ -12368,8 +12183,8 @@ export const MODELS = {
12368
12183
  reasoning: false,
12369
12184
  input: ["text", "image"],
12370
12185
  cost: {
12371
- input: 0.10400000000000001,
12372
- output: 0.41600000000000004,
12186
+ input: 0.104,
12187
+ output: 0.416,
12373
12188
  cacheRead: 0,
12374
12189
  cacheWrite: 0,
12375
12190
  },
@@ -12455,7 +12270,7 @@ export const MODELS = {
12455
12270
  cost: {
12456
12271
  input: 0.14,
12457
12272
  output: 1,
12458
- cacheRead: 0.049999999999999996,
12273
+ cacheRead: 0.05,
12459
12274
  cacheWrite: 0,
12460
12275
  },
12461
12276
  contextWindow: 262144,
@@ -12487,7 +12302,7 @@ export const MODELS = {
12487
12302
  reasoning: true,
12488
12303
  input: ["text", "image"],
12489
12304
  cost: {
12490
- input: 0.09999999999999999,
12305
+ input: 0.1,
12491
12306
  output: 0.15,
12492
12307
  cacheRead: 0,
12493
12308
  cacheWrite: 0,
@@ -12539,7 +12354,7 @@ export const MODELS = {
12539
12354
  input: ["text", "image"],
12540
12355
  cost: {
12541
12356
  input: 0.3,
12542
- output: 1.7999999999999998,
12357
+ output: 1.8,
12543
12358
  cacheRead: 0,
12544
12359
  cacheWrite: 0.375,
12545
12360
  },
@@ -12555,13 +12370,13 @@ export const MODELS = {
12555
12370
  reasoning: true,
12556
12371
  input: ["text", "image"],
12557
12372
  cost: {
12558
- input: 0.28900000000000003,
12559
- output: 2.4,
12373
+ input: 0.2885,
12374
+ output: 3.17,
12560
12375
  cacheRead: 0,
12561
12376
  cacheWrite: 0,
12562
12377
  },
12563
12378
  contextWindow: 262144,
12564
- maxTokens: 131072,
12379
+ maxTokens: 262140,
12565
12380
  },
12566
12381
  "qwen/qwen3.6-35b-a3b": {
12567
12382
  id: "qwen/qwen3.6-35b-a3b",
@@ -12572,13 +12387,13 @@ export const MODELS = {
12572
12387
  reasoning: true,
12573
12388
  input: ["text", "image"],
12574
12389
  cost: {
12575
- input: 0.14,
12390
+ input: 0.15,
12576
12391
  output: 1,
12577
- cacheRead: 0,
12392
+ cacheRead: 0.05,
12578
12393
  cacheWrite: 0,
12579
12394
  },
12580
12395
  contextWindow: 262144,
12581
- maxTokens: 262140,
12396
+ maxTokens: 262144,
12582
12397
  },
12583
12398
  "qwen/qwen3.6-flash": {
12584
12399
  id: "qwen/qwen3.6-flash",
@@ -12657,10 +12472,10 @@ export const MODELS = {
12657
12472
  reasoning: true,
12658
12473
  input: ["text", "image"],
12659
12474
  cost: {
12660
- input: 0.39999999999999997,
12661
- output: 1.5999999999999999,
12662
- cacheRead: 0.08,
12663
- cacheWrite: 0.5,
12475
+ input: 0.32,
12476
+ output: 1.28,
12477
+ cacheRead: 0.064,
12478
+ cacheWrite: 0.4,
12664
12479
  },
12665
12480
  contextWindow: 1000000,
12666
12481
  maxTokens: 65536,
@@ -12674,8 +12489,8 @@ export const MODELS = {
12674
12489
  reasoning: false,
12675
12490
  input: ["text", "image"],
12676
12491
  cost: {
12677
- input: 0.09999999999999999,
12678
- output: 0.09999999999999999,
12492
+ input: 0.1,
12493
+ output: 0.1,
12679
12494
  cacheRead: 0,
12680
12495
  cacheWrite: 0,
12681
12496
  },
@@ -12742,7 +12557,7 @@ export const MODELS = {
12742
12557
  reasoning: true,
12743
12558
  input: ["text", "image"],
12744
12559
  cost: {
12745
- input: 0.19999999999999998,
12560
+ input: 0.2,
12746
12561
  output: 1.15,
12747
12562
  cacheRead: 0.04,
12748
12563
  cacheWrite: 0,
@@ -12761,7 +12576,7 @@ export const MODELS = {
12761
12576
  cost: {
12762
12577
  input: 0.063,
12763
12578
  output: 0.21,
12764
- cacheRead: 0.020999999999999998,
12579
+ cacheRead: 0.021,
12765
12580
  cacheWrite: 0,
12766
12581
  },
12767
12582
  contextWindow: 262144,
@@ -12776,7 +12591,7 @@ export const MODELS = {
12776
12591
  reasoning: false,
12777
12592
  input: ["text"],
12778
12593
  cost: {
12779
- input: 0.16999999999999998,
12594
+ input: 0.17,
12780
12595
  output: 0.43,
12781
12596
  cacheRead: 0,
12782
12597
  cacheWrite: 0,
@@ -12793,8 +12608,8 @@ export const MODELS = {
12793
12608
  reasoning: false,
12794
12609
  input: ["text"],
12795
12610
  cost: {
12796
- input: 0.39999999999999997,
12797
- output: 0.39999999999999997,
12611
+ input: 0.4,
12612
+ output: 0.4,
12798
12613
  cacheRead: 0,
12799
12614
  cacheWrite: 0,
12800
12615
  },
@@ -12829,7 +12644,7 @@ export const MODELS = {
12829
12644
  cost: {
12830
12645
  input: 1.25,
12831
12646
  output: 2.5,
12832
- cacheRead: 0.19999999999999998,
12647
+ cacheRead: 0.2,
12833
12648
  cacheWrite: 0,
12834
12649
  },
12835
12650
  contextWindow: 2000000,
@@ -12846,7 +12661,7 @@ export const MODELS = {
12846
12661
  cost: {
12847
12662
  input: 1.25,
12848
12663
  output: 2.5,
12849
- cacheRead: 0.19999999999999998,
12664
+ cacheRead: 0.2,
12850
12665
  cacheWrite: 0,
12851
12666
  },
12852
12667
  contextWindow: 1000000,
@@ -12863,7 +12678,7 @@ export const MODELS = {
12863
12678
  cost: {
12864
12679
  input: 1,
12865
12680
  output: 2,
12866
- cacheRead: 0.19999999999999998,
12681
+ cacheRead: 0.2,
12867
12682
  cacheWrite: 0,
12868
12683
  },
12869
12684
  contextWindow: 256000,
@@ -12878,7 +12693,7 @@ export const MODELS = {
12878
12693
  reasoning: true,
12879
12694
  input: ["text"],
12880
12695
  cost: {
12881
- input: 0.09999999999999999,
12696
+ input: 0.1,
12882
12697
  output: 0.3,
12883
12698
  cacheRead: 0.01,
12884
12699
  cacheWrite: 0,
@@ -12920,23 +12735,6 @@ export const MODELS = {
12920
12735
  contextWindow: 1048576,
12921
12736
  maxTokens: 131072,
12922
12737
  },
12923
- "z-ai/glm-4-32b": {
12924
- id: "z-ai/glm-4-32b",
12925
- name: "Z.ai: GLM 4 32B ",
12926
- api: "openai-completions",
12927
- provider: "openrouter",
12928
- baseUrl: "https://openrouter.ai/api/v1",
12929
- reasoning: false,
12930
- input: ["text"],
12931
- cost: {
12932
- input: 0.09999999999999999,
12933
- output: 0.09999999999999999,
12934
- cacheRead: 0,
12935
- cacheWrite: 0,
12936
- },
12937
- contextWindow: 128000,
12938
- maxTokens: 4096,
12939
- },
12940
12738
  "z-ai/glm-4.5": {
12941
12739
  id: "z-ai/glm-4.5",
12942
12740
  name: "Z.ai: GLM 4.5",
@@ -12971,23 +12769,6 @@ export const MODELS = {
12971
12769
  contextWindow: 131072,
12972
12770
  maxTokens: 131070,
12973
12771
  },
12974
- "z-ai/glm-4.5-air:free": {
12975
- id: "z-ai/glm-4.5-air:free",
12976
- name: "Z.ai: GLM 4.5 Air (free)",
12977
- api: "openai-completions",
12978
- provider: "openrouter",
12979
- baseUrl: "https://openrouter.ai/api/v1",
12980
- reasoning: true,
12981
- input: ["text"],
12982
- cost: {
12983
- input: 0,
12984
- output: 0,
12985
- cacheRead: 0,
12986
- cacheWrite: 0,
12987
- },
12988
- contextWindow: 131072,
12989
- maxTokens: 96000,
12990
- },
12991
12772
  "z-ai/glm-4.5v": {
12992
12773
  id: "z-ai/glm-4.5v",
12993
12774
  name: "Z.ai: GLM 4.5V",
@@ -12998,7 +12779,7 @@ export const MODELS = {
12998
12779
  input: ["text", "image"],
12999
12780
  cost: {
13000
12781
  input: 0.6,
13001
- output: 1.7999999999999998,
12782
+ output: 1.8,
13002
12783
  cacheRead: 0.11,
13003
12784
  cacheWrite: 0,
13004
12785
  },
@@ -13032,12 +12813,12 @@ export const MODELS = {
13032
12813
  input: ["text", "image"],
13033
12814
  cost: {
13034
12815
  input: 0.3,
13035
- output: 0.8999999999999999,
13036
- cacheRead: 0.049999999999999996,
12816
+ output: 0.9,
12817
+ cacheRead: 0.055,
13037
12818
  cacheWrite: 0,
13038
12819
  },
13039
12820
  contextWindow: 131072,
13040
- maxTokens: 24000,
12821
+ maxTokens: 32768,
13041
12822
  },
13042
12823
  "z-ai/glm-4.7": {
13043
12824
  id: "z-ai/glm-4.7",
@@ -13048,7 +12829,7 @@ export const MODELS = {
13048
12829
  reasoning: true,
13049
12830
  input: ["text"],
13050
12831
  cost: {
13051
- input: 0.39999999999999997,
12832
+ input: 0.4,
13052
12833
  output: 1.75,
13053
12834
  cacheRead: 0.08,
13054
12835
  cacheWrite: 0,
@@ -13066,7 +12847,7 @@ export const MODELS = {
13066
12847
  input: ["text"],
13067
12848
  cost: {
13068
12849
  input: 0.06,
13069
- output: 0.39999999999999997,
12850
+ output: 0.4,
13070
12851
  cacheRead: 0.01,
13071
12852
  cacheWrite: 0,
13072
12853
  },
@@ -13104,7 +12885,7 @@ export const MODELS = {
13104
12885
  cacheRead: 0.24,
13105
12886
  cacheWrite: 0,
13106
12887
  },
13107
- contextWindow: 202752,
12888
+ contextWindow: 262144,
13108
12889
  maxTokens: 131072,
13109
12890
  },
13110
12891
  "z-ai/glm-5.1": {
@@ -13124,23 +12905,6 @@ export const MODELS = {
13124
12905
  contextWindow: 202752,
13125
12906
  maxTokens: 4096,
13126
12907
  },
13127
- "z-ai/glm-5v-turbo": {
13128
- id: "z-ai/glm-5v-turbo",
13129
- name: "Z.ai: GLM 5V Turbo",
13130
- api: "openai-completions",
13131
- provider: "openrouter",
13132
- baseUrl: "https://openrouter.ai/api/v1",
13133
- reasoning: true,
13134
- input: ["text", "image"],
13135
- cost: {
13136
- input: 1.2,
13137
- output: 4,
13138
- cacheRead: 0.24,
13139
- cacheWrite: 0,
13140
- },
13141
- contextWindow: 202752,
13142
- maxTokens: 131072,
13143
- },
13144
12908
  "~anthropic/claude-fable-latest": {
13145
12909
  id: "~anthropic/claude-fable-latest",
13146
12910
  name: "Anthropic: Claude Fable Latest",
@@ -13169,7 +12933,7 @@ export const MODELS = {
13169
12933
  cost: {
13170
12934
  input: 1,
13171
12935
  output: 5,
13172
- cacheRead: 0.09999999999999999,
12936
+ cacheRead: 0.1,
13173
12937
  cacheWrite: 1.25,
13174
12938
  },
13175
12939
  contextWindow: 200000,
@@ -13221,7 +12985,7 @@ export const MODELS = {
13221
12985
  input: 1.5,
13222
12986
  output: 9,
13223
12987
  cacheRead: 0.15,
13224
- cacheWrite: 0.08333333333333334,
12988
+ cacheWrite: 0.083333,
13225
12989
  },
13226
12990
  contextWindow: 1048576,
13227
12991
  maxTokens: 65536,
@@ -13237,7 +13001,7 @@ export const MODELS = {
13237
13001
  cost: {
13238
13002
  input: 2,
13239
13003
  output: 12,
13240
- cacheRead: 0.19999999999999998,
13004
+ cacheRead: 0.2,
13241
13005
  cacheWrite: 0.375,
13242
13006
  },
13243
13007
  contextWindow: 1048576,
@@ -13252,9 +13016,9 @@ export const MODELS = {
13252
13016
  reasoning: true,
13253
13017
  input: ["text", "image"],
13254
13018
  cost: {
13255
- input: 0.6799999999999999,
13019
+ input: 0.68,
13256
13020
  output: 3.41,
13257
- cacheRead: 0.33999999999999997,
13021
+ cacheRead: 0.34,
13258
13022
  cacheWrite: 0,
13259
13023
  },
13260
13024
  contextWindow: 262144,
@@ -13296,25 +13060,6 @@ export const MODELS = {
13296
13060
  },
13297
13061
  },
13298
13062
  "together": {
13299
- "MiniMaxAI/MiniMax-M2.5": {
13300
- id: "MiniMaxAI/MiniMax-M2.5",
13301
- name: "MiniMax-M2.5",
13302
- api: "openai-completions",
13303
- provider: "together",
13304
- baseUrl: "https://api.together.ai/v1",
13305
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13306
- reasoning: true,
13307
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13308
- input: ["text"],
13309
- cost: {
13310
- input: 0.3,
13311
- output: 1.2,
13312
- cacheRead: 0.06,
13313
- cacheWrite: 0,
13314
- },
13315
- contextWindow: 204800,
13316
- maxTokens: 131072,
13317
- },
13318
13063
  "MiniMaxAI/MiniMax-M2.7": {
13319
13064
  id: "MiniMaxAI/MiniMax-M2.7",
13320
13065
  name: "MiniMax-M2.7",
@@ -13334,28 +13079,27 @@ export const MODELS = {
13334
13079
  contextWindow: 202752,
13335
13080
  maxTokens: 131072,
13336
13081
  },
13337
- "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
13338
- id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
13339
- name: "Qwen3 235B A22B Instruct 2507 FP8",
13082
+ "Qwen/Qwen2.5-7B-Instruct-Turbo": {
13083
+ id: "Qwen/Qwen2.5-7B-Instruct-Turbo",
13084
+ name: "Qwen 2.5 7B Instruct Turbo",
13340
13085
  api: "openai-completions",
13341
13086
  provider: "together",
13342
13087
  baseUrl: "https://api.together.ai/v1",
13343
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13344
- reasoning: true,
13345
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13088
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
13089
+ reasoning: false,
13346
13090
  input: ["text"],
13347
13091
  cost: {
13348
- input: 0.2,
13349
- output: 0.6,
13092
+ input: 0.3,
13093
+ output: 0.3,
13350
13094
  cacheRead: 0,
13351
13095
  cacheWrite: 0,
13352
13096
  },
13353
- contextWindow: 262144,
13354
- maxTokens: 262144,
13097
+ contextWindow: 32768,
13098
+ maxTokens: 32768,
13355
13099
  },
13356
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8": {
13357
- id: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
13358
- name: "Qwen3 Coder 480B A35B Instruct",
13100
+ "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
13101
+ id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
13102
+ name: "Qwen3 235B A22B Instruct 2507 FP8",
13359
13103
  api: "openai-completions",
13360
13104
  provider: "together",
13361
13105
  baseUrl: "https://api.together.ai/v1",
@@ -13363,36 +13107,36 @@ export const MODELS = {
13363
13107
  reasoning: false,
13364
13108
  input: ["text"],
13365
13109
  cost: {
13366
- input: 2,
13367
- output: 2,
13110
+ input: 0.2,
13111
+ output: 0.6,
13368
13112
  cacheRead: 0,
13369
13113
  cacheWrite: 0,
13370
13114
  },
13371
13115
  contextWindow: 262144,
13372
13116
  maxTokens: 262144,
13373
13117
  },
13374
- "Qwen/Qwen3-Coder-Next-FP8": {
13375
- id: "Qwen/Qwen3-Coder-Next-FP8",
13376
- name: "Qwen3 Coder Next FP8",
13118
+ "Qwen/Qwen3.5-397B-A17B": {
13119
+ id: "Qwen/Qwen3.5-397B-A17B",
13120
+ name: "Qwen3.5 397B A17B",
13377
13121
  api: "openai-completions",
13378
13122
  provider: "together",
13379
13123
  baseUrl: "https://api.together.ai/v1",
13380
13124
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13381
13125
  reasoning: true,
13382
13126
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13383
- input: ["text"],
13127
+ input: ["text", "image"],
13384
13128
  cost: {
13385
- input: 0.5,
13386
- output: 1.2,
13129
+ input: 0.6,
13130
+ output: 3.6,
13387
13131
  cacheRead: 0,
13388
13132
  cacheWrite: 0,
13389
13133
  },
13390
13134
  contextWindow: 262144,
13391
- maxTokens: 262144,
13135
+ maxTokens: 130000,
13392
13136
  },
13393
- "Qwen/Qwen3.5-397B-A17B": {
13394
- id: "Qwen/Qwen3.5-397B-A17B",
13395
- name: "Qwen3.5 397B A17B",
13137
+ "Qwen/Qwen3.5-9B": {
13138
+ id: "Qwen/Qwen3.5-9B",
13139
+ name: "Qwen3.5 9B",
13396
13140
  api: "openai-completions",
13397
13141
  provider: "together",
13398
13142
  baseUrl: "https://api.together.ai/v1",
@@ -13401,13 +13145,13 @@ export const MODELS = {
13401
13145
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13402
13146
  input: ["text", "image"],
13403
13147
  cost: {
13404
- input: 0.6,
13405
- output: 3.6,
13148
+ input: 0.17,
13149
+ output: 0.25,
13406
13150
  cacheRead: 0,
13407
13151
  cacheWrite: 0,
13408
13152
  },
13409
13153
  contextWindow: 262144,
13410
- maxTokens: 130000,
13154
+ maxTokens: 65536,
13411
13155
  },
13412
13156
  "Qwen/Qwen3.6-Plus": {
13413
13157
  id: "Qwen/Qwen3.6-Plus",
@@ -13434,9 +13178,8 @@ export const MODELS = {
13434
13178
  api: "openai-completions",
13435
13179
  provider: "together",
13436
13180
  baseUrl: "https://api.together.ai/v1",
13437
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13438
- reasoning: true,
13439
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13181
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
13182
+ reasoning: false,
13440
13183
  input: ["text"],
13441
13184
  cost: {
13442
13185
  input: 2.5,
@@ -13447,44 +13190,6 @@ export const MODELS = {
13447
13190
  contextWindow: 1000000,
13448
13191
  maxTokens: 500000,
13449
13192
  },
13450
- "deepseek-ai/DeepSeek-V3": {
13451
- id: "deepseek-ai/DeepSeek-V3",
13452
- name: "DeepSeek-V3",
13453
- api: "openai-completions",
13454
- provider: "together",
13455
- baseUrl: "https://api.together.ai/v1",
13456
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13457
- reasoning: true,
13458
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13459
- input: ["text"],
13460
- cost: {
13461
- input: 1.25,
13462
- output: 1.25,
13463
- cacheRead: 0,
13464
- cacheWrite: 0,
13465
- },
13466
- contextWindow: 131072,
13467
- maxTokens: 131072,
13468
- },
13469
- "deepseek-ai/DeepSeek-V3-1": {
13470
- id: "deepseek-ai/DeepSeek-V3-1",
13471
- name: "DeepSeek V3.1",
13472
- api: "openai-completions",
13473
- provider: "together",
13474
- baseUrl: "https://api.together.ai/v1",
13475
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13476
- reasoning: true,
13477
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13478
- input: ["text"],
13479
- cost: {
13480
- input: 0.6,
13481
- output: 1.7,
13482
- cacheRead: 0,
13483
- cacheWrite: 0,
13484
- },
13485
- contextWindow: 131072,
13486
- maxTokens: 131072,
13487
- },
13488
13193
  "deepseek-ai/DeepSeek-V4-Pro": {
13489
13194
  id: "deepseek-ai/DeepSeek-V4-Pro",
13490
13195
  name: "DeepSeek V4 Pro",
@@ -13496,8 +13201,8 @@ export const MODELS = {
13496
13201
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": null },
13497
13202
  input: ["text"],
13498
13203
  cost: {
13499
- input: 2.1,
13500
- output: 4.4,
13204
+ input: 1.74,
13205
+ output: 3.48,
13501
13206
  cacheRead: 0.2,
13502
13207
  cacheWrite: 0,
13503
13208
  },
@@ -13533,8 +13238,8 @@ export const MODELS = {
13533
13238
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13534
13239
  input: ["text", "image"],
13535
13240
  cost: {
13536
- input: 0.2,
13537
- output: 0.5,
13241
+ input: 0.39,
13242
+ output: 0.97,
13538
13243
  cacheRead: 0,
13539
13244
  cacheWrite: 0,
13540
13245
  },
@@ -13559,25 +13264,6 @@ export const MODELS = {
13559
13264
  contextWindow: 131072,
13560
13265
  maxTokens: 131072,
13561
13266
  },
13562
- "moonshotai/Kimi-K2.5": {
13563
- id: "moonshotai/Kimi-K2.5",
13564
- name: "Kimi K2.5",
13565
- api: "openai-completions",
13566
- provider: "together",
13567
- baseUrl: "https://api.together.ai/v1",
13568
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13569
- reasoning: true,
13570
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13571
- input: ["text", "image"],
13572
- cost: {
13573
- input: 0.5,
13574
- output: 2.8,
13575
- cacheRead: 0,
13576
- cacheWrite: 0,
13577
- },
13578
- contextWindow: 262144,
13579
- maxTokens: 262144,
13580
- },
13581
13267
  "moonshotai/Kimi-K2.6": {
13582
13268
  id: "moonshotai/Kimi-K2.6",
13583
13269
  name: "Kimi K2.6",
@@ -13635,6 +13321,44 @@ export const MODELS = {
13635
13321
  contextWindow: 131072,
13636
13322
  maxTokens: 131072,
13637
13323
  },
13324
+ "openai/gpt-oss-20b": {
13325
+ id: "openai/gpt-oss-20b",
13326
+ name: "GPT OSS 20B",
13327
+ api: "openai-completions",
13328
+ provider: "together",
13329
+ baseUrl: "https://api.together.ai/v1",
13330
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "openai" },
13331
+ reasoning: true,
13332
+ thinkingLevelMap: { "off": null, "minimal": null },
13333
+ input: ["text"],
13334
+ cost: {
13335
+ input: 0.05,
13336
+ output: 0.2,
13337
+ cacheRead: 0,
13338
+ cacheWrite: 0,
13339
+ },
13340
+ contextWindow: 131072,
13341
+ maxTokens: 131072,
13342
+ },
13343
+ "zai-org/GLM-5": {
13344
+ id: "zai-org/GLM-5",
13345
+ name: "GLM-5",
13346
+ api: "openai-completions",
13347
+ provider: "together",
13348
+ baseUrl: "https://api.together.ai/v1",
13349
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13350
+ reasoning: true,
13351
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13352
+ input: ["text"],
13353
+ cost: {
13354
+ input: 1,
13355
+ output: 3.2,
13356
+ cacheRead: 0,
13357
+ cacheWrite: 0,
13358
+ },
13359
+ contextWindow: 202752,
13360
+ maxTokens: 131072,
13361
+ },
13638
13362
  "zai-org/GLM-5.1": {
13639
13363
  id: "zai-org/GLM-5.1",
13640
13364
  name: "GLM-5.1",
@@ -13750,7 +13474,7 @@ export const MODELS = {
13750
13474
  reasoning: true,
13751
13475
  input: ["text", "image"],
13752
13476
  cost: {
13753
- input: 0.39999999999999997,
13477
+ input: 0.4,
13754
13478
  output: 4,
13755
13479
  cacheRead: 0,
13756
13480
  cacheWrite: 0,
@@ -13820,7 +13544,7 @@ export const MODELS = {
13820
13544
  cost: {
13821
13545
  input: 1,
13822
13546
  output: 5,
13823
- cacheRead: 0.19999999999999998,
13547
+ cacheRead: 0.2,
13824
13548
  cacheWrite: 0,
13825
13549
  },
13826
13550
  contextWindow: 1000000,
@@ -13920,7 +13644,7 @@ export const MODELS = {
13920
13644
  reasoning: true,
13921
13645
  input: ["text", "image"],
13922
13646
  cost: {
13923
- input: 0.39999999999999997,
13647
+ input: 0.4,
13924
13648
  output: 4,
13925
13649
  cacheRead: 0,
13926
13650
  cacheWrite: 0,
@@ -13937,8 +13661,8 @@ export const MODELS = {
13937
13661
  reasoning: true,
13938
13662
  input: ["text", "image"],
13939
13663
  cost: {
13940
- input: 0.09999999999999999,
13941
- output: 0.39999999999999997,
13664
+ input: 0.1,
13665
+ output: 0.4,
13942
13666
  cacheRead: 0.001,
13943
13667
  cacheWrite: 0.125,
13944
13668
  },
@@ -13954,7 +13678,7 @@ export const MODELS = {
13954
13678
  reasoning: true,
13955
13679
  input: ["text", "image"],
13956
13680
  cost: {
13957
- input: 0.39999999999999997,
13681
+ input: 0.4,
13958
13682
  output: 2.4,
13959
13683
  cacheRead: 0.04,
13960
13684
  cacheWrite: 0.5,
@@ -13972,7 +13696,7 @@ export const MODELS = {
13972
13696
  input: ["text", "image"],
13973
13697
  cost: {
13974
13698
  input: 0.6,
13975
- output: 3.5999999999999996,
13699
+ output: 3.6,
13976
13700
  cacheRead: 0,
13977
13701
  cacheWrite: 0,
13978
13702
  },
@@ -13990,7 +13714,7 @@ export const MODELS = {
13990
13714
  cost: {
13991
13715
  input: 0.5,
13992
13716
  output: 3,
13993
- cacheRead: 0.09999999999999999,
13717
+ cacheRead: 0.1,
13994
13718
  cacheWrite: 0.625,
13995
13719
  },
13996
13720
  contextWindow: 1000000,
@@ -14022,8 +13746,8 @@ export const MODELS = {
14022
13746
  reasoning: true,
14023
13747
  input: ["text", "image"],
14024
13748
  cost: {
14025
- input: 0.39999999999999997,
14026
- output: 1.5999999999999999,
13749
+ input: 0.4,
13750
+ output: 1.6,
14027
13751
  cacheRead: 0.08,
14028
13752
  cacheWrite: 0.5,
14029
13753
  },
@@ -14056,7 +13780,7 @@ export const MODELS = {
14056
13780
  reasoning: false,
14057
13781
  input: ["text", "image"],
14058
13782
  cost: {
14059
- input: 0.7999999999999999,
13783
+ input: 0.8,
14060
13784
  output: 4,
14061
13785
  cacheRead: 0.08,
14062
13786
  cacheWrite: 1,
@@ -14072,7 +13796,7 @@ export const MODELS = {
14072
13796
  baseUrl: "https://ai-gateway.vercel.sh",
14073
13797
  compat: { "forceAdaptiveThinking": true },
14074
13798
  reasoning: true,
14075
- thinkingLevelMap: { "xhigh": "xhigh" },
13799
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
14076
13800
  input: ["text", "image"],
14077
13801
  cost: {
14078
13802
  input: 10,
@@ -14094,7 +13818,7 @@ export const MODELS = {
14094
13818
  cost: {
14095
13819
  input: 1,
14096
13820
  output: 5,
14097
- cacheRead: 0.09999999999999999,
13821
+ cacheRead: 0.1,
14098
13822
  cacheWrite: 1.25,
14099
13823
  },
14100
13824
  contextWindow: 200000,
@@ -14287,7 +14011,7 @@ export const MODELS = {
14287
14011
  input: ["text"],
14288
14012
  cost: {
14289
14013
  input: 0.25,
14290
- output: 0.8999999999999999,
14014
+ output: 0.9,
14291
14015
  cacheRead: 0,
14292
14016
  cacheWrite: 0,
14293
14017
  },
@@ -14305,7 +14029,7 @@ export const MODELS = {
14305
14029
  cost: {
14306
14030
  input: 0.25,
14307
14031
  output: 2,
14308
- cacheRead: 0.049999999999999996,
14032
+ cacheRead: 0.05,
14309
14033
  cacheWrite: 0,
14310
14034
  },
14311
14035
  contextWindow: 256000,
@@ -14490,8 +14214,8 @@ export const MODELS = {
14490
14214
  reasoning: true,
14491
14215
  input: ["text", "image"],
14492
14216
  cost: {
14493
- input: 0.09999999999999999,
14494
- output: 0.39999999999999997,
14217
+ input: 0.1,
14218
+ output: 0.4,
14495
14219
  cacheRead: 0.01,
14496
14220
  cacheWrite: 0,
14497
14221
  },
@@ -14526,7 +14250,7 @@ export const MODELS = {
14526
14250
  cost: {
14527
14251
  input: 0.5,
14528
14252
  output: 3,
14529
- cacheRead: 0.049999999999999996,
14253
+ cacheRead: 0.05,
14530
14254
  cacheWrite: 0,
14531
14255
  },
14532
14256
  contextWindow: 1000000,
@@ -14543,7 +14267,7 @@ export const MODELS = {
14543
14267
  cost: {
14544
14268
  input: 2,
14545
14269
  output: 12,
14546
- cacheRead: 0.19999999999999998,
14270
+ cacheRead: 0.2,
14547
14271
  cacheWrite: 0,
14548
14272
  },
14549
14273
  contextWindow: 1000000,
@@ -14594,7 +14318,7 @@ export const MODELS = {
14594
14318
  cost: {
14595
14319
  input: 2,
14596
14320
  output: 12,
14597
- cacheRead: 0.19999999999999998,
14321
+ cacheRead: 0.2,
14598
14322
  cacheWrite: 0,
14599
14323
  },
14600
14324
  contextWindow: 1000000,
@@ -14644,7 +14368,7 @@ export const MODELS = {
14644
14368
  input: ["text", "image"],
14645
14369
  cost: {
14646
14370
  input: 0.14,
14647
- output: 0.39999999999999997,
14371
+ output: 0.4,
14648
14372
  cacheRead: 0,
14649
14373
  cacheWrite: 0,
14650
14374
  },
@@ -14662,7 +14386,7 @@ export const MODELS = {
14662
14386
  cost: {
14663
14387
  input: 0.25,
14664
14388
  output: 0.75,
14665
- cacheRead: 0.024999999999999998,
14389
+ cacheRead: 0.025,
14666
14390
  cacheWrite: 0,
14667
14391
  },
14668
14392
  contextWindow: 128000,
@@ -14814,7 +14538,7 @@ export const MODELS = {
14814
14538
  input: ["text", "image"],
14815
14539
  cost: {
14816
14540
  input: 0.24,
14817
- output: 0.9700000000000001,
14541
+ output: 0.97,
14818
14542
  cacheRead: 0,
14819
14543
  cacheWrite: 0,
14820
14544
  },
@@ -14830,7 +14554,7 @@ export const MODELS = {
14830
14554
  reasoning: false,
14831
14555
  input: ["text", "image"],
14832
14556
  cost: {
14833
- input: 0.16999999999999998,
14557
+ input: 0.17,
14834
14558
  output: 0.66,
14835
14559
  cacheRead: 0,
14836
14560
  cacheWrite: 0,
@@ -14984,7 +14708,7 @@ export const MODELS = {
14984
14708
  input: ["text"],
14985
14709
  cost: {
14986
14710
  input: 0.3,
14987
- output: 0.8999999999999999,
14711
+ output: 0.9,
14988
14712
  cacheRead: 0,
14989
14713
  cacheWrite: 0,
14990
14714
  },
@@ -15000,7 +14724,7 @@ export const MODELS = {
15000
14724
  reasoning: false,
15001
14725
  input: ["text"],
15002
14726
  cost: {
15003
- input: 0.39999999999999997,
14727
+ input: 0.4,
15004
14728
  output: 2,
15005
14729
  cacheRead: 0,
15006
14730
  cacheWrite: 0,
@@ -15017,7 +14741,7 @@ export const MODELS = {
15017
14741
  reasoning: false,
15018
14742
  input: ["text"],
15019
14743
  cost: {
15020
- input: 0.09999999999999999,
14744
+ input: 0.1,
15021
14745
  output: 0.3,
15022
14746
  cacheRead: 0,
15023
14747
  cacheWrite: 0,
@@ -15034,7 +14758,7 @@ export const MODELS = {
15034
14758
  reasoning: false,
15035
14759
  input: ["text"],
15036
14760
  cost: {
15037
- input: 0.09999999999999999,
14761
+ input: 0.1,
15038
14762
  output: 0.3,
15039
14763
  cacheRead: 0,
15040
14764
  cacheWrite: 0,
@@ -15051,8 +14775,8 @@ export const MODELS = {
15051
14775
  reasoning: false,
15052
14776
  input: ["text"],
15053
14777
  cost: {
15054
- input: 0.09999999999999999,
15055
- output: 0.09999999999999999,
14778
+ input: 0.1,
14779
+ output: 0.1,
15056
14780
  cacheRead: 0,
15057
14781
  cacheWrite: 0,
15058
14782
  },
@@ -15085,7 +14809,7 @@ export const MODELS = {
15085
14809
  reasoning: false,
15086
14810
  input: ["text", "image"],
15087
14811
  cost: {
15088
- input: 0.39999999999999997,
14812
+ input: 0.4,
15089
14813
  output: 2,
15090
14814
  cacheRead: 0,
15091
14815
  cacheWrite: 0,
@@ -15136,7 +14860,7 @@ export const MODELS = {
15136
14860
  reasoning: false,
15137
14861
  input: ["text", "image"],
15138
14862
  cost: {
15139
- input: 0.09999999999999999,
14863
+ input: 0.1,
15140
14864
  output: 0.3,
15141
14865
  cacheRead: 0,
15142
14866
  cacheWrite: 0,
@@ -15187,7 +14911,7 @@ export const MODELS = {
15187
14911
  reasoning: false,
15188
14912
  input: ["text"],
15189
14913
  cost: {
15190
- input: 0.5700000000000001,
14914
+ input: 0.57,
15191
14915
  output: 2.3,
15192
14916
  cacheRead: 0,
15193
14917
  cacheWrite: 0,
@@ -15212,40 +14936,6 @@ export const MODELS = {
15212
14936
  contextWindow: 262114,
15213
14937
  maxTokens: 262114,
15214
14938
  },
15215
- "moonshotai/kimi-k2-thinking-turbo": {
15216
- id: "moonshotai/kimi-k2-thinking-turbo",
15217
- name: "Kimi K2 Thinking Turbo",
15218
- api: "anthropic-messages",
15219
- provider: "vercel-ai-gateway",
15220
- baseUrl: "https://ai-gateway.vercel.sh",
15221
- reasoning: true,
15222
- input: ["text"],
15223
- cost: {
15224
- input: 1.15,
15225
- output: 8,
15226
- cacheRead: 0.15,
15227
- cacheWrite: 0,
15228
- },
15229
- contextWindow: 262114,
15230
- maxTokens: 262114,
15231
- },
15232
- "moonshotai/kimi-k2-turbo": {
15233
- id: "moonshotai/kimi-k2-turbo",
15234
- name: "Kimi K2 Turbo",
15235
- api: "anthropic-messages",
15236
- provider: "vercel-ai-gateway",
15237
- baseUrl: "https://ai-gateway.vercel.sh",
15238
- reasoning: false,
15239
- input: ["text"],
15240
- cost: {
15241
- input: 1.15,
15242
- output: 8,
15243
- cacheRead: 0.15,
15244
- cacheWrite: 0,
15245
- },
15246
- contextWindow: 256000,
15247
- maxTokens: 16384,
15248
- },
15249
14939
  "moonshotai/kimi-k2.5": {
15250
14940
  id: "moonshotai/kimi-k2.5",
15251
14941
  name: "Kimi K2.5",
@@ -15257,7 +14947,7 @@ export const MODELS = {
15257
14947
  cost: {
15258
14948
  input: 0.6,
15259
14949
  output: 3,
15260
- cacheRead: 0.09999999999999999,
14950
+ cacheRead: 0.1,
15261
14951
  cacheWrite: 0,
15262
14952
  },
15263
14953
  contextWindow: 262114,
@@ -15280,6 +14970,23 @@ export const MODELS = {
15280
14970
  contextWindow: 262000,
15281
14971
  maxTokens: 262000,
15282
14972
  },
14973
+ "moonshotai/kimi-k2.7-code": {
14974
+ id: "moonshotai/kimi-k2.7-code",
14975
+ name: "Kimi K2.7 Code",
14976
+ api: "anthropic-messages",
14977
+ provider: "vercel-ai-gateway",
14978
+ baseUrl: "https://ai-gateway.vercel.sh",
14979
+ reasoning: true,
14980
+ input: ["text", "image"],
14981
+ cost: {
14982
+ input: 0.95,
14983
+ output: 4,
14984
+ cacheRead: 0.19,
14985
+ cacheWrite: 0,
14986
+ },
14987
+ contextWindow: 256000,
14988
+ maxTokens: 32768,
14989
+ },
15283
14990
  "nvidia/nemotron-3-super-120b-a12b": {
15284
14991
  id: "nvidia/nemotron-3-super-120b-a12b",
15285
14992
  name: "NVIDIA Nemotron 3 Super 120B A12B",
@@ -15323,7 +15030,7 @@ export const MODELS = {
15323
15030
  reasoning: true,
15324
15031
  input: ["text", "image"],
15325
15032
  cost: {
15326
- input: 0.19999999999999998,
15033
+ input: 0.2,
15327
15034
  output: 0.6,
15328
15035
  cacheRead: 0,
15329
15036
  cacheWrite: 0,
@@ -15341,7 +15048,7 @@ export const MODELS = {
15341
15048
  input: ["text"],
15342
15049
  cost: {
15343
15050
  input: 0.06,
15344
- output: 0.22999999999999998,
15051
+ output: 0.23,
15345
15052
  cacheRead: 0,
15346
15053
  cacheWrite: 0,
15347
15054
  },
@@ -15391,9 +15098,9 @@ export const MODELS = {
15391
15098
  reasoning: false,
15392
15099
  input: ["text", "image"],
15393
15100
  cost: {
15394
- input: 0.39999999999999997,
15395
- output: 1.5999999999999999,
15396
- cacheRead: 0.09999999999999999,
15101
+ input: 0.4,
15102
+ output: 1.6,
15103
+ cacheRead: 0.1,
15397
15104
  cacheWrite: 0,
15398
15105
  },
15399
15106
  contextWindow: 1047576,
@@ -15408,9 +15115,9 @@ export const MODELS = {
15408
15115
  reasoning: false,
15409
15116
  input: ["text", "image"],
15410
15117
  cost: {
15411
- input: 0.09999999999999999,
15412
- output: 0.39999999999999997,
15413
- cacheRead: 0.024999999999999998,
15118
+ input: 0.1,
15119
+ output: 0.4,
15120
+ cacheRead: 0.025,
15414
15121
  cacheWrite: 0,
15415
15122
  },
15416
15123
  contextWindow: 1047576,
@@ -15512,7 +15219,7 @@ export const MODELS = {
15512
15219
  cost: {
15513
15220
  input: 0.25,
15514
15221
  output: 2,
15515
- cacheRead: 0.024999999999999998,
15222
+ cacheRead: 0.025,
15516
15223
  cacheWrite: 0,
15517
15224
  },
15518
15225
  contextWindow: 400000,
@@ -15527,8 +15234,8 @@ export const MODELS = {
15527
15234
  reasoning: true,
15528
15235
  input: ["text", "image"],
15529
15236
  cost: {
15530
- input: 0.049999999999999996,
15531
- output: 0.39999999999999997,
15237
+ input: 0.05,
15238
+ output: 0.4,
15532
15239
  cacheRead: 0.005,
15533
15240
  cacheWrite: 0,
15534
15241
  },
@@ -15597,7 +15304,7 @@ export const MODELS = {
15597
15304
  cost: {
15598
15305
  input: 0.25,
15599
15306
  output: 2,
15600
- cacheRead: 0.024999999999999998,
15307
+ cacheRead: 0.025,
15601
15308
  cacheWrite: 0,
15602
15309
  },
15603
15310
  contextWindow: 400000,
@@ -15791,7 +15498,7 @@ export const MODELS = {
15791
15498
  thinkingLevelMap: { "xhigh": "xhigh" },
15792
15499
  input: ["text", "image"],
15793
15500
  cost: {
15794
- input: 0.19999999999999998,
15501
+ input: 0.2,
15795
15502
  output: 1.25,
15796
15503
  cacheRead: 0.02,
15797
15504
  cacheWrite: 0,
@@ -15879,8 +15586,8 @@ export const MODELS = {
15879
15586
  reasoning: true,
15880
15587
  input: ["text"],
15881
15588
  cost: {
15882
- input: 0.049999999999999996,
15883
- output: 0.19999999999999998,
15589
+ input: 0.05,
15590
+ output: 0.2,
15884
15591
  cacheRead: 0,
15885
15592
  cacheWrite: 0,
15886
15593
  },
@@ -16066,7 +15773,7 @@ export const MODELS = {
16066
15773
  reasoning: true,
16067
15774
  input: ["text", "image"],
16068
15775
  cost: {
16069
- input: 0.19999999999999998,
15776
+ input: 0.2,
16070
15777
  output: 1.15,
16071
15778
  cacheRead: 0.04,
16072
15779
  cacheWrite: 0,
@@ -16083,9 +15790,9 @@ export const MODELS = {
16083
15790
  reasoning: false,
16084
15791
  input: ["text", "image"],
16085
15792
  cost: {
16086
- input: 0.19999999999999998,
15793
+ input: 0.2,
16087
15794
  output: 0.5,
16088
- cacheRead: 0.049999999999999996,
15795
+ cacheRead: 0.05,
16089
15796
  cacheWrite: 0,
16090
15797
  },
16091
15798
  contextWindow: 1000000,
@@ -16100,9 +15807,9 @@ export const MODELS = {
16100
15807
  reasoning: true,
16101
15808
  input: ["text", "image"],
16102
15809
  cost: {
16103
- input: 0.19999999999999998,
15810
+ input: 0.2,
16104
15811
  output: 0.5,
16105
- cacheRead: 0.049999999999999996,
15812
+ cacheRead: 0.05,
16106
15813
  cacheWrite: 0,
16107
15814
  },
16108
15815
  contextWindow: 1000000,
@@ -16119,7 +15826,7 @@ export const MODELS = {
16119
15826
  cost: {
16120
15827
  input: 1.25,
16121
15828
  output: 2.5,
16122
- cacheRead: 0.19999999999999998,
15829
+ cacheRead: 0.2,
16123
15830
  cacheWrite: 0,
16124
15831
  },
16125
15832
  contextWindow: 2000000,
@@ -16136,7 +15843,7 @@ export const MODELS = {
16136
15843
  cost: {
16137
15844
  input: 1.25,
16138
15845
  output: 2.5,
16139
- cacheRead: 0.19999999999999998,
15846
+ cacheRead: 0.2,
16140
15847
  cacheWrite: 0,
16141
15848
  },
16142
15849
  contextWindow: 2000000,
@@ -16153,7 +15860,7 @@ export const MODELS = {
16153
15860
  cost: {
16154
15861
  input: 1.25,
16155
15862
  output: 2.5,
16156
- cacheRead: 0.19999999999999998,
15863
+ cacheRead: 0.2,
16157
15864
  cacheWrite: 0,
16158
15865
  },
16159
15866
  contextWindow: 2000000,
@@ -16170,7 +15877,7 @@ export const MODELS = {
16170
15877
  cost: {
16171
15878
  input: 1.25,
16172
15879
  output: 2.5,
16173
- cacheRead: 0.19999999999999998,
15880
+ cacheRead: 0.2,
16174
15881
  cacheWrite: 0,
16175
15882
  },
16176
15883
  contextWindow: 2000000,
@@ -16187,7 +15894,7 @@ export const MODELS = {
16187
15894
  cost: {
16188
15895
  input: 1.25,
16189
15896
  output: 2.5,
16190
- cacheRead: 0.19999999999999998,
15897
+ cacheRead: 0.2,
16191
15898
  cacheWrite: 0,
16192
15899
  },
16193
15900
  contextWindow: 2000000,
@@ -16204,7 +15911,7 @@ export const MODELS = {
16204
15911
  cost: {
16205
15912
  input: 1.25,
16206
15913
  output: 2.5,
16207
- cacheRead: 0.19999999999999998,
15914
+ cacheRead: 0.2,
16208
15915
  cacheWrite: 0,
16209
15916
  },
16210
15917
  contextWindow: 2000000,
@@ -16221,7 +15928,7 @@ export const MODELS = {
16221
15928
  cost: {
16222
15929
  input: 1.25,
16223
15930
  output: 2.5,
16224
- cacheRead: 0.19999999999999998,
15931
+ cacheRead: 0.2,
16225
15932
  cacheWrite: 0,
16226
15933
  },
16227
15934
  contextWindow: 1000000,
@@ -16238,7 +15945,7 @@ export const MODELS = {
16238
15945
  cost: {
16239
15946
  input: 1,
16240
15947
  output: 2,
16241
- cacheRead: 0.19999999999999998,
15948
+ cacheRead: 0.2,
16242
15949
  cacheWrite: 0,
16243
15950
  },
16244
15951
  contextWindow: 256000,
@@ -16253,7 +15960,7 @@ export const MODELS = {
16253
15960
  reasoning: true,
16254
15961
  input: ["text"],
16255
15962
  cost: {
16256
- input: 0.09999999999999999,
15963
+ input: 0.1,
16257
15964
  output: 0.3,
16258
15965
  cacheRead: 0.01,
16259
15966
  cacheWrite: 0,
@@ -16272,7 +15979,7 @@ export const MODELS = {
16272
15979
  cost: {
16273
15980
  input: 1,
16274
15981
  output: 3,
16275
- cacheRead: 0.19999999999999998,
15982
+ cacheRead: 0.2,
16276
15983
  cacheWrite: 0,
16277
15984
  },
16278
15985
  contextWindow: 1000000,
@@ -16338,7 +16045,7 @@ export const MODELS = {
16338
16045
  reasoning: true,
16339
16046
  input: ["text"],
16340
16047
  cost: {
16341
- input: 0.19999999999999998,
16048
+ input: 0.2,
16342
16049
  output: 1.1,
16343
16050
  cacheRead: 0.03,
16344
16051
  cacheWrite: 0,
@@ -16356,7 +16063,7 @@ export const MODELS = {
16356
16063
  input: ["text", "image"],
16357
16064
  cost: {
16358
16065
  input: 0.6,
16359
- output: 1.7999999999999998,
16066
+ output: 1.8,
16360
16067
  cacheRead: 0.11,
16361
16068
  cacheWrite: 0,
16362
16069
  },
@@ -16390,8 +16097,8 @@ export const MODELS = {
16390
16097
  input: ["text", "image"],
16391
16098
  cost: {
16392
16099
  input: 0.3,
16393
- output: 0.8999999999999999,
16394
- cacheRead: 0.049999999999999996,
16100
+ output: 0.9,
16101
+ cacheRead: 0.05,
16395
16102
  cacheWrite: 0,
16396
16103
  },
16397
16104
  contextWindow: 128000,
@@ -16441,7 +16148,7 @@ export const MODELS = {
16441
16148
  input: ["text"],
16442
16149
  cost: {
16443
16150
  input: 0.07,
16444
- output: 0.39999999999999997,
16151
+ output: 0.4,
16445
16152
  cacheRead: 0,
16446
16153
  cacheWrite: 0,
16447
16154
  },
@@ -16458,7 +16165,7 @@ export const MODELS = {
16458
16165
  input: ["text"],
16459
16166
  cost: {
16460
16167
  input: 0.06,
16461
- output: 0.39999999999999997,
16168
+ output: 0.4,
16462
16169
  cacheRead: 0.01,
16463
16170
  cacheWrite: 0,
16464
16171
  },
@@ -16475,8 +16182,8 @@ export const MODELS = {
16475
16182
  input: ["text"],
16476
16183
  cost: {
16477
16184
  input: 1,
16478
- output: 3.1999999999999997,
16479
- cacheRead: 0.19999999999999998,
16185
+ output: 3.2,
16186
+ cacheRead: 0.2,
16480
16187
  cacheWrite: 0,
16481
16188
  },
16482
16189
  contextWindow: 202800,
@@ -16746,6 +16453,24 @@ export const MODELS = {
16746
16453
  contextWindow: 1048576,
16747
16454
  maxTokens: 131072,
16748
16455
  },
16456
+ "mimo-v2.5-pro-ultraspeed": {
16457
+ id: "mimo-v2.5-pro-ultraspeed",
16458
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16459
+ api: "openai-completions",
16460
+ provider: "xiaomi",
16461
+ baseUrl: "https://api.xiaomimimo.com/v1",
16462
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16463
+ reasoning: true,
16464
+ input: ["text"],
16465
+ cost: {
16466
+ input: 1.305,
16467
+ output: 2.61,
16468
+ cacheRead: 0.0108,
16469
+ cacheWrite: 0,
16470
+ },
16471
+ contextWindow: 1048576,
16472
+ maxTokens: 131072,
16473
+ },
16749
16474
  },
16750
16475
  "xiaomi-token-plan-ams": {
16751
16476
  "mimo-v2-omni": {
@@ -16820,6 +16545,24 @@ export const MODELS = {
16820
16545
  contextWindow: 1048576,
16821
16546
  maxTokens: 131072,
16822
16547
  },
16548
+ "mimo-v2.5-pro-ultraspeed": {
16549
+ id: "mimo-v2.5-pro-ultraspeed",
16550
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16551
+ api: "openai-completions",
16552
+ provider: "xiaomi-token-plan-ams",
16553
+ baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
16554
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16555
+ reasoning: true,
16556
+ input: ["text"],
16557
+ cost: {
16558
+ input: 1.305,
16559
+ output: 2.61,
16560
+ cacheRead: 0.0108,
16561
+ cacheWrite: 0,
16562
+ },
16563
+ contextWindow: 1048576,
16564
+ maxTokens: 131072,
16565
+ },
16823
16566
  },
16824
16567
  "xiaomi-token-plan-cn": {
16825
16568
  "mimo-v2-omni": {
@@ -16894,6 +16637,24 @@ export const MODELS = {
16894
16637
  contextWindow: 1048576,
16895
16638
  maxTokens: 131072,
16896
16639
  },
16640
+ "mimo-v2.5-pro-ultraspeed": {
16641
+ id: "mimo-v2.5-pro-ultraspeed",
16642
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16643
+ api: "openai-completions",
16644
+ provider: "xiaomi-token-plan-cn",
16645
+ baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
16646
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16647
+ reasoning: true,
16648
+ input: ["text"],
16649
+ cost: {
16650
+ input: 1.305,
16651
+ output: 2.61,
16652
+ cacheRead: 0.0108,
16653
+ cacheWrite: 0,
16654
+ },
16655
+ contextWindow: 1048576,
16656
+ maxTokens: 131072,
16657
+ },
16897
16658
  },
16898
16659
  "xiaomi-token-plan-sgp": {
16899
16660
  "mimo-v2-omni": {
@@ -16968,6 +16729,24 @@ export const MODELS = {
16968
16729
  contextWindow: 1048576,
16969
16730
  maxTokens: 131072,
16970
16731
  },
16732
+ "mimo-v2.5-pro-ultraspeed": {
16733
+ id: "mimo-v2.5-pro-ultraspeed",
16734
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16735
+ api: "openai-completions",
16736
+ provider: "xiaomi-token-plan-sgp",
16737
+ baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
16738
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16739
+ reasoning: true,
16740
+ input: ["text"],
16741
+ cost: {
16742
+ input: 1.305,
16743
+ output: 2.61,
16744
+ cacheRead: 0.0108,
16745
+ cacheWrite: 0,
16746
+ },
16747
+ contextWindow: 1048576,
16748
+ maxTokens: 131072,
16749
+ },
16971
16750
  },
16972
16751
  "zai": {
16973
16752
  "glm-4.5-air": {