@earendil-works/pi-ai 0.79.1 → 0.79.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -354,7 +354,7 @@ export const MODELS = {
354
354
  provider: "amazon-bedrock",
355
355
  baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
356
356
  reasoning: true,
357
- thinkingLevelMap: { "xhigh": "xhigh" },
357
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
358
358
  input: ["text", "image"],
359
359
  cost: {
360
360
  input: 11,
@@ -494,7 +494,7 @@ export const MODELS = {
494
494
  provider: "amazon-bedrock",
495
495
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
496
496
  reasoning: true,
497
- thinkingLevelMap: { "xhigh": "xhigh" },
497
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
498
498
  input: ["text", "image"],
499
499
  cost: {
500
500
  input: 10,
@@ -1386,7 +1386,7 @@ export const MODELS = {
1386
1386
  provider: "amazon-bedrock",
1387
1387
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1388
1388
  reasoning: true,
1389
- thinkingLevelMap: { "xhigh": "xhigh" },
1389
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
1390
1390
  input: ["text", "image"],
1391
1391
  cost: {
1392
1392
  input: 10,
@@ -1875,7 +1875,7 @@ export const MODELS = {
1875
1875
  baseUrl: "https://api.anthropic.com",
1876
1876
  compat: { "forceAdaptiveThinking": true },
1877
1877
  reasoning: true,
1878
- thinkingLevelMap: { "xhigh": "xhigh" },
1878
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
1879
1879
  input: ["text", "image"],
1880
1880
  cost: {
1881
1881
  input: 10,
@@ -2916,30 +2916,13 @@ export const MODELS = {
2916
2916
  reasoning: true,
2917
2917
  input: ["text"],
2918
2918
  cost: {
2919
- input: 0.25,
2920
- output: 0.69,
2919
+ input: 0.35,
2920
+ output: 0.75,
2921
2921
  cacheRead: 0,
2922
2922
  cacheWrite: 0,
2923
2923
  },
2924
2924
  contextWindow: 131072,
2925
- maxTokens: 32768,
2926
- },
2927
- "llama3.1-8b": {
2928
- id: "llama3.1-8b",
2929
- name: "Llama 3.1 8B",
2930
- api: "openai-completions",
2931
- provider: "cerebras",
2932
- baseUrl: "https://api.cerebras.ai/v1",
2933
- reasoning: false,
2934
- input: ["text"],
2935
- cost: {
2936
- input: 0.1,
2937
- output: 0.1,
2938
- cacheRead: 0,
2939
- cacheWrite: 0,
2940
- },
2941
- contextWindow: 32000,
2942
- maxTokens: 8000,
2925
+ maxTokens: 40960,
2943
2926
  },
2944
2927
  "zai-glm-4.7": {
2945
2928
  id: "zai-glm-4.7",
@@ -2947,7 +2930,7 @@ export const MODELS = {
2947
2930
  api: "openai-completions",
2948
2931
  provider: "cerebras",
2949
2932
  baseUrl: "https://api.cerebras.ai/v1",
2950
- reasoning: false,
2933
+ reasoning: true,
2951
2934
  input: ["text"],
2952
2935
  cost: {
2953
2936
  input: 2.25,
@@ -2956,7 +2939,7 @@ export const MODELS = {
2956
2939
  cacheWrite: 0,
2957
2940
  },
2958
2941
  contextWindow: 131072,
2959
- maxTokens: 40000,
2942
+ maxTokens: 40960,
2960
2943
  },
2961
2944
  },
2962
2945
  "cloudflare-ai-gateway": {
@@ -3070,7 +3053,7 @@ export const MODELS = {
3070
3053
  baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3071
3054
  compat: { "forceAdaptiveThinking": true },
3072
3055
  reasoning: true,
3073
- thinkingLevelMap: { "xhigh": "xhigh" },
3056
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
3074
3057
  input: ["text", "image"],
3075
3058
  cost: {
3076
3059
  input: 10,
@@ -3719,6 +3702,24 @@ export const MODELS = {
3719
3702
  contextWindow: 262144,
3720
3703
  maxTokens: 256000,
3721
3704
  },
3705
+ "@cf/moonshotai/kimi-k2.7-code": {
3706
+ id: "@cf/moonshotai/kimi-k2.7-code",
3707
+ name: "Kimi K2.7 Code",
3708
+ api: "openai-completions",
3709
+ provider: "cloudflare-workers-ai",
3710
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3711
+ compat: { "sendSessionAffinityHeaders": true },
3712
+ reasoning: true,
3713
+ input: ["text", "image"],
3714
+ cost: {
3715
+ input: 0.95,
3716
+ output: 4,
3717
+ cacheRead: 0.19,
3718
+ cacheWrite: 0,
3719
+ },
3720
+ contextWindow: 262144,
3721
+ maxTokens: 262144,
3722
+ },
3722
3723
  "@cf/nvidia/nemotron-3-120b-a12b": {
3723
3724
  id: "@cf/nvidia/nemotron-3-120b-a12b",
3724
3725
  name: "Nemotron 3 Super 120B",
@@ -3941,9 +3942,9 @@ export const MODELS = {
3941
3942
  contextWindow: 131072,
3942
3943
  maxTokens: 32768,
3943
3944
  },
3944
- "accounts/fireworks/models/kimi-k2p5": {
3945
- id: "accounts/fireworks/models/kimi-k2p5",
3946
- name: "Kimi K2.5",
3945
+ "accounts/fireworks/models/kimi-k2p6": {
3946
+ id: "accounts/fireworks/models/kimi-k2p6",
3947
+ name: "Kimi K2.6",
3947
3948
  api: "anthropic-messages",
3948
3949
  provider: "fireworks",
3949
3950
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3951,17 +3952,17 @@ export const MODELS = {
3951
3952
  reasoning: true,
3952
3953
  input: ["text", "image"],
3953
3954
  cost: {
3954
- input: 0.6,
3955
- output: 3,
3956
- cacheRead: 0.1,
3955
+ input: 0.95,
3956
+ output: 4,
3957
+ cacheRead: 0.16,
3957
3958
  cacheWrite: 0,
3958
3959
  },
3959
- contextWindow: 256000,
3960
- maxTokens: 256000,
3960
+ contextWindow: 262000,
3961
+ maxTokens: 262000,
3961
3962
  },
3962
- "accounts/fireworks/models/kimi-k2p6": {
3963
- id: "accounts/fireworks/models/kimi-k2p6",
3964
- name: "Kimi K2.6",
3963
+ "accounts/fireworks/models/kimi-k2p7-code": {
3964
+ id: "accounts/fireworks/models/kimi-k2p7-code",
3965
+ name: "Kimi K2.7 Code",
3965
3966
  api: "anthropic-messages",
3966
3967
  provider: "fireworks",
3967
3968
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3971,15 +3972,15 @@ export const MODELS = {
3971
3972
  cost: {
3972
3973
  input: 0.95,
3973
3974
  output: 4,
3974
- cacheRead: 0.16,
3975
+ cacheRead: 0.19,
3975
3976
  cacheWrite: 0,
3976
3977
  },
3977
3978
  contextWindow: 262000,
3978
3979
  maxTokens: 262000,
3979
3980
  },
3980
- "accounts/fireworks/models/minimax-m2p5": {
3981
- id: "accounts/fireworks/models/minimax-m2p5",
3982
- name: "MiniMax-M2.5",
3981
+ "accounts/fireworks/models/minimax-m2p7": {
3982
+ id: "accounts/fireworks/models/minimax-m2p7",
3983
+ name: "MiniMax-M2.7",
3983
3984
  api: "anthropic-messages",
3984
3985
  provider: "fireworks",
3985
3986
  baseUrl: "https://api.fireworks.ai/inference",
@@ -3989,15 +3990,15 @@ export const MODELS = {
3989
3990
  cost: {
3990
3991
  input: 0.3,
3991
3992
  output: 1.2,
3992
- cacheRead: 0.03,
3993
+ cacheRead: 0.06,
3993
3994
  cacheWrite: 0,
3994
3995
  },
3995
3996
  contextWindow: 196608,
3996
3997
  maxTokens: 196608,
3997
3998
  },
3998
- "accounts/fireworks/models/minimax-m2p7": {
3999
- id: "accounts/fireworks/models/minimax-m2p7",
4000
- name: "MiniMax-M2.7",
3999
+ "accounts/fireworks/models/minimax-m3": {
4000
+ id: "accounts/fireworks/models/minimax-m3",
4001
+ name: "MiniMax-M3",
4001
4002
  api: "anthropic-messages",
4002
4003
  provider: "fireworks",
4003
4004
  baseUrl: "https://api.fireworks.ai/inference",
@@ -4010,12 +4011,12 @@ export const MODELS = {
4010
4011
  cacheRead: 0.06,
4011
4012
  cacheWrite: 0,
4012
4013
  },
4013
- contextWindow: 196608,
4014
- maxTokens: 196608,
4014
+ contextWindow: 512000,
4015
+ maxTokens: 512000,
4015
4016
  },
4016
- "accounts/fireworks/models/qwen3p6-plus": {
4017
- id: "accounts/fireworks/models/qwen3p6-plus",
4018
- name: "Qwen 3.6 Plus",
4017
+ "accounts/fireworks/models/qwen3p7-plus": {
4018
+ id: "accounts/fireworks/models/qwen3p7-plus",
4019
+ name: "Qwen 3.7 Plus",
4019
4020
  api: "anthropic-messages",
4020
4021
  provider: "fireworks",
4021
4022
  baseUrl: "https://api.fireworks.ai/inference",
@@ -4023,9 +4024,9 @@ export const MODELS = {
4023
4024
  reasoning: true,
4024
4025
  input: ["text", "image"],
4025
4026
  cost: {
4026
- input: 0.5,
4027
- output: 3,
4028
- cacheRead: 0.1,
4027
+ input: 0.4,
4028
+ output: 1.6,
4029
+ cacheRead: 0.08,
4029
4030
  cacheWrite: 0,
4030
4031
  },
4031
4032
  contextWindow: 262144,
@@ -4085,8 +4086,45 @@ export const MODELS = {
4085
4086
  contextWindow: 262000,
4086
4087
  maxTokens: 262000,
4087
4088
  },
4089
+ "accounts/fireworks/routers/kimi-k2p7-code-fast": {
4090
+ id: "accounts/fireworks/routers/kimi-k2p7-code-fast",
4091
+ name: "Kimi K2.7 Code Fast",
4092
+ api: "anthropic-messages",
4093
+ provider: "fireworks",
4094
+ baseUrl: "https://api.fireworks.ai/inference",
4095
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
4096
+ reasoning: true,
4097
+ input: ["text", "image"],
4098
+ cost: {
4099
+ input: 2,
4100
+ output: 8,
4101
+ cacheRead: 0.38,
4102
+ cacheWrite: 0,
4103
+ },
4104
+ contextWindow: 262000,
4105
+ maxTokens: 262000,
4106
+ },
4088
4107
  },
4089
4108
  "github-copilot": {
4109
+ "claude-fable-5": {
4110
+ id: "claude-fable-5",
4111
+ name: "Claude Fable 5",
4112
+ api: "openai-completions",
4113
+ provider: "github-copilot",
4114
+ baseUrl: "https://api.individual.githubcopilot.com",
4115
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4116
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4117
+ reasoning: true,
4118
+ input: ["text", "image"],
4119
+ cost: {
4120
+ input: 10,
4121
+ output: 50,
4122
+ cacheRead: 1,
4123
+ cacheWrite: 12.5,
4124
+ },
4125
+ contextWindow: 1000000,
4126
+ maxTokens: 128000,
4127
+ },
4090
4128
  "claude-haiku-4.5": {
4091
4129
  id: "claude-haiku-4.5",
4092
4130
  name: "Claude Haiku 4.5 (latest)",
@@ -5019,354 +5057,167 @@ export const MODELS = {
5019
5057
  },
5020
5058
  },
5021
5059
  "groq": {
5022
- "deepseek-r1-distill-llama-70b": {
5023
- id: "deepseek-r1-distill-llama-70b",
5024
- name: "DeepSeek R1 Distill Llama 70B",
5060
+ "llama-3.1-8b-instant": {
5061
+ id: "llama-3.1-8b-instant",
5062
+ name: "Llama 3.1 8B",
5025
5063
  api: "openai-completions",
5026
5064
  provider: "groq",
5027
5065
  baseUrl: "https://api.groq.com/openai/v1",
5028
- reasoning: true,
5066
+ reasoning: false,
5029
5067
  input: ["text"],
5030
5068
  cost: {
5031
- input: 0.75,
5032
- output: 0.99,
5069
+ input: 0.05,
5070
+ output: 0.08,
5033
5071
  cacheRead: 0,
5034
5072
  cacheWrite: 0,
5035
5073
  },
5036
5074
  contextWindow: 131072,
5037
- maxTokens: 8192,
5075
+ maxTokens: 131072,
5038
5076
  },
5039
- "gemma2-9b-it": {
5040
- id: "gemma2-9b-it",
5041
- name: "Gemma 2 9B",
5077
+ "llama-3.3-70b-versatile": {
5078
+ id: "llama-3.3-70b-versatile",
5079
+ name: "Llama 3.3 70B",
5042
5080
  api: "openai-completions",
5043
5081
  provider: "groq",
5044
5082
  baseUrl: "https://api.groq.com/openai/v1",
5045
5083
  reasoning: false,
5046
5084
  input: ["text"],
5047
5085
  cost: {
5048
- input: 0.2,
5049
- output: 0.2,
5086
+ input: 0.59,
5087
+ output: 0.79,
5050
5088
  cacheRead: 0,
5051
5089
  cacheWrite: 0,
5052
5090
  },
5053
- contextWindow: 8192,
5054
- maxTokens: 8192,
5091
+ contextWindow: 131072,
5092
+ maxTokens: 32768,
5055
5093
  },
5056
- "groq/compound": {
5057
- id: "groq/compound",
5058
- name: "Compound",
5094
+ "meta-llama/llama-4-scout-17b-16e-instruct": {
5095
+ id: "meta-llama/llama-4-scout-17b-16e-instruct",
5096
+ name: "Llama 4 Scout 17B 16E",
5059
5097
  api: "openai-completions",
5060
5098
  provider: "groq",
5061
5099
  baseUrl: "https://api.groq.com/openai/v1",
5062
- reasoning: true,
5063
- input: ["text"],
5100
+ reasoning: false,
5101
+ input: ["text", "image"],
5064
5102
  cost: {
5065
- input: 0,
5066
- output: 0,
5103
+ input: 0.11,
5104
+ output: 0.34,
5067
5105
  cacheRead: 0,
5068
5106
  cacheWrite: 0,
5069
5107
  },
5070
5108
  contextWindow: 131072,
5071
5109
  maxTokens: 8192,
5072
5110
  },
5073
- "groq/compound-mini": {
5074
- id: "groq/compound-mini",
5075
- name: "Compound Mini",
5111
+ "openai/gpt-oss-120b": {
5112
+ id: "openai/gpt-oss-120b",
5113
+ name: "GPT OSS 120B",
5076
5114
  api: "openai-completions",
5077
5115
  provider: "groq",
5078
5116
  baseUrl: "https://api.groq.com/openai/v1",
5079
5117
  reasoning: true,
5080
5118
  input: ["text"],
5081
5119
  cost: {
5082
- input: 0,
5083
- output: 0,
5084
- cacheRead: 0,
5120
+ input: 0.15,
5121
+ output: 0.6,
5122
+ cacheRead: 0.075,
5085
5123
  cacheWrite: 0,
5086
5124
  },
5087
5125
  contextWindow: 131072,
5088
- maxTokens: 8192,
5126
+ maxTokens: 65536,
5089
5127
  },
5090
- "llama-3.1-8b-instant": {
5091
- id: "llama-3.1-8b-instant",
5092
- name: "Llama 3.1 8B Instant",
5128
+ "openai/gpt-oss-20b": {
5129
+ id: "openai/gpt-oss-20b",
5130
+ name: "GPT OSS 20B",
5093
5131
  api: "openai-completions",
5094
5132
  provider: "groq",
5095
5133
  baseUrl: "https://api.groq.com/openai/v1",
5096
- reasoning: false,
5134
+ reasoning: true,
5097
5135
  input: ["text"],
5098
5136
  cost: {
5099
- input: 0.05,
5100
- output: 0.08,
5101
- cacheRead: 0,
5137
+ input: 0.075,
5138
+ output: 0.3,
5139
+ cacheRead: 0.0375,
5102
5140
  cacheWrite: 0,
5103
5141
  },
5104
5142
  contextWindow: 131072,
5105
- maxTokens: 131072,
5143
+ maxTokens: 65536,
5106
5144
  },
5107
- "llama-3.3-70b-versatile": {
5108
- id: "llama-3.3-70b-versatile",
5109
- name: "Llama 3.3 70B Versatile",
5145
+ "openai/gpt-oss-safeguard-20b": {
5146
+ id: "openai/gpt-oss-safeguard-20b",
5147
+ name: "Safety GPT OSS 20B",
5110
5148
  api: "openai-completions",
5111
5149
  provider: "groq",
5112
5150
  baseUrl: "https://api.groq.com/openai/v1",
5113
- reasoning: false,
5151
+ reasoning: true,
5114
5152
  input: ["text"],
5115
5153
  cost: {
5116
- input: 0.59,
5117
- output: 0.79,
5118
- cacheRead: 0,
5154
+ input: 0.075,
5155
+ output: 0.3,
5156
+ cacheRead: 0.037,
5119
5157
  cacheWrite: 0,
5120
5158
  },
5121
5159
  contextWindow: 131072,
5122
- maxTokens: 32768,
5160
+ maxTokens: 65536,
5123
5161
  },
5124
- "llama3-70b-8192": {
5125
- id: "llama3-70b-8192",
5126
- name: "Llama 3 70B",
5162
+ "qwen/qwen3-32b": {
5163
+ id: "qwen/qwen3-32b",
5164
+ name: "Qwen3-32B",
5127
5165
  api: "openai-completions",
5128
5166
  provider: "groq",
5129
5167
  baseUrl: "https://api.groq.com/openai/v1",
5130
- reasoning: false,
5168
+ reasoning: true,
5169
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "default" },
5131
5170
  input: ["text"],
5132
5171
  cost: {
5133
- input: 0.59,
5134
- output: 0.79,
5172
+ input: 0.29,
5173
+ output: 0.59,
5135
5174
  cacheRead: 0,
5136
5175
  cacheWrite: 0,
5137
5176
  },
5138
- contextWindow: 8192,
5139
- maxTokens: 8192,
5177
+ contextWindow: 131072,
5178
+ maxTokens: 40960,
5140
5179
  },
5141
- "llama3-8b-8192": {
5142
- id: "llama3-8b-8192",
5143
- name: "Llama 3 8B",
5180
+ },
5181
+ "huggingface": {
5182
+ "MiniMaxAI/MiniMax-M2.1": {
5183
+ id: "MiniMaxAI/MiniMax-M2.1",
5184
+ name: "MiniMax-M2.1",
5144
5185
  api: "openai-completions",
5145
- provider: "groq",
5146
- baseUrl: "https://api.groq.com/openai/v1",
5147
- reasoning: false,
5186
+ provider: "huggingface",
5187
+ baseUrl: "https://router.huggingface.co/v1",
5188
+ compat: { "supportsDeveloperRole": false },
5189
+ reasoning: true,
5148
5190
  input: ["text"],
5149
5191
  cost: {
5150
- input: 0.05,
5151
- output: 0.08,
5192
+ input: 0.3,
5193
+ output: 1.2,
5152
5194
  cacheRead: 0,
5153
5195
  cacheWrite: 0,
5154
5196
  },
5155
- contextWindow: 8192,
5156
- maxTokens: 8192,
5197
+ contextWindow: 204800,
5198
+ maxTokens: 131072,
5157
5199
  },
5158
- "meta-llama/llama-4-maverick-17b-128e-instruct": {
5159
- id: "meta-llama/llama-4-maverick-17b-128e-instruct",
5160
- name: "Llama 4 Maverick 17B",
5200
+ "MiniMaxAI/MiniMax-M2.5": {
5201
+ id: "MiniMaxAI/MiniMax-M2.5",
5202
+ name: "MiniMax-M2.5",
5161
5203
  api: "openai-completions",
5162
- provider: "groq",
5163
- baseUrl: "https://api.groq.com/openai/v1",
5164
- reasoning: false,
5165
- input: ["text", "image"],
5204
+ provider: "huggingface",
5205
+ baseUrl: "https://router.huggingface.co/v1",
5206
+ compat: { "supportsDeveloperRole": false },
5207
+ reasoning: true,
5208
+ input: ["text"],
5166
5209
  cost: {
5167
- input: 0.2,
5168
- output: 0.6,
5169
- cacheRead: 0,
5210
+ input: 0.3,
5211
+ output: 1.2,
5212
+ cacheRead: 0.03,
5170
5213
  cacheWrite: 0,
5171
5214
  },
5172
- contextWindow: 131072,
5173
- maxTokens: 8192,
5215
+ contextWindow: 204800,
5216
+ maxTokens: 131072,
5174
5217
  },
5175
- "meta-llama/llama-4-scout-17b-16e-instruct": {
5176
- id: "meta-llama/llama-4-scout-17b-16e-instruct",
5177
- name: "Llama 4 Scout 17B",
5178
- api: "openai-completions",
5179
- provider: "groq",
5180
- baseUrl: "https://api.groq.com/openai/v1",
5181
- reasoning: false,
5182
- input: ["text", "image"],
5183
- cost: {
5184
- input: 0.11,
5185
- output: 0.34,
5186
- cacheRead: 0,
5187
- cacheWrite: 0,
5188
- },
5189
- contextWindow: 131072,
5190
- maxTokens: 8192,
5191
- },
5192
- "mistral-saba-24b": {
5193
- id: "mistral-saba-24b",
5194
- name: "Mistral Saba 24B",
5195
- api: "openai-completions",
5196
- provider: "groq",
5197
- baseUrl: "https://api.groq.com/openai/v1",
5198
- reasoning: false,
5199
- input: ["text"],
5200
- cost: {
5201
- input: 0.79,
5202
- output: 0.79,
5203
- cacheRead: 0,
5204
- cacheWrite: 0,
5205
- },
5206
- contextWindow: 32768,
5207
- maxTokens: 32768,
5208
- },
5209
- "moonshotai/kimi-k2-instruct": {
5210
- id: "moonshotai/kimi-k2-instruct",
5211
- name: "Kimi K2 Instruct",
5212
- api: "openai-completions",
5213
- provider: "groq",
5214
- baseUrl: "https://api.groq.com/openai/v1",
5215
- reasoning: false,
5216
- input: ["text"],
5217
- cost: {
5218
- input: 1,
5219
- output: 3,
5220
- cacheRead: 0,
5221
- cacheWrite: 0,
5222
- },
5223
- contextWindow: 131072,
5224
- maxTokens: 16384,
5225
- },
5226
- "moonshotai/kimi-k2-instruct-0905": {
5227
- id: "moonshotai/kimi-k2-instruct-0905",
5228
- name: "Kimi K2 Instruct 0905",
5229
- api: "openai-completions",
5230
- provider: "groq",
5231
- baseUrl: "https://api.groq.com/openai/v1",
5232
- reasoning: false,
5233
- input: ["text"],
5234
- cost: {
5235
- input: 1,
5236
- output: 3,
5237
- cacheRead: 0.5,
5238
- cacheWrite: 0,
5239
- },
5240
- contextWindow: 262144,
5241
- maxTokens: 16384,
5242
- },
5243
- "openai/gpt-oss-120b": {
5244
- id: "openai/gpt-oss-120b",
5245
- name: "GPT OSS 120B",
5246
- api: "openai-completions",
5247
- provider: "groq",
5248
- baseUrl: "https://api.groq.com/openai/v1",
5249
- reasoning: true,
5250
- input: ["text"],
5251
- cost: {
5252
- input: 0.15,
5253
- output: 0.6,
5254
- cacheRead: 0.075,
5255
- cacheWrite: 0,
5256
- },
5257
- contextWindow: 131072,
5258
- maxTokens: 65536,
5259
- },
5260
- "openai/gpt-oss-20b": {
5261
- id: "openai/gpt-oss-20b",
5262
- name: "GPT OSS 20B",
5263
- api: "openai-completions",
5264
- provider: "groq",
5265
- baseUrl: "https://api.groq.com/openai/v1",
5266
- reasoning: true,
5267
- input: ["text"],
5268
- cost: {
5269
- input: 0.075,
5270
- output: 0.3,
5271
- cacheRead: 0.0375,
5272
- cacheWrite: 0,
5273
- },
5274
- contextWindow: 131072,
5275
- maxTokens: 65536,
5276
- },
5277
- "openai/gpt-oss-safeguard-20b": {
5278
- id: "openai/gpt-oss-safeguard-20b",
5279
- name: "Safety GPT OSS 20B",
5280
- api: "openai-completions",
5281
- provider: "groq",
5282
- baseUrl: "https://api.groq.com/openai/v1",
5283
- reasoning: true,
5284
- input: ["text"],
5285
- cost: {
5286
- input: 0.075,
5287
- output: 0.3,
5288
- cacheRead: 0.037,
5289
- cacheWrite: 0,
5290
- },
5291
- contextWindow: 131072,
5292
- maxTokens: 65536,
5293
- },
5294
- "qwen-qwq-32b": {
5295
- id: "qwen-qwq-32b",
5296
- name: "Qwen QwQ 32B",
5297
- api: "openai-completions",
5298
- provider: "groq",
5299
- baseUrl: "https://api.groq.com/openai/v1",
5300
- reasoning: true,
5301
- input: ["text"],
5302
- cost: {
5303
- input: 0.29,
5304
- output: 0.39,
5305
- cacheRead: 0,
5306
- cacheWrite: 0,
5307
- },
5308
- contextWindow: 131072,
5309
- maxTokens: 16384,
5310
- },
5311
- "qwen/qwen3-32b": {
5312
- id: "qwen/qwen3-32b",
5313
- name: "Qwen3 32B",
5314
- api: "openai-completions",
5315
- provider: "groq",
5316
- baseUrl: "https://api.groq.com/openai/v1",
5317
- reasoning: true,
5318
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "default" },
5319
- input: ["text"],
5320
- cost: {
5321
- input: 0.29,
5322
- output: 0.59,
5323
- cacheRead: 0,
5324
- cacheWrite: 0,
5325
- },
5326
- contextWindow: 131072,
5327
- maxTokens: 40960,
5328
- },
5329
- },
5330
- "huggingface": {
5331
- "MiniMaxAI/MiniMax-M2.1": {
5332
- id: "MiniMaxAI/MiniMax-M2.1",
5333
- name: "MiniMax-M2.1",
5334
- api: "openai-completions",
5335
- provider: "huggingface",
5336
- baseUrl: "https://router.huggingface.co/v1",
5337
- compat: { "supportsDeveloperRole": false },
5338
- reasoning: true,
5339
- input: ["text"],
5340
- cost: {
5341
- input: 0.3,
5342
- output: 1.2,
5343
- cacheRead: 0,
5344
- cacheWrite: 0,
5345
- },
5346
- contextWindow: 204800,
5347
- maxTokens: 131072,
5348
- },
5349
- "MiniMaxAI/MiniMax-M2.5": {
5350
- id: "MiniMaxAI/MiniMax-M2.5",
5351
- name: "MiniMax-M2.5",
5352
- api: "openai-completions",
5353
- provider: "huggingface",
5354
- baseUrl: "https://router.huggingface.co/v1",
5355
- compat: { "supportsDeveloperRole": false },
5356
- reasoning: true,
5357
- input: ["text"],
5358
- cost: {
5359
- input: 0.3,
5360
- output: 1.2,
5361
- cacheRead: 0.03,
5362
- cacheWrite: 0,
5363
- },
5364
- contextWindow: 204800,
5365
- maxTokens: 131072,
5366
- },
5367
- "MiniMaxAI/MiniMax-M2.7": {
5368
- id: "MiniMaxAI/MiniMax-M2.7",
5369
- name: "MiniMax-M2.7",
5218
+ "MiniMaxAI/MiniMax-M2.7": {
5219
+ id: "MiniMaxAI/MiniMax-M2.7",
5220
+ name: "MiniMax-M2.7",
5370
5221
  api: "openai-completions",
5371
5222
  provider: "huggingface",
5372
5223
  baseUrl: "https://router.huggingface.co/v1",
@@ -5726,6 +5577,24 @@ export const MODELS = {
5726
5577
  },
5727
5578
  },
5728
5579
  "kimi-coding": {
5580
+ "k2p7": {
5581
+ id: "k2p7",
5582
+ name: "Kimi K2.7 Code",
5583
+ api: "anthropic-messages",
5584
+ provider: "kimi-coding",
5585
+ baseUrl: "https://api.kimi.com/coding",
5586
+ headers: { "User-Agent": "KimiCLI/1.5" },
5587
+ reasoning: true,
5588
+ input: ["text", "image"],
5589
+ cost: {
5590
+ input: 0,
5591
+ output: 0,
5592
+ cacheRead: 0,
5593
+ cacheWrite: 0,
5594
+ },
5595
+ contextWindow: 262144,
5596
+ maxTokens: 32768,
5597
+ },
5729
5598
  "kimi-for-coding": {
5730
5599
  id: "kimi-for-coding",
5731
5600
  name: "Kimi For Coding",
@@ -6508,6 +6377,24 @@ export const MODELS = {
6508
6377
  contextWindow: 262144,
6509
6378
  maxTokens: 262144,
6510
6379
  },
6380
+ "kimi-k2.7-code": {
6381
+ id: "kimi-k2.7-code",
6382
+ name: "Kimi K2.7 Code",
6383
+ api: "openai-completions",
6384
+ provider: "moonshotai",
6385
+ baseUrl: "https://api.moonshot.ai/v1",
6386
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6387
+ reasoning: true,
6388
+ input: ["text", "image"],
6389
+ cost: {
6390
+ input: 0.95,
6391
+ output: 4,
6392
+ cacheRead: 0.19,
6393
+ cacheWrite: 0,
6394
+ },
6395
+ contextWindow: 262144,
6396
+ maxTokens: 262144,
6397
+ },
6511
6398
  },
6512
6399
  "moonshotai-cn": {
6513
6400
  "kimi-k2-0711-preview": {
@@ -6760,8 +6647,8 @@ export const MODELS = {
6760
6647
  baseUrl: "https://integrate.api.nvidia.com/v1",
6761
6648
  headers: { "NVCF-POLL-SECONDS": "3600" },
6762
6649
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6763
- reasoning: false,
6764
- input: ["text"],
6650
+ reasoning: true,
6651
+ input: ["text", "image"],
6765
6652
  cost: {
6766
6653
  input: 0,
6767
6654
  output: 0,
@@ -6790,44 +6677,6 @@ export const MODELS = {
6790
6677
  contextWindow: 262144,
6791
6678
  maxTokens: 262144,
6792
6679
  },
6793
- "nvidia/llama-3.3-nemotron-super-49b-v1": {
6794
- id: "nvidia/llama-3.3-nemotron-super-49b-v1",
6795
- name: "Llama 3.3 Nemotron Super 49B v1",
6796
- api: "openai-completions",
6797
- provider: "nvidia",
6798
- baseUrl: "https://integrate.api.nvidia.com/v1",
6799
- headers: { "NVCF-POLL-SECONDS": "3600" },
6800
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6801
- reasoning: true,
6802
- input: ["text"],
6803
- cost: {
6804
- input: 0,
6805
- output: 0,
6806
- cacheRead: 0,
6807
- cacheWrite: 0,
6808
- },
6809
- contextWindow: 131072,
6810
- maxTokens: 131072,
6811
- },
6812
- "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
6813
- id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
6814
- name: "Llama 3.3 Nemotron Super 49B v1.5",
6815
- api: "openai-completions",
6816
- provider: "nvidia",
6817
- baseUrl: "https://integrate.api.nvidia.com/v1",
6818
- headers: { "NVCF-POLL-SECONDS": "3600" },
6819
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6820
- reasoning: true,
6821
- input: ["text"],
6822
- cost: {
6823
- input: 0,
6824
- output: 0,
6825
- cacheRead: 0,
6826
- cacheWrite: 0,
6827
- },
6828
- contextWindow: 131072,
6829
- maxTokens: 131072,
6830
- },
6831
6680
  "nvidia/nemotron-3-nano-30b-a3b": {
6832
6681
  id: "nvidia/nemotron-3-nano-30b-a3b",
6833
6682
  name: "nemotron-3-nano-30b-a3b",
@@ -6923,9 +6772,9 @@ export const MODELS = {
6923
6772
  contextWindow: 131072,
6924
6773
  maxTokens: 131072,
6925
6774
  },
6926
- "openai/gpt-oss-20b": {
6927
- id: "openai/gpt-oss-20b",
6928
- name: "GPT OSS 20B",
6775
+ "openai/gpt-oss-120b": {
6776
+ id: "openai/gpt-oss-120b",
6777
+ name: "GPT-OSS-120B",
6929
6778
  api: "openai-completions",
6930
6779
  provider: "nvidia",
6931
6780
  baseUrl: "https://integrate.api.nvidia.com/v1",
@@ -6939,18 +6788,18 @@ export const MODELS = {
6939
6788
  cacheRead: 0,
6940
6789
  cacheWrite: 0,
6941
6790
  },
6942
- contextWindow: 131072,
6943
- maxTokens: 32768,
6791
+ contextWindow: 128000,
6792
+ maxTokens: 8192,
6944
6793
  },
6945
- "qwen/qwen3-coder-480b-a35b-instruct": {
6946
- id: "qwen/qwen3-coder-480b-a35b-instruct",
6947
- name: "Qwen3 Coder 480B A35B Instruct",
6794
+ "openai/gpt-oss-20b": {
6795
+ id: "openai/gpt-oss-20b",
6796
+ name: "GPT OSS 20B",
6948
6797
  api: "openai-completions",
6949
6798
  provider: "nvidia",
6950
6799
  baseUrl: "https://integrate.api.nvidia.com/v1",
6951
6800
  headers: { "NVCF-POLL-SECONDS": "3600" },
6952
6801
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6953
- reasoning: false,
6802
+ reasoning: true,
6954
6803
  input: ["text"],
6955
6804
  cost: {
6956
6805
  input: 0,
@@ -6958,8 +6807,8 @@ export const MODELS = {
6958
6807
  cacheRead: 0,
6959
6808
  cacheWrite: 0,
6960
6809
  },
6961
- contextWindow: 262144,
6962
- maxTokens: 66536,
6810
+ contextWindow: 131072,
6811
+ maxTokens: 32768,
6963
6812
  },
6964
6813
  "qwen/qwen3.5-122b-a10b": {
6965
6814
  id: "qwen/qwen3.5-122b-a10b",
@@ -7871,25 +7720,6 @@ export const MODELS = {
7871
7720
  contextWindow: 200000,
7872
7721
  maxTokens: 32000,
7873
7722
  },
7874
- "claude-fable-5": {
7875
- id: "claude-fable-5",
7876
- name: "Claude Fable 5",
7877
- api: "anthropic-messages",
7878
- provider: "opencode",
7879
- baseUrl: "https://opencode.ai/zen",
7880
- compat: { "forceAdaptiveThinking": true },
7881
- reasoning: true,
7882
- thinkingLevelMap: { "xhigh": "xhigh" },
7883
- input: ["text", "image"],
7884
- cost: {
7885
- input: 10,
7886
- output: 50,
7887
- cacheRead: 1,
7888
- cacheWrite: 12.5,
7889
- },
7890
- contextWindow: 1000000,
7891
- maxTokens: 128000,
7892
- },
7893
7723
  "claude-haiku-4-5": {
7894
7724
  id: "claude-haiku-4-5",
7895
7725
  name: "Claude Haiku 4.5",
@@ -8063,7 +7893,7 @@ export const MODELS = {
8063
7893
  cost: {
8064
7894
  input: 0.14,
8065
7895
  output: 0.28,
8066
- cacheRead: 0.03,
7896
+ cacheRead: 0.028,
8067
7897
  cacheWrite: 0,
8068
7898
  },
8069
7899
  contextWindow: 1000000,
@@ -8088,6 +7918,25 @@ export const MODELS = {
8088
7918
  contextWindow: 200000,
8089
7919
  maxTokens: 128000,
8090
7920
  },
7921
+ "deepseek-v4-pro": {
7922
+ id: "deepseek-v4-pro",
7923
+ name: "DeepSeek V4 Pro",
7924
+ api: "openai-completions",
7925
+ provider: "opencode",
7926
+ baseUrl: "https://opencode.ai/zen/v1",
7927
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7928
+ reasoning: true,
7929
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7930
+ input: ["text"],
7931
+ cost: {
7932
+ input: 1.74,
7933
+ output: 3.84,
7934
+ cacheRead: 0.145,
7935
+ cacheWrite: 0,
7936
+ },
7937
+ contextWindow: 1000000,
7938
+ maxTokens: 384000,
7939
+ },
8091
7940
  "gemini-3-flash": {
8092
7941
  id: "gemini-3-flash",
8093
7942
  name: "Gemini 3 Flash",
@@ -8721,42 +8570,42 @@ export const MODELS = {
8721
8570
  contextWindow: 202752,
8722
8571
  maxTokens: 32768,
8723
8572
  },
8724
- "kimi-k2.5": {
8725
- id: "kimi-k2.5",
8726
- name: "Kimi K2.5",
8573
+ "kimi-k2.6": {
8574
+ id: "kimi-k2.6",
8575
+ name: "Kimi K2.6",
8727
8576
  api: "openai-completions",
8728
8577
  provider: "opencode-go",
8729
8578
  baseUrl: "https://opencode.ai/zen/go/v1",
8730
- compat: { "maxTokensField": "max_tokens" },
8579
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8731
8580
  reasoning: true,
8581
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
8732
8582
  input: ["text", "image"],
8733
8583
  cost: {
8734
- input: 0.6,
8735
- output: 3,
8736
- cacheRead: 0.1,
8584
+ input: 0.95,
8585
+ output: 4,
8586
+ cacheRead: 0.16,
8737
8587
  cacheWrite: 0,
8738
8588
  },
8739
8589
  contextWindow: 262144,
8740
8590
  maxTokens: 65536,
8741
8591
  },
8742
- "kimi-k2.6": {
8743
- id: "kimi-k2.6",
8744
- name: "Kimi K2.6",
8592
+ "kimi-k2.7-code": {
8593
+ id: "kimi-k2.7-code",
8594
+ name: "Kimi K2.7 Code",
8745
8595
  api: "openai-completions",
8746
8596
  provider: "opencode-go",
8747
8597
  baseUrl: "https://opencode.ai/zen/go/v1",
8748
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8598
+ compat: { "maxTokensField": "max_tokens" },
8749
8599
  reasoning: true,
8750
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
8751
8600
  input: ["text", "image"],
8752
8601
  cost: {
8753
8602
  input: 0.95,
8754
8603
  output: 4,
8755
- cacheRead: 0.16,
8604
+ cacheRead: 0.19,
8756
8605
  cacheWrite: 0,
8757
8606
  },
8758
8607
  contextWindow: 262144,
8759
- maxTokens: 65536,
8608
+ maxTokens: 262144,
8760
8609
  },
8761
8610
  "mimo-v2.5": {
8762
8611
  id: "mimo-v2.5",
@@ -8794,23 +8643,6 @@ export const MODELS = {
8794
8643
  contextWindow: 1048576,
8795
8644
  maxTokens: 128000,
8796
8645
  },
8797
- "minimax-m2.5": {
8798
- id: "minimax-m2.5",
8799
- name: "MiniMax M2.5",
8800
- api: "anthropic-messages",
8801
- provider: "opencode-go",
8802
- baseUrl: "https://opencode.ai/zen/go",
8803
- reasoning: true,
8804
- input: ["text"],
8805
- cost: {
8806
- input: 0.3,
8807
- output: 1.2,
8808
- cacheRead: 0.03,
8809
- cacheWrite: 0,
8810
- },
8811
- contextWindow: 204800,
8812
- maxTokens: 65536,
8813
- },
8814
8646
  "minimax-m2.7": {
8815
8647
  id: "minimax-m2.7",
8816
8648
  name: "MiniMax M2.7",
@@ -8831,16 +8663,16 @@ export const MODELS = {
8831
8663
  },
8832
8664
  "minimax-m3": {
8833
8665
  id: "minimax-m3",
8834
- name: "MiniMax M3",
8666
+ name: "MiniMax M3 (3x usage)",
8835
8667
  api: "anthropic-messages",
8836
8668
  provider: "opencode-go",
8837
8669
  baseUrl: "https://opencode.ai/zen/go",
8838
8670
  reasoning: true,
8839
8671
  input: ["text", "image"],
8840
8672
  cost: {
8841
- input: 0.3,
8842
- output: 1.2,
8843
- cacheRead: 0.06,
8673
+ input: 0.1,
8674
+ output: 0.4,
8675
+ cacheRead: 0.02,
8844
8676
  cacheWrite: 0,
8845
8677
  },
8846
8678
  contextWindow: 512000,
@@ -8994,8 +8826,8 @@ export const MODELS = {
8994
8826
  reasoning: false,
8995
8827
  input: ["text", "image"],
8996
8828
  cost: {
8997
- input: 0.7999999999999999,
8998
- output: 3.1999999999999997,
8829
+ input: 0.8,
8830
+ output: 3.2,
8999
8831
  cacheRead: 0,
9000
8832
  cacheWrite: 0,
9001
8833
  },
@@ -9028,7 +8860,7 @@ export const MODELS = {
9028
8860
  reasoning: false,
9029
8861
  input: ["text", "image"],
9030
8862
  cost: {
9031
- input: 0.7999999999999999,
8863
+ input: 0.8,
9032
8864
  output: 4,
9033
8865
  cacheRead: 0.08,
9034
8866
  cacheWrite: 1,
@@ -9064,7 +8896,7 @@ export const MODELS = {
9064
8896
  cost: {
9065
8897
  input: 1,
9066
8898
  output: 5,
9067
- cacheRead: 0.09999999999999999,
8899
+ cacheRead: 0.1,
9068
8900
  cacheWrite: 1.25,
9069
8901
  },
9070
8902
  contextWindow: 200000,
@@ -9408,8 +9240,8 @@ export const MODELS = {
9408
9240
  reasoning: true,
9409
9241
  input: ["text", "image"],
9410
9242
  cost: {
9411
- input: 0.09999999999999999,
9412
- output: 0.39999999999999997,
9243
+ input: 0.1,
9244
+ output: 0.4,
9413
9245
  cacheRead: 0,
9414
9246
  cacheWrite: 0,
9415
9247
  },
@@ -9459,8 +9291,8 @@ export const MODELS = {
9459
9291
  reasoning: false,
9460
9292
  input: ["text"],
9461
9293
  cost: {
9462
- input: 0.20020000000000002,
9463
- output: 0.8000999999999999,
9294
+ input: 0.2002,
9295
+ output: 0.8001,
9464
9296
  cacheRead: 0,
9465
9297
  cacheWrite: 0,
9466
9298
  },
@@ -9476,7 +9308,7 @@ export const MODELS = {
9476
9308
  reasoning: false,
9477
9309
  input: ["text"],
9478
9310
  cost: {
9479
- input: 0.19999999999999998,
9311
+ input: 0.2,
9480
9312
  output: 0.77,
9481
9313
  cacheRead: 0.135,
9482
9314
  cacheWrite: 0,
@@ -9494,7 +9326,7 @@ export const MODELS = {
9494
9326
  input: ["text"],
9495
9327
  cost: {
9496
9328
  input: 0.21,
9497
- output: 0.7899999999999999,
9329
+ output: 0.79,
9498
9330
  cacheRead: 0.13,
9499
9331
  cacheWrite: 0,
9500
9332
  },
@@ -9528,7 +9360,7 @@ export const MODELS = {
9528
9360
  input: ["text"],
9529
9361
  cost: {
9530
9362
  input: 0.5,
9531
- output: 2.1500000000000004,
9363
+ output: 2.15,
9532
9364
  cacheRead: 0.35,
9533
9365
  cacheWrite: 0,
9534
9366
  },
@@ -9597,13 +9429,13 @@ export const MODELS = {
9597
9429
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
9598
9430
  input: ["text"],
9599
9431
  cost: {
9600
- input: 0.0983,
9601
- output: 0.1966,
9602
- cacheRead: 0.019700000000000002,
9432
+ input: 0.098,
9433
+ output: 0.196,
9434
+ cacheRead: 0.02,
9603
9435
  cacheWrite: 0,
9604
9436
  },
9605
9437
  contextWindow: 1048576,
9606
- maxTokens: 131072,
9438
+ maxTokens: 4096,
9607
9439
  },
9608
9440
  "deepseek/deepseek-v4-pro": {
9609
9441
  id: "deepseek/deepseek-v4-pro",
@@ -9653,7 +9485,7 @@ export const MODELS = {
9653
9485
  input: 0.3,
9654
9486
  output: 2.5,
9655
9487
  cacheRead: 0.03,
9656
- cacheWrite: 0.08333333333333334,
9488
+ cacheWrite: 0.083333,
9657
9489
  },
9658
9490
  contextWindow: 1048576,
9659
9491
  maxTokens: 65535,
@@ -9667,10 +9499,10 @@ export const MODELS = {
9667
9499
  reasoning: true,
9668
9500
  input: ["text", "image"],
9669
9501
  cost: {
9670
- input: 0.09999999999999999,
9671
- output: 0.39999999999999997,
9502
+ input: 0.1,
9503
+ output: 0.4,
9672
9504
  cacheRead: 0.01,
9673
- cacheWrite: 0.08333333333333334,
9505
+ cacheWrite: 0.083333,
9674
9506
  },
9675
9507
  contextWindow: 1048576,
9676
9508
  maxTokens: 65535,
@@ -9684,10 +9516,10 @@ export const MODELS = {
9684
9516
  reasoning: true,
9685
9517
  input: ["text", "image"],
9686
9518
  cost: {
9687
- input: 0.09999999999999999,
9688
- output: 0.39999999999999997,
9519
+ input: 0.1,
9520
+ output: 0.4,
9689
9521
  cacheRead: 0.01,
9690
- cacheWrite: 0.08333333333333334,
9522
+ cacheWrite: 0.083333,
9691
9523
  },
9692
9524
  contextWindow: 1048576,
9693
9525
  maxTokens: 65535,
@@ -9754,8 +9586,8 @@ export const MODELS = {
9754
9586
  cost: {
9755
9587
  input: 0.5,
9756
9588
  output: 3,
9757
- cacheRead: 0.049999999999999996,
9758
- cacheWrite: 0.08333333333333334,
9589
+ cacheRead: 0.05,
9590
+ cacheWrite: 0.083333,
9759
9591
  },
9760
9592
  contextWindow: 1048576,
9761
9593
  maxTokens: 65536,
@@ -9771,8 +9603,8 @@ export const MODELS = {
9771
9603
  cost: {
9772
9604
  input: 0.25,
9773
9605
  output: 1.5,
9774
- cacheRead: 0.024999999999999998,
9775
- cacheWrite: 0.08333333333333334,
9606
+ cacheRead: 0.025,
9607
+ cacheWrite: 0.083333,
9776
9608
  },
9777
9609
  contextWindow: 1048576,
9778
9610
  maxTokens: 65536,
@@ -9788,8 +9620,8 @@ export const MODELS = {
9788
9620
  cost: {
9789
9621
  input: 0.25,
9790
9622
  output: 1.5,
9791
- cacheRead: 0.024999999999999998,
9792
- cacheWrite: 0.08333333333333334,
9623
+ cacheRead: 0.025,
9624
+ cacheWrite: 0.083333,
9793
9625
  },
9794
9626
  contextWindow: 1048576,
9795
9627
  maxTokens: 65536,
@@ -9805,7 +9637,7 @@ export const MODELS = {
9805
9637
  cost: {
9806
9638
  input: 2,
9807
9639
  output: 12,
9808
- cacheRead: 0.19999999999999998,
9640
+ cacheRead: 0.2,
9809
9641
  cacheWrite: 0.375,
9810
9642
  },
9811
9643
  contextWindow: 1048576,
@@ -9822,7 +9654,7 @@ export const MODELS = {
9822
9654
  cost: {
9823
9655
  input: 2,
9824
9656
  output: 12,
9825
- cacheRead: 0.19999999999999998,
9657
+ cacheRead: 0.2,
9826
9658
  cacheWrite: 0.375,
9827
9659
  },
9828
9660
  contextWindow: 1048756,
@@ -9840,7 +9672,7 @@ export const MODELS = {
9840
9672
  input: 1.5,
9841
9673
  output: 9,
9842
9674
  cacheRead: 0.15,
9843
- cacheWrite: 0.08333333333333334,
9675
+ cacheWrite: 0.083333,
9844
9676
  },
9845
9677
  contextWindow: 1048576,
9846
9678
  maxTokens: 65536,
@@ -9854,7 +9686,7 @@ export const MODELS = {
9854
9686
  reasoning: false,
9855
9687
  input: ["text", "image"],
9856
9688
  cost: {
9857
- input: 0.049999999999999996,
9689
+ input: 0.05,
9858
9690
  output: 0.15,
9859
9691
  cacheRead: 0,
9860
9692
  cacheWrite: 0,
@@ -9923,12 +9755,12 @@ export const MODELS = {
9923
9755
  input: ["text", "image"],
9924
9756
  cost: {
9925
9757
  input: 0.12,
9926
- output: 0.36,
9758
+ output: 0.35,
9927
9759
  cacheRead: 0.09,
9928
9760
  cacheWrite: 0,
9929
9761
  },
9930
9762
  contextWindow: 262144,
9931
- maxTokens: 8192,
9763
+ maxTokens: 262144,
9932
9764
  },
9933
9765
  "google/gemma-4-31b-it:free": {
9934
9766
  id: "google/gemma-4-31b-it:free",
@@ -9956,9 +9788,9 @@ export const MODELS = {
9956
9788
  reasoning: false,
9957
9789
  input: ["text"],
9958
9790
  cost: {
9959
- input: 0.049999999999999996,
9960
- output: 0.09999999999999999,
9961
- cacheRead: 0.049999999999999996,
9791
+ input: 0.05,
9792
+ output: 0.1,
9793
+ cacheRead: 0.05,
9962
9794
  cacheWrite: 0,
9963
9795
  },
9964
9796
  contextWindow: 131072,
@@ -9976,7 +9808,7 @@ export const MODELS = {
9976
9808
  cost: {
9977
9809
  input: 0.25,
9978
9810
  output: 0.75,
9979
- cacheRead: 0.024999999999999998,
9811
+ cacheRead: 0.025,
9980
9812
  cacheWrite: 0,
9981
9813
  },
9982
9814
  contextWindow: 128000,
@@ -10059,8 +9891,8 @@ export const MODELS = {
10059
9891
  reasoning: false,
10060
9892
  input: ["text"],
10061
9893
  cost: {
10062
- input: 0.39999999999999997,
10063
- output: 0.39999999999999997,
9894
+ input: 0.4,
9895
+ output: 0.4,
10064
9896
  cacheRead: 0,
10065
9897
  cacheWrite: 0,
10066
9898
  },
@@ -10093,7 +9925,7 @@ export const MODELS = {
10093
9925
  reasoning: false,
10094
9926
  input: ["text"],
10095
9927
  cost: {
10096
- input: 0.09999999999999999,
9928
+ input: 0.1,
10097
9929
  output: 0.32,
10098
9930
  cacheRead: 0,
10099
9931
  cacheWrite: 0,
@@ -10144,7 +9976,7 @@ export const MODELS = {
10144
9976
  reasoning: false,
10145
9977
  input: ["text", "image"],
10146
9978
  cost: {
10147
- input: 0.09999999999999999,
9979
+ input: 0.1,
10148
9980
  output: 0.3,
10149
9981
  cacheRead: 0,
10150
9982
  cacheWrite: 0,
@@ -10161,7 +9993,7 @@ export const MODELS = {
10161
9993
  reasoning: true,
10162
9994
  input: ["text"],
10163
9995
  cost: {
10164
- input: 0.39999999999999997,
9996
+ input: 0.4,
10165
9997
  output: 2.2,
10166
9998
  cacheRead: 0,
10167
9999
  cacheWrite: 0,
@@ -10213,8 +10045,8 @@ export const MODELS = {
10213
10045
  input: ["text"],
10214
10046
  cost: {
10215
10047
  input: 0.15,
10216
- output: 0.8999999999999999,
10217
- cacheRead: 0.049999999999999996,
10048
+ output: 0.9,
10049
+ cacheRead: 0.05,
10218
10050
  cacheWrite: 0,
10219
10051
  },
10220
10052
  contextWindow: 204800,
@@ -10229,9 +10061,9 @@ export const MODELS = {
10229
10061
  reasoning: true,
10230
10062
  input: ["text"],
10231
10063
  cost: {
10232
- input: 0.27,
10233
- output: 1.08,
10234
- cacheRead: 0.054,
10064
+ input: 0.25,
10065
+ output: 1,
10066
+ cacheRead: 0.05,
10235
10067
  cacheWrite: 0,
10236
10068
  },
10237
10069
  contextWindow: 204800,
@@ -10264,7 +10096,7 @@ export const MODELS = {
10264
10096
  input: ["text"],
10265
10097
  cost: {
10266
10098
  input: 0.3,
10267
- output: 0.8999999999999999,
10099
+ output: 0.9,
10268
10100
  cacheRead: 0.03,
10269
10101
  cacheWrite: 0,
10270
10102
  },
@@ -10280,7 +10112,7 @@ export const MODELS = {
10280
10112
  reasoning: false,
10281
10113
  input: ["text"],
10282
10114
  cost: {
10283
- input: 0.39999999999999997,
10115
+ input: 0.4,
10284
10116
  output: 2,
10285
10117
  cacheRead: 0.04,
10286
10118
  cacheWrite: 0,
@@ -10297,8 +10129,8 @@ export const MODELS = {
10297
10129
  reasoning: false,
10298
10130
  input: ["text", "image"],
10299
10131
  cost: {
10300
- input: 0.19999999999999998,
10301
- output: 0.19999999999999998,
10132
+ input: 0.2,
10133
+ output: 0.2,
10302
10134
  cacheRead: 0.02,
10303
10135
  cacheWrite: 0,
10304
10136
  },
@@ -10314,8 +10146,8 @@ export const MODELS = {
10314
10146
  reasoning: false,
10315
10147
  input: ["text", "image"],
10316
10148
  cost: {
10317
- input: 0.09999999999999999,
10318
- output: 0.09999999999999999,
10149
+ input: 0.1,
10150
+ output: 0.1,
10319
10151
  cacheRead: 0.01,
10320
10152
  cacheWrite: 0,
10321
10153
  },
@@ -10350,7 +10182,7 @@ export const MODELS = {
10350
10182
  cost: {
10351
10183
  input: 2,
10352
10184
  output: 6,
10353
- cacheRead: 0.19999999999999998,
10185
+ cacheRead: 0.2,
10354
10186
  cacheWrite: 0,
10355
10187
  },
10356
10188
  contextWindow: 128000,
@@ -10367,7 +10199,7 @@ export const MODELS = {
10367
10199
  cost: {
10368
10200
  input: 2,
10369
10201
  output: 6,
10370
- cacheRead: 0.19999999999999998,
10202
+ cacheRead: 0.2,
10371
10203
  cacheWrite: 0,
10372
10204
  },
10373
10205
  contextWindow: 131072,
@@ -10384,7 +10216,7 @@ export const MODELS = {
10384
10216
  cost: {
10385
10217
  input: 0.5,
10386
10218
  output: 1.5,
10387
- cacheRead: 0.049999999999999996,
10219
+ cacheRead: 0.05,
10388
10220
  cacheWrite: 0,
10389
10221
  },
10390
10222
  contextWindow: 262144,
@@ -10399,7 +10231,7 @@ export const MODELS = {
10399
10231
  reasoning: false,
10400
10232
  input: ["text", "image"],
10401
10233
  cost: {
10402
- input: 0.39999999999999997,
10234
+ input: 0.4,
10403
10235
  output: 2,
10404
10236
  cacheRead: 0.04,
10405
10237
  cacheWrite: 0,
@@ -10433,7 +10265,7 @@ export const MODELS = {
10433
10265
  reasoning: false,
10434
10266
  input: ["text", "image"],
10435
10267
  cost: {
10436
- input: 0.39999999999999997,
10268
+ input: 0.4,
10437
10269
  output: 2,
10438
10270
  cacheRead: 0.04,
10439
10271
  cacheWrite: 0,
@@ -10467,7 +10299,7 @@ export const MODELS = {
10467
10299
  reasoning: false,
10468
10300
  input: ["text"],
10469
10301
  cost: {
10470
- input: 0.19999999999999998,
10302
+ input: 0.2,
10471
10303
  output: 0.6,
10472
10304
  cacheRead: 0.02,
10473
10305
  cacheWrite: 0,
@@ -10502,7 +10334,7 @@ export const MODELS = {
10502
10334
  input: ["text", "image"],
10503
10335
  cost: {
10504
10336
  input: 0.075,
10505
- output: 0.19999999999999998,
10337
+ output: 0.2,
10506
10338
  cacheRead: 0,
10507
10339
  cacheWrite: 0,
10508
10340
  },
@@ -10520,7 +10352,7 @@ export const MODELS = {
10520
10352
  cost: {
10521
10353
  input: 2,
10522
10354
  output: 6,
10523
- cacheRead: 0.19999999999999998,
10355
+ cacheRead: 0.2,
10524
10356
  cacheWrite: 0,
10525
10357
  },
10526
10358
  contextWindow: 65536,
@@ -10535,7 +10367,7 @@ export const MODELS = {
10535
10367
  reasoning: false,
10536
10368
  input: ["text"],
10537
10369
  cost: {
10538
- input: 0.09999999999999999,
10370
+ input: 0.1,
10539
10371
  output: 0.3,
10540
10372
  cacheRead: 0.01,
10541
10373
  cacheWrite: 0,
@@ -10552,7 +10384,7 @@ export const MODELS = {
10552
10384
  reasoning: false,
10553
10385
  input: ["text"],
10554
10386
  cost: {
10555
- input: 0.5700000000000001,
10387
+ input: 0.57,
10556
10388
  output: 2.3,
10557
10389
  cacheRead: 0,
10558
10390
  cacheWrite: 0,
@@ -10621,27 +10453,26 @@ export const MODELS = {
10621
10453
  reasoning: true,
10622
10454
  input: ["text", "image"],
10623
10455
  cost: {
10624
- input: 0.6799999999999999,
10456
+ input: 0.68,
10625
10457
  output: 3.41,
10626
- cacheRead: 0.33999999999999997,
10458
+ cacheRead: 0.34,
10627
10459
  cacheWrite: 0,
10628
10460
  },
10629
10461
  contextWindow: 262144,
10630
10462
  maxTokens: 262142,
10631
10463
  },
10632
- "moonshotai/kimi-k2.6:free": {
10633
- id: "moonshotai/kimi-k2.6:free",
10634
- name: "MoonshotAI: Kimi K2.6 (free)",
10464
+ "moonshotai/kimi-k2.7-code": {
10465
+ id: "moonshotai/kimi-k2.7-code",
10466
+ name: "MoonshotAI: Kimi K2.7 Code",
10635
10467
  api: "openai-completions",
10636
10468
  provider: "openrouter",
10637
10469
  baseUrl: "https://openrouter.ai/api/v1",
10638
- compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
10639
10470
  reasoning: true,
10640
10471
  input: ["text", "image"],
10641
10472
  cost: {
10642
- input: 0,
10643
- output: 0,
10644
- cacheRead: 0,
10473
+ input: 0.95,
10474
+ output: 4,
10475
+ cacheRead: 0.19,
10645
10476
  cacheWrite: 0,
10646
10477
  },
10647
10478
  contextWindow: 262144,
@@ -10673,8 +10504,8 @@ export const MODELS = {
10673
10504
  reasoning: true,
10674
10505
  input: ["text"],
10675
10506
  cost: {
10676
- input: 0.39999999999999997,
10677
- output: 0.39999999999999997,
10507
+ input: 0.4,
10508
+ output: 0.4,
10678
10509
  cacheRead: 0,
10679
10510
  cacheWrite: 0,
10680
10511
  },
@@ -10690,8 +10521,8 @@ export const MODELS = {
10690
10521
  reasoning: true,
10691
10522
  input: ["text"],
10692
10523
  cost: {
10693
- input: 0.049999999999999996,
10694
- output: 0.19999999999999998,
10524
+ input: 0.05,
10525
+ output: 0.2,
10695
10526
  cacheRead: 0,
10696
10527
  cacheWrite: 0,
10697
10528
  },
@@ -10742,7 +10573,7 @@ export const MODELS = {
10742
10573
  input: ["text"],
10743
10574
  cost: {
10744
10575
  input: 0.09,
10745
- output: 0.44999999999999996,
10576
+ output: 0.45,
10746
10577
  cacheRead: 0,
10747
10578
  cacheWrite: 0,
10748
10579
  },
@@ -10817,23 +10648,6 @@ export const MODELS = {
10817
10648
  contextWindow: 128000,
10818
10649
  maxTokens: 128000,
10819
10650
  },
10820
- "nvidia/nemotron-nano-9b-v2": {
10821
- id: "nvidia/nemotron-nano-9b-v2",
10822
- name: "NVIDIA: Nemotron Nano 9B V2",
10823
- api: "openai-completions",
10824
- provider: "openrouter",
10825
- baseUrl: "https://openrouter.ai/api/v1",
10826
- reasoning: true,
10827
- input: ["text"],
10828
- cost: {
10829
- input: 0.04,
10830
- output: 0.16,
10831
- cacheRead: 0,
10832
- cacheWrite: 0,
10833
- },
10834
- contextWindow: 131072,
10835
- maxTokens: 16384,
10836
- },
10837
10651
  "nvidia/nemotron-nano-9b-v2:free": {
10838
10652
  id: "nvidia/nemotron-nano-9b-v2:free",
10839
10653
  name: "NVIDIA: Nemotron Nano 9B V2 (free)",
@@ -10979,9 +10793,9 @@ export const MODELS = {
10979
10793
  reasoning: false,
10980
10794
  input: ["text", "image"],
10981
10795
  cost: {
10982
- input: 0.39999999999999997,
10983
- output: 1.5999999999999999,
10984
- cacheRead: 0.09999999999999999,
10796
+ input: 0.4,
10797
+ output: 1.6,
10798
+ cacheRead: 0.1,
10985
10799
  cacheWrite: 0,
10986
10800
  },
10987
10801
  contextWindow: 1047576,
@@ -10996,9 +10810,9 @@ export const MODELS = {
10996
10810
  reasoning: false,
10997
10811
  input: ["text", "image"],
10998
10812
  cost: {
10999
- input: 0.09999999999999999,
11000
- output: 0.39999999999999997,
11001
- cacheRead: 0.024999999999999998,
10813
+ input: 0.1,
10814
+ output: 0.4,
10815
+ cacheRead: 0.025,
11002
10816
  cacheWrite: 0,
11003
10817
  },
11004
10818
  contextWindow: 1047576,
@@ -11151,7 +10965,7 @@ export const MODELS = {
11151
10965
  cost: {
11152
10966
  input: 0.25,
11153
10967
  output: 2,
11154
- cacheRead: 0.024999999999999998,
10968
+ cacheRead: 0.025,
11155
10969
  cacheWrite: 0,
11156
10970
  },
11157
10971
  contextWindow: 400000,
@@ -11166,8 +10980,8 @@ export const MODELS = {
11166
10980
  reasoning: true,
11167
10981
  input: ["text", "image"],
11168
10982
  cost: {
11169
- input: 0.049999999999999996,
11170
- output: 0.39999999999999997,
10983
+ input: 0.05,
10984
+ output: 0.4,
11171
10985
  cacheRead: 0.01,
11172
10986
  cacheWrite: 0,
11173
10987
  },
@@ -11270,7 +11084,7 @@ export const MODELS = {
11270
11084
  cost: {
11271
11085
  input: 0.25,
11272
11086
  output: 2,
11273
- cacheRead: 0.024999999999999998,
11087
+ cacheRead: 0.025,
11274
11088
  cacheWrite: 0,
11275
11089
  },
11276
11090
  contextWindow: 400000,
@@ -11430,7 +11244,7 @@ export const MODELS = {
11430
11244
  thinkingLevelMap: { "xhigh": "xhigh" },
11431
11245
  input: ["text", "image"],
11432
11246
  cost: {
11433
- input: 0.19999999999999998,
11247
+ input: 0.2,
11434
11248
  output: 1.25,
11435
11249
  cacheRead: 0.02,
11436
11250
  cacheWrite: 0,
@@ -11875,7 +11689,7 @@ export const MODELS = {
11875
11689
  reasoning: true,
11876
11690
  input: ["text"],
11877
11691
  cost: {
11878
- input: 0.19999999999999998,
11692
+ input: 0.2,
11879
11693
  output: 1.1,
11880
11694
  cacheRead: 0,
11881
11695
  cacheWrite: 0,
@@ -11893,7 +11707,7 @@ export const MODELS = {
11893
11707
  input: ["text"],
11894
11708
  cost: {
11895
11709
  input: 0.36,
11896
- output: 0.39999999999999997,
11710
+ output: 0.4,
11897
11711
  cacheRead: 0,
11898
11712
  cacheWrite: 0,
11899
11713
  },
@@ -11911,7 +11725,7 @@ export const MODELS = {
11911
11725
  cost: {
11912
11726
  input: 0.26,
11913
11727
  output: 0.78,
11914
- cacheRead: 0.052000000000000005,
11728
+ cacheRead: 0.052,
11915
11729
  cacheWrite: 0.325,
11916
11730
  },
11917
11731
  contextWindow: 1000000,
@@ -11960,7 +11774,7 @@ export const MODELS = {
11960
11774
  reasoning: true,
11961
11775
  input: ["text"],
11962
11776
  cost: {
11963
- input: 0.09999999999999999,
11777
+ input: 0.1,
11964
11778
  output: 0.24,
11965
11779
  cacheRead: 0,
11966
11780
  cacheWrite: 0,
@@ -11977,8 +11791,8 @@ export const MODELS = {
11977
11791
  reasoning: true,
11978
11792
  input: ["text"],
11979
11793
  cost: {
11980
- input: 0.45499999999999996,
11981
- output: 1.8199999999999998,
11794
+ input: 0.455,
11795
+ output: 1.82,
11982
11796
  cacheRead: 0,
11983
11797
  cacheWrite: 0,
11984
11798
  },
@@ -11995,7 +11809,7 @@ export const MODELS = {
11995
11809
  input: ["text"],
11996
11810
  cost: {
11997
11811
  input: 0.09,
11998
- output: 0.09999999999999999,
11812
+ output: 0.1,
11999
11813
  cacheRead: 0,
12000
11814
  cacheWrite: 0,
12001
11815
  },
@@ -12011,9 +11825,9 @@ export const MODELS = {
12011
11825
  reasoning: true,
12012
11826
  input: ["text"],
12013
11827
  cost: {
12014
- input: 0.09999999999999999,
12015
- output: 0.09999999999999999,
12016
- cacheRead: 0.09999999999999999,
11828
+ input: 0.1,
11829
+ output: 0.1,
11830
+ cacheRead: 0.1,
12017
11831
  cacheWrite: 0,
12018
11832
  },
12019
11833
  contextWindow: 262144,
@@ -12063,7 +11877,7 @@ export const MODELS = {
12063
11877
  input: ["text"],
12064
11878
  cost: {
12065
11879
  input: 0.08,
12066
- output: 0.39999999999999997,
11880
+ output: 0.4,
12067
11881
  cacheRead: 0.08,
12068
11882
  cacheWrite: 0,
12069
11883
  },
@@ -12096,9 +11910,9 @@ export const MODELS = {
12096
11910
  reasoning: true,
12097
11911
  input: ["text"],
12098
11912
  cost: {
12099
- input: 0.049999999999999996,
12100
- output: 0.39999999999999997,
12101
- cacheRead: 0.049999999999999996,
11913
+ input: 0.05,
11914
+ output: 0.4,
11915
+ cacheRead: 0.05,
12102
11916
  cacheWrite: 0,
12103
11917
  },
12104
11918
  contextWindow: 131072,
@@ -12114,7 +11928,7 @@ export const MODELS = {
12114
11928
  input: ["text"],
12115
11929
  cost: {
12116
11930
  input: 0.22,
12117
- output: 1.7999999999999998,
11931
+ output: 1.8,
12118
11932
  cacheRead: 0,
12119
11933
  cacheWrite: 0,
12120
11934
  },
@@ -12165,7 +11979,7 @@ export const MODELS = {
12165
11979
  input: ["text"],
12166
11980
  cost: {
12167
11981
  input: 0.11,
12168
- output: 0.7999999999999999,
11982
+ output: 0.8,
12169
11983
  cacheRead: 0.07,
12170
11984
  cacheWrite: 0,
12171
11985
  },
@@ -12300,7 +12114,7 @@ export const MODELS = {
12300
12114
  reasoning: false,
12301
12115
  input: ["text", "image"],
12302
12116
  cost: {
12303
- input: 0.19999999999999998,
12117
+ input: 0.2,
12304
12118
  output: 0.88,
12305
12119
  cacheRead: 0.11,
12306
12120
  cacheWrite: 0,
@@ -12368,8 +12182,8 @@ export const MODELS = {
12368
12182
  reasoning: false,
12369
12183
  input: ["text", "image"],
12370
12184
  cost: {
12371
- input: 0.10400000000000001,
12372
- output: 0.41600000000000004,
12185
+ input: 0.104,
12186
+ output: 0.416,
12373
12187
  cacheRead: 0,
12374
12188
  cacheWrite: 0,
12375
12189
  },
@@ -12455,7 +12269,7 @@ export const MODELS = {
12455
12269
  cost: {
12456
12270
  input: 0.14,
12457
12271
  output: 1,
12458
- cacheRead: 0.049999999999999996,
12272
+ cacheRead: 0.05,
12459
12273
  cacheWrite: 0,
12460
12274
  },
12461
12275
  contextWindow: 262144,
@@ -12487,7 +12301,7 @@ export const MODELS = {
12487
12301
  reasoning: true,
12488
12302
  input: ["text", "image"],
12489
12303
  cost: {
12490
- input: 0.09999999999999999,
12304
+ input: 0.1,
12491
12305
  output: 0.15,
12492
12306
  cacheRead: 0,
12493
12307
  cacheWrite: 0,
@@ -12539,7 +12353,7 @@ export const MODELS = {
12539
12353
  input: ["text", "image"],
12540
12354
  cost: {
12541
12355
  input: 0.3,
12542
- output: 1.7999999999999998,
12356
+ output: 1.8,
12543
12357
  cacheRead: 0,
12544
12358
  cacheWrite: 0.375,
12545
12359
  },
@@ -12555,13 +12369,13 @@ export const MODELS = {
12555
12369
  reasoning: true,
12556
12370
  input: ["text", "image"],
12557
12371
  cost: {
12558
- input: 0.28900000000000003,
12559
- output: 2.4,
12372
+ input: 0.2885,
12373
+ output: 3.17,
12560
12374
  cacheRead: 0,
12561
12375
  cacheWrite: 0,
12562
12376
  },
12563
12377
  contextWindow: 262144,
12564
- maxTokens: 131072,
12378
+ maxTokens: 262140,
12565
12379
  },
12566
12380
  "qwen/qwen3.6-35b-a3b": {
12567
12381
  id: "qwen/qwen3.6-35b-a3b",
@@ -12572,13 +12386,13 @@ export const MODELS = {
12572
12386
  reasoning: true,
12573
12387
  input: ["text", "image"],
12574
12388
  cost: {
12575
- input: 0.14,
12389
+ input: 0.15,
12576
12390
  output: 1,
12577
- cacheRead: 0,
12391
+ cacheRead: 0.05,
12578
12392
  cacheWrite: 0,
12579
12393
  },
12580
12394
  contextWindow: 262144,
12581
- maxTokens: 262140,
12395
+ maxTokens: 262144,
12582
12396
  },
12583
12397
  "qwen/qwen3.6-flash": {
12584
12398
  id: "qwen/qwen3.6-flash",
@@ -12657,10 +12471,10 @@ export const MODELS = {
12657
12471
  reasoning: true,
12658
12472
  input: ["text", "image"],
12659
12473
  cost: {
12660
- input: 0.39999999999999997,
12661
- output: 1.5999999999999999,
12662
- cacheRead: 0.08,
12663
- cacheWrite: 0.5,
12474
+ input: 0.32,
12475
+ output: 1.28,
12476
+ cacheRead: 0.064,
12477
+ cacheWrite: 0.4,
12664
12478
  },
12665
12479
  contextWindow: 1000000,
12666
12480
  maxTokens: 65536,
@@ -12674,8 +12488,8 @@ export const MODELS = {
12674
12488
  reasoning: false,
12675
12489
  input: ["text", "image"],
12676
12490
  cost: {
12677
- input: 0.09999999999999999,
12678
- output: 0.09999999999999999,
12491
+ input: 0.1,
12492
+ output: 0.1,
12679
12493
  cacheRead: 0,
12680
12494
  cacheWrite: 0,
12681
12495
  },
@@ -12742,7 +12556,7 @@ export const MODELS = {
12742
12556
  reasoning: true,
12743
12557
  input: ["text", "image"],
12744
12558
  cost: {
12745
- input: 0.19999999999999998,
12559
+ input: 0.2,
12746
12560
  output: 1.15,
12747
12561
  cacheRead: 0.04,
12748
12562
  cacheWrite: 0,
@@ -12761,7 +12575,7 @@ export const MODELS = {
12761
12575
  cost: {
12762
12576
  input: 0.063,
12763
12577
  output: 0.21,
12764
- cacheRead: 0.020999999999999998,
12578
+ cacheRead: 0.021,
12765
12579
  cacheWrite: 0,
12766
12580
  },
12767
12581
  contextWindow: 262144,
@@ -12776,7 +12590,7 @@ export const MODELS = {
12776
12590
  reasoning: false,
12777
12591
  input: ["text"],
12778
12592
  cost: {
12779
- input: 0.16999999999999998,
12593
+ input: 0.17,
12780
12594
  output: 0.43,
12781
12595
  cacheRead: 0,
12782
12596
  cacheWrite: 0,
@@ -12793,8 +12607,8 @@ export const MODELS = {
12793
12607
  reasoning: false,
12794
12608
  input: ["text"],
12795
12609
  cost: {
12796
- input: 0.39999999999999997,
12797
- output: 0.39999999999999997,
12610
+ input: 0.4,
12611
+ output: 0.4,
12798
12612
  cacheRead: 0,
12799
12613
  cacheWrite: 0,
12800
12614
  },
@@ -12829,7 +12643,7 @@ export const MODELS = {
12829
12643
  cost: {
12830
12644
  input: 1.25,
12831
12645
  output: 2.5,
12832
- cacheRead: 0.19999999999999998,
12646
+ cacheRead: 0.2,
12833
12647
  cacheWrite: 0,
12834
12648
  },
12835
12649
  contextWindow: 2000000,
@@ -12846,7 +12660,7 @@ export const MODELS = {
12846
12660
  cost: {
12847
12661
  input: 1.25,
12848
12662
  output: 2.5,
12849
- cacheRead: 0.19999999999999998,
12663
+ cacheRead: 0.2,
12850
12664
  cacheWrite: 0,
12851
12665
  },
12852
12666
  contextWindow: 1000000,
@@ -12863,7 +12677,7 @@ export const MODELS = {
12863
12677
  cost: {
12864
12678
  input: 1,
12865
12679
  output: 2,
12866
- cacheRead: 0.19999999999999998,
12680
+ cacheRead: 0.2,
12867
12681
  cacheWrite: 0,
12868
12682
  },
12869
12683
  contextWindow: 256000,
@@ -12878,7 +12692,7 @@ export const MODELS = {
12878
12692
  reasoning: true,
12879
12693
  input: ["text"],
12880
12694
  cost: {
12881
- input: 0.09999999999999999,
12695
+ input: 0.1,
12882
12696
  output: 0.3,
12883
12697
  cacheRead: 0.01,
12884
12698
  cacheWrite: 0,
@@ -12920,23 +12734,6 @@ export const MODELS = {
12920
12734
  contextWindow: 1048576,
12921
12735
  maxTokens: 131072,
12922
12736
  },
12923
- "z-ai/glm-4-32b": {
12924
- id: "z-ai/glm-4-32b",
12925
- name: "Z.ai: GLM 4 32B ",
12926
- api: "openai-completions",
12927
- provider: "openrouter",
12928
- baseUrl: "https://openrouter.ai/api/v1",
12929
- reasoning: false,
12930
- input: ["text"],
12931
- cost: {
12932
- input: 0.09999999999999999,
12933
- output: 0.09999999999999999,
12934
- cacheRead: 0,
12935
- cacheWrite: 0,
12936
- },
12937
- contextWindow: 128000,
12938
- maxTokens: 4096,
12939
- },
12940
12737
  "z-ai/glm-4.5": {
12941
12738
  id: "z-ai/glm-4.5",
12942
12739
  name: "Z.ai: GLM 4.5",
@@ -12971,23 +12768,6 @@ export const MODELS = {
12971
12768
  contextWindow: 131072,
12972
12769
  maxTokens: 131070,
12973
12770
  },
12974
- "z-ai/glm-4.5-air:free": {
12975
- id: "z-ai/glm-4.5-air:free",
12976
- name: "Z.ai: GLM 4.5 Air (free)",
12977
- api: "openai-completions",
12978
- provider: "openrouter",
12979
- baseUrl: "https://openrouter.ai/api/v1",
12980
- reasoning: true,
12981
- input: ["text"],
12982
- cost: {
12983
- input: 0,
12984
- output: 0,
12985
- cacheRead: 0,
12986
- cacheWrite: 0,
12987
- },
12988
- contextWindow: 131072,
12989
- maxTokens: 96000,
12990
- },
12991
12771
  "z-ai/glm-4.5v": {
12992
12772
  id: "z-ai/glm-4.5v",
12993
12773
  name: "Z.ai: GLM 4.5V",
@@ -12998,7 +12778,7 @@ export const MODELS = {
12998
12778
  input: ["text", "image"],
12999
12779
  cost: {
13000
12780
  input: 0.6,
13001
- output: 1.7999999999999998,
12781
+ output: 1.8,
13002
12782
  cacheRead: 0.11,
13003
12783
  cacheWrite: 0,
13004
12784
  },
@@ -13032,12 +12812,12 @@ export const MODELS = {
13032
12812
  input: ["text", "image"],
13033
12813
  cost: {
13034
12814
  input: 0.3,
13035
- output: 0.8999999999999999,
13036
- cacheRead: 0.049999999999999996,
12815
+ output: 0.9,
12816
+ cacheRead: 0.055,
13037
12817
  cacheWrite: 0,
13038
12818
  },
13039
12819
  contextWindow: 131072,
13040
- maxTokens: 24000,
12820
+ maxTokens: 32768,
13041
12821
  },
13042
12822
  "z-ai/glm-4.7": {
13043
12823
  id: "z-ai/glm-4.7",
@@ -13048,7 +12828,7 @@ export const MODELS = {
13048
12828
  reasoning: true,
13049
12829
  input: ["text"],
13050
12830
  cost: {
13051
- input: 0.39999999999999997,
12831
+ input: 0.4,
13052
12832
  output: 1.75,
13053
12833
  cacheRead: 0.08,
13054
12834
  cacheWrite: 0,
@@ -13066,7 +12846,7 @@ export const MODELS = {
13066
12846
  input: ["text"],
13067
12847
  cost: {
13068
12848
  input: 0.06,
13069
- output: 0.39999999999999997,
12849
+ output: 0.4,
13070
12850
  cacheRead: 0.01,
13071
12851
  cacheWrite: 0,
13072
12852
  },
@@ -13104,7 +12884,7 @@ export const MODELS = {
13104
12884
  cacheRead: 0.24,
13105
12885
  cacheWrite: 0,
13106
12886
  },
13107
- contextWindow: 202752,
12887
+ contextWindow: 262144,
13108
12888
  maxTokens: 131072,
13109
12889
  },
13110
12890
  "z-ai/glm-5.1": {
@@ -13124,23 +12904,6 @@ export const MODELS = {
13124
12904
  contextWindow: 202752,
13125
12905
  maxTokens: 4096,
13126
12906
  },
13127
- "z-ai/glm-5v-turbo": {
13128
- id: "z-ai/glm-5v-turbo",
13129
- name: "Z.ai: GLM 5V Turbo",
13130
- api: "openai-completions",
13131
- provider: "openrouter",
13132
- baseUrl: "https://openrouter.ai/api/v1",
13133
- reasoning: true,
13134
- input: ["text", "image"],
13135
- cost: {
13136
- input: 1.2,
13137
- output: 4,
13138
- cacheRead: 0.24,
13139
- cacheWrite: 0,
13140
- },
13141
- contextWindow: 202752,
13142
- maxTokens: 131072,
13143
- },
13144
12907
  "~anthropic/claude-fable-latest": {
13145
12908
  id: "~anthropic/claude-fable-latest",
13146
12909
  name: "Anthropic: Claude Fable Latest",
@@ -13169,7 +12932,7 @@ export const MODELS = {
13169
12932
  cost: {
13170
12933
  input: 1,
13171
12934
  output: 5,
13172
- cacheRead: 0.09999999999999999,
12935
+ cacheRead: 0.1,
13173
12936
  cacheWrite: 1.25,
13174
12937
  },
13175
12938
  contextWindow: 200000,
@@ -13221,7 +12984,7 @@ export const MODELS = {
13221
12984
  input: 1.5,
13222
12985
  output: 9,
13223
12986
  cacheRead: 0.15,
13224
- cacheWrite: 0.08333333333333334,
12987
+ cacheWrite: 0.083333,
13225
12988
  },
13226
12989
  contextWindow: 1048576,
13227
12990
  maxTokens: 65536,
@@ -13237,7 +13000,7 @@ export const MODELS = {
13237
13000
  cost: {
13238
13001
  input: 2,
13239
13002
  output: 12,
13240
- cacheRead: 0.19999999999999998,
13003
+ cacheRead: 0.2,
13241
13004
  cacheWrite: 0.375,
13242
13005
  },
13243
13006
  contextWindow: 1048576,
@@ -13252,9 +13015,9 @@ export const MODELS = {
13252
13015
  reasoning: true,
13253
13016
  input: ["text", "image"],
13254
13017
  cost: {
13255
- input: 0.6799999999999999,
13018
+ input: 0.68,
13256
13019
  output: 3.41,
13257
- cacheRead: 0.33999999999999997,
13020
+ cacheRead: 0.34,
13258
13021
  cacheWrite: 0,
13259
13022
  },
13260
13023
  contextWindow: 262144,
@@ -13296,25 +13059,6 @@ export const MODELS = {
13296
13059
  },
13297
13060
  },
13298
13061
  "together": {
13299
- "MiniMaxAI/MiniMax-M2.5": {
13300
- id: "MiniMaxAI/MiniMax-M2.5",
13301
- name: "MiniMax-M2.5",
13302
- api: "openai-completions",
13303
- provider: "together",
13304
- baseUrl: "https://api.together.ai/v1",
13305
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13306
- reasoning: true,
13307
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13308
- input: ["text"],
13309
- cost: {
13310
- input: 0.3,
13311
- output: 1.2,
13312
- cacheRead: 0.06,
13313
- cacheWrite: 0,
13314
- },
13315
- contextWindow: 204800,
13316
- maxTokens: 131072,
13317
- },
13318
13062
  "MiniMaxAI/MiniMax-M2.7": {
13319
13063
  id: "MiniMaxAI/MiniMax-M2.7",
13320
13064
  name: "MiniMax-M2.7",
@@ -13334,28 +13078,28 @@ export const MODELS = {
13334
13078
  contextWindow: 202752,
13335
13079
  maxTokens: 131072,
13336
13080
  },
13337
- "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
13338
- id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
13339
- name: "Qwen3 235B A22B Instruct 2507 FP8",
13081
+ "MiniMaxAI/MiniMax-M3": {
13082
+ id: "MiniMaxAI/MiniMax-M3",
13083
+ name: "MiniMax-M3",
13340
13084
  api: "openai-completions",
13341
13085
  provider: "together",
13342
13086
  baseUrl: "https://api.together.ai/v1",
13343
13087
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13344
13088
  reasoning: true,
13345
13089
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13346
- input: ["text"],
13090
+ input: ["text", "image"],
13347
13091
  cost: {
13348
- input: 0.2,
13349
- output: 0.6,
13350
- cacheRead: 0,
13092
+ input: 0.3,
13093
+ output: 1.2,
13094
+ cacheRead: 0.06,
13351
13095
  cacheWrite: 0,
13352
13096
  },
13353
- contextWindow: 262144,
13354
- maxTokens: 262144,
13097
+ contextWindow: 524288,
13098
+ maxTokens: 250000,
13355
13099
  },
13356
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8": {
13357
- id: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
13358
- name: "Qwen3 Coder 480B A35B Instruct",
13100
+ "Qwen/Qwen2.5-7B-Instruct-Turbo": {
13101
+ id: "Qwen/Qwen2.5-7B-Instruct-Turbo",
13102
+ name: "Qwen 2.5 7B Instruct Turbo",
13359
13103
  api: "openai-completions",
13360
13104
  provider: "together",
13361
13105
  baseUrl: "https://api.together.ai/v1",
@@ -13363,27 +13107,26 @@ export const MODELS = {
13363
13107
  reasoning: false,
13364
13108
  input: ["text"],
13365
13109
  cost: {
13366
- input: 2,
13367
- output: 2,
13110
+ input: 0.3,
13111
+ output: 0.3,
13368
13112
  cacheRead: 0,
13369
13113
  cacheWrite: 0,
13370
13114
  },
13371
- contextWindow: 262144,
13372
- maxTokens: 262144,
13115
+ contextWindow: 32768,
13116
+ maxTokens: 32768,
13373
13117
  },
13374
- "Qwen/Qwen3-Coder-Next-FP8": {
13375
- id: "Qwen/Qwen3-Coder-Next-FP8",
13376
- name: "Qwen3 Coder Next FP8",
13118
+ "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
13119
+ id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
13120
+ name: "Qwen3 235B A22B Instruct 2507 FP8",
13377
13121
  api: "openai-completions",
13378
13122
  provider: "together",
13379
13123
  baseUrl: "https://api.together.ai/v1",
13380
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13381
- reasoning: true,
13382
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13124
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
13125
+ reasoning: false,
13383
13126
  input: ["text"],
13384
13127
  cost: {
13385
- input: 0.5,
13386
- output: 1.2,
13128
+ input: 0.2,
13129
+ output: 0.6,
13387
13130
  cacheRead: 0,
13388
13131
  cacheWrite: 0,
13389
13132
  },
@@ -13409,28 +13152,28 @@ export const MODELS = {
13409
13152
  contextWindow: 262144,
13410
13153
  maxTokens: 130000,
13411
13154
  },
13412
- "Qwen/Qwen3.6-Plus": {
13413
- id: "Qwen/Qwen3.6-Plus",
13414
- name: "Qwen3.6 Plus",
13155
+ "Qwen/Qwen3.5-9B": {
13156
+ id: "Qwen/Qwen3.5-9B",
13157
+ name: "Qwen3.5 9B",
13415
13158
  api: "openai-completions",
13416
13159
  provider: "together",
13417
13160
  baseUrl: "https://api.together.ai/v1",
13418
13161
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13419
13162
  reasoning: true,
13420
13163
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13421
- input: ["text"],
13164
+ input: ["text", "image"],
13422
13165
  cost: {
13423
- input: 0.5,
13424
- output: 3,
13166
+ input: 0.17,
13167
+ output: 0.25,
13425
13168
  cacheRead: 0,
13426
13169
  cacheWrite: 0,
13427
13170
  },
13428
- contextWindow: 1000000,
13429
- maxTokens: 500000,
13171
+ contextWindow: 262144,
13172
+ maxTokens: 65536,
13430
13173
  },
13431
- "Qwen/Qwen3.7-Max": {
13432
- id: "Qwen/Qwen3.7-Max",
13433
- name: "Qwen3.7 Max",
13174
+ "Qwen/Qwen3.6-Plus": {
13175
+ id: "Qwen/Qwen3.6-Plus",
13176
+ name: "Qwen3.6 Plus",
13434
13177
  api: "openai-completions",
13435
13178
  provider: "together",
13436
13179
  baseUrl: "https://api.together.ai/v1",
@@ -13439,51 +13182,31 @@ export const MODELS = {
13439
13182
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13440
13183
  input: ["text"],
13441
13184
  cost: {
13442
- input: 2.5,
13443
- output: 7.5,
13185
+ input: 0.5,
13186
+ output: 3,
13444
13187
  cacheRead: 0,
13445
13188
  cacheWrite: 0,
13446
13189
  },
13447
13190
  contextWindow: 1000000,
13448
13191
  maxTokens: 500000,
13449
13192
  },
13450
- "deepseek-ai/DeepSeek-V3": {
13451
- id: "deepseek-ai/DeepSeek-V3",
13452
- name: "DeepSeek-V3",
13453
- api: "openai-completions",
13454
- provider: "together",
13455
- baseUrl: "https://api.together.ai/v1",
13456
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13457
- reasoning: true,
13458
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13459
- input: ["text"],
13460
- cost: {
13461
- input: 1.25,
13462
- output: 1.25,
13463
- cacheRead: 0,
13464
- cacheWrite: 0,
13465
- },
13466
- contextWindow: 131072,
13467
- maxTokens: 131072,
13468
- },
13469
- "deepseek-ai/DeepSeek-V3-1": {
13470
- id: "deepseek-ai/DeepSeek-V3-1",
13471
- name: "DeepSeek V3.1",
13193
+ "Qwen/Qwen3.7-Max": {
13194
+ id: "Qwen/Qwen3.7-Max",
13195
+ name: "Qwen3.7 Max",
13472
13196
  api: "openai-completions",
13473
13197
  provider: "together",
13474
13198
  baseUrl: "https://api.together.ai/v1",
13475
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13476
- reasoning: true,
13477
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13199
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
13200
+ reasoning: false,
13478
13201
  input: ["text"],
13479
13202
  cost: {
13480
- input: 0.6,
13481
- output: 1.7,
13203
+ input: 2.5,
13204
+ output: 7.5,
13482
13205
  cacheRead: 0,
13483
13206
  cacheWrite: 0,
13484
13207
  },
13485
- contextWindow: 131072,
13486
- maxTokens: 131072,
13208
+ contextWindow: 1000000,
13209
+ maxTokens: 500000,
13487
13210
  },
13488
13211
  "deepseek-ai/DeepSeek-V4-Pro": {
13489
13212
  id: "deepseek-ai/DeepSeek-V4-Pro",
@@ -13496,8 +13219,8 @@ export const MODELS = {
13496
13219
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": null },
13497
13220
  input: ["text"],
13498
13221
  cost: {
13499
- input: 2.1,
13500
- output: 4.4,
13222
+ input: 1.74,
13223
+ output: 3.48,
13501
13224
  cacheRead: 0.2,
13502
13225
  cacheWrite: 0,
13503
13226
  },
@@ -13533,8 +13256,8 @@ export const MODELS = {
13533
13256
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13534
13257
  input: ["text", "image"],
13535
13258
  cost: {
13536
- input: 0.2,
13537
- output: 0.5,
13259
+ input: 0.39,
13260
+ output: 0.97,
13538
13261
  cacheRead: 0,
13539
13262
  cacheWrite: 0,
13540
13263
  },
@@ -13559,25 +13282,6 @@ export const MODELS = {
13559
13282
  contextWindow: 131072,
13560
13283
  maxTokens: 131072,
13561
13284
  },
13562
- "moonshotai/Kimi-K2.5": {
13563
- id: "moonshotai/Kimi-K2.5",
13564
- name: "Kimi K2.5",
13565
- api: "openai-completions",
13566
- provider: "together",
13567
- baseUrl: "https://api.together.ai/v1",
13568
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13569
- reasoning: true,
13570
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13571
- input: ["text", "image"],
13572
- cost: {
13573
- input: 0.5,
13574
- output: 2.8,
13575
- cacheRead: 0,
13576
- cacheWrite: 0,
13577
- },
13578
- contextWindow: 262144,
13579
- maxTokens: 262144,
13580
- },
13581
13285
  "moonshotai/Kimi-K2.6": {
13582
13286
  id: "moonshotai/Kimi-K2.6",
13583
13287
  name: "Kimi K2.6",
@@ -13635,6 +13339,44 @@ export const MODELS = {
13635
13339
  contextWindow: 131072,
13636
13340
  maxTokens: 131072,
13637
13341
  },
13342
+ "openai/gpt-oss-20b": {
13343
+ id: "openai/gpt-oss-20b",
13344
+ name: "GPT OSS 20B",
13345
+ api: "openai-completions",
13346
+ provider: "together",
13347
+ baseUrl: "https://api.together.ai/v1",
13348
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "openai" },
13349
+ reasoning: true,
13350
+ thinkingLevelMap: { "off": null, "minimal": null },
13351
+ input: ["text"],
13352
+ cost: {
13353
+ input: 0.05,
13354
+ output: 0.2,
13355
+ cacheRead: 0,
13356
+ cacheWrite: 0,
13357
+ },
13358
+ contextWindow: 131072,
13359
+ maxTokens: 131072,
13360
+ },
13361
+ "zai-org/GLM-5": {
13362
+ id: "zai-org/GLM-5",
13363
+ name: "GLM-5",
13364
+ api: "openai-completions",
13365
+ provider: "together",
13366
+ baseUrl: "https://api.together.ai/v1",
13367
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13368
+ reasoning: true,
13369
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13370
+ input: ["text"],
13371
+ cost: {
13372
+ input: 1,
13373
+ output: 3.2,
13374
+ cacheRead: 0,
13375
+ cacheWrite: 0,
13376
+ },
13377
+ contextWindow: 202752,
13378
+ maxTokens: 131072,
13379
+ },
13638
13380
  "zai-org/GLM-5.1": {
13639
13381
  id: "zai-org/GLM-5.1",
13640
13382
  name: "GLM-5.1",
@@ -13750,7 +13492,7 @@ export const MODELS = {
13750
13492
  reasoning: true,
13751
13493
  input: ["text", "image"],
13752
13494
  cost: {
13753
- input: 0.39999999999999997,
13495
+ input: 0.4,
13754
13496
  output: 4,
13755
13497
  cacheRead: 0,
13756
13498
  cacheWrite: 0,
@@ -13820,7 +13562,7 @@ export const MODELS = {
13820
13562
  cost: {
13821
13563
  input: 1,
13822
13564
  output: 5,
13823
- cacheRead: 0.19999999999999998,
13565
+ cacheRead: 0.2,
13824
13566
  cacheWrite: 0,
13825
13567
  },
13826
13568
  contextWindow: 1000000,
@@ -13920,7 +13662,7 @@ export const MODELS = {
13920
13662
  reasoning: true,
13921
13663
  input: ["text", "image"],
13922
13664
  cost: {
13923
- input: 0.39999999999999997,
13665
+ input: 0.4,
13924
13666
  output: 4,
13925
13667
  cacheRead: 0,
13926
13668
  cacheWrite: 0,
@@ -13937,8 +13679,8 @@ export const MODELS = {
13937
13679
  reasoning: true,
13938
13680
  input: ["text", "image"],
13939
13681
  cost: {
13940
- input: 0.09999999999999999,
13941
- output: 0.39999999999999997,
13682
+ input: 0.1,
13683
+ output: 0.4,
13942
13684
  cacheRead: 0.001,
13943
13685
  cacheWrite: 0.125,
13944
13686
  },
@@ -13954,7 +13696,7 @@ export const MODELS = {
13954
13696
  reasoning: true,
13955
13697
  input: ["text", "image"],
13956
13698
  cost: {
13957
- input: 0.39999999999999997,
13699
+ input: 0.4,
13958
13700
  output: 2.4,
13959
13701
  cacheRead: 0.04,
13960
13702
  cacheWrite: 0.5,
@@ -13972,7 +13714,7 @@ export const MODELS = {
13972
13714
  input: ["text", "image"],
13973
13715
  cost: {
13974
13716
  input: 0.6,
13975
- output: 3.5999999999999996,
13717
+ output: 3.6,
13976
13718
  cacheRead: 0,
13977
13719
  cacheWrite: 0,
13978
13720
  },
@@ -13990,7 +13732,7 @@ export const MODELS = {
13990
13732
  cost: {
13991
13733
  input: 0.5,
13992
13734
  output: 3,
13993
- cacheRead: 0.09999999999999999,
13735
+ cacheRead: 0.1,
13994
13736
  cacheWrite: 0.625,
13995
13737
  },
13996
13738
  contextWindow: 1000000,
@@ -14022,8 +13764,8 @@ export const MODELS = {
14022
13764
  reasoning: true,
14023
13765
  input: ["text", "image"],
14024
13766
  cost: {
14025
- input: 0.39999999999999997,
14026
- output: 1.5999999999999999,
13767
+ input: 0.4,
13768
+ output: 1.6,
14027
13769
  cacheRead: 0.08,
14028
13770
  cacheWrite: 0.5,
14029
13771
  },
@@ -14056,7 +13798,7 @@ export const MODELS = {
14056
13798
  reasoning: false,
14057
13799
  input: ["text", "image"],
14058
13800
  cost: {
14059
- input: 0.7999999999999999,
13801
+ input: 0.8,
14060
13802
  output: 4,
14061
13803
  cacheRead: 0.08,
14062
13804
  cacheWrite: 1,
@@ -14064,25 +13806,6 @@ export const MODELS = {
14064
13806
  contextWindow: 200000,
14065
13807
  maxTokens: 8192,
14066
13808
  },
14067
- "anthropic/claude-fable-5": {
14068
- id: "anthropic/claude-fable-5",
14069
- name: "Claude Fable 5",
14070
- api: "anthropic-messages",
14071
- provider: "vercel-ai-gateway",
14072
- baseUrl: "https://ai-gateway.vercel.sh",
14073
- compat: { "forceAdaptiveThinking": true },
14074
- reasoning: true,
14075
- thinkingLevelMap: { "xhigh": "xhigh" },
14076
- input: ["text", "image"],
14077
- cost: {
14078
- input: 10,
14079
- output: 50,
14080
- cacheRead: 1,
14081
- cacheWrite: 12.5,
14082
- },
14083
- contextWindow: 1000000,
14084
- maxTokens: 128000,
14085
- },
14086
13809
  "anthropic/claude-haiku-4.5": {
14087
13810
  id: "anthropic/claude-haiku-4.5",
14088
13811
  name: "Claude Haiku 4.5",
@@ -14094,7 +13817,7 @@ export const MODELS = {
14094
13817
  cost: {
14095
13818
  input: 1,
14096
13819
  output: 5,
14097
- cacheRead: 0.09999999999999999,
13820
+ cacheRead: 0.1,
14098
13821
  cacheWrite: 1.25,
14099
13822
  },
14100
13823
  contextWindow: 200000,
@@ -14287,7 +14010,7 @@ export const MODELS = {
14287
14010
  input: ["text"],
14288
14011
  cost: {
14289
14012
  input: 0.25,
14290
- output: 0.8999999999999999,
14013
+ output: 0.9,
14291
14014
  cacheRead: 0,
14292
14015
  cacheWrite: 0,
14293
14016
  },
@@ -14305,7 +14028,7 @@ export const MODELS = {
14305
14028
  cost: {
14306
14029
  input: 0.25,
14307
14030
  output: 2,
14308
- cacheRead: 0.049999999999999996,
14031
+ cacheRead: 0.05,
14309
14032
  cacheWrite: 0,
14310
14033
  },
14311
14034
  contextWindow: 256000,
@@ -14490,8 +14213,8 @@ export const MODELS = {
14490
14213
  reasoning: true,
14491
14214
  input: ["text", "image"],
14492
14215
  cost: {
14493
- input: 0.09999999999999999,
14494
- output: 0.39999999999999997,
14216
+ input: 0.1,
14217
+ output: 0.4,
14495
14218
  cacheRead: 0.01,
14496
14219
  cacheWrite: 0,
14497
14220
  },
@@ -14526,7 +14249,7 @@ export const MODELS = {
14526
14249
  cost: {
14527
14250
  input: 0.5,
14528
14251
  output: 3,
14529
- cacheRead: 0.049999999999999996,
14252
+ cacheRead: 0.05,
14530
14253
  cacheWrite: 0,
14531
14254
  },
14532
14255
  contextWindow: 1000000,
@@ -14543,7 +14266,7 @@ export const MODELS = {
14543
14266
  cost: {
14544
14267
  input: 2,
14545
14268
  output: 12,
14546
- cacheRead: 0.19999999999999998,
14269
+ cacheRead: 0.2,
14547
14270
  cacheWrite: 0,
14548
14271
  },
14549
14272
  contextWindow: 1000000,
@@ -14594,7 +14317,7 @@ export const MODELS = {
14594
14317
  cost: {
14595
14318
  input: 2,
14596
14319
  output: 12,
14597
- cacheRead: 0.19999999999999998,
14320
+ cacheRead: 0.2,
14598
14321
  cacheWrite: 0,
14599
14322
  },
14600
14323
  contextWindow: 1000000,
@@ -14644,7 +14367,7 @@ export const MODELS = {
14644
14367
  input: ["text", "image"],
14645
14368
  cost: {
14646
14369
  input: 0.14,
14647
- output: 0.39999999999999997,
14370
+ output: 0.4,
14648
14371
  cacheRead: 0,
14649
14372
  cacheWrite: 0,
14650
14373
  },
@@ -14662,7 +14385,7 @@ export const MODELS = {
14662
14385
  cost: {
14663
14386
  input: 0.25,
14664
14387
  output: 0.75,
14665
- cacheRead: 0.024999999999999998,
14388
+ cacheRead: 0.025,
14666
14389
  cacheWrite: 0,
14667
14390
  },
14668
14391
  contextWindow: 128000,
@@ -14814,7 +14537,7 @@ export const MODELS = {
14814
14537
  input: ["text", "image"],
14815
14538
  cost: {
14816
14539
  input: 0.24,
14817
- output: 0.9700000000000001,
14540
+ output: 0.97,
14818
14541
  cacheRead: 0,
14819
14542
  cacheWrite: 0,
14820
14543
  },
@@ -14830,7 +14553,7 @@ export const MODELS = {
14830
14553
  reasoning: false,
14831
14554
  input: ["text", "image"],
14832
14555
  cost: {
14833
- input: 0.16999999999999998,
14556
+ input: 0.17,
14834
14557
  output: 0.66,
14835
14558
  cacheRead: 0,
14836
14559
  cacheWrite: 0,
@@ -14984,7 +14707,7 @@ export const MODELS = {
14984
14707
  input: ["text"],
14985
14708
  cost: {
14986
14709
  input: 0.3,
14987
- output: 0.8999999999999999,
14710
+ output: 0.9,
14988
14711
  cacheRead: 0,
14989
14712
  cacheWrite: 0,
14990
14713
  },
@@ -15000,7 +14723,7 @@ export const MODELS = {
15000
14723
  reasoning: false,
15001
14724
  input: ["text"],
15002
14725
  cost: {
15003
- input: 0.39999999999999997,
14726
+ input: 0.4,
15004
14727
  output: 2,
15005
14728
  cacheRead: 0,
15006
14729
  cacheWrite: 0,
@@ -15017,7 +14740,7 @@ export const MODELS = {
15017
14740
  reasoning: false,
15018
14741
  input: ["text"],
15019
14742
  cost: {
15020
- input: 0.09999999999999999,
14743
+ input: 0.1,
15021
14744
  output: 0.3,
15022
14745
  cacheRead: 0,
15023
14746
  cacheWrite: 0,
@@ -15034,7 +14757,7 @@ export const MODELS = {
15034
14757
  reasoning: false,
15035
14758
  input: ["text"],
15036
14759
  cost: {
15037
- input: 0.09999999999999999,
14760
+ input: 0.1,
15038
14761
  output: 0.3,
15039
14762
  cacheRead: 0,
15040
14763
  cacheWrite: 0,
@@ -15051,8 +14774,8 @@ export const MODELS = {
15051
14774
  reasoning: false,
15052
14775
  input: ["text"],
15053
14776
  cost: {
15054
- input: 0.09999999999999999,
15055
- output: 0.09999999999999999,
14777
+ input: 0.1,
14778
+ output: 0.1,
15056
14779
  cacheRead: 0,
15057
14780
  cacheWrite: 0,
15058
14781
  },
@@ -15085,7 +14808,7 @@ export const MODELS = {
15085
14808
  reasoning: false,
15086
14809
  input: ["text", "image"],
15087
14810
  cost: {
15088
- input: 0.39999999999999997,
14811
+ input: 0.4,
15089
14812
  output: 2,
15090
14813
  cacheRead: 0,
15091
14814
  cacheWrite: 0,
@@ -15136,7 +14859,7 @@ export const MODELS = {
15136
14859
  reasoning: false,
15137
14860
  input: ["text", "image"],
15138
14861
  cost: {
15139
- input: 0.09999999999999999,
14862
+ input: 0.1,
15140
14863
  output: 0.3,
15141
14864
  cacheRead: 0,
15142
14865
  cacheWrite: 0,
@@ -15187,7 +14910,7 @@ export const MODELS = {
15187
14910
  reasoning: false,
15188
14911
  input: ["text"],
15189
14912
  cost: {
15190
- input: 0.5700000000000001,
14913
+ input: 0.57,
15191
14914
  output: 2.3,
15192
14915
  cacheRead: 0,
15193
14916
  cacheWrite: 0,
@@ -15212,40 +14935,6 @@ export const MODELS = {
15212
14935
  contextWindow: 262114,
15213
14936
  maxTokens: 262114,
15214
14937
  },
15215
- "moonshotai/kimi-k2-thinking-turbo": {
15216
- id: "moonshotai/kimi-k2-thinking-turbo",
15217
- name: "Kimi K2 Thinking Turbo",
15218
- api: "anthropic-messages",
15219
- provider: "vercel-ai-gateway",
15220
- baseUrl: "https://ai-gateway.vercel.sh",
15221
- reasoning: true,
15222
- input: ["text"],
15223
- cost: {
15224
- input: 1.15,
15225
- output: 8,
15226
- cacheRead: 0.15,
15227
- cacheWrite: 0,
15228
- },
15229
- contextWindow: 262114,
15230
- maxTokens: 262114,
15231
- },
15232
- "moonshotai/kimi-k2-turbo": {
15233
- id: "moonshotai/kimi-k2-turbo",
15234
- name: "Kimi K2 Turbo",
15235
- api: "anthropic-messages",
15236
- provider: "vercel-ai-gateway",
15237
- baseUrl: "https://ai-gateway.vercel.sh",
15238
- reasoning: false,
15239
- input: ["text"],
15240
- cost: {
15241
- input: 1.15,
15242
- output: 8,
15243
- cacheRead: 0.15,
15244
- cacheWrite: 0,
15245
- },
15246
- contextWindow: 256000,
15247
- maxTokens: 16384,
15248
- },
15249
14938
  "moonshotai/kimi-k2.5": {
15250
14939
  id: "moonshotai/kimi-k2.5",
15251
14940
  name: "Kimi K2.5",
@@ -15257,7 +14946,7 @@ export const MODELS = {
15257
14946
  cost: {
15258
14947
  input: 0.6,
15259
14948
  output: 3,
15260
- cacheRead: 0.09999999999999999,
14949
+ cacheRead: 0.1,
15261
14950
  cacheWrite: 0,
15262
14951
  },
15263
14952
  contextWindow: 262114,
@@ -15280,6 +14969,23 @@ export const MODELS = {
15280
14969
  contextWindow: 262000,
15281
14970
  maxTokens: 262000,
15282
14971
  },
14972
+ "moonshotai/kimi-k2.7-code": {
14973
+ id: "moonshotai/kimi-k2.7-code",
14974
+ name: "Kimi K2.7 Code",
14975
+ api: "anthropic-messages",
14976
+ provider: "vercel-ai-gateway",
14977
+ baseUrl: "https://ai-gateway.vercel.sh",
14978
+ reasoning: true,
14979
+ input: ["text", "image"],
14980
+ cost: {
14981
+ input: 0.95,
14982
+ output: 4,
14983
+ cacheRead: 0.19,
14984
+ cacheWrite: 0,
14985
+ },
14986
+ contextWindow: 256000,
14987
+ maxTokens: 32768,
14988
+ },
15283
14989
  "nvidia/nemotron-3-super-120b-a12b": {
15284
14990
  id: "nvidia/nemotron-3-super-120b-a12b",
15285
14991
  name: "NVIDIA Nemotron 3 Super 120B A12B",
@@ -15323,7 +15029,7 @@ export const MODELS = {
15323
15029
  reasoning: true,
15324
15030
  input: ["text", "image"],
15325
15031
  cost: {
15326
- input: 0.19999999999999998,
15032
+ input: 0.2,
15327
15033
  output: 0.6,
15328
15034
  cacheRead: 0,
15329
15035
  cacheWrite: 0,
@@ -15341,7 +15047,7 @@ export const MODELS = {
15341
15047
  input: ["text"],
15342
15048
  cost: {
15343
15049
  input: 0.06,
15344
- output: 0.22999999999999998,
15050
+ output: 0.23,
15345
15051
  cacheRead: 0,
15346
15052
  cacheWrite: 0,
15347
15053
  },
@@ -15391,9 +15097,9 @@ export const MODELS = {
15391
15097
  reasoning: false,
15392
15098
  input: ["text", "image"],
15393
15099
  cost: {
15394
- input: 0.39999999999999997,
15395
- output: 1.5999999999999999,
15396
- cacheRead: 0.09999999999999999,
15100
+ input: 0.4,
15101
+ output: 1.6,
15102
+ cacheRead: 0.1,
15397
15103
  cacheWrite: 0,
15398
15104
  },
15399
15105
  contextWindow: 1047576,
@@ -15408,9 +15114,9 @@ export const MODELS = {
15408
15114
  reasoning: false,
15409
15115
  input: ["text", "image"],
15410
15116
  cost: {
15411
- input: 0.09999999999999999,
15412
- output: 0.39999999999999997,
15413
- cacheRead: 0.024999999999999998,
15117
+ input: 0.1,
15118
+ output: 0.4,
15119
+ cacheRead: 0.025,
15414
15120
  cacheWrite: 0,
15415
15121
  },
15416
15122
  contextWindow: 1047576,
@@ -15512,7 +15218,7 @@ export const MODELS = {
15512
15218
  cost: {
15513
15219
  input: 0.25,
15514
15220
  output: 2,
15515
- cacheRead: 0.024999999999999998,
15221
+ cacheRead: 0.025,
15516
15222
  cacheWrite: 0,
15517
15223
  },
15518
15224
  contextWindow: 400000,
@@ -15527,8 +15233,8 @@ export const MODELS = {
15527
15233
  reasoning: true,
15528
15234
  input: ["text", "image"],
15529
15235
  cost: {
15530
- input: 0.049999999999999996,
15531
- output: 0.39999999999999997,
15236
+ input: 0.05,
15237
+ output: 0.4,
15532
15238
  cacheRead: 0.005,
15533
15239
  cacheWrite: 0,
15534
15240
  },
@@ -15597,7 +15303,7 @@ export const MODELS = {
15597
15303
  cost: {
15598
15304
  input: 0.25,
15599
15305
  output: 2,
15600
- cacheRead: 0.024999999999999998,
15306
+ cacheRead: 0.025,
15601
15307
  cacheWrite: 0,
15602
15308
  },
15603
15309
  contextWindow: 400000,
@@ -15791,7 +15497,7 @@ export const MODELS = {
15791
15497
  thinkingLevelMap: { "xhigh": "xhigh" },
15792
15498
  input: ["text", "image"],
15793
15499
  cost: {
15794
- input: 0.19999999999999998,
15500
+ input: 0.2,
15795
15501
  output: 1.25,
15796
15502
  cacheRead: 0.02,
15797
15503
  cacheWrite: 0,
@@ -15879,8 +15585,8 @@ export const MODELS = {
15879
15585
  reasoning: true,
15880
15586
  input: ["text"],
15881
15587
  cost: {
15882
- input: 0.049999999999999996,
15883
- output: 0.19999999999999998,
15588
+ input: 0.05,
15589
+ output: 0.2,
15884
15590
  cacheRead: 0,
15885
15591
  cacheWrite: 0,
15886
15592
  },
@@ -16066,7 +15772,7 @@ export const MODELS = {
16066
15772
  reasoning: true,
16067
15773
  input: ["text", "image"],
16068
15774
  cost: {
16069
- input: 0.19999999999999998,
15775
+ input: 0.2,
16070
15776
  output: 1.15,
16071
15777
  cacheRead: 0.04,
16072
15778
  cacheWrite: 0,
@@ -16083,9 +15789,9 @@ export const MODELS = {
16083
15789
  reasoning: false,
16084
15790
  input: ["text", "image"],
16085
15791
  cost: {
16086
- input: 0.19999999999999998,
15792
+ input: 0.2,
16087
15793
  output: 0.5,
16088
- cacheRead: 0.049999999999999996,
15794
+ cacheRead: 0.05,
16089
15795
  cacheWrite: 0,
16090
15796
  },
16091
15797
  contextWindow: 1000000,
@@ -16100,9 +15806,9 @@ export const MODELS = {
16100
15806
  reasoning: true,
16101
15807
  input: ["text", "image"],
16102
15808
  cost: {
16103
- input: 0.19999999999999998,
15809
+ input: 0.2,
16104
15810
  output: 0.5,
16105
- cacheRead: 0.049999999999999996,
15811
+ cacheRead: 0.05,
16106
15812
  cacheWrite: 0,
16107
15813
  },
16108
15814
  contextWindow: 1000000,
@@ -16119,7 +15825,7 @@ export const MODELS = {
16119
15825
  cost: {
16120
15826
  input: 1.25,
16121
15827
  output: 2.5,
16122
- cacheRead: 0.19999999999999998,
15828
+ cacheRead: 0.2,
16123
15829
  cacheWrite: 0,
16124
15830
  },
16125
15831
  contextWindow: 2000000,
@@ -16136,7 +15842,7 @@ export const MODELS = {
16136
15842
  cost: {
16137
15843
  input: 1.25,
16138
15844
  output: 2.5,
16139
- cacheRead: 0.19999999999999998,
15845
+ cacheRead: 0.2,
16140
15846
  cacheWrite: 0,
16141
15847
  },
16142
15848
  contextWindow: 2000000,
@@ -16153,7 +15859,7 @@ export const MODELS = {
16153
15859
  cost: {
16154
15860
  input: 1.25,
16155
15861
  output: 2.5,
16156
- cacheRead: 0.19999999999999998,
15862
+ cacheRead: 0.2,
16157
15863
  cacheWrite: 0,
16158
15864
  },
16159
15865
  contextWindow: 2000000,
@@ -16170,7 +15876,7 @@ export const MODELS = {
16170
15876
  cost: {
16171
15877
  input: 1.25,
16172
15878
  output: 2.5,
16173
- cacheRead: 0.19999999999999998,
15879
+ cacheRead: 0.2,
16174
15880
  cacheWrite: 0,
16175
15881
  },
16176
15882
  contextWindow: 2000000,
@@ -16187,7 +15893,7 @@ export const MODELS = {
16187
15893
  cost: {
16188
15894
  input: 1.25,
16189
15895
  output: 2.5,
16190
- cacheRead: 0.19999999999999998,
15896
+ cacheRead: 0.2,
16191
15897
  cacheWrite: 0,
16192
15898
  },
16193
15899
  contextWindow: 2000000,
@@ -16204,7 +15910,7 @@ export const MODELS = {
16204
15910
  cost: {
16205
15911
  input: 1.25,
16206
15912
  output: 2.5,
16207
- cacheRead: 0.19999999999999998,
15913
+ cacheRead: 0.2,
16208
15914
  cacheWrite: 0,
16209
15915
  },
16210
15916
  contextWindow: 2000000,
@@ -16221,7 +15927,7 @@ export const MODELS = {
16221
15927
  cost: {
16222
15928
  input: 1.25,
16223
15929
  output: 2.5,
16224
- cacheRead: 0.19999999999999998,
15930
+ cacheRead: 0.2,
16225
15931
  cacheWrite: 0,
16226
15932
  },
16227
15933
  contextWindow: 1000000,
@@ -16238,7 +15944,7 @@ export const MODELS = {
16238
15944
  cost: {
16239
15945
  input: 1,
16240
15946
  output: 2,
16241
- cacheRead: 0.19999999999999998,
15947
+ cacheRead: 0.2,
16242
15948
  cacheWrite: 0,
16243
15949
  },
16244
15950
  contextWindow: 256000,
@@ -16253,7 +15959,7 @@ export const MODELS = {
16253
15959
  reasoning: true,
16254
15960
  input: ["text"],
16255
15961
  cost: {
16256
- input: 0.09999999999999999,
15962
+ input: 0.1,
16257
15963
  output: 0.3,
16258
15964
  cacheRead: 0.01,
16259
15965
  cacheWrite: 0,
@@ -16272,7 +15978,7 @@ export const MODELS = {
16272
15978
  cost: {
16273
15979
  input: 1,
16274
15980
  output: 3,
16275
- cacheRead: 0.19999999999999998,
15981
+ cacheRead: 0.2,
16276
15982
  cacheWrite: 0,
16277
15983
  },
16278
15984
  contextWindow: 1000000,
@@ -16338,7 +16044,7 @@ export const MODELS = {
16338
16044
  reasoning: true,
16339
16045
  input: ["text"],
16340
16046
  cost: {
16341
- input: 0.19999999999999998,
16047
+ input: 0.2,
16342
16048
  output: 1.1,
16343
16049
  cacheRead: 0.03,
16344
16050
  cacheWrite: 0,
@@ -16356,7 +16062,7 @@ export const MODELS = {
16356
16062
  input: ["text", "image"],
16357
16063
  cost: {
16358
16064
  input: 0.6,
16359
- output: 1.7999999999999998,
16065
+ output: 1.8,
16360
16066
  cacheRead: 0.11,
16361
16067
  cacheWrite: 0,
16362
16068
  },
@@ -16390,8 +16096,8 @@ export const MODELS = {
16390
16096
  input: ["text", "image"],
16391
16097
  cost: {
16392
16098
  input: 0.3,
16393
- output: 0.8999999999999999,
16394
- cacheRead: 0.049999999999999996,
16099
+ output: 0.9,
16100
+ cacheRead: 0.05,
16395
16101
  cacheWrite: 0,
16396
16102
  },
16397
16103
  contextWindow: 128000,
@@ -16441,7 +16147,7 @@ export const MODELS = {
16441
16147
  input: ["text"],
16442
16148
  cost: {
16443
16149
  input: 0.07,
16444
- output: 0.39999999999999997,
16150
+ output: 0.4,
16445
16151
  cacheRead: 0,
16446
16152
  cacheWrite: 0,
16447
16153
  },
@@ -16458,7 +16164,7 @@ export const MODELS = {
16458
16164
  input: ["text"],
16459
16165
  cost: {
16460
16166
  input: 0.06,
16461
- output: 0.39999999999999997,
16167
+ output: 0.4,
16462
16168
  cacheRead: 0.01,
16463
16169
  cacheWrite: 0,
16464
16170
  },
@@ -16475,8 +16181,8 @@ export const MODELS = {
16475
16181
  input: ["text"],
16476
16182
  cost: {
16477
16183
  input: 1,
16478
- output: 3.1999999999999997,
16479
- cacheRead: 0.19999999999999998,
16184
+ output: 3.2,
16185
+ cacheRead: 0.2,
16480
16186
  cacheWrite: 0,
16481
16187
  },
16482
16188
  contextWindow: 202800,
@@ -16746,6 +16452,24 @@ export const MODELS = {
16746
16452
  contextWindow: 1048576,
16747
16453
  maxTokens: 131072,
16748
16454
  },
16455
+ "mimo-v2.5-pro-ultraspeed": {
16456
+ id: "mimo-v2.5-pro-ultraspeed",
16457
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16458
+ api: "openai-completions",
16459
+ provider: "xiaomi",
16460
+ baseUrl: "https://api.xiaomimimo.com/v1",
16461
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16462
+ reasoning: true,
16463
+ input: ["text"],
16464
+ cost: {
16465
+ input: 1.305,
16466
+ output: 2.61,
16467
+ cacheRead: 0.0108,
16468
+ cacheWrite: 0,
16469
+ },
16470
+ contextWindow: 1048576,
16471
+ maxTokens: 131072,
16472
+ },
16749
16473
  },
16750
16474
  "xiaomi-token-plan-ams": {
16751
16475
  "mimo-v2-omni": {
@@ -16820,6 +16544,24 @@ export const MODELS = {
16820
16544
  contextWindow: 1048576,
16821
16545
  maxTokens: 131072,
16822
16546
  },
16547
+ "mimo-v2.5-pro-ultraspeed": {
16548
+ id: "mimo-v2.5-pro-ultraspeed",
16549
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16550
+ api: "openai-completions",
16551
+ provider: "xiaomi-token-plan-ams",
16552
+ baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
16553
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16554
+ reasoning: true,
16555
+ input: ["text"],
16556
+ cost: {
16557
+ input: 1.305,
16558
+ output: 2.61,
16559
+ cacheRead: 0.0108,
16560
+ cacheWrite: 0,
16561
+ },
16562
+ contextWindow: 1048576,
16563
+ maxTokens: 131072,
16564
+ },
16823
16565
  },
16824
16566
  "xiaomi-token-plan-cn": {
16825
16567
  "mimo-v2-omni": {
@@ -16894,6 +16636,24 @@ export const MODELS = {
16894
16636
  contextWindow: 1048576,
16895
16637
  maxTokens: 131072,
16896
16638
  },
16639
+ "mimo-v2.5-pro-ultraspeed": {
16640
+ id: "mimo-v2.5-pro-ultraspeed",
16641
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16642
+ api: "openai-completions",
16643
+ provider: "xiaomi-token-plan-cn",
16644
+ baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
16645
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16646
+ reasoning: true,
16647
+ input: ["text"],
16648
+ cost: {
16649
+ input: 1.305,
16650
+ output: 2.61,
16651
+ cacheRead: 0.0108,
16652
+ cacheWrite: 0,
16653
+ },
16654
+ contextWindow: 1048576,
16655
+ maxTokens: 131072,
16656
+ },
16897
16657
  },
16898
16658
  "xiaomi-token-plan-sgp": {
16899
16659
  "mimo-v2-omni": {
@@ -16968,6 +16728,24 @@ export const MODELS = {
16968
16728
  contextWindow: 1048576,
16969
16729
  maxTokens: 131072,
16970
16730
  },
16731
+ "mimo-v2.5-pro-ultraspeed": {
16732
+ id: "mimo-v2.5-pro-ultraspeed",
16733
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16734
+ api: "openai-completions",
16735
+ provider: "xiaomi-token-plan-sgp",
16736
+ baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
16737
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16738
+ reasoning: true,
16739
+ input: ["text"],
16740
+ cost: {
16741
+ input: 1.305,
16742
+ output: 2.61,
16743
+ cacheRead: 0.0108,
16744
+ cacheWrite: 0,
16745
+ },
16746
+ contextWindow: 1048576,
16747
+ maxTokens: 131072,
16748
+ },
16971
16749
  },
16972
16750
  "zai": {
16973
16751
  "glm-4.5-air": {