@earendil-works/pi-ai 0.79.0 → 0.79.2

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (32)
  1. package/dist/image-models.generated.d.ts +2 -2
  2. package/dist/image-models.generated.d.ts.map +1 -1
  3. package/dist/image-models.generated.js +6 -6
  4. package/dist/image-models.generated.js.map +1 -1
  5. package/dist/models.generated.d.ts +602 -543
  6. package/dist/models.generated.d.ts.map +1 -1
  7. package/dist/models.generated.js +818 -826
  8. package/dist/models.generated.js.map +1 -1
  9. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  10. package/dist/providers/amazon-bedrock.js +25 -8
  11. package/dist/providers/amazon-bedrock.js.map +1 -1
  12. package/dist/providers/anthropic.d.ts +1 -1
  13. package/dist/providers/anthropic.d.ts.map +1 -1
  14. package/dist/providers/anthropic.js +19 -12
  15. package/dist/providers/anthropic.js.map +1 -1
  16. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  17. package/dist/providers/azure-openai-responses.js +1 -0
  18. package/dist/providers/azure-openai-responses.js.map +1 -1
  19. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  20. package/dist/providers/openai-codex-responses.js +3 -1
  21. package/dist/providers/openai-codex-responses.js.map +1 -1
  22. package/dist/providers/openai-completions.d.ts.map +1 -1
  23. package/dist/providers/openai-completions.js +2 -1
  24. package/dist/providers/openai-completions.js.map +1 -1
  25. package/dist/types.d.ts +1 -1
  26. package/dist/types.d.ts.map +1 -1
  27. package/dist/types.js.map +1 -1
  28. package/dist/utils/overflow.d.ts +1 -1
  29. package/dist/utils/overflow.d.ts.map +1 -1
  30. package/dist/utils/overflow.js +3 -2
  31. package/dist/utils/overflow.js.map +1 -1
  32. package/package.json +1 -1
@@ -8,7 +8,7 @@ export const MODELS = {
8
8
  api: "bedrock-converse-stream",
9
9
  provider: "amazon-bedrock",
10
10
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
11
- reasoning: false,
11
+ reasoning: true,
12
12
  input: ["text", "image"],
13
13
  cost: {
14
14
  input: 0.33,
@@ -347,6 +347,24 @@ export const MODELS = {
347
347
  contextWindow: 163840,
348
348
  maxTokens: 81920,
349
349
  },
350
+ "eu.anthropic.claude-fable-5": {
351
+ id: "eu.anthropic.claude-fable-5",
352
+ name: "Claude Fable 5 (EU)",
353
+ api: "bedrock-converse-stream",
354
+ provider: "amazon-bedrock",
355
+ baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
356
+ reasoning: true,
357
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
358
+ input: ["text", "image"],
359
+ cost: {
360
+ input: 11,
361
+ output: 55,
362
+ cacheRead: 1.1,
363
+ cacheWrite: 13.75,
364
+ },
365
+ contextWindow: 1000000,
366
+ maxTokens: 128000,
367
+ },
350
368
  "eu.anthropic.claude-haiku-4-5-20251001-v1:0": {
351
369
  id: "eu.anthropic.claude-haiku-4-5-20251001-v1:0",
352
370
  name: "Claude Haiku 4.5 (EU)",
@@ -469,6 +487,24 @@ export const MODELS = {
469
487
  contextWindow: 1000000,
470
488
  maxTokens: 64000,
471
489
  },
490
+ "global.anthropic.claude-fable-5": {
491
+ id: "global.anthropic.claude-fable-5",
492
+ name: "Claude Fable 5 (Global)",
493
+ api: "bedrock-converse-stream",
494
+ provider: "amazon-bedrock",
495
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
496
+ reasoning: true,
497
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
498
+ input: ["text", "image"],
499
+ cost: {
500
+ input: 10,
501
+ output: 50,
502
+ cacheRead: 1,
503
+ cacheWrite: 12.5,
504
+ },
505
+ contextWindow: 1000000,
506
+ maxTokens: 128000,
507
+ },
472
508
  "global.anthropic.claude-haiku-4-5-20251001-v1:0": {
473
509
  id: "global.anthropic.claude-haiku-4-5-20251001-v1:0",
474
510
  name: "Claude Haiku 4.5 (Global)",
@@ -1128,7 +1164,7 @@ export const MODELS = {
1128
1164
  api: "bedrock-converse-stream",
1129
1165
  provider: "amazon-bedrock",
1130
1166
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1131
- reasoning: false,
1167
+ reasoning: true,
1132
1168
  input: ["text"],
1133
1169
  cost: {
1134
1170
  input: 0.15,
@@ -1145,7 +1181,7 @@ export const MODELS = {
1145
1181
  api: "bedrock-converse-stream",
1146
1182
  provider: "amazon-bedrock",
1147
1183
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1148
- reasoning: false,
1184
+ reasoning: true,
1149
1185
  input: ["text"],
1150
1186
  cost: {
1151
1187
  input: 0.15,
@@ -1162,7 +1198,7 @@ export const MODELS = {
1162
1198
  api: "bedrock-converse-stream",
1163
1199
  provider: "amazon-bedrock",
1164
1200
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1165
- reasoning: false,
1201
+ reasoning: true,
1166
1202
  input: ["text"],
1167
1203
  cost: {
1168
1204
  input: 0.07,
@@ -1179,7 +1215,7 @@ export const MODELS = {
1179
1215
  api: "bedrock-converse-stream",
1180
1216
  provider: "amazon-bedrock",
1181
1217
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1182
- reasoning: false,
1218
+ reasoning: true,
1183
1219
  input: ["text"],
1184
1220
  cost: {
1185
1221
  input: 0.07,
@@ -1343,6 +1379,24 @@ export const MODELS = {
1343
1379
  contextWindow: 262000,
1344
1380
  maxTokens: 262000,
1345
1381
  },
1382
+ "us.anthropic.claude-fable-5": {
1383
+ id: "us.anthropic.claude-fable-5",
1384
+ name: "Claude Fable 5 (US)",
1385
+ api: "bedrock-converse-stream",
1386
+ provider: "amazon-bedrock",
1387
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1388
+ reasoning: true,
1389
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
1390
+ input: ["text", "image"],
1391
+ cost: {
1392
+ input: 10,
1393
+ output: 50,
1394
+ cacheRead: 1,
1395
+ cacheWrite: 12.5,
1396
+ },
1397
+ contextWindow: 1000000,
1398
+ maxTokens: 128000,
1399
+ },
1346
1400
  "us.anthropic.claude-haiku-4-5-20251001-v1:0": {
1347
1401
  id: "us.anthropic.claude-haiku-4-5-20251001-v1:0",
1348
1402
  name: "Claude Haiku 4.5 (US)",
@@ -1813,6 +1867,25 @@ export const MODELS = {
1813
1867
  contextWindow: 200000,
1814
1868
  maxTokens: 4096,
1815
1869
  },
1870
+ "claude-fable-5": {
1871
+ id: "claude-fable-5",
1872
+ name: "Claude Fable 5",
1873
+ api: "anthropic-messages",
1874
+ provider: "anthropic",
1875
+ baseUrl: "https://api.anthropic.com",
1876
+ compat: { "forceAdaptiveThinking": true },
1877
+ reasoning: true,
1878
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
1879
+ input: ["text", "image"],
1880
+ cost: {
1881
+ input: 10,
1882
+ output: 50,
1883
+ cacheRead: 1,
1884
+ cacheWrite: 12.5,
1885
+ },
1886
+ contextWindow: 1000000,
1887
+ maxTokens: 128000,
1888
+ },
1816
1889
  "claude-haiku-4-5": {
1817
1890
  id: "claude-haiku-4-5",
1818
1891
  name: "Claude Haiku 4.5 (latest)",
@@ -2370,7 +2443,7 @@ export const MODELS = {
2370
2443
  cacheWrite: 0,
2371
2444
  },
2372
2445
  contextWindow: 400000,
2373
- maxTokens: 272000,
2446
+ maxTokens: 128000,
2374
2447
  },
2375
2448
  "gpt-5.1": {
2376
2449
  id: "gpt-5.1",
@@ -2603,7 +2676,7 @@ export const MODELS = {
2603
2676
  cacheRead: 0.25,
2604
2677
  cacheWrite: 0,
2605
2678
  },
2606
- contextWindow: 272000,
2679
+ contextWindow: 1050000,
2607
2680
  maxTokens: 128000,
2608
2681
  },
2609
2682
  "gpt-5.4-mini": {
@@ -2675,7 +2748,7 @@ export const MODELS = {
2675
2748
  cacheRead: 0.5,
2676
2749
  cacheWrite: 0,
2677
2750
  },
2678
- contextWindow: 272000,
2751
+ contextWindow: 1050000,
2679
2752
  maxTokens: 128000,
2680
2753
  },
2681
2754
  "gpt-5.5-pro": {
@@ -2843,30 +2916,13 @@ export const MODELS = {
2843
2916
  reasoning: true,
2844
2917
  input: ["text"],
2845
2918
  cost: {
2846
- input: 0.25,
2847
- output: 0.69,
2919
+ input: 0.35,
2920
+ output: 0.75,
2848
2921
  cacheRead: 0,
2849
2922
  cacheWrite: 0,
2850
2923
  },
2851
2924
  contextWindow: 131072,
2852
- maxTokens: 32768,
2853
- },
2854
- "llama3.1-8b": {
2855
- id: "llama3.1-8b",
2856
- name: "Llama 3.1 8B",
2857
- api: "openai-completions",
2858
- provider: "cerebras",
2859
- baseUrl: "https://api.cerebras.ai/v1",
2860
- reasoning: false,
2861
- input: ["text"],
2862
- cost: {
2863
- input: 0.1,
2864
- output: 0.1,
2865
- cacheRead: 0,
2866
- cacheWrite: 0,
2867
- },
2868
- contextWindow: 32000,
2869
- maxTokens: 8000,
2925
+ maxTokens: 40960,
2870
2926
  },
2871
2927
  "zai-glm-4.7": {
2872
2928
  id: "zai-glm-4.7",
@@ -2874,7 +2930,7 @@ export const MODELS = {
2874
2930
  api: "openai-completions",
2875
2931
  provider: "cerebras",
2876
2932
  baseUrl: "https://api.cerebras.ai/v1",
2877
- reasoning: false,
2933
+ reasoning: true,
2878
2934
  input: ["text"],
2879
2935
  cost: {
2880
2936
  input: 2.25,
@@ -2883,7 +2939,7 @@ export const MODELS = {
2883
2939
  cacheWrite: 0,
2884
2940
  },
2885
2941
  contextWindow: 131072,
2886
- maxTokens: 40000,
2942
+ maxTokens: 40960,
2887
2943
  },
2888
2944
  },
2889
2945
  "cloudflare-ai-gateway": {
@@ -2989,6 +3045,25 @@ export const MODELS = {
2989
3045
  contextWindow: 200000,
2990
3046
  maxTokens: 8192,
2991
3047
  },
3048
+ "claude-fable-5": {
3049
+ id: "claude-fable-5",
3050
+ name: "Claude Fable 5",
3051
+ api: "anthropic-messages",
3052
+ provider: "cloudflare-ai-gateway",
3053
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3054
+ compat: { "forceAdaptiveThinking": true },
3055
+ reasoning: true,
3056
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
3057
+ input: ["text", "image"],
3058
+ cost: {
3059
+ input: 10,
3060
+ output: 50,
3061
+ cacheRead: 1,
3062
+ cacheWrite: 12.5,
3063
+ },
3064
+ contextWindow: 1000000,
3065
+ maxTokens: 128000,
3066
+ },
2992
3067
  "claude-haiku-4-5": {
2993
3068
  id: "claude-haiku-4-5",
2994
3069
  name: "Claude Haiku 4.5 (latest)",
@@ -3627,6 +3702,24 @@ export const MODELS = {
3627
3702
  contextWindow: 262144,
3628
3703
  maxTokens: 256000,
3629
3704
  },
3705
+ "@cf/moonshotai/kimi-k2.7-code": {
3706
+ id: "@cf/moonshotai/kimi-k2.7-code",
3707
+ name: "Kimi K2.7 Code",
3708
+ api: "openai-completions",
3709
+ provider: "cloudflare-workers-ai",
3710
+ baseUrl: "https://api.cloudflare.com/client/v4/accounts/{CLOUDFLARE_ACCOUNT_ID}/ai/v1",
3711
+ compat: { "sendSessionAffinityHeaders": true },
3712
+ reasoning: true,
3713
+ input: ["text", "image"],
3714
+ cost: {
3715
+ input: 0.95,
3716
+ output: 4,
3717
+ cacheRead: 0.19,
3718
+ cacheWrite: 0,
3719
+ },
3720
+ contextWindow: 262144,
3721
+ maxTokens: 262144,
3722
+ },
3630
3723
  "@cf/nvidia/nemotron-3-120b-a12b": {
3631
3724
  id: "@cf/nvidia/nemotron-3-120b-a12b",
3632
3725
  name: "Nemotron 3 Super 120B",
@@ -3995,6 +4088,25 @@ export const MODELS = {
3995
4088
  },
3996
4089
  },
3997
4090
  "github-copilot": {
4091
+ "claude-fable-5": {
4092
+ id: "claude-fable-5",
4093
+ name: "Claude Fable 5",
4094
+ api: "openai-completions",
4095
+ provider: "github-copilot",
4096
+ baseUrl: "https://api.individual.githubcopilot.com",
4097
+ headers: { "User-Agent": "GitHubCopilotChat/0.35.0", "Editor-Version": "vscode/1.107.0", "Editor-Plugin-Version": "copilot-chat/0.35.0", "Copilot-Integration-Id": "vscode-chat" },
4098
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false },
4099
+ reasoning: true,
4100
+ input: ["text", "image"],
4101
+ cost: {
4102
+ input: 10,
4103
+ output: 50,
4104
+ cacheRead: 1,
4105
+ cacheWrite: 12.5,
4106
+ },
4107
+ contextWindow: 1000000,
4108
+ maxTokens: 128000,
4109
+ },
3998
4110
  "claude-haiku-4.5": {
3999
4111
  id: "claude-haiku-4.5",
4000
4112
  name: "Claude Haiku 4.5 (latest)",
@@ -4927,336 +5039,149 @@ export const MODELS = {
4927
5039
  },
4928
5040
  },
4929
5041
  "groq": {
4930
- "deepseek-r1-distill-llama-70b": {
4931
- id: "deepseek-r1-distill-llama-70b",
4932
- name: "DeepSeek R1 Distill Llama 70B",
5042
+ "llama-3.1-8b-instant": {
5043
+ id: "llama-3.1-8b-instant",
5044
+ name: "Llama 3.1 8B",
4933
5045
  api: "openai-completions",
4934
5046
  provider: "groq",
4935
5047
  baseUrl: "https://api.groq.com/openai/v1",
4936
- reasoning: true,
5048
+ reasoning: false,
4937
5049
  input: ["text"],
4938
5050
  cost: {
4939
- input: 0.75,
4940
- output: 0.99,
5051
+ input: 0.05,
5052
+ output: 0.08,
4941
5053
  cacheRead: 0,
4942
5054
  cacheWrite: 0,
4943
5055
  },
4944
5056
  contextWindow: 131072,
4945
- maxTokens: 8192,
5057
+ maxTokens: 131072,
4946
5058
  },
4947
- "gemma2-9b-it": {
4948
- id: "gemma2-9b-it",
4949
- name: "Gemma 2 9B",
5059
+ "llama-3.3-70b-versatile": {
5060
+ id: "llama-3.3-70b-versatile",
5061
+ name: "Llama 3.3 70B",
4950
5062
  api: "openai-completions",
4951
5063
  provider: "groq",
4952
5064
  baseUrl: "https://api.groq.com/openai/v1",
4953
5065
  reasoning: false,
4954
5066
  input: ["text"],
4955
5067
  cost: {
4956
- input: 0.2,
4957
- output: 0.2,
5068
+ input: 0.59,
5069
+ output: 0.79,
4958
5070
  cacheRead: 0,
4959
5071
  cacheWrite: 0,
4960
5072
  },
4961
- contextWindow: 8192,
4962
- maxTokens: 8192,
5073
+ contextWindow: 131072,
5074
+ maxTokens: 32768,
4963
5075
  },
4964
- "groq/compound": {
4965
- id: "groq/compound",
4966
- name: "Compound",
5076
+ "meta-llama/llama-4-scout-17b-16e-instruct": {
5077
+ id: "meta-llama/llama-4-scout-17b-16e-instruct",
5078
+ name: "Llama 4 Scout 17B 16E",
4967
5079
  api: "openai-completions",
4968
5080
  provider: "groq",
4969
5081
  baseUrl: "https://api.groq.com/openai/v1",
4970
- reasoning: true,
4971
- input: ["text"],
5082
+ reasoning: false,
5083
+ input: ["text", "image"],
4972
5084
  cost: {
4973
- input: 0,
4974
- output: 0,
5085
+ input: 0.11,
5086
+ output: 0.34,
4975
5087
  cacheRead: 0,
4976
5088
  cacheWrite: 0,
4977
5089
  },
4978
5090
  contextWindow: 131072,
4979
5091
  maxTokens: 8192,
4980
5092
  },
4981
- "groq/compound-mini": {
4982
- id: "groq/compound-mini",
4983
- name: "Compound Mini",
5093
+ "openai/gpt-oss-120b": {
5094
+ id: "openai/gpt-oss-120b",
5095
+ name: "GPT OSS 120B",
4984
5096
  api: "openai-completions",
4985
5097
  provider: "groq",
4986
5098
  baseUrl: "https://api.groq.com/openai/v1",
4987
5099
  reasoning: true,
4988
5100
  input: ["text"],
4989
5101
  cost: {
4990
- input: 0,
4991
- output: 0,
4992
- cacheRead: 0,
5102
+ input: 0.15,
5103
+ output: 0.6,
5104
+ cacheRead: 0.075,
4993
5105
  cacheWrite: 0,
4994
5106
  },
4995
5107
  contextWindow: 131072,
4996
- maxTokens: 8192,
5108
+ maxTokens: 65536,
4997
5109
  },
4998
- "llama-3.1-8b-instant": {
4999
- id: "llama-3.1-8b-instant",
5000
- name: "Llama 3.1 8B Instant",
5110
+ "openai/gpt-oss-20b": {
5111
+ id: "openai/gpt-oss-20b",
5112
+ name: "GPT OSS 20B",
5001
5113
  api: "openai-completions",
5002
5114
  provider: "groq",
5003
5115
  baseUrl: "https://api.groq.com/openai/v1",
5004
- reasoning: false,
5116
+ reasoning: true,
5005
5117
  input: ["text"],
5006
5118
  cost: {
5007
- input: 0.05,
5008
- output: 0.08,
5009
- cacheRead: 0,
5119
+ input: 0.075,
5120
+ output: 0.3,
5121
+ cacheRead: 0.0375,
5010
5122
  cacheWrite: 0,
5011
5123
  },
5012
5124
  contextWindow: 131072,
5013
- maxTokens: 131072,
5125
+ maxTokens: 65536,
5014
5126
  },
5015
- "llama-3.3-70b-versatile": {
5016
- id: "llama-3.3-70b-versatile",
5017
- name: "Llama 3.3 70B Versatile",
5127
+ "openai/gpt-oss-safeguard-20b": {
5128
+ id: "openai/gpt-oss-safeguard-20b",
5129
+ name: "Safety GPT OSS 20B",
5018
5130
  api: "openai-completions",
5019
5131
  provider: "groq",
5020
5132
  baseUrl: "https://api.groq.com/openai/v1",
5021
- reasoning: false,
5133
+ reasoning: true,
5022
5134
  input: ["text"],
5023
5135
  cost: {
5024
- input: 0.59,
5025
- output: 0.79,
5026
- cacheRead: 0,
5136
+ input: 0.075,
5137
+ output: 0.3,
5138
+ cacheRead: 0.037,
5027
5139
  cacheWrite: 0,
5028
5140
  },
5029
5141
  contextWindow: 131072,
5030
- maxTokens: 32768,
5142
+ maxTokens: 65536,
5031
5143
  },
5032
- "llama3-70b-8192": {
5033
- id: "llama3-70b-8192",
5034
- name: "Llama 3 70B",
5144
+ "qwen/qwen3-32b": {
5145
+ id: "qwen/qwen3-32b",
5146
+ name: "Qwen3-32B",
5035
5147
  api: "openai-completions",
5036
5148
  provider: "groq",
5037
5149
  baseUrl: "https://api.groq.com/openai/v1",
5038
- reasoning: false,
5150
+ reasoning: true,
5151
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "default" },
5039
5152
  input: ["text"],
5040
5153
  cost: {
5041
- input: 0.59,
5042
- output: 0.79,
5154
+ input: 0.29,
5155
+ output: 0.59,
5043
5156
  cacheRead: 0,
5044
5157
  cacheWrite: 0,
5045
5158
  },
5046
- contextWindow: 8192,
5047
- maxTokens: 8192,
5159
+ contextWindow: 131072,
5160
+ maxTokens: 40960,
5048
5161
  },
5049
- "llama3-8b-8192": {
5050
- id: "llama3-8b-8192",
5051
- name: "Llama 3 8B",
5162
+ },
5163
+ "huggingface": {
5164
+ "MiniMaxAI/MiniMax-M2.1": {
5165
+ id: "MiniMaxAI/MiniMax-M2.1",
5166
+ name: "MiniMax-M2.1",
5052
5167
  api: "openai-completions",
5053
- provider: "groq",
5054
- baseUrl: "https://api.groq.com/openai/v1",
5055
- reasoning: false,
5168
+ provider: "huggingface",
5169
+ baseUrl: "https://router.huggingface.co/v1",
5170
+ compat: { "supportsDeveloperRole": false },
5171
+ reasoning: true,
5056
5172
  input: ["text"],
5057
5173
  cost: {
5058
- input: 0.05,
5059
- output: 0.08,
5174
+ input: 0.3,
5175
+ output: 1.2,
5060
5176
  cacheRead: 0,
5061
5177
  cacheWrite: 0,
5062
5178
  },
5063
- contextWindow: 8192,
5064
- maxTokens: 8192,
5179
+ contextWindow: 204800,
5180
+ maxTokens: 131072,
5065
5181
  },
5066
- "meta-llama/llama-4-maverick-17b-128e-instruct": {
5067
- id: "meta-llama/llama-4-maverick-17b-128e-instruct",
5068
- name: "Llama 4 Maverick 17B",
5069
- api: "openai-completions",
5070
- provider: "groq",
5071
- baseUrl: "https://api.groq.com/openai/v1",
5072
- reasoning: false,
5073
- input: ["text", "image"],
5074
- cost: {
5075
- input: 0.2,
5076
- output: 0.6,
5077
- cacheRead: 0,
5078
- cacheWrite: 0,
5079
- },
5080
- contextWindow: 131072,
5081
- maxTokens: 8192,
5082
- },
5083
- "meta-llama/llama-4-scout-17b-16e-instruct": {
5084
- id: "meta-llama/llama-4-scout-17b-16e-instruct",
5085
- name: "Llama 4 Scout 17B",
5086
- api: "openai-completions",
5087
- provider: "groq",
5088
- baseUrl: "https://api.groq.com/openai/v1",
5089
- reasoning: false,
5090
- input: ["text", "image"],
5091
- cost: {
5092
- input: 0.11,
5093
- output: 0.34,
5094
- cacheRead: 0,
5095
- cacheWrite: 0,
5096
- },
5097
- contextWindow: 131072,
5098
- maxTokens: 8192,
5099
- },
5100
- "mistral-saba-24b": {
5101
- id: "mistral-saba-24b",
5102
- name: "Mistral Saba 24B",
5103
- api: "openai-completions",
5104
- provider: "groq",
5105
- baseUrl: "https://api.groq.com/openai/v1",
5106
- reasoning: false,
5107
- input: ["text"],
5108
- cost: {
5109
- input: 0.79,
5110
- output: 0.79,
5111
- cacheRead: 0,
5112
- cacheWrite: 0,
5113
- },
5114
- contextWindow: 32768,
5115
- maxTokens: 32768,
5116
- },
5117
- "moonshotai/kimi-k2-instruct": {
5118
- id: "moonshotai/kimi-k2-instruct",
5119
- name: "Kimi K2 Instruct",
5120
- api: "openai-completions",
5121
- provider: "groq",
5122
- baseUrl: "https://api.groq.com/openai/v1",
5123
- reasoning: false,
5124
- input: ["text"],
5125
- cost: {
5126
- input: 1,
5127
- output: 3,
5128
- cacheRead: 0,
5129
- cacheWrite: 0,
5130
- },
5131
- contextWindow: 131072,
5132
- maxTokens: 16384,
5133
- },
5134
- "moonshotai/kimi-k2-instruct-0905": {
5135
- id: "moonshotai/kimi-k2-instruct-0905",
5136
- name: "Kimi K2 Instruct 0905",
5137
- api: "openai-completions",
5138
- provider: "groq",
5139
- baseUrl: "https://api.groq.com/openai/v1",
5140
- reasoning: false,
5141
- input: ["text"],
5142
- cost: {
5143
- input: 1,
5144
- output: 3,
5145
- cacheRead: 0.5,
5146
- cacheWrite: 0,
5147
- },
5148
- contextWindow: 262144,
5149
- maxTokens: 16384,
5150
- },
5151
- "openai/gpt-oss-120b": {
5152
- id: "openai/gpt-oss-120b",
5153
- name: "GPT OSS 120B",
5154
- api: "openai-completions",
5155
- provider: "groq",
5156
- baseUrl: "https://api.groq.com/openai/v1",
5157
- reasoning: true,
5158
- input: ["text"],
5159
- cost: {
5160
- input: 0.15,
5161
- output: 0.6,
5162
- cacheRead: 0.075,
5163
- cacheWrite: 0,
5164
- },
5165
- contextWindow: 131072,
5166
- maxTokens: 65536,
5167
- },
5168
- "openai/gpt-oss-20b": {
5169
- id: "openai/gpt-oss-20b",
5170
- name: "GPT OSS 20B",
5171
- api: "openai-completions",
5172
- provider: "groq",
5173
- baseUrl: "https://api.groq.com/openai/v1",
5174
- reasoning: true,
5175
- input: ["text"],
5176
- cost: {
5177
- input: 0.075,
5178
- output: 0.3,
5179
- cacheRead: 0.0375,
5180
- cacheWrite: 0,
5181
- },
5182
- contextWindow: 131072,
5183
- maxTokens: 65536,
5184
- },
5185
- "openai/gpt-oss-safeguard-20b": {
5186
- id: "openai/gpt-oss-safeguard-20b",
5187
- name: "Safety GPT OSS 20B",
5188
- api: "openai-completions",
5189
- provider: "groq",
5190
- baseUrl: "https://api.groq.com/openai/v1",
5191
- reasoning: true,
5192
- input: ["text"],
5193
- cost: {
5194
- input: 0.075,
5195
- output: 0.3,
5196
- cacheRead: 0.037,
5197
- cacheWrite: 0,
5198
- },
5199
- contextWindow: 131072,
5200
- maxTokens: 65536,
5201
- },
5202
- "qwen-qwq-32b": {
5203
- id: "qwen-qwq-32b",
5204
- name: "Qwen QwQ 32B",
5205
- api: "openai-completions",
5206
- provider: "groq",
5207
- baseUrl: "https://api.groq.com/openai/v1",
5208
- reasoning: true,
5209
- input: ["text"],
5210
- cost: {
5211
- input: 0.29,
5212
- output: 0.39,
5213
- cacheRead: 0,
5214
- cacheWrite: 0,
5215
- },
5216
- contextWindow: 131072,
5217
- maxTokens: 16384,
5218
- },
5219
- "qwen/qwen3-32b": {
5220
- id: "qwen/qwen3-32b",
5221
- name: "Qwen3 32B",
5222
- api: "openai-completions",
5223
- provider: "groq",
5224
- baseUrl: "https://api.groq.com/openai/v1",
5225
- reasoning: true,
5226
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "default" },
5227
- input: ["text"],
5228
- cost: {
5229
- input: 0.29,
5230
- output: 0.59,
5231
- cacheRead: 0,
5232
- cacheWrite: 0,
5233
- },
5234
- contextWindow: 131072,
5235
- maxTokens: 40960,
5236
- },
5237
- },
5238
- "huggingface": {
5239
- "MiniMaxAI/MiniMax-M2.1": {
5240
- id: "MiniMaxAI/MiniMax-M2.1",
5241
- name: "MiniMax-M2.1",
5242
- api: "openai-completions",
5243
- provider: "huggingface",
5244
- baseUrl: "https://router.huggingface.co/v1",
5245
- compat: { "supportsDeveloperRole": false },
5246
- reasoning: true,
5247
- input: ["text"],
5248
- cost: {
5249
- input: 0.3,
5250
- output: 1.2,
5251
- cacheRead: 0,
5252
- cacheWrite: 0,
5253
- },
5254
- contextWindow: 204800,
5255
- maxTokens: 131072,
5256
- },
5257
- "MiniMaxAI/MiniMax-M2.5": {
5258
- id: "MiniMaxAI/MiniMax-M2.5",
5259
- name: "MiniMax-M2.5",
5182
+ "MiniMaxAI/MiniMax-M2.5": {
5183
+ id: "MiniMaxAI/MiniMax-M2.5",
5184
+ name: "MiniMax-M2.5",
5260
5185
  api: "openai-completions",
5261
5186
  provider: "huggingface",
5262
5187
  baseUrl: "https://router.huggingface.co/v1",
@@ -5634,6 +5559,24 @@ export const MODELS = {
5634
5559
  },
5635
5560
  },
5636
5561
  "kimi-coding": {
5562
+ "k2p7": {
5563
+ id: "k2p7",
5564
+ name: "Kimi K2.7 Code",
5565
+ api: "anthropic-messages",
5566
+ provider: "kimi-coding",
5567
+ baseUrl: "https://api.kimi.com/coding",
5568
+ headers: { "User-Agent": "KimiCLI/1.5" },
5569
+ reasoning: true,
5570
+ input: ["text", "image"],
5571
+ cost: {
5572
+ input: 0,
5573
+ output: 0,
5574
+ cacheRead: 0,
5575
+ cacheWrite: 0,
5576
+ },
5577
+ contextWindow: 262144,
5578
+ maxTokens: 32768,
5579
+ },
5637
5580
  "kimi-for-coding": {
5638
5581
  id: "kimi-for-coding",
5639
5582
  name: "Kimi For Coding",
@@ -6296,7 +6239,7 @@ export const MODELS = {
6296
6239
  api: "openai-completions",
6297
6240
  provider: "moonshotai",
6298
6241
  baseUrl: "https://api.moonshot.ai/v1",
6299
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6242
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6300
6243
  reasoning: false,
6301
6244
  input: ["text"],
6302
6245
  cost: {
@@ -6314,7 +6257,7 @@ export const MODELS = {
6314
6257
  api: "openai-completions",
6315
6258
  provider: "moonshotai",
6316
6259
  baseUrl: "https://api.moonshot.ai/v1",
6317
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6260
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6318
6261
  reasoning: false,
6319
6262
  input: ["text"],
6320
6263
  cost: {
@@ -6332,7 +6275,7 @@ export const MODELS = {
6332
6275
  api: "openai-completions",
6333
6276
  provider: "moonshotai",
6334
6277
  baseUrl: "https://api.moonshot.ai/v1",
6335
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6278
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6336
6279
  reasoning: true,
6337
6280
  input: ["text"],
6338
6281
  cost: {
@@ -6350,7 +6293,7 @@ export const MODELS = {
6350
6293
  api: "openai-completions",
6351
6294
  provider: "moonshotai",
6352
6295
  baseUrl: "https://api.moonshot.ai/v1",
6353
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6296
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6354
6297
  reasoning: true,
6355
6298
  input: ["text"],
6356
6299
  cost: {
@@ -6368,7 +6311,7 @@ export const MODELS = {
6368
6311
  api: "openai-completions",
6369
6312
  provider: "moonshotai",
6370
6313
  baseUrl: "https://api.moonshot.ai/v1",
6371
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6314
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6372
6315
  reasoning: false,
6373
6316
  input: ["text"],
6374
6317
  cost: {
@@ -6386,7 +6329,7 @@ export const MODELS = {
6386
6329
  api: "openai-completions",
6387
6330
  provider: "moonshotai",
6388
6331
  baseUrl: "https://api.moonshot.ai/v1",
6389
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6332
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6390
6333
  reasoning: true,
6391
6334
  input: ["text", "image"],
6392
6335
  cost: {
@@ -6404,7 +6347,7 @@ export const MODELS = {
6404
6347
  api: "openai-completions",
6405
6348
  provider: "moonshotai",
6406
6349
  baseUrl: "https://api.moonshot.ai/v1",
6407
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6350
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6408
6351
  reasoning: true,
6409
6352
  input: ["text", "image"],
6410
6353
  cost: {
@@ -6416,6 +6359,24 @@ export const MODELS = {
6416
6359
  contextWindow: 262144,
6417
6360
  maxTokens: 262144,
6418
6361
  },
6362
+ "kimi-k2.7-code": {
6363
+ id: "kimi-k2.7-code",
6364
+ name: "Kimi K2.7 Code",
6365
+ api: "openai-completions",
6366
+ provider: "moonshotai",
6367
+ baseUrl: "https://api.moonshot.ai/v1",
6368
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6369
+ reasoning: true,
6370
+ input: ["text", "image"],
6371
+ cost: {
6372
+ input: 0.95,
6373
+ output: 4,
6374
+ cacheRead: 0.19,
6375
+ cacheWrite: 0,
6376
+ },
6377
+ contextWindow: 262144,
6378
+ maxTokens: 262144,
6379
+ },
6419
6380
  },
6420
6381
  "moonshotai-cn": {
6421
6382
  "kimi-k2-0711-preview": {
@@ -6424,7 +6385,7 @@ export const MODELS = {
6424
6385
  api: "openai-completions",
6425
6386
  provider: "moonshotai-cn",
6426
6387
  baseUrl: "https://api.moonshot.cn/v1",
6427
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6388
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6428
6389
  reasoning: false,
6429
6390
  input: ["text"],
6430
6391
  cost: {
@@ -6442,7 +6403,7 @@ export const MODELS = {
6442
6403
  api: "openai-completions",
6443
6404
  provider: "moonshotai-cn",
6444
6405
  baseUrl: "https://api.moonshot.cn/v1",
6445
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6406
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6446
6407
  reasoning: false,
6447
6408
  input: ["text"],
6448
6409
  cost: {
@@ -6460,7 +6421,7 @@ export const MODELS = {
6460
6421
  api: "openai-completions",
6461
6422
  provider: "moonshotai-cn",
6462
6423
  baseUrl: "https://api.moonshot.cn/v1",
6463
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6424
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6464
6425
  reasoning: true,
6465
6426
  input: ["text"],
6466
6427
  cost: {
@@ -6478,7 +6439,7 @@ export const MODELS = {
6478
6439
  api: "openai-completions",
6479
6440
  provider: "moonshotai-cn",
6480
6441
  baseUrl: "https://api.moonshot.cn/v1",
6481
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6442
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6482
6443
  reasoning: true,
6483
6444
  input: ["text"],
6484
6445
  cost: {
@@ -6496,7 +6457,7 @@ export const MODELS = {
6496
6457
  api: "openai-completions",
6497
6458
  provider: "moonshotai-cn",
6498
6459
  baseUrl: "https://api.moonshot.cn/v1",
6499
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6460
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6500
6461
  reasoning: false,
6501
6462
  input: ["text"],
6502
6463
  cost: {
@@ -6514,7 +6475,7 @@ export const MODELS = {
6514
6475
  api: "openai-completions",
6515
6476
  provider: "moonshotai-cn",
6516
6477
  baseUrl: "https://api.moonshot.cn/v1",
6517
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6478
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6518
6479
  reasoning: true,
6519
6480
  input: ["text", "image"],
6520
6481
  cost: {
@@ -6532,7 +6493,7 @@ export const MODELS = {
6532
6493
  api: "openai-completions",
6533
6494
  provider: "moonshotai-cn",
6534
6495
  baseUrl: "https://api.moonshot.cn/v1",
6535
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6496
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6536
6497
  reasoning: true,
6537
6498
  input: ["text", "image"],
6538
6499
  cost: {
@@ -6668,8 +6629,8 @@ export const MODELS = {
6668
6629
  baseUrl: "https://integrate.api.nvidia.com/v1",
6669
6630
  headers: { "NVCF-POLL-SECONDS": "3600" },
6670
6631
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6671
- reasoning: false,
6672
- input: ["text"],
6632
+ reasoning: true,
6633
+ input: ["text", "image"],
6673
6634
  cost: {
6674
6635
  input: 0,
6675
6636
  output: 0,
@@ -6698,44 +6659,6 @@ export const MODELS = {
6698
6659
  contextWindow: 262144,
6699
6660
  maxTokens: 262144,
6700
6661
  },
6701
- "nvidia/llama-3.3-nemotron-super-49b-v1": {
6702
- id: "nvidia/llama-3.3-nemotron-super-49b-v1",
6703
- name: "Llama 3.3 Nemotron Super 49B v1",
6704
- api: "openai-completions",
6705
- provider: "nvidia",
6706
- baseUrl: "https://integrate.api.nvidia.com/v1",
6707
- headers: { "NVCF-POLL-SECONDS": "3600" },
6708
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6709
- reasoning: true,
6710
- input: ["text"],
6711
- cost: {
6712
- input: 0,
6713
- output: 0,
6714
- cacheRead: 0,
6715
- cacheWrite: 0,
6716
- },
6717
- contextWindow: 131072,
6718
- maxTokens: 131072,
6719
- },
6720
- "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
6721
- id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
6722
- name: "Llama 3.3 Nemotron Super 49B v1.5",
6723
- api: "openai-completions",
6724
- provider: "nvidia",
6725
- baseUrl: "https://integrate.api.nvidia.com/v1",
6726
- headers: { "NVCF-POLL-SECONDS": "3600" },
6727
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6728
- reasoning: true,
6729
- input: ["text"],
6730
- cost: {
6731
- input: 0,
6732
- output: 0,
6733
- cacheRead: 0,
6734
- cacheWrite: 0,
6735
- },
6736
- contextWindow: 131072,
6737
- maxTokens: 131072,
6738
- },
6739
6662
  "nvidia/nemotron-3-nano-30b-a3b": {
6740
6663
  id: "nvidia/nemotron-3-nano-30b-a3b",
6741
6664
  name: "nemotron-3-nano-30b-a3b",
@@ -6831,9 +6754,9 @@ export const MODELS = {
6831
6754
  contextWindow: 131072,
6832
6755
  maxTokens: 131072,
6833
6756
  },
6834
- "openai/gpt-oss-20b": {
6835
- id: "openai/gpt-oss-20b",
6836
- name: "GPT OSS 20B",
6757
+ "openai/gpt-oss-120b": {
6758
+ id: "openai/gpt-oss-120b",
6759
+ name: "GPT-OSS-120B",
6837
6760
  api: "openai-completions",
6838
6761
  provider: "nvidia",
6839
6762
  baseUrl: "https://integrate.api.nvidia.com/v1",
@@ -6847,18 +6770,18 @@ export const MODELS = {
6847
6770
  cacheRead: 0,
6848
6771
  cacheWrite: 0,
6849
6772
  },
6850
- contextWindow: 131072,
6851
- maxTokens: 32768,
6773
+ contextWindow: 128000,
6774
+ maxTokens: 8192,
6852
6775
  },
6853
- "qwen/qwen3-coder-480b-a35b-instruct": {
6854
- id: "qwen/qwen3-coder-480b-a35b-instruct",
6855
- name: "Qwen3 Coder 480B A35B Instruct",
6776
+ "openai/gpt-oss-20b": {
6777
+ id: "openai/gpt-oss-20b",
6778
+ name: "GPT OSS 20B",
6856
6779
  api: "openai-completions",
6857
6780
  provider: "nvidia",
6858
6781
  baseUrl: "https://integrate.api.nvidia.com/v1",
6859
6782
  headers: { "NVCF-POLL-SECONDS": "3600" },
6860
6783
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6861
- reasoning: false,
6784
+ reasoning: true,
6862
6785
  input: ["text"],
6863
6786
  cost: {
6864
6787
  input: 0,
@@ -6866,8 +6789,8 @@ export const MODELS = {
6866
6789
  cacheRead: 0,
6867
6790
  cacheWrite: 0,
6868
6791
  },
6869
- contextWindow: 262144,
6870
- maxTokens: 66536,
6792
+ contextWindow: 131072,
6793
+ maxTokens: 32768,
6871
6794
  },
6872
6795
  "qwen/qwen3.5-122b-a10b": {
6873
6796
  id: "qwen/qwen3.5-122b-a10b",
@@ -7223,7 +7146,7 @@ export const MODELS = {
7223
7146
  cacheWrite: 0,
7224
7147
  },
7225
7148
  contextWindow: 400000,
7226
- maxTokens: 272000,
7149
+ maxTokens: 128000,
7227
7150
  },
7228
7151
  "gpt-5.1": {
7229
7152
  id: "gpt-5.1",
@@ -7456,7 +7379,7 @@ export const MODELS = {
7456
7379
  cacheRead: 0.25,
7457
7380
  cacheWrite: 0,
7458
7381
  },
7459
- contextWindow: 272000,
7382
+ contextWindow: 1050000,
7460
7383
  maxTokens: 128000,
7461
7384
  },
7462
7385
  "gpt-5.4-mini": {
@@ -7528,7 +7451,7 @@ export const MODELS = {
7528
7451
  cacheRead: 0.5,
7529
7452
  cacheWrite: 0,
7530
7453
  },
7531
- contextWindow: 272000,
7454
+ contextWindow: 1050000,
7532
7455
  maxTokens: 128000,
7533
7456
  },
7534
7457
  "gpt-5.5-pro": {
@@ -7720,7 +7643,7 @@ export const MODELS = {
7720
7643
  cacheRead: 0.25,
7721
7644
  cacheWrite: 0,
7722
7645
  },
7723
- contextWindow: 272000,
7646
+ contextWindow: 1000000,
7724
7647
  maxTokens: 128000,
7725
7648
  },
7726
7649
  "gpt-5.4-mini": {
@@ -7738,7 +7661,7 @@ export const MODELS = {
7738
7661
  cacheRead: 0.075,
7739
7662
  cacheWrite: 0,
7740
7663
  },
7741
- contextWindow: 272000,
7664
+ contextWindow: 400000,
7742
7665
  maxTokens: 128000,
7743
7666
  },
7744
7667
  "gpt-5.5": {
@@ -7756,7 +7679,7 @@ export const MODELS = {
7756
7679
  cacheRead: 0.5,
7757
7680
  cacheWrite: 0,
7758
7681
  },
7759
- contextWindow: 272000,
7682
+ contextWindow: 400000,
7760
7683
  maxTokens: 128000,
7761
7684
  },
7762
7685
  },
@@ -7767,6 +7690,7 @@ export const MODELS = {
7767
7690
  api: "openai-completions",
7768
7691
  provider: "opencode",
7769
7692
  baseUrl: "https://opencode.ai/zen/v1",
7693
+ compat: { "maxTokensField": "max_tokens" },
7770
7694
  reasoning: true,
7771
7695
  input: ["text"],
7772
7696
  cost: {
@@ -7778,6 +7702,25 @@ export const MODELS = {
7778
7702
  contextWindow: 200000,
7779
7703
  maxTokens: 32000,
7780
7704
  },
7705
+ "claude-fable-5": {
7706
+ id: "claude-fable-5",
7707
+ name: "Claude Fable 5",
7708
+ api: "anthropic-messages",
7709
+ provider: "opencode",
7710
+ baseUrl: "https://opencode.ai/zen",
7711
+ compat: { "forceAdaptiveThinking": true },
7712
+ reasoning: true,
7713
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
7714
+ input: ["text", "image"],
7715
+ cost: {
7716
+ input: 10,
7717
+ output: 50,
7718
+ cacheRead: 1,
7719
+ cacheWrite: 12.5,
7720
+ },
7721
+ contextWindow: 1000000,
7722
+ maxTokens: 128000,
7723
+ },
7781
7724
  "claude-haiku-4-5": {
7782
7725
  id: "claude-haiku-4-5",
7783
7726
  name: "Claude Haiku 4.5",
@@ -7944,14 +7887,14 @@ export const MODELS = {
7944
7887
  api: "openai-completions",
7945
7888
  provider: "opencode",
7946
7889
  baseUrl: "https://opencode.ai/zen/v1",
7947
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7890
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7948
7891
  reasoning: true,
7949
7892
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7950
7893
  input: ["text"],
7951
7894
  cost: {
7952
7895
  input: 0.14,
7953
7896
  output: 0.28,
7954
- cacheRead: 0.03,
7897
+ cacheRead: 0.028,
7955
7898
  cacheWrite: 0,
7956
7899
  },
7957
7900
  contextWindow: 1000000,
@@ -7963,7 +7906,7 @@ export const MODELS = {
7963
7906
  api: "openai-completions",
7964
7907
  provider: "opencode",
7965
7908
  baseUrl: "https://opencode.ai/zen/v1",
7966
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7909
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7967
7910
  reasoning: true,
7968
7911
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7969
7912
  input: ["text"],
@@ -7976,6 +7919,25 @@ export const MODELS = {
7976
7919
  contextWindow: 200000,
7977
7920
  maxTokens: 128000,
7978
7921
  },
7922
+ "deepseek-v4-pro": {
7923
+ id: "deepseek-v4-pro",
7924
+ name: "DeepSeek V4 Pro",
7925
+ api: "openai-completions",
7926
+ provider: "opencode",
7927
+ baseUrl: "https://opencode.ai/zen/v1",
7928
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7929
+ reasoning: true,
7930
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7931
+ input: ["text"],
7932
+ cost: {
7933
+ input: 1.74,
7934
+ output: 3.84,
7935
+ cacheRead: 0.145,
7936
+ cacheWrite: 0,
7937
+ },
7938
+ contextWindow: 1000000,
7939
+ maxTokens: 384000,
7940
+ },
7979
7941
  "gemini-3-flash": {
7980
7942
  id: "gemini-3-flash",
7981
7943
  name: "Gemini 3 Flash",
@@ -8036,6 +7998,7 @@ export const MODELS = {
8036
7998
  api: "openai-completions",
8037
7999
  provider: "opencode",
8038
8000
  baseUrl: "https://opencode.ai/zen/v1",
8001
+ compat: { "maxTokensField": "max_tokens" },
8039
8002
  reasoning: true,
8040
8003
  input: ["text"],
8041
8004
  cost: {
@@ -8053,6 +8016,7 @@ export const MODELS = {
8053
8016
  api: "openai-completions",
8054
8017
  provider: "opencode",
8055
8018
  baseUrl: "https://opencode.ai/zen/v1",
8019
+ compat: { "maxTokensField": "max_tokens" },
8056
8020
  reasoning: true,
8057
8021
  input: ["text"],
8058
8022
  cost: {
@@ -8358,7 +8322,7 @@ export const MODELS = {
8358
8322
  api: "openai-completions",
8359
8323
  provider: "opencode",
8360
8324
  baseUrl: "https://opencode.ai/zen/v1",
8361
- compat: { "supportsReasoningEffort": false },
8325
+ compat: { "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8362
8326
  reasoning: true,
8363
8327
  thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
8364
8328
  input: ["text", "image"],
@@ -8377,6 +8341,7 @@ export const MODELS = {
8377
8341
  api: "openai-completions",
8378
8342
  provider: "opencode",
8379
8343
  baseUrl: "https://opencode.ai/zen/v1",
8344
+ compat: { "maxTokensField": "max_tokens" },
8380
8345
  reasoning: true,
8381
8346
  input: ["text", "image"],
8382
8347
  cost: {
@@ -8394,7 +8359,7 @@ export const MODELS = {
8394
8359
  api: "openai-completions",
8395
8360
  provider: "opencode",
8396
8361
  baseUrl: "https://opencode.ai/zen/v1",
8397
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
8362
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8398
8363
  reasoning: true,
8399
8364
  input: ["text", "image"],
8400
8365
  cost: {
@@ -8412,6 +8377,7 @@ export const MODELS = {
8412
8377
  api: "openai-completions",
8413
8378
  provider: "opencode",
8414
8379
  baseUrl: "https://opencode.ai/zen/v1",
8380
+ compat: { "maxTokensField": "max_tokens" },
8415
8381
  reasoning: true,
8416
8382
  input: ["text", "image"],
8417
8383
  cost: {
@@ -8429,6 +8395,7 @@ export const MODELS = {
8429
8395
  api: "openai-completions",
8430
8396
  provider: "opencode",
8431
8397
  baseUrl: "https://opencode.ai/zen/v1",
8398
+ compat: { "maxTokensField": "max_tokens" },
8432
8399
  reasoning: true,
8433
8400
  input: ["text"],
8434
8401
  cost: {
@@ -8446,6 +8413,7 @@ export const MODELS = {
8446
8413
  api: "openai-completions",
8447
8414
  provider: "opencode",
8448
8415
  baseUrl: "https://opencode.ai/zen/v1",
8416
+ compat: { "maxTokensField": "max_tokens" },
8449
8417
  reasoning: true,
8450
8418
  input: ["text"],
8451
8419
  cost: {
@@ -8463,6 +8431,7 @@ export const MODELS = {
8463
8431
  api: "openai-completions",
8464
8432
  provider: "opencode",
8465
8433
  baseUrl: "https://opencode.ai/zen/v1",
8434
+ compat: { "maxTokensField": "max_tokens" },
8466
8435
  reasoning: true,
8467
8436
  input: ["text"],
8468
8437
  cost: {
@@ -8474,6 +8443,24 @@ export const MODELS = {
8474
8443
  contextWindow: 1000000,
8475
8444
  maxTokens: 128000,
8476
8445
  },
8446
+ "north-mini-code-free": {
8447
+ id: "north-mini-code-free",
8448
+ name: "North Mini Code Free",
8449
+ api: "openai-completions",
8450
+ provider: "opencode",
8451
+ baseUrl: "https://opencode.ai/zen/v1",
8452
+ compat: { "maxTokensField": "max_tokens" },
8453
+ reasoning: true,
8454
+ input: ["text"],
8455
+ cost: {
8456
+ input: 0,
8457
+ output: 0,
8458
+ cacheRead: 0,
8459
+ cacheWrite: 0,
8460
+ },
8461
+ contextWindow: 256000,
8462
+ maxTokens: 64000,
8463
+ },
8477
8464
  "qwen3.5-plus": {
8478
8465
  id: "qwen3.5-plus",
8479
8466
  name: "Qwen3.5 Plus",
@@ -8516,7 +8503,7 @@ export const MODELS = {
8516
8503
  api: "openai-completions",
8517
8504
  provider: "opencode-go",
8518
8505
  baseUrl: "https://opencode.ai/zen/go/v1",
8519
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8506
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8520
8507
  reasoning: true,
8521
8508
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8522
8509
  input: ["text"],
@@ -8535,7 +8522,7 @@ export const MODELS = {
8535
8522
  api: "openai-completions",
8536
8523
  provider: "opencode-go",
8537
8524
  baseUrl: "https://opencode.ai/zen/go/v1",
8538
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8525
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8539
8526
  reasoning: true,
8540
8527
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8541
8528
  input: ["text"],
@@ -8554,6 +8541,7 @@ export const MODELS = {
8554
8541
  api: "openai-completions",
8555
8542
  provider: "opencode-go",
8556
8543
  baseUrl: "https://opencode.ai/zen/go/v1",
8544
+ compat: { "maxTokensField": "max_tokens" },
8557
8545
  reasoning: true,
8558
8546
  input: ["text"],
8559
8547
  cost: {
@@ -8571,6 +8559,7 @@ export const MODELS = {
8571
8559
  api: "openai-completions",
8572
8560
  provider: "opencode-go",
8573
8561
  baseUrl: "https://opencode.ai/zen/go/v1",
8562
+ compat: { "maxTokensField": "max_tokens" },
8574
8563
  reasoning: true,
8575
8564
  input: ["text"],
8576
8565
  cost: {
@@ -8582,41 +8571,42 @@ export const MODELS = {
8582
8571
  contextWindow: 202752,
8583
8572
  maxTokens: 32768,
8584
8573
  },
8585
- "kimi-k2.5": {
8586
- id: "kimi-k2.5",
8587
- name: "Kimi K2.5",
8574
+ "kimi-k2.6": {
8575
+ id: "kimi-k2.6",
8576
+ name: "Kimi K2.6",
8588
8577
  api: "openai-completions",
8589
8578
  provider: "opencode-go",
8590
8579
  baseUrl: "https://opencode.ai/zen/go/v1",
8580
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8591
8581
  reasoning: true,
8582
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
8592
8583
  input: ["text", "image"],
8593
8584
  cost: {
8594
- input: 0.6,
8595
- output: 3,
8596
- cacheRead: 0.1,
8585
+ input: 0.95,
8586
+ output: 4,
8587
+ cacheRead: 0.16,
8597
8588
  cacheWrite: 0,
8598
8589
  },
8599
8590
  contextWindow: 262144,
8600
8591
  maxTokens: 65536,
8601
8592
  },
8602
- "kimi-k2.6": {
8603
- id: "kimi-k2.6",
8604
- name: "Kimi K2.6",
8593
+ "kimi-k2.7-code": {
8594
+ id: "kimi-k2.7-code",
8595
+ name: "Kimi K2.7 Code",
8605
8596
  api: "openai-completions",
8606
8597
  provider: "opencode-go",
8607
8598
  baseUrl: "https://opencode.ai/zen/go/v1",
8608
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
8599
+ compat: { "maxTokensField": "max_tokens" },
8609
8600
  reasoning: true,
8610
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
8611
8601
  input: ["text", "image"],
8612
8602
  cost: {
8613
8603
  input: 0.95,
8614
8604
  output: 4,
8615
- cacheRead: 0.16,
8605
+ cacheRead: 0.19,
8616
8606
  cacheWrite: 0,
8617
8607
  },
8618
8608
  contextWindow: 262144,
8619
- maxTokens: 65536,
8609
+ maxTokens: 262144,
8620
8610
  },
8621
8611
  "mimo-v2.5": {
8622
8612
  id: "mimo-v2.5",
@@ -8624,6 +8614,7 @@ export const MODELS = {
8624
8614
  api: "openai-completions",
8625
8615
  provider: "opencode-go",
8626
8616
  baseUrl: "https://opencode.ai/zen/go/v1",
8617
+ compat: { "maxTokensField": "max_tokens" },
8627
8618
  reasoning: true,
8628
8619
  input: ["text", "image"],
8629
8620
  cost: {
@@ -8641,6 +8632,7 @@ export const MODELS = {
8641
8632
  api: "openai-completions",
8642
8633
  provider: "opencode-go",
8643
8634
  baseUrl: "https://opencode.ai/zen/go/v1",
8635
+ compat: { "maxTokensField": "max_tokens" },
8644
8636
  reasoning: true,
8645
8637
  input: ["text"],
8646
8638
  cost: {
@@ -8652,29 +8644,13 @@ export const MODELS = {
8652
8644
  contextWindow: 1048576,
8653
8645
  maxTokens: 128000,
8654
8646
  },
8655
- "minimax-m2.5": {
8656
- id: "minimax-m2.5",
8657
- name: "MiniMax M2.5",
8658
- api: "anthropic-messages",
8659
- provider: "opencode-go",
8660
- baseUrl: "https://opencode.ai/zen/go",
8661
- reasoning: true,
8662
- input: ["text"],
8663
- cost: {
8664
- input: 0.3,
8665
- output: 1.2,
8666
- cacheRead: 0.03,
8667
- cacheWrite: 0,
8668
- },
8669
- contextWindow: 204800,
8670
- maxTokens: 65536,
8671
- },
8672
8647
  "minimax-m2.7": {
8673
8648
  id: "minimax-m2.7",
8674
8649
  name: "MiniMax M2.7",
8675
8650
  api: "openai-completions",
8676
8651
  provider: "opencode-go",
8677
8652
  baseUrl: "https://opencode.ai/zen/go/v1",
8653
+ compat: { "maxTokensField": "max_tokens" },
8678
8654
  reasoning: true,
8679
8655
  input: ["text"],
8680
8656
  cost: {
@@ -8688,16 +8664,16 @@ export const MODELS = {
8688
8664
  },
8689
8665
  "minimax-m3": {
8690
8666
  id: "minimax-m3",
8691
- name: "MiniMax M3",
8667
+ name: "MiniMax M3 (3x usage)",
8692
8668
  api: "anthropic-messages",
8693
8669
  provider: "opencode-go",
8694
8670
  baseUrl: "https://opencode.ai/zen/go",
8695
8671
  reasoning: true,
8696
8672
  input: ["text", "image"],
8697
8673
  cost: {
8698
- input: 0.3,
8699
- output: 1.2,
8700
- cacheRead: 0.06,
8674
+ input: 0.1,
8675
+ output: 0.4,
8676
+ cacheRead: 0.02,
8701
8677
  cacheWrite: 0,
8702
8678
  },
8703
8679
  contextWindow: 512000,
@@ -8709,7 +8685,7 @@ export const MODELS = {
8709
8685
  api: "openai-completions",
8710
8686
  provider: "opencode-go",
8711
8687
  baseUrl: "https://opencode.ai/zen/go/v1",
8712
- compat: { "thinkingFormat": "qwen" },
8688
+ compat: { "thinkingFormat": "qwen", "maxTokensField": "max_tokens" },
8713
8689
  reasoning: true,
8714
8690
  input: ["text", "image"],
8715
8691
  cost: {
@@ -8851,8 +8827,8 @@ export const MODELS = {
8851
8827
  reasoning: false,
8852
8828
  input: ["text", "image"],
8853
8829
  cost: {
8854
- input: 0.7999999999999999,
8855
- output: 3.1999999999999997,
8830
+ input: 0.8,
8831
+ output: 3.2,
8856
8832
  cacheRead: 0,
8857
8833
  cacheWrite: 0,
8858
8834
  },
@@ -8885,7 +8861,7 @@ export const MODELS = {
8885
8861
  reasoning: false,
8886
8862
  input: ["text", "image"],
8887
8863
  cost: {
8888
- input: 0.7999999999999999,
8864
+ input: 0.8,
8889
8865
  output: 4,
8890
8866
  cacheRead: 0.08,
8891
8867
  cacheWrite: 1,
@@ -8893,6 +8869,23 @@ export const MODELS = {
8893
8869
  contextWindow: 200000,
8894
8870
  maxTokens: 8192,
8895
8871
  },
8872
+ "anthropic/claude-fable-5": {
8873
+ id: "anthropic/claude-fable-5",
8874
+ name: "Anthropic: Claude Fable 5",
8875
+ api: "openai-completions",
8876
+ provider: "openrouter",
8877
+ baseUrl: "https://openrouter.ai/api/v1",
8878
+ reasoning: true,
8879
+ input: ["text", "image"],
8880
+ cost: {
8881
+ input: 10,
8882
+ output: 50,
8883
+ cacheRead: 1,
8884
+ cacheWrite: 12.5,
8885
+ },
8886
+ contextWindow: 1000000,
8887
+ maxTokens: 128000,
8888
+ },
8896
8889
  "anthropic/claude-haiku-4.5": {
8897
8890
  id: "anthropic/claude-haiku-4.5",
8898
8891
  name: "Anthropic: Claude Haiku 4.5",
@@ -8904,7 +8897,7 @@ export const MODELS = {
8904
8897
  cost: {
8905
8898
  input: 1,
8906
8899
  output: 5,
8907
- cacheRead: 0.09999999999999999,
8900
+ cacheRead: 0.1,
8908
8901
  cacheWrite: 1.25,
8909
8902
  },
8910
8903
  contextWindow: 200000,
@@ -9248,8 +9241,8 @@ export const MODELS = {
9248
9241
  reasoning: true,
9249
9242
  input: ["text", "image"],
9250
9243
  cost: {
9251
- input: 0.09999999999999999,
9252
- output: 0.39999999999999997,
9244
+ input: 0.1,
9245
+ output: 0.4,
9253
9246
  cacheRead: 0,
9254
9247
  cacheWrite: 0,
9255
9248
  },
@@ -9299,8 +9292,8 @@ export const MODELS = {
9299
9292
  reasoning: false,
9300
9293
  input: ["text"],
9301
9294
  cost: {
9302
- input: 0.20020000000000002,
9303
- output: 0.8000999999999999,
9295
+ input: 0.2002,
9296
+ output: 0.8001,
9304
9297
  cacheRead: 0,
9305
9298
  cacheWrite: 0,
9306
9299
  },
@@ -9316,7 +9309,7 @@ export const MODELS = {
9316
9309
  reasoning: false,
9317
9310
  input: ["text"],
9318
9311
  cost: {
9319
- input: 0.19999999999999998,
9312
+ input: 0.2,
9320
9313
  output: 0.77,
9321
9314
  cacheRead: 0.135,
9322
9315
  cacheWrite: 0,
@@ -9334,7 +9327,7 @@ export const MODELS = {
9334
9327
  input: ["text"],
9335
9328
  cost: {
9336
9329
  input: 0.21,
9337
- output: 0.7899999999999999,
9330
+ output: 0.79,
9338
9331
  cacheRead: 0.13,
9339
9332
  cacheWrite: 0,
9340
9333
  },
@@ -9368,7 +9361,7 @@ export const MODELS = {
9368
9361
  input: ["text"],
9369
9362
  cost: {
9370
9363
  input: 0.5,
9371
- output: 2.1500000000000004,
9364
+ output: 2.15,
9372
9365
  cacheRead: 0.35,
9373
9366
  cacheWrite: 0,
9374
9367
  },
@@ -9437,13 +9430,13 @@ export const MODELS = {
9437
9430
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "xhigh" },
9438
9431
  input: ["text"],
9439
9432
  cost: {
9440
- input: 0.0983,
9441
- output: 0.1966,
9442
- cacheRead: 0.019700000000000002,
9433
+ input: 0.098,
9434
+ output: 0.196,
9435
+ cacheRead: 0.02,
9443
9436
  cacheWrite: 0,
9444
9437
  },
9445
9438
  contextWindow: 1048576,
9446
- maxTokens: 131072,
9439
+ maxTokens: 4096,
9447
9440
  },
9448
9441
  "deepseek/deepseek-v4-pro": {
9449
9442
  id: "deepseek/deepseek-v4-pro",
@@ -9493,7 +9486,7 @@ export const MODELS = {
9493
9486
  input: 0.3,
9494
9487
  output: 2.5,
9495
9488
  cacheRead: 0.03,
9496
- cacheWrite: 0.08333333333333334,
9489
+ cacheWrite: 0.083333,
9497
9490
  },
9498
9491
  contextWindow: 1048576,
9499
9492
  maxTokens: 65535,
@@ -9507,10 +9500,10 @@ export const MODELS = {
9507
9500
  reasoning: true,
9508
9501
  input: ["text", "image"],
9509
9502
  cost: {
9510
- input: 0.09999999999999999,
9511
- output: 0.39999999999999997,
9503
+ input: 0.1,
9504
+ output: 0.4,
9512
9505
  cacheRead: 0.01,
9513
- cacheWrite: 0.08333333333333334,
9506
+ cacheWrite: 0.083333,
9514
9507
  },
9515
9508
  contextWindow: 1048576,
9516
9509
  maxTokens: 65535,
@@ -9524,10 +9517,10 @@ export const MODELS = {
9524
9517
  reasoning: true,
9525
9518
  input: ["text", "image"],
9526
9519
  cost: {
9527
- input: 0.09999999999999999,
9528
- output: 0.39999999999999997,
9520
+ input: 0.1,
9521
+ output: 0.4,
9529
9522
  cacheRead: 0.01,
9530
- cacheWrite: 0.08333333333333334,
9523
+ cacheWrite: 0.083333,
9531
9524
  },
9532
9525
  contextWindow: 1048576,
9533
9526
  maxTokens: 65535,
@@ -9594,8 +9587,8 @@ export const MODELS = {
9594
9587
  cost: {
9595
9588
  input: 0.5,
9596
9589
  output: 3,
9597
- cacheRead: 0.049999999999999996,
9598
- cacheWrite: 0.08333333333333334,
9590
+ cacheRead: 0.05,
9591
+ cacheWrite: 0.083333,
9599
9592
  },
9600
9593
  contextWindow: 1048576,
9601
9594
  maxTokens: 65536,
@@ -9611,8 +9604,8 @@ export const MODELS = {
9611
9604
  cost: {
9612
9605
  input: 0.25,
9613
9606
  output: 1.5,
9614
- cacheRead: 0.024999999999999998,
9615
- cacheWrite: 0.08333333333333334,
9607
+ cacheRead: 0.025,
9608
+ cacheWrite: 0.083333,
9616
9609
  },
9617
9610
  contextWindow: 1048576,
9618
9611
  maxTokens: 65536,
@@ -9628,8 +9621,8 @@ export const MODELS = {
9628
9621
  cost: {
9629
9622
  input: 0.25,
9630
9623
  output: 1.5,
9631
- cacheRead: 0.024999999999999998,
9632
- cacheWrite: 0.08333333333333334,
9624
+ cacheRead: 0.025,
9625
+ cacheWrite: 0.083333,
9633
9626
  },
9634
9627
  contextWindow: 1048576,
9635
9628
  maxTokens: 65536,
@@ -9645,7 +9638,7 @@ export const MODELS = {
9645
9638
  cost: {
9646
9639
  input: 2,
9647
9640
  output: 12,
9648
- cacheRead: 0.19999999999999998,
9641
+ cacheRead: 0.2,
9649
9642
  cacheWrite: 0.375,
9650
9643
  },
9651
9644
  contextWindow: 1048576,
@@ -9662,7 +9655,7 @@ export const MODELS = {
9662
9655
  cost: {
9663
9656
  input: 2,
9664
9657
  output: 12,
9665
- cacheRead: 0.19999999999999998,
9658
+ cacheRead: 0.2,
9666
9659
  cacheWrite: 0.375,
9667
9660
  },
9668
9661
  contextWindow: 1048756,
@@ -9680,7 +9673,7 @@ export const MODELS = {
9680
9673
  input: 1.5,
9681
9674
  output: 9,
9682
9675
  cacheRead: 0.15,
9683
- cacheWrite: 0.08333333333333334,
9676
+ cacheWrite: 0.083333,
9684
9677
  },
9685
9678
  contextWindow: 1048576,
9686
9679
  maxTokens: 65536,
@@ -9694,7 +9687,7 @@ export const MODELS = {
9694
9687
  reasoning: false,
9695
9688
  input: ["text", "image"],
9696
9689
  cost: {
9697
- input: 0.049999999999999996,
9690
+ input: 0.05,
9698
9691
  output: 0.15,
9699
9692
  cacheRead: 0,
9700
9693
  cacheWrite: 0,
@@ -9763,12 +9756,12 @@ export const MODELS = {
9763
9756
  input: ["text", "image"],
9764
9757
  cost: {
9765
9758
  input: 0.12,
9766
- output: 0.36,
9759
+ output: 0.35,
9767
9760
  cacheRead: 0.09,
9768
9761
  cacheWrite: 0,
9769
9762
  },
9770
9763
  contextWindow: 262144,
9771
- maxTokens: 8192,
9764
+ maxTokens: 262144,
9772
9765
  },
9773
9766
  "google/gemma-4-31b-it:free": {
9774
9767
  id: "google/gemma-4-31b-it:free",
@@ -9796,9 +9789,9 @@ export const MODELS = {
9796
9789
  reasoning: false,
9797
9790
  input: ["text"],
9798
9791
  cost: {
9799
- input: 0.049999999999999996,
9800
- output: 0.09999999999999999,
9801
- cacheRead: 0.049999999999999996,
9792
+ input: 0.05,
9793
+ output: 0.1,
9794
+ cacheRead: 0.05,
9802
9795
  cacheWrite: 0,
9803
9796
  },
9804
9797
  contextWindow: 131072,
@@ -9816,7 +9809,7 @@ export const MODELS = {
9816
9809
  cost: {
9817
9810
  input: 0.25,
9818
9811
  output: 0.75,
9819
- cacheRead: 0.024999999999999998,
9812
+ cacheRead: 0.025,
9820
9813
  cacheWrite: 0,
9821
9814
  },
9822
9815
  contextWindow: 128000,
@@ -9899,8 +9892,8 @@ export const MODELS = {
9899
9892
  reasoning: false,
9900
9893
  input: ["text"],
9901
9894
  cost: {
9902
- input: 0.39999999999999997,
9903
- output: 0.39999999999999997,
9895
+ input: 0.4,
9896
+ output: 0.4,
9904
9897
  cacheRead: 0,
9905
9898
  cacheWrite: 0,
9906
9899
  },
@@ -9933,7 +9926,7 @@ export const MODELS = {
9933
9926
  reasoning: false,
9934
9927
  input: ["text"],
9935
9928
  cost: {
9936
- input: 0.09999999999999999,
9929
+ input: 0.1,
9937
9930
  output: 0.32,
9938
9931
  cacheRead: 0,
9939
9932
  cacheWrite: 0,
@@ -9984,7 +9977,7 @@ export const MODELS = {
9984
9977
  reasoning: false,
9985
9978
  input: ["text", "image"],
9986
9979
  cost: {
9987
- input: 0.09999999999999999,
9980
+ input: 0.1,
9988
9981
  output: 0.3,
9989
9982
  cacheRead: 0,
9990
9983
  cacheWrite: 0,
@@ -10001,7 +9994,7 @@ export const MODELS = {
10001
9994
  reasoning: true,
10002
9995
  input: ["text"],
10003
9996
  cost: {
10004
- input: 0.39999999999999997,
9997
+ input: 0.4,
10005
9998
  output: 2.2,
10006
9999
  cacheRead: 0,
10007
10000
  cacheWrite: 0,
@@ -10053,8 +10046,8 @@ export const MODELS = {
10053
10046
  input: ["text"],
10054
10047
  cost: {
10055
10048
  input: 0.15,
10056
- output: 1.15,
10057
- cacheRead: 0,
10049
+ output: 0.9,
10050
+ cacheRead: 0.05,
10058
10051
  cacheWrite: 0,
10059
10052
  },
10060
10053
  contextWindow: 204800,
@@ -10069,13 +10062,13 @@ export const MODELS = {
10069
10062
  reasoning: true,
10070
10063
  input: ["text"],
10071
10064
  cost: {
10072
- input: 0.27899999999999997,
10073
- output: 1.2,
10074
- cacheRead: 0,
10065
+ input: 0.25,
10066
+ output: 1,
10067
+ cacheRead: 0.05,
10075
10068
  cacheWrite: 0,
10076
10069
  },
10077
10070
  contextWindow: 204800,
10078
- maxTokens: 196608,
10071
+ maxTokens: 131072,
10079
10072
  },
10080
10073
  "minimax/minimax-m3": {
10081
10074
  id: "minimax/minimax-m3",
@@ -10104,7 +10097,7 @@ export const MODELS = {
10104
10097
  input: ["text"],
10105
10098
  cost: {
10106
10099
  input: 0.3,
10107
- output: 0.8999999999999999,
10100
+ output: 0.9,
10108
10101
  cacheRead: 0.03,
10109
10102
  cacheWrite: 0,
10110
10103
  },
@@ -10120,7 +10113,7 @@ export const MODELS = {
10120
10113
  reasoning: false,
10121
10114
  input: ["text"],
10122
10115
  cost: {
10123
- input: 0.39999999999999997,
10116
+ input: 0.4,
10124
10117
  output: 2,
10125
10118
  cacheRead: 0.04,
10126
10119
  cacheWrite: 0,
@@ -10137,8 +10130,8 @@ export const MODELS = {
10137
10130
  reasoning: false,
10138
10131
  input: ["text", "image"],
10139
10132
  cost: {
10140
- input: 0.19999999999999998,
10141
- output: 0.19999999999999998,
10133
+ input: 0.2,
10134
+ output: 0.2,
10142
10135
  cacheRead: 0.02,
10143
10136
  cacheWrite: 0,
10144
10137
  },
@@ -10154,8 +10147,8 @@ export const MODELS = {
10154
10147
  reasoning: false,
10155
10148
  input: ["text", "image"],
10156
10149
  cost: {
10157
- input: 0.09999999999999999,
10158
- output: 0.09999999999999999,
10150
+ input: 0.1,
10151
+ output: 0.1,
10159
10152
  cacheRead: 0.01,
10160
10153
  cacheWrite: 0,
10161
10154
  },
@@ -10190,7 +10183,7 @@ export const MODELS = {
10190
10183
  cost: {
10191
10184
  input: 2,
10192
10185
  output: 6,
10193
- cacheRead: 0.19999999999999998,
10186
+ cacheRead: 0.2,
10194
10187
  cacheWrite: 0,
10195
10188
  },
10196
10189
  contextWindow: 128000,
@@ -10207,7 +10200,7 @@ export const MODELS = {
10207
10200
  cost: {
10208
10201
  input: 2,
10209
10202
  output: 6,
10210
- cacheRead: 0.19999999999999998,
10203
+ cacheRead: 0.2,
10211
10204
  cacheWrite: 0,
10212
10205
  },
10213
10206
  contextWindow: 131072,
@@ -10224,7 +10217,7 @@ export const MODELS = {
10224
10217
  cost: {
10225
10218
  input: 0.5,
10226
10219
  output: 1.5,
10227
- cacheRead: 0.049999999999999996,
10220
+ cacheRead: 0.05,
10228
10221
  cacheWrite: 0,
10229
10222
  },
10230
10223
  contextWindow: 262144,
@@ -10239,7 +10232,7 @@ export const MODELS = {
10239
10232
  reasoning: false,
10240
10233
  input: ["text", "image"],
10241
10234
  cost: {
10242
- input: 0.39999999999999997,
10235
+ input: 0.4,
10243
10236
  output: 2,
10244
10237
  cacheRead: 0.04,
10245
10238
  cacheWrite: 0,
@@ -10273,7 +10266,7 @@ export const MODELS = {
10273
10266
  reasoning: false,
10274
10267
  input: ["text", "image"],
10275
10268
  cost: {
10276
- input: 0.39999999999999997,
10269
+ input: 0.4,
10277
10270
  output: 2,
10278
10271
  cacheRead: 0.04,
10279
10272
  cacheWrite: 0,
@@ -10307,7 +10300,7 @@ export const MODELS = {
10307
10300
  reasoning: false,
10308
10301
  input: ["text"],
10309
10302
  cost: {
10310
- input: 0.19999999999999998,
10303
+ input: 0.2,
10311
10304
  output: 0.6,
10312
10305
  cacheRead: 0.02,
10313
10306
  cacheWrite: 0,
@@ -10342,7 +10335,7 @@ export const MODELS = {
10342
10335
  input: ["text", "image"],
10343
10336
  cost: {
10344
10337
  input: 0.075,
10345
- output: 0.19999999999999998,
10338
+ output: 0.2,
10346
10339
  cacheRead: 0,
10347
10340
  cacheWrite: 0,
10348
10341
  },
@@ -10360,7 +10353,7 @@ export const MODELS = {
10360
10353
  cost: {
10361
10354
  input: 2,
10362
10355
  output: 6,
10363
- cacheRead: 0.19999999999999998,
10356
+ cacheRead: 0.2,
10364
10357
  cacheWrite: 0,
10365
10358
  },
10366
10359
  contextWindow: 65536,
@@ -10375,7 +10368,7 @@ export const MODELS = {
10375
10368
  reasoning: false,
10376
10369
  input: ["text"],
10377
10370
  cost: {
10378
- input: 0.09999999999999999,
10371
+ input: 0.1,
10379
10372
  output: 0.3,
10380
10373
  cacheRead: 0.01,
10381
10374
  cacheWrite: 0,
@@ -10392,7 +10385,7 @@ export const MODELS = {
10392
10385
  reasoning: false,
10393
10386
  input: ["text"],
10394
10387
  cost: {
10395
- input: 0.5700000000000001,
10388
+ input: 0.57,
10396
10389
  output: 2.3,
10397
10390
  cacheRead: 0,
10398
10391
  cacheWrite: 0,
@@ -10461,21 +10454,37 @@ export const MODELS = {
10461
10454
  reasoning: true,
10462
10455
  input: ["text", "image"],
10463
10456
  cost: {
10464
- input: 0.6799999999999999,
10457
+ input: 0.68,
10465
10458
  output: 3.41,
10466
- cacheRead: 0.33999999999999997,
10459
+ cacheRead: 0.34,
10467
10460
  cacheWrite: 0,
10468
10461
  },
10469
10462
  contextWindow: 262144,
10470
10463
  maxTokens: 262142,
10471
10464
  },
10472
- "moonshotai/kimi-k2.6:free": {
10473
- id: "moonshotai/kimi-k2.6:free",
10474
- name: "MoonshotAI: Kimi K2.6 (free)",
10465
+ "moonshotai/kimi-k2.7-code": {
10466
+ id: "moonshotai/kimi-k2.7-code",
10467
+ name: "MoonshotAI: Kimi K2.7 Code",
10468
+ api: "openai-completions",
10469
+ provider: "openrouter",
10470
+ baseUrl: "https://openrouter.ai/api/v1",
10471
+ reasoning: true,
10472
+ input: ["text", "image"],
10473
+ cost: {
10474
+ input: 0.95,
10475
+ output: 4,
10476
+ cacheRead: 0.19,
10477
+ cacheWrite: 0,
10478
+ },
10479
+ contextWindow: 262144,
10480
+ maxTokens: 4096,
10481
+ },
10482
+ "nex-agi/nex-n2-pro:free": {
10483
+ id: "nex-agi/nex-n2-pro:free",
10484
+ name: "Nex AGI: Nex-N2-Pro (free)",
10475
10485
  api: "openai-completions",
10476
10486
  provider: "openrouter",
10477
10487
  baseUrl: "https://openrouter.ai/api/v1",
10478
- compat: { "supportsDeveloperRole": false, "requiresReasoningContentOnAssistantMessages": true },
10479
10488
  reasoning: true,
10480
10489
  input: ["text", "image"],
10481
10490
  cost: {
@@ -10485,7 +10494,7 @@ export const MODELS = {
10485
10494
  cacheWrite: 0,
10486
10495
  },
10487
10496
  contextWindow: 262144,
10488
- maxTokens: 4096,
10497
+ maxTokens: 262144,
10489
10498
  },
10490
10499
  "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
10491
10500
  id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
@@ -10496,8 +10505,8 @@ export const MODELS = {
10496
10505
  reasoning: true,
10497
10506
  input: ["text"],
10498
10507
  cost: {
10499
- input: 0.39999999999999997,
10500
- output: 0.39999999999999997,
10508
+ input: 0.4,
10509
+ output: 0.4,
10501
10510
  cacheRead: 0,
10502
10511
  cacheWrite: 0,
10503
10512
  },
@@ -10513,8 +10522,8 @@ export const MODELS = {
10513
10522
  reasoning: true,
10514
10523
  input: ["text"],
10515
10524
  cost: {
10516
- input: 0.049999999999999996,
10517
- output: 0.19999999999999998,
10525
+ input: 0.05,
10526
+ output: 0.2,
10518
10527
  cacheRead: 0,
10519
10528
  cacheWrite: 0,
10520
10529
  },
@@ -10565,7 +10574,7 @@ export const MODELS = {
10565
10574
  input: ["text"],
10566
10575
  cost: {
10567
10576
  input: 0.09,
10568
- output: 0.44999999999999996,
10577
+ output: 0.45,
10569
10578
  cacheRead: 0,
10570
10579
  cacheWrite: 0,
10571
10580
  },
@@ -10640,23 +10649,6 @@ export const MODELS = {
10640
10649
  contextWindow: 128000,
10641
10650
  maxTokens: 128000,
10642
10651
  },
10643
- "nvidia/nemotron-nano-9b-v2": {
10644
- id: "nvidia/nemotron-nano-9b-v2",
10645
- name: "NVIDIA: Nemotron Nano 9B V2",
10646
- api: "openai-completions",
10647
- provider: "openrouter",
10648
- baseUrl: "https://openrouter.ai/api/v1",
10649
- reasoning: true,
10650
- input: ["text"],
10651
- cost: {
10652
- input: 0.04,
10653
- output: 0.16,
10654
- cacheRead: 0,
10655
- cacheWrite: 0,
10656
- },
10657
- contextWindow: 131072,
10658
- maxTokens: 16384,
10659
- },
10660
10652
  "nvidia/nemotron-nano-9b-v2:free": {
10661
10653
  id: "nvidia/nemotron-nano-9b-v2:free",
10662
10654
  name: "NVIDIA: Nemotron Nano 9B V2 (free)",
@@ -10802,9 +10794,9 @@ export const MODELS = {
10802
10794
  reasoning: false,
10803
10795
  input: ["text", "image"],
10804
10796
  cost: {
10805
- input: 0.39999999999999997,
10806
- output: 1.5999999999999999,
10807
- cacheRead: 0.09999999999999999,
10797
+ input: 0.4,
10798
+ output: 1.6,
10799
+ cacheRead: 0.1,
10808
10800
  cacheWrite: 0,
10809
10801
  },
10810
10802
  contextWindow: 1047576,
@@ -10819,9 +10811,9 @@ export const MODELS = {
10819
10811
  reasoning: false,
10820
10812
  input: ["text", "image"],
10821
10813
  cost: {
10822
- input: 0.09999999999999999,
10823
- output: 0.39999999999999997,
10824
- cacheRead: 0.024999999999999998,
10814
+ input: 0.1,
10815
+ output: 0.4,
10816
+ cacheRead: 0.025,
10825
10817
  cacheWrite: 0,
10826
10818
  },
10827
10819
  contextWindow: 1047576,
@@ -10974,7 +10966,7 @@ export const MODELS = {
10974
10966
  cost: {
10975
10967
  input: 0.25,
10976
10968
  output: 2,
10977
- cacheRead: 0.024999999999999998,
10969
+ cacheRead: 0.025,
10978
10970
  cacheWrite: 0,
10979
10971
  },
10980
10972
  contextWindow: 400000,
@@ -10989,8 +10981,8 @@ export const MODELS = {
10989
10981
  reasoning: true,
10990
10982
  input: ["text", "image"],
10991
10983
  cost: {
10992
- input: 0.049999999999999996,
10993
- output: 0.39999999999999997,
10984
+ input: 0.05,
10985
+ output: 0.4,
10994
10986
  cacheRead: 0.01,
10995
10987
  cacheWrite: 0,
10996
10988
  },
@@ -11093,7 +11085,7 @@ export const MODELS = {
11093
11085
  cost: {
11094
11086
  input: 0.25,
11095
11087
  output: 2,
11096
- cacheRead: 0.024999999999999998,
11088
+ cacheRead: 0.025,
11097
11089
  cacheWrite: 0,
11098
11090
  },
11099
11091
  contextWindow: 400000,
@@ -11253,7 +11245,7 @@ export const MODELS = {
11253
11245
  thinkingLevelMap: { "xhigh": "xhigh" },
11254
11246
  input: ["text", "image"],
11255
11247
  cost: {
11256
- input: 0.19999999999999998,
11248
+ input: 0.2,
11257
11249
  output: 1.25,
11258
11250
  cacheRead: 0.02,
11259
11251
  cacheWrite: 0,
@@ -11698,7 +11690,7 @@ export const MODELS = {
11698
11690
  reasoning: true,
11699
11691
  input: ["text"],
11700
11692
  cost: {
11701
- input: 0.19999999999999998,
11693
+ input: 0.2,
11702
11694
  output: 1.1,
11703
11695
  cacheRead: 0,
11704
11696
  cacheWrite: 0,
@@ -11716,7 +11708,7 @@ export const MODELS = {
11716
11708
  input: ["text"],
11717
11709
  cost: {
11718
11710
  input: 0.36,
11719
- output: 0.39999999999999997,
11711
+ output: 0.4,
11720
11712
  cacheRead: 0,
11721
11713
  cacheWrite: 0,
11722
11714
  },
@@ -11734,7 +11726,7 @@ export const MODELS = {
11734
11726
  cost: {
11735
11727
  input: 0.26,
11736
11728
  output: 0.78,
11737
- cacheRead: 0.052000000000000005,
11729
+ cacheRead: 0.052,
11738
11730
  cacheWrite: 0.325,
11739
11731
  },
11740
11732
  contextWindow: 1000000,
@@ -11783,7 +11775,7 @@ export const MODELS = {
11783
11775
  reasoning: true,
11784
11776
  input: ["text"],
11785
11777
  cost: {
11786
- input: 0.09999999999999999,
11778
+ input: 0.1,
11787
11779
  output: 0.24,
11788
11780
  cacheRead: 0,
11789
11781
  cacheWrite: 0,
@@ -11800,8 +11792,8 @@ export const MODELS = {
11800
11792
  reasoning: true,
11801
11793
  input: ["text"],
11802
11794
  cost: {
11803
- input: 0.45499999999999996,
11804
- output: 1.8199999999999998,
11795
+ input: 0.455,
11796
+ output: 1.82,
11805
11797
  cacheRead: 0,
11806
11798
  cacheWrite: 0,
11807
11799
  },
@@ -11818,7 +11810,7 @@ export const MODELS = {
11818
11810
  input: ["text"],
11819
11811
  cost: {
11820
11812
  input: 0.09,
11821
- output: 0.09999999999999999,
11813
+ output: 0.1,
11822
11814
  cacheRead: 0,
11823
11815
  cacheWrite: 0,
11824
11816
  },
@@ -11834,9 +11826,9 @@ export const MODELS = {
11834
11826
  reasoning: true,
11835
11827
  input: ["text"],
11836
11828
  cost: {
11837
- input: 0.09999999999999999,
11838
- output: 0.09999999999999999,
11839
- cacheRead: 0.09999999999999999,
11829
+ input: 0.1,
11830
+ output: 0.1,
11831
+ cacheRead: 0.1,
11840
11832
  cacheWrite: 0,
11841
11833
  },
11842
11834
  contextWindow: 262144,
@@ -11886,7 +11878,7 @@ export const MODELS = {
11886
11878
  input: ["text"],
11887
11879
  cost: {
11888
11880
  input: 0.08,
11889
- output: 0.39999999999999997,
11881
+ output: 0.4,
11890
11882
  cacheRead: 0.08,
11891
11883
  cacheWrite: 0,
11892
11884
  },
@@ -11919,9 +11911,9 @@ export const MODELS = {
11919
11911
  reasoning: true,
11920
11912
  input: ["text"],
11921
11913
  cost: {
11922
- input: 0.049999999999999996,
11923
- output: 0.39999999999999997,
11924
- cacheRead: 0.049999999999999996,
11914
+ input: 0.05,
11915
+ output: 0.4,
11916
+ cacheRead: 0.05,
11925
11917
  cacheWrite: 0,
11926
11918
  },
11927
11919
  contextWindow: 131072,
@@ -11937,7 +11929,7 @@ export const MODELS = {
11937
11929
  input: ["text"],
11938
11930
  cost: {
11939
11931
  input: 0.22,
11940
- output: 1.7999999999999998,
11932
+ output: 1.8,
11941
11933
  cacheRead: 0,
11942
11934
  cacheWrite: 0,
11943
11935
  },
@@ -11988,7 +11980,7 @@ export const MODELS = {
11988
11980
  input: ["text"],
11989
11981
  cost: {
11990
11982
  input: 0.11,
11991
- output: 0.7999999999999999,
11983
+ output: 0.8,
11992
11984
  cacheRead: 0.07,
11993
11985
  cacheWrite: 0,
11994
11986
  },
@@ -12123,7 +12115,7 @@ export const MODELS = {
12123
12115
  reasoning: false,
12124
12116
  input: ["text", "image"],
12125
12117
  cost: {
12126
- input: 0.19999999999999998,
12118
+ input: 0.2,
12127
12119
  output: 0.88,
12128
12120
  cacheRead: 0.11,
12129
12121
  cacheWrite: 0,
@@ -12191,8 +12183,8 @@ export const MODELS = {
12191
12183
  reasoning: false,
12192
12184
  input: ["text", "image"],
12193
12185
  cost: {
12194
- input: 0.10400000000000001,
12195
- output: 0.41600000000000004,
12186
+ input: 0.104,
12187
+ output: 0.416,
12196
12188
  cacheRead: 0,
12197
12189
  cacheWrite: 0,
12198
12190
  },
@@ -12278,7 +12270,7 @@ export const MODELS = {
12278
12270
  cost: {
12279
12271
  input: 0.14,
12280
12272
  output: 1,
12281
- cacheRead: 0.049999999999999996,
12273
+ cacheRead: 0.05,
12282
12274
  cacheWrite: 0,
12283
12275
  },
12284
12276
  contextWindow: 262144,
@@ -12310,7 +12302,7 @@ export const MODELS = {
12310
12302
  reasoning: true,
12311
12303
  input: ["text", "image"],
12312
12304
  cost: {
12313
- input: 0.09999999999999999,
12305
+ input: 0.1,
12314
12306
  output: 0.15,
12315
12307
  cacheRead: 0,
12316
12308
  cacheWrite: 0,
@@ -12362,7 +12354,7 @@ export const MODELS = {
12362
12354
  input: ["text", "image"],
12363
12355
  cost: {
12364
12356
  input: 0.3,
12365
- output: 1.7999999999999998,
12357
+ output: 1.8,
12366
12358
  cacheRead: 0,
12367
12359
  cacheWrite: 0.375,
12368
12360
  },
@@ -12378,13 +12370,13 @@ export const MODELS = {
12378
12370
  reasoning: true,
12379
12371
  input: ["text", "image"],
12380
12372
  cost: {
12381
- input: 0.28900000000000003,
12382
- output: 2.4,
12373
+ input: 0.2885,
12374
+ output: 3.17,
12383
12375
  cacheRead: 0,
12384
12376
  cacheWrite: 0,
12385
12377
  },
12386
12378
  contextWindow: 262144,
12387
- maxTokens: 131072,
12379
+ maxTokens: 262140,
12388
12380
  },
12389
12381
  "qwen/qwen3.6-35b-a3b": {
12390
12382
  id: "qwen/qwen3.6-35b-a3b",
@@ -12395,13 +12387,13 @@ export const MODELS = {
12395
12387
  reasoning: true,
12396
12388
  input: ["text", "image"],
12397
12389
  cost: {
12398
- input: 0.14,
12390
+ input: 0.15,
12399
12391
  output: 1,
12400
- cacheRead: 0,
12392
+ cacheRead: 0.05,
12401
12393
  cacheWrite: 0,
12402
12394
  },
12403
12395
  contextWindow: 262144,
12404
- maxTokens: 262140,
12396
+ maxTokens: 262144,
12405
12397
  },
12406
12398
  "qwen/qwen3.6-flash": {
12407
12399
  id: "qwen/qwen3.6-flash",
@@ -12480,10 +12472,10 @@ export const MODELS = {
12480
12472
  reasoning: true,
12481
12473
  input: ["text", "image"],
12482
12474
  cost: {
12483
- input: 0.39999999999999997,
12484
- output: 1.5999999999999999,
12485
- cacheRead: 0.08,
12486
- cacheWrite: 0.5,
12475
+ input: 0.32,
12476
+ output: 1.28,
12477
+ cacheRead: 0.064,
12478
+ cacheWrite: 0.4,
12487
12479
  },
12488
12480
  contextWindow: 1000000,
12489
12481
  maxTokens: 65536,
@@ -12497,8 +12489,8 @@ export const MODELS = {
12497
12489
  reasoning: false,
12498
12490
  input: ["text", "image"],
12499
12491
  cost: {
12500
- input: 0.09999999999999999,
12501
- output: 0.09999999999999999,
12492
+ input: 0.1,
12493
+ output: 0.1,
12502
12494
  cacheRead: 0,
12503
12495
  cacheWrite: 0,
12504
12496
  },
@@ -12565,7 +12557,7 @@ export const MODELS = {
12565
12557
  reasoning: true,
12566
12558
  input: ["text", "image"],
12567
12559
  cost: {
12568
- input: 0.19999999999999998,
12560
+ input: 0.2,
12569
12561
  output: 1.15,
12570
12562
  cacheRead: 0.04,
12571
12563
  cacheWrite: 0,
@@ -12584,7 +12576,7 @@ export const MODELS = {
12584
12576
  cost: {
12585
12577
  input: 0.063,
12586
12578
  output: 0.21,
12587
- cacheRead: 0.020999999999999998,
12579
+ cacheRead: 0.021,
12588
12580
  cacheWrite: 0,
12589
12581
  },
12590
12582
  contextWindow: 262144,
@@ -12599,7 +12591,7 @@ export const MODELS = {
12599
12591
  reasoning: false,
12600
12592
  input: ["text"],
12601
12593
  cost: {
12602
- input: 0.16999999999999998,
12594
+ input: 0.17,
12603
12595
  output: 0.43,
12604
12596
  cacheRead: 0,
12605
12597
  cacheWrite: 0,
@@ -12616,8 +12608,8 @@ export const MODELS = {
12616
12608
  reasoning: false,
12617
12609
  input: ["text"],
12618
12610
  cost: {
12619
- input: 0.39999999999999997,
12620
- output: 0.39999999999999997,
12611
+ input: 0.4,
12612
+ output: 0.4,
12621
12613
  cacheRead: 0,
12622
12614
  cacheWrite: 0,
12623
12615
  },
@@ -12652,7 +12644,7 @@ export const MODELS = {
12652
12644
  cost: {
12653
12645
  input: 1.25,
12654
12646
  output: 2.5,
12655
- cacheRead: 0.19999999999999998,
12647
+ cacheRead: 0.2,
12656
12648
  cacheWrite: 0,
12657
12649
  },
12658
12650
  contextWindow: 2000000,
@@ -12669,7 +12661,7 @@ export const MODELS = {
12669
12661
  cost: {
12670
12662
  input: 1.25,
12671
12663
  output: 2.5,
12672
- cacheRead: 0.19999999999999998,
12664
+ cacheRead: 0.2,
12673
12665
  cacheWrite: 0,
12674
12666
  },
12675
12667
  contextWindow: 1000000,
@@ -12686,7 +12678,7 @@ export const MODELS = {
12686
12678
  cost: {
12687
12679
  input: 1,
12688
12680
  output: 2,
12689
- cacheRead: 0.19999999999999998,
12681
+ cacheRead: 0.2,
12690
12682
  cacheWrite: 0,
12691
12683
  },
12692
12684
  contextWindow: 256000,
@@ -12701,7 +12693,7 @@ export const MODELS = {
12701
12693
  reasoning: true,
12702
12694
  input: ["text"],
12703
12695
  cost: {
12704
- input: 0.09999999999999999,
12696
+ input: 0.1,
12705
12697
  output: 0.3,
12706
12698
  cacheRead: 0.01,
12707
12699
  cacheWrite: 0,
@@ -12743,23 +12735,6 @@ export const MODELS = {
12743
12735
  contextWindow: 1048576,
12744
12736
  maxTokens: 131072,
12745
12737
  },
12746
- "z-ai/glm-4-32b": {
12747
- id: "z-ai/glm-4-32b",
12748
- name: "Z.ai: GLM 4 32B ",
12749
- api: "openai-completions",
12750
- provider: "openrouter",
12751
- baseUrl: "https://openrouter.ai/api/v1",
12752
- reasoning: false,
12753
- input: ["text"],
12754
- cost: {
12755
- input: 0.09999999999999999,
12756
- output: 0.09999999999999999,
12757
- cacheRead: 0,
12758
- cacheWrite: 0,
12759
- },
12760
- contextWindow: 128000,
12761
- maxTokens: 4096,
12762
- },
12763
12738
  "z-ai/glm-4.5": {
12764
12739
  id: "z-ai/glm-4.5",
12765
12740
  name: "Z.ai: GLM 4.5",
@@ -12794,23 +12769,6 @@ export const MODELS = {
12794
12769
  contextWindow: 131072,
12795
12770
  maxTokens: 131070,
12796
12771
  },
12797
- "z-ai/glm-4.5-air:free": {
12798
- id: "z-ai/glm-4.5-air:free",
12799
- name: "Z.ai: GLM 4.5 Air (free)",
12800
- api: "openai-completions",
12801
- provider: "openrouter",
12802
- baseUrl: "https://openrouter.ai/api/v1",
12803
- reasoning: true,
12804
- input: ["text"],
12805
- cost: {
12806
- input: 0,
12807
- output: 0,
12808
- cacheRead: 0,
12809
- cacheWrite: 0,
12810
- },
12811
- contextWindow: 131072,
12812
- maxTokens: 96000,
12813
- },
12814
12772
  "z-ai/glm-4.5v": {
12815
12773
  id: "z-ai/glm-4.5v",
12816
12774
  name: "Z.ai: GLM 4.5V",
@@ -12821,7 +12779,7 @@ export const MODELS = {
12821
12779
  input: ["text", "image"],
12822
12780
  cost: {
12823
12781
  input: 0.6,
12824
- output: 1.7999999999999998,
12782
+ output: 1.8,
12825
12783
  cacheRead: 0.11,
12826
12784
  cacheWrite: 0,
12827
12785
  },
@@ -12855,12 +12813,12 @@ export const MODELS = {
12855
12813
  input: ["text", "image"],
12856
12814
  cost: {
12857
12815
  input: 0.3,
12858
- output: 0.8999999999999999,
12859
- cacheRead: 0.049999999999999996,
12816
+ output: 0.9,
12817
+ cacheRead: 0.055,
12860
12818
  cacheWrite: 0,
12861
12819
  },
12862
12820
  contextWindow: 131072,
12863
- maxTokens: 24000,
12821
+ maxTokens: 32768,
12864
12822
  },
12865
12823
  "z-ai/glm-4.7": {
12866
12824
  id: "z-ai/glm-4.7",
@@ -12871,7 +12829,7 @@ export const MODELS = {
12871
12829
  reasoning: true,
12872
12830
  input: ["text"],
12873
12831
  cost: {
12874
- input: 0.39999999999999997,
12832
+ input: 0.4,
12875
12833
  output: 1.75,
12876
12834
  cacheRead: 0.08,
12877
12835
  cacheWrite: 0,
@@ -12889,7 +12847,7 @@ export const MODELS = {
12889
12847
  input: ["text"],
12890
12848
  cost: {
12891
12849
  input: 0.06,
12892
- output: 0.39999999999999997,
12850
+ output: 0.4,
12893
12851
  cacheRead: 0.01,
12894
12852
  cacheWrite: 0,
12895
12853
  },
@@ -12927,7 +12885,7 @@ export const MODELS = {
12927
12885
  cacheRead: 0.24,
12928
12886
  cacheWrite: 0,
12929
12887
  },
12930
- contextWindow: 202752,
12888
+ contextWindow: 262144,
12931
12889
  maxTokens: 131072,
12932
12890
  },
12933
12891
  "z-ai/glm-5.1": {
@@ -12947,22 +12905,22 @@ export const MODELS = {
12947
12905
  contextWindow: 202752,
12948
12906
  maxTokens: 4096,
12949
12907
  },
12950
- "z-ai/glm-5v-turbo": {
12951
- id: "z-ai/glm-5v-turbo",
12952
- name: "Z.ai: GLM 5V Turbo",
12908
+ "~anthropic/claude-fable-latest": {
12909
+ id: "~anthropic/claude-fable-latest",
12910
+ name: "Anthropic: Claude Fable Latest",
12953
12911
  api: "openai-completions",
12954
12912
  provider: "openrouter",
12955
12913
  baseUrl: "https://openrouter.ai/api/v1",
12956
12914
  reasoning: true,
12957
12915
  input: ["text", "image"],
12958
12916
  cost: {
12959
- input: 1.2,
12960
- output: 4,
12961
- cacheRead: 0.24,
12962
- cacheWrite: 0,
12917
+ input: 10,
12918
+ output: 50,
12919
+ cacheRead: 1,
12920
+ cacheWrite: 12.5,
12963
12921
  },
12964
- contextWindow: 202752,
12965
- maxTokens: 131072,
12922
+ contextWindow: 1000000,
12923
+ maxTokens: 128000,
12966
12924
  },
12967
12925
  "~anthropic/claude-haiku-latest": {
12968
12926
  id: "~anthropic/claude-haiku-latest",
@@ -12975,7 +12933,7 @@ export const MODELS = {
12975
12933
  cost: {
12976
12934
  input: 1,
12977
12935
  output: 5,
12978
- cacheRead: 0.09999999999999999,
12936
+ cacheRead: 0.1,
12979
12937
  cacheWrite: 1.25,
12980
12938
  },
12981
12939
  contextWindow: 200000,
@@ -13027,7 +12985,7 @@ export const MODELS = {
13027
12985
  input: 1.5,
13028
12986
  output: 9,
13029
12987
  cacheRead: 0.15,
13030
- cacheWrite: 0.08333333333333334,
12988
+ cacheWrite: 0.083333,
13031
12989
  },
13032
12990
  contextWindow: 1048576,
13033
12991
  maxTokens: 65536,
@@ -13043,7 +13001,7 @@ export const MODELS = {
13043
13001
  cost: {
13044
13002
  input: 2,
13045
13003
  output: 12,
13046
- cacheRead: 0.19999999999999998,
13004
+ cacheRead: 0.2,
13047
13005
  cacheWrite: 0.375,
13048
13006
  },
13049
13007
  contextWindow: 1048576,
@@ -13058,9 +13016,9 @@ export const MODELS = {
13058
13016
  reasoning: true,
13059
13017
  input: ["text", "image"],
13060
13018
  cost: {
13061
- input: 0.6799999999999999,
13019
+ input: 0.68,
13062
13020
  output: 3.41,
13063
- cacheRead: 0.33999999999999997,
13021
+ cacheRead: 0.34,
13064
13022
  cacheWrite: 0,
13065
13023
  },
13066
13024
  contextWindow: 262144,
@@ -13102,25 +13060,6 @@ export const MODELS = {
13102
13060
  },
13103
13061
  },
13104
13062
  "together": {
13105
- "MiniMaxAI/MiniMax-M2.5": {
13106
- id: "MiniMaxAI/MiniMax-M2.5",
13107
- name: "MiniMax-M2.5",
13108
- api: "openai-completions",
13109
- provider: "together",
13110
- baseUrl: "https://api.together.ai/v1",
13111
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
13112
- reasoning: true,
13113
- thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
13114
- input: ["text"],
13115
- cost: {
13116
- input: 0.3,
13117
- output: 1.2,
13118
- cacheRead: 0.06,
13119
- cacheWrite: 0,
13120
- },
13121
- contextWindow: 204800,
13122
- maxTokens: 131072,
13123
- },
13124
13063
  "MiniMaxAI/MiniMax-M2.7": {
13125
13064
  id: "MiniMaxAI/MiniMax-M2.7",
13126
13065
  name: "MiniMax-M2.7",
@@ -13140,28 +13079,27 @@ export const MODELS = {
13140
13079
  contextWindow: 202752,
13141
13080
  maxTokens: 131072,
13142
13081
  },
13143
- "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
13144
- id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
13145
- name: "Qwen3 235B A22B Instruct 2507 FP8",
13082
+ "Qwen/Qwen2.5-7B-Instruct-Turbo": {
13083
+ id: "Qwen/Qwen2.5-7B-Instruct-Turbo",
13084
+ name: "Qwen 2.5 7B Instruct Turbo",
13146
13085
  api: "openai-completions",
13147
13086
  provider: "together",
13148
13087
  baseUrl: "https://api.together.ai/v1",
13149
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13150
- reasoning: true,
13151
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13088
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
13089
+ reasoning: false,
13152
13090
  input: ["text"],
13153
13091
  cost: {
13154
- input: 0.2,
13155
- output: 0.6,
13092
+ input: 0.3,
13093
+ output: 0.3,
13156
13094
  cacheRead: 0,
13157
13095
  cacheWrite: 0,
13158
13096
  },
13159
- contextWindow: 262144,
13160
- maxTokens: 262144,
13097
+ contextWindow: 32768,
13098
+ maxTokens: 32768,
13161
13099
  },
13162
- "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8": {
13163
- id: "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
13164
- name: "Qwen3 Coder 480B A35B Instruct",
13100
+ "Qwen/Qwen3-235B-A22B-Instruct-2507-tput": {
13101
+ id: "Qwen/Qwen3-235B-A22B-Instruct-2507-tput",
13102
+ name: "Qwen3 235B A22B Instruct 2507 FP8",
13165
13103
  api: "openai-completions",
13166
13104
  provider: "together",
13167
13105
  baseUrl: "https://api.together.ai/v1",
@@ -13169,36 +13107,36 @@ export const MODELS = {
13169
13107
  reasoning: false,
13170
13108
  input: ["text"],
13171
13109
  cost: {
13172
- input: 2,
13173
- output: 2,
13110
+ input: 0.2,
13111
+ output: 0.6,
13174
13112
  cacheRead: 0,
13175
13113
  cacheWrite: 0,
13176
13114
  },
13177
13115
  contextWindow: 262144,
13178
13116
  maxTokens: 262144,
13179
13117
  },
13180
- "Qwen/Qwen3-Coder-Next-FP8": {
13181
- id: "Qwen/Qwen3-Coder-Next-FP8",
13182
- name: "Qwen3 Coder Next FP8",
13118
+ "Qwen/Qwen3.5-397B-A17B": {
13119
+ id: "Qwen/Qwen3.5-397B-A17B",
13120
+ name: "Qwen3.5 397B A17B",
13183
13121
  api: "openai-completions",
13184
13122
  provider: "together",
13185
13123
  baseUrl: "https://api.together.ai/v1",
13186
13124
  compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13187
13125
  reasoning: true,
13188
13126
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13189
- input: ["text"],
13127
+ input: ["text", "image"],
13190
13128
  cost: {
13191
- input: 0.5,
13192
- output: 1.2,
13129
+ input: 0.6,
13130
+ output: 3.6,
13193
13131
  cacheRead: 0,
13194
13132
  cacheWrite: 0,
13195
13133
  },
13196
13134
  contextWindow: 262144,
13197
- maxTokens: 262144,
13135
+ maxTokens: 130000,
13198
13136
  },
13199
- "Qwen/Qwen3.5-397B-A17B": {
13200
- id: "Qwen/Qwen3.5-397B-A17B",
13201
- name: "Qwen3.5 397B A17B",
13137
+ "Qwen/Qwen3.5-9B": {
13138
+ id: "Qwen/Qwen3.5-9B",
13139
+ name: "Qwen3.5 9B",
13202
13140
  api: "openai-completions",
13203
13141
  provider: "together",
13204
13142
  baseUrl: "https://api.together.ai/v1",
@@ -13207,13 +13145,13 @@ export const MODELS = {
13207
13145
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13208
13146
  input: ["text", "image"],
13209
13147
  cost: {
13210
- input: 0.6,
13211
- output: 3.6,
13148
+ input: 0.17,
13149
+ output: 0.25,
13212
13150
  cacheRead: 0,
13213
13151
  cacheWrite: 0,
13214
13152
  },
13215
13153
  contextWindow: 262144,
13216
- maxTokens: 130000,
13154
+ maxTokens: 65536,
13217
13155
  },
13218
13156
  "Qwen/Qwen3.6-Plus": {
13219
13157
  id: "Qwen/Qwen3.6-Plus",
@@ -13240,56 +13178,17 @@ export const MODELS = {
13240
13178
  api: "openai-completions",
13241
13179
  provider: "together",
13242
13180
  baseUrl: "https://api.together.ai/v1",
13243
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13244
- reasoning: true,
13245
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13246
- input: ["text"],
13247
- cost: {
13248
- input: 2.5,
13249
- output: 7.5,
13250
- cacheRead: 0,
13251
- cacheWrite: 0,
13252
- },
13253
- contextWindow: 1000000,
13254
- maxTokens: 500000,
13255
- },
13256
- "deepseek-ai/DeepSeek-V3": {
13257
- id: "deepseek-ai/DeepSeek-V3",
13258
- name: "DeepSeek-V3",
13259
- api: "openai-completions",
13260
- provider: "together",
13261
- baseUrl: "https://api.together.ai/v1",
13262
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13263
- reasoning: true,
13264
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13265
- input: ["text"],
13266
- cost: {
13267
- input: 1.25,
13268
- output: 1.25,
13269
- cacheRead: 0,
13270
- cacheWrite: 0,
13271
- },
13272
- contextWindow: 131072,
13273
- maxTokens: 131072,
13274
- },
13275
- "deepseek-ai/DeepSeek-V3-1": {
13276
- id: "deepseek-ai/DeepSeek-V3-1",
13277
- name: "DeepSeek V3.1",
13278
- api: "openai-completions",
13279
- provider: "together",
13280
- baseUrl: "https://api.together.ai/v1",
13281
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13282
- reasoning: true,
13283
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13181
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
13182
+ reasoning: false,
13284
13183
  input: ["text"],
13285
13184
  cost: {
13286
- input: 0.6,
13287
- output: 1.7,
13185
+ input: 2.5,
13186
+ output: 7.5,
13288
13187
  cacheRead: 0,
13289
13188
  cacheWrite: 0,
13290
13189
  },
13291
- contextWindow: 131072,
13292
- maxTokens: 131072,
13190
+ contextWindow: 1000000,
13191
+ maxTokens: 500000,
13293
13192
  },
13294
13193
  "deepseek-ai/DeepSeek-V4-Pro": {
13295
13194
  id: "deepseek-ai/DeepSeek-V4-Pro",
@@ -13302,8 +13201,8 @@ export const MODELS = {
13302
13201
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": null },
13303
13202
  input: ["text"],
13304
13203
  cost: {
13305
- input: 2.1,
13306
- output: 4.4,
13204
+ input: 1.74,
13205
+ output: 3.48,
13307
13206
  cacheRead: 0.2,
13308
13207
  cacheWrite: 0,
13309
13208
  },
@@ -13339,8 +13238,8 @@ export const MODELS = {
13339
13238
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13340
13239
  input: ["text", "image"],
13341
13240
  cost: {
13342
- input: 0.2,
13343
- output: 0.5,
13241
+ input: 0.39,
13242
+ output: 0.97,
13344
13243
  cacheRead: 0,
13345
13244
  cacheWrite: 0,
13346
13245
  },
@@ -13365,25 +13264,6 @@ export const MODELS = {
13365
13264
  contextWindow: 131072,
13366
13265
  maxTokens: 131072,
13367
13266
  },
13368
- "moonshotai/Kimi-K2.5": {
13369
- id: "moonshotai/Kimi-K2.5",
13370
- name: "Kimi K2.5",
13371
- api: "openai-completions",
13372
- provider: "together",
13373
- baseUrl: "https://api.together.ai/v1",
13374
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13375
- reasoning: true,
13376
- thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13377
- input: ["text", "image"],
13378
- cost: {
13379
- input: 0.5,
13380
- output: 2.8,
13381
- cacheRead: 0,
13382
- cacheWrite: 0,
13383
- },
13384
- contextWindow: 262144,
13385
- maxTokens: 262144,
13386
- },
13387
13267
  "moonshotai/Kimi-K2.6": {
13388
13268
  id: "moonshotai/Kimi-K2.6",
13389
13269
  name: "Kimi K2.6",
@@ -13441,6 +13321,44 @@ export const MODELS = {
13441
13321
  contextWindow: 131072,
13442
13322
  maxTokens: 131072,
13443
13323
  },
13324
+ "openai/gpt-oss-20b": {
13325
+ id: "openai/gpt-oss-20b",
13326
+ name: "GPT OSS 20B",
13327
+ api: "openai-completions",
13328
+ provider: "together",
13329
+ baseUrl: "https://api.together.ai/v1",
13330
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": true, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "openai" },
13331
+ reasoning: true,
13332
+ thinkingLevelMap: { "off": null, "minimal": null },
13333
+ input: ["text"],
13334
+ cost: {
13335
+ input: 0.05,
13336
+ output: 0.2,
13337
+ cacheRead: 0,
13338
+ cacheWrite: 0,
13339
+ },
13340
+ contextWindow: 131072,
13341
+ maxTokens: 131072,
13342
+ },
13343
+ "zai-org/GLM-5": {
13344
+ id: "zai-org/GLM-5",
13345
+ name: "GLM-5",
13346
+ api: "openai-completions",
13347
+ provider: "together",
13348
+ baseUrl: "https://api.together.ai/v1",
13349
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13350
+ reasoning: true,
13351
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13352
+ input: ["text"],
13353
+ cost: {
13354
+ input: 1,
13355
+ output: 3.2,
13356
+ cacheRead: 0,
13357
+ cacheWrite: 0,
13358
+ },
13359
+ contextWindow: 202752,
13360
+ maxTokens: 131072,
13361
+ },
13444
13362
  "zai-org/GLM-5.1": {
13445
13363
  id: "zai-org/GLM-5.1",
13446
13364
  name: "GLM-5.1",
@@ -13505,8 +13423,8 @@ export const MODELS = {
13505
13423
  reasoning: true,
13506
13424
  input: ["text"],
13507
13425
  cost: {
13508
- input: 0.08,
13509
- output: 0.29,
13426
+ input: 0.12,
13427
+ output: 0.5,
13510
13428
  cacheRead: 0,
13511
13429
  cacheWrite: 0,
13512
13430
  },
@@ -13556,7 +13474,7 @@ export const MODELS = {
13556
13474
  reasoning: true,
13557
13475
  input: ["text", "image"],
13558
13476
  cost: {
13559
- input: 0.39999999999999997,
13477
+ input: 0.4,
13560
13478
  output: 4,
13561
13479
  cacheRead: 0,
13562
13480
  cacheWrite: 0,
@@ -13626,7 +13544,7 @@ export const MODELS = {
13626
13544
  cost: {
13627
13545
  input: 1,
13628
13546
  output: 5,
13629
- cacheRead: 0.19999999999999998,
13547
+ cacheRead: 0.2,
13630
13548
  cacheWrite: 0,
13631
13549
  },
13632
13550
  contextWindow: 1000000,
@@ -13726,7 +13644,7 @@ export const MODELS = {
13726
13644
  reasoning: true,
13727
13645
  input: ["text", "image"],
13728
13646
  cost: {
13729
- input: 0.39999999999999997,
13647
+ input: 0.4,
13730
13648
  output: 4,
13731
13649
  cacheRead: 0,
13732
13650
  cacheWrite: 0,
@@ -13743,8 +13661,8 @@ export const MODELS = {
13743
13661
  reasoning: true,
13744
13662
  input: ["text", "image"],
13745
13663
  cost: {
13746
- input: 0.09999999999999999,
13747
- output: 0.39999999999999997,
13664
+ input: 0.1,
13665
+ output: 0.4,
13748
13666
  cacheRead: 0.001,
13749
13667
  cacheWrite: 0.125,
13750
13668
  },
@@ -13760,7 +13678,7 @@ export const MODELS = {
13760
13678
  reasoning: true,
13761
13679
  input: ["text", "image"],
13762
13680
  cost: {
13763
- input: 0.39999999999999997,
13681
+ input: 0.4,
13764
13682
  output: 2.4,
13765
13683
  cacheRead: 0.04,
13766
13684
  cacheWrite: 0.5,
@@ -13778,7 +13696,7 @@ export const MODELS = {
13778
13696
  input: ["text", "image"],
13779
13697
  cost: {
13780
13698
  input: 0.6,
13781
- output: 3.5999999999999996,
13699
+ output: 3.6,
13782
13700
  cacheRead: 0,
13783
13701
  cacheWrite: 0,
13784
13702
  },
@@ -13796,7 +13714,7 @@ export const MODELS = {
13796
13714
  cost: {
13797
13715
  input: 0.5,
13798
13716
  output: 3,
13799
- cacheRead: 0.09999999999999999,
13717
+ cacheRead: 0.1,
13800
13718
  cacheWrite: 0.625,
13801
13719
  },
13802
13720
  contextWindow: 1000000,
@@ -13828,8 +13746,8 @@ export const MODELS = {
13828
13746
  reasoning: true,
13829
13747
  input: ["text", "image"],
13830
13748
  cost: {
13831
- input: 0.39999999999999997,
13832
- output: 1.5999999999999999,
13749
+ input: 0.4,
13750
+ output: 1.6,
13833
13751
  cacheRead: 0.08,
13834
13752
  cacheWrite: 0.5,
13835
13753
  },
@@ -13862,7 +13780,7 @@ export const MODELS = {
13862
13780
  reasoning: false,
13863
13781
  input: ["text", "image"],
13864
13782
  cost: {
13865
- input: 0.7999999999999999,
13783
+ input: 0.8,
13866
13784
  output: 4,
13867
13785
  cacheRead: 0.08,
13868
13786
  cacheWrite: 1,
@@ -13870,6 +13788,25 @@ export const MODELS = {
13870
13788
  contextWindow: 200000,
13871
13789
  maxTokens: 8192,
13872
13790
  },
13791
+ "anthropic/claude-fable-5": {
13792
+ id: "anthropic/claude-fable-5",
13793
+ name: "Claude Fable 5",
13794
+ api: "anthropic-messages",
13795
+ provider: "vercel-ai-gateway",
13796
+ baseUrl: "https://ai-gateway.vercel.sh",
13797
+ compat: { "forceAdaptiveThinking": true },
13798
+ reasoning: true,
13799
+ thinkingLevelMap: { "off": null, "xhigh": "xhigh" },
13800
+ input: ["text", "image"],
13801
+ cost: {
13802
+ input: 10,
13803
+ output: 50,
13804
+ cacheRead: 1,
13805
+ cacheWrite: 12.5,
13806
+ },
13807
+ contextWindow: 1000000,
13808
+ maxTokens: 128000,
13809
+ },
13873
13810
  "anthropic/claude-haiku-4.5": {
13874
13811
  id: "anthropic/claude-haiku-4.5",
13875
13812
  name: "Claude Haiku 4.5",
@@ -13881,7 +13818,7 @@ export const MODELS = {
13881
13818
  cost: {
13882
13819
  input: 1,
13883
13820
  output: 5,
13884
- cacheRead: 0.09999999999999999,
13821
+ cacheRead: 0.1,
13885
13822
  cacheWrite: 1.25,
13886
13823
  },
13887
13824
  contextWindow: 200000,
@@ -14074,7 +14011,7 @@ export const MODELS = {
14074
14011
  input: ["text"],
14075
14012
  cost: {
14076
14013
  input: 0.25,
14077
- output: 0.8999999999999999,
14014
+ output: 0.9,
14078
14015
  cacheRead: 0,
14079
14016
  cacheWrite: 0,
14080
14017
  },
@@ -14092,7 +14029,7 @@ export const MODELS = {
14092
14029
  cost: {
14093
14030
  input: 0.25,
14094
14031
  output: 2,
14095
- cacheRead: 0.049999999999999996,
14032
+ cacheRead: 0.05,
14096
14033
  cacheWrite: 0,
14097
14034
  },
14098
14035
  contextWindow: 256000,
@@ -14277,8 +14214,8 @@ export const MODELS = {
14277
14214
  reasoning: true,
14278
14215
  input: ["text", "image"],
14279
14216
  cost: {
14280
- input: 0.09999999999999999,
14281
- output: 0.39999999999999997,
14217
+ input: 0.1,
14218
+ output: 0.4,
14282
14219
  cacheRead: 0.01,
14283
14220
  cacheWrite: 0,
14284
14221
  },
@@ -14313,7 +14250,7 @@ export const MODELS = {
14313
14250
  cost: {
14314
14251
  input: 0.5,
14315
14252
  output: 3,
14316
- cacheRead: 0.049999999999999996,
14253
+ cacheRead: 0.05,
14317
14254
  cacheWrite: 0,
14318
14255
  },
14319
14256
  contextWindow: 1000000,
@@ -14330,7 +14267,7 @@ export const MODELS = {
14330
14267
  cost: {
14331
14268
  input: 2,
14332
14269
  output: 12,
14333
- cacheRead: 0.19999999999999998,
14270
+ cacheRead: 0.2,
14334
14271
  cacheWrite: 0,
14335
14272
  },
14336
14273
  contextWindow: 1000000,
@@ -14381,7 +14318,7 @@ export const MODELS = {
14381
14318
  cost: {
14382
14319
  input: 2,
14383
14320
  output: 12,
14384
- cacheRead: 0.19999999999999998,
14321
+ cacheRead: 0.2,
14385
14322
  cacheWrite: 0,
14386
14323
  },
14387
14324
  contextWindow: 1000000,
@@ -14431,7 +14368,7 @@ export const MODELS = {
14431
14368
  input: ["text", "image"],
14432
14369
  cost: {
14433
14370
  input: 0.14,
14434
- output: 0.39999999999999997,
14371
+ output: 0.4,
14435
14372
  cacheRead: 0,
14436
14373
  cacheWrite: 0,
14437
14374
  },
@@ -14449,7 +14386,7 @@ export const MODELS = {
14449
14386
  cost: {
14450
14387
  input: 0.25,
14451
14388
  output: 0.75,
14452
- cacheRead: 0.024999999999999998,
14389
+ cacheRead: 0.025,
14453
14390
  cacheWrite: 0,
14454
14391
  },
14455
14392
  contextWindow: 128000,
@@ -14601,7 +14538,7 @@ export const MODELS = {
14601
14538
  input: ["text", "image"],
14602
14539
  cost: {
14603
14540
  input: 0.24,
14604
- output: 0.9700000000000001,
14541
+ output: 0.97,
14605
14542
  cacheRead: 0,
14606
14543
  cacheWrite: 0,
14607
14544
  },
@@ -14617,7 +14554,7 @@ export const MODELS = {
14617
14554
  reasoning: false,
14618
14555
  input: ["text", "image"],
14619
14556
  cost: {
14620
- input: 0.16999999999999998,
14557
+ input: 0.17,
14621
14558
  output: 0.66,
14622
14559
  cacheRead: 0,
14623
14560
  cacheWrite: 0,
@@ -14771,7 +14708,7 @@ export const MODELS = {
14771
14708
  input: ["text"],
14772
14709
  cost: {
14773
14710
  input: 0.3,
14774
- output: 0.8999999999999999,
14711
+ output: 0.9,
14775
14712
  cacheRead: 0,
14776
14713
  cacheWrite: 0,
14777
14714
  },
@@ -14787,7 +14724,7 @@ export const MODELS = {
14787
14724
  reasoning: false,
14788
14725
  input: ["text"],
14789
14726
  cost: {
14790
- input: 0.39999999999999997,
14727
+ input: 0.4,
14791
14728
  output: 2,
14792
14729
  cacheRead: 0,
14793
14730
  cacheWrite: 0,
@@ -14804,7 +14741,7 @@ export const MODELS = {
14804
14741
  reasoning: false,
14805
14742
  input: ["text"],
14806
14743
  cost: {
14807
- input: 0.09999999999999999,
14744
+ input: 0.1,
14808
14745
  output: 0.3,
14809
14746
  cacheRead: 0,
14810
14747
  cacheWrite: 0,
@@ -14821,7 +14758,7 @@ export const MODELS = {
14821
14758
  reasoning: false,
14822
14759
  input: ["text"],
14823
14760
  cost: {
14824
- input: 0.09999999999999999,
14761
+ input: 0.1,
14825
14762
  output: 0.3,
14826
14763
  cacheRead: 0,
14827
14764
  cacheWrite: 0,
@@ -14838,8 +14775,8 @@ export const MODELS = {
14838
14775
  reasoning: false,
14839
14776
  input: ["text"],
14840
14777
  cost: {
14841
- input: 0.09999999999999999,
14842
- output: 0.09999999999999999,
14778
+ input: 0.1,
14779
+ output: 0.1,
14843
14780
  cacheRead: 0,
14844
14781
  cacheWrite: 0,
14845
14782
  },
@@ -14872,7 +14809,7 @@ export const MODELS = {
14872
14809
  reasoning: false,
14873
14810
  input: ["text", "image"],
14874
14811
  cost: {
14875
- input: 0.39999999999999997,
14812
+ input: 0.4,
14876
14813
  output: 2,
14877
14814
  cacheRead: 0,
14878
14815
  cacheWrite: 0,
@@ -14923,7 +14860,7 @@ export const MODELS = {
14923
14860
  reasoning: false,
14924
14861
  input: ["text", "image"],
14925
14862
  cost: {
14926
- input: 0.09999999999999999,
14863
+ input: 0.1,
14927
14864
  output: 0.3,
14928
14865
  cacheRead: 0,
14929
14866
  cacheWrite: 0,
@@ -14974,7 +14911,7 @@ export const MODELS = {
14974
14911
  reasoning: false,
14975
14912
  input: ["text"],
14976
14913
  cost: {
14977
- input: 0.5700000000000001,
14914
+ input: 0.57,
14978
14915
  output: 2.3,
14979
14916
  cacheRead: 0,
14980
14917
  cacheWrite: 0,
@@ -14999,40 +14936,6 @@ export const MODELS = {
14999
14936
  contextWindow: 262114,
15000
14937
  maxTokens: 262114,
15001
14938
  },
15002
- "moonshotai/kimi-k2-thinking-turbo": {
15003
- id: "moonshotai/kimi-k2-thinking-turbo",
15004
- name: "Kimi K2 Thinking Turbo",
15005
- api: "anthropic-messages",
15006
- provider: "vercel-ai-gateway",
15007
- baseUrl: "https://ai-gateway.vercel.sh",
15008
- reasoning: true,
15009
- input: ["text"],
15010
- cost: {
15011
- input: 1.15,
15012
- output: 8,
15013
- cacheRead: 0.15,
15014
- cacheWrite: 0,
15015
- },
15016
- contextWindow: 262114,
15017
- maxTokens: 262114,
15018
- },
15019
- "moonshotai/kimi-k2-turbo": {
15020
- id: "moonshotai/kimi-k2-turbo",
15021
- name: "Kimi K2 Turbo",
15022
- api: "anthropic-messages",
15023
- provider: "vercel-ai-gateway",
15024
- baseUrl: "https://ai-gateway.vercel.sh",
15025
- reasoning: false,
15026
- input: ["text"],
15027
- cost: {
15028
- input: 1.15,
15029
- output: 8,
15030
- cacheRead: 0.15,
15031
- cacheWrite: 0,
15032
- },
15033
- contextWindow: 256000,
15034
- maxTokens: 16384,
15035
- },
15036
14939
  "moonshotai/kimi-k2.5": {
15037
14940
  id: "moonshotai/kimi-k2.5",
15038
14941
  name: "Kimi K2.5",
@@ -15044,7 +14947,7 @@ export const MODELS = {
15044
14947
  cost: {
15045
14948
  input: 0.6,
15046
14949
  output: 3,
15047
- cacheRead: 0.09999999999999999,
14950
+ cacheRead: 0.1,
15048
14951
  cacheWrite: 0,
15049
14952
  },
15050
14953
  contextWindow: 262114,
@@ -15067,6 +14970,23 @@ export const MODELS = {
15067
14970
  contextWindow: 262000,
15068
14971
  maxTokens: 262000,
15069
14972
  },
14973
+ "moonshotai/kimi-k2.7-code": {
14974
+ id: "moonshotai/kimi-k2.7-code",
14975
+ name: "Kimi K2.7 Code",
14976
+ api: "anthropic-messages",
14977
+ provider: "vercel-ai-gateway",
14978
+ baseUrl: "https://ai-gateway.vercel.sh",
14979
+ reasoning: true,
14980
+ input: ["text", "image"],
14981
+ cost: {
14982
+ input: 0.95,
14983
+ output: 4,
14984
+ cacheRead: 0.19,
14985
+ cacheWrite: 0,
14986
+ },
14987
+ contextWindow: 256000,
14988
+ maxTokens: 32768,
14989
+ },
15070
14990
  "nvidia/nemotron-3-super-120b-a12b": {
15071
14991
  id: "nvidia/nemotron-3-super-120b-a12b",
15072
14992
  name: "NVIDIA Nemotron 3 Super 120B A12B",
@@ -15110,7 +15030,7 @@ export const MODELS = {
15110
15030
  reasoning: true,
15111
15031
  input: ["text", "image"],
15112
15032
  cost: {
15113
- input: 0.19999999999999998,
15033
+ input: 0.2,
15114
15034
  output: 0.6,
15115
15035
  cacheRead: 0,
15116
15036
  cacheWrite: 0,
@@ -15128,7 +15048,7 @@ export const MODELS = {
15128
15048
  input: ["text"],
15129
15049
  cost: {
15130
15050
  input: 0.06,
15131
- output: 0.22999999999999998,
15051
+ output: 0.23,
15132
15052
  cacheRead: 0,
15133
15053
  cacheWrite: 0,
15134
15054
  },
@@ -15178,9 +15098,9 @@ export const MODELS = {
15178
15098
  reasoning: false,
15179
15099
  input: ["text", "image"],
15180
15100
  cost: {
15181
- input: 0.39999999999999997,
15182
- output: 1.5999999999999999,
15183
- cacheRead: 0.09999999999999999,
15101
+ input: 0.4,
15102
+ output: 1.6,
15103
+ cacheRead: 0.1,
15184
15104
  cacheWrite: 0,
15185
15105
  },
15186
15106
  contextWindow: 1047576,
@@ -15195,9 +15115,9 @@ export const MODELS = {
15195
15115
  reasoning: false,
15196
15116
  input: ["text", "image"],
15197
15117
  cost: {
15198
- input: 0.09999999999999999,
15199
- output: 0.39999999999999997,
15200
- cacheRead: 0.024999999999999998,
15118
+ input: 0.1,
15119
+ output: 0.4,
15120
+ cacheRead: 0.025,
15201
15121
  cacheWrite: 0,
15202
15122
  },
15203
15123
  contextWindow: 1047576,
@@ -15299,7 +15219,7 @@ export const MODELS = {
15299
15219
  cost: {
15300
15220
  input: 0.25,
15301
15221
  output: 2,
15302
- cacheRead: 0.024999999999999998,
15222
+ cacheRead: 0.025,
15303
15223
  cacheWrite: 0,
15304
15224
  },
15305
15225
  contextWindow: 400000,
@@ -15314,8 +15234,8 @@ export const MODELS = {
15314
15234
  reasoning: true,
15315
15235
  input: ["text", "image"],
15316
15236
  cost: {
15317
- input: 0.049999999999999996,
15318
- output: 0.39999999999999997,
15237
+ input: 0.05,
15238
+ output: 0.4,
15319
15239
  cacheRead: 0.005,
15320
15240
  cacheWrite: 0,
15321
15241
  },
@@ -15384,7 +15304,7 @@ export const MODELS = {
15384
15304
  cost: {
15385
15305
  input: 0.25,
15386
15306
  output: 2,
15387
- cacheRead: 0.024999999999999998,
15307
+ cacheRead: 0.025,
15388
15308
  cacheWrite: 0,
15389
15309
  },
15390
15310
  contextWindow: 400000,
@@ -15578,7 +15498,7 @@ export const MODELS = {
15578
15498
  thinkingLevelMap: { "xhigh": "xhigh" },
15579
15499
  input: ["text", "image"],
15580
15500
  cost: {
15581
- input: 0.19999999999999998,
15501
+ input: 0.2,
15582
15502
  output: 1.25,
15583
15503
  cacheRead: 0.02,
15584
15504
  cacheWrite: 0,
@@ -15666,8 +15586,8 @@ export const MODELS = {
15666
15586
  reasoning: true,
15667
15587
  input: ["text"],
15668
15588
  cost: {
15669
- input: 0.049999999999999996,
15670
- output: 0.19999999999999998,
15589
+ input: 0.05,
15590
+ output: 0.2,
15671
15591
  cacheRead: 0,
15672
15592
  cacheWrite: 0,
15673
15593
  },
@@ -15853,7 +15773,7 @@ export const MODELS = {
15853
15773
  reasoning: true,
15854
15774
  input: ["text", "image"],
15855
15775
  cost: {
15856
- input: 0.19999999999999998,
15776
+ input: 0.2,
15857
15777
  output: 1.15,
15858
15778
  cacheRead: 0.04,
15859
15779
  cacheWrite: 0,
@@ -15870,9 +15790,9 @@ export const MODELS = {
15870
15790
  reasoning: false,
15871
15791
  input: ["text", "image"],
15872
15792
  cost: {
15873
- input: 0.19999999999999998,
15793
+ input: 0.2,
15874
15794
  output: 0.5,
15875
- cacheRead: 0.049999999999999996,
15795
+ cacheRead: 0.05,
15876
15796
  cacheWrite: 0,
15877
15797
  },
15878
15798
  contextWindow: 1000000,
@@ -15887,9 +15807,9 @@ export const MODELS = {
15887
15807
  reasoning: true,
15888
15808
  input: ["text", "image"],
15889
15809
  cost: {
15890
- input: 0.19999999999999998,
15810
+ input: 0.2,
15891
15811
  output: 0.5,
15892
- cacheRead: 0.049999999999999996,
15812
+ cacheRead: 0.05,
15893
15813
  cacheWrite: 0,
15894
15814
  },
15895
15815
  contextWindow: 1000000,
@@ -15906,7 +15826,7 @@ export const MODELS = {
15906
15826
  cost: {
15907
15827
  input: 1.25,
15908
15828
  output: 2.5,
15909
- cacheRead: 0.19999999999999998,
15829
+ cacheRead: 0.2,
15910
15830
  cacheWrite: 0,
15911
15831
  },
15912
15832
  contextWindow: 2000000,
@@ -15923,7 +15843,7 @@ export const MODELS = {
15923
15843
  cost: {
15924
15844
  input: 1.25,
15925
15845
  output: 2.5,
15926
- cacheRead: 0.19999999999999998,
15846
+ cacheRead: 0.2,
15927
15847
  cacheWrite: 0,
15928
15848
  },
15929
15849
  contextWindow: 2000000,
@@ -15940,7 +15860,7 @@ export const MODELS = {
15940
15860
  cost: {
15941
15861
  input: 1.25,
15942
15862
  output: 2.5,
15943
- cacheRead: 0.19999999999999998,
15863
+ cacheRead: 0.2,
15944
15864
  cacheWrite: 0,
15945
15865
  },
15946
15866
  contextWindow: 2000000,
@@ -15957,7 +15877,7 @@ export const MODELS = {
15957
15877
  cost: {
15958
15878
  input: 1.25,
15959
15879
  output: 2.5,
15960
- cacheRead: 0.19999999999999998,
15880
+ cacheRead: 0.2,
15961
15881
  cacheWrite: 0,
15962
15882
  },
15963
15883
  contextWindow: 2000000,
@@ -15974,7 +15894,7 @@ export const MODELS = {
15974
15894
  cost: {
15975
15895
  input: 1.25,
15976
15896
  output: 2.5,
15977
- cacheRead: 0.19999999999999998,
15897
+ cacheRead: 0.2,
15978
15898
  cacheWrite: 0,
15979
15899
  },
15980
15900
  contextWindow: 2000000,
@@ -15991,7 +15911,7 @@ export const MODELS = {
15991
15911
  cost: {
15992
15912
  input: 1.25,
15993
15913
  output: 2.5,
15994
- cacheRead: 0.19999999999999998,
15914
+ cacheRead: 0.2,
15995
15915
  cacheWrite: 0,
15996
15916
  },
15997
15917
  contextWindow: 2000000,
@@ -16008,7 +15928,7 @@ export const MODELS = {
16008
15928
  cost: {
16009
15929
  input: 1.25,
16010
15930
  output: 2.5,
16011
- cacheRead: 0.19999999999999998,
15931
+ cacheRead: 0.2,
16012
15932
  cacheWrite: 0,
16013
15933
  },
16014
15934
  contextWindow: 1000000,
@@ -16025,7 +15945,7 @@ export const MODELS = {
16025
15945
  cost: {
16026
15946
  input: 1,
16027
15947
  output: 2,
16028
- cacheRead: 0.19999999999999998,
15948
+ cacheRead: 0.2,
16029
15949
  cacheWrite: 0,
16030
15950
  },
16031
15951
  contextWindow: 256000,
@@ -16040,7 +15960,7 @@ export const MODELS = {
16040
15960
  reasoning: true,
16041
15961
  input: ["text"],
16042
15962
  cost: {
16043
- input: 0.09999999999999999,
15963
+ input: 0.1,
16044
15964
  output: 0.3,
16045
15965
  cacheRead: 0.01,
16046
15966
  cacheWrite: 0,
@@ -16059,7 +15979,7 @@ export const MODELS = {
16059
15979
  cost: {
16060
15980
  input: 1,
16061
15981
  output: 3,
16062
- cacheRead: 0.19999999999999998,
15982
+ cacheRead: 0.2,
16063
15983
  cacheWrite: 0,
16064
15984
  },
16065
15985
  contextWindow: 1000000,
@@ -16125,7 +16045,7 @@ export const MODELS = {
16125
16045
  reasoning: true,
16126
16046
  input: ["text"],
16127
16047
  cost: {
16128
- input: 0.19999999999999998,
16048
+ input: 0.2,
16129
16049
  output: 1.1,
16130
16050
  cacheRead: 0.03,
16131
16051
  cacheWrite: 0,
@@ -16143,7 +16063,7 @@ export const MODELS = {
16143
16063
  input: ["text", "image"],
16144
16064
  cost: {
16145
16065
  input: 0.6,
16146
- output: 1.7999999999999998,
16066
+ output: 1.8,
16147
16067
  cacheRead: 0.11,
16148
16068
  cacheWrite: 0,
16149
16069
  },
@@ -16177,8 +16097,8 @@ export const MODELS = {
16177
16097
  input: ["text", "image"],
16178
16098
  cost: {
16179
16099
  input: 0.3,
16180
- output: 0.8999999999999999,
16181
- cacheRead: 0.049999999999999996,
16100
+ output: 0.9,
16101
+ cacheRead: 0.05,
16182
16102
  cacheWrite: 0,
16183
16103
  },
16184
16104
  contextWindow: 128000,
@@ -16228,7 +16148,7 @@ export const MODELS = {
16228
16148
  input: ["text"],
16229
16149
  cost: {
16230
16150
  input: 0.07,
16231
- output: 0.39999999999999997,
16151
+ output: 0.4,
16232
16152
  cacheRead: 0,
16233
16153
  cacheWrite: 0,
16234
16154
  },
@@ -16245,7 +16165,7 @@ export const MODELS = {
16245
16165
  input: ["text"],
16246
16166
  cost: {
16247
16167
  input: 0.06,
16248
- output: 0.39999999999999997,
16168
+ output: 0.4,
16249
16169
  cacheRead: 0.01,
16250
16170
  cacheWrite: 0,
16251
16171
  },
@@ -16262,8 +16182,8 @@ export const MODELS = {
16262
16182
  input: ["text"],
16263
16183
  cost: {
16264
16184
  input: 1,
16265
- output: 3.1999999999999997,
16266
- cacheRead: 0.19999999999999998,
16185
+ output: 3.2,
16186
+ cacheRead: 0.2,
16267
16187
  cacheWrite: 0,
16268
16188
  },
16269
16189
  contextWindow: 202800,
@@ -16370,7 +16290,7 @@ export const MODELS = {
16370
16290
  cacheRead: 0.2,
16371
16291
  cacheWrite: 0,
16372
16292
  },
16373
- contextWindow: 2000000,
16293
+ contextWindow: 1000000,
16374
16294
  maxTokens: 30000,
16375
16295
  },
16376
16296
  "grok-4.20-0309-reasoning": {
@@ -16387,7 +16307,7 @@ export const MODELS = {
16387
16307
  cacheRead: 0.2,
16388
16308
  cacheWrite: 0,
16389
16309
  },
16390
- contextWindow: 2000000,
16310
+ contextWindow: 1000000,
16391
16311
  maxTokens: 30000,
16392
16312
  },
16393
16313
  "grok-4.3": {
@@ -16533,6 +16453,24 @@ export const MODELS = {
16533
16453
  contextWindow: 1048576,
16534
16454
  maxTokens: 131072,
16535
16455
  },
16456
+ "mimo-v2.5-pro-ultraspeed": {
16457
+ id: "mimo-v2.5-pro-ultraspeed",
16458
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16459
+ api: "openai-completions",
16460
+ provider: "xiaomi",
16461
+ baseUrl: "https://api.xiaomimimo.com/v1",
16462
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16463
+ reasoning: true,
16464
+ input: ["text"],
16465
+ cost: {
16466
+ input: 1.305,
16467
+ output: 2.61,
16468
+ cacheRead: 0.0108,
16469
+ cacheWrite: 0,
16470
+ },
16471
+ contextWindow: 1048576,
16472
+ maxTokens: 131072,
16473
+ },
16536
16474
  },
16537
16475
  "xiaomi-token-plan-ams": {
16538
16476
  "mimo-v2-omni": {
@@ -16607,6 +16545,24 @@ export const MODELS = {
16607
16545
  contextWindow: 1048576,
16608
16546
  maxTokens: 131072,
16609
16547
  },
16548
+ "mimo-v2.5-pro-ultraspeed": {
16549
+ id: "mimo-v2.5-pro-ultraspeed",
16550
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16551
+ api: "openai-completions",
16552
+ provider: "xiaomi-token-plan-ams",
16553
+ baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
16554
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16555
+ reasoning: true,
16556
+ input: ["text"],
16557
+ cost: {
16558
+ input: 1.305,
16559
+ output: 2.61,
16560
+ cacheRead: 0.0108,
16561
+ cacheWrite: 0,
16562
+ },
16563
+ contextWindow: 1048576,
16564
+ maxTokens: 131072,
16565
+ },
16610
16566
  },
16611
16567
  "xiaomi-token-plan-cn": {
16612
16568
  "mimo-v2-omni": {
@@ -16681,6 +16637,24 @@ export const MODELS = {
16681
16637
  contextWindow: 1048576,
16682
16638
  maxTokens: 131072,
16683
16639
  },
16640
+ "mimo-v2.5-pro-ultraspeed": {
16641
+ id: "mimo-v2.5-pro-ultraspeed",
16642
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16643
+ api: "openai-completions",
16644
+ provider: "xiaomi-token-plan-cn",
16645
+ baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
16646
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16647
+ reasoning: true,
16648
+ input: ["text"],
16649
+ cost: {
16650
+ input: 1.305,
16651
+ output: 2.61,
16652
+ cacheRead: 0.0108,
16653
+ cacheWrite: 0,
16654
+ },
16655
+ contextWindow: 1048576,
16656
+ maxTokens: 131072,
16657
+ },
16684
16658
  },
16685
16659
  "xiaomi-token-plan-sgp": {
16686
16660
  "mimo-v2-omni": {
@@ -16755,6 +16729,24 @@ export const MODELS = {
16755
16729
  contextWindow: 1048576,
16756
16730
  maxTokens: 131072,
16757
16731
  },
16732
+ "mimo-v2.5-pro-ultraspeed": {
16733
+ id: "mimo-v2.5-pro-ultraspeed",
16734
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16735
+ api: "openai-completions",
16736
+ provider: "xiaomi-token-plan-sgp",
16737
+ baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
16738
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16739
+ reasoning: true,
16740
+ input: ["text"],
16741
+ cost: {
16742
+ input: 1.305,
16743
+ output: 2.61,
16744
+ cacheRead: 0.0108,
16745
+ cacheWrite: 0,
16746
+ },
16747
+ contextWindow: 1048576,
16748
+ maxTokens: 131072,
16749
+ },
16758
16750
  },
16759
16751
  "zai": {
16760
16752
  "glm-4.5-air": {