@earendil-works/pi-ai 0.78.1 → 0.79.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (32) hide show
  1. package/README.md +4 -2
  2. package/dist/image-models.generated.d.ts +30 -0
  3. package/dist/image-models.generated.d.ts.map +1 -1
  4. package/dist/image-models.generated.js +30 -0
  5. package/dist/image-models.generated.js.map +1 -1
  6. package/dist/models.generated.d.ts +421 -97
  7. package/dist/models.generated.d.ts.map +1 -1
  8. package/dist/models.generated.js +405 -185
  9. package/dist/models.generated.js.map +1 -1
  10. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  11. package/dist/providers/amazon-bedrock.js +14 -6
  12. package/dist/providers/amazon-bedrock.js.map +1 -1
  13. package/dist/providers/anthropic.d.ts +1 -1
  14. package/dist/providers/anthropic.d.ts.map +1 -1
  15. package/dist/providers/anthropic.js +1 -1
  16. package/dist/providers/anthropic.js.map +1 -1
  17. package/dist/providers/azure-openai-responses.d.ts.map +1 -1
  18. package/dist/providers/azure-openai-responses.js +1 -0
  19. package/dist/providers/azure-openai-responses.js.map +1 -1
  20. package/dist/providers/openai-completions.d.ts.map +1 -1
  21. package/dist/providers/openai-completions.js +3 -2
  22. package/dist/providers/openai-completions.js.map +1 -1
  23. package/dist/providers/openai-responses-shared.d.ts.map +1 -1
  24. package/dist/providers/openai-responses-shared.js +2 -1
  25. package/dist/providers/openai-responses-shared.js.map +1 -1
  26. package/dist/providers/openai-responses.d.ts.map +1 -1
  27. package/dist/providers/openai-responses.js +1 -0
  28. package/dist/providers/openai-responses.js.map +1 -1
  29. package/dist/types.d.ts +4 -2
  30. package/dist/types.d.ts.map +1 -1
  31. package/dist/types.js.map +1 -1
  32. package/package.json +1 -1
@@ -8,7 +8,7 @@ export const MODELS = {
8
8
  api: "bedrock-converse-stream",
9
9
  provider: "amazon-bedrock",
10
10
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
11
- reasoning: false,
11
+ reasoning: true,
12
12
  input: ["text", "image"],
13
13
  cost: {
14
14
  input: 0.33,
@@ -347,6 +347,24 @@ export const MODELS = {
347
347
  contextWindow: 163840,
348
348
  maxTokens: 81920,
349
349
  },
350
+ "eu.anthropic.claude-fable-5": {
351
+ id: "eu.anthropic.claude-fable-5",
352
+ name: "Claude Fable 5 (EU)",
353
+ api: "bedrock-converse-stream",
354
+ provider: "amazon-bedrock",
355
+ baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
356
+ reasoning: true,
357
+ thinkingLevelMap: { "xhigh": "xhigh" },
358
+ input: ["text", "image"],
359
+ cost: {
360
+ input: 11,
361
+ output: 55,
362
+ cacheRead: 1.1,
363
+ cacheWrite: 13.75,
364
+ },
365
+ contextWindow: 1000000,
366
+ maxTokens: 128000,
367
+ },
350
368
  "eu.anthropic.claude-haiku-4-5-20251001-v1:0": {
351
369
  id: "eu.anthropic.claude-haiku-4-5-20251001-v1:0",
352
370
  name: "Claude Haiku 4.5 (EU)",
@@ -469,6 +487,24 @@ export const MODELS = {
469
487
  contextWindow: 1000000,
470
488
  maxTokens: 64000,
471
489
  },
490
+ "global.anthropic.claude-fable-5": {
491
+ id: "global.anthropic.claude-fable-5",
492
+ name: "Claude Fable 5 (Global)",
493
+ api: "bedrock-converse-stream",
494
+ provider: "amazon-bedrock",
495
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
496
+ reasoning: true,
497
+ thinkingLevelMap: { "xhigh": "xhigh" },
498
+ input: ["text", "image"],
499
+ cost: {
500
+ input: 10,
501
+ output: 50,
502
+ cacheRead: 1,
503
+ cacheWrite: 12.5,
504
+ },
505
+ contextWindow: 1000000,
506
+ maxTokens: 128000,
507
+ },
472
508
  "global.anthropic.claude-haiku-4-5-20251001-v1:0": {
473
509
  id: "global.anthropic.claude-haiku-4-5-20251001-v1:0",
474
510
  name: "Claude Haiku 4.5 (Global)",
@@ -1086,13 +1122,66 @@ export const MODELS = {
1086
1122
  contextWindow: 262144,
1087
1123
  maxTokens: 131072,
1088
1124
  },
1125
+ "openai.gpt-5.4": {
1126
+ id: "openai.gpt-5.4",
1127
+ name: "GPT-5.4",
1128
+ api: "bedrock-converse-stream",
1129
+ provider: "amazon-bedrock",
1130
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1131
+ reasoning: true,
1132
+ thinkingLevelMap: { "xhigh": "xhigh" },
1133
+ input: ["text", "image"],
1134
+ cost: {
1135
+ input: 2.75,
1136
+ output: 16.5,
1137
+ cacheRead: 0.275,
1138
+ cacheWrite: 0,
1139
+ },
1140
+ contextWindow: 272000,
1141
+ maxTokens: 128000,
1142
+ },
1143
+ "openai.gpt-5.5": {
1144
+ id: "openai.gpt-5.5",
1145
+ name: "GPT-5.5",
1146
+ api: "bedrock-converse-stream",
1147
+ provider: "amazon-bedrock",
1148
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1149
+ reasoning: true,
1150
+ thinkingLevelMap: { "xhigh": "xhigh" },
1151
+ input: ["text", "image"],
1152
+ cost: {
1153
+ input: 5.5,
1154
+ output: 33,
1155
+ cacheRead: 0.55,
1156
+ cacheWrite: 0,
1157
+ },
1158
+ contextWindow: 272000,
1159
+ maxTokens: 128000,
1160
+ },
1161
+ "openai.gpt-oss-120b": {
1162
+ id: "openai.gpt-oss-120b",
1163
+ name: "gpt-oss-120b",
1164
+ api: "bedrock-converse-stream",
1165
+ provider: "amazon-bedrock",
1166
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1167
+ reasoning: true,
1168
+ input: ["text"],
1169
+ cost: {
1170
+ input: 0.15,
1171
+ output: 0.6,
1172
+ cacheRead: 0,
1173
+ cacheWrite: 0,
1174
+ },
1175
+ contextWindow: 128000,
1176
+ maxTokens: 16384,
1177
+ },
1089
1178
  "openai.gpt-oss-120b-1:0": {
1090
1179
  id: "openai.gpt-oss-120b-1:0",
1091
1180
  name: "gpt-oss-120b",
1092
1181
  api: "bedrock-converse-stream",
1093
1182
  provider: "amazon-bedrock",
1094
1183
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1095
- reasoning: false,
1184
+ reasoning: true,
1096
1185
  input: ["text"],
1097
1186
  cost: {
1098
1187
  input: 0.15,
@@ -1103,13 +1192,30 @@ export const MODELS = {
1103
1192
  contextWindow: 128000,
1104
1193
  maxTokens: 16384,
1105
1194
  },
1195
+ "openai.gpt-oss-20b": {
1196
+ id: "openai.gpt-oss-20b",
1197
+ name: "gpt-oss-20b",
1198
+ api: "bedrock-converse-stream",
1199
+ provider: "amazon-bedrock",
1200
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1201
+ reasoning: true,
1202
+ input: ["text"],
1203
+ cost: {
1204
+ input: 0.07,
1205
+ output: 0.3,
1206
+ cacheRead: 0,
1207
+ cacheWrite: 0,
1208
+ },
1209
+ contextWindow: 128000,
1210
+ maxTokens: 16384,
1211
+ },
1106
1212
  "openai.gpt-oss-20b-1:0": {
1107
1213
  id: "openai.gpt-oss-20b-1:0",
1108
1214
  name: "gpt-oss-20b",
1109
1215
  api: "bedrock-converse-stream",
1110
1216
  provider: "amazon-bedrock",
1111
1217
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1112
- reasoning: false,
1218
+ reasoning: true,
1113
1219
  input: ["text"],
1114
1220
  cost: {
1115
1221
  input: 0.07,
@@ -1273,6 +1379,24 @@ export const MODELS = {
1273
1379
  contextWindow: 262000,
1274
1380
  maxTokens: 262000,
1275
1381
  },
1382
+ "us.anthropic.claude-fable-5": {
1383
+ id: "us.anthropic.claude-fable-5",
1384
+ name: "Claude Fable 5 (US)",
1385
+ api: "bedrock-converse-stream",
1386
+ provider: "amazon-bedrock",
1387
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1388
+ reasoning: true,
1389
+ thinkingLevelMap: { "xhigh": "xhigh" },
1390
+ input: ["text", "image"],
1391
+ cost: {
1392
+ input: 10,
1393
+ output: 50,
1394
+ cacheRead: 1,
1395
+ cacheWrite: 12.5,
1396
+ },
1397
+ contextWindow: 1000000,
1398
+ maxTokens: 128000,
1399
+ },
1276
1400
  "us.anthropic.claude-haiku-4-5-20251001-v1:0": {
1277
1401
  id: "us.anthropic.claude-haiku-4-5-20251001-v1:0",
1278
1402
  name: "Claude Haiku 4.5 (US)",
@@ -1743,6 +1867,25 @@ export const MODELS = {
1743
1867
  contextWindow: 200000,
1744
1868
  maxTokens: 4096,
1745
1869
  },
1870
+ "claude-fable-5": {
1871
+ id: "claude-fable-5",
1872
+ name: "Claude Fable 5",
1873
+ api: "anthropic-messages",
1874
+ provider: "anthropic",
1875
+ baseUrl: "https://api.anthropic.com",
1876
+ compat: { "forceAdaptiveThinking": true },
1877
+ reasoning: true,
1878
+ thinkingLevelMap: { "xhigh": "xhigh" },
1879
+ input: ["text", "image"],
1880
+ cost: {
1881
+ input: 10,
1882
+ output: 50,
1883
+ cacheRead: 1,
1884
+ cacheWrite: 12.5,
1885
+ },
1886
+ contextWindow: 1000000,
1887
+ maxTokens: 128000,
1888
+ },
1746
1889
  "claude-haiku-4-5": {
1747
1890
  id: "claude-haiku-4-5",
1748
1891
  name: "Claude Haiku 4.5 (latest)",
@@ -2300,7 +2443,7 @@ export const MODELS = {
2300
2443
  cacheWrite: 0,
2301
2444
  },
2302
2445
  contextWindow: 400000,
2303
- maxTokens: 272000,
2446
+ maxTokens: 128000,
2304
2447
  },
2305
2448
  "gpt-5.1": {
2306
2449
  id: "gpt-5.1",
@@ -2533,7 +2676,7 @@ export const MODELS = {
2533
2676
  cacheRead: 0.25,
2534
2677
  cacheWrite: 0,
2535
2678
  },
2536
- contextWindow: 272000,
2679
+ contextWindow: 1050000,
2537
2680
  maxTokens: 128000,
2538
2681
  },
2539
2682
  "gpt-5.4-mini": {
@@ -2605,7 +2748,7 @@ export const MODELS = {
2605
2748
  cacheRead: 0.5,
2606
2749
  cacheWrite: 0,
2607
2750
  },
2608
- contextWindow: 272000,
2751
+ contextWindow: 1050000,
2609
2752
  maxTokens: 128000,
2610
2753
  },
2611
2754
  "gpt-5.5-pro": {
@@ -2919,6 +3062,25 @@ export const MODELS = {
2919
3062
  contextWindow: 200000,
2920
3063
  maxTokens: 8192,
2921
3064
  },
3065
+ "claude-fable-5": {
3066
+ id: "claude-fable-5",
3067
+ name: "Claude Fable 5",
3068
+ api: "anthropic-messages",
3069
+ provider: "cloudflare-ai-gateway",
3070
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3071
+ compat: { "forceAdaptiveThinking": true },
3072
+ reasoning: true,
3073
+ thinkingLevelMap: { "xhigh": "xhigh" },
3074
+ input: ["text", "image"],
3075
+ cost: {
3076
+ input: 10,
3077
+ output: 50,
3078
+ cacheRead: 1,
3079
+ cacheWrite: 12.5,
3080
+ },
3081
+ contextWindow: 1000000,
3082
+ maxTokens: 128000,
3083
+ },
2922
3084
  "claude-haiku-4-5": {
2923
3085
  id: "claude-haiku-4-5",
2924
3086
  name: "Claude Haiku 4.5 (latest)",
@@ -3887,6 +4049,24 @@ export const MODELS = {
3887
4049
  contextWindow: 202800,
3888
4050
  maxTokens: 131072,
3889
4051
  },
4052
+ "accounts/fireworks/routers/kimi-k2p6-fast": {
4053
+ id: "accounts/fireworks/routers/kimi-k2p6-fast",
4054
+ name: "Kimi K2.6 Fast",
4055
+ api: "anthropic-messages",
4056
+ provider: "fireworks",
4057
+ baseUrl: "https://api.fireworks.ai/inference",
4058
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
4059
+ reasoning: true,
4060
+ input: ["text", "image"],
4061
+ cost: {
4062
+ input: 2,
4063
+ output: 8,
4064
+ cacheRead: 0.3,
4065
+ cacheWrite: 0,
4066
+ },
4067
+ contextWindow: 262000,
4068
+ maxTokens: 262000,
4069
+ },
3890
4070
  "accounts/fireworks/routers/kimi-k2p6-turbo": {
3891
4071
  id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3892
4072
  name: "Kimi K2.6 Turbo",
@@ -6019,11 +6199,11 @@ export const MODELS = {
6019
6199
  api: "mistral-conversations",
6020
6200
  provider: "mistral",
6021
6201
  baseUrl: "https://api.mistral.ai",
6022
- reasoning: true,
6202
+ reasoning: false,
6023
6203
  input: ["text", "image"],
6024
6204
  cost: {
6025
- input: 1.5,
6026
- output: 7.5,
6205
+ input: 0.4,
6206
+ output: 2,
6027
6207
  cacheRead: 0,
6028
6208
  cacheWrite: 0,
6029
6209
  },
@@ -6208,7 +6388,7 @@ export const MODELS = {
6208
6388
  api: "openai-completions",
6209
6389
  provider: "moonshotai",
6210
6390
  baseUrl: "https://api.moonshot.ai/v1",
6211
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6391
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6212
6392
  reasoning: false,
6213
6393
  input: ["text"],
6214
6394
  cost: {
@@ -6226,7 +6406,7 @@ export const MODELS = {
6226
6406
  api: "openai-completions",
6227
6407
  provider: "moonshotai",
6228
6408
  baseUrl: "https://api.moonshot.ai/v1",
6229
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6409
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6230
6410
  reasoning: false,
6231
6411
  input: ["text"],
6232
6412
  cost: {
@@ -6244,7 +6424,7 @@ export const MODELS = {
6244
6424
  api: "openai-completions",
6245
6425
  provider: "moonshotai",
6246
6426
  baseUrl: "https://api.moonshot.ai/v1",
6247
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6427
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6248
6428
  reasoning: true,
6249
6429
  input: ["text"],
6250
6430
  cost: {
@@ -6262,7 +6442,7 @@ export const MODELS = {
6262
6442
  api: "openai-completions",
6263
6443
  provider: "moonshotai",
6264
6444
  baseUrl: "https://api.moonshot.ai/v1",
6265
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6445
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6266
6446
  reasoning: true,
6267
6447
  input: ["text"],
6268
6448
  cost: {
@@ -6280,7 +6460,7 @@ export const MODELS = {
6280
6460
  api: "openai-completions",
6281
6461
  provider: "moonshotai",
6282
6462
  baseUrl: "https://api.moonshot.ai/v1",
6283
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6463
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6284
6464
  reasoning: false,
6285
6465
  input: ["text"],
6286
6466
  cost: {
@@ -6298,7 +6478,7 @@ export const MODELS = {
6298
6478
  api: "openai-completions",
6299
6479
  provider: "moonshotai",
6300
6480
  baseUrl: "https://api.moonshot.ai/v1",
6301
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6481
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6302
6482
  reasoning: true,
6303
6483
  input: ["text", "image"],
6304
6484
  cost: {
@@ -6316,7 +6496,7 @@ export const MODELS = {
6316
6496
  api: "openai-completions",
6317
6497
  provider: "moonshotai",
6318
6498
  baseUrl: "https://api.moonshot.ai/v1",
6319
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6499
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6320
6500
  reasoning: true,
6321
6501
  input: ["text", "image"],
6322
6502
  cost: {
@@ -6336,7 +6516,7 @@ export const MODELS = {
6336
6516
  api: "openai-completions",
6337
6517
  provider: "moonshotai-cn",
6338
6518
  baseUrl: "https://api.moonshot.cn/v1",
6339
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6519
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6340
6520
  reasoning: false,
6341
6521
  input: ["text"],
6342
6522
  cost: {
@@ -6354,7 +6534,7 @@ export const MODELS = {
6354
6534
  api: "openai-completions",
6355
6535
  provider: "moonshotai-cn",
6356
6536
  baseUrl: "https://api.moonshot.cn/v1",
6357
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6537
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6358
6538
  reasoning: false,
6359
6539
  input: ["text"],
6360
6540
  cost: {
@@ -6372,7 +6552,7 @@ export const MODELS = {
6372
6552
  api: "openai-completions",
6373
6553
  provider: "moonshotai-cn",
6374
6554
  baseUrl: "https://api.moonshot.cn/v1",
6375
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6555
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6376
6556
  reasoning: true,
6377
6557
  input: ["text"],
6378
6558
  cost: {
@@ -6390,7 +6570,7 @@ export const MODELS = {
6390
6570
  api: "openai-completions",
6391
6571
  provider: "moonshotai-cn",
6392
6572
  baseUrl: "https://api.moonshot.cn/v1",
6393
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6573
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6394
6574
  reasoning: true,
6395
6575
  input: ["text"],
6396
6576
  cost: {
@@ -6408,7 +6588,7 @@ export const MODELS = {
6408
6588
  api: "openai-completions",
6409
6589
  provider: "moonshotai-cn",
6410
6590
  baseUrl: "https://api.moonshot.cn/v1",
6411
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6591
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6412
6592
  reasoning: false,
6413
6593
  input: ["text"],
6414
6594
  cost: {
@@ -6426,7 +6606,7 @@ export const MODELS = {
6426
6606
  api: "openai-completions",
6427
6607
  provider: "moonshotai-cn",
6428
6608
  baseUrl: "https://api.moonshot.cn/v1",
6429
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6609
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6430
6610
  reasoning: true,
6431
6611
  input: ["text", "image"],
6432
6612
  cost: {
@@ -6444,7 +6624,7 @@ export const MODELS = {
6444
6624
  api: "openai-completions",
6445
6625
  provider: "moonshotai-cn",
6446
6626
  baseUrl: "https://api.moonshot.cn/v1",
6447
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false },
6627
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "thinkingFormat": "deepseek" },
6448
6628
  reasoning: true,
6449
6629
  input: ["text", "image"],
6450
6630
  cost: {
@@ -6705,6 +6885,25 @@ export const MODELS = {
6705
6885
  contextWindow: 262144,
6706
6886
  maxTokens: 262144,
6707
6887
  },
6888
+ "nvidia/nemotron-3-ultra-550b-a55b": {
6889
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
6890
+ name: "Nemotron 3 Ultra 550B A55B",
6891
+ api: "openai-completions",
6892
+ provider: "nvidia",
6893
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6894
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6895
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6896
+ reasoning: true,
6897
+ input: ["text"],
6898
+ cost: {
6899
+ input: 0.5,
6900
+ output: 2.5,
6901
+ cacheRead: 0.15,
6902
+ cacheWrite: 0,
6903
+ },
6904
+ contextWindow: 1000000,
6905
+ maxTokens: 65536,
6906
+ },
6708
6907
  "nvidia/nvidia-nemotron-nano-9b-v2": {
6709
6908
  id: "nvidia/nvidia-nemotron-nano-9b-v2",
6710
6909
  name: "nvidia-nemotron-nano-9b-v2",
@@ -7116,7 +7315,7 @@ export const MODELS = {
7116
7315
  cacheWrite: 0,
7117
7316
  },
7118
7317
  contextWindow: 400000,
7119
- maxTokens: 272000,
7318
+ maxTokens: 128000,
7120
7319
  },
7121
7320
  "gpt-5.1": {
7122
7321
  id: "gpt-5.1",
@@ -7660,6 +7859,7 @@ export const MODELS = {
7660
7859
  api: "openai-completions",
7661
7860
  provider: "opencode",
7662
7861
  baseUrl: "https://opencode.ai/zen/v1",
7862
+ compat: { "maxTokensField": "max_tokens" },
7663
7863
  reasoning: true,
7664
7864
  input: ["text"],
7665
7865
  cost: {
@@ -7671,6 +7871,25 @@ export const MODELS = {
7671
7871
  contextWindow: 200000,
7672
7872
  maxTokens: 32000,
7673
7873
  },
7874
+ "claude-fable-5": {
7875
+ id: "claude-fable-5",
7876
+ name: "Claude Fable 5",
7877
+ api: "anthropic-messages",
7878
+ provider: "opencode",
7879
+ baseUrl: "https://opencode.ai/zen",
7880
+ compat: { "forceAdaptiveThinking": true },
7881
+ reasoning: true,
7882
+ thinkingLevelMap: { "xhigh": "xhigh" },
7883
+ input: ["text", "image"],
7884
+ cost: {
7885
+ input: 10,
7886
+ output: 50,
7887
+ cacheRead: 1,
7888
+ cacheWrite: 12.5,
7889
+ },
7890
+ contextWindow: 1000000,
7891
+ maxTokens: 128000,
7892
+ },
7674
7893
  "claude-haiku-4-5": {
7675
7894
  id: "claude-haiku-4-5",
7676
7895
  name: "Claude Haiku 4.5",
@@ -7837,7 +8056,7 @@ export const MODELS = {
7837
8056
  api: "openai-completions",
7838
8057
  provider: "opencode",
7839
8058
  baseUrl: "https://opencode.ai/zen/v1",
7840
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8059
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7841
8060
  reasoning: true,
7842
8061
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7843
8062
  input: ["text"],
@@ -7856,7 +8075,7 @@ export const MODELS = {
7856
8075
  api: "openai-completions",
7857
8076
  provider: "opencode",
7858
8077
  baseUrl: "https://opencode.ai/zen/v1",
7859
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8078
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7860
8079
  reasoning: true,
7861
8080
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7862
8081
  input: ["text"],
@@ -7929,6 +8148,7 @@ export const MODELS = {
7929
8148
  api: "openai-completions",
7930
8149
  provider: "opencode",
7931
8150
  baseUrl: "https://opencode.ai/zen/v1",
8151
+ compat: { "maxTokensField": "max_tokens" },
7932
8152
  reasoning: true,
7933
8153
  input: ["text"],
7934
8154
  cost: {
@@ -7946,6 +8166,7 @@ export const MODELS = {
7946
8166
  api: "openai-completions",
7947
8167
  provider: "opencode",
7948
8168
  baseUrl: "https://opencode.ai/zen/v1",
8169
+ compat: { "maxTokensField": "max_tokens" },
7949
8170
  reasoning: true,
7950
8171
  input: ["text"],
7951
8172
  cost: {
@@ -8251,7 +8472,7 @@ export const MODELS = {
8251
8472
  api: "openai-completions",
8252
8473
  provider: "opencode",
8253
8474
  baseUrl: "https://opencode.ai/zen/v1",
8254
- compat: { "supportsReasoningEffort": false },
8475
+ compat: { "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8255
8476
  reasoning: true,
8256
8477
  thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
8257
8478
  input: ["text", "image"],
@@ -8270,6 +8491,7 @@ export const MODELS = {
8270
8491
  api: "openai-completions",
8271
8492
  provider: "opencode",
8272
8493
  baseUrl: "https://opencode.ai/zen/v1",
8494
+ compat: { "maxTokensField": "max_tokens" },
8273
8495
  reasoning: true,
8274
8496
  input: ["text", "image"],
8275
8497
  cost: {
@@ -8287,7 +8509,7 @@ export const MODELS = {
8287
8509
  api: "openai-completions",
8288
8510
  provider: "opencode",
8289
8511
  baseUrl: "https://opencode.ai/zen/v1",
8290
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
8512
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8291
8513
  reasoning: true,
8292
8514
  input: ["text", "image"],
8293
8515
  cost: {
@@ -8305,6 +8527,7 @@ export const MODELS = {
8305
8527
  api: "openai-completions",
8306
8528
  provider: "opencode",
8307
8529
  baseUrl: "https://opencode.ai/zen/v1",
8530
+ compat: { "maxTokensField": "max_tokens" },
8308
8531
  reasoning: true,
8309
8532
  input: ["text", "image"],
8310
8533
  cost: {
@@ -8322,6 +8545,7 @@ export const MODELS = {
8322
8545
  api: "openai-completions",
8323
8546
  provider: "opencode",
8324
8547
  baseUrl: "https://opencode.ai/zen/v1",
8548
+ compat: { "maxTokensField": "max_tokens" },
8325
8549
  reasoning: true,
8326
8550
  input: ["text"],
8327
8551
  cost: {
@@ -8339,6 +8563,7 @@ export const MODELS = {
8339
8563
  api: "openai-completions",
8340
8564
  provider: "opencode",
8341
8565
  baseUrl: "https://opencode.ai/zen/v1",
8566
+ compat: { "maxTokensField": "max_tokens" },
8342
8567
  reasoning: true,
8343
8568
  input: ["text"],
8344
8569
  cost: {
@@ -8350,29 +8575,31 @@ export const MODELS = {
8350
8575
  contextWindow: 204800,
8351
8576
  maxTokens: 131072,
8352
8577
  },
8353
- "minimax-m3-free": {
8354
- id: "minimax-m3-free",
8355
- name: "MiniMax M3 Free",
8356
- api: "anthropic-messages",
8578
+ "nemotron-3-ultra-free": {
8579
+ id: "nemotron-3-ultra-free",
8580
+ name: "Nemotron 3 Ultra Free",
8581
+ api: "openai-completions",
8357
8582
  provider: "opencode",
8358
- baseUrl: "https://opencode.ai/zen",
8583
+ baseUrl: "https://opencode.ai/zen/v1",
8584
+ compat: { "maxTokensField": "max_tokens" },
8359
8585
  reasoning: true,
8360
- input: ["text", "image"],
8586
+ input: ["text"],
8361
8587
  cost: {
8362
8588
  input: 0,
8363
8589
  output: 0,
8364
8590
  cacheRead: 0,
8365
8591
  cacheWrite: 0,
8366
8592
  },
8367
- contextWindow: 200000,
8368
- maxTokens: 32000,
8593
+ contextWindow: 1000000,
8594
+ maxTokens: 128000,
8369
8595
  },
8370
- "nemotron-3-ultra-free": {
8371
- id: "nemotron-3-ultra-free",
8372
- name: "Nemotron 3 Ultra Free",
8596
+ "north-mini-code-free": {
8597
+ id: "north-mini-code-free",
8598
+ name: "North Mini Code Free",
8373
8599
  api: "openai-completions",
8374
8600
  provider: "opencode",
8375
8601
  baseUrl: "https://opencode.ai/zen/v1",
8602
+ compat: { "maxTokensField": "max_tokens" },
8376
8603
  reasoning: true,
8377
8604
  input: ["text"],
8378
8605
  cost: {
@@ -8381,8 +8608,8 @@ export const MODELS = {
8381
8608
  cacheRead: 0,
8382
8609
  cacheWrite: 0,
8383
8610
  },
8384
- contextWindow: 1000000,
8385
- maxTokens: 128000,
8611
+ contextWindow: 256000,
8612
+ maxTokens: 64000,
8386
8613
  },
8387
8614
  "qwen3.5-plus": {
8388
8615
  id: "qwen3.5-plus",
@@ -8426,7 +8653,7 @@ export const MODELS = {
8426
8653
  api: "openai-completions",
8427
8654
  provider: "opencode-go",
8428
8655
  baseUrl: "https://opencode.ai/zen/go/v1",
8429
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8656
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8430
8657
  reasoning: true,
8431
8658
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8432
8659
  input: ["text"],
@@ -8445,7 +8672,7 @@ export const MODELS = {
8445
8672
  api: "openai-completions",
8446
8673
  provider: "opencode-go",
8447
8674
  baseUrl: "https://opencode.ai/zen/go/v1",
8448
- compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8675
+ compat: { "maxTokensField": "max_tokens", "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
8449
8676
  reasoning: true,
8450
8677
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
8451
8678
  input: ["text"],
@@ -8464,6 +8691,7 @@ export const MODELS = {
8464
8691
  api: "openai-completions",
8465
8692
  provider: "opencode-go",
8466
8693
  baseUrl: "https://opencode.ai/zen/go/v1",
8694
+ compat: { "maxTokensField": "max_tokens" },
8467
8695
  reasoning: true,
8468
8696
  input: ["text"],
8469
8697
  cost: {
@@ -8481,6 +8709,7 @@ export const MODELS = {
8481
8709
  api: "openai-completions",
8482
8710
  provider: "opencode-go",
8483
8711
  baseUrl: "https://opencode.ai/zen/go/v1",
8712
+ compat: { "maxTokensField": "max_tokens" },
8484
8713
  reasoning: true,
8485
8714
  input: ["text"],
8486
8715
  cost: {
@@ -8498,6 +8727,7 @@ export const MODELS = {
8498
8727
  api: "openai-completions",
8499
8728
  provider: "opencode-go",
8500
8729
  baseUrl: "https://opencode.ai/zen/go/v1",
8730
+ compat: { "maxTokensField": "max_tokens" },
8501
8731
  reasoning: true,
8502
8732
  input: ["text", "image"],
8503
8733
  cost: {
@@ -8515,7 +8745,7 @@ export const MODELS = {
8515
8745
  api: "openai-completions",
8516
8746
  provider: "opencode-go",
8517
8747
  baseUrl: "https://opencode.ai/zen/go/v1",
8518
- compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false },
8748
+ compat: { "thinkingFormat": "deepseek", "supportsReasoningEffort": false, "maxTokensField": "max_tokens" },
8519
8749
  reasoning: true,
8520
8750
  thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
8521
8751
  input: ["text", "image"],
@@ -8534,6 +8764,7 @@ export const MODELS = {
8534
8764
  api: "openai-completions",
8535
8765
  provider: "opencode-go",
8536
8766
  baseUrl: "https://opencode.ai/zen/go/v1",
8767
+ compat: { "maxTokensField": "max_tokens" },
8537
8768
  reasoning: true,
8538
8769
  input: ["text", "image"],
8539
8770
  cost: {
@@ -8551,6 +8782,7 @@ export const MODELS = {
8551
8782
  api: "openai-completions",
8552
8783
  provider: "opencode-go",
8553
8784
  baseUrl: "https://opencode.ai/zen/go/v1",
8785
+ compat: { "maxTokensField": "max_tokens" },
8554
8786
  reasoning: true,
8555
8787
  input: ["text"],
8556
8788
  cost: {
@@ -8585,6 +8817,7 @@ export const MODELS = {
8585
8817
  api: "openai-completions",
8586
8818
  provider: "opencode-go",
8587
8819
  baseUrl: "https://opencode.ai/zen/go/v1",
8820
+ compat: { "maxTokensField": "max_tokens" },
8588
8821
  reasoning: true,
8589
8822
  input: ["text"],
8590
8823
  cost: {
@@ -8605,9 +8838,9 @@ export const MODELS = {
8605
8838
  reasoning: true,
8606
8839
  input: ["text", "image"],
8607
8840
  cost: {
8608
- input: 0.6,
8609
- output: 2.4,
8610
- cacheRead: 0.12,
8841
+ input: 0.3,
8842
+ output: 1.2,
8843
+ cacheRead: 0.06,
8611
8844
  cacheWrite: 0,
8612
8845
  },
8613
8846
  contextWindow: 512000,
@@ -8619,7 +8852,7 @@ export const MODELS = {
8619
8852
  api: "openai-completions",
8620
8853
  provider: "opencode-go",
8621
8854
  baseUrl: "https://opencode.ai/zen/go/v1",
8622
- compat: { "thinkingFormat": "qwen" },
8855
+ compat: { "thinkingFormat": "qwen", "maxTokensField": "max_tokens" },
8623
8856
  reasoning: true,
8624
8857
  input: ["text", "image"],
8625
8858
  cost: {
@@ -8628,7 +8861,7 @@ export const MODELS = {
8628
8861
  cacheRead: 0.05,
8629
8862
  cacheWrite: 0.625,
8630
8863
  },
8631
- contextWindow: 262144,
8864
+ contextWindow: 1000000,
8632
8865
  maxTokens: 65536,
8633
8866
  },
8634
8867
  "qwen3.7-max": {
@@ -8662,7 +8895,7 @@ export const MODELS = {
8662
8895
  cacheRead: 0.04,
8663
8896
  cacheWrite: 0.5,
8664
8897
  },
8665
- contextWindow: 262144,
8898
+ contextWindow: 1000000,
8666
8899
  maxTokens: 65536,
8667
8900
  },
8668
8901
  },
@@ -8803,6 +9036,23 @@ export const MODELS = {
8803
9036
  contextWindow: 200000,
8804
9037
  maxTokens: 8192,
8805
9038
  },
9039
+ "anthropic/claude-fable-5": {
9040
+ id: "anthropic/claude-fable-5",
9041
+ name: "Anthropic: Claude Fable 5",
9042
+ api: "openai-completions",
9043
+ provider: "openrouter",
9044
+ baseUrl: "https://openrouter.ai/api/v1",
9045
+ reasoning: true,
9046
+ input: ["text", "image"],
9047
+ cost: {
9048
+ input: 10,
9049
+ output: 50,
9050
+ cacheRead: 1,
9051
+ cacheWrite: 12.5,
9052
+ },
9053
+ contextWindow: 1000000,
9054
+ maxTokens: 128000,
9055
+ },
8806
9056
  "anthropic/claude-haiku-4.5": {
8807
9057
  id: "anthropic/claude-haiku-4.5",
8808
9058
  name: "Anthropic: Claude Haiku 4.5",
@@ -9098,23 +9348,6 @@ export const MODELS = {
9098
9348
  contextWindow: 2000000,
9099
9349
  maxTokens: 30000,
9100
9350
  },
9101
- "baidu/ernie-4.5-vl-28b-a3b": {
9102
- id: "baidu/ernie-4.5-vl-28b-a3b",
9103
- name: "Baidu: ERNIE 4.5 VL 28B A3B",
9104
- api: "openai-completions",
9105
- provider: "openrouter",
9106
- baseUrl: "https://openrouter.ai/api/v1",
9107
- reasoning: true,
9108
- input: ["text", "image"],
9109
- cost: {
9110
- input: 0.14,
9111
- output: 0.56,
9112
- cacheRead: 0,
9113
- cacheWrite: 0,
9114
- },
9115
- contextWindow: 131072,
9116
- maxTokens: 8000,
9117
- },
9118
9351
  "bytedance-seed/seed-1.6": {
9119
9352
  id: "bytedance-seed/seed-1.6",
9120
9353
  name: "ByteDance Seed: Seed 1.6",
@@ -9621,8 +9854,8 @@ export const MODELS = {
9621
9854
  reasoning: false,
9622
9855
  input: ["text", "image"],
9623
9856
  cost: {
9624
- input: 0.04,
9625
- output: 0.13,
9857
+ input: 0.049999999999999996,
9858
+ output: 0.15,
9626
9859
  cacheRead: 0,
9627
9860
  cacheWrite: 0,
9628
9861
  },
@@ -9690,12 +9923,12 @@ export const MODELS = {
9690
9923
  input: ["text", "image"],
9691
9924
  cost: {
9692
9925
  input: 0.12,
9693
- output: 0.37,
9694
- cacheRead: 0,
9926
+ output: 0.36,
9927
+ cacheRead: 0.09,
9695
9928
  cacheWrite: 0,
9696
9929
  },
9697
9930
  contextWindow: 262144,
9698
- maxTokens: 16384,
9931
+ maxTokens: 8192,
9699
9932
  },
9700
9933
  "google/gemma-4-31b-it:free": {
9701
9934
  id: "google/gemma-4-31b-it:free",
@@ -9844,7 +10077,7 @@ export const MODELS = {
9844
10077
  input: ["text"],
9845
10078
  cost: {
9846
10079
  input: 0.02,
9847
- output: 0.049999999999999996,
10080
+ output: 0.03,
9848
10081
  cacheRead: 0,
9849
10082
  cacheWrite: 0,
9850
10083
  },
@@ -9911,7 +10144,7 @@ export const MODELS = {
9911
10144
  reasoning: false,
9912
10145
  input: ["text", "image"],
9913
10146
  cost: {
9914
- input: 0.08,
10147
+ input: 0.09999999999999999,
9915
10148
  output: 0.3,
9916
10149
  cacheRead: 0,
9917
10150
  cacheWrite: 0,
@@ -9980,8 +10213,8 @@ export const MODELS = {
9980
10213
  input: ["text"],
9981
10214
  cost: {
9982
10215
  input: 0.15,
9983
- output: 1.15,
9984
- cacheRead: 0,
10216
+ output: 0.8999999999999999,
10217
+ cacheRead: 0.049999999999999996,
9985
10218
  cacheWrite: 0,
9986
10219
  },
9987
10220
  contextWindow: 204800,
@@ -9996,9 +10229,9 @@ export const MODELS = {
9996
10229
  reasoning: true,
9997
10230
  input: ["text"],
9998
10231
  cost: {
9999
- input: 0.27899999999999997,
10000
- output: 1.2,
10001
- cacheRead: 0,
10232
+ input: 0.27,
10233
+ output: 1.08,
10234
+ cacheRead: 0.054,
10002
10235
  cacheWrite: 0,
10003
10236
  },
10004
10237
  contextWindow: 204800,
@@ -10388,13 +10621,13 @@ export const MODELS = {
10388
10621
  reasoning: true,
10389
10622
  input: ["text", "image"],
10390
10623
  cost: {
10391
- input: 0.684,
10392
- output: 3.42,
10393
- cacheRead: 0.144,
10624
+ input: 0.6799999999999999,
10625
+ output: 3.41,
10626
+ cacheRead: 0.33999999999999997,
10394
10627
  cacheWrite: 0,
10395
10628
  },
10396
10629
  contextWindow: 262144,
10397
- maxTokens: 262144,
10630
+ maxTokens: 262142,
10398
10631
  },
10399
10632
  "moonshotai/kimi-k2.6:free": {
10400
10633
  id: "moonshotai/kimi-k2.6:free",
@@ -10414,22 +10647,22 @@ export const MODELS = {
10414
10647
  contextWindow: 262144,
10415
10648
  maxTokens: 4096,
10416
10649
  },
10417
- "nex-agi/deepseek-v3.1-nex-n1": {
10418
- id: "nex-agi/deepseek-v3.1-nex-n1",
10419
- name: "Nex AGI: DeepSeek V3.1 Nex N1",
10650
+ "nex-agi/nex-n2-pro:free": {
10651
+ id: "nex-agi/nex-n2-pro:free",
10652
+ name: "Nex AGI: Nex-N2-Pro (free)",
10420
10653
  api: "openai-completions",
10421
10654
  provider: "openrouter",
10422
10655
  baseUrl: "https://openrouter.ai/api/v1",
10423
- reasoning: false,
10424
- input: ["text"],
10656
+ reasoning: true,
10657
+ input: ["text", "image"],
10425
10658
  cost: {
10426
- input: 0.135,
10427
- output: 0.5,
10659
+ input: 0,
10660
+ output: 0,
10428
10661
  cacheRead: 0,
10429
10662
  cacheWrite: 0,
10430
10663
  },
10431
- contextWindow: 131072,
10432
- maxTokens: 163840,
10664
+ contextWindow: 262144,
10665
+ maxTokens: 262144,
10433
10666
  },
10434
10667
  "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
10435
10668
  id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
@@ -10440,7 +10673,7 @@ export const MODELS = {
10440
10673
  reasoning: true,
10441
10674
  input: ["text"],
10442
10675
  cost: {
10443
- input: 0.09999999999999999,
10676
+ input: 0.39999999999999997,
10444
10677
  output: 0.39999999999999997,
10445
10678
  cacheRead: 0,
10446
10679
  cacheWrite: 0,
@@ -10686,23 +10919,6 @@ export const MODELS = {
10686
10919
  contextWindow: 8191,
10687
10920
  maxTokens: 4096,
10688
10921
  },
10689
- "openai/gpt-4-1106-preview": {
10690
- id: "openai/gpt-4-1106-preview",
10691
- name: "OpenAI: GPT-4 Turbo (older v1106)",
10692
- api: "openai-completions",
10693
- provider: "openrouter",
10694
- baseUrl: "https://openrouter.ai/api/v1",
10695
- reasoning: false,
10696
- input: ["text"],
10697
- cost: {
10698
- input: 10,
10699
- output: 30,
10700
- cacheRead: 0,
10701
- cacheWrite: 0,
10702
- },
10703
- contextWindow: 128000,
10704
- maxTokens: 4096,
10705
- },
10706
10922
  "openai/gpt-4-turbo": {
10707
10923
  id: "openai/gpt-4-turbo",
10708
10924
  name: "OpenAI: GPT-4 Turbo",
@@ -11778,7 +11994,7 @@ export const MODELS = {
11778
11994
  reasoning: false,
11779
11995
  input: ["text"],
11780
11996
  cost: {
11781
- input: 0.071,
11997
+ input: 0.09,
11782
11998
  output: 0.09999999999999999,
11783
11999
  cacheRead: 0,
11784
12000
  cacheWrite: 0,
@@ -11812,13 +12028,13 @@ export const MODELS = {
11812
12028
  reasoning: true,
11813
12029
  input: ["text"],
11814
12030
  cost: {
11815
- input: 0.09,
11816
- output: 0.44999999999999996,
12031
+ input: 0.12,
12032
+ output: 0.5,
11817
12033
  cacheRead: 0,
11818
12034
  cacheWrite: 0,
11819
12035
  },
11820
12036
  contextWindow: 131072,
11821
- maxTokens: 20000,
12037
+ maxTokens: 16384,
11822
12038
  },
11823
12039
  "qwen/qwen3-30b-a3b-instruct-2507": {
11824
12040
  id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -12271,13 +12487,13 @@ export const MODELS = {
12271
12487
  reasoning: true,
12272
12488
  input: ["text", "image"],
12273
12489
  cost: {
12274
- input: 0.04,
12490
+ input: 0.09999999999999999,
12275
12491
  output: 0.15,
12276
12492
  cacheRead: 0,
12277
12493
  cacheWrite: 0,
12278
12494
  },
12279
12495
  contextWindow: 262144,
12280
- maxTokens: 81920,
12496
+ maxTokens: 262144,
12281
12497
  },
12282
12498
  "qwen/qwen3.5-flash-02-23": {
12283
12499
  id: "qwen/qwen3.5-flash-02-23",
@@ -12339,13 +12555,13 @@ export const MODELS = {
12339
12555
  reasoning: true,
12340
12556
  input: ["text", "image"],
12341
12557
  cost: {
12342
- input: 0.29,
12343
- output: 3.1999999999999997,
12558
+ input: 0.28900000000000003,
12559
+ output: 2.4,
12344
12560
  cacheRead: 0,
12345
12561
  cacheWrite: 0,
12346
12562
  },
12347
12563
  contextWindow: 262144,
12348
- maxTokens: 262140,
12564
+ maxTokens: 131072,
12349
12565
  },
12350
12566
  "qwen/qwen3.6-35b-a3b": {
12351
12567
  id: "qwen/qwen3.6-35b-a3b",
@@ -12483,23 +12699,6 @@ export const MODELS = {
12483
12699
  contextWindow: 256000,
12484
12700
  maxTokens: 128000,
12485
12701
  },
12486
- "sao10k/l3-euryale-70b": {
12487
- id: "sao10k/l3-euryale-70b",
12488
- name: "Sao10k: Llama 3 Euryale 70B v2.1",
12489
- api: "openai-completions",
12490
- provider: "openrouter",
12491
- baseUrl: "https://openrouter.ai/api/v1",
12492
- reasoning: false,
12493
- input: ["text"],
12494
- cost: {
12495
- input: 1.48,
12496
- output: 1.48,
12497
- cacheRead: 0,
12498
- cacheWrite: 0,
12499
- },
12500
- contextWindow: 8192,
12501
- maxTokens: 8192,
12502
- },
12503
12702
  "sao10k/l3.1-euryale-70b": {
12504
12703
  id: "sao10k/l3.1-euryale-70b",
12505
12704
  name: "Sao10K: Llama 3.1 Euryale 70B v2.2",
@@ -12942,6 +13141,23 @@ export const MODELS = {
12942
13141
  contextWindow: 202752,
12943
13142
  maxTokens: 131072,
12944
13143
  },
13144
+ "~anthropic/claude-fable-latest": {
13145
+ id: "~anthropic/claude-fable-latest",
13146
+ name: "Anthropic: Claude Fable Latest",
13147
+ api: "openai-completions",
13148
+ provider: "openrouter",
13149
+ baseUrl: "https://openrouter.ai/api/v1",
13150
+ reasoning: true,
13151
+ input: ["text", "image"],
13152
+ cost: {
13153
+ input: 10,
13154
+ output: 50,
13155
+ cacheRead: 1,
13156
+ cacheWrite: 12.5,
13157
+ },
13158
+ contextWindow: 1000000,
13159
+ maxTokens: 128000,
13160
+ },
12945
13161
  "~anthropic/claude-haiku-latest": {
12946
13162
  id: "~anthropic/claude-haiku-latest",
12947
13163
  name: "Anthropic Claude Haiku Latest",
@@ -13036,13 +13252,13 @@ export const MODELS = {
13036
13252
  reasoning: true,
13037
13253
  input: ["text", "image"],
13038
13254
  cost: {
13039
- input: 0.684,
13040
- output: 3.42,
13041
- cacheRead: 0.144,
13255
+ input: 0.6799999999999999,
13256
+ output: 3.41,
13257
+ cacheRead: 0.33999999999999997,
13042
13258
  cacheWrite: 0,
13043
13259
  },
13044
13260
  contextWindow: 262144,
13045
- maxTokens: 262144,
13261
+ maxTokens: 262142,
13046
13262
  },
13047
13263
  "~openai/gpt-latest": {
13048
13264
  id: "~openai/gpt-latest",
@@ -13086,9 +13302,9 @@ export const MODELS = {
13086
13302
  api: "openai-completions",
13087
13303
  provider: "together",
13088
13304
  baseUrl: "https://api.together.ai/v1",
13089
- compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
13305
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13090
13306
  reasoning: true,
13091
- thinkingLevelMap: { "off": null, "minimal": null, "low": null, "medium": null },
13307
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13092
13308
  input: ["text"],
13093
13309
  cost: {
13094
13310
  input: 0.3,
@@ -13233,7 +13449,7 @@ export const MODELS = {
13233
13449
  },
13234
13450
  "deepseek-ai/DeepSeek-V3": {
13235
13451
  id: "deepseek-ai/DeepSeek-V3",
13236
- name: "DeepSeek V3",
13452
+ name: "DeepSeek-V3",
13237
13453
  api: "openai-completions",
13238
13454
  provider: "together",
13239
13455
  baseUrl: "https://api.together.ai/v1",
@@ -13381,6 +13597,25 @@ export const MODELS = {
13381
13597
  contextWindow: 262144,
13382
13598
  maxTokens: 131000,
13383
13599
  },
13600
+ "nvidia/nemotron-3-ultra-550b-a55b": {
13601
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
13602
+ name: "Nemotron 3 Ultra 550B A55B",
13603
+ api: "openai-completions",
13604
+ provider: "together",
13605
+ baseUrl: "https://api.together.ai/v1",
13606
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13607
+ reasoning: true,
13608
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13609
+ input: ["text"],
13610
+ cost: {
13611
+ input: 0.6,
13612
+ output: 3.6,
13613
+ cacheRead: 0.2,
13614
+ cacheWrite: 0,
13615
+ },
13616
+ contextWindow: 512300,
13617
+ maxTokens: 512300,
13618
+ },
13384
13619
  "openai/gpt-oss-120b": {
13385
13620
  id: "openai/gpt-oss-120b",
13386
13621
  name: "GPT OSS 120B",
@@ -13464,8 +13699,8 @@ export const MODELS = {
13464
13699
  reasoning: true,
13465
13700
  input: ["text"],
13466
13701
  cost: {
13467
- input: 0.08,
13468
- output: 0.29,
13702
+ input: 0.12,
13703
+ output: 0.5,
13469
13704
  cacheRead: 0,
13470
13705
  cacheWrite: 0,
13471
13706
  },
@@ -13829,6 +14064,25 @@ export const MODELS = {
13829
14064
  contextWindow: 200000,
13830
14065
  maxTokens: 8192,
13831
14066
  },
14067
+ "anthropic/claude-fable-5": {
14068
+ id: "anthropic/claude-fable-5",
14069
+ name: "Claude Fable 5",
14070
+ api: "anthropic-messages",
14071
+ provider: "vercel-ai-gateway",
14072
+ baseUrl: "https://ai-gateway.vercel.sh",
14073
+ compat: { "forceAdaptiveThinking": true },
14074
+ reasoning: true,
14075
+ thinkingLevelMap: { "xhigh": "xhigh" },
14076
+ input: ["text", "image"],
14077
+ cost: {
14078
+ input: 10,
14079
+ output: 50,
14080
+ cacheRead: 1,
14081
+ cacheWrite: 12.5,
14082
+ },
14083
+ contextWindow: 1000000,
14084
+ maxTokens: 128000,
14085
+ },
13832
14086
  "anthropic/claude-haiku-4.5": {
13833
14087
  id: "anthropic/claude-haiku-4.5",
13834
14088
  name: "Claude Haiku 4.5",
@@ -14210,40 +14464,6 @@ export const MODELS = {
14210
14464
  contextWindow: 1000000,
14211
14465
  maxTokens: 384000,
14212
14466
  },
14213
- "google/gemini-2.0-flash": {
14214
- id: "google/gemini-2.0-flash",
14215
- name: "Gemini 2.0 Flash",
14216
- api: "anthropic-messages",
14217
- provider: "vercel-ai-gateway",
14218
- baseUrl: "https://ai-gateway.vercel.sh",
14219
- reasoning: false,
14220
- input: ["text", "image"],
14221
- cost: {
14222
- input: 0.15,
14223
- output: 0.6,
14224
- cacheRead: 0.024999999999999998,
14225
- cacheWrite: 0,
14226
- },
14227
- contextWindow: 1048576,
14228
- maxTokens: 8192,
14229
- },
14230
- "google/gemini-2.0-flash-lite": {
14231
- id: "google/gemini-2.0-flash-lite",
14232
- name: "Gemini 2.0 Flash Lite",
14233
- api: "anthropic-messages",
14234
- provider: "vercel-ai-gateway",
14235
- baseUrl: "https://ai-gateway.vercel.sh",
14236
- reasoning: false,
14237
- input: ["text", "image"],
14238
- cost: {
14239
- input: 0.075,
14240
- output: 0.3,
14241
- cacheRead: 0.02,
14242
- cacheWrite: 0,
14243
- },
14244
- contextWindow: 1048576,
14245
- maxTokens: 8192,
14246
- },
14247
14467
  "google/gemini-2.5-flash": {
14248
14468
  id: "google/gemini-2.5-flash",
14249
14469
  name: "Gemini 2.5 Flash",
@@ -15086,12 +15306,12 @@ export const MODELS = {
15086
15306
  reasoning: true,
15087
15307
  input: ["text"],
15088
15308
  cost: {
15089
- input: 0.5,
15090
- output: 2.5,
15091
- cacheRead: 0.15,
15309
+ input: 0.6,
15310
+ output: 2.4,
15311
+ cacheRead: 0.12,
15092
15312
  cacheWrite: 0,
15093
15313
  },
15094
- contextWindow: 262144,
15314
+ contextWindow: 1000000,
15095
15315
  maxTokens: 65000,
15096
15316
  },
15097
15317
  "nvidia/nemotron-nano-12b-v2-vl": {
@@ -16363,7 +16583,7 @@ export const MODELS = {
16363
16583
  cacheRead: 0.2,
16364
16584
  cacheWrite: 0,
16365
16585
  },
16366
- contextWindow: 2000000,
16586
+ contextWindow: 1000000,
16367
16587
  maxTokens: 30000,
16368
16588
  },
16369
16589
  "grok-4.20-0309-reasoning": {
@@ -16380,7 +16600,7 @@ export const MODELS = {
16380
16600
  cacheRead: 0.2,
16381
16601
  cacheWrite: 0,
16382
16602
  },
16383
- contextWindow: 2000000,
16603
+ contextWindow: 1000000,
16384
16604
  maxTokens: 30000,
16385
16605
  },
16386
16606
  "grok-4.3": {