@fleetagent/pi-ai 0.0.8 → 0.0.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -8,7 +8,7 @@ export const MODELS = {
8
8
  api: "bedrock-converse-stream",
9
9
  provider: "amazon-bedrock",
10
10
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
11
- reasoning: false,
11
+ reasoning: true,
12
12
  input: ["text", "image"],
13
13
  cost: {
14
14
  input: 0.33,
@@ -345,6 +345,23 @@ export const MODELS = {
345
345
  contextWindow: 163840,
346
346
  maxTokens: 81920,
347
347
  },
348
+ "eu.anthropic.claude-fable-5": {
349
+ id: "eu.anthropic.claude-fable-5",
350
+ name: "Claude Fable 5 (EU)",
351
+ api: "bedrock-converse-stream",
352
+ provider: "amazon-bedrock",
353
+ baseUrl: "https://bedrock-runtime.eu-central-1.amazonaws.com",
354
+ reasoning: true,
355
+ input: ["text", "image"],
356
+ cost: {
357
+ input: 11,
358
+ output: 55,
359
+ cacheRead: 1.1,
360
+ cacheWrite: 13.75,
361
+ },
362
+ contextWindow: 1000000,
363
+ maxTokens: 128000,
364
+ },
348
365
  "eu.anthropic.claude-haiku-4-5-20251001-v1:0": {
349
366
  id: "eu.anthropic.claude-haiku-4-5-20251001-v1:0",
350
367
  name: "Claude Haiku 4.5 (EU)",
@@ -466,6 +483,23 @@ export const MODELS = {
466
483
  contextWindow: 1000000,
467
484
  maxTokens: 64000,
468
485
  },
486
+ "global.anthropic.claude-fable-5": {
487
+ id: "global.anthropic.claude-fable-5",
488
+ name: "Claude Fable 5 (Global)",
489
+ api: "bedrock-converse-stream",
490
+ provider: "amazon-bedrock",
491
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
492
+ reasoning: true,
493
+ input: ["text", "image"],
494
+ cost: {
495
+ input: 10,
496
+ output: 50,
497
+ cacheRead: 1,
498
+ cacheWrite: 12.5,
499
+ },
500
+ contextWindow: 1000000,
501
+ maxTokens: 128000,
502
+ },
469
503
  "global.anthropic.claude-haiku-4-5-20251001-v1:0": {
470
504
  id: "global.anthropic.claude-haiku-4-5-20251001-v1:0",
471
505
  name: "Claude Haiku 4.5 (Global)",
@@ -1123,7 +1157,7 @@ export const MODELS = {
1123
1157
  api: "bedrock-converse-stream",
1124
1158
  provider: "amazon-bedrock",
1125
1159
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1126
- reasoning: false,
1160
+ reasoning: true,
1127
1161
  input: ["text"],
1128
1162
  cost: {
1129
1163
  input: 0.15,
@@ -1140,7 +1174,7 @@ export const MODELS = {
1140
1174
  api: "bedrock-converse-stream",
1141
1175
  provider: "amazon-bedrock",
1142
1176
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1143
- reasoning: false,
1177
+ reasoning: true,
1144
1178
  input: ["text"],
1145
1179
  cost: {
1146
1180
  input: 0.15,
@@ -1157,7 +1191,7 @@ export const MODELS = {
1157
1191
  api: "bedrock-converse-stream",
1158
1192
  provider: "amazon-bedrock",
1159
1193
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1160
- reasoning: false,
1194
+ reasoning: true,
1161
1195
  input: ["text"],
1162
1196
  cost: {
1163
1197
  input: 0.07,
@@ -1174,7 +1208,7 @@ export const MODELS = {
1174
1208
  api: "bedrock-converse-stream",
1175
1209
  provider: "amazon-bedrock",
1176
1210
  baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1177
- reasoning: false,
1211
+ reasoning: true,
1178
1212
  input: ["text"],
1179
1213
  cost: {
1180
1214
  input: 0.07,
@@ -1338,6 +1372,23 @@ export const MODELS = {
1338
1372
  contextWindow: 262000,
1339
1373
  maxTokens: 262000,
1340
1374
  },
1375
+ "us.anthropic.claude-fable-5": {
1376
+ id: "us.anthropic.claude-fable-5",
1377
+ name: "Claude Fable 5 (US)",
1378
+ api: "bedrock-converse-stream",
1379
+ provider: "amazon-bedrock",
1380
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1381
+ reasoning: true,
1382
+ input: ["text", "image"],
1383
+ cost: {
1384
+ input: 10,
1385
+ output: 50,
1386
+ cacheRead: 1,
1387
+ cacheWrite: 12.5,
1388
+ },
1389
+ contextWindow: 1000000,
1390
+ maxTokens: 128000,
1391
+ },
1341
1392
  "us.anthropic.claude-haiku-4-5-20251001-v1:0": {
1342
1393
  id: "us.anthropic.claude-haiku-4-5-20251001-v1:0",
1343
1394
  name: "Claude Haiku 4.5 (US)",
@@ -1750,6 +1801,23 @@ export const MODELS = {
1750
1801
  contextWindow: 200000,
1751
1802
  maxTokens: 4096,
1752
1803
  },
1804
+ "claude-fable-5": {
1805
+ id: "claude-fable-5",
1806
+ name: "Claude Fable 5",
1807
+ api: "anthropic-messages",
1808
+ provider: "anthropic",
1809
+ baseUrl: "https://api.anthropic.com",
1810
+ reasoning: true,
1811
+ input: ["text", "image"],
1812
+ cost: {
1813
+ input: 10,
1814
+ output: 50,
1815
+ cacheRead: 1,
1816
+ cacheWrite: 12.5,
1817
+ },
1818
+ contextWindow: 1000000,
1819
+ maxTokens: 128000,
1820
+ },
1753
1821
  "claude-haiku-4-5": {
1754
1822
  id: "claude-haiku-4-5",
1755
1823
  name: "Claude Haiku 4.5 (latest)",
@@ -2925,6 +2993,23 @@ export const MODELS = {
2925
2993
  contextWindow: 200000,
2926
2994
  maxTokens: 8192,
2927
2995
  },
2996
+ "claude-fable-5": {
2997
+ id: "claude-fable-5",
2998
+ name: "Claude Fable 5",
2999
+ api: "anthropic-messages",
3000
+ provider: "cloudflare-ai-gateway",
3001
+ baseUrl: "https://gateway.ai.cloudflare.com/v1/{CLOUDFLARE_ACCOUNT_ID}/{CLOUDFLARE_GATEWAY_ID}/anthropic",
3002
+ reasoning: true,
3003
+ input: ["text", "image"],
3004
+ cost: {
3005
+ input: 10,
3006
+ output: 50,
3007
+ cacheRead: 1,
3008
+ cacheWrite: 12.5,
3009
+ },
3010
+ contextWindow: 1000000,
3011
+ maxTokens: 128000,
3012
+ },
2928
3013
  "claude-haiku-4-5": {
2929
3014
  id: "claude-haiku-4-5",
2930
3015
  name: "Claude Haiku 4.5 (latest)",
@@ -3892,6 +3977,24 @@ export const MODELS = {
3892
3977
  contextWindow: 202800,
3893
3978
  maxTokens: 131072,
3894
3979
  },
3980
+ "accounts/fireworks/routers/kimi-k2p6-fast": {
3981
+ id: "accounts/fireworks/routers/kimi-k2p6-fast",
3982
+ name: "Kimi K2.6 Fast",
3983
+ api: "anthropic-messages",
3984
+ provider: "fireworks",
3985
+ baseUrl: "https://api.fireworks.ai/inference",
3986
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3987
+ reasoning: true,
3988
+ input: ["text", "image"],
3989
+ cost: {
3990
+ input: 2,
3991
+ output: 8,
3992
+ cacheRead: 0.3,
3993
+ cacheWrite: 0,
3994
+ },
3995
+ contextWindow: 262000,
3996
+ maxTokens: 262000,
3997
+ },
3895
3998
  "accounts/fireworks/routers/kimi-k2p6-turbo": {
3896
3999
  id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3897
4000
  name: "Kimi K2.6 Turbo",
@@ -4843,77 +4946,9 @@ export const MODELS = {
4843
4946
  },
4844
4947
  },
4845
4948
  "groq": {
4846
- "deepseek-r1-distill-llama-70b": {
4847
- id: "deepseek-r1-distill-llama-70b",
4848
- name: "DeepSeek R1 Distill Llama 70B",
4849
- api: "openai-completions",
4850
- provider: "groq",
4851
- baseUrl: "https://api.groq.com/openai/v1",
4852
- reasoning: true,
4853
- input: ["text"],
4854
- cost: {
4855
- input: 0.75,
4856
- output: 0.99,
4857
- cacheRead: 0,
4858
- cacheWrite: 0,
4859
- },
4860
- contextWindow: 131072,
4861
- maxTokens: 8192,
4862
- },
4863
- "gemma2-9b-it": {
4864
- id: "gemma2-9b-it",
4865
- name: "Gemma 2 9B",
4866
- api: "openai-completions",
4867
- provider: "groq",
4868
- baseUrl: "https://api.groq.com/openai/v1",
4869
- reasoning: false,
4870
- input: ["text"],
4871
- cost: {
4872
- input: 0.2,
4873
- output: 0.2,
4874
- cacheRead: 0,
4875
- cacheWrite: 0,
4876
- },
4877
- contextWindow: 8192,
4878
- maxTokens: 8192,
4879
- },
4880
- "groq/compound": {
4881
- id: "groq/compound",
4882
- name: "Compound",
4883
- api: "openai-completions",
4884
- provider: "groq",
4885
- baseUrl: "https://api.groq.com/openai/v1",
4886
- reasoning: true,
4887
- input: ["text"],
4888
- cost: {
4889
- input: 0,
4890
- output: 0,
4891
- cacheRead: 0,
4892
- cacheWrite: 0,
4893
- },
4894
- contextWindow: 131072,
4895
- maxTokens: 8192,
4896
- },
4897
- "groq/compound-mini": {
4898
- id: "groq/compound-mini",
4899
- name: "Compound Mini",
4900
- api: "openai-completions",
4901
- provider: "groq",
4902
- baseUrl: "https://api.groq.com/openai/v1",
4903
- reasoning: true,
4904
- input: ["text"],
4905
- cost: {
4906
- input: 0,
4907
- output: 0,
4908
- cacheRead: 0,
4909
- cacheWrite: 0,
4910
- },
4911
- contextWindow: 131072,
4912
- maxTokens: 8192,
4913
- },
4914
4949
  "llama-3.1-8b-instant": {
4915
4950
  id: "llama-3.1-8b-instant",
4916
- name: "Llama 3.1 8B Instant",
4951
+ name: "Llama 3.1 8B",
4917
4952
  api: "openai-completions",
4918
4953
  provider: "groq",
4919
4954
  baseUrl: "https://api.groq.com/openai/v1",
@@ -4930,7 +4965,7 @@ export const MODELS = {
4930
4965
  },
4931
4966
  "llama-3.3-70b-versatile": {
4932
4967
  id: "llama-3.3-70b-versatile",
4933
- name: "Llama 3.3 70B Versatile",
4968
+ name: "Llama 3.3 70B",
4934
4969
  api: "openai-completions",
4935
4970
  provider: "groq",
4936
4971
  baseUrl: "https://api.groq.com/openai/v1",
@@ -4945,60 +4980,9 @@ export const MODELS = {
4945
4980
  contextWindow: 131072,
4946
4981
  maxTokens: 32768,
4947
4982
  },
4948
- "llama3-70b-8192": {
4949
- id: "llama3-70b-8192",
4950
- name: "Llama 3 70B",
4951
- api: "openai-completions",
4952
- provider: "groq",
4953
- baseUrl: "https://api.groq.com/openai/v1",
4954
- reasoning: false,
4955
- input: ["text"],
4956
- cost: {
4957
- input: 0.59,
4958
- output: 0.79,
4959
- cacheRead: 0,
4960
- cacheWrite: 0,
4961
- },
4962
- contextWindow: 8192,
4963
- maxTokens: 8192,
4964
- },
4965
- "llama3-8b-8192": {
4966
- id: "llama3-8b-8192",
4967
- name: "Llama 3 8B",
4968
- api: "openai-completions",
4969
- provider: "groq",
4970
- baseUrl: "https://api.groq.com/openai/v1",
4971
- reasoning: false,
4972
- input: ["text"],
4973
- cost: {
4974
- input: 0.05,
4975
- output: 0.08,
4976
- cacheRead: 0,
4977
- cacheWrite: 0,
4978
- },
4979
- contextWindow: 8192,
4980
- maxTokens: 8192,
4981
- },
4982
- "meta-llama/llama-4-maverick-17b-128e-instruct": {
4983
- id: "meta-llama/llama-4-maverick-17b-128e-instruct",
4984
- name: "Llama 4 Maverick 17B",
4985
- api: "openai-completions",
4986
- provider: "groq",
4987
- baseUrl: "https://api.groq.com/openai/v1",
4988
- reasoning: false,
4989
- input: ["text", "image"],
4990
- cost: {
4991
- input: 0.2,
4992
- output: 0.6,
4993
- cacheRead: 0,
4994
- cacheWrite: 0,
4995
- },
4996
- contextWindow: 131072,
4997
- maxTokens: 8192,
4998
- },
4999
4983
  "meta-llama/llama-4-scout-17b-16e-instruct": {
5000
4984
  id: "meta-llama/llama-4-scout-17b-16e-instruct",
5001
- name: "Llama 4 Scout 17B",
4985
+ name: "Llama 4 Scout 17B 16E",
5002
4986
  api: "openai-completions",
5003
4987
  provider: "groq",
5004
4988
  baseUrl: "https://api.groq.com/openai/v1",
@@ -5013,57 +4997,6 @@ export const MODELS = {
5013
4997
  contextWindow: 131072,
5014
4998
  maxTokens: 8192,
5015
4999
  },
5016
- "mistral-saba-24b": {
5017
- id: "mistral-saba-24b",
5018
- name: "Mistral Saba 24B",
5019
- api: "openai-completions",
5020
- provider: "groq",
5021
- baseUrl: "https://api.groq.com/openai/v1",
5022
- reasoning: false,
5023
- input: ["text"],
5024
- cost: {
5025
- input: 0.79,
5026
- output: 0.79,
5027
- cacheRead: 0,
5028
- cacheWrite: 0,
5029
- },
5030
- contextWindow: 32768,
5031
- maxTokens: 32768,
5032
- },
5033
- "moonshotai/kimi-k2-instruct": {
5034
- id: "moonshotai/kimi-k2-instruct",
5035
- name: "Kimi K2 Instruct",
5036
- api: "openai-completions",
5037
- provider: "groq",
5038
- baseUrl: "https://api.groq.com/openai/v1",
5039
- reasoning: false,
5040
- input: ["text"],
5041
- cost: {
5042
- input: 1,
5043
- output: 3,
5044
- cacheRead: 0,
5045
- cacheWrite: 0,
5046
- },
5047
- contextWindow: 131072,
5048
- maxTokens: 16384,
5049
- },
5050
- "moonshotai/kimi-k2-instruct-0905": {
5051
- id: "moonshotai/kimi-k2-instruct-0905",
5052
- name: "Kimi K2 Instruct 0905",
5053
- api: "openai-completions",
5054
- provider: "groq",
5055
- baseUrl: "https://api.groq.com/openai/v1",
5056
- reasoning: false,
5057
- input: ["text"],
5058
- cost: {
5059
- input: 1,
5060
- output: 3,
5061
- cacheRead: 0.5,
5062
- cacheWrite: 0,
5063
- },
5064
- contextWindow: 262144,
5065
- maxTokens: 16384,
5066
- },
5067
5000
  "openai/gpt-oss-120b": {
5068
5001
  id: "openai/gpt-oss-120b",
5069
5002
  name: "GPT OSS 120B",
@@ -5115,26 +5048,9 @@ export const MODELS = {
5115
5048
  contextWindow: 131072,
5116
5049
  maxTokens: 65536,
5117
5050
  },
5118
- "qwen-qwq-32b": {
5119
- id: "qwen-qwq-32b",
5120
- name: "Qwen QwQ 32B",
5121
- api: "openai-completions",
5122
- provider: "groq",
5123
- baseUrl: "https://api.groq.com/openai/v1",
5124
- reasoning: true,
5125
- input: ["text"],
5126
- cost: {
5127
- input: 0.29,
5128
- output: 0.39,
5129
- cacheRead: 0,
5130
- cacheWrite: 0,
5131
- },
5132
- contextWindow: 131072,
5133
- maxTokens: 16384,
5134
- },
5135
5051
  "qwen/qwen3-32b": {
5136
5052
  id: "qwen/qwen3-32b",
5137
- name: "Qwen3 32B",
5053
+ name: "Qwen3-32B",
5138
5054
  api: "openai-completions",
5139
5055
  provider: "groq",
5140
5056
  baseUrl: "https://api.groq.com/openai/v1",
@@ -7295,6 +7211,23 @@ export const MODELS = {
7295
7211
  contextWindow: 200000,
7296
7212
  maxTokens: 32000,
7297
7213
  },
7214
+ "claude-fable-5": {
7215
+ id: "claude-fable-5",
7216
+ name: "Claude Fable 5",
7217
+ api: "anthropic-messages",
7218
+ provider: "opencode",
7219
+ baseUrl: "https://opencode.ai/zen",
7220
+ reasoning: true,
7221
+ input: ["text", "image"],
7222
+ cost: {
7223
+ input: 10,
7224
+ output: 50,
7225
+ cacheRead: 1,
7226
+ cacheWrite: 12.5,
7227
+ },
7228
+ contextWindow: 1000000,
7229
+ maxTokens: 128000,
7230
+ },
7298
7231
  "claude-haiku-4-5": {
7299
7232
  id: "claude-haiku-4-5",
7300
7233
  name: "Claude Haiku 4.5",
@@ -7467,7 +7400,7 @@ export const MODELS = {
7467
7400
  cost: {
7468
7401
  input: 0.14,
7469
7402
  output: 0.28,
7470
- cacheRead: 0.03,
7403
+ cacheRead: 0.028,
7471
7404
  cacheWrite: 0,
7472
7405
  },
7473
7406
  contextWindow: 1000000,
@@ -7492,6 +7425,25 @@ export const MODELS = {
7492
7425
  contextWindow: 200000,
7493
7426
  maxTokens: 128000,
7494
7427
  },
7428
+ "deepseek-v4-pro": {
7429
+ id: "deepseek-v4-pro",
7430
+ name: "DeepSeek V4 Pro",
7431
+ api: "openai-completions",
7432
+ provider: "opencode",
7433
+ baseUrl: "https://opencode.ai/zen/v1",
7434
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
7435
+ reasoning: true,
7436
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null, "high": "high", "xhigh": "max" },
7437
+ input: ["text"],
7438
+ cost: {
7439
+ input: 1.74,
7440
+ output: 3.84,
7441
+ cacheRead: 0.145,
7442
+ cacheWrite: 0,
7443
+ },
7444
+ contextWindow: 1000000,
7445
+ maxTokens: 384000,
7446
+ },
7495
7447
  "gemini-3-flash": {
7496
7448
  id: "gemini-3-flash",
7497
7449
  name: "Gemini 3 Flash",
@@ -7973,26 +7925,26 @@ export const MODELS = {
7973
7925
  contextWindow: 204800,
7974
7926
  maxTokens: 131072,
7975
7927
  },
7976
- "minimax-m3-free": {
7977
- id: "minimax-m3-free",
7978
- name: "MiniMax M3 Free",
7979
- api: "anthropic-messages",
7928
+ "nemotron-3-ultra-free": {
7929
+ id: "nemotron-3-ultra-free",
7930
+ name: "Nemotron 3 Ultra Free",
7931
+ api: "openai-completions",
7980
7932
  provider: "opencode",
7981
- baseUrl: "https://opencode.ai/zen",
7933
+ baseUrl: "https://opencode.ai/zen/v1",
7982
7934
  reasoning: true,
7983
- input: ["text", "image"],
7935
+ input: ["text"],
7984
7936
  cost: {
7985
7937
  input: 0,
7986
7938
  output: 0,
7987
7939
  cacheRead: 0,
7988
7940
  cacheWrite: 0,
7989
7941
  },
7990
- contextWindow: 200000,
7991
- maxTokens: 32000,
7942
+ contextWindow: 1000000,
7943
+ maxTokens: 128000,
7992
7944
  },
7993
- "nemotron-3-ultra-free": {
7994
- id: "nemotron-3-ultra-free",
7995
- name: "Nemotron 3 Ultra Free",
7945
+ "north-mini-code-free": {
7946
+ id: "north-mini-code-free",
7947
+ name: "North Mini Code Free",
7996
7948
  api: "openai-completions",
7997
7949
  provider: "opencode",
7998
7950
  baseUrl: "https://opencode.ai/zen/v1",
@@ -8004,8 +7956,8 @@ export const MODELS = {
8004
7956
  cacheRead: 0,
8005
7957
  cacheWrite: 0,
8006
7958
  },
8007
- contextWindow: 1000000,
8008
- maxTokens: 128000,
7959
+ contextWindow: 256000,
7960
+ maxTokens: 64000,
8009
7961
  },
8010
7962
  "qwen3.5-plus": {
8011
7963
  id: "qwen3.5-plus",
@@ -8226,11 +8178,11 @@ export const MODELS = {
8226
8178
  provider: "opencode-go",
8227
8179
  baseUrl: "https://opencode.ai/zen/go",
8228
8180
  reasoning: true,
8229
- input: ["text", "image"],
8230
- cost: {
8231
- input: 0.6,
8232
- output: 2.4,
8233
- cacheRead: 0.12,
8181
+ input: ["text", "image"],
8182
+ cost: {
8183
+ input: 0.3,
8184
+ output: 1.2,
8185
+ cacheRead: 0.06,
8234
8186
  cacheWrite: 0,
8235
8187
  },
8236
8188
  contextWindow: 512000,
@@ -8426,6 +8378,23 @@ export const MODELS = {
8426
8378
  contextWindow: 200000,
8427
8379
  maxTokens: 8192,
8428
8380
  },
8381
+ "anthropic/claude-fable-5": {
8382
+ id: "anthropic/claude-fable-5",
8383
+ name: "Anthropic: Claude Fable 5",
8384
+ api: "openai-completions",
8385
+ provider: "openrouter",
8386
+ baseUrl: "https://openrouter.ai/api/v1",
8387
+ reasoning: true,
8388
+ input: ["text", "image"],
8389
+ cost: {
8390
+ input: 10,
8391
+ output: 50,
8392
+ cacheRead: 1,
8393
+ cacheWrite: 12.5,
8394
+ },
8395
+ contextWindow: 1000000,
8396
+ maxTokens: 128000,
8397
+ },
8429
8398
  "anthropic/claude-haiku-4.5": {
8430
8399
  id: "anthropic/claude-haiku-4.5",
8431
8400
  name: "Anthropic: Claude Haiku 4.5",
@@ -8719,23 +8688,6 @@ export const MODELS = {
8719
8688
  contextWindow: 2000000,
8720
8689
  maxTokens: 30000,
8721
8690
  },
8722
- "baidu/ernie-4.5-vl-28b-a3b": {
8723
- id: "baidu/ernie-4.5-vl-28b-a3b",
8724
- name: "Baidu: ERNIE 4.5 VL 28B A3B",
8725
- api: "openai-completions",
8726
- provider: "openrouter",
8727
- baseUrl: "https://openrouter.ai/api/v1",
8728
- reasoning: true,
8729
- input: ["text", "image"],
8730
- cost: {
8731
- input: 0.14,
8732
- output: 0.56,
8733
- cacheRead: 0,
8734
- cacheWrite: 0,
8735
- },
8736
- contextWindow: 131072,
8737
- maxTokens: 8000,
8738
- },
8739
8691
  "bytedance-seed/seed-1.6": {
8740
8692
  id: "bytedance-seed/seed-1.6",
8741
8693
  name: "ByteDance Seed: Seed 1.6",
@@ -8869,7 +8821,7 @@ export const MODELS = {
8869
8821
  cacheRead: 0.135,
8870
8822
  cacheWrite: 0,
8871
8823
  },
8872
- contextWindow: 163840,
8824
+ contextWindow: 131072,
8873
8825
  maxTokens: 16384,
8874
8826
  },
8875
8827
  "deepseek/deepseek-chat-v3.1": {
@@ -9242,8 +9194,8 @@ export const MODELS = {
9242
9194
  reasoning: false,
9243
9195
  input: ["text", "image"],
9244
9196
  cost: {
9245
- input: 0.04,
9246
- output: 0.13,
9197
+ input: 0.049999999999999996,
9198
+ output: 0.15,
9247
9199
  cacheRead: 0,
9248
9200
  cacheWrite: 0,
9249
9201
  },
@@ -9311,12 +9263,12 @@ export const MODELS = {
9311
9263
  input: ["text", "image"],
9312
9264
  cost: {
9313
9265
  input: 0.12,
9314
- output: 0.37,
9315
- cacheRead: 0,
9266
+ output: 0.36,
9267
+ cacheRead: 0.09,
9316
9268
  cacheWrite: 0,
9317
9269
  },
9318
9270
  contextWindow: 262144,
9319
- maxTokens: 16384,
9271
+ maxTokens: 8192,
9320
9272
  },
9321
9273
  "google/gemma-4-31b-it:free": {
9322
9274
  id: "google/gemma-4-31b-it:free",
@@ -9532,7 +9484,7 @@ export const MODELS = {
9532
9484
  reasoning: false,
9533
9485
  input: ["text", "image"],
9534
9486
  cost: {
9535
- input: 0.08,
9487
+ input: 0.09999999999999999,
9536
9488
  output: 0.3,
9537
9489
  cacheRead: 0,
9538
9490
  cacheWrite: 0,
@@ -9601,8 +9553,8 @@ export const MODELS = {
9601
9553
  input: ["text"],
9602
9554
  cost: {
9603
9555
  input: 0.15,
9604
- output: 1.15,
9605
- cacheRead: 0,
9556
+ output: 0.8999999999999999,
9557
+ cacheRead: 0.049999999999999996,
9606
9558
  cacheWrite: 0,
9607
9559
  },
9608
9560
  contextWindow: 204800,
@@ -9617,9 +9569,9 @@ export const MODELS = {
9617
9569
  reasoning: true,
9618
9570
  input: ["text"],
9619
9571
  cost: {
9620
- input: 0.27899999999999997,
9621
- output: 1.2,
9622
- cacheRead: 0,
9572
+ input: 0.27,
9573
+ output: 1.08,
9574
+ cacheRead: 0.054,
9623
9575
  cacheWrite: 0,
9624
9576
  },
9625
9577
  contextWindow: 204800,
@@ -10009,21 +9961,20 @@ export const MODELS = {
10009
9961
  reasoning: true,
10010
9962
  input: ["text", "image"],
10011
9963
  cost: {
10012
- input: 0.684,
10013
- output: 3.42,
10014
- cacheRead: 0.144,
9964
+ input: 0.6799999999999999,
9965
+ output: 3.41,
9966
+ cacheRead: 0.33999999999999997,
10015
9967
  cacheWrite: 0,
10016
9968
  },
10017
9969
  contextWindow: 262144,
10018
- maxTokens: 262144,
9970
+ maxTokens: 262142,
10019
9971
  },
10020
- "moonshotai/kimi-k2.6:free": {
10021
- id: "moonshotai/kimi-k2.6:free",
10022
- name: "MoonshotAI: Kimi K2.6 (free)",
9972
+ "nex-agi/nex-n2-pro:free": {
9973
+ id: "nex-agi/nex-n2-pro:free",
9974
+ name: "Nex AGI: Nex-N2-Pro (free)",
10023
9975
  api: "openai-completions",
10024
9976
  provider: "openrouter",
10025
9977
  baseUrl: "https://openrouter.ai/api/v1",
10026
- compat: { "supportsDeveloperRole": false },
10027
9978
  reasoning: true,
10028
9979
  input: ["text", "image"],
10029
9980
  cost: {
@@ -10033,24 +9984,7 @@ export const MODELS = {
10033
9984
  cacheWrite: 0,
10034
9985
  },
10035
9986
  contextWindow: 262144,
10036
- maxTokens: 4096,
10037
- },
10038
- "nex-agi/deepseek-v3.1-nex-n1": {
10039
- id: "nex-agi/deepseek-v3.1-nex-n1",
10040
- name: "Nex AGI: DeepSeek V3.1 Nex N1",
10041
- api: "openai-completions",
10042
- provider: "openrouter",
10043
- baseUrl: "https://openrouter.ai/api/v1",
10044
- reasoning: false,
10045
- input: ["text"],
10046
- cost: {
10047
- input: 0.135,
10048
- output: 0.5,
10049
- cacheRead: 0,
10050
- cacheWrite: 0,
10051
- },
10052
- contextWindow: 131072,
10053
- maxTokens: 163840,
9987
+ maxTokens: 262144,
10054
9988
  },
10055
9989
  "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
10056
9990
  id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
@@ -10061,7 +9995,7 @@ export const MODELS = {
10061
9995
  reasoning: true,
10062
9996
  input: ["text"],
10063
9997
  cost: {
10064
- input: 0.09999999999999999,
9998
+ input: 0.39999999999999997,
10065
9999
  output: 0.39999999999999997,
10066
10000
  cacheRead: 0,
10067
10001
  cacheWrite: 0,
@@ -10307,23 +10241,6 @@ export const MODELS = {
10307
10241
  contextWindow: 8191,
10308
10242
  maxTokens: 4096,
10309
10243
  },
10310
- "openai/gpt-4-1106-preview": {
10311
- id: "openai/gpt-4-1106-preview",
10312
- name: "OpenAI: GPT-4 Turbo (older v1106)",
10313
- api: "openai-completions",
10314
- provider: "openrouter",
10315
- baseUrl: "https://openrouter.ai/api/v1",
10316
- reasoning: false,
10317
- input: ["text"],
10318
- cost: {
10319
- input: 10,
10320
- output: 30,
10321
- cacheRead: 0,
10322
- cacheWrite: 0,
10323
- },
10324
- contextWindow: 128000,
10325
- maxTokens: 4096,
10326
- },
10327
10244
  "openai/gpt-4-turbo": {
10328
10245
  id: "openai/gpt-4-turbo",
10329
10246
  name: "OpenAI: GPT-4 Turbo",
@@ -11399,7 +11316,7 @@ export const MODELS = {
11399
11316
  reasoning: false,
11400
11317
  input: ["text"],
11401
11318
  cost: {
11402
- input: 0.071,
11319
+ input: 0.09,
11403
11320
  output: 0.09999999999999999,
11404
11321
  cacheRead: 0,
11405
11322
  cacheWrite: 0,
@@ -11433,8 +11350,8 @@ export const MODELS = {
11433
11350
  reasoning: true,
11434
11351
  input: ["text"],
11435
11352
  cost: {
11436
- input: 0.09,
11437
- output: 0.44999999999999996,
11353
+ input: 0.12,
11354
+ output: 0.5,
11438
11355
  cacheRead: 0,
11439
11356
  cacheWrite: 0,
11440
11357
  },
@@ -11892,13 +11809,13 @@ export const MODELS = {
11892
11809
  reasoning: true,
11893
11810
  input: ["text", "image"],
11894
11811
  cost: {
11895
- input: 0.04,
11812
+ input: 0.09999999999999999,
11896
11813
  output: 0.15,
11897
11814
  cacheRead: 0,
11898
11815
  cacheWrite: 0,
11899
11816
  },
11900
11817
  contextWindow: 262144,
11901
- maxTokens: 81920,
11818
+ maxTokens: 262144,
11902
11819
  },
11903
11820
  "qwen/qwen3.5-flash-02-23": {
11904
11821
  id: "qwen/qwen3.5-flash-02-23",
@@ -11960,13 +11877,13 @@ export const MODELS = {
11960
11877
  reasoning: true,
11961
11878
  input: ["text", "image"],
11962
11879
  cost: {
11963
- input: 0.29,
11964
- output: 3.1999999999999997,
11880
+ input: 0.28900000000000003,
11881
+ output: 2.4,
11965
11882
  cacheRead: 0,
11966
11883
  cacheWrite: 0,
11967
11884
  },
11968
11885
  contextWindow: 262144,
11969
- maxTokens: 262140,
11886
+ maxTokens: 131072,
11970
11887
  },
11971
11888
  "qwen/qwen3.6-35b-a3b": {
11972
11889
  id: "qwen/qwen3.6-35b-a3b",
@@ -11977,13 +11894,13 @@ export const MODELS = {
11977
11894
  reasoning: true,
11978
11895
  input: ["text", "image"],
11979
11896
  cost: {
11980
- input: 0.14,
11897
+ input: 0.15,
11981
11898
  output: 1,
11982
- cacheRead: 0,
11899
+ cacheRead: 0.049999999999999996,
11983
11900
  cacheWrite: 0,
11984
11901
  },
11985
11902
  contextWindow: 262144,
11986
- maxTokens: 262140,
11903
+ maxTokens: 262144,
11987
11904
  },
11988
11905
  "qwen/qwen3.6-flash": {
11989
11906
  id: "qwen/qwen3.6-flash",
@@ -12104,23 +12021,6 @@ export const MODELS = {
12104
12021
  contextWindow: 256000,
12105
12022
  maxTokens: 128000,
12106
12023
  },
12107
- "sao10k/l3-euryale-70b": {
12108
- id: "sao10k/l3-euryale-70b",
12109
- name: "Sao10k: Llama 3 Euryale 70B v2.1",
12110
- api: "openai-completions",
12111
- provider: "openrouter",
12112
- baseUrl: "https://openrouter.ai/api/v1",
12113
- reasoning: false,
12114
- input: ["text"],
12115
- cost: {
12116
- input: 1.48,
12117
- output: 1.48,
12118
- cacheRead: 0,
12119
- cacheWrite: 0,
12120
- },
12121
- contextWindow: 8192,
12122
- maxTokens: 8192,
12123
- },
12124
12024
  "sao10k/l3.1-euryale-70b": {
12125
12025
  id: "sao10k/l3.1-euryale-70b",
12126
12026
  name: "Sao10K: Llama 3.1 Euryale 70B v2.2",
@@ -12342,23 +12242,6 @@ export const MODELS = {
12342
12242
  contextWindow: 1048576,
12343
12243
  maxTokens: 131072,
12344
12244
  },
12345
- "z-ai/glm-4-32b": {
12346
- id: "z-ai/glm-4-32b",
12347
- name: "Z.ai: GLM 4 32B ",
12348
- api: "openai-completions",
12349
- provider: "openrouter",
12350
- baseUrl: "https://openrouter.ai/api/v1",
12351
- reasoning: false,
12352
- input: ["text"],
12353
- cost: {
12354
- input: 0.09999999999999999,
12355
- output: 0.09999999999999999,
12356
- cacheRead: 0,
12357
- cacheWrite: 0,
12358
- },
12359
- contextWindow: 128000,
12360
- maxTokens: 4096,
12361
- },
12362
12245
  "z-ai/glm-4.5": {
12363
12246
  id: "z-ai/glm-4.5",
12364
12247
  name: "Z.ai: GLM 4.5",
@@ -12393,23 +12276,6 @@ export const MODELS = {
12393
12276
  contextWindow: 131072,
12394
12277
  maxTokens: 131070,
12395
12278
  },
12396
- "z-ai/glm-4.5-air:free": {
12397
- id: "z-ai/glm-4.5-air:free",
12398
- name: "Z.ai: GLM 4.5 Air (free)",
12399
- api: "openai-completions",
12400
- provider: "openrouter",
12401
- baseUrl: "https://openrouter.ai/api/v1",
12402
- reasoning: true,
12403
- input: ["text"],
12404
- cost: {
12405
- input: 0,
12406
- output: 0,
12407
- cacheRead: 0,
12408
- cacheWrite: 0,
12409
- },
12410
- contextWindow: 131072,
12411
- maxTokens: 96000,
12412
- },
12413
12279
  "z-ai/glm-4.5v": {
12414
12280
  id: "z-ai/glm-4.5v",
12415
12281
  name: "Z.ai: GLM 4.5V",
@@ -12455,11 +12321,11 @@ export const MODELS = {
12455
12321
  cost: {
12456
12322
  input: 0.3,
12457
12323
  output: 0.8999999999999999,
12458
- cacheRead: 0.049999999999999996,
12324
+ cacheRead: 0.055,
12459
12325
  cacheWrite: 0,
12460
12326
  },
12461
12327
  contextWindow: 131072,
12462
- maxTokens: 24000,
12328
+ maxTokens: 32768,
12463
12329
  },
12464
12330
  "z-ai/glm-4.7": {
12465
12331
  id: "z-ai/glm-4.7",
@@ -12526,7 +12392,7 @@ export const MODELS = {
12526
12392
  cacheRead: 0.24,
12527
12393
  cacheWrite: 0,
12528
12394
  },
12529
- contextWindow: 202752,
12395
+ contextWindow: 262144,
12530
12396
  maxTokens: 131072,
12531
12397
  },
12532
12398
  "z-ai/glm-5.1": {
@@ -12546,22 +12412,22 @@ export const MODELS = {
12546
12412
  contextWindow: 202752,
12547
12413
  maxTokens: 4096,
12548
12414
  },
12549
- "z-ai/glm-5v-turbo": {
12550
- id: "z-ai/glm-5v-turbo",
12551
- name: "Z.ai: GLM 5V Turbo",
12415
+ "~anthropic/claude-fable-latest": {
12416
+ id: "~anthropic/claude-fable-latest",
12417
+ name: "Anthropic: Claude Fable Latest",
12552
12418
  api: "openai-completions",
12553
12419
  provider: "openrouter",
12554
12420
  baseUrl: "https://openrouter.ai/api/v1",
12555
12421
  reasoning: true,
12556
12422
  input: ["text", "image"],
12557
12423
  cost: {
12558
- input: 1.2,
12559
- output: 4,
12560
- cacheRead: 0.24,
12561
- cacheWrite: 0,
12424
+ input: 10,
12425
+ output: 50,
12426
+ cacheRead: 1,
12427
+ cacheWrite: 12.5,
12562
12428
  },
12563
- contextWindow: 202752,
12564
- maxTokens: 131072,
12429
+ contextWindow: 1000000,
12430
+ maxTokens: 128000,
12565
12431
  },
12566
12432
  "~anthropic/claude-haiku-latest": {
12567
12433
  id: "~anthropic/claude-haiku-latest",
@@ -12657,13 +12523,13 @@ export const MODELS = {
12657
12523
  reasoning: true,
12658
12524
  input: ["text", "image"],
12659
12525
  cost: {
12660
- input: 0.684,
12661
- output: 3.42,
12662
- cacheRead: 0.144,
12526
+ input: 0.6799999999999999,
12527
+ output: 3.41,
12528
+ cacheRead: 0.33999999999999997,
12663
12529
  cacheWrite: 0,
12664
12530
  },
12665
12531
  contextWindow: 262144,
12666
- maxTokens: 262144,
12532
+ maxTokens: 262142,
12667
12533
  },
12668
12534
  "~openai/gpt-latest": {
12669
12535
  id: "~openai/gpt-latest",
@@ -13104,8 +12970,8 @@ export const MODELS = {
13104
12970
  reasoning: true,
13105
12971
  input: ["text"],
13106
12972
  cost: {
13107
- input: 0.08,
13108
- output: 0.29,
12973
+ input: 0.12,
12974
+ output: 0.5,
13109
12975
  cacheRead: 0,
13110
12976
  cacheWrite: 0,
13111
12977
  },
@@ -13469,6 +13335,23 @@ export const MODELS = {
13469
13335
  contextWindow: 200000,
13470
13336
  maxTokens: 8192,
13471
13337
  },
13338
+ "anthropic/claude-fable-5": {
13339
+ id: "anthropic/claude-fable-5",
13340
+ name: "Claude Fable 5",
13341
+ api: "anthropic-messages",
13342
+ provider: "vercel-ai-gateway",
13343
+ baseUrl: "https://ai-gateway.vercel.sh",
13344
+ reasoning: true,
13345
+ input: ["text", "image"],
13346
+ cost: {
13347
+ input: 10,
13348
+ output: 50,
13349
+ cacheRead: 1,
13350
+ cacheWrite: 12.5,
13351
+ },
13352
+ contextWindow: 1000000,
13353
+ maxTokens: 128000,
13354
+ },
13472
13355
  "anthropic/claude-haiku-4.5": {
13473
13356
  id: "anthropic/claude-haiku-4.5",
13474
13357
  name: "Claude Haiku 4.5",
@@ -13849,40 +13732,6 @@ export const MODELS = {
13849
13732
  contextWindow: 1000000,
13850
13733
  maxTokens: 384000,
13851
13734
  },
13852
- "google/gemini-2.0-flash": {
13853
- id: "google/gemini-2.0-flash",
13854
- name: "Gemini 2.0 Flash",
13855
- api: "anthropic-messages",
13856
- provider: "vercel-ai-gateway",
13857
- baseUrl: "https://ai-gateway.vercel.sh",
13858
- reasoning: false,
13859
- input: ["text", "image"],
13860
- cost: {
13861
- input: 0.15,
13862
- output: 0.6,
13863
- cacheRead: 0.024999999999999998,
13864
- cacheWrite: 0,
13865
- },
13866
- contextWindow: 1048576,
13867
- maxTokens: 8192,
13868
- },
13869
- "google/gemini-2.0-flash-lite": {
13870
- id: "google/gemini-2.0-flash-lite",
13871
- name: "Gemini 2.0 Flash Lite",
13872
- api: "anthropic-messages",
13873
- provider: "vercel-ai-gateway",
13874
- baseUrl: "https://ai-gateway.vercel.sh",
13875
- reasoning: false,
13876
- input: ["text", "image"],
13877
- cost: {
13878
- input: 0.075,
13879
- output: 0.3,
13880
- cacheRead: 0.02,
13881
- cacheWrite: 0,
13882
- },
13883
- contextWindow: 1048576,
13884
- maxTokens: 8192,
13885
- },
13886
13735
  "google/gemini-2.5-flash": {
13887
13736
  id: "google/gemini-2.5-flash",
13888
13737
  name: "Gemini 2.5 Flash",
@@ -16002,7 +15851,7 @@ export const MODELS = {
16002
15851
  cacheRead: 0.2,
16003
15852
  cacheWrite: 0,
16004
15853
  },
16005
- contextWindow: 2000000,
15854
+ contextWindow: 1000000,
16006
15855
  maxTokens: 30000,
16007
15856
  },
16008
15857
  "grok-4.20-0309-reasoning": {
@@ -16019,7 +15868,7 @@ export const MODELS = {
16019
15868
  cacheRead: 0.2,
16020
15869
  cacheWrite: 0,
16021
15870
  },
16022
- contextWindow: 2000000,
15871
+ contextWindow: 1000000,
16023
15872
  maxTokens: 30000,
16024
15873
  },
16025
15874
  "grok-4.3": {
@@ -16165,6 +16014,24 @@ export const MODELS = {
16165
16014
  contextWindow: 1048576,
16166
16015
  maxTokens: 131072,
16167
16016
  },
16017
+ "mimo-v2.5-pro-ultraspeed": {
16018
+ id: "mimo-v2.5-pro-ultraspeed",
16019
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16020
+ api: "openai-completions",
16021
+ provider: "xiaomi",
16022
+ baseUrl: "https://api.xiaomimimo.com/v1",
16023
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16024
+ reasoning: true,
16025
+ input: ["text"],
16026
+ cost: {
16027
+ input: 1.305,
16028
+ output: 2.61,
16029
+ cacheRead: 0.0108,
16030
+ cacheWrite: 0,
16031
+ },
16032
+ contextWindow: 1048576,
16033
+ maxTokens: 131072,
16034
+ },
16168
16035
  },
16169
16036
  "xiaomi-token-plan-ams": {
16170
16037
  "mimo-v2-omni": {
@@ -16239,6 +16106,24 @@ export const MODELS = {
16239
16106
  contextWindow: 1048576,
16240
16107
  maxTokens: 131072,
16241
16108
  },
16109
+ "mimo-v2.5-pro-ultraspeed": {
16110
+ id: "mimo-v2.5-pro-ultraspeed",
16111
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16112
+ api: "openai-completions",
16113
+ provider: "xiaomi-token-plan-ams",
16114
+ baseUrl: "https://token-plan-ams.xiaomimimo.com/v1",
16115
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16116
+ reasoning: true,
16117
+ input: ["text"],
16118
+ cost: {
16119
+ input: 1.305,
16120
+ output: 2.61,
16121
+ cacheRead: 0.0108,
16122
+ cacheWrite: 0,
16123
+ },
16124
+ contextWindow: 1048576,
16125
+ maxTokens: 131072,
16126
+ },
16242
16127
  },
16243
16128
  "xiaomi-token-plan-cn": {
16244
16129
  "mimo-v2-omni": {
@@ -16313,6 +16198,24 @@ export const MODELS = {
16313
16198
  contextWindow: 1048576,
16314
16199
  maxTokens: 131072,
16315
16200
  },
16201
+ "mimo-v2.5-pro-ultraspeed": {
16202
+ id: "mimo-v2.5-pro-ultraspeed",
16203
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16204
+ api: "openai-completions",
16205
+ provider: "xiaomi-token-plan-cn",
16206
+ baseUrl: "https://token-plan-cn.xiaomimimo.com/v1",
16207
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16208
+ reasoning: true,
16209
+ input: ["text"],
16210
+ cost: {
16211
+ input: 1.305,
16212
+ output: 2.61,
16213
+ cacheRead: 0.0108,
16214
+ cacheWrite: 0,
16215
+ },
16216
+ contextWindow: 1048576,
16217
+ maxTokens: 131072,
16218
+ },
16316
16219
  },
16317
16220
  "xiaomi-token-plan-sgp": {
16318
16221
  "mimo-v2-omni": {
@@ -16387,6 +16290,24 @@ export const MODELS = {
16387
16290
  contextWindow: 1048576,
16388
16291
  maxTokens: 131072,
16389
16292
  },
16293
+ "mimo-v2.5-pro-ultraspeed": {
16294
+ id: "mimo-v2.5-pro-ultraspeed",
16295
+ name: "MiMo-V2.5-Pro-UltraSpeed",
16296
+ api: "openai-completions",
16297
+ provider: "xiaomi-token-plan-sgp",
16298
+ baseUrl: "https://token-plan-sgp.xiaomimimo.com/v1",
16299
+ compat: { "requiresReasoningContentOnAssistantMessages": true, "thinkingFormat": "deepseek" },
16300
+ reasoning: true,
16301
+ input: ["text"],
16302
+ cost: {
16303
+ input: 1.305,
16304
+ output: 2.61,
16305
+ cacheRead: 0.0108,
16306
+ cacheWrite: 0,
16307
+ },
16308
+ contextWindow: 1048576,
16309
+ maxTokens: 131072,
16310
+ },
16390
16311
  },
16391
16312
  "zai": {
16392
16313
  "glm-4.5-air": {