@earendil-works/pi-ai 0.78.1 → 0.79.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1086,6 +1086,59 @@ export const MODELS = {
1086
1086
  contextWindow: 262144,
1087
1087
  maxTokens: 131072,
1088
1088
  },
1089
+ "openai.gpt-5.4": {
1090
+ id: "openai.gpt-5.4",
1091
+ name: "GPT-5.4",
1092
+ api: "bedrock-converse-stream",
1093
+ provider: "amazon-bedrock",
1094
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1095
+ reasoning: true,
1096
+ thinkingLevelMap: { "xhigh": "xhigh" },
1097
+ input: ["text", "image"],
1098
+ cost: {
1099
+ input: 2.75,
1100
+ output: 16.5,
1101
+ cacheRead: 0.275,
1102
+ cacheWrite: 0,
1103
+ },
1104
+ contextWindow: 272000,
1105
+ maxTokens: 128000,
1106
+ },
1107
+ "openai.gpt-5.5": {
1108
+ id: "openai.gpt-5.5",
1109
+ name: "GPT-5.5",
1110
+ api: "bedrock-converse-stream",
1111
+ provider: "amazon-bedrock",
1112
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1113
+ reasoning: true,
1114
+ thinkingLevelMap: { "xhigh": "xhigh" },
1115
+ input: ["text", "image"],
1116
+ cost: {
1117
+ input: 5.5,
1118
+ output: 33,
1119
+ cacheRead: 0.55,
1120
+ cacheWrite: 0,
1121
+ },
1122
+ contextWindow: 272000,
1123
+ maxTokens: 128000,
1124
+ },
1125
+ "openai.gpt-oss-120b": {
1126
+ id: "openai.gpt-oss-120b",
1127
+ name: "gpt-oss-120b",
1128
+ api: "bedrock-converse-stream",
1129
+ provider: "amazon-bedrock",
1130
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1131
+ reasoning: false,
1132
+ input: ["text"],
1133
+ cost: {
1134
+ input: 0.15,
1135
+ output: 0.6,
1136
+ cacheRead: 0,
1137
+ cacheWrite: 0,
1138
+ },
1139
+ contextWindow: 128000,
1140
+ maxTokens: 16384,
1141
+ },
1089
1142
  "openai.gpt-oss-120b-1:0": {
1090
1143
  id: "openai.gpt-oss-120b-1:0",
1091
1144
  name: "gpt-oss-120b",
@@ -1103,6 +1156,23 @@ export const MODELS = {
1103
1156
  contextWindow: 128000,
1104
1157
  maxTokens: 16384,
1105
1158
  },
1159
+ "openai.gpt-oss-20b": {
1160
+ id: "openai.gpt-oss-20b",
1161
+ name: "gpt-oss-20b",
1162
+ api: "bedrock-converse-stream",
1163
+ provider: "amazon-bedrock",
1164
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1165
+ reasoning: false,
1166
+ input: ["text"],
1167
+ cost: {
1168
+ input: 0.07,
1169
+ output: 0.3,
1170
+ cacheRead: 0,
1171
+ cacheWrite: 0,
1172
+ },
1173
+ contextWindow: 128000,
1174
+ maxTokens: 16384,
1175
+ },
1106
1176
  "openai.gpt-oss-20b-1:0": {
1107
1177
  id: "openai.gpt-oss-20b-1:0",
1108
1178
  name: "gpt-oss-20b",
@@ -3887,6 +3957,24 @@ export const MODELS = {
3887
3957
  contextWindow: 202800,
3888
3958
  maxTokens: 131072,
3889
3959
  },
3960
+ "accounts/fireworks/routers/kimi-k2p6-fast": {
3961
+ id: "accounts/fireworks/routers/kimi-k2p6-fast",
3962
+ name: "Kimi K2.6 Fast",
3963
+ api: "anthropic-messages",
3964
+ provider: "fireworks",
3965
+ baseUrl: "https://api.fireworks.ai/inference",
3966
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3967
+ reasoning: true,
3968
+ input: ["text", "image"],
3969
+ cost: {
3970
+ input: 2,
3971
+ output: 8,
3972
+ cacheRead: 0.3,
3973
+ cacheWrite: 0,
3974
+ },
3975
+ contextWindow: 262000,
3976
+ maxTokens: 262000,
3977
+ },
3890
3978
  "accounts/fireworks/routers/kimi-k2p6-turbo": {
3891
3979
  id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3892
3980
  name: "Kimi K2.6 Turbo",
@@ -6019,11 +6107,11 @@ export const MODELS = {
6019
6107
  api: "mistral-conversations",
6020
6108
  provider: "mistral",
6021
6109
  baseUrl: "https://api.mistral.ai",
6022
- reasoning: true,
6110
+ reasoning: false,
6023
6111
  input: ["text", "image"],
6024
6112
  cost: {
6025
- input: 1.5,
6026
- output: 7.5,
6113
+ input: 0.4,
6114
+ output: 2,
6027
6115
  cacheRead: 0,
6028
6116
  cacheWrite: 0,
6029
6117
  },
@@ -6705,6 +6793,25 @@ export const MODELS = {
6705
6793
  contextWindow: 262144,
6706
6794
  maxTokens: 262144,
6707
6795
  },
6796
+ "nvidia/nemotron-3-ultra-550b-a55b": {
6797
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
6798
+ name: "Nemotron 3 Ultra 550B A55B",
6799
+ api: "openai-completions",
6800
+ provider: "nvidia",
6801
+ baseUrl: "https://integrate.api.nvidia.com/v1",
6802
+ headers: { "NVCF-POLL-SECONDS": "3600" },
6803
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false },
6804
+ reasoning: true,
6805
+ input: ["text"],
6806
+ cost: {
6807
+ input: 0.5,
6808
+ output: 2.5,
6809
+ cacheRead: 0.15,
6810
+ cacheWrite: 0,
6811
+ },
6812
+ contextWindow: 1000000,
6813
+ maxTokens: 65536,
6814
+ },
6708
6815
  "nvidia/nvidia-nemotron-nano-9b-v2": {
6709
6816
  id: "nvidia/nvidia-nemotron-nano-9b-v2",
6710
6817
  name: "nvidia-nemotron-nano-9b-v2",
@@ -8350,23 +8457,6 @@ export const MODELS = {
8350
8457
  contextWindow: 204800,
8351
8458
  maxTokens: 131072,
8352
8459
  },
8353
- "minimax-m3-free": {
8354
- id: "minimax-m3-free",
8355
- name: "MiniMax M3 Free",
8356
- api: "anthropic-messages",
8357
- provider: "opencode",
8358
- baseUrl: "https://opencode.ai/zen",
8359
- reasoning: true,
8360
- input: ["text", "image"],
8361
- cost: {
8362
- input: 0,
8363
- output: 0,
8364
- cacheRead: 0,
8365
- cacheWrite: 0,
8366
- },
8367
- contextWindow: 200000,
8368
- maxTokens: 32000,
8369
- },
8370
8460
  "nemotron-3-ultra-free": {
8371
8461
  id: "nemotron-3-ultra-free",
8372
8462
  name: "Nemotron 3 Ultra Free",
@@ -8605,9 +8695,9 @@ export const MODELS = {
8605
8695
  reasoning: true,
8606
8696
  input: ["text", "image"],
8607
8697
  cost: {
8608
- input: 0.6,
8609
- output: 2.4,
8610
- cacheRead: 0.12,
8698
+ input: 0.3,
8699
+ output: 1.2,
8700
+ cacheRead: 0.06,
8611
8701
  cacheWrite: 0,
8612
8702
  },
8613
8703
  contextWindow: 512000,
@@ -8628,7 +8718,7 @@ export const MODELS = {
8628
8718
  cacheRead: 0.05,
8629
8719
  cacheWrite: 0.625,
8630
8720
  },
8631
- contextWindow: 262144,
8721
+ contextWindow: 1000000,
8632
8722
  maxTokens: 65536,
8633
8723
  },
8634
8724
  "qwen3.7-max": {
@@ -8662,7 +8752,7 @@ export const MODELS = {
8662
8752
  cacheRead: 0.04,
8663
8753
  cacheWrite: 0.5,
8664
8754
  },
8665
- contextWindow: 262144,
8755
+ contextWindow: 1000000,
8666
8756
  maxTokens: 65536,
8667
8757
  },
8668
8758
  },
@@ -9098,23 +9188,6 @@ export const MODELS = {
9098
9188
  contextWindow: 2000000,
9099
9189
  maxTokens: 30000,
9100
9190
  },
9101
- "baidu/ernie-4.5-vl-28b-a3b": {
9102
- id: "baidu/ernie-4.5-vl-28b-a3b",
9103
- name: "Baidu: ERNIE 4.5 VL 28B A3B",
9104
- api: "openai-completions",
9105
- provider: "openrouter",
9106
- baseUrl: "https://openrouter.ai/api/v1",
9107
- reasoning: true,
9108
- input: ["text", "image"],
9109
- cost: {
9110
- input: 0.14,
9111
- output: 0.56,
9112
- cacheRead: 0,
9113
- cacheWrite: 0,
9114
- },
9115
- contextWindow: 131072,
9116
- maxTokens: 8000,
9117
- },
9118
9191
  "bytedance-seed/seed-1.6": {
9119
9192
  id: "bytedance-seed/seed-1.6",
9120
9193
  name: "ByteDance Seed: Seed 1.6",
@@ -9621,8 +9694,8 @@ export const MODELS = {
9621
9694
  reasoning: false,
9622
9695
  input: ["text", "image"],
9623
9696
  cost: {
9624
- input: 0.04,
9625
- output: 0.13,
9697
+ input: 0.049999999999999996,
9698
+ output: 0.15,
9626
9699
  cacheRead: 0,
9627
9700
  cacheWrite: 0,
9628
9701
  },
@@ -9690,12 +9763,12 @@ export const MODELS = {
9690
9763
  input: ["text", "image"],
9691
9764
  cost: {
9692
9765
  input: 0.12,
9693
- output: 0.37,
9694
- cacheRead: 0,
9766
+ output: 0.36,
9767
+ cacheRead: 0.09,
9695
9768
  cacheWrite: 0,
9696
9769
  },
9697
9770
  contextWindow: 262144,
9698
- maxTokens: 16384,
9771
+ maxTokens: 8192,
9699
9772
  },
9700
9773
  "google/gemma-4-31b-it:free": {
9701
9774
  id: "google/gemma-4-31b-it:free",
@@ -9844,7 +9917,7 @@ export const MODELS = {
9844
9917
  input: ["text"],
9845
9918
  cost: {
9846
9919
  input: 0.02,
9847
- output: 0.049999999999999996,
9920
+ output: 0.03,
9848
9921
  cacheRead: 0,
9849
9922
  cacheWrite: 0,
9850
9923
  },
@@ -9911,7 +9984,7 @@ export const MODELS = {
9911
9984
  reasoning: false,
9912
9985
  input: ["text", "image"],
9913
9986
  cost: {
9914
- input: 0.08,
9987
+ input: 0.09999999999999999,
9915
9988
  output: 0.3,
9916
9989
  cacheRead: 0,
9917
9990
  cacheWrite: 0,
@@ -10002,7 +10075,7 @@ export const MODELS = {
10002
10075
  cacheWrite: 0,
10003
10076
  },
10004
10077
  contextWindow: 204800,
10005
- maxTokens: 131072,
10078
+ maxTokens: 196608,
10006
10079
  },
10007
10080
  "minimax/minimax-m3": {
10008
10081
  id: "minimax/minimax-m3",
@@ -10388,13 +10461,13 @@ export const MODELS = {
10388
10461
  reasoning: true,
10389
10462
  input: ["text", "image"],
10390
10463
  cost: {
10391
- input: 0.684,
10392
- output: 3.42,
10393
- cacheRead: 0.144,
10464
+ input: 0.6799999999999999,
10465
+ output: 3.41,
10466
+ cacheRead: 0.33999999999999997,
10394
10467
  cacheWrite: 0,
10395
10468
  },
10396
10469
  contextWindow: 262144,
10397
- maxTokens: 262144,
10470
+ maxTokens: 262142,
10398
10471
  },
10399
10472
  "moonshotai/kimi-k2.6:free": {
10400
10473
  id: "moonshotai/kimi-k2.6:free",
@@ -10414,23 +10487,6 @@ export const MODELS = {
10414
10487
  contextWindow: 262144,
10415
10488
  maxTokens: 4096,
10416
10489
  },
10417
- "nex-agi/deepseek-v3.1-nex-n1": {
10418
- id: "nex-agi/deepseek-v3.1-nex-n1",
10419
- name: "Nex AGI: DeepSeek V3.1 Nex N1",
10420
- api: "openai-completions",
10421
- provider: "openrouter",
10422
- baseUrl: "https://openrouter.ai/api/v1",
10423
- reasoning: false,
10424
- input: ["text"],
10425
- cost: {
10426
- input: 0.135,
10427
- output: 0.5,
10428
- cacheRead: 0,
10429
- cacheWrite: 0,
10430
- },
10431
- contextWindow: 131072,
10432
- maxTokens: 163840,
10433
- },
10434
10490
  "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
10435
10491
  id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
10436
10492
  name: "NVIDIA: Llama 3.3 Nemotron Super 49B V1.5",
@@ -10440,7 +10496,7 @@ export const MODELS = {
10440
10496
  reasoning: true,
10441
10497
  input: ["text"],
10442
10498
  cost: {
10443
- input: 0.09999999999999999,
10499
+ input: 0.39999999999999997,
10444
10500
  output: 0.39999999999999997,
10445
10501
  cacheRead: 0,
10446
10502
  cacheWrite: 0,
@@ -10686,23 +10742,6 @@ export const MODELS = {
10686
10742
  contextWindow: 8191,
10687
10743
  maxTokens: 4096,
10688
10744
  },
10689
- "openai/gpt-4-1106-preview": {
10690
- id: "openai/gpt-4-1106-preview",
10691
- name: "OpenAI: GPT-4 Turbo (older v1106)",
10692
- api: "openai-completions",
10693
- provider: "openrouter",
10694
- baseUrl: "https://openrouter.ai/api/v1",
10695
- reasoning: false,
10696
- input: ["text"],
10697
- cost: {
10698
- input: 10,
10699
- output: 30,
10700
- cacheRead: 0,
10701
- cacheWrite: 0,
10702
- },
10703
- contextWindow: 128000,
10704
- maxTokens: 4096,
10705
- },
10706
10745
  "openai/gpt-4-turbo": {
10707
10746
  id: "openai/gpt-4-turbo",
10708
10747
  name: "OpenAI: GPT-4 Turbo",
@@ -11778,7 +11817,7 @@ export const MODELS = {
11778
11817
  reasoning: false,
11779
11818
  input: ["text"],
11780
11819
  cost: {
11781
- input: 0.071,
11820
+ input: 0.09,
11782
11821
  output: 0.09999999999999999,
11783
11822
  cacheRead: 0,
11784
11823
  cacheWrite: 0,
@@ -11812,13 +11851,13 @@ export const MODELS = {
11812
11851
  reasoning: true,
11813
11852
  input: ["text"],
11814
11853
  cost: {
11815
- input: 0.09,
11816
- output: 0.44999999999999996,
11854
+ input: 0.12,
11855
+ output: 0.5,
11817
11856
  cacheRead: 0,
11818
11857
  cacheWrite: 0,
11819
11858
  },
11820
11859
  contextWindow: 131072,
11821
- maxTokens: 20000,
11860
+ maxTokens: 16384,
11822
11861
  },
11823
11862
  "qwen/qwen3-30b-a3b-instruct-2507": {
11824
11863
  id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -12271,13 +12310,13 @@ export const MODELS = {
12271
12310
  reasoning: true,
12272
12311
  input: ["text", "image"],
12273
12312
  cost: {
12274
- input: 0.04,
12313
+ input: 0.09999999999999999,
12275
12314
  output: 0.15,
12276
12315
  cacheRead: 0,
12277
12316
  cacheWrite: 0,
12278
12317
  },
12279
12318
  contextWindow: 262144,
12280
- maxTokens: 81920,
12319
+ maxTokens: 262144,
12281
12320
  },
12282
12321
  "qwen/qwen3.5-flash-02-23": {
12283
12322
  id: "qwen/qwen3.5-flash-02-23",
@@ -12339,13 +12378,13 @@ export const MODELS = {
12339
12378
  reasoning: true,
12340
12379
  input: ["text", "image"],
12341
12380
  cost: {
12342
- input: 0.29,
12343
- output: 3.1999999999999997,
12381
+ input: 0.28900000000000003,
12382
+ output: 2.4,
12344
12383
  cacheRead: 0,
12345
12384
  cacheWrite: 0,
12346
12385
  },
12347
12386
  contextWindow: 262144,
12348
- maxTokens: 262140,
12387
+ maxTokens: 131072,
12349
12388
  },
12350
12389
  "qwen/qwen3.6-35b-a3b": {
12351
12390
  id: "qwen/qwen3.6-35b-a3b",
@@ -12483,23 +12522,6 @@ export const MODELS = {
12483
12522
  contextWindow: 256000,
12484
12523
  maxTokens: 128000,
12485
12524
  },
12486
- "sao10k/l3-euryale-70b": {
12487
- id: "sao10k/l3-euryale-70b",
12488
- name: "Sao10k: Llama 3 Euryale 70B v2.1",
12489
- api: "openai-completions",
12490
- provider: "openrouter",
12491
- baseUrl: "https://openrouter.ai/api/v1",
12492
- reasoning: false,
12493
- input: ["text"],
12494
- cost: {
12495
- input: 1.48,
12496
- output: 1.48,
12497
- cacheRead: 0,
12498
- cacheWrite: 0,
12499
- },
12500
- contextWindow: 8192,
12501
- maxTokens: 8192,
12502
- },
12503
12525
  "sao10k/l3.1-euryale-70b": {
12504
12526
  id: "sao10k/l3.1-euryale-70b",
12505
12527
  name: "Sao10K: Llama 3.1 Euryale 70B v2.2",
@@ -13036,13 +13058,13 @@ export const MODELS = {
13036
13058
  reasoning: true,
13037
13059
  input: ["text", "image"],
13038
13060
  cost: {
13039
- input: 0.684,
13040
- output: 3.42,
13041
- cacheRead: 0.144,
13061
+ input: 0.6799999999999999,
13062
+ output: 3.41,
13063
+ cacheRead: 0.33999999999999997,
13042
13064
  cacheWrite: 0,
13043
13065
  },
13044
13066
  contextWindow: 262144,
13045
- maxTokens: 262144,
13067
+ maxTokens: 262142,
13046
13068
  },
13047
13069
  "~openai/gpt-latest": {
13048
13070
  id: "~openai/gpt-latest",
@@ -13233,7 +13255,7 @@ export const MODELS = {
13233
13255
  },
13234
13256
  "deepseek-ai/DeepSeek-V3": {
13235
13257
  id: "deepseek-ai/DeepSeek-V3",
13236
- name: "DeepSeek V3",
13258
+ name: "DeepSeek-V3",
13237
13259
  api: "openai-completions",
13238
13260
  provider: "together",
13239
13261
  baseUrl: "https://api.together.ai/v1",
@@ -13381,6 +13403,25 @@ export const MODELS = {
13381
13403
  contextWindow: 262144,
13382
13404
  maxTokens: 131000,
13383
13405
  },
13406
+ "nvidia/nemotron-3-ultra-550b-a55b": {
13407
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
13408
+ name: "Nemotron 3 Ultra 550B A55B",
13409
+ api: "openai-completions",
13410
+ provider: "together",
13411
+ baseUrl: "https://api.together.ai/v1",
13412
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13413
+ reasoning: true,
13414
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13415
+ input: ["text"],
13416
+ cost: {
13417
+ input: 0.6,
13418
+ output: 3.6,
13419
+ cacheRead: 0.2,
13420
+ cacheWrite: 0,
13421
+ },
13422
+ contextWindow: 512300,
13423
+ maxTokens: 512300,
13424
+ },
13384
13425
  "openai/gpt-oss-120b": {
13385
13426
  id: "openai/gpt-oss-120b",
13386
13427
  name: "GPT OSS 120B",
@@ -14210,40 +14251,6 @@ export const MODELS = {
14210
14251
  contextWindow: 1000000,
14211
14252
  maxTokens: 384000,
14212
14253
  },
14213
- "google/gemini-2.0-flash": {
14214
- id: "google/gemini-2.0-flash",
14215
- name: "Gemini 2.0 Flash",
14216
- api: "anthropic-messages",
14217
- provider: "vercel-ai-gateway",
14218
- baseUrl: "https://ai-gateway.vercel.sh",
14219
- reasoning: false,
14220
- input: ["text", "image"],
14221
- cost: {
14222
- input: 0.15,
14223
- output: 0.6,
14224
- cacheRead: 0.024999999999999998,
14225
- cacheWrite: 0,
14226
- },
14227
- contextWindow: 1048576,
14228
- maxTokens: 8192,
14229
- },
14230
- "google/gemini-2.0-flash-lite": {
14231
- id: "google/gemini-2.0-flash-lite",
14232
- name: "Gemini 2.0 Flash Lite",
14233
- api: "anthropic-messages",
14234
- provider: "vercel-ai-gateway",
14235
- baseUrl: "https://ai-gateway.vercel.sh",
14236
- reasoning: false,
14237
- input: ["text", "image"],
14238
- cost: {
14239
- input: 0.075,
14240
- output: 0.3,
14241
- cacheRead: 0.02,
14242
- cacheWrite: 0,
14243
- },
14244
- contextWindow: 1048576,
14245
- maxTokens: 8192,
14246
- },
14247
14254
  "google/gemini-2.5-flash": {
14248
14255
  id: "google/gemini-2.5-flash",
14249
14256
  name: "Gemini 2.5 Flash",
@@ -15086,12 +15093,12 @@ export const MODELS = {
15086
15093
  reasoning: true,
15087
15094
  input: ["text"],
15088
15095
  cost: {
15089
- input: 0.5,
15090
- output: 2.5,
15091
- cacheRead: 0.15,
15096
+ input: 0.6,
15097
+ output: 2.4,
15098
+ cacheRead: 0.12,
15092
15099
  cacheWrite: 0,
15093
15100
  },
15094
- contextWindow: 262144,
15101
+ contextWindow: 1000000,
15095
15102
  maxTokens: 65000,
15096
15103
  },
15097
15104
  "nvidia/nemotron-nano-12b-v2-vl": {