@fleetagent/pi-ai 0.0.7 → 0.0.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1081,6 +1081,59 @@ export const MODELS = {
1081
1081
  contextWindow: 262144,
1082
1082
  maxTokens: 131072,
1083
1083
  },
1084
+ "openai.gpt-5.4": {
1085
+ id: "openai.gpt-5.4",
1086
+ name: "GPT-5.4",
1087
+ api: "bedrock-converse-stream",
1088
+ provider: "amazon-bedrock",
1089
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1090
+ reasoning: true,
1091
+ thinkingLevelMap: { "xhigh": "xhigh" },
1092
+ input: ["text", "image"],
1093
+ cost: {
1094
+ input: 2.75,
1095
+ output: 16.5,
1096
+ cacheRead: 0.275,
1097
+ cacheWrite: 0,
1098
+ },
1099
+ contextWindow: 272000,
1100
+ maxTokens: 128000,
1101
+ },
1102
+ "openai.gpt-5.5": {
1103
+ id: "openai.gpt-5.5",
1104
+ name: "GPT-5.5",
1105
+ api: "bedrock-converse-stream",
1106
+ provider: "amazon-bedrock",
1107
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1108
+ reasoning: true,
1109
+ thinkingLevelMap: { "xhigh": "xhigh" },
1110
+ input: ["text", "image"],
1111
+ cost: {
1112
+ input: 5.5,
1113
+ output: 33,
1114
+ cacheRead: 0.55,
1115
+ cacheWrite: 0,
1116
+ },
1117
+ contextWindow: 272000,
1118
+ maxTokens: 128000,
1119
+ },
1120
+ "openai.gpt-oss-120b": {
1121
+ id: "openai.gpt-oss-120b",
1122
+ name: "gpt-oss-120b",
1123
+ api: "bedrock-converse-stream",
1124
+ provider: "amazon-bedrock",
1125
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1126
+ reasoning: false,
1127
+ input: ["text"],
1128
+ cost: {
1129
+ input: 0.15,
1130
+ output: 0.6,
1131
+ cacheRead: 0,
1132
+ cacheWrite: 0,
1133
+ },
1134
+ contextWindow: 128000,
1135
+ maxTokens: 16384,
1136
+ },
1084
1137
  "openai.gpt-oss-120b-1:0": {
1085
1138
  id: "openai.gpt-oss-120b-1:0",
1086
1139
  name: "gpt-oss-120b",
@@ -1098,6 +1151,23 @@ export const MODELS = {
1098
1151
  contextWindow: 128000,
1099
1152
  maxTokens: 16384,
1100
1153
  },
1154
+ "openai.gpt-oss-20b": {
1155
+ id: "openai.gpt-oss-20b",
1156
+ name: "gpt-oss-20b",
1157
+ api: "bedrock-converse-stream",
1158
+ provider: "amazon-bedrock",
1159
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1160
+ reasoning: false,
1161
+ input: ["text"],
1162
+ cost: {
1163
+ input: 0.07,
1164
+ output: 0.3,
1165
+ cacheRead: 0,
1166
+ cacheWrite: 0,
1167
+ },
1168
+ contextWindow: 128000,
1169
+ maxTokens: 16384,
1170
+ },
1101
1171
  "openai.gpt-oss-20b-1:0": {
1102
1172
  id: "openai.gpt-oss-20b-1:0",
1103
1173
  name: "gpt-oss-20b",
@@ -3822,6 +3892,24 @@ export const MODELS = {
3822
3892
  contextWindow: 202800,
3823
3893
  maxTokens: 131072,
3824
3894
  },
3895
+ "accounts/fireworks/routers/kimi-k2p6-fast": {
3896
+ id: "accounts/fireworks/routers/kimi-k2p6-fast",
3897
+ name: "Kimi K2.6 Fast",
3898
+ api: "anthropic-messages",
3899
+ provider: "fireworks",
3900
+ baseUrl: "https://api.fireworks.ai/inference",
3901
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3902
+ reasoning: true,
3903
+ input: ["text", "image"],
3904
+ cost: {
3905
+ input: 2,
3906
+ output: 8,
3907
+ cacheRead: 0.3,
3908
+ cacheWrite: 0,
3909
+ },
3910
+ contextWindow: 262000,
3911
+ maxTokens: 262000,
3912
+ },
3825
3913
  "accounts/fireworks/routers/kimi-k2p6-turbo": {
3826
3914
  id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3827
3915
  name: "Kimi K2.6 Turbo",
@@ -5919,11 +6007,11 @@ export const MODELS = {
5919
6007
  api: "mistral-conversations",
5920
6008
  provider: "mistral",
5921
6009
  baseUrl: "https://api.mistral.ai",
5922
- reasoning: true,
6010
+ reasoning: false,
5923
6011
  input: ["text", "image"],
5924
6012
  cost: {
5925
- input: 1.5,
5926
- output: 7.5,
6013
+ input: 0.4,
6014
+ output: 2,
5927
6015
  cacheRead: 0,
5928
6016
  cacheWrite: 0,
5929
6017
  },
@@ -7903,23 +7991,6 @@ export const MODELS = {
7903
7991
  contextWindow: 204800,
7904
7992
  maxTokens: 131072,
7905
7993
  },
7906
- "minimax-m3-free": {
7907
- id: "minimax-m3-free",
7908
- name: "MiniMax M3 Free",
7909
- api: "anthropic-messages",
7910
- provider: "opencode",
7911
- baseUrl: "https://opencode.ai/zen",
7912
- reasoning: true,
7913
- input: ["text", "image"],
7914
- cost: {
7915
- input: 0,
7916
- output: 0,
7917
- cacheRead: 0,
7918
- cacheWrite: 0,
7919
- },
7920
- contextWindow: 200000,
7921
- maxTokens: 32000,
7922
- },
7923
7994
  "nemotron-3-ultra-free": {
7924
7995
  id: "nemotron-3-ultra-free",
7925
7996
  name: "Nemotron 3 Ultra Free",
@@ -8181,7 +8252,7 @@ export const MODELS = {
8181
8252
  cacheRead: 0.05,
8182
8253
  cacheWrite: 0.625,
8183
8254
  },
8184
- contextWindow: 262144,
8255
+ contextWindow: 1000000,
8185
8256
  maxTokens: 65536,
8186
8257
  },
8187
8258
  "qwen3.7-max": {
@@ -8215,7 +8286,7 @@ export const MODELS = {
8215
8286
  cacheRead: 0.04,
8216
8287
  cacheWrite: 0.5,
8217
8288
  },
8218
- contextWindow: 262144,
8289
+ contextWindow: 1000000,
8219
8290
  maxTokens: 65536,
8220
8291
  },
8221
8292
  },
@@ -8649,23 +8720,6 @@ export const MODELS = {
8649
8720
  contextWindow: 2000000,
8650
8721
  maxTokens: 30000,
8651
8722
  },
8652
- "baidu/ernie-4.5-vl-28b-a3b": {
8653
- id: "baidu/ernie-4.5-vl-28b-a3b",
8654
- name: "Baidu: ERNIE 4.5 VL 28B A3B",
8655
- api: "openai-completions",
8656
- provider: "openrouter",
8657
- baseUrl: "https://openrouter.ai/api/v1",
8658
- reasoning: true,
8659
- input: ["text", "image"],
8660
- cost: {
8661
- input: 0.14,
8662
- output: 0.56,
8663
- cacheRead: 0,
8664
- cacheWrite: 0,
8665
- },
8666
- contextWindow: 131072,
8667
- maxTokens: 8000,
8668
- },
8669
8723
  "bytedance-seed/seed-1.6": {
8670
8724
  id: "bytedance-seed/seed-1.6",
8671
8725
  name: "ByteDance Seed: Seed 1.6",
@@ -9172,8 +9226,8 @@ export const MODELS = {
9172
9226
  reasoning: false,
9173
9227
  input: ["text", "image"],
9174
9228
  cost: {
9175
- input: 0.04,
9176
- output: 0.13,
9229
+ input: 0.049999999999999996,
9230
+ output: 0.15,
9177
9231
  cacheRead: 0,
9178
9232
  cacheWrite: 0,
9179
9233
  },
@@ -9241,12 +9295,12 @@ export const MODELS = {
9241
9295
  input: ["text", "image"],
9242
9296
  cost: {
9243
9297
  input: 0.12,
9244
- output: 0.37,
9245
- cacheRead: 0,
9298
+ output: 0.36,
9299
+ cacheRead: 0.09,
9246
9300
  cacheWrite: 0,
9247
9301
  },
9248
9302
  contextWindow: 262144,
9249
- maxTokens: 16384,
9303
+ maxTokens: 8192,
9250
9304
  },
9251
9305
  "google/gemma-4-31b-it:free": {
9252
9306
  id: "google/gemma-4-31b-it:free",
@@ -9395,7 +9449,7 @@ export const MODELS = {
9395
9449
  input: ["text"],
9396
9450
  cost: {
9397
9451
  input: 0.02,
9398
- output: 0.049999999999999996,
9452
+ output: 0.03,
9399
9453
  cacheRead: 0,
9400
9454
  cacheWrite: 0,
9401
9455
  },
@@ -9462,7 +9516,7 @@ export const MODELS = {
9462
9516
  reasoning: false,
9463
9517
  input: ["text", "image"],
9464
9518
  cost: {
9465
- input: 0.08,
9519
+ input: 0.09999999999999999,
9466
9520
  output: 0.3,
9467
9521
  cacheRead: 0,
9468
9522
  cacheWrite: 0,
@@ -9553,7 +9607,7 @@ export const MODELS = {
9553
9607
  cacheWrite: 0,
9554
9608
  },
9555
9609
  contextWindow: 204800,
9556
- maxTokens: 131072,
9610
+ maxTokens: 196608,
9557
9611
  },
9558
9612
  "minimax/minimax-m3": {
9559
9613
  id: "minimax/minimax-m3",
@@ -9991,7 +10045,7 @@ export const MODELS = {
9991
10045
  reasoning: true,
9992
10046
  input: ["text"],
9993
10047
  cost: {
9994
- input: 0.09999999999999999,
10048
+ input: 0.39999999999999997,
9995
10049
  output: 0.39999999999999997,
9996
10050
  cacheRead: 0,
9997
10051
  cacheWrite: 0,
@@ -10237,23 +10291,6 @@ export const MODELS = {
10237
10291
  contextWindow: 8191,
10238
10292
  maxTokens: 4096,
10239
10293
  },
10240
- "openai/gpt-4-1106-preview": {
10241
- id: "openai/gpt-4-1106-preview",
10242
- name: "OpenAI: GPT-4 Turbo (older v1106)",
10243
- api: "openai-completions",
10244
- provider: "openrouter",
10245
- baseUrl: "https://openrouter.ai/api/v1",
10246
- reasoning: false,
10247
- input: ["text"],
10248
- cost: {
10249
- input: 10,
10250
- output: 30,
10251
- cacheRead: 0,
10252
- cacheWrite: 0,
10253
- },
10254
- contextWindow: 128000,
10255
- maxTokens: 4096,
10256
- },
10257
10294
  "openai/gpt-4-turbo": {
10258
10295
  id: "openai/gpt-4-turbo",
10259
10296
  name: "OpenAI: GPT-4 Turbo",
@@ -11329,7 +11366,7 @@ export const MODELS = {
11329
11366
  reasoning: false,
11330
11367
  input: ["text"],
11331
11368
  cost: {
11332
- input: 0.071,
11369
+ input: 0.09,
11333
11370
  output: 0.09999999999999999,
11334
11371
  cacheRead: 0,
11335
11372
  cacheWrite: 0,
@@ -11363,13 +11400,13 @@ export const MODELS = {
11363
11400
  reasoning: true,
11364
11401
  input: ["text"],
11365
11402
  cost: {
11366
- input: 0.09,
11367
- output: 0.44999999999999996,
11403
+ input: 0.12,
11404
+ output: 0.5,
11368
11405
  cacheRead: 0,
11369
11406
  cacheWrite: 0,
11370
11407
  },
11371
11408
  contextWindow: 131072,
11372
- maxTokens: 20000,
11409
+ maxTokens: 16384,
11373
11410
  },
11374
11411
  "qwen/qwen3-30b-a3b-instruct-2507": {
11375
11412
  id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -11822,13 +11859,13 @@ export const MODELS = {
11822
11859
  reasoning: true,
11823
11860
  input: ["text", "image"],
11824
11861
  cost: {
11825
- input: 0.04,
11862
+ input: 0.09999999999999999,
11826
11863
  output: 0.15,
11827
11864
  cacheRead: 0,
11828
11865
  cacheWrite: 0,
11829
11866
  },
11830
11867
  contextWindow: 262144,
11831
- maxTokens: 81920,
11868
+ maxTokens: 262144,
11832
11869
  },
11833
11870
  "qwen/qwen3.5-flash-02-23": {
11834
11871
  id: "qwen/qwen3.5-flash-02-23",
@@ -11890,13 +11927,13 @@ export const MODELS = {
11890
11927
  reasoning: true,
11891
11928
  input: ["text", "image"],
11892
11929
  cost: {
11893
- input: 0.29,
11894
- output: 3.1999999999999997,
11930
+ input: 0.28900000000000003,
11931
+ output: 2.4,
11895
11932
  cacheRead: 0,
11896
11933
  cacheWrite: 0,
11897
11934
  },
11898
11935
  contextWindow: 262144,
11899
- maxTokens: 262140,
11936
+ maxTokens: 131072,
11900
11937
  },
11901
11938
  "qwen/qwen3.6-35b-a3b": {
11902
11939
  id: "qwen/qwen3.6-35b-a3b",
@@ -12034,23 +12071,6 @@ export const MODELS = {
12034
12071
  contextWindow: 256000,
12035
12072
  maxTokens: 128000,
12036
12073
  },
12037
- "sao10k/l3-euryale-70b": {
12038
- id: "sao10k/l3-euryale-70b",
12039
- name: "Sao10k: Llama 3 Euryale 70B v2.1",
12040
- api: "openai-completions",
12041
- provider: "openrouter",
12042
- baseUrl: "https://openrouter.ai/api/v1",
12043
- reasoning: false,
12044
- input: ["text"],
12045
- cost: {
12046
- input: 1.48,
12047
- output: 1.48,
12048
- cacheRead: 0,
12049
- cacheWrite: 0,
12050
- },
12051
- contextWindow: 8192,
12052
- maxTokens: 8192,
12053
- },
12054
12074
  "sao10k/l3.1-euryale-70b": {
12055
12075
  id: "sao10k/l3.1-euryale-70b",
12056
12076
  name: "Sao10K: Llama 3.1 Euryale 70B v2.2",
@@ -12784,7 +12804,7 @@ export const MODELS = {
12784
12804
  },
12785
12805
  "deepseek-ai/DeepSeek-V3": {
12786
12806
  id: "deepseek-ai/DeepSeek-V3",
12787
- name: "DeepSeek V3",
12807
+ name: "DeepSeek-V3",
12788
12808
  api: "openai-completions",
12789
12809
  provider: "together",
12790
12810
  baseUrl: "https://api.together.ai/v1",
@@ -12932,6 +12952,25 @@ export const MODELS = {
12932
12952
  contextWindow: 262144,
12933
12953
  maxTokens: 131000,
12934
12954
  },
12955
+ "nvidia/nemotron-3-ultra-550b-a55b": {
12956
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
12957
+ name: "Nemotron 3 Ultra 550B A55B",
12958
+ api: "openai-completions",
12959
+ provider: "together",
12960
+ baseUrl: "https://api.together.ai/v1",
12961
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
12962
+ reasoning: true,
12963
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
12964
+ input: ["text"],
12965
+ cost: {
12966
+ input: 0.6,
12967
+ output: 3.6,
12968
+ cacheRead: 0.2,
12969
+ cacheWrite: 0,
12970
+ },
12971
+ contextWindow: 512300,
12972
+ maxTokens: 512300,
12973
+ },
12935
12974
  "openai/gpt-oss-120b": {
12936
12975
  id: "openai/gpt-oss-120b",
12937
12976
  name: "GPT OSS 120B",
@@ -14636,12 +14675,12 @@ export const MODELS = {
14636
14675
  reasoning: true,
14637
14676
  input: ["text"],
14638
14677
  cost: {
14639
- input: 0.5,
14640
- output: 2.5,
14641
- cacheRead: 0.15,
14678
+ input: 0.6,
14679
+ output: 2.4,
14680
+ cacheRead: 0.12,
14642
14681
  cacheWrite: 0,
14643
14682
  },
14644
- contextWindow: 262144,
14683
+ contextWindow: 1000000,
14645
14684
  maxTokens: 65000,
14646
14685
  },
14647
14686
  "nvidia/nemotron-nano-12b-v2-vl": {