@fleetagent/pi-ai 0.0.7 → 0.0.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1081,6 +1081,59 @@ export const MODELS = {
1081
1081
  contextWindow: 262144,
1082
1082
  maxTokens: 131072,
1083
1083
  },
1084
+ "openai.gpt-5.4": {
1085
+ id: "openai.gpt-5.4",
1086
+ name: "GPT-5.4",
1087
+ api: "bedrock-converse-stream",
1088
+ provider: "amazon-bedrock",
1089
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1090
+ reasoning: true,
1091
+ thinkingLevelMap: { "xhigh": "xhigh" },
1092
+ input: ["text", "image"],
1093
+ cost: {
1094
+ input: 2.75,
1095
+ output: 16.5,
1096
+ cacheRead: 0.275,
1097
+ cacheWrite: 0,
1098
+ },
1099
+ contextWindow: 272000,
1100
+ maxTokens: 128000,
1101
+ },
1102
+ "openai.gpt-5.5": {
1103
+ id: "openai.gpt-5.5",
1104
+ name: "GPT-5.5",
1105
+ api: "bedrock-converse-stream",
1106
+ provider: "amazon-bedrock",
1107
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1108
+ reasoning: true,
1109
+ thinkingLevelMap: { "xhigh": "xhigh" },
1110
+ input: ["text", "image"],
1111
+ cost: {
1112
+ input: 5.5,
1113
+ output: 33,
1114
+ cacheRead: 0.55,
1115
+ cacheWrite: 0,
1116
+ },
1117
+ contextWindow: 272000,
1118
+ maxTokens: 128000,
1119
+ },
1120
+ "openai.gpt-oss-120b": {
1121
+ id: "openai.gpt-oss-120b",
1122
+ name: "gpt-oss-120b",
1123
+ api: "bedrock-converse-stream",
1124
+ provider: "amazon-bedrock",
1125
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1126
+ reasoning: false,
1127
+ input: ["text"],
1128
+ cost: {
1129
+ input: 0.15,
1130
+ output: 0.6,
1131
+ cacheRead: 0,
1132
+ cacheWrite: 0,
1133
+ },
1134
+ contextWindow: 128000,
1135
+ maxTokens: 16384,
1136
+ },
1084
1137
  "openai.gpt-oss-120b-1:0": {
1085
1138
  id: "openai.gpt-oss-120b-1:0",
1086
1139
  name: "gpt-oss-120b",
@@ -1098,6 +1151,23 @@ export const MODELS = {
1098
1151
  contextWindow: 128000,
1099
1152
  maxTokens: 16384,
1100
1153
  },
1154
+ "openai.gpt-oss-20b": {
1155
+ id: "openai.gpt-oss-20b",
1156
+ name: "gpt-oss-20b",
1157
+ api: "bedrock-converse-stream",
1158
+ provider: "amazon-bedrock",
1159
+ baseUrl: "https://bedrock-runtime.us-east-1.amazonaws.com",
1160
+ reasoning: false,
1161
+ input: ["text"],
1162
+ cost: {
1163
+ input: 0.07,
1164
+ output: 0.3,
1165
+ cacheRead: 0,
1166
+ cacheWrite: 0,
1167
+ },
1168
+ contextWindow: 128000,
1169
+ maxTokens: 16384,
1170
+ },
1101
1171
  "openai.gpt-oss-20b-1:0": {
1102
1172
  id: "openai.gpt-oss-20b-1:0",
1103
1173
  name: "gpt-oss-20b",
@@ -5919,11 +5989,11 @@ export const MODELS = {
5919
5989
  api: "mistral-conversations",
5920
5990
  provider: "mistral",
5921
5991
  baseUrl: "https://api.mistral.ai",
5922
- reasoning: true,
5992
+ reasoning: false,
5923
5993
  input: ["text", "image"],
5924
5994
  cost: {
5925
- input: 1.5,
5926
- output: 7.5,
5995
+ input: 0.4,
5996
+ output: 2,
5927
5997
  cacheRead: 0,
5928
5998
  cacheWrite: 0,
5929
5999
  },
@@ -8181,7 +8251,7 @@ export const MODELS = {
8181
8251
  cacheRead: 0.05,
8182
8252
  cacheWrite: 0.625,
8183
8253
  },
8184
- contextWindow: 262144,
8254
+ contextWindow: 1000000,
8185
8255
  maxTokens: 65536,
8186
8256
  },
8187
8257
  "qwen3.7-max": {
@@ -8215,7 +8285,7 @@ export const MODELS = {
8215
8285
  cacheRead: 0.04,
8216
8286
  cacheWrite: 0.5,
8217
8287
  },
8218
- contextWindow: 262144,
8288
+ contextWindow: 1000000,
8219
8289
  maxTokens: 65536,
8220
8290
  },
8221
8291
  },
@@ -9395,7 +9465,7 @@ export const MODELS = {
9395
9465
  input: ["text"],
9396
9466
  cost: {
9397
9467
  input: 0.02,
9398
- output: 0.049999999999999996,
9468
+ output: 0.03,
9399
9469
  cacheRead: 0,
9400
9470
  cacheWrite: 0,
9401
9471
  },
@@ -11369,7 +11439,7 @@ export const MODELS = {
11369
11439
  cacheWrite: 0,
11370
11440
  },
11371
11441
  contextWindow: 131072,
11372
- maxTokens: 20000,
11442
+ maxTokens: 16384,
11373
11443
  },
11374
11444
  "qwen/qwen3-30b-a3b-instruct-2507": {
11375
11445
  id: "qwen/qwen3-30b-a3b-instruct-2507",
@@ -12784,7 +12854,7 @@ export const MODELS = {
12784
12854
  },
12785
12855
  "deepseek-ai/DeepSeek-V3": {
12786
12856
  id: "deepseek-ai/DeepSeek-V3",
12787
- name: "DeepSeek V3",
12857
+ name: "DeepSeek-V3",
12788
12858
  api: "openai-completions",
12789
12859
  provider: "together",
12790
12860
  baseUrl: "https://api.together.ai/v1",
@@ -12932,6 +13002,25 @@ export const MODELS = {
12932
13002
  contextWindow: 262144,
12933
13003
  maxTokens: 131000,
12934
13004
  },
13005
+ "nvidia/nemotron-3-ultra-550b-a55b": {
13006
+ id: "nvidia/nemotron-3-ultra-550b-a55b",
13007
+ name: "Nemotron 3 Ultra 550B A55B",
13008
+ api: "openai-completions",
13009
+ provider: "together",
13010
+ baseUrl: "https://api.together.ai/v1",
13011
+ compat: { "supportsStore": false, "supportsDeveloperRole": false, "supportsReasoningEffort": false, "maxTokensField": "max_tokens", "supportsStrictMode": false, "supportsLongCacheRetention": false, "thinkingFormat": "together" },
13012
+ reasoning: true,
13013
+ thinkingLevelMap: { "minimal": null, "low": null, "medium": null },
13014
+ input: ["text"],
13015
+ cost: {
13016
+ input: 0.6,
13017
+ output: 3.6,
13018
+ cacheRead: 0.2,
13019
+ cacheWrite: 0,
13020
+ },
13021
+ contextWindow: 512300,
13022
+ maxTokens: 512300,
13023
+ },
12935
13024
  "openai/gpt-oss-120b": {
12936
13025
  id: "openai/gpt-oss-120b",
12937
13026
  name: "GPT OSS 120B",
@@ -14636,12 +14725,12 @@ export const MODELS = {
14636
14725
  reasoning: true,
14637
14726
  input: ["text"],
14638
14727
  cost: {
14639
- input: 0.5,
14640
- output: 2.5,
14641
- cacheRead: 0.15,
14728
+ input: 0.6,
14729
+ output: 2.4,
14730
+ cacheRead: 0.12,
14642
14731
  cacheWrite: 0,
14643
14732
  },
14644
- contextWindow: 262144,
14733
+ contextWindow: 1000000,
14645
14734
  maxTokens: 65000,
14646
14735
  },
14647
14736
  "nvidia/nemotron-nano-12b-v2-vl": {