@fleetagent/pi-ai 0.0.8 → 0.0.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -3892,6 +3892,24 @@ export const MODELS = {
3892
3892
  contextWindow: 202800,
3893
3893
  maxTokens: 131072,
3894
3894
  },
3895
+ "accounts/fireworks/routers/kimi-k2p6-fast": {
3896
+ id: "accounts/fireworks/routers/kimi-k2p6-fast",
3897
+ name: "Kimi K2.6 Fast",
3898
+ api: "anthropic-messages",
3899
+ provider: "fireworks",
3900
+ baseUrl: "https://api.fireworks.ai/inference",
3901
+ compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3902
+ reasoning: true,
3903
+ input: ["text", "image"],
3904
+ cost: {
3905
+ input: 2,
3906
+ output: 8,
3907
+ cacheRead: 0.3,
3908
+ cacheWrite: 0,
3909
+ },
3910
+ contextWindow: 262000,
3911
+ maxTokens: 262000,
3912
+ },
3895
3913
  "accounts/fireworks/routers/kimi-k2p6-turbo": {
3896
3914
  id: "accounts/fireworks/routers/kimi-k2p6-turbo",
3897
3915
  name: "Kimi K2.6 Turbo",
@@ -7973,23 +7991,6 @@ export const MODELS = {
7973
7991
  contextWindow: 204800,
7974
7992
  maxTokens: 131072,
7975
7993
  },
7976
- "minimax-m3-free": {
7977
- id: "minimax-m3-free",
7978
- name: "MiniMax M3 Free",
7979
- api: "anthropic-messages",
7980
- provider: "opencode",
7981
- baseUrl: "https://opencode.ai/zen",
7982
- reasoning: true,
7983
- input: ["text", "image"],
7984
- cost: {
7985
- input: 0,
7986
- output: 0,
7987
- cacheRead: 0,
7988
- cacheWrite: 0,
7989
- },
7990
- contextWindow: 200000,
7991
- maxTokens: 32000,
7992
- },
7993
7994
  "nemotron-3-ultra-free": {
7994
7995
  id: "nemotron-3-ultra-free",
7995
7996
  name: "Nemotron 3 Ultra Free",
@@ -8719,23 +8720,6 @@ export const MODELS = {
8719
8720
  contextWindow: 2000000,
8720
8721
  maxTokens: 30000,
8721
8722
  },
8722
- "baidu/ernie-4.5-vl-28b-a3b": {
8723
- id: "baidu/ernie-4.5-vl-28b-a3b",
8724
- name: "Baidu: ERNIE 4.5 VL 28B A3B",
8725
- api: "openai-completions",
8726
- provider: "openrouter",
8727
- baseUrl: "https://openrouter.ai/api/v1",
8728
- reasoning: true,
8729
- input: ["text", "image"],
8730
- cost: {
8731
- input: 0.14,
8732
- output: 0.56,
8733
- cacheRead: 0,
8734
- cacheWrite: 0,
8735
- },
8736
- contextWindow: 131072,
8737
- maxTokens: 8000,
8738
- },
8739
8723
  "bytedance-seed/seed-1.6": {
8740
8724
  id: "bytedance-seed/seed-1.6",
8741
8725
  name: "ByteDance Seed: Seed 1.6",
@@ -9242,8 +9226,8 @@ export const MODELS = {
9242
9226
  reasoning: false,
9243
9227
  input: ["text", "image"],
9244
9228
  cost: {
9245
- input: 0.04,
9246
- output: 0.13,
9229
+ input: 0.049999999999999996,
9230
+ output: 0.15,
9247
9231
  cacheRead: 0,
9248
9232
  cacheWrite: 0,
9249
9233
  },
@@ -9311,12 +9295,12 @@ export const MODELS = {
9311
9295
  input: ["text", "image"],
9312
9296
  cost: {
9313
9297
  input: 0.12,
9314
- output: 0.37,
9315
- cacheRead: 0,
9298
+ output: 0.36,
9299
+ cacheRead: 0.09,
9316
9300
  cacheWrite: 0,
9317
9301
  },
9318
9302
  contextWindow: 262144,
9319
- maxTokens: 16384,
9303
+ maxTokens: 8192,
9320
9304
  },
9321
9305
  "google/gemma-4-31b-it:free": {
9322
9306
  id: "google/gemma-4-31b-it:free",
@@ -9532,7 +9516,7 @@ export const MODELS = {
9532
9516
  reasoning: false,
9533
9517
  input: ["text", "image"],
9534
9518
  cost: {
9535
- input: 0.08,
9519
+ input: 0.09999999999999999,
9536
9520
  output: 0.3,
9537
9521
  cacheRead: 0,
9538
9522
  cacheWrite: 0,
@@ -9623,7 +9607,7 @@ export const MODELS = {
9623
9607
  cacheWrite: 0,
9624
9608
  },
9625
9609
  contextWindow: 204800,
9626
- maxTokens: 131072,
9610
+ maxTokens: 196608,
9627
9611
  },
9628
9612
  "minimax/minimax-m3": {
9629
9613
  id: "minimax/minimax-m3",
@@ -10061,7 +10045,7 @@ export const MODELS = {
10061
10045
  reasoning: true,
10062
10046
  input: ["text"],
10063
10047
  cost: {
10064
- input: 0.09999999999999999,
10048
+ input: 0.39999999999999997,
10065
10049
  output: 0.39999999999999997,
10066
10050
  cacheRead: 0,
10067
10051
  cacheWrite: 0,
@@ -10307,23 +10291,6 @@ export const MODELS = {
10307
10291
  contextWindow: 8191,
10308
10292
  maxTokens: 4096,
10309
10293
  },
10310
- "openai/gpt-4-1106-preview": {
10311
- id: "openai/gpt-4-1106-preview",
10312
- name: "OpenAI: GPT-4 Turbo (older v1106)",
10313
- api: "openai-completions",
10314
- provider: "openrouter",
10315
- baseUrl: "https://openrouter.ai/api/v1",
10316
- reasoning: false,
10317
- input: ["text"],
10318
- cost: {
10319
- input: 10,
10320
- output: 30,
10321
- cacheRead: 0,
10322
- cacheWrite: 0,
10323
- },
10324
- contextWindow: 128000,
10325
- maxTokens: 4096,
10326
- },
10327
10294
  "openai/gpt-4-turbo": {
10328
10295
  id: "openai/gpt-4-turbo",
10329
10296
  name: "OpenAI: GPT-4 Turbo",
@@ -11399,7 +11366,7 @@ export const MODELS = {
11399
11366
  reasoning: false,
11400
11367
  input: ["text"],
11401
11368
  cost: {
11402
- input: 0.071,
11369
+ input: 0.09,
11403
11370
  output: 0.09999999999999999,
11404
11371
  cacheRead: 0,
11405
11372
  cacheWrite: 0,
@@ -11433,8 +11400,8 @@ export const MODELS = {
11433
11400
  reasoning: true,
11434
11401
  input: ["text"],
11435
11402
  cost: {
11436
- input: 0.09,
11437
- output: 0.44999999999999996,
11403
+ input: 0.12,
11404
+ output: 0.5,
11438
11405
  cacheRead: 0,
11439
11406
  cacheWrite: 0,
11440
11407
  },
@@ -11892,13 +11859,13 @@ export const MODELS = {
11892
11859
  reasoning: true,
11893
11860
  input: ["text", "image"],
11894
11861
  cost: {
11895
- input: 0.04,
11862
+ input: 0.09999999999999999,
11896
11863
  output: 0.15,
11897
11864
  cacheRead: 0,
11898
11865
  cacheWrite: 0,
11899
11866
  },
11900
11867
  contextWindow: 262144,
11901
- maxTokens: 81920,
11868
+ maxTokens: 262144,
11902
11869
  },
11903
11870
  "qwen/qwen3.5-flash-02-23": {
11904
11871
  id: "qwen/qwen3.5-flash-02-23",
@@ -11960,13 +11927,13 @@ export const MODELS = {
11960
11927
  reasoning: true,
11961
11928
  input: ["text", "image"],
11962
11929
  cost: {
11963
- input: 0.29,
11964
- output: 3.1999999999999997,
11930
+ input: 0.28900000000000003,
11931
+ output: 2.4,
11965
11932
  cacheRead: 0,
11966
11933
  cacheWrite: 0,
11967
11934
  },
11968
11935
  contextWindow: 262144,
11969
- maxTokens: 262140,
11936
+ maxTokens: 131072,
11970
11937
  },
11971
11938
  "qwen/qwen3.6-35b-a3b": {
11972
11939
  id: "qwen/qwen3.6-35b-a3b",
@@ -12104,23 +12071,6 @@ export const MODELS = {
12104
12071
  contextWindow: 256000,
12105
12072
  maxTokens: 128000,
12106
12073
  },
12107
- "sao10k/l3-euryale-70b": {
12108
- id: "sao10k/l3-euryale-70b",
12109
- name: "Sao10k: Llama 3 Euryale 70B v2.1",
12110
- api: "openai-completions",
12111
- provider: "openrouter",
12112
- baseUrl: "https://openrouter.ai/api/v1",
12113
- reasoning: false,
12114
- input: ["text"],
12115
- cost: {
12116
- input: 1.48,
12117
- output: 1.48,
12118
- cacheRead: 0,
12119
- cacheWrite: 0,
12120
- },
12121
- contextWindow: 8192,
12122
- maxTokens: 8192,
12123
- },
12124
12074
  "sao10k/l3.1-euryale-70b": {
12125
12075
  id: "sao10k/l3.1-euryale-70b",
12126
12076
  name: "Sao10K: Llama 3.1 Euryale 70B v2.2",