@earendil-works/pi-ai 0.79.8 → 0.79.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -3927,11 +3927,12 @@ export const MODELS = {
3927
3927
  "accounts/fireworks/models/glm-5p2": {
3928
3928
  id: "accounts/fireworks/models/glm-5p2",
3929
3929
  name: "GLM 5.2",
3930
- api: "anthropic-messages",
3930
+ api: "openai-completions",
3931
3931
  provider: "fireworks",
3932
- baseUrl: "https://api.fireworks.ai/inference",
3933
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3932
+ baseUrl: "https://api.fireworks.ai/inference/v1",
3933
+ compat: { "supportsStore": false, "supportsDeveloperRole": false },
3934
3934
  reasoning: true,
3935
+ thinkingLevelMap: { "off": "none", "minimal": null, "low": "high", "medium": "high", "xhigh": "max" },
3935
3936
  input: ["text"],
3936
3937
  cost: {
3937
3938
  input: 1.4,
@@ -4848,42 +4849,6 @@ export const MODELS = {
4848
4849
  contextWindow: 262144,
4849
4850
  maxTokens: 32768,
4850
4851
  },
4851
- "gemma-4-E2B-it": {
4852
- id: "gemma-4-E2B-it",
4853
- name: "Gemma 4 E2B IT",
4854
- api: "google-generative-ai",
4855
- provider: "google",
4856
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4857
- reasoning: true,
4858
- thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4859
- input: ["text", "image"],
4860
- cost: {
4861
- input: 0,
4862
- output: 0,
4863
- cacheRead: 0,
4864
- cacheWrite: 0,
4865
- },
4866
- contextWindow: 131072,
4867
- maxTokens: 8192,
4868
- },
4869
- "gemma-4-E4B-it": {
4870
- id: "gemma-4-E4B-it",
4871
- name: "Gemma 4 E4B IT",
4872
- api: "google-generative-ai",
4873
- provider: "google",
4874
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4875
- reasoning: true,
4876
- thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4877
- input: ["text", "image"],
4878
- cost: {
4879
- input: 0,
4880
- output: 0,
4881
- cacheRead: 0,
4882
- cacheWrite: 0,
4883
- },
4884
- contextWindow: 131072,
4885
- maxTokens: 8192,
4886
- },
4887
4852
  },
4888
4853
  "google-vertex": {
4889
4854
  "gemini-2.5-flash": {
@@ -9187,13 +9152,13 @@ export const MODELS = {
9187
9152
  reasoning: true,
9188
9153
  input: ["text"],
9189
9154
  cost: {
9190
- input: 0.22,
9191
- output: 0.85,
9155
+ input: 0.25,
9156
+ output: 0.8,
9192
9157
  cacheRead: 0.06,
9193
9158
  cacheWrite: 0,
9194
9159
  },
9195
9160
  contextWindow: 262144,
9196
- maxTokens: 262144,
9161
+ maxTokens: 80000,
9197
9162
  },
9198
9163
  "arcee-ai/trinity-mini": {
9199
9164
  id: "arcee-ai/trinity-mini",
@@ -9689,7 +9654,7 @@ export const MODELS = {
9689
9654
  cacheRead: 0.2,
9690
9655
  cacheWrite: 0.375,
9691
9656
  },
9692
- contextWindow: 65536,
9657
+ contextWindow: 131072,
9693
9658
  maxTokens: 32768,
9694
9659
  },
9695
9660
  "google/gemini-3.1-flash-lite": {
@@ -9877,7 +9842,7 @@ export const MODELS = {
9877
9842
  cacheWrite: 0,
9878
9843
  },
9879
9844
  contextWindow: 262144,
9880
- maxTokens: 8192,
9845
+ maxTokens: 32768,
9881
9846
  },
9882
9847
  "ibm-granite/granite-4.1-8b": {
9883
9848
  id: "ibm-granite/granite-4.1-8b",
@@ -9979,8 +9944,8 @@ export const MODELS = {
9979
9944
  cacheRead: 0.06,
9980
9945
  cacheWrite: 0,
9981
9946
  },
9982
- contextWindow: 256000,
9983
- maxTokens: 80000,
9947
+ contextWindow: 262144,
9948
+ maxTokens: 144000,
9984
9949
  },
9985
9950
  "liquid/lfm-2.5-1.2b-thinking:free": {
9986
9951
  id: "liquid/lfm-2.5-1.2b-thinking:free",
@@ -10201,7 +10166,7 @@ export const MODELS = {
10201
10166
  cacheWrite: 0,
10202
10167
  },
10203
10168
  contextWindow: 1048576,
10204
- maxTokens: 512000,
10169
+ maxTokens: 4096,
10205
10170
  },
10206
10171
  "mistralai/codestral-2508": {
10207
10172
  id: "mistralai/codestral-2508",
@@ -10537,7 +10502,7 @@ export const MODELS = {
10537
10502
  cost: {
10538
10503
  input: 0.6,
10539
10504
  output: 2.5,
10540
- cacheRead: 0,
10505
+ cacheRead: 0.6,
10541
10506
  cacheWrite: 0,
10542
10507
  },
10543
10508
  contextWindow: 262144,
@@ -10570,13 +10535,13 @@ export const MODELS = {
10570
10535
  reasoning: true,
10571
10536
  input: ["text", "image"],
10572
10537
  cost: {
10573
- input: 0.67,
10538
+ input: 0.66,
10574
10539
  output: 3.5,
10575
- cacheRead: 0.2,
10540
+ cacheRead: 0.33,
10576
10541
  cacheWrite: 0,
10577
10542
  },
10578
10543
  contextWindow: 262144,
10579
- maxTokens: 262144,
10544
+ maxTokens: 262142,
10580
10545
  },
10581
10546
  "moonshotai/kimi-k2.7-code": {
10582
10547
  id: "moonshotai/kimi-k2.7-code",
@@ -10587,13 +10552,13 @@ export const MODELS = {
10587
10552
  reasoning: true,
10588
10553
  input: ["text", "image"],
10589
10554
  cost: {
10590
- input: 0.74,
10591
- output: 3.5,
10592
- cacheRead: 0.15,
10555
+ input: 0.612,
10556
+ output: 3.069,
10557
+ cacheRead: 0.1296,
10593
10558
  cacheWrite: 0,
10594
10559
  },
10595
10560
  contextWindow: 262144,
10596
- maxTokens: 16384,
10561
+ maxTokens: 262144,
10597
10562
  },
10598
10563
  "nex-agi/nex-n2-pro:free": {
10599
10564
  id: "nex-agi/nex-n2-pro:free",
@@ -10916,7 +10881,7 @@ export const MODELS = {
10916
10881
  cacheWrite: 0,
10917
10882
  },
10918
10883
  contextWindow: 1047576,
10919
- maxTokens: 32768,
10884
+ maxTokens: 4096,
10920
10885
  },
10921
10886
  "openai/gpt-4.1-nano": {
10922
10887
  id: "openai/gpt-4.1-nano",
@@ -10946,7 +10911,7 @@ export const MODELS = {
10946
10911
  cost: {
10947
10912
  input: 2.5,
10948
10913
  output: 10,
10949
- cacheRead: 0,
10914
+ cacheRead: 1.25,
10950
10915
  cacheWrite: 0,
10951
10916
  },
10952
10917
  contextWindow: 128000,
@@ -11082,11 +11047,11 @@ export const MODELS = {
11082
11047
  cost: {
11083
11048
  input: 0.25,
11084
11049
  output: 2,
11085
- cacheRead: 0.025,
11050
+ cacheRead: 0.03,
11086
11051
  cacheWrite: 0,
11087
11052
  },
11088
11053
  contextWindow: 400000,
11089
- maxTokens: 128000,
11054
+ maxTokens: 4096,
11090
11055
  },
11091
11056
  "openai/gpt-5-nano": {
11092
11057
  id: "openai/gpt-5-nano",
@@ -11150,11 +11115,11 @@ export const MODELS = {
11150
11115
  cost: {
11151
11116
  input: 1.25,
11152
11117
  output: 10,
11153
- cacheRead: 0.13,
11118
+ cacheRead: 0.125,
11154
11119
  cacheWrite: 0,
11155
11120
  },
11156
11121
  contextWindow: 128000,
11157
- maxTokens: 32000,
11122
+ maxTokens: 16384,
11158
11123
  },
11159
11124
  "openai/gpt-5.1-codex": {
11160
11125
  id: "openai/gpt-5.1-codex",
@@ -11241,7 +11206,7 @@ export const MODELS = {
11241
11206
  cacheWrite: 0,
11242
11207
  },
11243
11208
  contextWindow: 128000,
11244
- maxTokens: 16384,
11209
+ maxTokens: 32000,
11245
11210
  },
11246
11211
  "openai/gpt-5.2-codex": {
11247
11212
  id: "openai/gpt-5.2-codex",
@@ -12454,11 +12419,11 @@ export const MODELS = {
12454
12419
  cost: {
12455
12420
  input: 0.14,
12456
12421
  output: 1,
12457
- cacheRead: 0,
12422
+ cacheRead: 0.05,
12458
12423
  cacheWrite: 0,
12459
12424
  },
12460
12425
  contextWindow: 262144,
12461
- maxTokens: 262144,
12426
+ maxTokens: 81920,
12462
12427
  },
12463
12428
  "qwen/qwen3.5-397b-a17b": {
12464
12429
  id: "qwen/qwen3.5-397b-a17b",
@@ -12491,8 +12456,8 @@ export const MODELS = {
12491
12456
  cacheRead: 0,
12492
12457
  cacheWrite: 0,
12493
12458
  },
12494
- contextWindow: 262144,
12495
- maxTokens: 262144,
12459
+ contextWindow: 256000,
12460
+ maxTokens: 32768,
12496
12461
  },
12497
12462
  "qwen/qwen3.5-flash-02-23": {
12498
12463
  id: "qwen/qwen3.5-flash-02-23",
@@ -12758,13 +12723,13 @@ export const MODELS = {
12758
12723
  reasoning: true,
12759
12724
  input: ["text"],
12760
12725
  cost: {
12761
- input: 0.066,
12762
- output: 0.26,
12763
- cacheRead: 0.029,
12726
+ input: 0.063,
12727
+ output: 0.21,
12728
+ cacheRead: 0.021,
12764
12729
  cacheWrite: 0,
12765
12730
  },
12766
12731
  contextWindow: 262144,
12767
- maxTokens: 262144,
12732
+ maxTokens: 4096,
12768
12733
  },
12769
12734
  "thedrummer/rocinante-12b": {
12770
12735
  id: "thedrummer/rocinante-12b",
@@ -13079,6 +13044,7 @@ export const MODELS = {
13079
13044
  provider: "openrouter",
13080
13045
  baseUrl: "https://openrouter.ai/api/v1",
13081
13046
  reasoning: true,
13047
+ thinkingLevelMap: { "xhigh": "xhigh" },
13082
13048
  input: ["text"],
13083
13049
  cost: {
13084
13050
  input: 1.2,
@@ -13200,13 +13166,13 @@ export const MODELS = {
13200
13166
  reasoning: true,
13201
13167
  input: ["text", "image"],
13202
13168
  cost: {
13203
- input: 0.67,
13169
+ input: 0.66,
13204
13170
  output: 3.5,
13205
- cacheRead: 0.2,
13171
+ cacheRead: 0.33,
13206
13172
  cacheWrite: 0,
13207
13173
  },
13208
13174
  contextWindow: 262144,
13209
- maxTokens: 262144,
13175
+ maxTokens: 262142,
13210
13176
  },
13211
13177
  "~openai/gpt-latest": {
13212
13178
  id: "~openai/gpt-latest",
@@ -15978,8 +15944,8 @@ export const MODELS = {
15978
15944
  cost: {
15979
15945
  input: 0.09,
15980
15946
  output: 0.3,
15981
- cacheRead: 0,
15982
- cacheWrite: 0.02,
15947
+ cacheRead: 0.02,
15948
+ cacheWrite: 0,
15983
15949
  },
15984
15950
  contextWindow: 262114,
15985
15951
  maxTokens: 262114,