@earendil-works/pi-ai 0.79.8 → 0.79.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -3927,11 +3927,12 @@ export const MODELS = {
3927
3927
  "accounts/fireworks/models/glm-5p2": {
3928
3928
  id: "accounts/fireworks/models/glm-5p2",
3929
3929
  name: "GLM 5.2",
3930
- api: "anthropic-messages",
3930
+ api: "openai-completions",
3931
3931
  provider: "fireworks",
3932
- baseUrl: "https://api.fireworks.ai/inference",
3933
- compat: { "sendSessionAffinityHeaders": true, "supportsEagerToolInputStreaming": false, "supportsCacheControlOnTools": false, "supportsLongCacheRetention": false },
3932
+ baseUrl: "https://api.fireworks.ai/inference/v1",
3933
+ compat: { "supportsStore": false, "supportsDeveloperRole": false },
3934
3934
  reasoning: true,
3935
+ thinkingLevelMap: { "off": "none", "minimal": null, "low": "high", "medium": "high", "xhigh": "max" },
3935
3936
  input: ["text"],
3936
3937
  cost: {
3937
3938
  input: 1.4,
@@ -4848,42 +4849,6 @@ export const MODELS = {
4848
4849
  contextWindow: 262144,
4849
4850
  maxTokens: 32768,
4850
4851
  },
4851
- "gemma-4-E2B-it": {
4852
- id: "gemma-4-E2B-it",
4853
- name: "Gemma 4 E2B IT",
4854
- api: "google-generative-ai",
4855
- provider: "google",
4856
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4857
- reasoning: true,
4858
- thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4859
- input: ["text", "image"],
4860
- cost: {
4861
- input: 0,
4862
- output: 0,
4863
- cacheRead: 0,
4864
- cacheWrite: 0,
4865
- },
4866
- contextWindow: 131072,
4867
- maxTokens: 8192,
4868
- },
4869
- "gemma-4-E4B-it": {
4870
- id: "gemma-4-E4B-it",
4871
- name: "Gemma 4 E4B IT",
4872
- api: "google-generative-ai",
4873
- provider: "google",
4874
- baseUrl: "https://generativelanguage.googleapis.com/v1beta",
4875
- reasoning: true,
4876
- thinkingLevelMap: { "off": null, "minimal": "MINIMAL", "low": null, "medium": null, "high": "HIGH" },
4877
- input: ["text", "image"],
4878
- cost: {
4879
- input: 0,
4880
- output: 0,
4881
- cacheRead: 0,
4882
- cacheWrite: 0,
4883
- },
4884
- contextWindow: 131072,
4885
- maxTokens: 8192,
4886
- },
4887
4852
  },
4888
4853
  "google-vertex": {
4889
4854
  "gemini-2.5-flash": {
@@ -8917,23 +8882,6 @@ export const MODELS = {
8917
8882
  contextWindow: 200000,
8918
8883
  maxTokens: 4096,
8919
8884
  },
8920
- "anthropic/claude-3.5-haiku": {
8921
- id: "anthropic/claude-3.5-haiku",
8922
- name: "Anthropic: Claude 3.5 Haiku",
8923
- api: "openai-completions",
8924
- provider: "openrouter",
8925
- baseUrl: "https://openrouter.ai/api/v1",
8926
- reasoning: false,
8927
- input: ["text", "image"],
8928
- cost: {
8929
- input: 0.8,
8930
- output: 4,
8931
- cacheRead: 0.08,
8932
- cacheWrite: 1,
8933
- },
8934
- contextWindow: 200000,
8935
- maxTokens: 8192,
8936
- },
8937
8885
  "anthropic/claude-fable-5": {
8938
8886
  id: "anthropic/claude-fable-5",
8939
8887
  name: "Anthropic: Claude Fable 5",
@@ -9187,13 +9135,13 @@ export const MODELS = {
9187
9135
  reasoning: true,
9188
9136
  input: ["text"],
9189
9137
  cost: {
9190
- input: 0.22,
9191
- output: 0.85,
9138
+ input: 0.25,
9139
+ output: 0.8,
9192
9140
  cacheRead: 0.06,
9193
9141
  cacheWrite: 0,
9194
9142
  },
9195
9143
  contextWindow: 262144,
9196
- maxTokens: 262144,
9144
+ maxTokens: 80000,
9197
9145
  },
9198
9146
  "arcee-ai/trinity-mini": {
9199
9147
  id: "arcee-ai/trinity-mini",
@@ -10570,9 +10518,9 @@ export const MODELS = {
10570
10518
  reasoning: true,
10571
10519
  input: ["text", "image"],
10572
10520
  cost: {
10573
- input: 0.67,
10574
- output: 3.5,
10575
- cacheRead: 0.2,
10521
+ input: 0.66,
10522
+ output: 3.41,
10523
+ cacheRead: 0.144,
10576
10524
  cacheWrite: 0,
10577
10525
  },
10578
10526
  contextWindow: 262144,
@@ -10587,13 +10535,13 @@ export const MODELS = {
10587
10535
  reasoning: true,
10588
10536
  input: ["text", "image"],
10589
10537
  cost: {
10590
- input: 0.74,
10591
- output: 3.5,
10592
- cacheRead: 0.15,
10538
+ input: 0.612,
10539
+ output: 3.069,
10540
+ cacheRead: 0.1296,
10593
10541
  cacheWrite: 0,
10594
10542
  },
10595
10543
  contextWindow: 262144,
10596
- maxTokens: 16384,
10544
+ maxTokens: 262144,
10597
10545
  },
10598
10546
  "nex-agi/nex-n2-pro:free": {
10599
10547
  id: "nex-agi/nex-n2-pro:free",
@@ -10610,7 +10558,7 @@ export const MODELS = {
10610
10558
  cacheWrite: 0,
10611
10559
  },
10612
10560
  contextWindow: 262144,
10613
- maxTokens: 262144,
10561
+ maxTokens: 256000,
10614
10562
  },
10615
10563
  "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
10616
10564
  id: "nvidia/llama-3.3-nemotron-super-49b-v1.5",
@@ -12758,13 +12706,13 @@ export const MODELS = {
12758
12706
  reasoning: true,
12759
12707
  input: ["text"],
12760
12708
  cost: {
12761
- input: 0.066,
12762
- output: 0.26,
12763
- cacheRead: 0.029,
12709
+ input: 0.063,
12710
+ output: 0.21,
12711
+ cacheRead: 0.021,
12764
12712
  cacheWrite: 0,
12765
12713
  },
12766
12714
  contextWindow: 262144,
12767
- maxTokens: 262144,
12715
+ maxTokens: 4096,
12768
12716
  },
12769
12717
  "thedrummer/rocinante-12b": {
12770
12718
  id: "thedrummer/rocinante-12b",
@@ -13066,11 +13014,11 @@ export const MODELS = {
13066
13014
  cost: {
13067
13015
  input: 0.98,
13068
13016
  output: 3.08,
13069
- cacheRead: 0.182,
13017
+ cacheRead: 0.49,
13070
13018
  cacheWrite: 0,
13071
13019
  },
13072
13020
  contextWindow: 202752,
13073
- maxTokens: 4096,
13021
+ maxTokens: 65535,
13074
13022
  },
13075
13023
  "z-ai/glm-5.2": {
13076
13024
  id: "z-ai/glm-5.2",
@@ -13079,15 +13027,16 @@ export const MODELS = {
13079
13027
  provider: "openrouter",
13080
13028
  baseUrl: "https://openrouter.ai/api/v1",
13081
13029
  reasoning: true,
13030
+ thinkingLevelMap: { "xhigh": "xhigh" },
13082
13031
  input: ["text"],
13083
13032
  cost: {
13084
- input: 1.2,
13085
- output: 4.1,
13086
- cacheRead: 0.2,
13033
+ input: 1,
13034
+ output: 4,
13035
+ cacheRead: 0.18,
13087
13036
  cacheWrite: 0,
13088
13037
  },
13089
13038
  contextWindow: 1048576,
13090
- maxTokens: 131072,
13039
+ maxTokens: 32768,
13091
13040
  },
13092
13041
  "~anthropic/claude-fable-latest": {
13093
13042
  id: "~anthropic/claude-fable-latest",
@@ -13200,9 +13149,9 @@ export const MODELS = {
13200
13149
  reasoning: true,
13201
13150
  input: ["text", "image"],
13202
13151
  cost: {
13203
- input: 0.67,
13204
- output: 3.5,
13205
- cacheRead: 0.2,
13152
+ input: 0.66,
13153
+ output: 3.41,
13154
+ cacheRead: 0.144,
13206
13155
  cacheWrite: 0,
13207
13156
  },
13208
13157
  contextWindow: 262144,
@@ -15967,6 +15916,23 @@ export const MODELS = {
15967
15916
  contextWindow: 200000,
15968
15917
  maxTokens: 8000,
15969
15918
  },
15919
+ "sakana/fugu-ultra": {
15920
+ id: "sakana/fugu-ultra",
15921
+ name: "Fugu Ultra",
15922
+ api: "anthropic-messages",
15923
+ provider: "vercel-ai-gateway",
15924
+ baseUrl: "https://ai-gateway.vercel.sh",
15925
+ reasoning: true,
15926
+ input: ["text", "image"],
15927
+ cost: {
15928
+ input: 5,
15929
+ output: 30,
15930
+ cacheRead: 0.5,
15931
+ cacheWrite: 0,
15932
+ },
15933
+ contextWindow: 1000000,
15934
+ maxTokens: 1000000,
15935
+ },
15970
15936
  "stepfun/step-3.5-flash": {
15971
15937
  id: "stepfun/step-3.5-flash",
15972
15938
  name: "StepFun 3.5 Flash",
@@ -15978,8 +15944,8 @@ export const MODELS = {
15978
15944
  cost: {
15979
15945
  input: 0.09,
15980
15946
  output: 0.3,
15981
- cacheRead: 0,
15982
- cacheWrite: 0.02,
15947
+ cacheRead: 0.02,
15948
+ cacheWrite: 0,
15983
15949
  },
15984
15950
  contextWindow: 262114,
15985
15951
  maxTokens: 262114,