@mariozechner/pi-ai 0.47.0 → 0.49.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (38) hide show
  1. package/dist/index.d.ts +0 -1
  2. package/dist/index.d.ts.map +1 -1
  3. package/dist/index.js +0 -1
  4. package/dist/index.js.map +1 -1
  5. package/dist/models.generated.d.ts +161 -8
  6. package/dist/models.generated.d.ts.map +1 -1
  7. package/dist/models.generated.js +189 -36
  8. package/dist/models.generated.js.map +1 -1
  9. package/dist/providers/amazon-bedrock.d.ts.map +1 -1
  10. package/dist/providers/amazon-bedrock.js +7 -3
  11. package/dist/providers/amazon-bedrock.js.map +1 -1
  12. package/dist/providers/anthropic.d.ts.map +1 -1
  13. package/dist/providers/anthropic.js +25 -11
  14. package/dist/providers/anthropic.js.map +1 -1
  15. package/dist/providers/google-shared.d.ts.map +1 -1
  16. package/dist/providers/google-shared.js +2 -1
  17. package/dist/providers/google-shared.js.map +1 -1
  18. package/dist/providers/openai-codex-responses.d.ts.map +1 -1
  19. package/dist/providers/openai-codex-responses.js +2 -25
  20. package/dist/providers/openai-codex-responses.js.map +1 -1
  21. package/dist/providers/openai-completions.d.ts.map +1 -1
  22. package/dist/providers/openai-completions.js +16 -9
  23. package/dist/providers/openai-completions.js.map +1 -1
  24. package/dist/providers/transform-messages.d.ts.map +1 -1
  25. package/dist/providers/transform-messages.js +12 -1
  26. package/dist/providers/transform-messages.js.map +1 -1
  27. package/dist/stream.d.ts.map +1 -1
  28. package/dist/stream.js +48 -19
  29. package/dist/stream.js.map +1 -1
  30. package/dist/utils/validation.d.ts +1 -1
  31. package/dist/utils/validation.d.ts.map +1 -1
  32. package/dist/utils/validation.js +7 -4
  33. package/dist/utils/validation.js.map +1 -1
  34. package/package.json +1 -1
  35. package/dist/constants.d.ts +0 -6
  36. package/dist/constants.d.ts.map +0 -1
  37. package/dist/constants.js +0 -14
  38. package/dist/constants.js.map +0 -1
@@ -4983,13 +4983,13 @@ export const MODELS = {
4983
4983
  reasoning: true,
4984
4984
  input: ["text"],
4985
4985
  cost: {
4986
- input: 0.44999999999999996,
4987
- output: 2.1500000000000004,
4986
+ input: 0.39999999999999997,
4987
+ output: 1.75,
4988
4988
  cacheRead: 0,
4989
4989
  cacheWrite: 0,
4990
4990
  },
4991
- contextWindow: 131072,
4992
- maxTokens: 32768,
4991
+ contextWindow: 163840,
4992
+ maxTokens: 65536,
4993
4993
  },
4994
4994
  "deepseek/deepseek-r1-distill-llama-70b": {
4995
4995
  id: "deepseek/deepseek-r1-distill-llama-70b",
@@ -5088,7 +5088,7 @@ export const MODELS = {
5088
5088
  input: 0.09999999999999999,
5089
5089
  output: 0.39999999999999997,
5090
5090
  cacheRead: 0.024999999999999998,
5091
- cacheWrite: 0.18330000000000002,
5091
+ cacheWrite: 0.0833,
5092
5092
  },
5093
5093
  contextWindow: 1048576,
5094
5094
  maxTokens: 8192,
@@ -5139,7 +5139,7 @@ export const MODELS = {
5139
5139
  input: 0.3,
5140
5140
  output: 2.5,
5141
5141
  cacheRead: 0.03,
5142
- cacheWrite: 0.3833,
5142
+ cacheWrite: 0.08333333333333334,
5143
5143
  },
5144
5144
  contextWindow: 1048576,
5145
5145
  maxTokens: 65535,
@@ -5156,7 +5156,7 @@ export const MODELS = {
5156
5156
  input: 0.09999999999999999,
5157
5157
  output: 0.39999999999999997,
5158
5158
  cacheRead: 0.01,
5159
- cacheWrite: 0.18330000000000002,
5159
+ cacheWrite: 0.0833,
5160
5160
  },
5161
5161
  contextWindow: 1048576,
5162
5162
  maxTokens: 65535,
@@ -5173,7 +5173,7 @@ export const MODELS = {
5173
5173
  input: 0.09999999999999999,
5174
5174
  output: 0.39999999999999997,
5175
5175
  cacheRead: 0.01,
5176
- cacheWrite: 1,
5176
+ cacheWrite: 0.0833,
5177
5177
  },
5178
5178
  contextWindow: 1048576,
5179
5179
  maxTokens: 65536,
@@ -5190,7 +5190,7 @@ export const MODELS = {
5190
5190
  input: 0.3,
5191
5191
  output: 2.5,
5192
5192
  cacheRead: 0.075,
5193
- cacheWrite: 0.3833,
5193
+ cacheWrite: 0.0833,
5194
5194
  },
5195
5195
  contextWindow: 1048576,
5196
5196
  maxTokens: 65535,
@@ -5207,7 +5207,7 @@ export const MODELS = {
5207
5207
  input: 1.25,
5208
5208
  output: 10,
5209
5209
  cacheRead: 0.125,
5210
- cacheWrite: 1.625,
5210
+ cacheWrite: 0.375,
5211
5211
  },
5212
5212
  contextWindow: 1048576,
5213
5213
  maxTokens: 65536,
@@ -5224,7 +5224,7 @@ export const MODELS = {
5224
5224
  input: 1.25,
5225
5225
  output: 10,
5226
5226
  cacheRead: 0.31,
5227
- cacheWrite: 1.625,
5227
+ cacheWrite: 0.375,
5228
5228
  },
5229
5229
  contextWindow: 1048576,
5230
5230
  maxTokens: 65536,
@@ -5241,7 +5241,7 @@ export const MODELS = {
5241
5241
  input: 1.25,
5242
5242
  output: 10,
5243
5243
  cacheRead: 0.31,
5244
- cacheWrite: 1.625,
5244
+ cacheWrite: 0.375,
5245
5245
  },
5246
5246
  contextWindow: 1048576,
5247
5247
  maxTokens: 65535,
@@ -5275,7 +5275,7 @@ export const MODELS = {
5275
5275
  input: 2,
5276
5276
  output: 12,
5277
5277
  cacheRead: 0.19999999999999998,
5278
- cacheWrite: 2.375,
5278
+ cacheWrite: 0.375,
5279
5279
  },
5280
5280
  contextWindow: 1048576,
5281
5281
  maxTokens: 65536,
@@ -7201,6 +7201,108 @@ export const MODELS = {
7201
7201
  contextWindow: 32768,
7202
7202
  maxTokens: 4096,
7203
7203
  },
7204
+ "qwen/qwen-max": {
7205
+ id: "qwen/qwen-max",
7206
+ name: "Qwen: Qwen-Max ",
7207
+ api: "openai-completions",
7208
+ provider: "openrouter",
7209
+ baseUrl: "https://openrouter.ai/api/v1",
7210
+ reasoning: false,
7211
+ input: ["text"],
7212
+ cost: {
7213
+ input: 1.5999999999999999,
7214
+ output: 6.3999999999999995,
7215
+ cacheRead: 0.64,
7216
+ cacheWrite: 0,
7217
+ },
7218
+ contextWindow: 32768,
7219
+ maxTokens: 8192,
7220
+ },
7221
+ "qwen/qwen-plus": {
7222
+ id: "qwen/qwen-plus",
7223
+ name: "Qwen: Qwen-Plus",
7224
+ api: "openai-completions",
7225
+ provider: "openrouter",
7226
+ baseUrl: "https://openrouter.ai/api/v1",
7227
+ reasoning: false,
7228
+ input: ["text"],
7229
+ cost: {
7230
+ input: 0.39999999999999997,
7231
+ output: 1.2,
7232
+ cacheRead: 0.16,
7233
+ cacheWrite: 0,
7234
+ },
7235
+ contextWindow: 131072,
7236
+ maxTokens: 8192,
7237
+ },
7238
+ "qwen/qwen-plus-2025-07-28": {
7239
+ id: "qwen/qwen-plus-2025-07-28",
7240
+ name: "Qwen: Qwen Plus 0728",
7241
+ api: "openai-completions",
7242
+ provider: "openrouter",
7243
+ baseUrl: "https://openrouter.ai/api/v1",
7244
+ reasoning: false,
7245
+ input: ["text"],
7246
+ cost: {
7247
+ input: 0.39999999999999997,
7248
+ output: 1.2,
7249
+ cacheRead: 0,
7250
+ cacheWrite: 0,
7251
+ },
7252
+ contextWindow: 1000000,
7253
+ maxTokens: 32768,
7254
+ },
7255
+ "qwen/qwen-plus-2025-07-28:thinking": {
7256
+ id: "qwen/qwen-plus-2025-07-28:thinking",
7257
+ name: "Qwen: Qwen Plus 0728 (thinking)",
7258
+ api: "openai-completions",
7259
+ provider: "openrouter",
7260
+ baseUrl: "https://openrouter.ai/api/v1",
7261
+ reasoning: true,
7262
+ input: ["text"],
7263
+ cost: {
7264
+ input: 0.39999999999999997,
7265
+ output: 4,
7266
+ cacheRead: 0,
7267
+ cacheWrite: 0,
7268
+ },
7269
+ contextWindow: 1000000,
7270
+ maxTokens: 32768,
7271
+ },
7272
+ "qwen/qwen-turbo": {
7273
+ id: "qwen/qwen-turbo",
7274
+ name: "Qwen: Qwen-Turbo",
7275
+ api: "openai-completions",
7276
+ provider: "openrouter",
7277
+ baseUrl: "https://openrouter.ai/api/v1",
7278
+ reasoning: false,
7279
+ input: ["text"],
7280
+ cost: {
7281
+ input: 0.049999999999999996,
7282
+ output: 0.19999999999999998,
7283
+ cacheRead: 0.02,
7284
+ cacheWrite: 0,
7285
+ },
7286
+ contextWindow: 1000000,
7287
+ maxTokens: 8192,
7288
+ },
7289
+ "qwen/qwen-vl-max": {
7290
+ id: "qwen/qwen-vl-max",
7291
+ name: "Qwen: Qwen VL Max",
7292
+ api: "openai-completions",
7293
+ provider: "openrouter",
7294
+ baseUrl: "https://openrouter.ai/api/v1",
7295
+ reasoning: false,
7296
+ input: ["text", "image"],
7297
+ cost: {
7298
+ input: 0.7999999999999999,
7299
+ output: 3.1999999999999997,
7300
+ cacheRead: 0,
7301
+ cacheWrite: 0,
7302
+ },
7303
+ contextWindow: 131072,
7304
+ maxTokens: 8192,
7305
+ },
7204
7306
  "qwen/qwen3-14b": {
7205
7307
  id: "qwen/qwen3-14b",
7206
7308
  name: "Qwen: Qwen3 14B",
@@ -7405,6 +7507,40 @@ export const MODELS = {
7405
7507
  contextWindow: 160000,
7406
7508
  maxTokens: 32768,
7407
7509
  },
7510
+ "qwen/qwen3-coder-flash": {
7511
+ id: "qwen/qwen3-coder-flash",
7512
+ name: "Qwen: Qwen3 Coder Flash",
7513
+ api: "openai-completions",
7514
+ provider: "openrouter",
7515
+ baseUrl: "https://openrouter.ai/api/v1",
7516
+ reasoning: false,
7517
+ input: ["text"],
7518
+ cost: {
7519
+ input: 0.3,
7520
+ output: 1.5,
7521
+ cacheRead: 0.08,
7522
+ cacheWrite: 0,
7523
+ },
7524
+ contextWindow: 128000,
7525
+ maxTokens: 65536,
7526
+ },
7527
+ "qwen/qwen3-coder-plus": {
7528
+ id: "qwen/qwen3-coder-plus",
7529
+ name: "Qwen: Qwen3 Coder Plus",
7530
+ api: "openai-completions",
7531
+ provider: "openrouter",
7532
+ baseUrl: "https://openrouter.ai/api/v1",
7533
+ reasoning: false,
7534
+ input: ["text"],
7535
+ cost: {
7536
+ input: 1,
7537
+ output: 5,
7538
+ cacheRead: 0.09999999999999999,
7539
+ cacheWrite: 0,
7540
+ },
7541
+ contextWindow: 128000,
7542
+ maxTokens: 65536,
7543
+ },
7408
7544
  "qwen/qwen3-coder:exacto": {
7409
7545
  id: "qwen/qwen3-coder:exacto",
7410
7546
  name: "Qwen: Qwen3 Coder 480B A35B (exacto)",
@@ -7439,6 +7575,23 @@ export const MODELS = {
7439
7575
  contextWindow: 262000,
7440
7576
  maxTokens: 262000,
7441
7577
  },
7578
+ "qwen/qwen3-max": {
7579
+ id: "qwen/qwen3-max",
7580
+ name: "Qwen: Qwen3 Max",
7581
+ api: "openai-completions",
7582
+ provider: "openrouter",
7583
+ baseUrl: "https://openrouter.ai/api/v1",
7584
+ reasoning: false,
7585
+ input: ["text"],
7586
+ cost: {
7587
+ input: 1.2,
7588
+ output: 6,
7589
+ cacheRead: 0.24,
7590
+ cacheWrite: 0,
7591
+ },
7592
+ contextWindow: 256000,
7593
+ maxTokens: 32768,
7594
+ },
7442
7595
  "qwen/qwen3-next-80b-a3b-instruct": {
7443
7596
  id: "qwen/qwen3-next-80b-a3b-instruct",
7444
7597
  name: "Qwen: Qwen3 Next 80B A3B Instruct",
@@ -7487,8 +7640,8 @@ export const MODELS = {
7487
7640
  cacheRead: 0,
7488
7641
  cacheWrite: 0,
7489
7642
  },
7490
- contextWindow: 262144,
7491
- maxTokens: 262144,
7643
+ contextWindow: 128000,
7644
+ maxTokens: 4096,
7492
7645
  },
7493
7646
  "qwen/qwen3-vl-235b-a22b-instruct": {
7494
7647
  id: "qwen/qwen3-vl-235b-a22b-instruct",
@@ -7507,23 +7660,6 @@ export const MODELS = {
7507
7660
  contextWindow: 262144,
7508
7661
  maxTokens: 4096,
7509
7662
  },
7510
- "qwen/qwen3-vl-235b-a22b-thinking": {
7511
- id: "qwen/qwen3-vl-235b-a22b-thinking",
7512
- name: "Qwen: Qwen3 VL 235B A22B Thinking",
7513
- api: "openai-completions",
7514
- provider: "openrouter",
7515
- baseUrl: "https://openrouter.ai/api/v1",
7516
- reasoning: true,
7517
- input: ["text", "image"],
7518
- cost: {
7519
- input: 0.44999999999999996,
7520
- output: 3.5,
7521
- cacheRead: 0,
7522
- cacheWrite: 0,
7523
- },
7524
- contextWindow: 262144,
7525
- maxTokens: 262144,
7526
- },
7527
7663
  "qwen/qwen3-vl-30b-a3b-instruct": {
7528
7664
  id: "qwen/qwen3-vl-30b-a3b-instruct",
7529
7665
  name: "Qwen: Qwen3 VL 30B A3B Instruct",
@@ -7575,6 +7711,23 @@ export const MODELS = {
7575
7711
  contextWindow: 131072,
7576
7712
  maxTokens: 32768,
7577
7713
  },
7714
+ "qwen/qwen3-vl-8b-thinking": {
7715
+ id: "qwen/qwen3-vl-8b-thinking",
7716
+ name: "Qwen: Qwen3 VL 8B Thinking",
7717
+ api: "openai-completions",
7718
+ provider: "openrouter",
7719
+ baseUrl: "https://openrouter.ai/api/v1",
7720
+ reasoning: true,
7721
+ input: ["text", "image"],
7722
+ cost: {
7723
+ input: 0.18,
7724
+ output: 2.0999999999999996,
7725
+ cacheRead: 0,
7726
+ cacheWrite: 0,
7727
+ },
7728
+ contextWindow: 256000,
7729
+ maxTokens: 32768,
7730
+ },
7578
7731
  "qwen/qwq-32b": {
7579
7732
  id: "qwen/qwq-32b",
7580
7733
  name: "Qwen: QwQ 32B",
@@ -7890,13 +8043,13 @@ export const MODELS = {
7890
8043
  reasoning: true,
7891
8044
  input: ["text"],
7892
8045
  cost: {
7893
- input: 0.09999999999999999,
7894
- output: 0.3,
7895
- cacheRead: 0.02,
8046
+ input: 0.09,
8047
+ output: 0.29,
8048
+ cacheRead: 0,
7896
8049
  cacheWrite: 0,
7897
8050
  },
7898
8051
  contextWindow: 262144,
7899
- maxTokens: 32000,
8052
+ maxTokens: 4096,
7900
8053
  },
7901
8054
  "xiaomi/mimo-v2-flash:free": {
7902
8055
  id: "xiaomi/mimo-v2-flash:free",