@pydantic/genai-prices 0.0.67 → 0.0.68
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/cli.js +354 -27
- package/dist/index.cjs +5 -5
- package/dist/index.js +333 -6
- package/package.json +1 -1
package/dist/index.js
CHANGED
|
@@ -621,6 +621,51 @@ const G = [
|
|
|
621
621
|
}
|
|
622
622
|
]
|
|
623
623
|
},
|
|
624
|
+
{
|
|
625
|
+
id: "claude-sonnet-5",
|
|
626
|
+
name: "Claude Sonnet 5",
|
|
627
|
+
description: "Our most agentic Sonnet model, approaching Opus 4.8 capability at lower cost",
|
|
628
|
+
match: {
|
|
629
|
+
or: [
|
|
630
|
+
{
|
|
631
|
+
starts_with: "claude-sonnet-5"
|
|
632
|
+
},
|
|
633
|
+
{
|
|
634
|
+
starts_with: "claude-sonnet-5.0"
|
|
635
|
+
},
|
|
636
|
+
{
|
|
637
|
+
starts_with: "claude-5-sonnet"
|
|
638
|
+
},
|
|
639
|
+
{
|
|
640
|
+
starts_with: "claude-5.0-sonnet"
|
|
641
|
+
}
|
|
642
|
+
]
|
|
643
|
+
},
|
|
644
|
+
context_window: 1e6,
|
|
645
|
+
price_comments: "Flat pricing across full 1M context window (no tiered pricing). Introductory pricing ($2/$10 per MTok) applies through 2026-08-31; standard pricing ($3/$15) applies from 2026-09-01. Ref: https://www.anthropic.com/news/claude-sonnet-5",
|
|
646
|
+
prices: [
|
|
647
|
+
{
|
|
648
|
+
prices: {
|
|
649
|
+
input_mtok: 2,
|
|
650
|
+
cache_write_mtok: 2.5,
|
|
651
|
+
cache_read_mtok: 0.2,
|
|
652
|
+
output_mtok: 10
|
|
653
|
+
}
|
|
654
|
+
},
|
|
655
|
+
{
|
|
656
|
+
constraint: {
|
|
657
|
+
start_date: "2026-09-01",
|
|
658
|
+
type: "start_date"
|
|
659
|
+
},
|
|
660
|
+
prices: {
|
|
661
|
+
input_mtok: 3,
|
|
662
|
+
cache_write_mtok: 3.75,
|
|
663
|
+
cache_read_mtok: 0.3,
|
|
664
|
+
output_mtok: 15
|
|
665
|
+
}
|
|
666
|
+
}
|
|
667
|
+
]
|
|
668
|
+
},
|
|
624
669
|
{
|
|
625
670
|
id: "claude-v1",
|
|
626
671
|
description: "Retired, here to match price sources",
|
|
@@ -1058,6 +1103,35 @@ const G = [
|
|
|
1058
1103
|
}
|
|
1059
1104
|
}
|
|
1060
1105
|
},
|
|
1106
|
+
{
|
|
1107
|
+
id: "global.anthropic.claude-sonnet-5-v1:0",
|
|
1108
|
+
match: {
|
|
1109
|
+
contains: "global.anthropic.claude-sonnet-5"
|
|
1110
|
+
},
|
|
1111
|
+
price_comments: "Flat pricing across full 1M context window (no tiered pricing). Promotional launch pricing ($2/$10 per MTok) through 2026-08-31; standard ($3/$15) from 2026-09-01. Ref: https://aws.amazon.com/bedrock/pricing/",
|
|
1112
|
+
prices: [
|
|
1113
|
+
{
|
|
1114
|
+
prices: {
|
|
1115
|
+
input_mtok: 2,
|
|
1116
|
+
cache_write_mtok: 2.5,
|
|
1117
|
+
cache_read_mtok: 0.2,
|
|
1118
|
+
output_mtok: 10
|
|
1119
|
+
}
|
|
1120
|
+
},
|
|
1121
|
+
{
|
|
1122
|
+
constraint: {
|
|
1123
|
+
start_date: "2026-09-01",
|
|
1124
|
+
type: "start_date"
|
|
1125
|
+
},
|
|
1126
|
+
prices: {
|
|
1127
|
+
input_mtok: 3,
|
|
1128
|
+
cache_write_mtok: 3.75,
|
|
1129
|
+
cache_read_mtok: 0.3,
|
|
1130
|
+
output_mtok: 15
|
|
1131
|
+
}
|
|
1132
|
+
}
|
|
1133
|
+
]
|
|
1134
|
+
},
|
|
1061
1135
|
{
|
|
1062
1136
|
id: "google.gemma-3-12b-it",
|
|
1063
1137
|
name: "Gemma 3 12B IT",
|
|
@@ -1388,6 +1462,30 @@ const G = [
|
|
|
1388
1462
|
output_mtok: 0.65
|
|
1389
1463
|
}
|
|
1390
1464
|
},
|
|
1465
|
+
{
|
|
1466
|
+
id: "openai.gpt-5.4",
|
|
1467
|
+
name: "GPT-5.4",
|
|
1468
|
+
match: {
|
|
1469
|
+
equals: "openai.gpt-5.4"
|
|
1470
|
+
},
|
|
1471
|
+
prices: {
|
|
1472
|
+
input_mtok: 2.75,
|
|
1473
|
+
cache_read_mtok: 0.275,
|
|
1474
|
+
output_mtok: 16.5
|
|
1475
|
+
}
|
|
1476
|
+
},
|
|
1477
|
+
{
|
|
1478
|
+
id: "openai.gpt-5.5",
|
|
1479
|
+
name: "GPT-5.5",
|
|
1480
|
+
match: {
|
|
1481
|
+
equals: "openai.gpt-5.5"
|
|
1482
|
+
},
|
|
1483
|
+
prices: {
|
|
1484
|
+
input_mtok: 5.5,
|
|
1485
|
+
cache_read_mtok: 0.55,
|
|
1486
|
+
output_mtok: 33
|
|
1487
|
+
}
|
|
1488
|
+
},
|
|
1391
1489
|
{
|
|
1392
1490
|
id: "openai.gpt-oss-120b-1:0",
|
|
1393
1491
|
name: "gpt-oss-120b",
|
|
@@ -2015,6 +2113,60 @@ const G = [
|
|
|
2015
2113
|
]
|
|
2016
2114
|
}
|
|
2017
2115
|
}
|
|
2116
|
+
},
|
|
2117
|
+
{
|
|
2118
|
+
id: "regional.anthropic.claude-sonnet-5-v1:0",
|
|
2119
|
+
match: {
|
|
2120
|
+
or: [
|
|
2121
|
+
{
|
|
2122
|
+
starts_with: "anthropic.claude-sonnet-5"
|
|
2123
|
+
},
|
|
2124
|
+
{
|
|
2125
|
+
starts_with: "claude-sonnet-5"
|
|
2126
|
+
},
|
|
2127
|
+
{
|
|
2128
|
+
contains: "us.anthropic.claude-sonnet-5"
|
|
2129
|
+
},
|
|
2130
|
+
{
|
|
2131
|
+
contains: "au.anthropic.claude-sonnet-5"
|
|
2132
|
+
},
|
|
2133
|
+
{
|
|
2134
|
+
contains: "apac.anthropic.claude-sonnet-5"
|
|
2135
|
+
},
|
|
2136
|
+
{
|
|
2137
|
+
contains: "eu.anthropic.claude-sonnet-5"
|
|
2138
|
+
},
|
|
2139
|
+
{
|
|
2140
|
+
contains: "us-gov.anthropic.claude-sonnet-5"
|
|
2141
|
+
},
|
|
2142
|
+
{
|
|
2143
|
+
contains: "jp.anthropic.claude-sonnet-5"
|
|
2144
|
+
}
|
|
2145
|
+
]
|
|
2146
|
+
},
|
|
2147
|
+
price_comments: "Regional/cross-region endpoints carry a 10% premium over global (AWS published only the global promo rate; regional computed as global +10%, per the documented regional premium). Promotional launch pricing through 2026-08-31; standard from 2026-09-01. Ref: https://aws.amazon.com/bedrock/pricing/",
|
|
2148
|
+
prices: [
|
|
2149
|
+
{
|
|
2150
|
+
prices: {
|
|
2151
|
+
input_mtok: 2.2,
|
|
2152
|
+
cache_write_mtok: 2.75,
|
|
2153
|
+
cache_read_mtok: 0.22,
|
|
2154
|
+
output_mtok: 11
|
|
2155
|
+
}
|
|
2156
|
+
},
|
|
2157
|
+
{
|
|
2158
|
+
constraint: {
|
|
2159
|
+
start_date: "2026-09-01",
|
|
2160
|
+
type: "start_date"
|
|
2161
|
+
},
|
|
2162
|
+
prices: {
|
|
2163
|
+
input_mtok: 3.3,
|
|
2164
|
+
cache_write_mtok: 4.125,
|
|
2165
|
+
cache_read_mtok: 0.33,
|
|
2166
|
+
output_mtok: 16.5
|
|
2167
|
+
}
|
|
2168
|
+
}
|
|
2169
|
+
]
|
|
2018
2170
|
}
|
|
2019
2171
|
]
|
|
2020
2172
|
},
|
|
@@ -3307,6 +3459,20 @@ Compared to other leading proprietary and open-weights models Command A delivers
|
|
|
3307
3459
|
output_mtok: 4.4
|
|
3308
3460
|
}
|
|
3309
3461
|
},
|
|
3462
|
+
{
|
|
3463
|
+
id: "glm-5p2",
|
|
3464
|
+
name: "GLM-5.2",
|
|
3465
|
+
description: "GLM-5.2 introduces a robust 1M-token context and advanced, multi-effort coding capabilities to significantly enhance performance on long-horizon tasks. Features a new IndexShare architecture and improved MTP layer for greater efficiency. 743B parameter MoE model from Z.ai.",
|
|
3466
|
+
match: {
|
|
3467
|
+
equals: "accounts/fireworks/models/glm-5p2"
|
|
3468
|
+
},
|
|
3469
|
+
context_window: 104e4,
|
|
3470
|
+
prices: {
|
|
3471
|
+
input_mtok: 1.4,
|
|
3472
|
+
cache_read_mtok: 0.14,
|
|
3473
|
+
output_mtok: 4.4
|
|
3474
|
+
}
|
|
3475
|
+
},
|
|
3310
3476
|
{
|
|
3311
3477
|
id: "gpt-oss-120b",
|
|
3312
3478
|
name: "OpenAI gpt-oss-120b",
|
|
@@ -3361,6 +3527,20 @@ Compared to other leading proprietary and open-weights models Command A delivers
|
|
|
3361
3527
|
output_mtok: 4
|
|
3362
3528
|
}
|
|
3363
3529
|
},
|
|
3530
|
+
{
|
|
3531
|
+
id: "kimi-k2p7-code",
|
|
3532
|
+
name: "Kimi K2.7 Code",
|
|
3533
|
+
description: "Kimi K2.7 Code is a coding-focused agentic model built upon Kimi K2.6, delivering substantial improvements on real-world long-horizon coding tasks while reducing thinking tokens by roughly 30% compared to its predecessor.",
|
|
3534
|
+
match: {
|
|
3535
|
+
equals: "accounts/fireworks/models/kimi-k2p7-code"
|
|
3536
|
+
},
|
|
3537
|
+
context_window: 262144,
|
|
3538
|
+
prices: {
|
|
3539
|
+
input_mtok: 0.95,
|
|
3540
|
+
cache_read_mtok: 0.19,
|
|
3541
|
+
output_mtok: 4
|
|
3542
|
+
}
|
|
3543
|
+
},
|
|
3364
3544
|
{
|
|
3365
3545
|
id: "llama-v3p1-8b-instruct",
|
|
3366
3546
|
name: "Llama 3.1 8B Instruct",
|
|
@@ -3427,6 +3607,20 @@ Compared to other leading proprietary and open-weights models Command A delivers
|
|
|
3427
3607
|
output_mtok: 1.2
|
|
3428
3608
|
}
|
|
3429
3609
|
},
|
|
3610
|
+
{
|
|
3611
|
+
id: "nemotron-3-ultra-nvfp4",
|
|
3612
|
+
name: "NVIDIA Nemotron 3 Ultra NVFP4",
|
|
3613
|
+
description: "Frontier-scale LLM from NVIDIA using a hybrid Latent Mixture-of-Experts (LatentMoE) architecture with interleaved Mamba-2 and MoE layers plus select Attention layers. Features 55B active parameters out of 550B total and Multi-Token Prediction layers for faster generation, optimized for complex multi-step agents, long-context analysis, and high-accuracy reasoning over code, math, and science.",
|
|
3614
|
+
match: {
|
|
3615
|
+
equals: "accounts/fireworks/models/nemotron-3-ultra-nvfp4"
|
|
3616
|
+
},
|
|
3617
|
+
context_window: 262e3,
|
|
3618
|
+
prices: {
|
|
3619
|
+
input_mtok: 0.6,
|
|
3620
|
+
cache_read_mtok: 0.12,
|
|
3621
|
+
output_mtok: 2.4
|
|
3622
|
+
}
|
|
3623
|
+
},
|
|
3430
3624
|
{
|
|
3431
3625
|
id: "qwen2p5-vl-72b-instruct",
|
|
3432
3626
|
name: "Qwen2.5-VL 72B Instruct",
|
|
@@ -3465,6 +3659,20 @@ Compared to other leading proprietary and open-weights models Command A delivers
|
|
|
3465
3659
|
cache_read_mtok: 0.1,
|
|
3466
3660
|
output_mtok: 3
|
|
3467
3661
|
}
|
|
3662
|
+
},
|
|
3663
|
+
{
|
|
3664
|
+
id: "qwen3p7-plus",
|
|
3665
|
+
name: "Qwen3.7 Plus",
|
|
3666
|
+
description: "Qwen3.7 Plus is Alibaba's latest flagship closed model, available exclusively through Fireworks AI outside of Alibaba's own infrastructure.",
|
|
3667
|
+
match: {
|
|
3668
|
+
equals: "accounts/fireworks/models/qwen3p7-plus"
|
|
3669
|
+
},
|
|
3670
|
+
context_window: 262144,
|
|
3671
|
+
prices: {
|
|
3672
|
+
input_mtok: 0.4,
|
|
3673
|
+
cache_read_mtok: 0.08,
|
|
3674
|
+
output_mtok: 1.6
|
|
3675
|
+
}
|
|
3468
3676
|
}
|
|
3469
3677
|
]
|
|
3470
3678
|
},
|
|
@@ -8876,6 +9084,65 @@ Compared to other leading proprietary and open-weights models Command A delivers
|
|
|
8876
9084
|
]
|
|
8877
9085
|
},
|
|
8878
9086
|
extractors: [
|
|
9087
|
+
{
|
|
9088
|
+
api_flavor: "default",
|
|
9089
|
+
root: "usage",
|
|
9090
|
+
model_path: "model",
|
|
9091
|
+
mappings: [
|
|
9092
|
+
{
|
|
9093
|
+
path: "input_tokens",
|
|
9094
|
+
dest: "input_tokens",
|
|
9095
|
+
required: !0
|
|
9096
|
+
},
|
|
9097
|
+
{
|
|
9098
|
+
path: "cache_creation_input_tokens",
|
|
9099
|
+
dest: "input_tokens",
|
|
9100
|
+
required: !1
|
|
9101
|
+
},
|
|
9102
|
+
{
|
|
9103
|
+
path: "cache_read_input_tokens",
|
|
9104
|
+
dest: "input_tokens",
|
|
9105
|
+
required: !1
|
|
9106
|
+
},
|
|
9107
|
+
{
|
|
9108
|
+
path: "cache_creation_input_tokens",
|
|
9109
|
+
dest: "cache_write_tokens",
|
|
9110
|
+
required: !1
|
|
9111
|
+
},
|
|
9112
|
+
{
|
|
9113
|
+
path: "cache_read_input_tokens",
|
|
9114
|
+
dest: "cache_read_tokens",
|
|
9115
|
+
required: !1
|
|
9116
|
+
},
|
|
9117
|
+
{
|
|
9118
|
+
path: "output_tokens",
|
|
9119
|
+
dest: "output_tokens",
|
|
9120
|
+
required: !0
|
|
9121
|
+
}
|
|
9122
|
+
]
|
|
9123
|
+
},
|
|
9124
|
+
{
|
|
9125
|
+
api_flavor: "responses",
|
|
9126
|
+
root: "usage",
|
|
9127
|
+
model_path: "model",
|
|
9128
|
+
mappings: [
|
|
9129
|
+
{
|
|
9130
|
+
path: "input_tokens",
|
|
9131
|
+
dest: "input_tokens",
|
|
9132
|
+
required: !0
|
|
9133
|
+
},
|
|
9134
|
+
{
|
|
9135
|
+
path: ["input_tokens_details", "cached_tokens"],
|
|
9136
|
+
dest: "cache_read_tokens",
|
|
9137
|
+
required: !1
|
|
9138
|
+
},
|
|
9139
|
+
{
|
|
9140
|
+
path: "output_tokens",
|
|
9141
|
+
dest: "output_tokens",
|
|
9142
|
+
required: !0
|
|
9143
|
+
}
|
|
9144
|
+
]
|
|
9145
|
+
},
|
|
8879
9146
|
{
|
|
8880
9147
|
api_flavor: "chat",
|
|
8881
9148
|
root: "usage",
|
|
@@ -12572,6 +12839,43 @@ Compared to other leading proprietary and open-weights models Command A delivers
|
|
|
12572
12839
|
output_mtok: 15
|
|
12573
12840
|
}
|
|
12574
12841
|
},
|
|
12842
|
+
{
|
|
12843
|
+
id: "anthropic/claude-sonnet-5",
|
|
12844
|
+
match: {
|
|
12845
|
+
or: [
|
|
12846
|
+
{
|
|
12847
|
+
equals: "anthropic/claude-sonnet-5"
|
|
12848
|
+
},
|
|
12849
|
+
{
|
|
12850
|
+
equals: "anthropic/claude-sonnet-5:beta"
|
|
12851
|
+
}
|
|
12852
|
+
]
|
|
12853
|
+
},
|
|
12854
|
+
context_window: 1e6,
|
|
12855
|
+
price_comments: "Flat pricing across full 1M context window (no tiered pricing). Introductory pricing ($2/$10 per MTok) applies through 2026-08-31; standard ($3/$15) from 2026-09-01. OpenRouter mirrors Anthropic first-party pricing; $2/$10 verified live via the OpenRouter API on 2026-06-30. Ref: https://openrouter.ai/anthropic/claude-sonnet-5",
|
|
12856
|
+
prices: [
|
|
12857
|
+
{
|
|
12858
|
+
prices: {
|
|
12859
|
+
input_mtok: 2,
|
|
12860
|
+
cache_write_mtok: 2.5,
|
|
12861
|
+
cache_read_mtok: 0.2,
|
|
12862
|
+
output_mtok: 10
|
|
12863
|
+
}
|
|
12864
|
+
},
|
|
12865
|
+
{
|
|
12866
|
+
constraint: {
|
|
12867
|
+
start_date: "2026-09-01",
|
|
12868
|
+
type: "start_date"
|
|
12869
|
+
},
|
|
12870
|
+
prices: {
|
|
12871
|
+
input_mtok: 3,
|
|
12872
|
+
cache_write_mtok: 3.75,
|
|
12873
|
+
cache_read_mtok: 0.3,
|
|
12874
|
+
output_mtok: 15
|
|
12875
|
+
}
|
|
12876
|
+
}
|
|
12877
|
+
]
|
|
12878
|
+
},
|
|
12575
12879
|
{
|
|
12576
12880
|
id: "anubis-pro-105b-v1",
|
|
12577
12881
|
name: "Anubis Pro 105B V1",
|
|
@@ -14132,7 +14436,14 @@ Compared to other leading proprietary and open-weights models Command A delivers
|
|
|
14132
14436
|
id: "google/gemini-3.5-flash",
|
|
14133
14437
|
name: "Gemini 3.5 Flash",
|
|
14134
14438
|
match: {
|
|
14135
|
-
|
|
14439
|
+
or: [
|
|
14440
|
+
{
|
|
14441
|
+
equals: "google/gemini-3.5-flash"
|
|
14442
|
+
},
|
|
14443
|
+
{
|
|
14444
|
+
regex: "^google/gemini-3\\.5-flash-\\d{8}$"
|
|
14445
|
+
}
|
|
14446
|
+
]
|
|
14136
14447
|
},
|
|
14137
14448
|
prices: {
|
|
14138
14449
|
input_mtok: 1.5,
|
|
@@ -19298,7 +19609,14 @@ Compared to other leading proprietary and open-weights models Command A delivers
|
|
|
19298
19609
|
id: "x-ai/grok-4.3",
|
|
19299
19610
|
name: "Grok 4.3",
|
|
19300
19611
|
match: {
|
|
19301
|
-
|
|
19612
|
+
or: [
|
|
19613
|
+
{
|
|
19614
|
+
equals: "x-ai/grok-4.3"
|
|
19615
|
+
},
|
|
19616
|
+
{
|
|
19617
|
+
regex: "^x-ai/grok-4\\.3-\\d{8}$"
|
|
19618
|
+
}
|
|
19619
|
+
]
|
|
19302
19620
|
},
|
|
19303
19621
|
prices: {
|
|
19304
19622
|
input_mtok: 1.25,
|
|
@@ -21505,6 +21823,15 @@ Compared to other leading proprietary and open-weights models Command A delivers
|
|
|
21505
21823
|
{
|
|
21506
21824
|
equals: "grok-4.3"
|
|
21507
21825
|
},
|
|
21826
|
+
{
|
|
21827
|
+
regex: "^grok-4\\.3-\\d{8}$"
|
|
21828
|
+
},
|
|
21829
|
+
{
|
|
21830
|
+
equals: "x-ai/grok-4.3"
|
|
21831
|
+
},
|
|
21832
|
+
{
|
|
21833
|
+
regex: "^x-ai/grok-4\\.3-\\d{8}$"
|
|
21834
|
+
},
|
|
21508
21835
|
{
|
|
21509
21836
|
equals: "grok-4.3-latest"
|
|
21510
21837
|
},
|
|
@@ -22012,7 +22339,7 @@ function j(e, t, i) {
|
|
|
22012
22339
|
function H(e) {
|
|
22013
22340
|
return M?.(), x(k, e);
|
|
22014
22341
|
}
|
|
22015
|
-
function
|
|
22342
|
+
function $(e, t, i) {
|
|
22016
22343
|
if (i = i ?? "default", !e.extractors)
|
|
22017
22344
|
throw new Error("No extraction logic defined for this provider");
|
|
22018
22345
|
const a = e.extractors.find((s) => s.api_flavor === i);
|
|
@@ -22105,7 +22432,7 @@ const q = {
|
|
|
22105
22432
|
guard: (e) => typeof e == "number",
|
|
22106
22433
|
name: "number"
|
|
22107
22434
|
}, h = (e, t) => [...e.map(L), ...t.map(L)].join("."), L = (e) => typeof e == "string" ? e : JSON.stringify(e);
|
|
22108
|
-
class
|
|
22435
|
+
class U {
|
|
22109
22436
|
base;
|
|
22110
22437
|
tiers;
|
|
22111
22438
|
constructor(t) {
|
|
@@ -22114,9 +22441,9 @@ class $ {
|
|
|
22114
22441
|
}
|
|
22115
22442
|
export {
|
|
22116
22443
|
R as REMOTE_DATA_JSON_URL,
|
|
22117
|
-
|
|
22444
|
+
U as TieredPrices,
|
|
22118
22445
|
j as calcPrice,
|
|
22119
|
-
|
|
22446
|
+
$ as extractUsage,
|
|
22120
22447
|
H as findProvider,
|
|
22121
22448
|
O as updatePrices,
|
|
22122
22449
|
K as waitForUpdate
|