tokencostauto 0.1.346__tar.gz → 0.1.350__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: tokencostauto
3
- Version: 0.1.346
3
+ Version: 0.1.350
4
4
  Summary: To calculate token and translated USD cost of string and message calls to OpenAI, for example when used by AI agents
5
5
  Author-email: Trisha Pan <trishaepan@gmail.com>, Alex Reibman <areibman@gmail.com>, Pratyush Shukla <ps4534@nyu.edu>, Thiago MadPin <madpin@gmail.com>
6
6
  Project-URL: Homepage, https://github.com/madpin/tokencostaudo
@@ -11,7 +11,7 @@ tokencostauto = ["model_prices.json"]
11
11
  [project]
12
12
 
13
13
  name = "tokencostauto"
14
- version = "0.1.346"
14
+ version = "0.1.350"
15
15
 
16
16
  authors = [
17
17
  { name = "Trisha Pan", email = "trishaepan@gmail.com" },
@@ -11817,14 +11817,14 @@
11817
11817
  },
11818
11818
  "azure/o3-2025-04-16": {
11819
11819
  "deprecation_date": "2026-04-16",
11820
- "cache_read_input_token_cost": 2.5e-06,
11821
- "input_cost_per_token": 1e-05,
11820
+ "cache_read_input_token_cost": 5e-07,
11821
+ "input_cost_per_token": 2e-06,
11822
11822
  "litellm_provider": "azure",
11823
11823
  "max_input_tokens": 200000,
11824
11824
  "max_output_tokens": 100000,
11825
11825
  "max_tokens": 100000,
11826
11826
  "mode": "chat",
11827
- "output_cost_per_token": 4e-05,
11827
+ "output_cost_per_token": 8e-06,
11828
11828
  "supported_endpoints": [
11829
11829
  "/v1/chat/completions",
11830
11830
  "/v1/batch",
@@ -25280,7 +25280,7 @@
25280
25280
  "fal_ai/fal-ai/flux-pro/v1.1-ultra": {
25281
25281
  "litellm_provider": "fal_ai",
25282
25282
  "mode": "image_generation",
25283
- "output_cost_per_image": 0.0398,
25283
+ "output_cost_per_image": 0.06,
25284
25284
  "supported_endpoints": [
25285
25285
  "/v1/images/generations"
25286
25286
  ]
@@ -26186,5 +26186,390 @@
26186
26186
  "metadata": {
26187
26187
  "comment": "Estimated cost based on standard TTS pricing. RunwayML uses ElevenLabs models."
26188
26188
  }
26189
+ },
26190
+ "fal_ai/fal-ai/flux-pro/v1.1": {
26191
+ "litellm_provider": "fal_ai",
26192
+ "mode": "image_generation",
26193
+ "output_cost_per_image": 0.04,
26194
+ "supported_endpoints": [
26195
+ "/v1/images/generations"
26196
+ ]
26197
+ },
26198
+ "fal_ai/fal-ai/bytedance/seedream/v3/text-to-image": {
26199
+ "litellm_provider": "fal_ai",
26200
+ "mode": "image_generation",
26201
+ "output_cost_per_image": 0.03,
26202
+ "supported_endpoints": [
26203
+ "/v1/images/generations"
26204
+ ]
26205
+ },
26206
+ "fal_ai/fal-ai/bytedance/dreamina/v3.1/text-to-image": {
26207
+ "litellm_provider": "fal_ai",
26208
+ "mode": "image_generation",
26209
+ "output_cost_per_image": 0.03,
26210
+ "supported_endpoints": [
26211
+ "/v1/images/generations"
26212
+ ]
26213
+ },
26214
+ "fal_ai/fal-ai/ideogram/v3": {
26215
+ "litellm_provider": "fal_ai",
26216
+ "mode": "image_generation",
26217
+ "output_cost_per_image": 0.06,
26218
+ "supported_endpoints": [
26219
+ "/v1/images/generations"
26220
+ ]
26221
+ },
26222
+ "vertex_ai/moonshotai/kimi-k2-thinking-maas": {
26223
+ "input_cost_per_token": 6e-07,
26224
+ "litellm_provider": "vertex_ai-moonshot_models",
26225
+ "max_input_tokens": 256000,
26226
+ "max_output_tokens": 256000,
26227
+ "max_tokens": 256000,
26228
+ "mode": "chat",
26229
+ "output_cost_per_token": 2.5e-06,
26230
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models",
26231
+ "supports_function_calling": true,
26232
+ "supports_tool_choice": true,
26233
+ "supports_web_search": true
26234
+ },
26235
+ "azure/eu/gpt-5-2025-08-07": {
26236
+ "cache_read_input_token_cost": 1.375e-07,
26237
+ "input_cost_per_token": 1.375e-06,
26238
+ "litellm_provider": "azure",
26239
+ "max_input_tokens": 272000,
26240
+ "max_output_tokens": 128000,
26241
+ "max_tokens": 128000,
26242
+ "mode": "chat",
26243
+ "output_cost_per_token": 1.1e-05,
26244
+ "supported_endpoints": [
26245
+ "/v1/chat/completions",
26246
+ "/v1/batch",
26247
+ "/v1/responses"
26248
+ ],
26249
+ "supported_modalities": [
26250
+ "text",
26251
+ "image"
26252
+ ],
26253
+ "supported_output_modalities": [
26254
+ "text"
26255
+ ],
26256
+ "supports_function_calling": true,
26257
+ "supports_native_streaming": true,
26258
+ "supports_parallel_function_calling": true,
26259
+ "supports_pdf_input": true,
26260
+ "supports_prompt_caching": true,
26261
+ "supports_reasoning": true,
26262
+ "supports_response_schema": true,
26263
+ "supports_system_messages": true,
26264
+ "supports_tool_choice": true,
26265
+ "supports_vision": true
26266
+ },
26267
+ "azure/eu/gpt-5-mini-2025-08-07": {
26268
+ "cache_read_input_token_cost": 2.75e-08,
26269
+ "input_cost_per_token": 2.75e-07,
26270
+ "litellm_provider": "azure",
26271
+ "max_input_tokens": 272000,
26272
+ "max_output_tokens": 128000,
26273
+ "max_tokens": 128000,
26274
+ "mode": "chat",
26275
+ "output_cost_per_token": 2.2e-06,
26276
+ "supported_endpoints": [
26277
+ "/v1/chat/completions",
26278
+ "/v1/batch",
26279
+ "/v1/responses"
26280
+ ],
26281
+ "supported_modalities": [
26282
+ "text",
26283
+ "image"
26284
+ ],
26285
+ "supported_output_modalities": [
26286
+ "text"
26287
+ ],
26288
+ "supports_function_calling": true,
26289
+ "supports_native_streaming": true,
26290
+ "supports_parallel_function_calling": true,
26291
+ "supports_pdf_input": true,
26292
+ "supports_prompt_caching": true,
26293
+ "supports_reasoning": true,
26294
+ "supports_response_schema": true,
26295
+ "supports_system_messages": true,
26296
+ "supports_tool_choice": true,
26297
+ "supports_vision": true
26298
+ },
26299
+ "azure/eu/gpt-5-nano-2025-08-07": {
26300
+ "cache_read_input_token_cost": 5.5e-09,
26301
+ "input_cost_per_token": 5.5e-08,
26302
+ "litellm_provider": "azure",
26303
+ "max_input_tokens": 272000,
26304
+ "max_output_tokens": 128000,
26305
+ "max_tokens": 128000,
26306
+ "mode": "chat",
26307
+ "output_cost_per_token": 4.4e-07,
26308
+ "supported_endpoints": [
26309
+ "/v1/chat/completions",
26310
+ "/v1/batch",
26311
+ "/v1/responses"
26312
+ ],
26313
+ "supported_modalities": [
26314
+ "text",
26315
+ "image"
26316
+ ],
26317
+ "supported_output_modalities": [
26318
+ "text"
26319
+ ],
26320
+ "supports_function_calling": true,
26321
+ "supports_native_streaming": true,
26322
+ "supports_parallel_function_calling": true,
26323
+ "supports_pdf_input": true,
26324
+ "supports_prompt_caching": true,
26325
+ "supports_reasoning": true,
26326
+ "supports_response_schema": true,
26327
+ "supports_system_messages": true,
26328
+ "supports_tool_choice": true,
26329
+ "supports_vision": true
26330
+ },
26331
+ "azure/us/gpt-4.1-2025-04-14": {
26332
+ "deprecation_date": "2026-11-04",
26333
+ "cache_read_input_token_cost": 5.5e-07,
26334
+ "input_cost_per_token": 2.2e-06,
26335
+ "input_cost_per_token_batches": 1.1e-06,
26336
+ "litellm_provider": "azure",
26337
+ "max_input_tokens": 1047576,
26338
+ "max_output_tokens": 32768,
26339
+ "max_tokens": 32768,
26340
+ "mode": "chat",
26341
+ "output_cost_per_token": 8.8e-06,
26342
+ "output_cost_per_token_batches": 4.4e-06,
26343
+ "supported_endpoints": [
26344
+ "/v1/chat/completions",
26345
+ "/v1/batch",
26346
+ "/v1/responses"
26347
+ ],
26348
+ "supported_modalities": [
26349
+ "text",
26350
+ "image"
26351
+ ],
26352
+ "supported_output_modalities": [
26353
+ "text"
26354
+ ],
26355
+ "supports_function_calling": true,
26356
+ "supports_native_streaming": true,
26357
+ "supports_parallel_function_calling": true,
26358
+ "supports_prompt_caching": true,
26359
+ "supports_response_schema": true,
26360
+ "supports_system_messages": true,
26361
+ "supports_tool_choice": true,
26362
+ "supports_vision": true,
26363
+ "supports_web_search": false
26364
+ },
26365
+ "azure/us/gpt-4.1-mini-2025-04-14": {
26366
+ "deprecation_date": "2026-11-04",
26367
+ "cache_read_input_token_cost": 1.1e-07,
26368
+ "input_cost_per_token": 4.4e-07,
26369
+ "input_cost_per_token_batches": 2.2e-07,
26370
+ "litellm_provider": "azure",
26371
+ "max_input_tokens": 1047576,
26372
+ "max_output_tokens": 32768,
26373
+ "max_tokens": 32768,
26374
+ "mode": "chat",
26375
+ "output_cost_per_token": 1.76e-06,
26376
+ "output_cost_per_token_batches": 8.8e-07,
26377
+ "supported_endpoints": [
26378
+ "/v1/chat/completions",
26379
+ "/v1/batch",
26380
+ "/v1/responses"
26381
+ ],
26382
+ "supported_modalities": [
26383
+ "text",
26384
+ "image"
26385
+ ],
26386
+ "supported_output_modalities": [
26387
+ "text"
26388
+ ],
26389
+ "supports_function_calling": true,
26390
+ "supports_native_streaming": true,
26391
+ "supports_parallel_function_calling": true,
26392
+ "supports_prompt_caching": true,
26393
+ "supports_response_schema": true,
26394
+ "supports_system_messages": true,
26395
+ "supports_tool_choice": true,
26396
+ "supports_vision": true,
26397
+ "supports_web_search": false
26398
+ },
26399
+ "azure/us/gpt-4.1-nano-2025-04-14": {
26400
+ "deprecation_date": "2026-11-04",
26401
+ "cache_read_input_token_cost": 2.5e-08,
26402
+ "input_cost_per_token": 1.1e-07,
26403
+ "input_cost_per_token_batches": 6e-08,
26404
+ "litellm_provider": "azure",
26405
+ "max_input_tokens": 1047576,
26406
+ "max_output_tokens": 32768,
26407
+ "max_tokens": 32768,
26408
+ "mode": "chat",
26409
+ "output_cost_per_token": 4.4e-07,
26410
+ "output_cost_per_token_batches": 2.2e-07,
26411
+ "supported_endpoints": [
26412
+ "/v1/chat/completions",
26413
+ "/v1/batch",
26414
+ "/v1/responses"
26415
+ ],
26416
+ "supported_modalities": [
26417
+ "text",
26418
+ "image"
26419
+ ],
26420
+ "supported_output_modalities": [
26421
+ "text"
26422
+ ],
26423
+ "supports_function_calling": true,
26424
+ "supports_native_streaming": true,
26425
+ "supports_parallel_function_calling": true,
26426
+ "supports_prompt_caching": true,
26427
+ "supports_response_schema": true,
26428
+ "supports_system_messages": true,
26429
+ "supports_tool_choice": true,
26430
+ "supports_vision": true
26431
+ },
26432
+ "azure/us/gpt-5-2025-08-07": {
26433
+ "cache_read_input_token_cost": 1.375e-07,
26434
+ "input_cost_per_token": 1.375e-06,
26435
+ "litellm_provider": "azure",
26436
+ "max_input_tokens": 272000,
26437
+ "max_output_tokens": 128000,
26438
+ "max_tokens": 128000,
26439
+ "mode": "chat",
26440
+ "output_cost_per_token": 1.1e-05,
26441
+ "supported_endpoints": [
26442
+ "/v1/chat/completions",
26443
+ "/v1/batch",
26444
+ "/v1/responses"
26445
+ ],
26446
+ "supported_modalities": [
26447
+ "text",
26448
+ "image"
26449
+ ],
26450
+ "supported_output_modalities": [
26451
+ "text"
26452
+ ],
26453
+ "supports_function_calling": true,
26454
+ "supports_native_streaming": true,
26455
+ "supports_parallel_function_calling": true,
26456
+ "supports_pdf_input": true,
26457
+ "supports_prompt_caching": true,
26458
+ "supports_reasoning": true,
26459
+ "supports_response_schema": true,
26460
+ "supports_system_messages": true,
26461
+ "supports_tool_choice": true,
26462
+ "supports_vision": true
26463
+ },
26464
+ "azure/us/gpt-5-mini-2025-08-07": {
26465
+ "cache_read_input_token_cost": 2.75e-08,
26466
+ "input_cost_per_token": 2.75e-07,
26467
+ "litellm_provider": "azure",
26468
+ "max_input_tokens": 272000,
26469
+ "max_output_tokens": 128000,
26470
+ "max_tokens": 128000,
26471
+ "mode": "chat",
26472
+ "output_cost_per_token": 2.2e-06,
26473
+ "supported_endpoints": [
26474
+ "/v1/chat/completions",
26475
+ "/v1/batch",
26476
+ "/v1/responses"
26477
+ ],
26478
+ "supported_modalities": [
26479
+ "text",
26480
+ "image"
26481
+ ],
26482
+ "supported_output_modalities": [
26483
+ "text"
26484
+ ],
26485
+ "supports_function_calling": true,
26486
+ "supports_native_streaming": true,
26487
+ "supports_parallel_function_calling": true,
26488
+ "supports_pdf_input": true,
26489
+ "supports_prompt_caching": true,
26490
+ "supports_reasoning": true,
26491
+ "supports_response_schema": true,
26492
+ "supports_system_messages": true,
26493
+ "supports_tool_choice": true,
26494
+ "supports_vision": true
26495
+ },
26496
+ "azure/us/gpt-5-nano-2025-08-07": {
26497
+ "cache_read_input_token_cost": 5.5e-09,
26498
+ "input_cost_per_token": 5.5e-08,
26499
+ "litellm_provider": "azure",
26500
+ "max_input_tokens": 272000,
26501
+ "max_output_tokens": 128000,
26502
+ "max_tokens": 128000,
26503
+ "mode": "chat",
26504
+ "output_cost_per_token": 4.4e-07,
26505
+ "supported_endpoints": [
26506
+ "/v1/chat/completions",
26507
+ "/v1/batch",
26508
+ "/v1/responses"
26509
+ ],
26510
+ "supported_modalities": [
26511
+ "text",
26512
+ "image"
26513
+ ],
26514
+ "supported_output_modalities": [
26515
+ "text"
26516
+ ],
26517
+ "supports_function_calling": true,
26518
+ "supports_native_streaming": true,
26519
+ "supports_parallel_function_calling": true,
26520
+ "supports_pdf_input": true,
26521
+ "supports_prompt_caching": true,
26522
+ "supports_reasoning": true,
26523
+ "supports_response_schema": true,
26524
+ "supports_system_messages": true,
26525
+ "supports_tool_choice": true,
26526
+ "supports_vision": true
26527
+ },
26528
+ "azure/us/o3-2025-04-16": {
26529
+ "deprecation_date": "2026-04-16",
26530
+ "cache_read_input_token_cost": 5.5e-07,
26531
+ "input_cost_per_token": 2.2e-06,
26532
+ "litellm_provider": "azure",
26533
+ "max_input_tokens": 200000,
26534
+ "max_output_tokens": 100000,
26535
+ "max_tokens": 100000,
26536
+ "mode": "chat",
26537
+ "output_cost_per_token": 8.8e-06,
26538
+ "supported_endpoints": [
26539
+ "/v1/chat/completions",
26540
+ "/v1/batch",
26541
+ "/v1/responses"
26542
+ ],
26543
+ "supported_modalities": [
26544
+ "text",
26545
+ "image"
26546
+ ],
26547
+ "supported_output_modalities": [
26548
+ "text"
26549
+ ],
26550
+ "supports_function_calling": true,
26551
+ "supports_parallel_function_calling": false,
26552
+ "supports_prompt_caching": true,
26553
+ "supports_reasoning": true,
26554
+ "supports_response_schema": true,
26555
+ "supports_tool_choice": true,
26556
+ "supports_vision": true
26557
+ },
26558
+ "azure/us/o4-mini-2025-04-16": {
26559
+ "cache_read_input_token_cost": 3.1e-07,
26560
+ "input_cost_per_token": 1.21e-06,
26561
+ "litellm_provider": "azure",
26562
+ "max_input_tokens": 200000,
26563
+ "max_output_tokens": 100000,
26564
+ "max_tokens": 100000,
26565
+ "mode": "chat",
26566
+ "output_cost_per_token": 4.84e-06,
26567
+ "supports_function_calling": true,
26568
+ "supports_parallel_function_calling": false,
26569
+ "supports_prompt_caching": true,
26570
+ "supports_reasoning": true,
26571
+ "supports_response_schema": true,
26572
+ "supports_tool_choice": true,
26573
+ "supports_vision": true
26189
26574
  }
26190
26575
  }
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: tokencostauto
3
- Version: 0.1.346
3
+ Version: 0.1.350
4
4
  Summary: To calculate token and translated USD cost of string and message calls to OpenAI, for example when used by AI agents
5
5
  Author-email: Trisha Pan <trishaepan@gmail.com>, Alex Reibman <areibman@gmail.com>, Pratyush Shukla <ps4534@nyu.edu>, Thiago MadPin <madpin@gmail.com>
6
6
  Project-URL: Homepage, https://github.com/madpin/tokencostaudo
File without changes