tokencostauto 0.1.376__py3-none-any.whl → 0.1.380__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -553,6 +553,7 @@
553
553
  "supports_tool_choice": true
554
554
  },
555
555
  "ft:gpt-4o-2024-08-06": {
556
+ "cache_read_input_token_cost": 1.875e-06,
556
557
  "input_cost_per_token": 3.75e-06,
557
558
  "input_cost_per_token_batches": 1.875e-06,
558
559
  "litellm_provider": "openai",
@@ -565,6 +566,7 @@
565
566
  "supports_function_calling": true,
566
567
  "supports_parallel_function_calling": true,
567
568
  "supports_pdf_input": true,
569
+ "supports_prompt_caching": true,
568
570
  "supports_response_schema": true,
569
571
  "supports_system_messages": true,
570
572
  "supports_tool_choice": true,
@@ -587,29 +589,28 @@
587
589
  "supports_prompt_caching": true,
588
590
  "supports_response_schema": true,
589
591
  "supports_system_messages": true,
590
- "supports_tool_choice": true,
591
- "supports_vision": true
592
+ "supports_tool_choice": true
592
593
  },
593
594
  "ft:davinci-002": {
594
- "input_cost_per_token": 2e-06,
595
+ "input_cost_per_token": 1.2e-05,
595
596
  "input_cost_per_token_batches": 1e-06,
596
597
  "litellm_provider": "text-completion-openai",
597
598
  "max_input_tokens": 16384,
598
599
  "max_output_tokens": 4096,
599
600
  "max_tokens": 16384,
600
601
  "mode": "completion",
601
- "output_cost_per_token": 2e-06,
602
+ "output_cost_per_token": 1.2e-05,
602
603
  "output_cost_per_token_batches": 1e-06
603
604
  },
604
605
  "ft:babbage-002": {
605
- "input_cost_per_token": 4e-07,
606
+ "input_cost_per_token": 1.6e-06,
606
607
  "input_cost_per_token_batches": 2e-07,
607
608
  "litellm_provider": "text-completion-openai",
608
609
  "max_input_tokens": 16384,
609
610
  "max_output_tokens": 4096,
610
611
  "max_tokens": 16384,
611
612
  "mode": "completion",
612
- "output_cost_per_token": 4e-07,
613
+ "output_cost_per_token": 1.6e-06,
613
614
  "output_cost_per_token_batches": 2e-07
614
615
  },
615
616
  "text-embedding-3-large": {
@@ -7234,7 +7235,7 @@
7234
7235
  "output_cost_per_token": 0.0
7235
7236
  },
7236
7237
  "databricks/databricks-meta-llama-3-1-405b-instruct": {
7237
- "input_cost_per_token": 5e-06,
7238
+ "input_cost_per_token": 5.00003e-06,
7238
7239
  "input_dbu_cost_per_token": 7.1429e-05,
7239
7240
  "litellm_provider": "databricks",
7240
7241
  "max_input_tokens": 128000,
@@ -7244,8 +7245,8 @@
7244
7245
  "notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
7245
7246
  },
7246
7247
  "mode": "chat",
7247
- "output_cost_per_token": 1.500002e-05,
7248
- "output_db_cost_per_token": 0.000214286,
7248
+ "output_cost_per_token": 1.5000020000000002e-05,
7249
+ "output_dbu_cost_per_token": 0.000214286,
7249
7250
  "source": "https://www.databricks.com/product/pricing/foundation-model-serving",
7250
7251
  "supports_tool_choice": true
7251
7252
  },
@@ -7292,7 +7293,7 @@
7292
7293
  "notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
7293
7294
  },
7294
7295
  "mode": "chat",
7295
- "output_cost_per_token": 2.99999e-06,
7296
+ "output_cost_per_token": 2.9999900000000002e-06,
7296
7297
  "output_dbu_cost_per_token": 4.2857e-05,
7297
7298
  "source": "https://www.databricks.com/product/pricing/foundation-model-serving",
7298
7299
  "supports_tool_choice": true
@@ -7308,7 +7309,7 @@
7308
7309
  "notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
7309
7310
  },
7310
7311
  "mode": "chat",
7311
- "output_cost_per_token": 1.5e-06,
7312
+ "output_cost_per_token": 1.5000300000000002e-06,
7312
7313
  "output_dbu_cost_per_token": 2.1429e-05,
7313
7314
  "source": "https://www.databricks.com/product/pricing/foundation-model-serving",
7314
7315
  "supports_tool_choice": true
@@ -7324,13 +7325,13 @@
7324
7325
  "notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
7325
7326
  },
7326
7327
  "mode": "chat",
7327
- "output_cost_per_token": 9.9902e-07,
7328
+ "output_cost_per_token": 1.00002e-06,
7328
7329
  "output_dbu_cost_per_token": 1.4286e-05,
7329
7330
  "source": "https://www.databricks.com/product/pricing/foundation-model-serving",
7330
7331
  "supports_tool_choice": true
7331
7332
  },
7332
7333
  "databricks/databricks-mpt-30b-instruct": {
7333
- "input_cost_per_token": 9.9902e-07,
7334
+ "input_cost_per_token": 1.00002e-06,
7334
7335
  "input_dbu_cost_per_token": 1.4286e-05,
7335
7336
  "litellm_provider": "databricks",
7336
7337
  "max_input_tokens": 8192,
@@ -7340,7 +7341,7 @@
7340
7341
  "notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
7341
7342
  },
7342
7343
  "mode": "chat",
7343
- "output_cost_per_token": 9.9902e-07,
7344
+ "output_cost_per_token": 1.00002e-06,
7344
7345
  "output_dbu_cost_per_token": 1.4286e-05,
7345
7346
  "source": "https://www.databricks.com/product/pricing/foundation-model-serving",
7346
7347
  "supports_tool_choice": true
@@ -7377,7 +7378,7 @@
7377
7378
  "source": "https://www.databricks.com/product/pricing/foundation-model-serving"
7378
7379
  },
7379
7380
  "databricks/databricks-gte-large-en": {
7380
- "input_cost_per_token": 1.2999e-07,
7381
+ "input_cost_per_token": 1.2999000000000001e-07,
7381
7382
  "input_dbu_cost_per_token": 1.857e-06,
7382
7383
  "litellm_provider": "databricks",
7383
7384
  "max_input_tokens": 8192,
@@ -7747,8 +7748,7 @@
7747
7748
  "supports_prompt_caching": true,
7748
7749
  "supports_response_schema": true,
7749
7750
  "supports_system_messages": true,
7750
- "supports_tool_choice": true,
7751
- "supports_vision": true
7751
+ "supports_tool_choice": true
7752
7752
  },
7753
7753
  "azure/gpt-4o-2024-11-20": {
7754
7754
  "deprecation_date": "2026-03-01",
@@ -13185,27 +13185,27 @@
13185
13185
  "output_cost_per_token": 9e-07
13186
13186
  },
13187
13187
  "databricks/databricks-claude-3-7-sonnet": {
13188
- "input_cost_per_token": 2.5e-06,
13189
- "input_dbu_cost_per_token": 3.571e-05,
13188
+ "input_cost_per_token": 2.9999900000000002e-06,
13189
+ "input_dbu_cost_per_token": 4.2857e-05,
13190
13190
  "litellm_provider": "databricks",
13191
13191
  "max_input_tokens": 200000,
13192
13192
  "max_output_tokens": 128000,
13193
13193
  "max_tokens": 200000,
13194
13194
  "metadata": {
13195
- "notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Claude 3.7 conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
13195
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
13196
13196
  },
13197
13197
  "mode": "chat",
13198
- "output_cost_per_token": 1.7857e-05,
13199
- "output_db_cost_per_token": 0.000214286,
13200
- "source": "https://www.databricks.com/product/pricing/foundation-model-serving",
13198
+ "output_cost_per_token": 1.5000020000000002e-05,
13199
+ "output_dbu_cost_per_token": 0.000214286,
13200
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
13201
13201
  "supports_assistant_prefill": true,
13202
13202
  "supports_function_calling": true,
13203
13203
  "supports_reasoning": true,
13204
13204
  "supports_tool_choice": true
13205
13205
  },
13206
13206
  "databricks/databricks-meta-llama-3-3-70b-instruct": {
13207
- "input_cost_per_token": 1.00002e-06,
13208
- "input_dbu_cost_per_token": 1.4286e-05,
13207
+ "input_cost_per_token": 5.0001e-07,
13208
+ "input_dbu_cost_per_token": 7.143e-06,
13209
13209
  "litellm_provider": "databricks",
13210
13210
  "max_input_tokens": 128000,
13211
13211
  "max_output_tokens": 128000,
@@ -13214,8 +13214,8 @@
13214
13214
  "notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
13215
13215
  },
13216
13216
  "mode": "chat",
13217
- "output_cost_per_token": 2.99999e-06,
13218
- "output_dbu_cost_per_token": 4.2857e-05,
13217
+ "output_cost_per_token": 1.5000300000000002e-06,
13218
+ "output_dbu_cost_per_token": 2.1429e-05,
13219
13219
  "source": "https://www.databricks.com/product/pricing/foundation-model-serving",
13220
13220
  "supports_tool_choice": true
13221
13221
  },
@@ -14261,8 +14261,8 @@
14261
14261
  "tool_use_system_prompt_tokens": 159
14262
14262
  },
14263
14263
  "databricks/databricks-llama-4-maverick": {
14264
- "input_cost_per_token": 5e-06,
14265
- "input_dbu_cost_per_token": 7.143e-05,
14264
+ "input_cost_per_token": 5.0001e-07,
14265
+ "input_dbu_cost_per_token": 7.143e-06,
14266
14266
  "litellm_provider": "databricks",
14267
14267
  "max_input_tokens": 128000,
14268
14268
  "max_output_tokens": 128000,
@@ -14271,8 +14271,8 @@
14271
14271
  "notes": "Databricks documentation now provides both DBU costs (_dbu_cost_per_token) and dollar costs(_cost_per_token)."
14272
14272
  },
14273
14273
  "mode": "chat",
14274
- "output_cost_per_token": 1.5e-05,
14275
- "output_dbu_cost_per_token": 0.00021429,
14274
+ "output_cost_per_token": 1.5000300000000002e-06,
14275
+ "output_dbu_cost_per_token": 2.1429e-05,
14276
14276
  "source": "https://www.databricks.com/product/pricing/foundation-model-serving",
14277
14277
  "supports_tool_choice": true
14278
14278
  },
@@ -28335,5 +28335,622 @@
28335
28335
  "supports_function_calling": true,
28336
28336
  "supports_response_schema": true,
28337
28337
  "supports_tool_choice": true
28338
+ },
28339
+ "claude-opus-4-5": {
28340
+ "cache_creation_input_token_cost": 6.25e-06,
28341
+ "cache_creation_input_token_cost_above_1hr": 1e-05,
28342
+ "cache_read_input_token_cost": 5e-07,
28343
+ "input_cost_per_token": 5e-06,
28344
+ "litellm_provider": "anthropic",
28345
+ "max_input_tokens": 200000,
28346
+ "max_output_tokens": 64000,
28347
+ "max_tokens": 64000,
28348
+ "mode": "chat",
28349
+ "output_cost_per_token": 2.5e-05,
28350
+ "search_context_cost_per_query": {
28351
+ "search_context_size_high": 0.01,
28352
+ "search_context_size_low": 0.01,
28353
+ "search_context_size_medium": 0.01
28354
+ },
28355
+ "supports_assistant_prefill": true,
28356
+ "supports_computer_use": true,
28357
+ "supports_function_calling": true,
28358
+ "supports_pdf_input": true,
28359
+ "supports_prompt_caching": true,
28360
+ "supports_reasoning": true,
28361
+ "supports_response_schema": true,
28362
+ "supports_tool_choice": true,
28363
+ "supports_vision": true,
28364
+ "tool_use_system_prompt_tokens": 159
28365
+ },
28366
+ "databricks/databricks-claude-haiku-4-5": {
28367
+ "input_cost_per_token": 1.00002e-06,
28368
+ "input_dbu_cost_per_token": 1.4286e-05,
28369
+ "litellm_provider": "databricks",
28370
+ "max_input_tokens": 200000,
28371
+ "max_output_tokens": 64000,
28372
+ "max_tokens": 200000,
28373
+ "metadata": {
28374
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28375
+ },
28376
+ "mode": "chat",
28377
+ "output_cost_per_token": 5.00003e-06,
28378
+ "output_dbu_cost_per_token": 7.1429e-05,
28379
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
28380
+ "supports_assistant_prefill": true,
28381
+ "supports_function_calling": true,
28382
+ "supports_reasoning": true,
28383
+ "supports_tool_choice": true
28384
+ },
28385
+ "databricks/databricks-claude-opus-4": {
28386
+ "input_cost_per_token": 1.5000020000000002e-05,
28387
+ "input_dbu_cost_per_token": 0.000214286,
28388
+ "litellm_provider": "databricks",
28389
+ "max_input_tokens": 200000,
28390
+ "max_output_tokens": 32000,
28391
+ "max_tokens": 200000,
28392
+ "metadata": {
28393
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28394
+ },
28395
+ "mode": "chat",
28396
+ "output_cost_per_token": 7.500003000000001e-05,
28397
+ "output_dbu_cost_per_token": 0.001071429,
28398
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
28399
+ "supports_assistant_prefill": true,
28400
+ "supports_function_calling": true,
28401
+ "supports_reasoning": true,
28402
+ "supports_tool_choice": true
28403
+ },
28404
+ "databricks/databricks-claude-opus-4-1": {
28405
+ "input_cost_per_token": 1.5000020000000002e-05,
28406
+ "input_dbu_cost_per_token": 0.000214286,
28407
+ "litellm_provider": "databricks",
28408
+ "max_input_tokens": 200000,
28409
+ "max_output_tokens": 32000,
28410
+ "max_tokens": 200000,
28411
+ "metadata": {
28412
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28413
+ },
28414
+ "mode": "chat",
28415
+ "output_cost_per_token": 7.500003000000001e-05,
28416
+ "output_dbu_cost_per_token": 0.001071429,
28417
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
28418
+ "supports_assistant_prefill": true,
28419
+ "supports_function_calling": true,
28420
+ "supports_reasoning": true,
28421
+ "supports_tool_choice": true
28422
+ },
28423
+ "databricks/databricks-claude-opus-4-5": {
28424
+ "input_cost_per_token": 5.00003e-06,
28425
+ "input_dbu_cost_per_token": 7.1429e-05,
28426
+ "litellm_provider": "databricks",
28427
+ "max_input_tokens": 200000,
28428
+ "max_output_tokens": 64000,
28429
+ "max_tokens": 200000,
28430
+ "metadata": {
28431
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28432
+ },
28433
+ "mode": "chat",
28434
+ "output_cost_per_token": 2.5000010000000002e-05,
28435
+ "output_dbu_cost_per_token": 0.000357143,
28436
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
28437
+ "supports_assistant_prefill": true,
28438
+ "supports_function_calling": true,
28439
+ "supports_reasoning": true,
28440
+ "supports_tool_choice": true
28441
+ },
28442
+ "databricks/databricks-claude-sonnet-4": {
28443
+ "input_cost_per_token": 2.9999900000000002e-06,
28444
+ "input_dbu_cost_per_token": 4.2857e-05,
28445
+ "litellm_provider": "databricks",
28446
+ "max_input_tokens": 200000,
28447
+ "max_output_tokens": 64000,
28448
+ "max_tokens": 200000,
28449
+ "metadata": {
28450
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28451
+ },
28452
+ "mode": "chat",
28453
+ "output_cost_per_token": 1.5000020000000002e-05,
28454
+ "output_dbu_cost_per_token": 0.000214286,
28455
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
28456
+ "supports_assistant_prefill": true,
28457
+ "supports_function_calling": true,
28458
+ "supports_reasoning": true,
28459
+ "supports_tool_choice": true
28460
+ },
28461
+ "databricks/databricks-claude-sonnet-4-1": {
28462
+ "input_cost_per_token": 2.9999900000000002e-06,
28463
+ "input_dbu_cost_per_token": 4.2857e-05,
28464
+ "litellm_provider": "databricks",
28465
+ "max_input_tokens": 200000,
28466
+ "max_output_tokens": 64000,
28467
+ "max_tokens": 200000,
28468
+ "metadata": {
28469
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28470
+ },
28471
+ "mode": "chat",
28472
+ "output_cost_per_token": 1.5000020000000002e-05,
28473
+ "output_dbu_cost_per_token": 0.000214286,
28474
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
28475
+ "supports_assistant_prefill": true,
28476
+ "supports_function_calling": true,
28477
+ "supports_reasoning": true,
28478
+ "supports_tool_choice": true
28479
+ },
28480
+ "databricks/databricks-claude-sonnet-4-5": {
28481
+ "input_cost_per_token": 2.9999900000000002e-06,
28482
+ "input_dbu_cost_per_token": 4.2857e-05,
28483
+ "litellm_provider": "databricks",
28484
+ "max_input_tokens": 200000,
28485
+ "max_output_tokens": 64000,
28486
+ "max_tokens": 200000,
28487
+ "metadata": {
28488
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28489
+ },
28490
+ "mode": "chat",
28491
+ "output_cost_per_token": 1.5000020000000002e-05,
28492
+ "output_dbu_cost_per_token": 0.000214286,
28493
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
28494
+ "supports_assistant_prefill": true,
28495
+ "supports_function_calling": true,
28496
+ "supports_reasoning": true,
28497
+ "supports_tool_choice": true
28498
+ },
28499
+ "databricks/databricks-gemini-2-5-flash": {
28500
+ "input_cost_per_token": 3.0001999999999996e-07,
28501
+ "input_dbu_cost_per_token": 4.285999999999999e-06,
28502
+ "litellm_provider": "databricks",
28503
+ "max_input_tokens": 1048576,
28504
+ "max_output_tokens": 65535,
28505
+ "max_tokens": 1048576,
28506
+ "metadata": {
28507
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28508
+ },
28509
+ "mode": "chat",
28510
+ "output_cost_per_token": 2.49998e-06,
28511
+ "output_dbu_cost_per_token": 3.5714e-05,
28512
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
28513
+ "supports_function_calling": true,
28514
+ "supports_tool_choice": true
28515
+ },
28516
+ "databricks/databricks-gemini-2-5-pro": {
28517
+ "input_cost_per_token": 1.24999e-06,
28518
+ "input_dbu_cost_per_token": 1.7857e-05,
28519
+ "litellm_provider": "databricks",
28520
+ "max_input_tokens": 1048576,
28521
+ "max_output_tokens": 65536,
28522
+ "max_tokens": 1048576,
28523
+ "metadata": {
28524
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28525
+ },
28526
+ "mode": "chat",
28527
+ "output_cost_per_token": 9.999990000000002e-06,
28528
+ "output_dbu_cost_per_token": 0.000142857,
28529
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
28530
+ "supports_function_calling": true,
28531
+ "supports_tool_choice": true
28532
+ },
28533
+ "databricks/databricks-gemma-3-12b": {
28534
+ "input_cost_per_token": 1.5000999999999998e-07,
28535
+ "input_dbu_cost_per_token": 2.1429999999999996e-06,
28536
+ "litellm_provider": "databricks",
28537
+ "max_input_tokens": 128000,
28538
+ "max_output_tokens": 32000,
28539
+ "max_tokens": 128000,
28540
+ "metadata": {
28541
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28542
+ },
28543
+ "mode": "chat",
28544
+ "output_cost_per_token": 5.0001e-07,
28545
+ "output_dbu_cost_per_token": 7.143e-06,
28546
+ "source": "https://www.databricks.com/product/pricing/foundation-model-serving"
28547
+ },
28548
+ "databricks/databricks-gpt-5": {
28549
+ "input_cost_per_token": 1.24999e-06,
28550
+ "input_dbu_cost_per_token": 1.7857e-05,
28551
+ "litellm_provider": "databricks",
28552
+ "max_input_tokens": 400000,
28553
+ "max_output_tokens": 128000,
28554
+ "max_tokens": 400000,
28555
+ "metadata": {
28556
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28557
+ },
28558
+ "mode": "chat",
28559
+ "output_cost_per_token": 9.999990000000002e-06,
28560
+ "output_dbu_cost_per_token": 0.000142857,
28561
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving"
28562
+ },
28563
+ "databricks/databricks-gpt-5-1": {
28564
+ "input_cost_per_token": 1.24999e-06,
28565
+ "input_dbu_cost_per_token": 1.7857e-05,
28566
+ "litellm_provider": "databricks",
28567
+ "max_input_tokens": 400000,
28568
+ "max_output_tokens": 128000,
28569
+ "max_tokens": 400000,
28570
+ "metadata": {
28571
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28572
+ },
28573
+ "mode": "chat",
28574
+ "output_cost_per_token": 9.999990000000002e-06,
28575
+ "output_dbu_cost_per_token": 0.000142857,
28576
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving"
28577
+ },
28578
+ "databricks/databricks-gpt-5-mini": {
28579
+ "input_cost_per_token": 2.4997000000000006e-07,
28580
+ "input_dbu_cost_per_token": 3.571e-06,
28581
+ "litellm_provider": "databricks",
28582
+ "max_input_tokens": 400000,
28583
+ "max_output_tokens": 128000,
28584
+ "max_tokens": 400000,
28585
+ "metadata": {
28586
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28587
+ },
28588
+ "mode": "chat",
28589
+ "output_cost_per_token": 1.9999700000000004e-06,
28590
+ "output_dbu_cost_per_token": 2.8571e-05,
28591
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving"
28592
+ },
28593
+ "databricks/databricks-gpt-5-nano": {
28594
+ "input_cost_per_token": 4.998e-08,
28595
+ "input_dbu_cost_per_token": 7.14e-07,
28596
+ "litellm_provider": "databricks",
28597
+ "max_input_tokens": 400000,
28598
+ "max_output_tokens": 128000,
28599
+ "max_tokens": 400000,
28600
+ "metadata": {
28601
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28602
+ },
28603
+ "mode": "chat",
28604
+ "output_cost_per_token": 3.9998000000000007e-07,
28605
+ "output_dbu_cost_per_token": 5.714000000000001e-06,
28606
+ "source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving"
28607
+ },
28608
+ "databricks/databricks-gpt-oss-120b": {
28609
+ "input_cost_per_token": 1.5000999999999998e-07,
28610
+ "input_dbu_cost_per_token": 2.1429999999999996e-06,
28611
+ "litellm_provider": "databricks",
28612
+ "max_input_tokens": 131072,
28613
+ "max_output_tokens": 131072,
28614
+ "max_tokens": 131072,
28615
+ "metadata": {
28616
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28617
+ },
28618
+ "mode": "chat",
28619
+ "output_cost_per_token": 5.9997e-07,
28620
+ "output_dbu_cost_per_token": 8.571e-06,
28621
+ "source": "https://www.databricks.com/product/pricing/foundation-model-serving"
28622
+ },
28623
+ "databricks/databricks-gpt-oss-20b": {
28624
+ "input_cost_per_token": 7e-08,
28625
+ "input_dbu_cost_per_token": 1e-06,
28626
+ "litellm_provider": "databricks",
28627
+ "max_input_tokens": 131072,
28628
+ "max_output_tokens": 131072,
28629
+ "max_tokens": 131072,
28630
+ "metadata": {
28631
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28632
+ },
28633
+ "mode": "chat",
28634
+ "output_cost_per_token": 3.0001999999999996e-07,
28635
+ "output_dbu_cost_per_token": 4.285999999999999e-06,
28636
+ "source": "https://www.databricks.com/product/pricing/foundation-model-serving"
28637
+ },
28638
+ "databricks/databricks-meta-llama-3-1-8b-instruct": {
28639
+ "input_cost_per_token": 1.5000999999999998e-07,
28640
+ "input_dbu_cost_per_token": 2.1429999999999996e-06,
28641
+ "litellm_provider": "databricks",
28642
+ "max_input_tokens": 200000,
28643
+ "max_output_tokens": 128000,
28644
+ "max_tokens": 200000,
28645
+ "metadata": {
28646
+ "notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
28647
+ },
28648
+ "mode": "chat",
28649
+ "output_cost_per_token": 4.5003000000000007e-07,
28650
+ "output_dbu_cost_per_token": 6.429000000000001e-06,
28651
+ "source": "https://www.databricks.com/product/pricing/foundation-model-serving"
28652
+ },
28653
+ "fireworks_ai/accounts/fireworks/models/deepseek-v3p2": {
28654
+ "input_cost_per_token": 1.2e-06,
28655
+ "litellm_provider": "fireworks_ai",
28656
+ "max_input_tokens": 163840,
28657
+ "max_output_tokens": 163840,
28658
+ "max_tokens": 163840,
28659
+ "mode": "chat",
28660
+ "output_cost_per_token": 1.2e-06,
28661
+ "source": "https://fireworks.ai/models/fireworks/deepseek-v3p2",
28662
+ "supports_function_calling": true,
28663
+ "supports_response_schema": true,
28664
+ "supports_tool_choice": true
28665
+ },
28666
+ "vertex_ai/chirp": {
28667
+ "input_cost_per_character": 3e-05,
28668
+ "litellm_provider": "vertex_ai",
28669
+ "mode": "audio_speech",
28670
+ "source": "https://cloud.google.com/text-to-speech/pricing",
28671
+ "supported_endpoints": [
28672
+ "/v1/audio/speech"
28673
+ ]
28674
+ },
28675
+ "zai/glm-4.6": {
28676
+ "input_cost_per_token": 6e-07,
28677
+ "output_cost_per_token": 2.2e-06,
28678
+ "litellm_provider": "zai",
28679
+ "max_input_tokens": 200000,
28680
+ "max_output_tokens": 128000,
28681
+ "mode": "chat",
28682
+ "supports_function_calling": true,
28683
+ "supports_tool_choice": true,
28684
+ "source": "https://docs.z.ai/guides/overview/pricing"
28685
+ },
28686
+ "zai/glm-4.5": {
28687
+ "input_cost_per_token": 6e-07,
28688
+ "output_cost_per_token": 2.2e-06,
28689
+ "litellm_provider": "zai",
28690
+ "max_input_tokens": 128000,
28691
+ "max_output_tokens": 32000,
28692
+ "mode": "chat",
28693
+ "supports_function_calling": true,
28694
+ "supports_tool_choice": true,
28695
+ "source": "https://docs.z.ai/guides/overview/pricing"
28696
+ },
28697
+ "zai/glm-4.5v": {
28698
+ "input_cost_per_token": 6e-07,
28699
+ "output_cost_per_token": 1.8e-06,
28700
+ "litellm_provider": "zai",
28701
+ "max_input_tokens": 128000,
28702
+ "max_output_tokens": 32000,
28703
+ "mode": "chat",
28704
+ "supports_function_calling": true,
28705
+ "supports_tool_choice": true,
28706
+ "supports_vision": true,
28707
+ "source": "https://docs.z.ai/guides/overview/pricing"
28708
+ },
28709
+ "zai/glm-4.5-x": {
28710
+ "input_cost_per_token": 2.2e-06,
28711
+ "output_cost_per_token": 8.9e-06,
28712
+ "litellm_provider": "zai",
28713
+ "max_input_tokens": 128000,
28714
+ "max_output_tokens": 32000,
28715
+ "mode": "chat",
28716
+ "supports_function_calling": true,
28717
+ "supports_tool_choice": true,
28718
+ "source": "https://docs.z.ai/guides/overview/pricing"
28719
+ },
28720
+ "zai/glm-4.5-air": {
28721
+ "input_cost_per_token": 2e-07,
28722
+ "output_cost_per_token": 1.1e-06,
28723
+ "litellm_provider": "zai",
28724
+ "max_input_tokens": 128000,
28725
+ "max_output_tokens": 32000,
28726
+ "mode": "chat",
28727
+ "supports_function_calling": true,
28728
+ "supports_tool_choice": true,
28729
+ "source": "https://docs.z.ai/guides/overview/pricing"
28730
+ },
28731
+ "zai/glm-4.5-airx": {
28732
+ "input_cost_per_token": 1.1e-06,
28733
+ "output_cost_per_token": 4.5e-06,
28734
+ "litellm_provider": "zai",
28735
+ "max_input_tokens": 128000,
28736
+ "max_output_tokens": 32000,
28737
+ "mode": "chat",
28738
+ "supports_function_calling": true,
28739
+ "supports_tool_choice": true,
28740
+ "source": "https://docs.z.ai/guides/overview/pricing"
28741
+ },
28742
+ "zai/glm-4-32b-0414-128k": {
28743
+ "input_cost_per_token": 1e-07,
28744
+ "output_cost_per_token": 1e-07,
28745
+ "litellm_provider": "zai",
28746
+ "max_input_tokens": 128000,
28747
+ "max_output_tokens": 32000,
28748
+ "mode": "chat",
28749
+ "supports_function_calling": true,
28750
+ "supports_tool_choice": true,
28751
+ "source": "https://docs.z.ai/guides/overview/pricing"
28752
+ },
28753
+ "zai/glm-4.5-flash": {
28754
+ "input_cost_per_token": 0,
28755
+ "output_cost_per_token": 0,
28756
+ "litellm_provider": "zai",
28757
+ "max_input_tokens": 128000,
28758
+ "max_output_tokens": 32000,
28759
+ "mode": "chat",
28760
+ "supports_function_calling": true,
28761
+ "supports_tool_choice": true,
28762
+ "source": "https://docs.z.ai/guides/overview/pricing"
28763
+ },
28764
+ "amazon.nova-2-lite-v1:0": {
28765
+ "input_cost_per_token": 3e-07,
28766
+ "litellm_provider": "bedrock_converse",
28767
+ "max_input_tokens": 1000000,
28768
+ "max_output_tokens": 64000,
28769
+ "max_tokens": 64000,
28770
+ "mode": "chat",
28771
+ "output_cost_per_token": 2.5e-06,
28772
+ "supports_function_calling": true,
28773
+ "supports_pdf_input": true,
28774
+ "supports_prompt_caching": true,
28775
+ "supports_reasoning": true,
28776
+ "supports_response_schema": true,
28777
+ "supports_video_input": true,
28778
+ "supports_vision": true
28779
+ },
28780
+ "apac.amazon.nova-2-lite-v1:0": {
28781
+ "input_cost_per_token": 6e-08,
28782
+ "litellm_provider": "bedrock_converse",
28783
+ "max_input_tokens": 1000000,
28784
+ "max_output_tokens": 64000,
28785
+ "max_tokens": 64000,
28786
+ "mode": "chat",
28787
+ "output_cost_per_token": 2.75e-06,
28788
+ "supports_function_calling": true,
28789
+ "supports_pdf_input": true,
28790
+ "supports_prompt_caching": true,
28791
+ "supports_reasoning": true,
28792
+ "supports_response_schema": true,
28793
+ "supports_video_input": true,
28794
+ "supports_vision": true
28795
+ },
28796
+ "eu.amazon.nova-2-lite-v1:0": {
28797
+ "input_cost_per_token": 6e-08,
28798
+ "litellm_provider": "bedrock_converse",
28799
+ "max_input_tokens": 1000000,
28800
+ "max_output_tokens": 64000,
28801
+ "max_tokens": 64000,
28802
+ "mode": "chat",
28803
+ "output_cost_per_token": 2.75e-06,
28804
+ "supports_function_calling": true,
28805
+ "supports_pdf_input": true,
28806
+ "supports_prompt_caching": true,
28807
+ "supports_reasoning": true,
28808
+ "supports_response_schema": true,
28809
+ "supports_video_input": true,
28810
+ "supports_vision": true
28811
+ },
28812
+ "us.amazon.nova-2-lite-v1:0": {
28813
+ "input_cost_per_token": 6e-08,
28814
+ "litellm_provider": "bedrock_converse",
28815
+ "max_input_tokens": 1000000,
28816
+ "max_output_tokens": 64000,
28817
+ "max_tokens": 64000,
28818
+ "mode": "chat",
28819
+ "output_cost_per_token": 2.75e-06,
28820
+ "supports_function_calling": true,
28821
+ "supports_pdf_input": true,
28822
+ "supports_prompt_caching": true,
28823
+ "supports_reasoning": true,
28824
+ "supports_response_schema": true,
28825
+ "supports_video_input": true,
28826
+ "supports_vision": true
28827
+ },
28828
+ "deepseek/deepseek-v3.2": {
28829
+ "input_cost_per_token": 2.8e-07,
28830
+ "input_cost_per_token_cache_hit": 2.8e-08,
28831
+ "litellm_provider": "deepseek",
28832
+ "max_input_tokens": 163840,
28833
+ "max_output_tokens": 163840,
28834
+ "max_tokens": 8192,
28835
+ "mode": "chat",
28836
+ "output_cost_per_token": 4e-07,
28837
+ "supports_assistant_prefill": true,
28838
+ "supports_function_calling": true,
28839
+ "supports_prompt_caching": true,
28840
+ "supports_reasoning": true,
28841
+ "supports_tool_choice": true
28842
+ },
28843
+ "ft:gpt-4.1-2025-04-14": {
28844
+ "cache_read_input_token_cost": 7.5e-07,
28845
+ "input_cost_per_token": 3e-06,
28846
+ "input_cost_per_token_batches": 1.5e-06,
28847
+ "litellm_provider": "openai",
28848
+ "max_input_tokens": 1047576,
28849
+ "max_output_tokens": 32768,
28850
+ "max_tokens": 32768,
28851
+ "mode": "chat",
28852
+ "output_cost_per_token": 1.2e-05,
28853
+ "output_cost_per_token_batches": 6e-06,
28854
+ "supports_function_calling": true,
28855
+ "supports_parallel_function_calling": true,
28856
+ "supports_prompt_caching": true,
28857
+ "supports_response_schema": true,
28858
+ "supports_system_messages": true,
28859
+ "supports_tool_choice": true
28860
+ },
28861
+ "ft:gpt-4.1-mini-2025-04-14": {
28862
+ "cache_read_input_token_cost": 2e-07,
28863
+ "input_cost_per_token": 8e-07,
28864
+ "input_cost_per_token_batches": 4e-07,
28865
+ "litellm_provider": "openai",
28866
+ "max_input_tokens": 1047576,
28867
+ "max_output_tokens": 32768,
28868
+ "max_tokens": 32768,
28869
+ "mode": "chat",
28870
+ "output_cost_per_token": 3.2e-06,
28871
+ "output_cost_per_token_batches": 1.6e-06,
28872
+ "supports_function_calling": true,
28873
+ "supports_parallel_function_calling": true,
28874
+ "supports_prompt_caching": true,
28875
+ "supports_response_schema": true,
28876
+ "supports_system_messages": true,
28877
+ "supports_tool_choice": true
28878
+ },
28879
+ "ft:gpt-4.1-nano-2025-04-14": {
28880
+ "cache_read_input_token_cost": 5e-08,
28881
+ "input_cost_per_token": 2e-07,
28882
+ "input_cost_per_token_batches": 1e-07,
28883
+ "litellm_provider": "openai",
28884
+ "max_input_tokens": 1047576,
28885
+ "max_output_tokens": 32768,
28886
+ "max_tokens": 32768,
28887
+ "mode": "chat",
28888
+ "output_cost_per_token": 8e-07,
28889
+ "output_cost_per_token_batches": 4e-07,
28890
+ "supports_function_calling": true,
28891
+ "supports_parallel_function_calling": true,
28892
+ "supports_prompt_caching": true,
28893
+ "supports_response_schema": true,
28894
+ "supports_system_messages": true,
28895
+ "supports_tool_choice": true
28896
+ },
28897
+ "ft:o4-mini-2025-04-16": {
28898
+ "cache_read_input_token_cost": 1e-06,
28899
+ "input_cost_per_token": 4e-06,
28900
+ "input_cost_per_token_batches": 2e-06,
28901
+ "litellm_provider": "openai",
28902
+ "max_input_tokens": 200000,
28903
+ "max_output_tokens": 100000,
28904
+ "max_tokens": 100000,
28905
+ "mode": "chat",
28906
+ "output_cost_per_token": 1.6e-05,
28907
+ "output_cost_per_token_batches": 8e-06,
28908
+ "supports_function_calling": true,
28909
+ "supports_parallel_function_calling": false,
28910
+ "supports_prompt_caching": true,
28911
+ "supports_reasoning": true,
28912
+ "supports_response_schema": true,
28913
+ "supports_tool_choice": true
28914
+ },
28915
+ "openrouter/deepseek/deepseek-v3.2": {
28916
+ "input_cost_per_token": 2.8e-07,
28917
+ "input_cost_per_token_cache_hit": 2.8e-08,
28918
+ "litellm_provider": "openrouter",
28919
+ "max_input_tokens": 163840,
28920
+ "max_output_tokens": 163840,
28921
+ "max_tokens": 8192,
28922
+ "mode": "chat",
28923
+ "output_cost_per_token": 4e-07,
28924
+ "supports_assistant_prefill": true,
28925
+ "supports_function_calling": true,
28926
+ "supports_prompt_caching": true,
28927
+ "supports_reasoning": true,
28928
+ "supports_tool_choice": true
28929
+ },
28930
+ "global.anthropic.claude-opus-4-5-20251101-v1:0": {
28931
+ "cache_creation_input_token_cost": 6.25e-06,
28932
+ "cache_read_input_token_cost": 5e-07,
28933
+ "input_cost_per_token": 5e-06,
28934
+ "litellm_provider": "bedrock_converse",
28935
+ "max_input_tokens": 200000,
28936
+ "max_output_tokens": 64000,
28937
+ "max_tokens": 64000,
28938
+ "mode": "chat",
28939
+ "output_cost_per_token": 2.5e-05,
28940
+ "search_context_cost_per_query": {
28941
+ "search_context_size_high": 0.01,
28942
+ "search_context_size_low": 0.01,
28943
+ "search_context_size_medium": 0.01
28944
+ },
28945
+ "supports_assistant_prefill": true,
28946
+ "supports_computer_use": true,
28947
+ "supports_function_calling": true,
28948
+ "supports_pdf_input": true,
28949
+ "supports_prompt_caching": true,
28950
+ "supports_reasoning": true,
28951
+ "supports_response_schema": true,
28952
+ "supports_tool_choice": true,
28953
+ "supports_vision": true,
28954
+ "tool_use_system_prompt_tokens": 159
28338
28955
  }
28339
28956
  }
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: tokencostauto
3
- Version: 0.1.376
3
+ Version: 0.1.380
4
4
  Summary: To calculate token and translated USD cost of string and message calls to OpenAI, for example when used by AI agents
5
5
  Author-email: Trisha Pan <trishaepan@gmail.com>, Alex Reibman <areibman@gmail.com>, Pratyush Shukla <ps4534@nyu.edu>, Thiago MadPin <madpin@gmail.com>
6
6
  Project-URL: Homepage, https://github.com/madpin/tokencostaudo
@@ -0,0 +1,9 @@
1
+ tokencostauto/__init__.py,sha256=-4d_ryFH62SgNXPXA8vGPFZoAKtOBjnsg37EB_RkZG8,289
2
+ tokencostauto/constants.py,sha256=_82MlTkTrdrwzyRosQD7d3JdgNP9KAUM-cZo8DE00P0,3395
3
+ tokencostauto/costs.py,sha256=tXsgrTypq-dCHaHtoXcg2XepezWsAvZpl9gEsv_53iE,10679
4
+ tokencostauto/model_prices.json,sha256=GQo71l4_B2fpRWiZG4LAsezobw-GzGLfU87ZiJ1NKbA,1032350
5
+ tokencostauto-0.1.380.dist-info/licenses/LICENSE,sha256=4PLv_CD6Ughnsvg_nM2XeTqGwVK6lQVR77kVWbPq-0U,1065
6
+ tokencostauto-0.1.380.dist-info/METADATA,sha256=92Bcw6am7Ru01cYZY5rvk444pTP3bl0nCg8eyqL2vtk,204076
7
+ tokencostauto-0.1.380.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
8
+ tokencostauto-0.1.380.dist-info/top_level.txt,sha256=szZQTUJRotfIaeZCDsOgvofIkLt2ak88RP13oI51-TU,14
9
+ tokencostauto-0.1.380.dist-info/RECORD,,
@@ -1,9 +0,0 @@
1
- tokencostauto/__init__.py,sha256=-4d_ryFH62SgNXPXA8vGPFZoAKtOBjnsg37EB_RkZG8,289
2
- tokencostauto/constants.py,sha256=_82MlTkTrdrwzyRosQD7d3JdgNP9KAUM-cZo8DE00P0,3395
3
- tokencostauto/costs.py,sha256=tXsgrTypq-dCHaHtoXcg2XepezWsAvZpl9gEsv_53iE,10679
4
- tokencostauto/model_prices.json,sha256=ppcRA-03vZZBhzFyGsxg97rrHiitQmiQI38LHlTNX5A,1006772
5
- tokencostauto-0.1.376.dist-info/licenses/LICENSE,sha256=4PLv_CD6Ughnsvg_nM2XeTqGwVK6lQVR77kVWbPq-0U,1065
6
- tokencostauto-0.1.376.dist-info/METADATA,sha256=bvFO8RvysChQTCXeFlqeo75XRwE6caFjJWA07-Fx670,204076
7
- tokencostauto-0.1.376.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
8
- tokencostauto-0.1.376.dist-info/top_level.txt,sha256=szZQTUJRotfIaeZCDsOgvofIkLt2ak88RP13oI51-TU,14
9
- tokencostauto-0.1.376.dist-info/RECORD,,