tokencostauto 0.1.376__py3-none-any.whl → 0.1.378__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- tokencostauto/model_prices.json +448 -23
- {tokencostauto-0.1.376.dist-info → tokencostauto-0.1.378.dist-info}/METADATA +1 -1
- tokencostauto-0.1.378.dist-info/RECORD +9 -0
- tokencostauto-0.1.376.dist-info/RECORD +0 -9
- {tokencostauto-0.1.376.dist-info → tokencostauto-0.1.378.dist-info}/WHEEL +0 -0
- {tokencostauto-0.1.376.dist-info → tokencostauto-0.1.378.dist-info}/licenses/LICENSE +0 -0
- {tokencostauto-0.1.376.dist-info → tokencostauto-0.1.378.dist-info}/top_level.txt +0 -0
tokencostauto/model_prices.json
CHANGED
|
@@ -7234,7 +7234,7 @@
|
|
|
7234
7234
|
"output_cost_per_token": 0.0
|
|
7235
7235
|
},
|
|
7236
7236
|
"databricks/databricks-meta-llama-3-1-405b-instruct": {
|
|
7237
|
-
"input_cost_per_token":
|
|
7237
|
+
"input_cost_per_token": 5.00003e-06,
|
|
7238
7238
|
"input_dbu_cost_per_token": 7.1429e-05,
|
|
7239
7239
|
"litellm_provider": "databricks",
|
|
7240
7240
|
"max_input_tokens": 128000,
|
|
@@ -7244,8 +7244,8 @@
|
|
|
7244
7244
|
"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
7245
7245
|
},
|
|
7246
7246
|
"mode": "chat",
|
|
7247
|
-
"output_cost_per_token": 1.
|
|
7248
|
-
"
|
|
7247
|
+
"output_cost_per_token": 1.5000020000000002e-05,
|
|
7248
|
+
"output_dbu_cost_per_token": 0.000214286,
|
|
7249
7249
|
"source": "https://www.databricks.com/product/pricing/foundation-model-serving",
|
|
7250
7250
|
"supports_tool_choice": true
|
|
7251
7251
|
},
|
|
@@ -7292,7 +7292,7 @@
|
|
|
7292
7292
|
"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
7293
7293
|
},
|
|
7294
7294
|
"mode": "chat",
|
|
7295
|
-
"output_cost_per_token": 2.
|
|
7295
|
+
"output_cost_per_token": 2.9999900000000002e-06,
|
|
7296
7296
|
"output_dbu_cost_per_token": 4.2857e-05,
|
|
7297
7297
|
"source": "https://www.databricks.com/product/pricing/foundation-model-serving",
|
|
7298
7298
|
"supports_tool_choice": true
|
|
@@ -7308,7 +7308,7 @@
|
|
|
7308
7308
|
"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
7309
7309
|
},
|
|
7310
7310
|
"mode": "chat",
|
|
7311
|
-
"output_cost_per_token": 1.
|
|
7311
|
+
"output_cost_per_token": 1.5000300000000002e-06,
|
|
7312
7312
|
"output_dbu_cost_per_token": 2.1429e-05,
|
|
7313
7313
|
"source": "https://www.databricks.com/product/pricing/foundation-model-serving",
|
|
7314
7314
|
"supports_tool_choice": true
|
|
@@ -7324,13 +7324,13 @@
|
|
|
7324
7324
|
"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
7325
7325
|
},
|
|
7326
7326
|
"mode": "chat",
|
|
7327
|
-
"output_cost_per_token":
|
|
7327
|
+
"output_cost_per_token": 1.00002e-06,
|
|
7328
7328
|
"output_dbu_cost_per_token": 1.4286e-05,
|
|
7329
7329
|
"source": "https://www.databricks.com/product/pricing/foundation-model-serving",
|
|
7330
7330
|
"supports_tool_choice": true
|
|
7331
7331
|
},
|
|
7332
7332
|
"databricks/databricks-mpt-30b-instruct": {
|
|
7333
|
-
"input_cost_per_token":
|
|
7333
|
+
"input_cost_per_token": 1.00002e-06,
|
|
7334
7334
|
"input_dbu_cost_per_token": 1.4286e-05,
|
|
7335
7335
|
"litellm_provider": "databricks",
|
|
7336
7336
|
"max_input_tokens": 8192,
|
|
@@ -7340,7 +7340,7 @@
|
|
|
7340
7340
|
"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
7341
7341
|
},
|
|
7342
7342
|
"mode": "chat",
|
|
7343
|
-
"output_cost_per_token":
|
|
7343
|
+
"output_cost_per_token": 1.00002e-06,
|
|
7344
7344
|
"output_dbu_cost_per_token": 1.4286e-05,
|
|
7345
7345
|
"source": "https://www.databricks.com/product/pricing/foundation-model-serving",
|
|
7346
7346
|
"supports_tool_choice": true
|
|
@@ -7377,7 +7377,7 @@
|
|
|
7377
7377
|
"source": "https://www.databricks.com/product/pricing/foundation-model-serving"
|
|
7378
7378
|
},
|
|
7379
7379
|
"databricks/databricks-gte-large-en": {
|
|
7380
|
-
"input_cost_per_token": 1.
|
|
7380
|
+
"input_cost_per_token": 1.2999000000000001e-07,
|
|
7381
7381
|
"input_dbu_cost_per_token": 1.857e-06,
|
|
7382
7382
|
"litellm_provider": "databricks",
|
|
7383
7383
|
"max_input_tokens": 8192,
|
|
@@ -13185,27 +13185,27 @@
|
|
|
13185
13185
|
"output_cost_per_token": 9e-07
|
|
13186
13186
|
},
|
|
13187
13187
|
"databricks/databricks-claude-3-7-sonnet": {
|
|
13188
|
-
"input_cost_per_token": 2.
|
|
13189
|
-
"input_dbu_cost_per_token":
|
|
13188
|
+
"input_cost_per_token": 2.9999900000000002e-06,
|
|
13189
|
+
"input_dbu_cost_per_token": 4.2857e-05,
|
|
13190
13190
|
"litellm_provider": "databricks",
|
|
13191
13191
|
"max_input_tokens": 200000,
|
|
13192
13192
|
"max_output_tokens": 128000,
|
|
13193
13193
|
"max_tokens": 200000,
|
|
13194
13194
|
"metadata": {
|
|
13195
|
-
"notes": "Input/output cost per token is dbu cost * $0.070
|
|
13195
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
13196
13196
|
},
|
|
13197
13197
|
"mode": "chat",
|
|
13198
|
-
"output_cost_per_token": 1.
|
|
13199
|
-
"
|
|
13200
|
-
"source": "https://www.databricks.com/product/pricing/foundation-model-serving",
|
|
13198
|
+
"output_cost_per_token": 1.5000020000000002e-05,
|
|
13199
|
+
"output_dbu_cost_per_token": 0.000214286,
|
|
13200
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
13201
13201
|
"supports_assistant_prefill": true,
|
|
13202
13202
|
"supports_function_calling": true,
|
|
13203
13203
|
"supports_reasoning": true,
|
|
13204
13204
|
"supports_tool_choice": true
|
|
13205
13205
|
},
|
|
13206
13206
|
"databricks/databricks-meta-llama-3-3-70b-instruct": {
|
|
13207
|
-
"input_cost_per_token":
|
|
13208
|
-
"input_dbu_cost_per_token":
|
|
13207
|
+
"input_cost_per_token": 5.0001e-07,
|
|
13208
|
+
"input_dbu_cost_per_token": 7.143e-06,
|
|
13209
13209
|
"litellm_provider": "databricks",
|
|
13210
13210
|
"max_input_tokens": 128000,
|
|
13211
13211
|
"max_output_tokens": 128000,
|
|
@@ -13214,8 +13214,8 @@
|
|
|
13214
13214
|
"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
13215
13215
|
},
|
|
13216
13216
|
"mode": "chat",
|
|
13217
|
-
"output_cost_per_token":
|
|
13218
|
-
"output_dbu_cost_per_token":
|
|
13217
|
+
"output_cost_per_token": 1.5000300000000002e-06,
|
|
13218
|
+
"output_dbu_cost_per_token": 2.1429e-05,
|
|
13219
13219
|
"source": "https://www.databricks.com/product/pricing/foundation-model-serving",
|
|
13220
13220
|
"supports_tool_choice": true
|
|
13221
13221
|
},
|
|
@@ -14261,8 +14261,8 @@
|
|
|
14261
14261
|
"tool_use_system_prompt_tokens": 159
|
|
14262
14262
|
},
|
|
14263
14263
|
"databricks/databricks-llama-4-maverick": {
|
|
14264
|
-
"input_cost_per_token":
|
|
14265
|
-
"input_dbu_cost_per_token": 7.143e-
|
|
14264
|
+
"input_cost_per_token": 5.0001e-07,
|
|
14265
|
+
"input_dbu_cost_per_token": 7.143e-06,
|
|
14266
14266
|
"litellm_provider": "databricks",
|
|
14267
14267
|
"max_input_tokens": 128000,
|
|
14268
14268
|
"max_output_tokens": 128000,
|
|
@@ -14271,8 +14271,8 @@
|
|
|
14271
14271
|
"notes": "Databricks documentation now provides both DBU costs (_dbu_cost_per_token) and dollar costs(_cost_per_token)."
|
|
14272
14272
|
},
|
|
14273
14273
|
"mode": "chat",
|
|
14274
|
-
"output_cost_per_token": 1.
|
|
14275
|
-
"output_dbu_cost_per_token":
|
|
14274
|
+
"output_cost_per_token": 1.5000300000000002e-06,
|
|
14275
|
+
"output_dbu_cost_per_token": 2.1429e-05,
|
|
14276
14276
|
"source": "https://www.databricks.com/product/pricing/foundation-model-serving",
|
|
14277
14277
|
"supports_tool_choice": true
|
|
14278
14278
|
},
|
|
@@ -28335,5 +28335,430 @@
|
|
|
28335
28335
|
"supports_function_calling": true,
|
|
28336
28336
|
"supports_response_schema": true,
|
|
28337
28337
|
"supports_tool_choice": true
|
|
28338
|
+
},
|
|
28339
|
+
"claude-opus-4-5": {
|
|
28340
|
+
"cache_creation_input_token_cost": 6.25e-06,
|
|
28341
|
+
"cache_creation_input_token_cost_above_1hr": 1e-05,
|
|
28342
|
+
"cache_read_input_token_cost": 5e-07,
|
|
28343
|
+
"input_cost_per_token": 5e-06,
|
|
28344
|
+
"litellm_provider": "anthropic",
|
|
28345
|
+
"max_input_tokens": 200000,
|
|
28346
|
+
"max_output_tokens": 64000,
|
|
28347
|
+
"max_tokens": 64000,
|
|
28348
|
+
"mode": "chat",
|
|
28349
|
+
"output_cost_per_token": 2.5e-05,
|
|
28350
|
+
"search_context_cost_per_query": {
|
|
28351
|
+
"search_context_size_high": 0.01,
|
|
28352
|
+
"search_context_size_low": 0.01,
|
|
28353
|
+
"search_context_size_medium": 0.01
|
|
28354
|
+
},
|
|
28355
|
+
"supports_assistant_prefill": true,
|
|
28356
|
+
"supports_computer_use": true,
|
|
28357
|
+
"supports_function_calling": true,
|
|
28358
|
+
"supports_pdf_input": true,
|
|
28359
|
+
"supports_prompt_caching": true,
|
|
28360
|
+
"supports_reasoning": true,
|
|
28361
|
+
"supports_response_schema": true,
|
|
28362
|
+
"supports_tool_choice": true,
|
|
28363
|
+
"supports_vision": true,
|
|
28364
|
+
"tool_use_system_prompt_tokens": 159
|
|
28365
|
+
},
|
|
28366
|
+
"databricks/databricks-claude-haiku-4-5": {
|
|
28367
|
+
"input_cost_per_token": 1.00002e-06,
|
|
28368
|
+
"input_dbu_cost_per_token": 1.4286e-05,
|
|
28369
|
+
"litellm_provider": "databricks",
|
|
28370
|
+
"max_input_tokens": 200000,
|
|
28371
|
+
"max_output_tokens": 64000,
|
|
28372
|
+
"max_tokens": 200000,
|
|
28373
|
+
"metadata": {
|
|
28374
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28375
|
+
},
|
|
28376
|
+
"mode": "chat",
|
|
28377
|
+
"output_cost_per_token": 5.00003e-06,
|
|
28378
|
+
"output_dbu_cost_per_token": 7.1429e-05,
|
|
28379
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
28380
|
+
"supports_assistant_prefill": true,
|
|
28381
|
+
"supports_function_calling": true,
|
|
28382
|
+
"supports_reasoning": true,
|
|
28383
|
+
"supports_tool_choice": true
|
|
28384
|
+
},
|
|
28385
|
+
"databricks/databricks-claude-opus-4": {
|
|
28386
|
+
"input_cost_per_token": 1.5000020000000002e-05,
|
|
28387
|
+
"input_dbu_cost_per_token": 0.000214286,
|
|
28388
|
+
"litellm_provider": "databricks",
|
|
28389
|
+
"max_input_tokens": 200000,
|
|
28390
|
+
"max_output_tokens": 32000,
|
|
28391
|
+
"max_tokens": 200000,
|
|
28392
|
+
"metadata": {
|
|
28393
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28394
|
+
},
|
|
28395
|
+
"mode": "chat",
|
|
28396
|
+
"output_cost_per_token": 7.500003000000001e-05,
|
|
28397
|
+
"output_dbu_cost_per_token": 0.001071429,
|
|
28398
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
28399
|
+
"supports_assistant_prefill": true,
|
|
28400
|
+
"supports_function_calling": true,
|
|
28401
|
+
"supports_reasoning": true,
|
|
28402
|
+
"supports_tool_choice": true
|
|
28403
|
+
},
|
|
28404
|
+
"databricks/databricks-claude-opus-4-1": {
|
|
28405
|
+
"input_cost_per_token": 1.5000020000000002e-05,
|
|
28406
|
+
"input_dbu_cost_per_token": 0.000214286,
|
|
28407
|
+
"litellm_provider": "databricks",
|
|
28408
|
+
"max_input_tokens": 200000,
|
|
28409
|
+
"max_output_tokens": 32000,
|
|
28410
|
+
"max_tokens": 200000,
|
|
28411
|
+
"metadata": {
|
|
28412
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28413
|
+
},
|
|
28414
|
+
"mode": "chat",
|
|
28415
|
+
"output_cost_per_token": 7.500003000000001e-05,
|
|
28416
|
+
"output_dbu_cost_per_token": 0.001071429,
|
|
28417
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
28418
|
+
"supports_assistant_prefill": true,
|
|
28419
|
+
"supports_function_calling": true,
|
|
28420
|
+
"supports_reasoning": true,
|
|
28421
|
+
"supports_tool_choice": true
|
|
28422
|
+
},
|
|
28423
|
+
"databricks/databricks-claude-opus-4-5": {
|
|
28424
|
+
"input_cost_per_token": 5.00003e-06,
|
|
28425
|
+
"input_dbu_cost_per_token": 7.1429e-05,
|
|
28426
|
+
"litellm_provider": "databricks",
|
|
28427
|
+
"max_input_tokens": 200000,
|
|
28428
|
+
"max_output_tokens": 64000,
|
|
28429
|
+
"max_tokens": 200000,
|
|
28430
|
+
"metadata": {
|
|
28431
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28432
|
+
},
|
|
28433
|
+
"mode": "chat",
|
|
28434
|
+
"output_cost_per_token": 2.5000010000000002e-05,
|
|
28435
|
+
"output_dbu_cost_per_token": 0.000357143,
|
|
28436
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
28437
|
+
"supports_assistant_prefill": true,
|
|
28438
|
+
"supports_function_calling": true,
|
|
28439
|
+
"supports_reasoning": true,
|
|
28440
|
+
"supports_tool_choice": true
|
|
28441
|
+
},
|
|
28442
|
+
"databricks/databricks-claude-sonnet-4": {
|
|
28443
|
+
"input_cost_per_token": 2.9999900000000002e-06,
|
|
28444
|
+
"input_dbu_cost_per_token": 4.2857e-05,
|
|
28445
|
+
"litellm_provider": "databricks",
|
|
28446
|
+
"max_input_tokens": 200000,
|
|
28447
|
+
"max_output_tokens": 64000,
|
|
28448
|
+
"max_tokens": 200000,
|
|
28449
|
+
"metadata": {
|
|
28450
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28451
|
+
},
|
|
28452
|
+
"mode": "chat",
|
|
28453
|
+
"output_cost_per_token": 1.5000020000000002e-05,
|
|
28454
|
+
"output_dbu_cost_per_token": 0.000214286,
|
|
28455
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
28456
|
+
"supports_assistant_prefill": true,
|
|
28457
|
+
"supports_function_calling": true,
|
|
28458
|
+
"supports_reasoning": true,
|
|
28459
|
+
"supports_tool_choice": true
|
|
28460
|
+
},
|
|
28461
|
+
"databricks/databricks-claude-sonnet-4-1": {
|
|
28462
|
+
"input_cost_per_token": 2.9999900000000002e-06,
|
|
28463
|
+
"input_dbu_cost_per_token": 4.2857e-05,
|
|
28464
|
+
"litellm_provider": "databricks",
|
|
28465
|
+
"max_input_tokens": 200000,
|
|
28466
|
+
"max_output_tokens": 64000,
|
|
28467
|
+
"max_tokens": 200000,
|
|
28468
|
+
"metadata": {
|
|
28469
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28470
|
+
},
|
|
28471
|
+
"mode": "chat",
|
|
28472
|
+
"output_cost_per_token": 1.5000020000000002e-05,
|
|
28473
|
+
"output_dbu_cost_per_token": 0.000214286,
|
|
28474
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
28475
|
+
"supports_assistant_prefill": true,
|
|
28476
|
+
"supports_function_calling": true,
|
|
28477
|
+
"supports_reasoning": true,
|
|
28478
|
+
"supports_tool_choice": true
|
|
28479
|
+
},
|
|
28480
|
+
"databricks/databricks-claude-sonnet-4-5": {
|
|
28481
|
+
"input_cost_per_token": 2.9999900000000002e-06,
|
|
28482
|
+
"input_dbu_cost_per_token": 4.2857e-05,
|
|
28483
|
+
"litellm_provider": "databricks",
|
|
28484
|
+
"max_input_tokens": 200000,
|
|
28485
|
+
"max_output_tokens": 64000,
|
|
28486
|
+
"max_tokens": 200000,
|
|
28487
|
+
"metadata": {
|
|
28488
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28489
|
+
},
|
|
28490
|
+
"mode": "chat",
|
|
28491
|
+
"output_cost_per_token": 1.5000020000000002e-05,
|
|
28492
|
+
"output_dbu_cost_per_token": 0.000214286,
|
|
28493
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
28494
|
+
"supports_assistant_prefill": true,
|
|
28495
|
+
"supports_function_calling": true,
|
|
28496
|
+
"supports_reasoning": true,
|
|
28497
|
+
"supports_tool_choice": true
|
|
28498
|
+
},
|
|
28499
|
+
"databricks/databricks-gemini-2-5-flash": {
|
|
28500
|
+
"input_cost_per_token": 3.0001999999999996e-07,
|
|
28501
|
+
"input_dbu_cost_per_token": 4.285999999999999e-06,
|
|
28502
|
+
"litellm_provider": "databricks",
|
|
28503
|
+
"max_input_tokens": 1048576,
|
|
28504
|
+
"max_output_tokens": 65535,
|
|
28505
|
+
"max_tokens": 1048576,
|
|
28506
|
+
"metadata": {
|
|
28507
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28508
|
+
},
|
|
28509
|
+
"mode": "chat",
|
|
28510
|
+
"output_cost_per_token": 2.49998e-06,
|
|
28511
|
+
"output_dbu_cost_per_token": 3.5714e-05,
|
|
28512
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
28513
|
+
"supports_function_calling": true,
|
|
28514
|
+
"supports_tool_choice": true
|
|
28515
|
+
},
|
|
28516
|
+
"databricks/databricks-gemini-2-5-pro": {
|
|
28517
|
+
"input_cost_per_token": 1.24999e-06,
|
|
28518
|
+
"input_dbu_cost_per_token": 1.7857e-05,
|
|
28519
|
+
"litellm_provider": "databricks",
|
|
28520
|
+
"max_input_tokens": 1048576,
|
|
28521
|
+
"max_output_tokens": 65536,
|
|
28522
|
+
"max_tokens": 1048576,
|
|
28523
|
+
"metadata": {
|
|
28524
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28525
|
+
},
|
|
28526
|
+
"mode": "chat",
|
|
28527
|
+
"output_cost_per_token": 9.999990000000002e-06,
|
|
28528
|
+
"output_dbu_cost_per_token": 0.000142857,
|
|
28529
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving",
|
|
28530
|
+
"supports_function_calling": true,
|
|
28531
|
+
"supports_tool_choice": true
|
|
28532
|
+
},
|
|
28533
|
+
"databricks/databricks-gemma-3-12b": {
|
|
28534
|
+
"input_cost_per_token": 1.5000999999999998e-07,
|
|
28535
|
+
"input_dbu_cost_per_token": 2.1429999999999996e-06,
|
|
28536
|
+
"litellm_provider": "databricks",
|
|
28537
|
+
"max_input_tokens": 128000,
|
|
28538
|
+
"max_output_tokens": 32000,
|
|
28539
|
+
"max_tokens": 128000,
|
|
28540
|
+
"metadata": {
|
|
28541
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28542
|
+
},
|
|
28543
|
+
"mode": "chat",
|
|
28544
|
+
"output_cost_per_token": 5.0001e-07,
|
|
28545
|
+
"output_dbu_cost_per_token": 7.143e-06,
|
|
28546
|
+
"source": "https://www.databricks.com/product/pricing/foundation-model-serving"
|
|
28547
|
+
},
|
|
28548
|
+
"databricks/databricks-gpt-5": {
|
|
28549
|
+
"input_cost_per_token": 1.24999e-06,
|
|
28550
|
+
"input_dbu_cost_per_token": 1.7857e-05,
|
|
28551
|
+
"litellm_provider": "databricks",
|
|
28552
|
+
"max_input_tokens": 400000,
|
|
28553
|
+
"max_output_tokens": 128000,
|
|
28554
|
+
"max_tokens": 400000,
|
|
28555
|
+
"metadata": {
|
|
28556
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28557
|
+
},
|
|
28558
|
+
"mode": "chat",
|
|
28559
|
+
"output_cost_per_token": 9.999990000000002e-06,
|
|
28560
|
+
"output_dbu_cost_per_token": 0.000142857,
|
|
28561
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving"
|
|
28562
|
+
},
|
|
28563
|
+
"databricks/databricks-gpt-5-1": {
|
|
28564
|
+
"input_cost_per_token": 1.24999e-06,
|
|
28565
|
+
"input_dbu_cost_per_token": 1.7857e-05,
|
|
28566
|
+
"litellm_provider": "databricks",
|
|
28567
|
+
"max_input_tokens": 400000,
|
|
28568
|
+
"max_output_tokens": 128000,
|
|
28569
|
+
"max_tokens": 400000,
|
|
28570
|
+
"metadata": {
|
|
28571
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28572
|
+
},
|
|
28573
|
+
"mode": "chat",
|
|
28574
|
+
"output_cost_per_token": 9.999990000000002e-06,
|
|
28575
|
+
"output_dbu_cost_per_token": 0.000142857,
|
|
28576
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving"
|
|
28577
|
+
},
|
|
28578
|
+
"databricks/databricks-gpt-5-mini": {
|
|
28579
|
+
"input_cost_per_token": 2.4997000000000006e-07,
|
|
28580
|
+
"input_dbu_cost_per_token": 3.571e-06,
|
|
28581
|
+
"litellm_provider": "databricks",
|
|
28582
|
+
"max_input_tokens": 400000,
|
|
28583
|
+
"max_output_tokens": 128000,
|
|
28584
|
+
"max_tokens": 400000,
|
|
28585
|
+
"metadata": {
|
|
28586
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28587
|
+
},
|
|
28588
|
+
"mode": "chat",
|
|
28589
|
+
"output_cost_per_token": 1.9999700000000004e-06,
|
|
28590
|
+
"output_dbu_cost_per_token": 2.8571e-05,
|
|
28591
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving"
|
|
28592
|
+
},
|
|
28593
|
+
"databricks/databricks-gpt-5-nano": {
|
|
28594
|
+
"input_cost_per_token": 4.998e-08,
|
|
28595
|
+
"input_dbu_cost_per_token": 7.14e-07,
|
|
28596
|
+
"litellm_provider": "databricks",
|
|
28597
|
+
"max_input_tokens": 400000,
|
|
28598
|
+
"max_output_tokens": 128000,
|
|
28599
|
+
"max_tokens": 400000,
|
|
28600
|
+
"metadata": {
|
|
28601
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28602
|
+
},
|
|
28603
|
+
"mode": "chat",
|
|
28604
|
+
"output_cost_per_token": 3.9998000000000007e-07,
|
|
28605
|
+
"output_dbu_cost_per_token": 5.714000000000001e-06,
|
|
28606
|
+
"source": "https://www.databricks.com/product/pricing/proprietary-foundation-model-serving"
|
|
28607
|
+
},
|
|
28608
|
+
"databricks/databricks-gpt-oss-120b": {
|
|
28609
|
+
"input_cost_per_token": 1.5000999999999998e-07,
|
|
28610
|
+
"input_dbu_cost_per_token": 2.1429999999999996e-06,
|
|
28611
|
+
"litellm_provider": "databricks",
|
|
28612
|
+
"max_input_tokens": 131072,
|
|
28613
|
+
"max_output_tokens": 131072,
|
|
28614
|
+
"max_tokens": 131072,
|
|
28615
|
+
"metadata": {
|
|
28616
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28617
|
+
},
|
|
28618
|
+
"mode": "chat",
|
|
28619
|
+
"output_cost_per_token": 5.9997e-07,
|
|
28620
|
+
"output_dbu_cost_per_token": 8.571e-06,
|
|
28621
|
+
"source": "https://www.databricks.com/product/pricing/foundation-model-serving"
|
|
28622
|
+
},
|
|
28623
|
+
"databricks/databricks-gpt-oss-20b": {
|
|
28624
|
+
"input_cost_per_token": 7e-08,
|
|
28625
|
+
"input_dbu_cost_per_token": 1e-06,
|
|
28626
|
+
"litellm_provider": "databricks",
|
|
28627
|
+
"max_input_tokens": 131072,
|
|
28628
|
+
"max_output_tokens": 131072,
|
|
28629
|
+
"max_tokens": 131072,
|
|
28630
|
+
"metadata": {
|
|
28631
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28632
|
+
},
|
|
28633
|
+
"mode": "chat",
|
|
28634
|
+
"output_cost_per_token": 3.0001999999999996e-07,
|
|
28635
|
+
"output_dbu_cost_per_token": 4.285999999999999e-06,
|
|
28636
|
+
"source": "https://www.databricks.com/product/pricing/foundation-model-serving"
|
|
28637
|
+
},
|
|
28638
|
+
"databricks/databricks-meta-llama-3-1-8b-instruct": {
|
|
28639
|
+
"input_cost_per_token": 1.5000999999999998e-07,
|
|
28640
|
+
"input_dbu_cost_per_token": 2.1429999999999996e-06,
|
|
28641
|
+
"litellm_provider": "databricks",
|
|
28642
|
+
"max_input_tokens": 200000,
|
|
28643
|
+
"max_output_tokens": 128000,
|
|
28644
|
+
"max_tokens": 200000,
|
|
28645
|
+
"metadata": {
|
|
28646
|
+
"notes": "Input/output cost per token is dbu cost * $0.070. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."
|
|
28647
|
+
},
|
|
28648
|
+
"mode": "chat",
|
|
28649
|
+
"output_cost_per_token": 4.5003000000000007e-07,
|
|
28650
|
+
"output_dbu_cost_per_token": 6.429000000000001e-06,
|
|
28651
|
+
"source": "https://www.databricks.com/product/pricing/foundation-model-serving"
|
|
28652
|
+
},
|
|
28653
|
+
"fireworks_ai/accounts/fireworks/models/deepseek-v3p2": {
|
|
28654
|
+
"input_cost_per_token": 1.2e-06,
|
|
28655
|
+
"litellm_provider": "fireworks_ai",
|
|
28656
|
+
"max_input_tokens": 163840,
|
|
28657
|
+
"max_output_tokens": 163840,
|
|
28658
|
+
"max_tokens": 163840,
|
|
28659
|
+
"mode": "chat",
|
|
28660
|
+
"output_cost_per_token": 1.2e-06,
|
|
28661
|
+
"source": "https://fireworks.ai/models/fireworks/deepseek-v3p2",
|
|
28662
|
+
"supports_function_calling": true,
|
|
28663
|
+
"supports_response_schema": true,
|
|
28664
|
+
"supports_tool_choice": true
|
|
28665
|
+
},
|
|
28666
|
+
"vertex_ai/chirp": {
|
|
28667
|
+
"input_cost_per_character": 3e-05,
|
|
28668
|
+
"litellm_provider": "vertex_ai",
|
|
28669
|
+
"mode": "audio_speech",
|
|
28670
|
+
"source": "https://cloud.google.com/text-to-speech/pricing",
|
|
28671
|
+
"supported_endpoints": [
|
|
28672
|
+
"/v1/audio/speech"
|
|
28673
|
+
]
|
|
28674
|
+
},
|
|
28675
|
+
"zai/glm-4.6": {
|
|
28676
|
+
"input_cost_per_token": 6e-07,
|
|
28677
|
+
"output_cost_per_token": 2.2e-06,
|
|
28678
|
+
"litellm_provider": "zai",
|
|
28679
|
+
"max_input_tokens": 200000,
|
|
28680
|
+
"max_output_tokens": 128000,
|
|
28681
|
+
"mode": "chat",
|
|
28682
|
+
"supports_function_calling": true,
|
|
28683
|
+
"supports_tool_choice": true,
|
|
28684
|
+
"source": "https://docs.z.ai/guides/overview/pricing"
|
|
28685
|
+
},
|
|
28686
|
+
"zai/glm-4.5": {
|
|
28687
|
+
"input_cost_per_token": 6e-07,
|
|
28688
|
+
"output_cost_per_token": 2.2e-06,
|
|
28689
|
+
"litellm_provider": "zai",
|
|
28690
|
+
"max_input_tokens": 128000,
|
|
28691
|
+
"max_output_tokens": 32000,
|
|
28692
|
+
"mode": "chat",
|
|
28693
|
+
"supports_function_calling": true,
|
|
28694
|
+
"supports_tool_choice": true,
|
|
28695
|
+
"source": "https://docs.z.ai/guides/overview/pricing"
|
|
28696
|
+
},
|
|
28697
|
+
"zai/glm-4.5v": {
|
|
28698
|
+
"input_cost_per_token": 6e-07,
|
|
28699
|
+
"output_cost_per_token": 1.8e-06,
|
|
28700
|
+
"litellm_provider": "zai",
|
|
28701
|
+
"max_input_tokens": 128000,
|
|
28702
|
+
"max_output_tokens": 32000,
|
|
28703
|
+
"mode": "chat",
|
|
28704
|
+
"supports_function_calling": true,
|
|
28705
|
+
"supports_tool_choice": true,
|
|
28706
|
+
"supports_vision": true,
|
|
28707
|
+
"source": "https://docs.z.ai/guides/overview/pricing"
|
|
28708
|
+
},
|
|
28709
|
+
"zai/glm-4.5-x": {
|
|
28710
|
+
"input_cost_per_token": 2.2e-06,
|
|
28711
|
+
"output_cost_per_token": 8.9e-06,
|
|
28712
|
+
"litellm_provider": "zai",
|
|
28713
|
+
"max_input_tokens": 128000,
|
|
28714
|
+
"max_output_tokens": 32000,
|
|
28715
|
+
"mode": "chat",
|
|
28716
|
+
"supports_function_calling": true,
|
|
28717
|
+
"supports_tool_choice": true,
|
|
28718
|
+
"source": "https://docs.z.ai/guides/overview/pricing"
|
|
28719
|
+
},
|
|
28720
|
+
"zai/glm-4.5-air": {
|
|
28721
|
+
"input_cost_per_token": 2e-07,
|
|
28722
|
+
"output_cost_per_token": 1.1e-06,
|
|
28723
|
+
"litellm_provider": "zai",
|
|
28724
|
+
"max_input_tokens": 128000,
|
|
28725
|
+
"max_output_tokens": 32000,
|
|
28726
|
+
"mode": "chat",
|
|
28727
|
+
"supports_function_calling": true,
|
|
28728
|
+
"supports_tool_choice": true,
|
|
28729
|
+
"source": "https://docs.z.ai/guides/overview/pricing"
|
|
28730
|
+
},
|
|
28731
|
+
"zai/glm-4.5-airx": {
|
|
28732
|
+
"input_cost_per_token": 1.1e-06,
|
|
28733
|
+
"output_cost_per_token": 4.5e-06,
|
|
28734
|
+
"litellm_provider": "zai",
|
|
28735
|
+
"max_input_tokens": 128000,
|
|
28736
|
+
"max_output_tokens": 32000,
|
|
28737
|
+
"mode": "chat",
|
|
28738
|
+
"supports_function_calling": true,
|
|
28739
|
+
"supports_tool_choice": true,
|
|
28740
|
+
"source": "https://docs.z.ai/guides/overview/pricing"
|
|
28741
|
+
},
|
|
28742
|
+
"zai/glm-4-32b-0414-128k": {
|
|
28743
|
+
"input_cost_per_token": 1e-07,
|
|
28744
|
+
"output_cost_per_token": 1e-07,
|
|
28745
|
+
"litellm_provider": "zai",
|
|
28746
|
+
"max_input_tokens": 128000,
|
|
28747
|
+
"max_output_tokens": 32000,
|
|
28748
|
+
"mode": "chat",
|
|
28749
|
+
"supports_function_calling": true,
|
|
28750
|
+
"supports_tool_choice": true,
|
|
28751
|
+
"source": "https://docs.z.ai/guides/overview/pricing"
|
|
28752
|
+
},
|
|
28753
|
+
"zai/glm-4.5-flash": {
|
|
28754
|
+
"input_cost_per_token": 0,
|
|
28755
|
+
"output_cost_per_token": 0,
|
|
28756
|
+
"litellm_provider": "zai",
|
|
28757
|
+
"max_input_tokens": 128000,
|
|
28758
|
+
"max_output_tokens": 32000,
|
|
28759
|
+
"mode": "chat",
|
|
28760
|
+
"supports_function_calling": true,
|
|
28761
|
+
"supports_tool_choice": true,
|
|
28762
|
+
"source": "https://docs.z.ai/guides/overview/pricing"
|
|
28338
28763
|
}
|
|
28339
28764
|
}
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: tokencostauto
|
|
3
|
-
Version: 0.1.
|
|
3
|
+
Version: 0.1.378
|
|
4
4
|
Summary: To calculate token and translated USD cost of string and message calls to OpenAI, for example when used by AI agents
|
|
5
5
|
Author-email: Trisha Pan <trishaepan@gmail.com>, Alex Reibman <areibman@gmail.com>, Pratyush Shukla <ps4534@nyu.edu>, Thiago MadPin <madpin@gmail.com>
|
|
6
6
|
Project-URL: Homepage, https://github.com/madpin/tokencostaudo
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
tokencostauto/__init__.py,sha256=-4d_ryFH62SgNXPXA8vGPFZoAKtOBjnsg37EB_RkZG8,289
|
|
2
|
+
tokencostauto/constants.py,sha256=_82MlTkTrdrwzyRosQD7d3JdgNP9KAUM-cZo8DE00P0,3395
|
|
3
|
+
tokencostauto/costs.py,sha256=tXsgrTypq-dCHaHtoXcg2XepezWsAvZpl9gEsv_53iE,10679
|
|
4
|
+
tokencostauto/model_prices.json,sha256=7g_kbAkIB8zhogHHKj_XSSS1I61XqMsUxG3Z7O2tbiw,1025225
|
|
5
|
+
tokencostauto-0.1.378.dist-info/licenses/LICENSE,sha256=4PLv_CD6Ughnsvg_nM2XeTqGwVK6lQVR77kVWbPq-0U,1065
|
|
6
|
+
tokencostauto-0.1.378.dist-info/METADATA,sha256=npBBO1a4KYQ8olhQ9M9La_jxgY39lPHI7zxOAO5CgoQ,204076
|
|
7
|
+
tokencostauto-0.1.378.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
8
|
+
tokencostauto-0.1.378.dist-info/top_level.txt,sha256=szZQTUJRotfIaeZCDsOgvofIkLt2ak88RP13oI51-TU,14
|
|
9
|
+
tokencostauto-0.1.378.dist-info/RECORD,,
|
|
@@ -1,9 +0,0 @@
|
|
|
1
|
-
tokencostauto/__init__.py,sha256=-4d_ryFH62SgNXPXA8vGPFZoAKtOBjnsg37EB_RkZG8,289
|
|
2
|
-
tokencostauto/constants.py,sha256=_82MlTkTrdrwzyRosQD7d3JdgNP9KAUM-cZo8DE00P0,3395
|
|
3
|
-
tokencostauto/costs.py,sha256=tXsgrTypq-dCHaHtoXcg2XepezWsAvZpl9gEsv_53iE,10679
|
|
4
|
-
tokencostauto/model_prices.json,sha256=ppcRA-03vZZBhzFyGsxg97rrHiitQmiQI38LHlTNX5A,1006772
|
|
5
|
-
tokencostauto-0.1.376.dist-info/licenses/LICENSE,sha256=4PLv_CD6Ughnsvg_nM2XeTqGwVK6lQVR77kVWbPq-0U,1065
|
|
6
|
-
tokencostauto-0.1.376.dist-info/METADATA,sha256=bvFO8RvysChQTCXeFlqeo75XRwE6caFjJWA07-Fx670,204076
|
|
7
|
-
tokencostauto-0.1.376.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
8
|
-
tokencostauto-0.1.376.dist-info/top_level.txt,sha256=szZQTUJRotfIaeZCDsOgvofIkLt2ak88RP13oI51-TU,14
|
|
9
|
-
tokencostauto-0.1.376.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|