tokencostauto 0.1.333__py3-none-any.whl → 0.1.362__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- tokencostauto/model_prices.json +2304 -42
- {tokencostauto-0.1.333.dist-info → tokencostauto-0.1.362.dist-info}/METADATA +1 -1
- tokencostauto-0.1.362.dist-info/RECORD +9 -0
- tokencostauto-0.1.333.dist-info/RECORD +0 -9
- {tokencostauto-0.1.333.dist-info → tokencostauto-0.1.362.dist-info}/WHEEL +0 -0
- {tokencostauto-0.1.333.dist-info → tokencostauto-0.1.362.dist-info}/licenses/LICENSE +0 -0
- {tokencostauto-0.1.333.dist-info → tokencostauto-0.1.362.dist-info}/top_level.txt +0 -0
tokencostauto/model_prices.json
CHANGED
|
@@ -9266,6 +9266,7 @@
|
|
|
9266
9266
|
"supports_function_calling": false,
|
|
9267
9267
|
"supports_parallel_function_calling": true,
|
|
9268
9268
|
"supports_prompt_caching": true,
|
|
9269
|
+
"supports_reasoning": true,
|
|
9269
9270
|
"supports_response_schema": false,
|
|
9270
9271
|
"supports_system_messages": true,
|
|
9271
9272
|
"supports_tool_choice": true,
|
|
@@ -10442,6 +10443,7 @@
|
|
|
10442
10443
|
"supports_audio_output": true,
|
|
10443
10444
|
"supports_function_calling": true,
|
|
10444
10445
|
"supports_prompt_caching": true,
|
|
10446
|
+
"supports_reasoning": true,
|
|
10445
10447
|
"supports_response_schema": true,
|
|
10446
10448
|
"supports_system_messages": true,
|
|
10447
10449
|
"supports_tool_choice": true,
|
|
@@ -10473,7 +10475,7 @@
|
|
|
10473
10475
|
"supports_audio_output": false,
|
|
10474
10476
|
"supports_function_calling": true,
|
|
10475
10477
|
"supports_response_schema": true,
|
|
10476
|
-
"supports_system_messages":
|
|
10478
|
+
"supports_system_messages": false,
|
|
10477
10479
|
"supports_tool_choice": true,
|
|
10478
10480
|
"supports_vision": true
|
|
10479
10481
|
},
|
|
@@ -11815,14 +11817,14 @@
|
|
|
11815
11817
|
},
|
|
11816
11818
|
"azure/o3-2025-04-16": {
|
|
11817
11819
|
"deprecation_date": "2026-04-16",
|
|
11818
|
-
"cache_read_input_token_cost":
|
|
11819
|
-
"input_cost_per_token":
|
|
11820
|
+
"cache_read_input_token_cost": 5e-07,
|
|
11821
|
+
"input_cost_per_token": 2e-06,
|
|
11820
11822
|
"litellm_provider": "azure",
|
|
11821
11823
|
"max_input_tokens": 200000,
|
|
11822
11824
|
"max_output_tokens": 100000,
|
|
11823
11825
|
"max_tokens": 100000,
|
|
11824
11826
|
"mode": "chat",
|
|
11825
|
-
"output_cost_per_token":
|
|
11827
|
+
"output_cost_per_token": 8e-06,
|
|
11826
11828
|
"supported_endpoints": [
|
|
11827
11829
|
"/v1/chat/completions",
|
|
11828
11830
|
"/v1/batch",
|
|
@@ -15602,7 +15604,7 @@
|
|
|
15602
15604
|
"tool_use_system_prompt_tokens": 159
|
|
15603
15605
|
},
|
|
15604
15606
|
"gemini/gemini-2.5-flash": {
|
|
15605
|
-
"cache_read_input_token_cost":
|
|
15607
|
+
"cache_read_input_token_cost": 3e-08,
|
|
15606
15608
|
"input_cost_per_audio_token": 1e-06,
|
|
15607
15609
|
"input_cost_per_token": 3e-07,
|
|
15608
15610
|
"litellm_provider": "gemini",
|
|
@@ -17812,15 +17814,16 @@
|
|
|
17812
17814
|
"supports_tool_choice": true
|
|
17813
17815
|
},
|
|
17814
17816
|
"openrouter/qwen/qwen3-coder": {
|
|
17815
|
-
"input_cost_per_token":
|
|
17817
|
+
"input_cost_per_token": 2.2e-07,
|
|
17816
17818
|
"litellm_provider": "openrouter",
|
|
17817
|
-
"max_input_tokens":
|
|
17818
|
-
"max_output_tokens":
|
|
17819
|
-
"max_tokens":
|
|
17819
|
+
"max_input_tokens": 262100,
|
|
17820
|
+
"max_output_tokens": 262100,
|
|
17821
|
+
"max_tokens": 262100,
|
|
17820
17822
|
"mode": "chat",
|
|
17821
|
-
"output_cost_per_token": 5e-
|
|
17823
|
+
"output_cost_per_token": 9.5e-07,
|
|
17822
17824
|
"source": "https://openrouter.ai/qwen/qwen3-coder",
|
|
17823
|
-
"supports_tool_choice": true
|
|
17825
|
+
"supports_tool_choice": true,
|
|
17826
|
+
"supports_function_calling": true
|
|
17824
17827
|
},
|
|
17825
17828
|
"gemini/imagen-4.0-generate-preview-06-06": {
|
|
17826
17829
|
"output_cost_per_image": 0.04,
|
|
@@ -21714,7 +21717,7 @@
|
|
|
21714
21717
|
"max_input_tokens": 1024,
|
|
21715
21718
|
"max_tokens": 1024,
|
|
21716
21719
|
"mode": "video_generation",
|
|
21717
|
-
"output_cost_per_second": 0.
|
|
21720
|
+
"output_cost_per_second": 0.4,
|
|
21718
21721
|
"source": "https://ai.google.dev/gemini-api/docs/video",
|
|
21719
21722
|
"supported_modalities": [
|
|
21720
21723
|
"text"
|
|
@@ -21728,7 +21731,7 @@
|
|
|
21728
21731
|
"max_input_tokens": 1024,
|
|
21729
21732
|
"max_tokens": 1024,
|
|
21730
21733
|
"mode": "video_generation",
|
|
21731
|
-
"output_cost_per_second": 0.
|
|
21734
|
+
"output_cost_per_second": 0.15,
|
|
21732
21735
|
"source": "https://ai.google.dev/gemini-api/docs/video",
|
|
21733
21736
|
"supported_modalities": [
|
|
21734
21737
|
"text"
|
|
@@ -24519,58 +24522,67 @@
|
|
|
24519
24522
|
"cache_creation_input_token_cost": 1.25e-06,
|
|
24520
24523
|
"cache_read_input_token_cost": 1e-07,
|
|
24521
24524
|
"input_cost_per_token": 1e-06,
|
|
24522
|
-
"litellm_provider": "
|
|
24525
|
+
"litellm_provider": "bedrock_converse",
|
|
24523
24526
|
"max_input_tokens": 200000,
|
|
24524
|
-
"max_output_tokens":
|
|
24525
|
-
"max_tokens":
|
|
24527
|
+
"max_output_tokens": 64000,
|
|
24528
|
+
"max_tokens": 64000,
|
|
24526
24529
|
"mode": "chat",
|
|
24527
24530
|
"output_cost_per_token": 5e-06,
|
|
24528
24531
|
"source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
|
|
24529
24532
|
"supports_assistant_prefill": true,
|
|
24533
|
+
"supports_computer_use": true,
|
|
24530
24534
|
"supports_function_calling": true,
|
|
24531
24535
|
"supports_pdf_input": true,
|
|
24532
24536
|
"supports_prompt_caching": true,
|
|
24533
24537
|
"supports_reasoning": true,
|
|
24534
24538
|
"supports_response_schema": true,
|
|
24535
|
-
"supports_tool_choice": true
|
|
24539
|
+
"supports_tool_choice": true,
|
|
24540
|
+
"supports_vision": true,
|
|
24541
|
+
"tool_use_system_prompt_tokens": 346
|
|
24536
24542
|
},
|
|
24537
24543
|
"anthropic.claude-haiku-4-5@20251001": {
|
|
24538
24544
|
"cache_creation_input_token_cost": 1.25e-06,
|
|
24539
24545
|
"cache_read_input_token_cost": 1e-07,
|
|
24540
24546
|
"input_cost_per_token": 1e-06,
|
|
24541
|
-
"litellm_provider": "
|
|
24547
|
+
"litellm_provider": "bedrock_converse",
|
|
24542
24548
|
"max_input_tokens": 200000,
|
|
24543
|
-
"max_output_tokens":
|
|
24544
|
-
"max_tokens":
|
|
24549
|
+
"max_output_tokens": 64000,
|
|
24550
|
+
"max_tokens": 64000,
|
|
24545
24551
|
"mode": "chat",
|
|
24546
24552
|
"output_cost_per_token": 5e-06,
|
|
24547
24553
|
"source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
|
|
24548
24554
|
"supports_assistant_prefill": true,
|
|
24555
|
+
"supports_computer_use": true,
|
|
24549
24556
|
"supports_function_calling": true,
|
|
24550
24557
|
"supports_pdf_input": true,
|
|
24551
24558
|
"supports_prompt_caching": true,
|
|
24552
24559
|
"supports_reasoning": true,
|
|
24553
24560
|
"supports_response_schema": true,
|
|
24554
|
-
"supports_tool_choice": true
|
|
24561
|
+
"supports_tool_choice": true,
|
|
24562
|
+
"supports_vision": true,
|
|
24563
|
+
"tool_use_system_prompt_tokens": 346
|
|
24555
24564
|
},
|
|
24556
24565
|
"apac.anthropic.claude-haiku-4-5-20251001-v1:0": {
|
|
24557
24566
|
"cache_creation_input_token_cost": 1.375e-06,
|
|
24558
24567
|
"cache_read_input_token_cost": 1.1e-07,
|
|
24559
24568
|
"input_cost_per_token": 1.1e-06,
|
|
24560
|
-
"litellm_provider": "
|
|
24569
|
+
"litellm_provider": "bedrock_converse",
|
|
24561
24570
|
"max_input_tokens": 200000,
|
|
24562
|
-
"max_output_tokens":
|
|
24563
|
-
"max_tokens":
|
|
24571
|
+
"max_output_tokens": 64000,
|
|
24572
|
+
"max_tokens": 64000,
|
|
24564
24573
|
"mode": "chat",
|
|
24565
24574
|
"output_cost_per_token": 5.5e-06,
|
|
24566
24575
|
"source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
|
|
24567
24576
|
"supports_assistant_prefill": true,
|
|
24577
|
+
"supports_computer_use": true,
|
|
24568
24578
|
"supports_function_calling": true,
|
|
24569
24579
|
"supports_pdf_input": true,
|
|
24570
24580
|
"supports_prompt_caching": true,
|
|
24571
24581
|
"supports_reasoning": true,
|
|
24572
24582
|
"supports_response_schema": true,
|
|
24573
|
-
"supports_tool_choice": true
|
|
24583
|
+
"supports_tool_choice": true,
|
|
24584
|
+
"supports_vision": true,
|
|
24585
|
+
"tool_use_system_prompt_tokens": 346
|
|
24574
24586
|
},
|
|
24575
24587
|
"claude-haiku-4-5-20251001": {
|
|
24576
24588
|
"cache_creation_input_token_cost": 1.25e-06,
|
|
@@ -24619,20 +24631,23 @@
|
|
|
24619
24631
|
"cache_read_input_token_cost": 1.1e-07,
|
|
24620
24632
|
"input_cost_per_token": 1.1e-06,
|
|
24621
24633
|
"deprecation_date": "2026-10-15",
|
|
24622
|
-
"litellm_provider": "
|
|
24634
|
+
"litellm_provider": "bedrock_converse",
|
|
24623
24635
|
"max_input_tokens": 200000,
|
|
24624
|
-
"max_output_tokens":
|
|
24625
|
-
"max_tokens":
|
|
24636
|
+
"max_output_tokens": 64000,
|
|
24637
|
+
"max_tokens": 64000,
|
|
24626
24638
|
"mode": "chat",
|
|
24627
24639
|
"output_cost_per_token": 5.5e-06,
|
|
24628
24640
|
"source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
|
|
24629
24641
|
"supports_assistant_prefill": true,
|
|
24642
|
+
"supports_computer_use": true,
|
|
24630
24643
|
"supports_function_calling": true,
|
|
24631
24644
|
"supports_pdf_input": true,
|
|
24632
24645
|
"supports_prompt_caching": true,
|
|
24633
24646
|
"supports_reasoning": true,
|
|
24634
24647
|
"supports_response_schema": true,
|
|
24635
|
-
"supports_tool_choice": true
|
|
24648
|
+
"supports_tool_choice": true,
|
|
24649
|
+
"supports_vision": true,
|
|
24650
|
+
"tool_use_system_prompt_tokens": 346
|
|
24636
24651
|
},
|
|
24637
24652
|
"gemini-2.5-flash-image": {
|
|
24638
24653
|
"cache_read_input_token_cost": 3e-08,
|
|
@@ -24689,6 +24704,7 @@
|
|
|
24689
24704
|
"litellm_provider": "vertex_ai-language-models",
|
|
24690
24705
|
"max_audio_length_hours": 8.4,
|
|
24691
24706
|
"max_audio_per_prompt": 1,
|
|
24707
|
+
"supports_reasoning": false,
|
|
24692
24708
|
"max_images_per_prompt": 3000,
|
|
24693
24709
|
"max_input_tokens": 32768,
|
|
24694
24710
|
"max_output_tokens": 32768,
|
|
@@ -24782,39 +24798,45 @@
|
|
|
24782
24798
|
"cache_creation_input_token_cost": 1.375e-06,
|
|
24783
24799
|
"cache_read_input_token_cost": 1.1e-07,
|
|
24784
24800
|
"input_cost_per_token": 1.1e-06,
|
|
24785
|
-
"litellm_provider": "
|
|
24801
|
+
"litellm_provider": "bedrock_converse",
|
|
24786
24802
|
"max_input_tokens": 200000,
|
|
24787
|
-
"max_output_tokens":
|
|
24788
|
-
"max_tokens":
|
|
24803
|
+
"max_output_tokens": 64000,
|
|
24804
|
+
"max_tokens": 64000,
|
|
24789
24805
|
"mode": "chat",
|
|
24790
24806
|
"output_cost_per_token": 5.5e-06,
|
|
24791
24807
|
"source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
|
|
24792
24808
|
"supports_assistant_prefill": true,
|
|
24809
|
+
"supports_computer_use": true,
|
|
24793
24810
|
"supports_function_calling": true,
|
|
24794
24811
|
"supports_pdf_input": true,
|
|
24795
24812
|
"supports_prompt_caching": true,
|
|
24796
24813
|
"supports_reasoning": true,
|
|
24797
24814
|
"supports_response_schema": true,
|
|
24798
|
-
"supports_tool_choice": true
|
|
24815
|
+
"supports_tool_choice": true,
|
|
24816
|
+
"supports_vision": true,
|
|
24817
|
+
"tool_use_system_prompt_tokens": 346
|
|
24799
24818
|
},
|
|
24800
24819
|
"us.anthropic.claude-haiku-4-5-20251001-v1:0": {
|
|
24801
24820
|
"cache_creation_input_token_cost": 1.375e-06,
|
|
24802
24821
|
"cache_read_input_token_cost": 1.1e-07,
|
|
24803
24822
|
"input_cost_per_token": 1.1e-06,
|
|
24804
|
-
"litellm_provider": "
|
|
24823
|
+
"litellm_provider": "bedrock_converse",
|
|
24805
24824
|
"max_input_tokens": 200000,
|
|
24806
|
-
"max_output_tokens":
|
|
24807
|
-
"max_tokens":
|
|
24825
|
+
"max_output_tokens": 64000,
|
|
24826
|
+
"max_tokens": 64000,
|
|
24808
24827
|
"mode": "chat",
|
|
24809
24828
|
"output_cost_per_token": 5.5e-06,
|
|
24810
24829
|
"source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
|
|
24811
24830
|
"supports_assistant_prefill": true,
|
|
24831
|
+
"supports_computer_use": true,
|
|
24812
24832
|
"supports_function_calling": true,
|
|
24813
24833
|
"supports_pdf_input": true,
|
|
24814
24834
|
"supports_prompt_caching": true,
|
|
24815
24835
|
"supports_reasoning": true,
|
|
24816
24836
|
"supports_response_schema": true,
|
|
24817
|
-
"supports_tool_choice": true
|
|
24837
|
+
"supports_tool_choice": true,
|
|
24838
|
+
"supports_vision": true,
|
|
24839
|
+
"tool_use_system_prompt_tokens": 346
|
|
24818
24840
|
},
|
|
24819
24841
|
"vertex_ai/claude-haiku-4-5@20251001": {
|
|
24820
24842
|
"cache_creation_input_token_cost": 1.25e-06,
|
|
@@ -24882,12 +24904,13 @@
|
|
|
24882
24904
|
"input_cost_per_token": 1.1e-06,
|
|
24883
24905
|
"litellm_provider": "bedrock_converse",
|
|
24884
24906
|
"max_input_tokens": 200000,
|
|
24885
|
-
"max_output_tokens":
|
|
24886
|
-
"max_tokens":
|
|
24907
|
+
"max_output_tokens": 64000,
|
|
24908
|
+
"max_tokens": 64000,
|
|
24887
24909
|
"mode": "chat",
|
|
24888
24910
|
"output_cost_per_token": 5.5e-06,
|
|
24889
24911
|
"source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
|
|
24890
24912
|
"supports_assistant_prefill": true,
|
|
24913
|
+
"supports_computer_use": true,
|
|
24891
24914
|
"supports_function_calling": true,
|
|
24892
24915
|
"supports_pdf_input": true,
|
|
24893
24916
|
"supports_prompt_caching": true,
|
|
@@ -24903,14 +24926,16 @@
|
|
|
24903
24926
|
"input_cost_per_token": 1.1e-06,
|
|
24904
24927
|
"litellm_provider": "bedrock_converse",
|
|
24905
24928
|
"max_input_tokens": 200000,
|
|
24906
|
-
"max_output_tokens":
|
|
24907
|
-
"max_tokens":
|
|
24929
|
+
"max_output_tokens": 64000,
|
|
24930
|
+
"max_tokens": 64000,
|
|
24908
24931
|
"mode": "chat",
|
|
24909
24932
|
"output_cost_per_token": 5.5e-06,
|
|
24910
24933
|
"supports_assistant_prefill": true,
|
|
24934
|
+
"supports_computer_use": true,
|
|
24911
24935
|
"supports_function_calling": true,
|
|
24912
24936
|
"supports_pdf_input": true,
|
|
24913
24937
|
"supports_prompt_caching": true,
|
|
24938
|
+
"supports_reasoning": true,
|
|
24914
24939
|
"supports_response_schema": true,
|
|
24915
24940
|
"supports_tool_choice": true,
|
|
24916
24941
|
"supports_vision": true,
|
|
@@ -25276,7 +25301,7 @@
|
|
|
25276
25301
|
"fal_ai/fal-ai/flux-pro/v1.1-ultra": {
|
|
25277
25302
|
"litellm_provider": "fal_ai",
|
|
25278
25303
|
"mode": "image_generation",
|
|
25279
|
-
"output_cost_per_image": 0.
|
|
25304
|
+
"output_cost_per_image": 0.06,
|
|
25280
25305
|
"supported_endpoints": [
|
|
25281
25306
|
"/v1/images/generations"
|
|
25282
25307
|
]
|
|
@@ -25709,5 +25734,2242 @@
|
|
|
25709
25734
|
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models",
|
|
25710
25735
|
"supports_function_calling": true,
|
|
25711
25736
|
"supports_tool_choice": true
|
|
25737
|
+
},
|
|
25738
|
+
"cohere/embed-v4.0": {
|
|
25739
|
+
"input_cost_per_token": 1.2e-07,
|
|
25740
|
+
"litellm_provider": "cohere",
|
|
25741
|
+
"max_input_tokens": 128000,
|
|
25742
|
+
"max_tokens": 128000,
|
|
25743
|
+
"mode": "embedding",
|
|
25744
|
+
"output_cost_per_token": 0.0,
|
|
25745
|
+
"output_vector_size": 1536,
|
|
25746
|
+
"supports_embedding_image_input": true
|
|
25747
|
+
},
|
|
25748
|
+
"gemini/veo-3.1-fast-generate-preview": {
|
|
25749
|
+
"litellm_provider": "gemini",
|
|
25750
|
+
"max_input_tokens": 1024,
|
|
25751
|
+
"max_tokens": 1024,
|
|
25752
|
+
"mode": "video_generation",
|
|
25753
|
+
"output_cost_per_second": 0.15,
|
|
25754
|
+
"source": "https://ai.google.dev/gemini-api/docs/video",
|
|
25755
|
+
"supported_modalities": [
|
|
25756
|
+
"text"
|
|
25757
|
+
],
|
|
25758
|
+
"supported_output_modalities": [
|
|
25759
|
+
"video"
|
|
25760
|
+
]
|
|
25761
|
+
},
|
|
25762
|
+
"gemini/veo-3.1-generate-preview": {
|
|
25763
|
+
"litellm_provider": "gemini",
|
|
25764
|
+
"max_input_tokens": 1024,
|
|
25765
|
+
"max_tokens": 1024,
|
|
25766
|
+
"mode": "video_generation",
|
|
25767
|
+
"output_cost_per_second": 0.4,
|
|
25768
|
+
"source": "https://ai.google.dev/gemini-api/docs/video",
|
|
25769
|
+
"supported_modalities": [
|
|
25770
|
+
"text"
|
|
25771
|
+
],
|
|
25772
|
+
"supported_output_modalities": [
|
|
25773
|
+
"video"
|
|
25774
|
+
]
|
|
25775
|
+
},
|
|
25776
|
+
"vertex_ai/veo-3.1-generate-preview": {
|
|
25777
|
+
"litellm_provider": "vertex_ai-video-models",
|
|
25778
|
+
"max_input_tokens": 1024,
|
|
25779
|
+
"max_tokens": 1024,
|
|
25780
|
+
"mode": "video_generation",
|
|
25781
|
+
"output_cost_per_second": 0.4,
|
|
25782
|
+
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/model-reference/veo",
|
|
25783
|
+
"supported_modalities": [
|
|
25784
|
+
"text"
|
|
25785
|
+
],
|
|
25786
|
+
"supported_output_modalities": [
|
|
25787
|
+
"video"
|
|
25788
|
+
]
|
|
25789
|
+
},
|
|
25790
|
+
"vertex_ai/veo-3.1-fast-generate-preview": {
|
|
25791
|
+
"litellm_provider": "vertex_ai-video-models",
|
|
25792
|
+
"max_input_tokens": 1024,
|
|
25793
|
+
"max_tokens": 1024,
|
|
25794
|
+
"mode": "video_generation",
|
|
25795
|
+
"output_cost_per_second": 0.15,
|
|
25796
|
+
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/model-reference/veo",
|
|
25797
|
+
"supported_modalities": [
|
|
25798
|
+
"text"
|
|
25799
|
+
],
|
|
25800
|
+
"supported_output_modalities": [
|
|
25801
|
+
"video"
|
|
25802
|
+
]
|
|
25803
|
+
},
|
|
25804
|
+
"moonshot/kimi-k2-thinking": {
|
|
25805
|
+
"cache_read_input_token_cost": 1.5e-07,
|
|
25806
|
+
"input_cost_per_token": 6e-07,
|
|
25807
|
+
"litellm_provider": "moonshot",
|
|
25808
|
+
"max_input_tokens": 262144,
|
|
25809
|
+
"max_output_tokens": 262144,
|
|
25810
|
+
"max_tokens": 262144,
|
|
25811
|
+
"mode": "chat",
|
|
25812
|
+
"output_cost_per_token": 2.5e-06,
|
|
25813
|
+
"source": "https://platform.moonshot.ai/docs/pricing/chat#generation-model-kimi-k2",
|
|
25814
|
+
"supports_function_calling": true,
|
|
25815
|
+
"supports_tool_choice": true,
|
|
25816
|
+
"supports_web_search": true
|
|
25817
|
+
},
|
|
25818
|
+
"mistral/magistral-medium-2509": {
|
|
25819
|
+
"input_cost_per_token": 2e-06,
|
|
25820
|
+
"litellm_provider": "mistral",
|
|
25821
|
+
"max_input_tokens": 40000,
|
|
25822
|
+
"max_output_tokens": 40000,
|
|
25823
|
+
"max_tokens": 40000,
|
|
25824
|
+
"mode": "chat",
|
|
25825
|
+
"output_cost_per_token": 5e-06,
|
|
25826
|
+
"source": "https://mistral.ai/news/magistral",
|
|
25827
|
+
"supports_assistant_prefill": true,
|
|
25828
|
+
"supports_function_calling": true,
|
|
25829
|
+
"supports_reasoning": true,
|
|
25830
|
+
"supports_response_schema": true,
|
|
25831
|
+
"supports_tool_choice": true
|
|
25832
|
+
},
|
|
25833
|
+
"openrouter/deepseek/deepseek-v3.2-exp": {
|
|
25834
|
+
"input_cost_per_token": 2e-07,
|
|
25835
|
+
"input_cost_per_token_cache_hit": 2e-08,
|
|
25836
|
+
"litellm_provider": "openrouter",
|
|
25837
|
+
"max_input_tokens": 163840,
|
|
25838
|
+
"max_output_tokens": 163840,
|
|
25839
|
+
"max_tokens": 8192,
|
|
25840
|
+
"mode": "chat",
|
|
25841
|
+
"output_cost_per_token": 4e-07,
|
|
25842
|
+
"supports_assistant_prefill": true,
|
|
25843
|
+
"supports_function_calling": true,
|
|
25844
|
+
"supports_prompt_caching": true,
|
|
25845
|
+
"supports_reasoning": false,
|
|
25846
|
+
"supports_tool_choice": true
|
|
25847
|
+
},
|
|
25848
|
+
"openrouter/minimax/minimax-m2": {
|
|
25849
|
+
"input_cost_per_token": 2.55e-07,
|
|
25850
|
+
"litellm_provider": "openrouter",
|
|
25851
|
+
"max_input_tokens": 204800,
|
|
25852
|
+
"max_output_tokens": 204800,
|
|
25853
|
+
"max_tokens": 32768,
|
|
25854
|
+
"mode": "chat",
|
|
25855
|
+
"output_cost_per_token": 1.02e-06,
|
|
25856
|
+
"supports_function_calling": true,
|
|
25857
|
+
"supports_prompt_caching": false,
|
|
25858
|
+
"supports_reasoning": true,
|
|
25859
|
+
"supports_tool_choice": true
|
|
25860
|
+
},
|
|
25861
|
+
"openrouter/z-ai/glm-4.6": {
|
|
25862
|
+
"input_cost_per_token": 4e-07,
|
|
25863
|
+
"litellm_provider": "openrouter",
|
|
25864
|
+
"max_input_tokens": 202800,
|
|
25865
|
+
"max_output_tokens": 131000,
|
|
25866
|
+
"max_tokens": 202800,
|
|
25867
|
+
"mode": "chat",
|
|
25868
|
+
"output_cost_per_token": 1.75e-06,
|
|
25869
|
+
"source": "https://openrouter.ai/z-ai/glm-4.6",
|
|
25870
|
+
"supports_function_calling": true,
|
|
25871
|
+
"supports_reasoning": true,
|
|
25872
|
+
"supports_tool_choice": true
|
|
25873
|
+
},
|
|
25874
|
+
"openrouter/z-ai/glm-4.6:exacto": {
|
|
25875
|
+
"input_cost_per_token": 4.5e-07,
|
|
25876
|
+
"litellm_provider": "openrouter",
|
|
25877
|
+
"max_input_tokens": 202800,
|
|
25878
|
+
"max_output_tokens": 131000,
|
|
25879
|
+
"max_tokens": 202800,
|
|
25880
|
+
"mode": "chat",
|
|
25881
|
+
"output_cost_per_token": 1.9e-06,
|
|
25882
|
+
"source": "https://openrouter.ai/z-ai/glm-4.6:exacto",
|
|
25883
|
+
"supports_function_calling": true,
|
|
25884
|
+
"supports_reasoning": true,
|
|
25885
|
+
"supports_tool_choice": true
|
|
25886
|
+
},
|
|
25887
|
+
"runwayml/gen4_turbo": {
|
|
25888
|
+
"litellm_provider": "runwayml",
|
|
25889
|
+
"mode": "video_generation",
|
|
25890
|
+
"output_cost_per_video_per_second": 0.05,
|
|
25891
|
+
"source": "https://docs.dev.runwayml.com/guides/pricing/",
|
|
25892
|
+
"supported_modalities": [
|
|
25893
|
+
"text",
|
|
25894
|
+
"image"
|
|
25895
|
+
],
|
|
25896
|
+
"supported_output_modalities": [
|
|
25897
|
+
"video"
|
|
25898
|
+
],
|
|
25899
|
+
"supported_resolutions": [
|
|
25900
|
+
"1280x720",
|
|
25901
|
+
"720x1280"
|
|
25902
|
+
],
|
|
25903
|
+
"metadata": {
|
|
25904
|
+
"comment": "5 credits per second @ $0.01 per credit = $0.05 per second"
|
|
25905
|
+
}
|
|
25906
|
+
},
|
|
25907
|
+
"runwayml/gen4_aleph": {
|
|
25908
|
+
"litellm_provider": "runwayml",
|
|
25909
|
+
"mode": "video_generation",
|
|
25910
|
+
"output_cost_per_video_per_second": 0.15,
|
|
25911
|
+
"source": "https://docs.dev.runwayml.com/guides/pricing/",
|
|
25912
|
+
"supported_modalities": [
|
|
25913
|
+
"text",
|
|
25914
|
+
"image"
|
|
25915
|
+
],
|
|
25916
|
+
"supported_output_modalities": [
|
|
25917
|
+
"video"
|
|
25918
|
+
],
|
|
25919
|
+
"supported_resolutions": [
|
|
25920
|
+
"1280x720",
|
|
25921
|
+
"720x1280"
|
|
25922
|
+
],
|
|
25923
|
+
"metadata": {
|
|
25924
|
+
"comment": "15 credits per second @ $0.01 per credit = $0.15 per second"
|
|
25925
|
+
}
|
|
25926
|
+
},
|
|
25927
|
+
"runwayml/gen3a_turbo": {
|
|
25928
|
+
"litellm_provider": "runwayml",
|
|
25929
|
+
"mode": "video_generation",
|
|
25930
|
+
"output_cost_per_video_per_second": 0.05,
|
|
25931
|
+
"source": "https://docs.dev.runwayml.com/guides/pricing/",
|
|
25932
|
+
"supported_modalities": [
|
|
25933
|
+
"text",
|
|
25934
|
+
"image"
|
|
25935
|
+
],
|
|
25936
|
+
"supported_output_modalities": [
|
|
25937
|
+
"video"
|
|
25938
|
+
],
|
|
25939
|
+
"supported_resolutions": [
|
|
25940
|
+
"1280x720",
|
|
25941
|
+
"720x1280"
|
|
25942
|
+
],
|
|
25943
|
+
"metadata": {
|
|
25944
|
+
"comment": "5 credits per second @ $0.01 per credit = $0.05 per second"
|
|
25945
|
+
}
|
|
25946
|
+
},
|
|
25947
|
+
"runwayml/gen4_image": {
|
|
25948
|
+
"litellm_provider": "runwayml",
|
|
25949
|
+
"mode": "image_generation",
|
|
25950
|
+
"input_cost_per_image": 0.05,
|
|
25951
|
+
"output_cost_per_image": 0.05,
|
|
25952
|
+
"source": "https://docs.dev.runwayml.com/guides/pricing/",
|
|
25953
|
+
"supported_modalities": [
|
|
25954
|
+
"text",
|
|
25955
|
+
"image"
|
|
25956
|
+
],
|
|
25957
|
+
"supported_output_modalities": [
|
|
25958
|
+
"image"
|
|
25959
|
+
],
|
|
25960
|
+
"supported_resolutions": [
|
|
25961
|
+
"1280x720",
|
|
25962
|
+
"1920x1080"
|
|
25963
|
+
],
|
|
25964
|
+
"metadata": {
|
|
25965
|
+
"comment": "5 credits per 720p image or 8 credits per 1080p image @ $0.01 per credit. Using 5 credits ($0.05) as base cost"
|
|
25966
|
+
}
|
|
25967
|
+
},
|
|
25968
|
+
"runwayml/gen4_image_turbo": {
|
|
25969
|
+
"litellm_provider": "runwayml",
|
|
25970
|
+
"mode": "image_generation",
|
|
25971
|
+
"input_cost_per_image": 0.02,
|
|
25972
|
+
"output_cost_per_image": 0.02,
|
|
25973
|
+
"source": "https://docs.dev.runwayml.com/guides/pricing/",
|
|
25974
|
+
"supported_modalities": [
|
|
25975
|
+
"text",
|
|
25976
|
+
"image"
|
|
25977
|
+
],
|
|
25978
|
+
"supported_output_modalities": [
|
|
25979
|
+
"image"
|
|
25980
|
+
],
|
|
25981
|
+
"supported_resolutions": [
|
|
25982
|
+
"1280x720",
|
|
25983
|
+
"1920x1080"
|
|
25984
|
+
],
|
|
25985
|
+
"metadata": {
|
|
25986
|
+
"comment": "2 credits per image (any resolution) @ $0.01 per credit = $0.02 per image"
|
|
25987
|
+
}
|
|
25988
|
+
},
|
|
25989
|
+
"gpt-5.1": {
|
|
25990
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
25991
|
+
"cache_read_input_token_cost_priority": 2.5e-07,
|
|
25992
|
+
"input_cost_per_token": 1.25e-06,
|
|
25993
|
+
"input_cost_per_token_priority": 2.5e-06,
|
|
25994
|
+
"litellm_provider": "openai",
|
|
25995
|
+
"max_input_tokens": 272000,
|
|
25996
|
+
"max_output_tokens": 128000,
|
|
25997
|
+
"max_tokens": 128000,
|
|
25998
|
+
"mode": "chat",
|
|
25999
|
+
"output_cost_per_token": 1e-05,
|
|
26000
|
+
"output_cost_per_token_priority": 2e-05,
|
|
26001
|
+
"supported_endpoints": [
|
|
26002
|
+
"/v1/chat/completions",
|
|
26003
|
+
"/v1/responses"
|
|
26004
|
+
],
|
|
26005
|
+
"supported_modalities": [
|
|
26006
|
+
"text",
|
|
26007
|
+
"image"
|
|
26008
|
+
],
|
|
26009
|
+
"supported_output_modalities": [
|
|
26010
|
+
"text",
|
|
26011
|
+
"image"
|
|
26012
|
+
],
|
|
26013
|
+
"supports_function_calling": true,
|
|
26014
|
+
"supports_native_streaming": true,
|
|
26015
|
+
"supports_parallel_function_calling": true,
|
|
26016
|
+
"supports_pdf_input": true,
|
|
26017
|
+
"supports_prompt_caching": true,
|
|
26018
|
+
"supports_reasoning": true,
|
|
26019
|
+
"supports_response_schema": true,
|
|
26020
|
+
"supports_system_messages": true,
|
|
26021
|
+
"supports_tool_choice": true,
|
|
26022
|
+
"supports_service_tier": true,
|
|
26023
|
+
"supports_vision": true
|
|
26024
|
+
},
|
|
26025
|
+
"gpt-5.1-2025-11-13": {
|
|
26026
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
26027
|
+
"cache_read_input_token_cost_priority": 2.5e-07,
|
|
26028
|
+
"input_cost_per_token": 1.25e-06,
|
|
26029
|
+
"input_cost_per_token_priority": 2.5e-06,
|
|
26030
|
+
"litellm_provider": "openai",
|
|
26031
|
+
"max_input_tokens": 272000,
|
|
26032
|
+
"max_output_tokens": 128000,
|
|
26033
|
+
"max_tokens": 128000,
|
|
26034
|
+
"mode": "chat",
|
|
26035
|
+
"output_cost_per_token": 1e-05,
|
|
26036
|
+
"output_cost_per_token_priority": 2e-05,
|
|
26037
|
+
"supported_endpoints": [
|
|
26038
|
+
"/v1/chat/completions",
|
|
26039
|
+
"/v1/responses"
|
|
26040
|
+
],
|
|
26041
|
+
"supported_modalities": [
|
|
26042
|
+
"text",
|
|
26043
|
+
"image"
|
|
26044
|
+
],
|
|
26045
|
+
"supported_output_modalities": [
|
|
26046
|
+
"text",
|
|
26047
|
+
"image"
|
|
26048
|
+
],
|
|
26049
|
+
"supports_function_calling": true,
|
|
26050
|
+
"supports_native_streaming": true,
|
|
26051
|
+
"supports_parallel_function_calling": true,
|
|
26052
|
+
"supports_pdf_input": true,
|
|
26053
|
+
"supports_prompt_caching": true,
|
|
26054
|
+
"supports_reasoning": true,
|
|
26055
|
+
"supports_response_schema": true,
|
|
26056
|
+
"supports_system_messages": true,
|
|
26057
|
+
"supports_tool_choice": true,
|
|
26058
|
+
"supports_service_tier": true,
|
|
26059
|
+
"supports_vision": true
|
|
26060
|
+
},
|
|
26061
|
+
"gpt-5.1-chat-latest": {
|
|
26062
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
26063
|
+
"cache_read_input_token_cost_priority": 2.5e-07,
|
|
26064
|
+
"input_cost_per_token": 1.25e-06,
|
|
26065
|
+
"input_cost_per_token_priority": 2.5e-06,
|
|
26066
|
+
"litellm_provider": "openai",
|
|
26067
|
+
"max_input_tokens": 128000,
|
|
26068
|
+
"max_output_tokens": 16384,
|
|
26069
|
+
"max_tokens": 16384,
|
|
26070
|
+
"mode": "chat",
|
|
26071
|
+
"output_cost_per_token": 1e-05,
|
|
26072
|
+
"output_cost_per_token_priority": 2e-05,
|
|
26073
|
+
"supported_endpoints": [
|
|
26074
|
+
"/v1/chat/completions",
|
|
26075
|
+
"/v1/responses"
|
|
26076
|
+
],
|
|
26077
|
+
"supported_modalities": [
|
|
26078
|
+
"text",
|
|
26079
|
+
"image"
|
|
26080
|
+
],
|
|
26081
|
+
"supported_output_modalities": [
|
|
26082
|
+
"text",
|
|
26083
|
+
"image"
|
|
26084
|
+
],
|
|
26085
|
+
"supports_function_calling": false,
|
|
26086
|
+
"supports_native_streaming": true,
|
|
26087
|
+
"supports_parallel_function_calling": false,
|
|
26088
|
+
"supports_pdf_input": true,
|
|
26089
|
+
"supports_prompt_caching": true,
|
|
26090
|
+
"supports_reasoning": true,
|
|
26091
|
+
"supports_response_schema": true,
|
|
26092
|
+
"supports_system_messages": true,
|
|
26093
|
+
"supports_tool_choice": false,
|
|
26094
|
+
"supports_vision": true
|
|
26095
|
+
},
|
|
26096
|
+
"gpt-5.1-codex": {
|
|
26097
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
26098
|
+
"cache_read_input_token_cost_priority": 2.5e-07,
|
|
26099
|
+
"input_cost_per_token": 1.25e-06,
|
|
26100
|
+
"input_cost_per_token_priority": 2.5e-06,
|
|
26101
|
+
"litellm_provider": "openai",
|
|
26102
|
+
"max_input_tokens": 272000,
|
|
26103
|
+
"max_output_tokens": 128000,
|
|
26104
|
+
"max_tokens": 128000,
|
|
26105
|
+
"mode": "responses",
|
|
26106
|
+
"output_cost_per_token": 1e-05,
|
|
26107
|
+
"output_cost_per_token_priority": 2e-05,
|
|
26108
|
+
"supported_endpoints": [
|
|
26109
|
+
"/v1/responses"
|
|
26110
|
+
],
|
|
26111
|
+
"supported_modalities": [
|
|
26112
|
+
"text",
|
|
26113
|
+
"image"
|
|
26114
|
+
],
|
|
26115
|
+
"supported_output_modalities": [
|
|
26116
|
+
"text"
|
|
26117
|
+
],
|
|
26118
|
+
"supports_function_calling": true,
|
|
26119
|
+
"supports_native_streaming": true,
|
|
26120
|
+
"supports_parallel_function_calling": true,
|
|
26121
|
+
"supports_pdf_input": true,
|
|
26122
|
+
"supports_prompt_caching": true,
|
|
26123
|
+
"supports_reasoning": true,
|
|
26124
|
+
"supports_response_schema": true,
|
|
26125
|
+
"supports_system_messages": false,
|
|
26126
|
+
"supports_tool_choice": true,
|
|
26127
|
+
"supports_vision": true
|
|
26128
|
+
},
|
|
26129
|
+
"gpt-5.1-codex-mini": {
|
|
26130
|
+
"cache_read_input_token_cost": 2.5e-08,
|
|
26131
|
+
"cache_read_input_token_cost_priority": 4.5e-08,
|
|
26132
|
+
"input_cost_per_token": 2.5e-07,
|
|
26133
|
+
"input_cost_per_token_priority": 4.5e-07,
|
|
26134
|
+
"litellm_provider": "openai",
|
|
26135
|
+
"max_input_tokens": 272000,
|
|
26136
|
+
"max_output_tokens": 128000,
|
|
26137
|
+
"max_tokens": 128000,
|
|
26138
|
+
"mode": "responses",
|
|
26139
|
+
"output_cost_per_token": 2e-06,
|
|
26140
|
+
"output_cost_per_token_priority": 3.6e-06,
|
|
26141
|
+
"supported_endpoints": [
|
|
26142
|
+
"/v1/responses"
|
|
26143
|
+
],
|
|
26144
|
+
"supported_modalities": [
|
|
26145
|
+
"text",
|
|
26146
|
+
"image"
|
|
26147
|
+
],
|
|
26148
|
+
"supported_output_modalities": [
|
|
26149
|
+
"text"
|
|
26150
|
+
],
|
|
26151
|
+
"supports_function_calling": true,
|
|
26152
|
+
"supports_native_streaming": true,
|
|
26153
|
+
"supports_parallel_function_calling": true,
|
|
26154
|
+
"supports_pdf_input": true,
|
|
26155
|
+
"supports_prompt_caching": true,
|
|
26156
|
+
"supports_reasoning": true,
|
|
26157
|
+
"supports_response_schema": true,
|
|
26158
|
+
"supports_system_messages": false,
|
|
26159
|
+
"supports_tool_choice": true,
|
|
26160
|
+
"supports_vision": true
|
|
26161
|
+
},
|
|
26162
|
+
"fal_ai/fal-ai/flux/schnell": {
|
|
26163
|
+
"litellm_provider": "fal_ai",
|
|
26164
|
+
"mode": "image_generation",
|
|
26165
|
+
"output_cost_per_image": 0.003,
|
|
26166
|
+
"supported_endpoints": [
|
|
26167
|
+
"/v1/images/generations"
|
|
26168
|
+
]
|
|
26169
|
+
},
|
|
26170
|
+
"fal_ai/fal-ai/imagen4/preview/fast": {
|
|
26171
|
+
"litellm_provider": "fal_ai",
|
|
26172
|
+
"mode": "image_generation",
|
|
26173
|
+
"output_cost_per_image": 0.02,
|
|
26174
|
+
"supported_endpoints": [
|
|
26175
|
+
"/v1/images/generations"
|
|
26176
|
+
]
|
|
26177
|
+
},
|
|
26178
|
+
"fal_ai/fal-ai/imagen4/preview/ultra": {
|
|
26179
|
+
"litellm_provider": "fal_ai",
|
|
26180
|
+
"mode": "image_generation",
|
|
26181
|
+
"output_cost_per_image": 0.06,
|
|
26182
|
+
"supported_endpoints": [
|
|
26183
|
+
"/v1/images/generations"
|
|
26184
|
+
]
|
|
26185
|
+
},
|
|
26186
|
+
"voyage/voyage-3.5": {
|
|
26187
|
+
"input_cost_per_token": 6e-08,
|
|
26188
|
+
"litellm_provider": "voyage",
|
|
26189
|
+
"max_input_tokens": 32000,
|
|
26190
|
+
"max_tokens": 32000,
|
|
26191
|
+
"mode": "embedding",
|
|
26192
|
+
"output_cost_per_token": 0.0
|
|
26193
|
+
},
|
|
26194
|
+
"voyage/voyage-3.5-lite": {
|
|
26195
|
+
"input_cost_per_token": 2e-08,
|
|
26196
|
+
"litellm_provider": "voyage",
|
|
26197
|
+
"max_input_tokens": 32000,
|
|
26198
|
+
"max_tokens": 32000,
|
|
26199
|
+
"mode": "embedding",
|
|
26200
|
+
"output_cost_per_token": 0.0
|
|
26201
|
+
},
|
|
26202
|
+
"runwayml/eleven_multilingual_v2": {
|
|
26203
|
+
"litellm_provider": "runwayml",
|
|
26204
|
+
"mode": "audio_speech",
|
|
26205
|
+
"input_cost_per_character": 3e-07,
|
|
26206
|
+
"source": "https://docs.dev.runwayml.com/guides/pricing/",
|
|
26207
|
+
"metadata": {
|
|
26208
|
+
"comment": "Estimated cost based on standard TTS pricing. RunwayML uses ElevenLabs models."
|
|
26209
|
+
}
|
|
26210
|
+
},
|
|
26211
|
+
"fal_ai/fal-ai/flux-pro/v1.1": {
|
|
26212
|
+
"litellm_provider": "fal_ai",
|
|
26213
|
+
"mode": "image_generation",
|
|
26214
|
+
"output_cost_per_image": 0.04,
|
|
26215
|
+
"supported_endpoints": [
|
|
26216
|
+
"/v1/images/generations"
|
|
26217
|
+
]
|
|
26218
|
+
},
|
|
26219
|
+
"fal_ai/fal-ai/bytedance/seedream/v3/text-to-image": {
|
|
26220
|
+
"litellm_provider": "fal_ai",
|
|
26221
|
+
"mode": "image_generation",
|
|
26222
|
+
"output_cost_per_image": 0.03,
|
|
26223
|
+
"supported_endpoints": [
|
|
26224
|
+
"/v1/images/generations"
|
|
26225
|
+
]
|
|
26226
|
+
},
|
|
26227
|
+
"fal_ai/fal-ai/bytedance/dreamina/v3.1/text-to-image": {
|
|
26228
|
+
"litellm_provider": "fal_ai",
|
|
26229
|
+
"mode": "image_generation",
|
|
26230
|
+
"output_cost_per_image": 0.03,
|
|
26231
|
+
"supported_endpoints": [
|
|
26232
|
+
"/v1/images/generations"
|
|
26233
|
+
]
|
|
26234
|
+
},
|
|
26235
|
+
"fal_ai/fal-ai/ideogram/v3": {
|
|
26236
|
+
"litellm_provider": "fal_ai",
|
|
26237
|
+
"mode": "image_generation",
|
|
26238
|
+
"output_cost_per_image": 0.06,
|
|
26239
|
+
"supported_endpoints": [
|
|
26240
|
+
"/v1/images/generations"
|
|
26241
|
+
]
|
|
26242
|
+
},
|
|
26243
|
+
"vertex_ai/moonshotai/kimi-k2-thinking-maas": {
|
|
26244
|
+
"input_cost_per_token": 6e-07,
|
|
26245
|
+
"litellm_provider": "vertex_ai-moonshot_models",
|
|
26246
|
+
"max_input_tokens": 256000,
|
|
26247
|
+
"max_output_tokens": 256000,
|
|
26248
|
+
"max_tokens": 256000,
|
|
26249
|
+
"mode": "chat",
|
|
26250
|
+
"output_cost_per_token": 2.5e-06,
|
|
26251
|
+
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models",
|
|
26252
|
+
"supports_function_calling": true,
|
|
26253
|
+
"supports_tool_choice": true,
|
|
26254
|
+
"supports_web_search": true
|
|
26255
|
+
},
|
|
26256
|
+
"azure/eu/gpt-5-2025-08-07": {
|
|
26257
|
+
"cache_read_input_token_cost": 1.375e-07,
|
|
26258
|
+
"input_cost_per_token": 1.375e-06,
|
|
26259
|
+
"litellm_provider": "azure",
|
|
26260
|
+
"max_input_tokens": 272000,
|
|
26261
|
+
"max_output_tokens": 128000,
|
|
26262
|
+
"max_tokens": 128000,
|
|
26263
|
+
"mode": "chat",
|
|
26264
|
+
"output_cost_per_token": 1.1e-05,
|
|
26265
|
+
"supported_endpoints": [
|
|
26266
|
+
"/v1/chat/completions",
|
|
26267
|
+
"/v1/batch",
|
|
26268
|
+
"/v1/responses"
|
|
26269
|
+
],
|
|
26270
|
+
"supported_modalities": [
|
|
26271
|
+
"text",
|
|
26272
|
+
"image"
|
|
26273
|
+
],
|
|
26274
|
+
"supported_output_modalities": [
|
|
26275
|
+
"text"
|
|
26276
|
+
],
|
|
26277
|
+
"supports_function_calling": true,
|
|
26278
|
+
"supports_native_streaming": true,
|
|
26279
|
+
"supports_parallel_function_calling": true,
|
|
26280
|
+
"supports_pdf_input": true,
|
|
26281
|
+
"supports_prompt_caching": true,
|
|
26282
|
+
"supports_reasoning": true,
|
|
26283
|
+
"supports_response_schema": true,
|
|
26284
|
+
"supports_system_messages": true,
|
|
26285
|
+
"supports_tool_choice": true,
|
|
26286
|
+
"supports_vision": true
|
|
26287
|
+
},
|
|
26288
|
+
"azure/eu/gpt-5-mini-2025-08-07": {
|
|
26289
|
+
"cache_read_input_token_cost": 2.75e-08,
|
|
26290
|
+
"input_cost_per_token": 2.75e-07,
|
|
26291
|
+
"litellm_provider": "azure",
|
|
26292
|
+
"max_input_tokens": 272000,
|
|
26293
|
+
"max_output_tokens": 128000,
|
|
26294
|
+
"max_tokens": 128000,
|
|
26295
|
+
"mode": "chat",
|
|
26296
|
+
"output_cost_per_token": 2.2e-06,
|
|
26297
|
+
"supported_endpoints": [
|
|
26298
|
+
"/v1/chat/completions",
|
|
26299
|
+
"/v1/batch",
|
|
26300
|
+
"/v1/responses"
|
|
26301
|
+
],
|
|
26302
|
+
"supported_modalities": [
|
|
26303
|
+
"text",
|
|
26304
|
+
"image"
|
|
26305
|
+
],
|
|
26306
|
+
"supported_output_modalities": [
|
|
26307
|
+
"text"
|
|
26308
|
+
],
|
|
26309
|
+
"supports_function_calling": true,
|
|
26310
|
+
"supports_native_streaming": true,
|
|
26311
|
+
"supports_parallel_function_calling": true,
|
|
26312
|
+
"supports_pdf_input": true,
|
|
26313
|
+
"supports_prompt_caching": true,
|
|
26314
|
+
"supports_reasoning": true,
|
|
26315
|
+
"supports_response_schema": true,
|
|
26316
|
+
"supports_system_messages": true,
|
|
26317
|
+
"supports_tool_choice": true,
|
|
26318
|
+
"supports_vision": true
|
|
26319
|
+
},
|
|
26320
|
+
"azure/eu/gpt-5-nano-2025-08-07": {
|
|
26321
|
+
"cache_read_input_token_cost": 5.5e-09,
|
|
26322
|
+
"input_cost_per_token": 5.5e-08,
|
|
26323
|
+
"litellm_provider": "azure",
|
|
26324
|
+
"max_input_tokens": 272000,
|
|
26325
|
+
"max_output_tokens": 128000,
|
|
26326
|
+
"max_tokens": 128000,
|
|
26327
|
+
"mode": "chat",
|
|
26328
|
+
"output_cost_per_token": 4.4e-07,
|
|
26329
|
+
"supported_endpoints": [
|
|
26330
|
+
"/v1/chat/completions",
|
|
26331
|
+
"/v1/batch",
|
|
26332
|
+
"/v1/responses"
|
|
26333
|
+
],
|
|
26334
|
+
"supported_modalities": [
|
|
26335
|
+
"text",
|
|
26336
|
+
"image"
|
|
26337
|
+
],
|
|
26338
|
+
"supported_output_modalities": [
|
|
26339
|
+
"text"
|
|
26340
|
+
],
|
|
26341
|
+
"supports_function_calling": true,
|
|
26342
|
+
"supports_native_streaming": true,
|
|
26343
|
+
"supports_parallel_function_calling": true,
|
|
26344
|
+
"supports_pdf_input": true,
|
|
26345
|
+
"supports_prompt_caching": true,
|
|
26346
|
+
"supports_reasoning": true,
|
|
26347
|
+
"supports_response_schema": true,
|
|
26348
|
+
"supports_system_messages": true,
|
|
26349
|
+
"supports_tool_choice": true,
|
|
26350
|
+
"supports_vision": true
|
|
26351
|
+
},
|
|
26352
|
+
"azure/us/gpt-4.1-2025-04-14": {
|
|
26353
|
+
"deprecation_date": "2026-11-04",
|
|
26354
|
+
"cache_read_input_token_cost": 5.5e-07,
|
|
26355
|
+
"input_cost_per_token": 2.2e-06,
|
|
26356
|
+
"input_cost_per_token_batches": 1.1e-06,
|
|
26357
|
+
"litellm_provider": "azure",
|
|
26358
|
+
"max_input_tokens": 1047576,
|
|
26359
|
+
"max_output_tokens": 32768,
|
|
26360
|
+
"max_tokens": 32768,
|
|
26361
|
+
"mode": "chat",
|
|
26362
|
+
"output_cost_per_token": 8.8e-06,
|
|
26363
|
+
"output_cost_per_token_batches": 4.4e-06,
|
|
26364
|
+
"supported_endpoints": [
|
|
26365
|
+
"/v1/chat/completions",
|
|
26366
|
+
"/v1/batch",
|
|
26367
|
+
"/v1/responses"
|
|
26368
|
+
],
|
|
26369
|
+
"supported_modalities": [
|
|
26370
|
+
"text",
|
|
26371
|
+
"image"
|
|
26372
|
+
],
|
|
26373
|
+
"supported_output_modalities": [
|
|
26374
|
+
"text"
|
|
26375
|
+
],
|
|
26376
|
+
"supports_function_calling": true,
|
|
26377
|
+
"supports_native_streaming": true,
|
|
26378
|
+
"supports_parallel_function_calling": true,
|
|
26379
|
+
"supports_prompt_caching": true,
|
|
26380
|
+
"supports_response_schema": true,
|
|
26381
|
+
"supports_system_messages": true,
|
|
26382
|
+
"supports_tool_choice": true,
|
|
26383
|
+
"supports_vision": true,
|
|
26384
|
+
"supports_web_search": false
|
|
26385
|
+
},
|
|
26386
|
+
"azure/us/gpt-4.1-mini-2025-04-14": {
|
|
26387
|
+
"deprecation_date": "2026-11-04",
|
|
26388
|
+
"cache_read_input_token_cost": 1.1e-07,
|
|
26389
|
+
"input_cost_per_token": 4.4e-07,
|
|
26390
|
+
"input_cost_per_token_batches": 2.2e-07,
|
|
26391
|
+
"litellm_provider": "azure",
|
|
26392
|
+
"max_input_tokens": 1047576,
|
|
26393
|
+
"max_output_tokens": 32768,
|
|
26394
|
+
"max_tokens": 32768,
|
|
26395
|
+
"mode": "chat",
|
|
26396
|
+
"output_cost_per_token": 1.76e-06,
|
|
26397
|
+
"output_cost_per_token_batches": 8.8e-07,
|
|
26398
|
+
"supported_endpoints": [
|
|
26399
|
+
"/v1/chat/completions",
|
|
26400
|
+
"/v1/batch",
|
|
26401
|
+
"/v1/responses"
|
|
26402
|
+
],
|
|
26403
|
+
"supported_modalities": [
|
|
26404
|
+
"text",
|
|
26405
|
+
"image"
|
|
26406
|
+
],
|
|
26407
|
+
"supported_output_modalities": [
|
|
26408
|
+
"text"
|
|
26409
|
+
],
|
|
26410
|
+
"supports_function_calling": true,
|
|
26411
|
+
"supports_native_streaming": true,
|
|
26412
|
+
"supports_parallel_function_calling": true,
|
|
26413
|
+
"supports_prompt_caching": true,
|
|
26414
|
+
"supports_response_schema": true,
|
|
26415
|
+
"supports_system_messages": true,
|
|
26416
|
+
"supports_tool_choice": true,
|
|
26417
|
+
"supports_vision": true,
|
|
26418
|
+
"supports_web_search": false
|
|
26419
|
+
},
|
|
26420
|
+
"azure/us/gpt-4.1-nano-2025-04-14": {
|
|
26421
|
+
"deprecation_date": "2026-11-04",
|
|
26422
|
+
"cache_read_input_token_cost": 2.5e-08,
|
|
26423
|
+
"input_cost_per_token": 1.1e-07,
|
|
26424
|
+
"input_cost_per_token_batches": 6e-08,
|
|
26425
|
+
"litellm_provider": "azure",
|
|
26426
|
+
"max_input_tokens": 1047576,
|
|
26427
|
+
"max_output_tokens": 32768,
|
|
26428
|
+
"max_tokens": 32768,
|
|
26429
|
+
"mode": "chat",
|
|
26430
|
+
"output_cost_per_token": 4.4e-07,
|
|
26431
|
+
"output_cost_per_token_batches": 2.2e-07,
|
|
26432
|
+
"supported_endpoints": [
|
|
26433
|
+
"/v1/chat/completions",
|
|
26434
|
+
"/v1/batch",
|
|
26435
|
+
"/v1/responses"
|
|
26436
|
+
],
|
|
26437
|
+
"supported_modalities": [
|
|
26438
|
+
"text",
|
|
26439
|
+
"image"
|
|
26440
|
+
],
|
|
26441
|
+
"supported_output_modalities": [
|
|
26442
|
+
"text"
|
|
26443
|
+
],
|
|
26444
|
+
"supports_function_calling": true,
|
|
26445
|
+
"supports_native_streaming": true,
|
|
26446
|
+
"supports_parallel_function_calling": true,
|
|
26447
|
+
"supports_prompt_caching": true,
|
|
26448
|
+
"supports_response_schema": true,
|
|
26449
|
+
"supports_system_messages": true,
|
|
26450
|
+
"supports_tool_choice": true,
|
|
26451
|
+
"supports_vision": true
|
|
26452
|
+
},
|
|
26453
|
+
"azure/us/gpt-5-2025-08-07": {
|
|
26454
|
+
"cache_read_input_token_cost": 1.375e-07,
|
|
26455
|
+
"input_cost_per_token": 1.375e-06,
|
|
26456
|
+
"litellm_provider": "azure",
|
|
26457
|
+
"max_input_tokens": 272000,
|
|
26458
|
+
"max_output_tokens": 128000,
|
|
26459
|
+
"max_tokens": 128000,
|
|
26460
|
+
"mode": "chat",
|
|
26461
|
+
"output_cost_per_token": 1.1e-05,
|
|
26462
|
+
"supported_endpoints": [
|
|
26463
|
+
"/v1/chat/completions",
|
|
26464
|
+
"/v1/batch",
|
|
26465
|
+
"/v1/responses"
|
|
26466
|
+
],
|
|
26467
|
+
"supported_modalities": [
|
|
26468
|
+
"text",
|
|
26469
|
+
"image"
|
|
26470
|
+
],
|
|
26471
|
+
"supported_output_modalities": [
|
|
26472
|
+
"text"
|
|
26473
|
+
],
|
|
26474
|
+
"supports_function_calling": true,
|
|
26475
|
+
"supports_native_streaming": true,
|
|
26476
|
+
"supports_parallel_function_calling": true,
|
|
26477
|
+
"supports_pdf_input": true,
|
|
26478
|
+
"supports_prompt_caching": true,
|
|
26479
|
+
"supports_reasoning": true,
|
|
26480
|
+
"supports_response_schema": true,
|
|
26481
|
+
"supports_system_messages": true,
|
|
26482
|
+
"supports_tool_choice": true,
|
|
26483
|
+
"supports_vision": true
|
|
26484
|
+
},
|
|
26485
|
+
"azure/us/gpt-5-mini-2025-08-07": {
|
|
26486
|
+
"cache_read_input_token_cost": 2.75e-08,
|
|
26487
|
+
"input_cost_per_token": 2.75e-07,
|
|
26488
|
+
"litellm_provider": "azure",
|
|
26489
|
+
"max_input_tokens": 272000,
|
|
26490
|
+
"max_output_tokens": 128000,
|
|
26491
|
+
"max_tokens": 128000,
|
|
26492
|
+
"mode": "chat",
|
|
26493
|
+
"output_cost_per_token": 2.2e-06,
|
|
26494
|
+
"supported_endpoints": [
|
|
26495
|
+
"/v1/chat/completions",
|
|
26496
|
+
"/v1/batch",
|
|
26497
|
+
"/v1/responses"
|
|
26498
|
+
],
|
|
26499
|
+
"supported_modalities": [
|
|
26500
|
+
"text",
|
|
26501
|
+
"image"
|
|
26502
|
+
],
|
|
26503
|
+
"supported_output_modalities": [
|
|
26504
|
+
"text"
|
|
26505
|
+
],
|
|
26506
|
+
"supports_function_calling": true,
|
|
26507
|
+
"supports_native_streaming": true,
|
|
26508
|
+
"supports_parallel_function_calling": true,
|
|
26509
|
+
"supports_pdf_input": true,
|
|
26510
|
+
"supports_prompt_caching": true,
|
|
26511
|
+
"supports_reasoning": true,
|
|
26512
|
+
"supports_response_schema": true,
|
|
26513
|
+
"supports_system_messages": true,
|
|
26514
|
+
"supports_tool_choice": true,
|
|
26515
|
+
"supports_vision": true
|
|
26516
|
+
},
|
|
26517
|
+
"azure/us/gpt-5-nano-2025-08-07": {
|
|
26518
|
+
"cache_read_input_token_cost": 5.5e-09,
|
|
26519
|
+
"input_cost_per_token": 5.5e-08,
|
|
26520
|
+
"litellm_provider": "azure",
|
|
26521
|
+
"max_input_tokens": 272000,
|
|
26522
|
+
"max_output_tokens": 128000,
|
|
26523
|
+
"max_tokens": 128000,
|
|
26524
|
+
"mode": "chat",
|
|
26525
|
+
"output_cost_per_token": 4.4e-07,
|
|
26526
|
+
"supported_endpoints": [
|
|
26527
|
+
"/v1/chat/completions",
|
|
26528
|
+
"/v1/batch",
|
|
26529
|
+
"/v1/responses"
|
|
26530
|
+
],
|
|
26531
|
+
"supported_modalities": [
|
|
26532
|
+
"text",
|
|
26533
|
+
"image"
|
|
26534
|
+
],
|
|
26535
|
+
"supported_output_modalities": [
|
|
26536
|
+
"text"
|
|
26537
|
+
],
|
|
26538
|
+
"supports_function_calling": true,
|
|
26539
|
+
"supports_native_streaming": true,
|
|
26540
|
+
"supports_parallel_function_calling": true,
|
|
26541
|
+
"supports_pdf_input": true,
|
|
26542
|
+
"supports_prompt_caching": true,
|
|
26543
|
+
"supports_reasoning": true,
|
|
26544
|
+
"supports_response_schema": true,
|
|
26545
|
+
"supports_system_messages": true,
|
|
26546
|
+
"supports_tool_choice": true,
|
|
26547
|
+
"supports_vision": true
|
|
26548
|
+
},
|
|
26549
|
+
"azure/us/o3-2025-04-16": {
|
|
26550
|
+
"deprecation_date": "2026-04-16",
|
|
26551
|
+
"cache_read_input_token_cost": 5.5e-07,
|
|
26552
|
+
"input_cost_per_token": 2.2e-06,
|
|
26553
|
+
"litellm_provider": "azure",
|
|
26554
|
+
"max_input_tokens": 200000,
|
|
26555
|
+
"max_output_tokens": 100000,
|
|
26556
|
+
"max_tokens": 100000,
|
|
26557
|
+
"mode": "chat",
|
|
26558
|
+
"output_cost_per_token": 8.8e-06,
|
|
26559
|
+
"supported_endpoints": [
|
|
26560
|
+
"/v1/chat/completions",
|
|
26561
|
+
"/v1/batch",
|
|
26562
|
+
"/v1/responses"
|
|
26563
|
+
],
|
|
26564
|
+
"supported_modalities": [
|
|
26565
|
+
"text",
|
|
26566
|
+
"image"
|
|
26567
|
+
],
|
|
26568
|
+
"supported_output_modalities": [
|
|
26569
|
+
"text"
|
|
26570
|
+
],
|
|
26571
|
+
"supports_function_calling": true,
|
|
26572
|
+
"supports_parallel_function_calling": false,
|
|
26573
|
+
"supports_prompt_caching": true,
|
|
26574
|
+
"supports_reasoning": true,
|
|
26575
|
+
"supports_response_schema": true,
|
|
26576
|
+
"supports_tool_choice": true,
|
|
26577
|
+
"supports_vision": true
|
|
26578
|
+
},
|
|
26579
|
+
"azure/us/o4-mini-2025-04-16": {
|
|
26580
|
+
"cache_read_input_token_cost": 3.1e-07,
|
|
26581
|
+
"input_cost_per_token": 1.21e-06,
|
|
26582
|
+
"litellm_provider": "azure",
|
|
26583
|
+
"max_input_tokens": 200000,
|
|
26584
|
+
"max_output_tokens": 100000,
|
|
26585
|
+
"max_tokens": 100000,
|
|
26586
|
+
"mode": "chat",
|
|
26587
|
+
"output_cost_per_token": 4.84e-06,
|
|
26588
|
+
"supports_function_calling": true,
|
|
26589
|
+
"supports_parallel_function_calling": false,
|
|
26590
|
+
"supports_prompt_caching": true,
|
|
26591
|
+
"supports_reasoning": true,
|
|
26592
|
+
"supports_response_schema": true,
|
|
26593
|
+
"supports_tool_choice": true,
|
|
26594
|
+
"supports_vision": true
|
|
26595
|
+
},
|
|
26596
|
+
"fireworks_ai/accounts/fireworks/models/deepseek-v3p1-terminus": {
|
|
26597
|
+
"input_cost_per_token": 5.6e-07,
|
|
26598
|
+
"litellm_provider": "fireworks_ai",
|
|
26599
|
+
"max_input_tokens": 128000,
|
|
26600
|
+
"max_output_tokens": 8192,
|
|
26601
|
+
"max_tokens": 8192,
|
|
26602
|
+
"mode": "chat",
|
|
26603
|
+
"output_cost_per_token": 1.68e-06,
|
|
26604
|
+
"source": "https://fireworks.ai/pricing",
|
|
26605
|
+
"supports_response_schema": true,
|
|
26606
|
+
"supports_tool_choice": true
|
|
26607
|
+
},
|
|
26608
|
+
"fireworks_ai/accounts/fireworks/models/kimi-k2-thinking": {
|
|
26609
|
+
"input_cost_per_token": 6e-07,
|
|
26610
|
+
"litellm_provider": "fireworks_ai",
|
|
26611
|
+
"max_input_tokens": 262144,
|
|
26612
|
+
"max_output_tokens": 262144,
|
|
26613
|
+
"max_tokens": 262144,
|
|
26614
|
+
"mode": "chat",
|
|
26615
|
+
"output_cost_per_token": 2.5e-06,
|
|
26616
|
+
"source": "https://fireworks.ai/pricing",
|
|
26617
|
+
"supports_function_calling": true,
|
|
26618
|
+
"supports_response_schema": true,
|
|
26619
|
+
"supports_tool_choice": true,
|
|
26620
|
+
"supports_web_search": true
|
|
26621
|
+
},
|
|
26622
|
+
"gemini-3-pro-preview": {
|
|
26623
|
+
"cache_read_input_token_cost": 2e-07,
|
|
26624
|
+
"cache_read_input_token_cost_above_200k_tokens": 4e-07,
|
|
26625
|
+
"cache_creation_input_token_cost_above_200k_tokens": 2.5e-07,
|
|
26626
|
+
"input_cost_per_token": 2e-06,
|
|
26627
|
+
"input_cost_per_token_above_200k_tokens": 4e-06,
|
|
26628
|
+
"input_cost_per_token_batches": 1e-06,
|
|
26629
|
+
"litellm_provider": "vertex_ai-language-models",
|
|
26630
|
+
"max_audio_length_hours": 8.4,
|
|
26631
|
+
"max_audio_per_prompt": 1,
|
|
26632
|
+
"max_images_per_prompt": 3000,
|
|
26633
|
+
"max_input_tokens": 1048576,
|
|
26634
|
+
"max_output_tokens": 65535,
|
|
26635
|
+
"max_pdf_size_mb": 30,
|
|
26636
|
+
"max_tokens": 65535,
|
|
26637
|
+
"max_video_length": 1,
|
|
26638
|
+
"max_videos_per_prompt": 10,
|
|
26639
|
+
"mode": "chat",
|
|
26640
|
+
"output_cost_per_token": 1.2e-05,
|
|
26641
|
+
"output_cost_per_token_above_200k_tokens": 1.8e-05,
|
|
26642
|
+
"output_cost_per_token_batches": 6e-06,
|
|
26643
|
+
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
|
|
26644
|
+
"supported_endpoints": [
|
|
26645
|
+
"/v1/chat/completions",
|
|
26646
|
+
"/v1/completions",
|
|
26647
|
+
"/v1/batch"
|
|
26648
|
+
],
|
|
26649
|
+
"supported_modalities": [
|
|
26650
|
+
"text",
|
|
26651
|
+
"image",
|
|
26652
|
+
"audio",
|
|
26653
|
+
"video"
|
|
26654
|
+
],
|
|
26655
|
+
"supported_output_modalities": [
|
|
26656
|
+
"text"
|
|
26657
|
+
],
|
|
26658
|
+
"supports_audio_input": true,
|
|
26659
|
+
"supports_function_calling": true,
|
|
26660
|
+
"supports_pdf_input": true,
|
|
26661
|
+
"supports_prompt_caching": true,
|
|
26662
|
+
"supports_reasoning": true,
|
|
26663
|
+
"supports_response_schema": true,
|
|
26664
|
+
"supports_system_messages": true,
|
|
26665
|
+
"supports_tool_choice": true,
|
|
26666
|
+
"supports_video_input": true,
|
|
26667
|
+
"supports_vision": true,
|
|
26668
|
+
"supports_web_search": true
|
|
26669
|
+
},
|
|
26670
|
+
"gemini/gemini-3-pro-preview": {
|
|
26671
|
+
"cache_read_input_token_cost": 2e-07,
|
|
26672
|
+
"cache_read_input_token_cost_above_200k_tokens": 4e-07,
|
|
26673
|
+
"input_cost_per_token": 2e-06,
|
|
26674
|
+
"input_cost_per_token_above_200k_tokens": 4e-06,
|
|
26675
|
+
"input_cost_per_token_batches": 1e-06,
|
|
26676
|
+
"litellm_provider": "gemini",
|
|
26677
|
+
"max_audio_length_hours": 8.4,
|
|
26678
|
+
"max_audio_per_prompt": 1,
|
|
26679
|
+
"max_images_per_prompt": 3000,
|
|
26680
|
+
"max_input_tokens": 1048576,
|
|
26681
|
+
"max_output_tokens": 65535,
|
|
26682
|
+
"max_pdf_size_mb": 30,
|
|
26683
|
+
"max_tokens": 65535,
|
|
26684
|
+
"max_video_length": 1,
|
|
26685
|
+
"max_videos_per_prompt": 10,
|
|
26686
|
+
"mode": "chat",
|
|
26687
|
+
"output_cost_per_token": 1.2e-05,
|
|
26688
|
+
"output_cost_per_token_above_200k_tokens": 1.8e-05,
|
|
26689
|
+
"output_cost_per_token_batches": 6e-06,
|
|
26690
|
+
"rpm": 2000,
|
|
26691
|
+
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
|
|
26692
|
+
"supported_endpoints": [
|
|
26693
|
+
"/v1/chat/completions",
|
|
26694
|
+
"/v1/completions",
|
|
26695
|
+
"/v1/batch"
|
|
26696
|
+
],
|
|
26697
|
+
"supported_modalities": [
|
|
26698
|
+
"text",
|
|
26699
|
+
"image",
|
|
26700
|
+
"audio",
|
|
26701
|
+
"video"
|
|
26702
|
+
],
|
|
26703
|
+
"supported_output_modalities": [
|
|
26704
|
+
"text"
|
|
26705
|
+
],
|
|
26706
|
+
"supports_audio_input": true,
|
|
26707
|
+
"supports_function_calling": true,
|
|
26708
|
+
"supports_pdf_input": true,
|
|
26709
|
+
"supports_prompt_caching": true,
|
|
26710
|
+
"supports_reasoning": true,
|
|
26711
|
+
"supports_response_schema": true,
|
|
26712
|
+
"supports_system_messages": true,
|
|
26713
|
+
"supports_tool_choice": true,
|
|
26714
|
+
"supports_video_input": true,
|
|
26715
|
+
"supports_vision": true,
|
|
26716
|
+
"supports_web_search": true,
|
|
26717
|
+
"tpm": 800000
|
|
26718
|
+
},
|
|
26719
|
+
"vertex_ai/veo-3.0-fast-generate-001": {
|
|
26720
|
+
"litellm_provider": "vertex_ai-video-models",
|
|
26721
|
+
"max_input_tokens": 1024,
|
|
26722
|
+
"max_tokens": 1024,
|
|
26723
|
+
"mode": "video_generation",
|
|
26724
|
+
"output_cost_per_second": 0.15,
|
|
26725
|
+
"source": "https://ai.google.dev/gemini-api/docs/video",
|
|
26726
|
+
"supported_modalities": [
|
|
26727
|
+
"text"
|
|
26728
|
+
],
|
|
26729
|
+
"supported_output_modalities": [
|
|
26730
|
+
"video"
|
|
26731
|
+
]
|
|
26732
|
+
},
|
|
26733
|
+
"vertex_ai/veo-3.0-generate-001": {
|
|
26734
|
+
"litellm_provider": "vertex_ai-video-models",
|
|
26735
|
+
"max_input_tokens": 1024,
|
|
26736
|
+
"max_tokens": 1024,
|
|
26737
|
+
"mode": "video_generation",
|
|
26738
|
+
"output_cost_per_second": 0.4,
|
|
26739
|
+
"source": "https://ai.google.dev/gemini-api/docs/video",
|
|
26740
|
+
"supported_modalities": [
|
|
26741
|
+
"text"
|
|
26742
|
+
],
|
|
26743
|
+
"supported_output_modalities": [
|
|
26744
|
+
"video"
|
|
26745
|
+
]
|
|
26746
|
+
},
|
|
26747
|
+
"azure/gpt-audio-2025-08-28": {
|
|
26748
|
+
"input_cost_per_audio_token": 4e-05,
|
|
26749
|
+
"input_cost_per_token": 2.5e-06,
|
|
26750
|
+
"litellm_provider": "azure",
|
|
26751
|
+
"max_input_tokens": 128000,
|
|
26752
|
+
"max_output_tokens": 16384,
|
|
26753
|
+
"max_tokens": 16384,
|
|
26754
|
+
"mode": "chat",
|
|
26755
|
+
"output_cost_per_audio_token": 8e-05,
|
|
26756
|
+
"output_cost_per_token": 1e-05,
|
|
26757
|
+
"supported_endpoints": [
|
|
26758
|
+
"/v1/chat/completions"
|
|
26759
|
+
],
|
|
26760
|
+
"supported_modalities": [
|
|
26761
|
+
"text",
|
|
26762
|
+
"audio"
|
|
26763
|
+
],
|
|
26764
|
+
"supported_output_modalities": [
|
|
26765
|
+
"text",
|
|
26766
|
+
"audio"
|
|
26767
|
+
],
|
|
26768
|
+
"supports_function_calling": true,
|
|
26769
|
+
"supports_native_streaming": true,
|
|
26770
|
+
"supports_parallel_function_calling": true,
|
|
26771
|
+
"supports_prompt_caching": false,
|
|
26772
|
+
"supports_reasoning": false,
|
|
26773
|
+
"supports_response_schema": false,
|
|
26774
|
+
"supports_system_messages": true,
|
|
26775
|
+
"supports_tool_choice": true,
|
|
26776
|
+
"supports_vision": false
|
|
26777
|
+
},
|
|
26778
|
+
"azure/gpt-audio-mini-2025-10-06": {
|
|
26779
|
+
"input_cost_per_audio_token": 1e-05,
|
|
26780
|
+
"input_cost_per_token": 6e-07,
|
|
26781
|
+
"litellm_provider": "azure",
|
|
26782
|
+
"max_input_tokens": 128000,
|
|
26783
|
+
"max_output_tokens": 16384,
|
|
26784
|
+
"max_tokens": 16384,
|
|
26785
|
+
"mode": "chat",
|
|
26786
|
+
"output_cost_per_audio_token": 2e-05,
|
|
26787
|
+
"output_cost_per_token": 2.4e-06,
|
|
26788
|
+
"supported_endpoints": [
|
|
26789
|
+
"/v1/chat/completions"
|
|
26790
|
+
],
|
|
26791
|
+
"supported_modalities": [
|
|
26792
|
+
"text",
|
|
26793
|
+
"audio"
|
|
26794
|
+
],
|
|
26795
|
+
"supported_output_modalities": [
|
|
26796
|
+
"text",
|
|
26797
|
+
"audio"
|
|
26798
|
+
],
|
|
26799
|
+
"supports_function_calling": true,
|
|
26800
|
+
"supports_native_streaming": true,
|
|
26801
|
+
"supports_parallel_function_calling": true,
|
|
26802
|
+
"supports_prompt_caching": false,
|
|
26803
|
+
"supports_reasoning": false,
|
|
26804
|
+
"supports_response_schema": false,
|
|
26805
|
+
"supports_system_messages": true,
|
|
26806
|
+
"supports_tool_choice": true,
|
|
26807
|
+
"supports_vision": false
|
|
26808
|
+
},
|
|
26809
|
+
"azure/gpt-realtime-2025-08-28": {
|
|
26810
|
+
"cache_creation_input_audio_token_cost": 4e-06,
|
|
26811
|
+
"cache_read_input_token_cost": 4e-06,
|
|
26812
|
+
"input_cost_per_audio_token": 3.2e-05,
|
|
26813
|
+
"input_cost_per_image": 5e-06,
|
|
26814
|
+
"input_cost_per_token": 4e-06,
|
|
26815
|
+
"litellm_provider": "azure",
|
|
26816
|
+
"max_input_tokens": 32000,
|
|
26817
|
+
"max_output_tokens": 4096,
|
|
26818
|
+
"max_tokens": 4096,
|
|
26819
|
+
"mode": "chat",
|
|
26820
|
+
"output_cost_per_audio_token": 6.4e-05,
|
|
26821
|
+
"output_cost_per_token": 1.6e-05,
|
|
26822
|
+
"supported_endpoints": [
|
|
26823
|
+
"/v1/realtime"
|
|
26824
|
+
],
|
|
26825
|
+
"supported_modalities": [
|
|
26826
|
+
"text",
|
|
26827
|
+
"image",
|
|
26828
|
+
"audio"
|
|
26829
|
+
],
|
|
26830
|
+
"supported_output_modalities": [
|
|
26831
|
+
"text",
|
|
26832
|
+
"audio"
|
|
26833
|
+
],
|
|
26834
|
+
"supports_audio_input": true,
|
|
26835
|
+
"supports_audio_output": true,
|
|
26836
|
+
"supports_function_calling": true,
|
|
26837
|
+
"supports_parallel_function_calling": true,
|
|
26838
|
+
"supports_system_messages": true,
|
|
26839
|
+
"supports_tool_choice": true
|
|
26840
|
+
},
|
|
26841
|
+
"azure/gpt-realtime-mini-2025-10-06": {
|
|
26842
|
+
"cache_creation_input_audio_token_cost": 3e-07,
|
|
26843
|
+
"cache_read_input_token_cost": 6e-08,
|
|
26844
|
+
"input_cost_per_audio_token": 1e-05,
|
|
26845
|
+
"input_cost_per_image": 8e-07,
|
|
26846
|
+
"input_cost_per_token": 6e-07,
|
|
26847
|
+
"litellm_provider": "azure",
|
|
26848
|
+
"max_input_tokens": 32000,
|
|
26849
|
+
"max_output_tokens": 4096,
|
|
26850
|
+
"max_tokens": 4096,
|
|
26851
|
+
"mode": "chat",
|
|
26852
|
+
"output_cost_per_audio_token": 2e-05,
|
|
26853
|
+
"output_cost_per_token": 2.4e-06,
|
|
26854
|
+
"supported_endpoints": [
|
|
26855
|
+
"/v1/realtime"
|
|
26856
|
+
],
|
|
26857
|
+
"supported_modalities": [
|
|
26858
|
+
"text",
|
|
26859
|
+
"image",
|
|
26860
|
+
"audio"
|
|
26861
|
+
],
|
|
26862
|
+
"supported_output_modalities": [
|
|
26863
|
+
"text",
|
|
26864
|
+
"audio"
|
|
26865
|
+
],
|
|
26866
|
+
"supports_audio_input": true,
|
|
26867
|
+
"supports_audio_output": true,
|
|
26868
|
+
"supports_function_calling": true,
|
|
26869
|
+
"supports_parallel_function_calling": true,
|
|
26870
|
+
"supports_system_messages": true,
|
|
26871
|
+
"supports_tool_choice": true
|
|
26872
|
+
},
|
|
26873
|
+
"azure/gpt-4o-transcribe-diarize": {
|
|
26874
|
+
"input_cost_per_audio_token": 6e-06,
|
|
26875
|
+
"input_cost_per_token": 2.5e-06,
|
|
26876
|
+
"litellm_provider": "azure",
|
|
26877
|
+
"max_input_tokens": 16000,
|
|
26878
|
+
"max_output_tokens": 2000,
|
|
26879
|
+
"mode": "audio_transcription",
|
|
26880
|
+
"output_cost_per_token": 1e-05,
|
|
26881
|
+
"supported_endpoints": [
|
|
26882
|
+
"/v1/audio/transcriptions"
|
|
26883
|
+
]
|
|
26884
|
+
},
|
|
26885
|
+
"azure/gpt-5.1-2025-11-13": {
|
|
26886
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
26887
|
+
"cache_read_input_token_cost_priority": 2.5e-07,
|
|
26888
|
+
"input_cost_per_token": 1.25e-06,
|
|
26889
|
+
"input_cost_per_token_priority": 2.5e-06,
|
|
26890
|
+
"litellm_provider": "azure",
|
|
26891
|
+
"max_input_tokens": 272000,
|
|
26892
|
+
"max_output_tokens": 128000,
|
|
26893
|
+
"max_tokens": 128000,
|
|
26894
|
+
"mode": "chat",
|
|
26895
|
+
"output_cost_per_token": 1e-05,
|
|
26896
|
+
"output_cost_per_token_priority": 2e-05,
|
|
26897
|
+
"supported_endpoints": [
|
|
26898
|
+
"/v1/chat/completions",
|
|
26899
|
+
"/v1/responses"
|
|
26900
|
+
],
|
|
26901
|
+
"supported_modalities": [
|
|
26902
|
+
"text",
|
|
26903
|
+
"image"
|
|
26904
|
+
],
|
|
26905
|
+
"supported_output_modalities": [
|
|
26906
|
+
"text",
|
|
26907
|
+
"image"
|
|
26908
|
+
],
|
|
26909
|
+
"supports_function_calling": true,
|
|
26910
|
+
"supports_native_streaming": true,
|
|
26911
|
+
"supports_parallel_function_calling": true,
|
|
26912
|
+
"supports_pdf_input": true,
|
|
26913
|
+
"supports_prompt_caching": true,
|
|
26914
|
+
"supports_reasoning": true,
|
|
26915
|
+
"supports_response_schema": true,
|
|
26916
|
+
"supports_system_messages": true,
|
|
26917
|
+
"supports_tool_choice": true,
|
|
26918
|
+
"supports_service_tier": true,
|
|
26919
|
+
"supports_vision": true
|
|
26920
|
+
},
|
|
26921
|
+
"azure/gpt-5.1-chat-2025-11-13": {
|
|
26922
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
26923
|
+
"cache_read_input_token_cost_priority": 2.5e-07,
|
|
26924
|
+
"input_cost_per_token": 1.25e-06,
|
|
26925
|
+
"input_cost_per_token_priority": 2.5e-06,
|
|
26926
|
+
"litellm_provider": "azure",
|
|
26927
|
+
"max_input_tokens": 128000,
|
|
26928
|
+
"max_output_tokens": 16384,
|
|
26929
|
+
"max_tokens": 16384,
|
|
26930
|
+
"mode": "chat",
|
|
26931
|
+
"output_cost_per_token": 1e-05,
|
|
26932
|
+
"output_cost_per_token_priority": 2e-05,
|
|
26933
|
+
"supported_endpoints": [
|
|
26934
|
+
"/v1/chat/completions",
|
|
26935
|
+
"/v1/responses"
|
|
26936
|
+
],
|
|
26937
|
+
"supported_modalities": [
|
|
26938
|
+
"text",
|
|
26939
|
+
"image"
|
|
26940
|
+
],
|
|
26941
|
+
"supported_output_modalities": [
|
|
26942
|
+
"text",
|
|
26943
|
+
"image"
|
|
26944
|
+
],
|
|
26945
|
+
"supports_function_calling": false,
|
|
26946
|
+
"supports_native_streaming": true,
|
|
26947
|
+
"supports_parallel_function_calling": false,
|
|
26948
|
+
"supports_pdf_input": true,
|
|
26949
|
+
"supports_prompt_caching": true,
|
|
26950
|
+
"supports_reasoning": true,
|
|
26951
|
+
"supports_response_schema": true,
|
|
26952
|
+
"supports_system_messages": true,
|
|
26953
|
+
"supports_tool_choice": false,
|
|
26954
|
+
"supports_vision": true
|
|
26955
|
+
},
|
|
26956
|
+
"azure/gpt-5.1-codex-2025-11-13": {
|
|
26957
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
26958
|
+
"cache_read_input_token_cost_priority": 2.5e-07,
|
|
26959
|
+
"input_cost_per_token": 1.25e-06,
|
|
26960
|
+
"input_cost_per_token_priority": 2.5e-06,
|
|
26961
|
+
"litellm_provider": "azure",
|
|
26962
|
+
"max_input_tokens": 272000,
|
|
26963
|
+
"max_output_tokens": 128000,
|
|
26964
|
+
"max_tokens": 128000,
|
|
26965
|
+
"mode": "responses",
|
|
26966
|
+
"output_cost_per_token": 1e-05,
|
|
26967
|
+
"output_cost_per_token_priority": 2e-05,
|
|
26968
|
+
"supported_endpoints": [
|
|
26969
|
+
"/v1/responses"
|
|
26970
|
+
],
|
|
26971
|
+
"supported_modalities": [
|
|
26972
|
+
"text",
|
|
26973
|
+
"image"
|
|
26974
|
+
],
|
|
26975
|
+
"supported_output_modalities": [
|
|
26976
|
+
"text"
|
|
26977
|
+
],
|
|
26978
|
+
"supports_function_calling": true,
|
|
26979
|
+
"supports_native_streaming": true,
|
|
26980
|
+
"supports_parallel_function_calling": true,
|
|
26981
|
+
"supports_pdf_input": true,
|
|
26982
|
+
"supports_prompt_caching": true,
|
|
26983
|
+
"supports_reasoning": true,
|
|
26984
|
+
"supports_response_schema": true,
|
|
26985
|
+
"supports_system_messages": false,
|
|
26986
|
+
"supports_tool_choice": true,
|
|
26987
|
+
"supports_vision": true
|
|
26988
|
+
},
|
|
26989
|
+
"azure/gpt-5.1-codex-mini-2025-11-13": {
|
|
26990
|
+
"cache_read_input_token_cost": 2.5e-08,
|
|
26991
|
+
"cache_read_input_token_cost_priority": 4.5e-08,
|
|
26992
|
+
"input_cost_per_token": 2.5e-07,
|
|
26993
|
+
"input_cost_per_token_priority": 4.5e-07,
|
|
26994
|
+
"litellm_provider": "azure",
|
|
26995
|
+
"max_input_tokens": 272000,
|
|
26996
|
+
"max_output_tokens": 128000,
|
|
26997
|
+
"max_tokens": 128000,
|
|
26998
|
+
"mode": "responses",
|
|
26999
|
+
"output_cost_per_token": 2e-06,
|
|
27000
|
+
"output_cost_per_token_priority": 3.6e-06,
|
|
27001
|
+
"supported_endpoints": [
|
|
27002
|
+
"/v1/responses"
|
|
27003
|
+
],
|
|
27004
|
+
"supported_modalities": [
|
|
27005
|
+
"text",
|
|
27006
|
+
"image"
|
|
27007
|
+
],
|
|
27008
|
+
"supported_output_modalities": [
|
|
27009
|
+
"text"
|
|
27010
|
+
],
|
|
27011
|
+
"supports_function_calling": true,
|
|
27012
|
+
"supports_native_streaming": true,
|
|
27013
|
+
"supports_parallel_function_calling": true,
|
|
27014
|
+
"supports_pdf_input": true,
|
|
27015
|
+
"supports_prompt_caching": true,
|
|
27016
|
+
"supports_reasoning": true,
|
|
27017
|
+
"supports_response_schema": true,
|
|
27018
|
+
"supports_system_messages": false,
|
|
27019
|
+
"supports_tool_choice": true,
|
|
27020
|
+
"supports_vision": true
|
|
27021
|
+
},
|
|
27022
|
+
"azure/eu/gpt-5.1": {
|
|
27023
|
+
"cache_read_input_token_cost": 1.4e-07,
|
|
27024
|
+
"input_cost_per_token": 1.38e-06,
|
|
27025
|
+
"litellm_provider": "azure",
|
|
27026
|
+
"max_input_tokens": 272000,
|
|
27027
|
+
"max_output_tokens": 128000,
|
|
27028
|
+
"max_tokens": 128000,
|
|
27029
|
+
"mode": "chat",
|
|
27030
|
+
"output_cost_per_token": 1.1e-05,
|
|
27031
|
+
"supported_endpoints": [
|
|
27032
|
+
"/v1/chat/completions",
|
|
27033
|
+
"/v1/batch",
|
|
27034
|
+
"/v1/responses"
|
|
27035
|
+
],
|
|
27036
|
+
"supported_modalities": [
|
|
27037
|
+
"text",
|
|
27038
|
+
"image"
|
|
27039
|
+
],
|
|
27040
|
+
"supported_output_modalities": [
|
|
27041
|
+
"text",
|
|
27042
|
+
"image"
|
|
27043
|
+
],
|
|
27044
|
+
"supports_function_calling": true,
|
|
27045
|
+
"supports_native_streaming": true,
|
|
27046
|
+
"supports_parallel_function_calling": true,
|
|
27047
|
+
"supports_pdf_input": true,
|
|
27048
|
+
"supports_prompt_caching": true,
|
|
27049
|
+
"supports_reasoning": true,
|
|
27050
|
+
"supports_response_schema": true,
|
|
27051
|
+
"supports_system_messages": true,
|
|
27052
|
+
"supports_tool_choice": true,
|
|
27053
|
+
"supports_vision": true
|
|
27054
|
+
},
|
|
27055
|
+
"azure/eu/gpt-5.1-chat": {
|
|
27056
|
+
"cache_read_input_token_cost": 1.4e-07,
|
|
27057
|
+
"input_cost_per_token": 1.38e-06,
|
|
27058
|
+
"litellm_provider": "azure",
|
|
27059
|
+
"max_input_tokens": 272000,
|
|
27060
|
+
"max_output_tokens": 128000,
|
|
27061
|
+
"max_tokens": 128000,
|
|
27062
|
+
"mode": "chat",
|
|
27063
|
+
"output_cost_per_token": 1.1e-05,
|
|
27064
|
+
"supported_endpoints": [
|
|
27065
|
+
"/v1/chat/completions",
|
|
27066
|
+
"/v1/batch",
|
|
27067
|
+
"/v1/responses"
|
|
27068
|
+
],
|
|
27069
|
+
"supported_modalities": [
|
|
27070
|
+
"text",
|
|
27071
|
+
"image"
|
|
27072
|
+
],
|
|
27073
|
+
"supported_output_modalities": [
|
|
27074
|
+
"text",
|
|
27075
|
+
"image"
|
|
27076
|
+
],
|
|
27077
|
+
"supports_function_calling": true,
|
|
27078
|
+
"supports_native_streaming": true,
|
|
27079
|
+
"supports_parallel_function_calling": true,
|
|
27080
|
+
"supports_pdf_input": true,
|
|
27081
|
+
"supports_prompt_caching": true,
|
|
27082
|
+
"supports_reasoning": true,
|
|
27083
|
+
"supports_response_schema": true,
|
|
27084
|
+
"supports_system_messages": true,
|
|
27085
|
+
"supports_tool_choice": true,
|
|
27086
|
+
"supports_vision": true
|
|
27087
|
+
},
|
|
27088
|
+
"azure/eu/gpt-5.1-codex": {
|
|
27089
|
+
"cache_read_input_token_cost": 1.4e-07,
|
|
27090
|
+
"input_cost_per_token": 1.38e-06,
|
|
27091
|
+
"litellm_provider": "azure",
|
|
27092
|
+
"max_input_tokens": 272000,
|
|
27093
|
+
"max_output_tokens": 128000,
|
|
27094
|
+
"max_tokens": 128000,
|
|
27095
|
+
"mode": "responses",
|
|
27096
|
+
"output_cost_per_token": 1.1e-05,
|
|
27097
|
+
"supported_endpoints": [
|
|
27098
|
+
"/v1/responses"
|
|
27099
|
+
],
|
|
27100
|
+
"supported_modalities": [
|
|
27101
|
+
"text",
|
|
27102
|
+
"image"
|
|
27103
|
+
],
|
|
27104
|
+
"supported_output_modalities": [
|
|
27105
|
+
"text"
|
|
27106
|
+
],
|
|
27107
|
+
"supports_function_calling": true,
|
|
27108
|
+
"supports_native_streaming": true,
|
|
27109
|
+
"supports_parallel_function_calling": true,
|
|
27110
|
+
"supports_pdf_input": true,
|
|
27111
|
+
"supports_prompt_caching": true,
|
|
27112
|
+
"supports_reasoning": true,
|
|
27113
|
+
"supports_response_schema": true,
|
|
27114
|
+
"supports_system_messages": false,
|
|
27115
|
+
"supports_tool_choice": true,
|
|
27116
|
+
"supports_vision": true
|
|
27117
|
+
},
|
|
27118
|
+
"azure/eu/gpt-5.1-codex-mini": {
|
|
27119
|
+
"cache_read_input_token_cost": 2.8e-08,
|
|
27120
|
+
"input_cost_per_token": 2.75e-07,
|
|
27121
|
+
"litellm_provider": "azure",
|
|
27122
|
+
"max_input_tokens": 272000,
|
|
27123
|
+
"max_output_tokens": 128000,
|
|
27124
|
+
"max_tokens": 128000,
|
|
27125
|
+
"mode": "responses",
|
|
27126
|
+
"output_cost_per_token": 2.2e-06,
|
|
27127
|
+
"supported_endpoints": [
|
|
27128
|
+
"/v1/responses"
|
|
27129
|
+
],
|
|
27130
|
+
"supported_modalities": [
|
|
27131
|
+
"text",
|
|
27132
|
+
"image"
|
|
27133
|
+
],
|
|
27134
|
+
"supported_output_modalities": [
|
|
27135
|
+
"text"
|
|
27136
|
+
],
|
|
27137
|
+
"supports_function_calling": true,
|
|
27138
|
+
"supports_native_streaming": true,
|
|
27139
|
+
"supports_parallel_function_calling": true,
|
|
27140
|
+
"supports_pdf_input": true,
|
|
27141
|
+
"supports_prompt_caching": true,
|
|
27142
|
+
"supports_reasoning": true,
|
|
27143
|
+
"supports_response_schema": true,
|
|
27144
|
+
"supports_system_messages": false,
|
|
27145
|
+
"supports_tool_choice": true,
|
|
27146
|
+
"supports_vision": true
|
|
27147
|
+
},
|
|
27148
|
+
"azure/global/gpt-5.1": {
|
|
27149
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
27150
|
+
"input_cost_per_token": 1.25e-06,
|
|
27151
|
+
"litellm_provider": "azure",
|
|
27152
|
+
"max_input_tokens": 272000,
|
|
27153
|
+
"max_output_tokens": 128000,
|
|
27154
|
+
"max_tokens": 128000,
|
|
27155
|
+
"mode": "chat",
|
|
27156
|
+
"output_cost_per_token": 1e-05,
|
|
27157
|
+
"supported_endpoints": [
|
|
27158
|
+
"/v1/chat/completions",
|
|
27159
|
+
"/v1/batch",
|
|
27160
|
+
"/v1/responses"
|
|
27161
|
+
],
|
|
27162
|
+
"supported_modalities": [
|
|
27163
|
+
"text",
|
|
27164
|
+
"image"
|
|
27165
|
+
],
|
|
27166
|
+
"supported_output_modalities": [
|
|
27167
|
+
"text",
|
|
27168
|
+
"image"
|
|
27169
|
+
],
|
|
27170
|
+
"supports_function_calling": true,
|
|
27171
|
+
"supports_native_streaming": true,
|
|
27172
|
+
"supports_parallel_function_calling": true,
|
|
27173
|
+
"supports_pdf_input": true,
|
|
27174
|
+
"supports_prompt_caching": true,
|
|
27175
|
+
"supports_reasoning": true,
|
|
27176
|
+
"supports_response_schema": true,
|
|
27177
|
+
"supports_system_messages": true,
|
|
27178
|
+
"supports_tool_choice": true,
|
|
27179
|
+
"supports_vision": true
|
|
27180
|
+
},
|
|
27181
|
+
"azure/global/gpt-5.1-chat": {
|
|
27182
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
27183
|
+
"input_cost_per_token": 1.25e-06,
|
|
27184
|
+
"litellm_provider": "azure",
|
|
27185
|
+
"max_input_tokens": 272000,
|
|
27186
|
+
"max_output_tokens": 128000,
|
|
27187
|
+
"max_tokens": 128000,
|
|
27188
|
+
"mode": "chat",
|
|
27189
|
+
"output_cost_per_token": 1e-05,
|
|
27190
|
+
"supported_endpoints": [
|
|
27191
|
+
"/v1/chat/completions",
|
|
27192
|
+
"/v1/batch",
|
|
27193
|
+
"/v1/responses"
|
|
27194
|
+
],
|
|
27195
|
+
"supported_modalities": [
|
|
27196
|
+
"text",
|
|
27197
|
+
"image"
|
|
27198
|
+
],
|
|
27199
|
+
"supported_output_modalities": [
|
|
27200
|
+
"text",
|
|
27201
|
+
"image"
|
|
27202
|
+
],
|
|
27203
|
+
"supports_function_calling": true,
|
|
27204
|
+
"supports_native_streaming": true,
|
|
27205
|
+
"supports_parallel_function_calling": true,
|
|
27206
|
+
"supports_pdf_input": true,
|
|
27207
|
+
"supports_prompt_caching": true,
|
|
27208
|
+
"supports_reasoning": true,
|
|
27209
|
+
"supports_response_schema": true,
|
|
27210
|
+
"supports_system_messages": true,
|
|
27211
|
+
"supports_tool_choice": true,
|
|
27212
|
+
"supports_vision": true
|
|
27213
|
+
},
|
|
27214
|
+
"azure/global/gpt-5.1-codex": {
|
|
27215
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
27216
|
+
"input_cost_per_token": 1.25e-06,
|
|
27217
|
+
"litellm_provider": "azure",
|
|
27218
|
+
"max_input_tokens": 272000,
|
|
27219
|
+
"max_output_tokens": 128000,
|
|
27220
|
+
"max_tokens": 128000,
|
|
27221
|
+
"mode": "responses",
|
|
27222
|
+
"output_cost_per_token": 1e-05,
|
|
27223
|
+
"supported_endpoints": [
|
|
27224
|
+
"/v1/responses"
|
|
27225
|
+
],
|
|
27226
|
+
"supported_modalities": [
|
|
27227
|
+
"text",
|
|
27228
|
+
"image"
|
|
27229
|
+
],
|
|
27230
|
+
"supported_output_modalities": [
|
|
27231
|
+
"text"
|
|
27232
|
+
],
|
|
27233
|
+
"supports_function_calling": true,
|
|
27234
|
+
"supports_native_streaming": true,
|
|
27235
|
+
"supports_parallel_function_calling": true,
|
|
27236
|
+
"supports_pdf_input": true,
|
|
27237
|
+
"supports_prompt_caching": true,
|
|
27238
|
+
"supports_reasoning": true,
|
|
27239
|
+
"supports_response_schema": true,
|
|
27240
|
+
"supports_system_messages": false,
|
|
27241
|
+
"supports_tool_choice": true,
|
|
27242
|
+
"supports_vision": true
|
|
27243
|
+
},
|
|
27244
|
+
"azure/global/gpt-5.1-codex-mini": {
|
|
27245
|
+
"cache_read_input_token_cost": 2.5e-08,
|
|
27246
|
+
"input_cost_per_token": 2.5e-07,
|
|
27247
|
+
"litellm_provider": "azure",
|
|
27248
|
+
"max_input_tokens": 272000,
|
|
27249
|
+
"max_output_tokens": 128000,
|
|
27250
|
+
"max_tokens": 128000,
|
|
27251
|
+
"mode": "responses",
|
|
27252
|
+
"output_cost_per_token": 2e-06,
|
|
27253
|
+
"supported_endpoints": [
|
|
27254
|
+
"/v1/responses"
|
|
27255
|
+
],
|
|
27256
|
+
"supported_modalities": [
|
|
27257
|
+
"text",
|
|
27258
|
+
"image"
|
|
27259
|
+
],
|
|
27260
|
+
"supported_output_modalities": [
|
|
27261
|
+
"text"
|
|
27262
|
+
],
|
|
27263
|
+
"supports_function_calling": true,
|
|
27264
|
+
"supports_native_streaming": true,
|
|
27265
|
+
"supports_parallel_function_calling": true,
|
|
27266
|
+
"supports_pdf_input": true,
|
|
27267
|
+
"supports_prompt_caching": true,
|
|
27268
|
+
"supports_reasoning": true,
|
|
27269
|
+
"supports_response_schema": true,
|
|
27270
|
+
"supports_system_messages": false,
|
|
27271
|
+
"supports_tool_choice": true,
|
|
27272
|
+
"supports_vision": true
|
|
27273
|
+
},
|
|
27274
|
+
"azure/gpt-5.1": {
|
|
27275
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
27276
|
+
"input_cost_per_token": 1.25e-06,
|
|
27277
|
+
"litellm_provider": "azure",
|
|
27278
|
+
"max_input_tokens": 272000,
|
|
27279
|
+
"max_output_tokens": 128000,
|
|
27280
|
+
"max_tokens": 128000,
|
|
27281
|
+
"mode": "chat",
|
|
27282
|
+
"output_cost_per_token": 1e-05,
|
|
27283
|
+
"supported_endpoints": [
|
|
27284
|
+
"/v1/chat/completions",
|
|
27285
|
+
"/v1/batch",
|
|
27286
|
+
"/v1/responses"
|
|
27287
|
+
],
|
|
27288
|
+
"supported_modalities": [
|
|
27289
|
+
"text",
|
|
27290
|
+
"image"
|
|
27291
|
+
],
|
|
27292
|
+
"supported_output_modalities": [
|
|
27293
|
+
"text",
|
|
27294
|
+
"image"
|
|
27295
|
+
],
|
|
27296
|
+
"supports_function_calling": true,
|
|
27297
|
+
"supports_native_streaming": true,
|
|
27298
|
+
"supports_parallel_function_calling": true,
|
|
27299
|
+
"supports_pdf_input": true,
|
|
27300
|
+
"supports_prompt_caching": true,
|
|
27301
|
+
"supports_reasoning": true,
|
|
27302
|
+
"supports_response_schema": true,
|
|
27303
|
+
"supports_system_messages": true,
|
|
27304
|
+
"supports_tool_choice": true,
|
|
27305
|
+
"supports_vision": true
|
|
27306
|
+
},
|
|
27307
|
+
"azure/gpt-5.1-chat": {
|
|
27308
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
27309
|
+
"input_cost_per_token": 1.25e-06,
|
|
27310
|
+
"litellm_provider": "azure",
|
|
27311
|
+
"max_input_tokens": 272000,
|
|
27312
|
+
"max_output_tokens": 128000,
|
|
27313
|
+
"max_tokens": 128000,
|
|
27314
|
+
"mode": "chat",
|
|
27315
|
+
"output_cost_per_token": 1e-05,
|
|
27316
|
+
"supported_endpoints": [
|
|
27317
|
+
"/v1/chat/completions",
|
|
27318
|
+
"/v1/batch",
|
|
27319
|
+
"/v1/responses"
|
|
27320
|
+
],
|
|
27321
|
+
"supported_modalities": [
|
|
27322
|
+
"text",
|
|
27323
|
+
"image"
|
|
27324
|
+
],
|
|
27325
|
+
"supported_output_modalities": [
|
|
27326
|
+
"text",
|
|
27327
|
+
"image"
|
|
27328
|
+
],
|
|
27329
|
+
"supports_function_calling": true,
|
|
27330
|
+
"supports_native_streaming": true,
|
|
27331
|
+
"supports_parallel_function_calling": true,
|
|
27332
|
+
"supports_pdf_input": true,
|
|
27333
|
+
"supports_prompt_caching": true,
|
|
27334
|
+
"supports_reasoning": true,
|
|
27335
|
+
"supports_response_schema": true,
|
|
27336
|
+
"supports_system_messages": true,
|
|
27337
|
+
"supports_tool_choice": true,
|
|
27338
|
+
"supports_vision": true
|
|
27339
|
+
},
|
|
27340
|
+
"azure/gpt-5.1-codex": {
|
|
27341
|
+
"cache_read_input_token_cost": 1.25e-07,
|
|
27342
|
+
"input_cost_per_token": 1.25e-06,
|
|
27343
|
+
"litellm_provider": "azure",
|
|
27344
|
+
"max_input_tokens": 272000,
|
|
27345
|
+
"max_output_tokens": 128000,
|
|
27346
|
+
"max_tokens": 128000,
|
|
27347
|
+
"mode": "responses",
|
|
27348
|
+
"output_cost_per_token": 1e-05,
|
|
27349
|
+
"supported_endpoints": [
|
|
27350
|
+
"/v1/responses"
|
|
27351
|
+
],
|
|
27352
|
+
"supported_modalities": [
|
|
27353
|
+
"text",
|
|
27354
|
+
"image"
|
|
27355
|
+
],
|
|
27356
|
+
"supported_output_modalities": [
|
|
27357
|
+
"text"
|
|
27358
|
+
],
|
|
27359
|
+
"supports_function_calling": true,
|
|
27360
|
+
"supports_native_streaming": true,
|
|
27361
|
+
"supports_parallel_function_calling": true,
|
|
27362
|
+
"supports_pdf_input": true,
|
|
27363
|
+
"supports_prompt_caching": true,
|
|
27364
|
+
"supports_reasoning": true,
|
|
27365
|
+
"supports_response_schema": true,
|
|
27366
|
+
"supports_system_messages": false,
|
|
27367
|
+
"supports_tool_choice": true,
|
|
27368
|
+
"supports_vision": true
|
|
27369
|
+
},
|
|
27370
|
+
"azure/gpt-5.1-codex-mini": {
|
|
27371
|
+
"cache_read_input_token_cost": 2.5e-08,
|
|
27372
|
+
"input_cost_per_token": 2.5e-07,
|
|
27373
|
+
"litellm_provider": "azure",
|
|
27374
|
+
"max_input_tokens": 272000,
|
|
27375
|
+
"max_output_tokens": 128000,
|
|
27376
|
+
"max_tokens": 128000,
|
|
27377
|
+
"mode": "responses",
|
|
27378
|
+
"output_cost_per_token": 2e-06,
|
|
27379
|
+
"supported_endpoints": [
|
|
27380
|
+
"/v1/responses"
|
|
27381
|
+
],
|
|
27382
|
+
"supported_modalities": [
|
|
27383
|
+
"text",
|
|
27384
|
+
"image"
|
|
27385
|
+
],
|
|
27386
|
+
"supported_output_modalities": [
|
|
27387
|
+
"text"
|
|
27388
|
+
],
|
|
27389
|
+
"supports_function_calling": true,
|
|
27390
|
+
"supports_native_streaming": true,
|
|
27391
|
+
"supports_parallel_function_calling": true,
|
|
27392
|
+
"supports_pdf_input": true,
|
|
27393
|
+
"supports_prompt_caching": true,
|
|
27394
|
+
"supports_reasoning": true,
|
|
27395
|
+
"supports_response_schema": true,
|
|
27396
|
+
"supports_system_messages": false,
|
|
27397
|
+
"supports_tool_choice": true,
|
|
27398
|
+
"supports_vision": true
|
|
27399
|
+
},
|
|
27400
|
+
"azure/us/gpt-5.1": {
|
|
27401
|
+
"cache_read_input_token_cost": 1.4e-07,
|
|
27402
|
+
"input_cost_per_token": 1.38e-06,
|
|
27403
|
+
"litellm_provider": "azure",
|
|
27404
|
+
"max_input_tokens": 272000,
|
|
27405
|
+
"max_output_tokens": 128000,
|
|
27406
|
+
"max_tokens": 128000,
|
|
27407
|
+
"mode": "chat",
|
|
27408
|
+
"output_cost_per_token": 1.1e-05,
|
|
27409
|
+
"supported_endpoints": [
|
|
27410
|
+
"/v1/chat/completions",
|
|
27411
|
+
"/v1/batch",
|
|
27412
|
+
"/v1/responses"
|
|
27413
|
+
],
|
|
27414
|
+
"supported_modalities": [
|
|
27415
|
+
"text",
|
|
27416
|
+
"image"
|
|
27417
|
+
],
|
|
27418
|
+
"supported_output_modalities": [
|
|
27419
|
+
"text",
|
|
27420
|
+
"image"
|
|
27421
|
+
],
|
|
27422
|
+
"supports_function_calling": true,
|
|
27423
|
+
"supports_native_streaming": true,
|
|
27424
|
+
"supports_parallel_function_calling": true,
|
|
27425
|
+
"supports_pdf_input": true,
|
|
27426
|
+
"supports_prompt_caching": true,
|
|
27427
|
+
"supports_reasoning": true,
|
|
27428
|
+
"supports_response_schema": true,
|
|
27429
|
+
"supports_system_messages": true,
|
|
27430
|
+
"supports_tool_choice": true,
|
|
27431
|
+
"supports_vision": true
|
|
27432
|
+
},
|
|
27433
|
+
"azure/us/gpt-5.1-chat": {
|
|
27434
|
+
"cache_read_input_token_cost": 1.4e-07,
|
|
27435
|
+
"input_cost_per_token": 1.38e-06,
|
|
27436
|
+
"litellm_provider": "azure",
|
|
27437
|
+
"max_input_tokens": 272000,
|
|
27438
|
+
"max_output_tokens": 128000,
|
|
27439
|
+
"max_tokens": 128000,
|
|
27440
|
+
"mode": "chat",
|
|
27441
|
+
"output_cost_per_token": 1.1e-05,
|
|
27442
|
+
"supported_endpoints": [
|
|
27443
|
+
"/v1/chat/completions",
|
|
27444
|
+
"/v1/batch",
|
|
27445
|
+
"/v1/responses"
|
|
27446
|
+
],
|
|
27447
|
+
"supported_modalities": [
|
|
27448
|
+
"text",
|
|
27449
|
+
"image"
|
|
27450
|
+
],
|
|
27451
|
+
"supported_output_modalities": [
|
|
27452
|
+
"text",
|
|
27453
|
+
"image"
|
|
27454
|
+
],
|
|
27455
|
+
"supports_function_calling": true,
|
|
27456
|
+
"supports_native_streaming": true,
|
|
27457
|
+
"supports_parallel_function_calling": true,
|
|
27458
|
+
"supports_pdf_input": true,
|
|
27459
|
+
"supports_prompt_caching": true,
|
|
27460
|
+
"supports_reasoning": true,
|
|
27461
|
+
"supports_response_schema": true,
|
|
27462
|
+
"supports_system_messages": true,
|
|
27463
|
+
"supports_tool_choice": true,
|
|
27464
|
+
"supports_vision": true
|
|
27465
|
+
},
|
|
27466
|
+
"azure/us/gpt-5.1-codex": {
|
|
27467
|
+
"cache_read_input_token_cost": 1.4e-07,
|
|
27468
|
+
"input_cost_per_token": 1.38e-06,
|
|
27469
|
+
"litellm_provider": "azure",
|
|
27470
|
+
"max_input_tokens": 272000,
|
|
27471
|
+
"max_output_tokens": 128000,
|
|
27472
|
+
"max_tokens": 128000,
|
|
27473
|
+
"mode": "responses",
|
|
27474
|
+
"output_cost_per_token": 1.1e-05,
|
|
27475
|
+
"supported_endpoints": [
|
|
27476
|
+
"/v1/responses"
|
|
27477
|
+
],
|
|
27478
|
+
"supported_modalities": [
|
|
27479
|
+
"text",
|
|
27480
|
+
"image"
|
|
27481
|
+
],
|
|
27482
|
+
"supported_output_modalities": [
|
|
27483
|
+
"text"
|
|
27484
|
+
],
|
|
27485
|
+
"supports_function_calling": true,
|
|
27486
|
+
"supports_native_streaming": true,
|
|
27487
|
+
"supports_parallel_function_calling": true,
|
|
27488
|
+
"supports_pdf_input": true,
|
|
27489
|
+
"supports_prompt_caching": true,
|
|
27490
|
+
"supports_reasoning": true,
|
|
27491
|
+
"supports_response_schema": true,
|
|
27492
|
+
"supports_system_messages": false,
|
|
27493
|
+
"supports_tool_choice": true,
|
|
27494
|
+
"supports_vision": true
|
|
27495
|
+
},
|
|
27496
|
+
"azure/us/gpt-5.1-codex-mini": {
|
|
27497
|
+
"cache_read_input_token_cost": 2.8e-08,
|
|
27498
|
+
"input_cost_per_token": 2.75e-07,
|
|
27499
|
+
"litellm_provider": "azure",
|
|
27500
|
+
"max_input_tokens": 272000,
|
|
27501
|
+
"max_output_tokens": 128000,
|
|
27502
|
+
"max_tokens": 128000,
|
|
27503
|
+
"mode": "responses",
|
|
27504
|
+
"output_cost_per_token": 2.2e-06,
|
|
27505
|
+
"supported_endpoints": [
|
|
27506
|
+
"/v1/responses"
|
|
27507
|
+
],
|
|
27508
|
+
"supported_modalities": [
|
|
27509
|
+
"text",
|
|
27510
|
+
"image"
|
|
27511
|
+
],
|
|
27512
|
+
"supported_output_modalities": [
|
|
27513
|
+
"text"
|
|
27514
|
+
],
|
|
27515
|
+
"supports_function_calling": true,
|
|
27516
|
+
"supports_native_streaming": true,
|
|
27517
|
+
"supports_parallel_function_calling": true,
|
|
27518
|
+
"supports_pdf_input": true,
|
|
27519
|
+
"supports_prompt_caching": true,
|
|
27520
|
+
"supports_reasoning": true,
|
|
27521
|
+
"supports_response_schema": true,
|
|
27522
|
+
"supports_system_messages": false,
|
|
27523
|
+
"supports_tool_choice": true,
|
|
27524
|
+
"supports_vision": true
|
|
27525
|
+
},
|
|
27526
|
+
"vertex_ai/gemini-3-pro-preview": {
|
|
27527
|
+
"cache_read_input_token_cost": 2e-07,
|
|
27528
|
+
"cache_read_input_token_cost_above_200k_tokens": 4e-07,
|
|
27529
|
+
"cache_creation_input_token_cost_above_200k_tokens": 2.5e-07,
|
|
27530
|
+
"input_cost_per_token": 2e-06,
|
|
27531
|
+
"input_cost_per_token_above_200k_tokens": 4e-06,
|
|
27532
|
+
"input_cost_per_token_batches": 1e-06,
|
|
27533
|
+
"litellm_provider": "vertex_ai",
|
|
27534
|
+
"max_audio_length_hours": 8.4,
|
|
27535
|
+
"max_audio_per_prompt": 1,
|
|
27536
|
+
"max_images_per_prompt": 3000,
|
|
27537
|
+
"max_input_tokens": 1048576,
|
|
27538
|
+
"max_output_tokens": 65535,
|
|
27539
|
+
"max_pdf_size_mb": 30,
|
|
27540
|
+
"max_tokens": 65535,
|
|
27541
|
+
"max_video_length": 1,
|
|
27542
|
+
"max_videos_per_prompt": 10,
|
|
27543
|
+
"mode": "chat",
|
|
27544
|
+
"output_cost_per_token": 1.2e-05,
|
|
27545
|
+
"output_cost_per_token_above_200k_tokens": 1.8e-05,
|
|
27546
|
+
"output_cost_per_token_batches": 6e-06,
|
|
27547
|
+
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
|
|
27548
|
+
"supported_endpoints": [
|
|
27549
|
+
"/v1/chat/completions",
|
|
27550
|
+
"/v1/completions",
|
|
27551
|
+
"/v1/batch"
|
|
27552
|
+
],
|
|
27553
|
+
"supported_modalities": [
|
|
27554
|
+
"text",
|
|
27555
|
+
"image",
|
|
27556
|
+
"audio",
|
|
27557
|
+
"video"
|
|
27558
|
+
],
|
|
27559
|
+
"supported_output_modalities": [
|
|
27560
|
+
"text"
|
|
27561
|
+
],
|
|
27562
|
+
"supports_audio_input": true,
|
|
27563
|
+
"supports_function_calling": true,
|
|
27564
|
+
"supports_pdf_input": true,
|
|
27565
|
+
"supports_prompt_caching": true,
|
|
27566
|
+
"supports_reasoning": true,
|
|
27567
|
+
"supports_response_schema": true,
|
|
27568
|
+
"supports_system_messages": true,
|
|
27569
|
+
"supports_tool_choice": true,
|
|
27570
|
+
"supports_video_input": true,
|
|
27571
|
+
"supports_vision": true,
|
|
27572
|
+
"supports_web_search": true
|
|
27573
|
+
},
|
|
27574
|
+
"vertex_ai/gemini-2.5-flash-image": {
|
|
27575
|
+
"cache_read_input_token_cost": 3e-08,
|
|
27576
|
+
"input_cost_per_audio_token": 1e-06,
|
|
27577
|
+
"input_cost_per_token": 3e-07,
|
|
27578
|
+
"litellm_provider": "vertex_ai-language-models",
|
|
27579
|
+
"max_audio_length_hours": 8.4,
|
|
27580
|
+
"max_audio_per_prompt": 1,
|
|
27581
|
+
"max_images_per_prompt": 3000,
|
|
27582
|
+
"max_input_tokens": 32768,
|
|
27583
|
+
"max_output_tokens": 32768,
|
|
27584
|
+
"max_tokens": 32768,
|
|
27585
|
+
"max_pdf_size_mb": 30,
|
|
27586
|
+
"max_video_length": 1,
|
|
27587
|
+
"max_videos_per_prompt": 10,
|
|
27588
|
+
"mode": "image_generation",
|
|
27589
|
+
"output_cost_per_image": 0.039,
|
|
27590
|
+
"output_cost_per_reasoning_token": 2.5e-06,
|
|
27591
|
+
"output_cost_per_token": 2.5e-06,
|
|
27592
|
+
"rpm": 100000,
|
|
27593
|
+
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/multimodal/image-generation#edit-an-image",
|
|
27594
|
+
"supported_endpoints": [
|
|
27595
|
+
"/v1/chat/completions",
|
|
27596
|
+
"/v1/completions",
|
|
27597
|
+
"/v1/batch"
|
|
27598
|
+
],
|
|
27599
|
+
"supported_modalities": [
|
|
27600
|
+
"text",
|
|
27601
|
+
"image",
|
|
27602
|
+
"audio",
|
|
27603
|
+
"video"
|
|
27604
|
+
],
|
|
27605
|
+
"supported_output_modalities": [
|
|
27606
|
+
"text",
|
|
27607
|
+
"image"
|
|
27608
|
+
],
|
|
27609
|
+
"supports_audio_output": false,
|
|
27610
|
+
"supports_function_calling": true,
|
|
27611
|
+
"supports_parallel_function_calling": true,
|
|
27612
|
+
"supports_pdf_input": true,
|
|
27613
|
+
"supports_prompt_caching": true,
|
|
27614
|
+
"supports_response_schema": true,
|
|
27615
|
+
"supports_system_messages": true,
|
|
27616
|
+
"supports_tool_choice": true,
|
|
27617
|
+
"supports_url_context": true,
|
|
27618
|
+
"supports_vision": true,
|
|
27619
|
+
"supports_web_search": false,
|
|
27620
|
+
"tpm": 8000000
|
|
27621
|
+
},
|
|
27622
|
+
"vertex_ai/imagen-3.0-capability-001": {
|
|
27623
|
+
"litellm_provider": "vertex_ai-image-models",
|
|
27624
|
+
"mode": "image_generation",
|
|
27625
|
+
"output_cost_per_image": 0.04,
|
|
27626
|
+
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/image/edit-insert-objects"
|
|
27627
|
+
},
|
|
27628
|
+
"cerebras/gpt-oss-120b": {
|
|
27629
|
+
"input_cost_per_token": 2.5e-07,
|
|
27630
|
+
"litellm_provider": "cerebras",
|
|
27631
|
+
"max_input_tokens": 131072,
|
|
27632
|
+
"max_output_tokens": 32768,
|
|
27633
|
+
"max_tokens": 32768,
|
|
27634
|
+
"mode": "chat",
|
|
27635
|
+
"output_cost_per_token": 6.9e-07,
|
|
27636
|
+
"source": "https://www.cerebras.ai/blog/openai-gpt-oss-120b-runs-fastest-on-cerebras",
|
|
27637
|
+
"supports_function_calling": true,
|
|
27638
|
+
"supports_parallel_function_calling": true,
|
|
27639
|
+
"supports_reasoning": true,
|
|
27640
|
+
"supports_response_schema": true,
|
|
27641
|
+
"supports_tool_choice": true
|
|
27642
|
+
},
|
|
27643
|
+
"gemini-3-pro-image-preview": {
|
|
27644
|
+
"input_cost_per_image": 0.0011,
|
|
27645
|
+
"input_cost_per_token": 2e-06,
|
|
27646
|
+
"input_cost_per_token_batches": 1e-06,
|
|
27647
|
+
"litellm_provider": "vertex_ai-language-models",
|
|
27648
|
+
"max_input_tokens": 65536,
|
|
27649
|
+
"max_output_tokens": 32768,
|
|
27650
|
+
"max_tokens": 65536,
|
|
27651
|
+
"mode": "image_generation",
|
|
27652
|
+
"output_cost_per_image": 0.134,
|
|
27653
|
+
"output_cost_per_token": 1.2e-05,
|
|
27654
|
+
"output_cost_per_token_batches": 6e-06,
|
|
27655
|
+
"source": "https://ai.google.dev/gemini-api/docs/pricing",
|
|
27656
|
+
"supported_endpoints": [
|
|
27657
|
+
"/v1/chat/completions",
|
|
27658
|
+
"/v1/completions",
|
|
27659
|
+
"/v1/batch"
|
|
27660
|
+
],
|
|
27661
|
+
"supported_modalities": [
|
|
27662
|
+
"text",
|
|
27663
|
+
"image"
|
|
27664
|
+
],
|
|
27665
|
+
"supported_output_modalities": [
|
|
27666
|
+
"text",
|
|
27667
|
+
"image"
|
|
27668
|
+
],
|
|
27669
|
+
"supports_function_calling": false,
|
|
27670
|
+
"supports_prompt_caching": true,
|
|
27671
|
+
"supports_response_schema": true,
|
|
27672
|
+
"supports_system_messages": true,
|
|
27673
|
+
"supports_vision": true,
|
|
27674
|
+
"supports_web_search": true
|
|
27675
|
+
},
|
|
27676
|
+
"gemini/gemini-3-pro-image-preview": {
|
|
27677
|
+
"input_cost_per_image": 0.0011,
|
|
27678
|
+
"input_cost_per_token": 2e-06,
|
|
27679
|
+
"input_cost_per_token_batches": 1e-06,
|
|
27680
|
+
"litellm_provider": "gemini",
|
|
27681
|
+
"max_input_tokens": 65536,
|
|
27682
|
+
"max_output_tokens": 32768,
|
|
27683
|
+
"max_tokens": 65536,
|
|
27684
|
+
"mode": "image_generation",
|
|
27685
|
+
"output_cost_per_image": 0.134,
|
|
27686
|
+
"output_cost_per_token": 1.2e-05,
|
|
27687
|
+
"rpm": 1000,
|
|
27688
|
+
"tpm": 4000000,
|
|
27689
|
+
"output_cost_per_token_batches": 6e-06,
|
|
27690
|
+
"source": "https://ai.google.dev/gemini-api/docs/pricing",
|
|
27691
|
+
"supported_endpoints": [
|
|
27692
|
+
"/v1/chat/completions",
|
|
27693
|
+
"/v1/completions",
|
|
27694
|
+
"/v1/batch"
|
|
27695
|
+
],
|
|
27696
|
+
"supported_modalities": [
|
|
27697
|
+
"text",
|
|
27698
|
+
"image"
|
|
27699
|
+
],
|
|
27700
|
+
"supported_output_modalities": [
|
|
27701
|
+
"text",
|
|
27702
|
+
"image"
|
|
27703
|
+
],
|
|
27704
|
+
"supports_function_calling": false,
|
|
27705
|
+
"supports_prompt_caching": true,
|
|
27706
|
+
"supports_response_schema": true,
|
|
27707
|
+
"supports_system_messages": true,
|
|
27708
|
+
"supports_vision": true,
|
|
27709
|
+
"supports_web_search": true
|
|
27710
|
+
},
|
|
27711
|
+
"openrouter/google/gemini-3-pro-preview": {
|
|
27712
|
+
"cache_read_input_token_cost": 2e-07,
|
|
27713
|
+
"cache_read_input_token_cost_above_200k_tokens": 4e-07,
|
|
27714
|
+
"cache_creation_input_token_cost_above_200k_tokens": 2.5e-07,
|
|
27715
|
+
"input_cost_per_token": 2e-06,
|
|
27716
|
+
"input_cost_per_token_above_200k_tokens": 4e-06,
|
|
27717
|
+
"input_cost_per_token_batches": 1e-06,
|
|
27718
|
+
"litellm_provider": "openrouter",
|
|
27719
|
+
"max_audio_length_hours": 8.4,
|
|
27720
|
+
"max_audio_per_prompt": 1,
|
|
27721
|
+
"max_images_per_prompt": 3000,
|
|
27722
|
+
"max_input_tokens": 1048576,
|
|
27723
|
+
"max_output_tokens": 65535,
|
|
27724
|
+
"max_pdf_size_mb": 30,
|
|
27725
|
+
"max_tokens": 65535,
|
|
27726
|
+
"max_video_length": 1,
|
|
27727
|
+
"max_videos_per_prompt": 10,
|
|
27728
|
+
"mode": "chat",
|
|
27729
|
+
"output_cost_per_token": 1.2e-05,
|
|
27730
|
+
"output_cost_per_token_above_200k_tokens": 1.8e-05,
|
|
27731
|
+
"output_cost_per_token_batches": 6e-06,
|
|
27732
|
+
"supported_endpoints": [
|
|
27733
|
+
"/v1/chat/completions",
|
|
27734
|
+
"/v1/completions",
|
|
27735
|
+
"/v1/batch"
|
|
27736
|
+
],
|
|
27737
|
+
"supported_modalities": [
|
|
27738
|
+
"text",
|
|
27739
|
+
"image",
|
|
27740
|
+
"audio",
|
|
27741
|
+
"video"
|
|
27742
|
+
],
|
|
27743
|
+
"supported_output_modalities": [
|
|
27744
|
+
"text"
|
|
27745
|
+
],
|
|
27746
|
+
"supports_audio_input": true,
|
|
27747
|
+
"supports_function_calling": true,
|
|
27748
|
+
"supports_pdf_input": true,
|
|
27749
|
+
"supports_prompt_caching": true,
|
|
27750
|
+
"supports_reasoning": true,
|
|
27751
|
+
"supports_response_schema": true,
|
|
27752
|
+
"supports_system_messages": true,
|
|
27753
|
+
"supports_tool_choice": true,
|
|
27754
|
+
"supports_video_input": true,
|
|
27755
|
+
"supports_vision": true,
|
|
27756
|
+
"supports_web_search": true
|
|
27757
|
+
},
|
|
27758
|
+
"together_ai/zai-org/GLM-4.6": {
|
|
27759
|
+
"input_cost_per_token": 6e-07,
|
|
27760
|
+
"litellm_provider": "together_ai",
|
|
27761
|
+
"max_input_tokens": 200000,
|
|
27762
|
+
"max_output_tokens": 200000,
|
|
27763
|
+
"max_tokens": 200000,
|
|
27764
|
+
"mode": "chat",
|
|
27765
|
+
"output_cost_per_token": 2.2e-06,
|
|
27766
|
+
"source": "https://www.together.ai/models/glm-4-6",
|
|
27767
|
+
"supports_function_calling": true,
|
|
27768
|
+
"supports_parallel_function_calling": true,
|
|
27769
|
+
"supports_reasoning": true,
|
|
27770
|
+
"supports_tool_choice": true
|
|
27771
|
+
},
|
|
27772
|
+
"vertex_ai/gemini-3-pro-image-preview": {
|
|
27773
|
+
"input_cost_per_image": 0.0011,
|
|
27774
|
+
"input_cost_per_token": 2e-06,
|
|
27775
|
+
"input_cost_per_token_batches": 1e-06,
|
|
27776
|
+
"litellm_provider": "vertex_ai-language-models",
|
|
27777
|
+
"max_input_tokens": 65536,
|
|
27778
|
+
"max_output_tokens": 32768,
|
|
27779
|
+
"max_tokens": 65536,
|
|
27780
|
+
"mode": "image_generation",
|
|
27781
|
+
"output_cost_per_image": 0.134,
|
|
27782
|
+
"output_cost_per_token": 1.2e-05,
|
|
27783
|
+
"output_cost_per_token_batches": 6e-06,
|
|
27784
|
+
"source": "https://docs.cloud.google.com/vertex-ai/generative-ai/docs/models/gemini/3-pro-image"
|
|
27785
|
+
},
|
|
27786
|
+
"xai/grok-4-1-fast": {
|
|
27787
|
+
"cache_read_input_token_cost": 5e-08,
|
|
27788
|
+
"input_cost_per_token": 2e-07,
|
|
27789
|
+
"input_cost_per_token_above_128k_tokens": 4e-07,
|
|
27790
|
+
"litellm_provider": "xai",
|
|
27791
|
+
"max_input_tokens": 2000000.0,
|
|
27792
|
+
"max_output_tokens": 2000000.0,
|
|
27793
|
+
"max_tokens": 2000000.0,
|
|
27794
|
+
"mode": "chat",
|
|
27795
|
+
"output_cost_per_token": 5e-07,
|
|
27796
|
+
"output_cost_per_token_above_128k_tokens": 1e-06,
|
|
27797
|
+
"source": "https://docs.x.ai/docs/models/grok-4-1-fast-reasoning",
|
|
27798
|
+
"supports_audio_input": true,
|
|
27799
|
+
"supports_function_calling": true,
|
|
27800
|
+
"supports_reasoning": true,
|
|
27801
|
+
"supports_response_schema": true,
|
|
27802
|
+
"supports_tool_choice": true,
|
|
27803
|
+
"supports_vision": true,
|
|
27804
|
+
"supports_web_search": true
|
|
27805
|
+
},
|
|
27806
|
+
"xai/grok-4-1-fast-reasoning": {
|
|
27807
|
+
"cache_read_input_token_cost": 5e-08,
|
|
27808
|
+
"input_cost_per_token": 2e-07,
|
|
27809
|
+
"input_cost_per_token_above_128k_tokens": 4e-07,
|
|
27810
|
+
"litellm_provider": "xai",
|
|
27811
|
+
"max_input_tokens": 2000000.0,
|
|
27812
|
+
"max_output_tokens": 2000000.0,
|
|
27813
|
+
"max_tokens": 2000000.0,
|
|
27814
|
+
"mode": "chat",
|
|
27815
|
+
"output_cost_per_token": 5e-07,
|
|
27816
|
+
"output_cost_per_token_above_128k_tokens": 1e-06,
|
|
27817
|
+
"source": "https://docs.x.ai/docs/models/grok-4-1-fast-reasoning",
|
|
27818
|
+
"supports_audio_input": true,
|
|
27819
|
+
"supports_function_calling": true,
|
|
27820
|
+
"supports_reasoning": true,
|
|
27821
|
+
"supports_response_schema": true,
|
|
27822
|
+
"supports_tool_choice": true,
|
|
27823
|
+
"supports_vision": true,
|
|
27824
|
+
"supports_web_search": true
|
|
27825
|
+
},
|
|
27826
|
+
"xai/grok-4-1-fast-reasoning-latest": {
|
|
27827
|
+
"cache_read_input_token_cost": 5e-08,
|
|
27828
|
+
"input_cost_per_token": 2e-07,
|
|
27829
|
+
"input_cost_per_token_above_128k_tokens": 4e-07,
|
|
27830
|
+
"litellm_provider": "xai",
|
|
27831
|
+
"max_input_tokens": 2000000.0,
|
|
27832
|
+
"max_output_tokens": 2000000.0,
|
|
27833
|
+
"max_tokens": 2000000.0,
|
|
27834
|
+
"mode": "chat",
|
|
27835
|
+
"output_cost_per_token": 5e-07,
|
|
27836
|
+
"output_cost_per_token_above_128k_tokens": 1e-06,
|
|
27837
|
+
"source": "https://docs.x.ai/docs/models/grok-4-1-fast-reasoning",
|
|
27838
|
+
"supports_audio_input": true,
|
|
27839
|
+
"supports_function_calling": true,
|
|
27840
|
+
"supports_reasoning": true,
|
|
27841
|
+
"supports_response_schema": true,
|
|
27842
|
+
"supports_tool_choice": true,
|
|
27843
|
+
"supports_vision": true,
|
|
27844
|
+
"supports_web_search": true
|
|
27845
|
+
},
|
|
27846
|
+
"xai/grok-4-1-fast-non-reasoning": {
|
|
27847
|
+
"cache_read_input_token_cost": 5e-08,
|
|
27848
|
+
"input_cost_per_token": 2e-07,
|
|
27849
|
+
"input_cost_per_token_above_128k_tokens": 4e-07,
|
|
27850
|
+
"litellm_provider": "xai",
|
|
27851
|
+
"max_input_tokens": 2000000.0,
|
|
27852
|
+
"max_output_tokens": 2000000.0,
|
|
27853
|
+
"max_tokens": 2000000.0,
|
|
27854
|
+
"mode": "chat",
|
|
27855
|
+
"output_cost_per_token": 5e-07,
|
|
27856
|
+
"output_cost_per_token_above_128k_tokens": 1e-06,
|
|
27857
|
+
"source": "https://docs.x.ai/docs/models/grok-4-1-fast-non-reasoning",
|
|
27858
|
+
"supports_audio_input": true,
|
|
27859
|
+
"supports_function_calling": true,
|
|
27860
|
+
"supports_response_schema": true,
|
|
27861
|
+
"supports_tool_choice": true,
|
|
27862
|
+
"supports_vision": true,
|
|
27863
|
+
"supports_web_search": true
|
|
27864
|
+
},
|
|
27865
|
+
"xai/grok-4-1-fast-non-reasoning-latest": {
|
|
27866
|
+
"cache_read_input_token_cost": 5e-08,
|
|
27867
|
+
"input_cost_per_token": 2e-07,
|
|
27868
|
+
"input_cost_per_token_above_128k_tokens": 4e-07,
|
|
27869
|
+
"litellm_provider": "xai",
|
|
27870
|
+
"max_input_tokens": 2000000.0,
|
|
27871
|
+
"max_output_tokens": 2000000.0,
|
|
27872
|
+
"max_tokens": 2000000.0,
|
|
27873
|
+
"mode": "chat",
|
|
27874
|
+
"output_cost_per_token": 5e-07,
|
|
27875
|
+
"output_cost_per_token_above_128k_tokens": 1e-06,
|
|
27876
|
+
"source": "https://docs.x.ai/docs/models/grok-4-1-fast-non-reasoning",
|
|
27877
|
+
"supports_audio_input": true,
|
|
27878
|
+
"supports_function_calling": true,
|
|
27879
|
+
"supports_response_schema": true,
|
|
27880
|
+
"supports_tool_choice": true,
|
|
27881
|
+
"supports_vision": true,
|
|
27882
|
+
"supports_web_search": true
|
|
27883
|
+
},
|
|
27884
|
+
"anthropic.claude-sonnet-4-5-20250929-v1:0": {
|
|
27885
|
+
"cache_creation_input_token_cost": 3.75e-06,
|
|
27886
|
+
"cache_read_input_token_cost": 3e-07,
|
|
27887
|
+
"input_cost_per_token": 3e-06,
|
|
27888
|
+
"input_cost_per_token_above_200k_tokens": 6e-06,
|
|
27889
|
+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
|
|
27890
|
+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
|
|
27891
|
+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
|
|
27892
|
+
"litellm_provider": "bedrock_converse",
|
|
27893
|
+
"max_input_tokens": 200000,
|
|
27894
|
+
"max_output_tokens": 64000,
|
|
27895
|
+
"max_tokens": 64000,
|
|
27896
|
+
"mode": "chat",
|
|
27897
|
+
"output_cost_per_token": 1.5e-05,
|
|
27898
|
+
"search_context_cost_per_query": {
|
|
27899
|
+
"search_context_size_high": 0.01,
|
|
27900
|
+
"search_context_size_low": 0.01,
|
|
27901
|
+
"search_context_size_medium": 0.01
|
|
27902
|
+
},
|
|
27903
|
+
"supports_assistant_prefill": true,
|
|
27904
|
+
"supports_computer_use": true,
|
|
27905
|
+
"supports_function_calling": true,
|
|
27906
|
+
"supports_pdf_input": true,
|
|
27907
|
+
"supports_prompt_caching": true,
|
|
27908
|
+
"supports_reasoning": true,
|
|
27909
|
+
"supports_response_schema": true,
|
|
27910
|
+
"supports_tool_choice": true,
|
|
27911
|
+
"supports_vision": true,
|
|
27912
|
+
"tool_use_system_prompt_tokens": 159
|
|
27913
|
+
},
|
|
27914
|
+
"bedrock/us-gov-east-1/claude-sonnet-4-5-20250929-v1:0": {
|
|
27915
|
+
"input_cost_per_token": 3.3e-06,
|
|
27916
|
+
"litellm_provider": "bedrock",
|
|
27917
|
+
"max_input_tokens": 200000,
|
|
27918
|
+
"max_output_tokens": 4096,
|
|
27919
|
+
"max_tokens": 4096,
|
|
27920
|
+
"mode": "chat",
|
|
27921
|
+
"output_cost_per_token": 1.65e-05,
|
|
27922
|
+
"supports_assistant_prefill": true,
|
|
27923
|
+
"supports_computer_use": true,
|
|
27924
|
+
"supports_function_calling": true,
|
|
27925
|
+
"supports_pdf_input": true,
|
|
27926
|
+
"supports_prompt_caching": true,
|
|
27927
|
+
"supports_reasoning": true,
|
|
27928
|
+
"supports_response_schema": true,
|
|
27929
|
+
"supports_tool_choice": true,
|
|
27930
|
+
"supports_vision": true
|
|
27931
|
+
},
|
|
27932
|
+
"bedrock/us-gov-west-1/claude-sonnet-4-5-20250929-v1:0": {
|
|
27933
|
+
"input_cost_per_token": 3.3e-06,
|
|
27934
|
+
"litellm_provider": "bedrock",
|
|
27935
|
+
"max_input_tokens": 200000,
|
|
27936
|
+
"max_output_tokens": 4096,
|
|
27937
|
+
"max_tokens": 4096,
|
|
27938
|
+
"mode": "chat",
|
|
27939
|
+
"output_cost_per_token": 1.65e-05,
|
|
27940
|
+
"supports_assistant_prefill": true,
|
|
27941
|
+
"supports_computer_use": true,
|
|
27942
|
+
"supports_function_calling": true,
|
|
27943
|
+
"supports_pdf_input": true,
|
|
27944
|
+
"supports_prompt_caching": true,
|
|
27945
|
+
"supports_reasoning": true,
|
|
27946
|
+
"supports_response_schema": true,
|
|
27947
|
+
"supports_tool_choice": true,
|
|
27948
|
+
"supports_vision": true
|
|
27949
|
+
},
|
|
27950
|
+
"claude-sonnet-4-5-20250929-v1:0": {
|
|
27951
|
+
"cache_creation_input_token_cost": 3.75e-06,
|
|
27952
|
+
"cache_read_input_token_cost": 3e-07,
|
|
27953
|
+
"input_cost_per_token": 3e-06,
|
|
27954
|
+
"input_cost_per_token_above_200k_tokens": 6e-06,
|
|
27955
|
+
"output_cost_per_token_above_200k_tokens": 2.25e-05,
|
|
27956
|
+
"cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
|
|
27957
|
+
"cache_read_input_token_cost_above_200k_tokens": 6e-07,
|
|
27958
|
+
"litellm_provider": "bedrock",
|
|
27959
|
+
"max_input_tokens": 200000,
|
|
27960
|
+
"max_output_tokens": 64000,
|
|
27961
|
+
"max_tokens": 64000,
|
|
27962
|
+
"mode": "chat",
|
|
27963
|
+
"output_cost_per_token": 1.5e-05,
|
|
27964
|
+
"supports_assistant_prefill": true,
|
|
27965
|
+
"supports_computer_use": true,
|
|
27966
|
+
"supports_function_calling": true,
|
|
27967
|
+
"supports_pdf_input": true,
|
|
27968
|
+
"supports_prompt_caching": true,
|
|
27969
|
+
"supports_reasoning": true,
|
|
27970
|
+
"supports_response_schema": true,
|
|
27971
|
+
"supports_tool_choice": true,
|
|
27972
|
+
"supports_vision": true,
|
|
27973
|
+
"tool_use_system_prompt_tokens": 159
|
|
25712
27974
|
}
|
|
25713
27975
|
}
|