tokencostauto 0.1.333__py3-none-any.whl → 0.1.362__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -9266,6 +9266,7 @@
9266
9266
  "supports_function_calling": false,
9267
9267
  "supports_parallel_function_calling": true,
9268
9268
  "supports_prompt_caching": true,
9269
+ "supports_reasoning": true,
9269
9270
  "supports_response_schema": false,
9270
9271
  "supports_system_messages": true,
9271
9272
  "supports_tool_choice": true,
@@ -10442,6 +10443,7 @@
10442
10443
  "supports_audio_output": true,
10443
10444
  "supports_function_calling": true,
10444
10445
  "supports_prompt_caching": true,
10446
+ "supports_reasoning": true,
10445
10447
  "supports_response_schema": true,
10446
10448
  "supports_system_messages": true,
10447
10449
  "supports_tool_choice": true,
@@ -10473,7 +10475,7 @@
10473
10475
  "supports_audio_output": false,
10474
10476
  "supports_function_calling": true,
10475
10477
  "supports_response_schema": true,
10476
- "supports_system_messages": true,
10478
+ "supports_system_messages": false,
10477
10479
  "supports_tool_choice": true,
10478
10480
  "supports_vision": true
10479
10481
  },
@@ -11815,14 +11817,14 @@
11815
11817
  },
11816
11818
  "azure/o3-2025-04-16": {
11817
11819
  "deprecation_date": "2026-04-16",
11818
- "cache_read_input_token_cost": 2.5e-06,
11819
- "input_cost_per_token": 1e-05,
11820
+ "cache_read_input_token_cost": 5e-07,
11821
+ "input_cost_per_token": 2e-06,
11820
11822
  "litellm_provider": "azure",
11821
11823
  "max_input_tokens": 200000,
11822
11824
  "max_output_tokens": 100000,
11823
11825
  "max_tokens": 100000,
11824
11826
  "mode": "chat",
11825
- "output_cost_per_token": 4e-05,
11827
+ "output_cost_per_token": 8e-06,
11826
11828
  "supported_endpoints": [
11827
11829
  "/v1/chat/completions",
11828
11830
  "/v1/batch",
@@ -15602,7 +15604,7 @@
15602
15604
  "tool_use_system_prompt_tokens": 159
15603
15605
  },
15604
15606
  "gemini/gemini-2.5-flash": {
15605
- "cache_read_input_token_cost": 7.5e-08,
15607
+ "cache_read_input_token_cost": 3e-08,
15606
15608
  "input_cost_per_audio_token": 1e-06,
15607
15609
  "input_cost_per_token": 3e-07,
15608
15610
  "litellm_provider": "gemini",
@@ -17812,15 +17814,16 @@
17812
17814
  "supports_tool_choice": true
17813
17815
  },
17814
17816
  "openrouter/qwen/qwen3-coder": {
17815
- "input_cost_per_token": 1e-06,
17817
+ "input_cost_per_token": 2.2e-07,
17816
17818
  "litellm_provider": "openrouter",
17817
- "max_input_tokens": 1000000,
17818
- "max_output_tokens": 1000000,
17819
- "max_tokens": 1000000,
17819
+ "max_input_tokens": 262100,
17820
+ "max_output_tokens": 262100,
17821
+ "max_tokens": 262100,
17820
17822
  "mode": "chat",
17821
- "output_cost_per_token": 5e-06,
17823
+ "output_cost_per_token": 9.5e-07,
17822
17824
  "source": "https://openrouter.ai/qwen/qwen3-coder",
17823
- "supports_tool_choice": true
17825
+ "supports_tool_choice": true,
17826
+ "supports_function_calling": true
17824
17827
  },
17825
17828
  "gemini/imagen-4.0-generate-preview-06-06": {
17826
17829
  "output_cost_per_image": 0.04,
@@ -21714,7 +21717,7 @@
21714
21717
  "max_input_tokens": 1024,
21715
21718
  "max_tokens": 1024,
21716
21719
  "mode": "video_generation",
21717
- "output_cost_per_second": 0.75,
21720
+ "output_cost_per_second": 0.4,
21718
21721
  "source": "https://ai.google.dev/gemini-api/docs/video",
21719
21722
  "supported_modalities": [
21720
21723
  "text"
@@ -21728,7 +21731,7 @@
21728
21731
  "max_input_tokens": 1024,
21729
21732
  "max_tokens": 1024,
21730
21733
  "mode": "video_generation",
21731
- "output_cost_per_second": 0.4,
21734
+ "output_cost_per_second": 0.15,
21732
21735
  "source": "https://ai.google.dev/gemini-api/docs/video",
21733
21736
  "supported_modalities": [
21734
21737
  "text"
@@ -24519,58 +24522,67 @@
24519
24522
  "cache_creation_input_token_cost": 1.25e-06,
24520
24523
  "cache_read_input_token_cost": 1e-07,
24521
24524
  "input_cost_per_token": 1e-06,
24522
- "litellm_provider": "bedrock",
24525
+ "litellm_provider": "bedrock_converse",
24523
24526
  "max_input_tokens": 200000,
24524
- "max_output_tokens": 8192,
24525
- "max_tokens": 8192,
24527
+ "max_output_tokens": 64000,
24528
+ "max_tokens": 64000,
24526
24529
  "mode": "chat",
24527
24530
  "output_cost_per_token": 5e-06,
24528
24531
  "source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
24529
24532
  "supports_assistant_prefill": true,
24533
+ "supports_computer_use": true,
24530
24534
  "supports_function_calling": true,
24531
24535
  "supports_pdf_input": true,
24532
24536
  "supports_prompt_caching": true,
24533
24537
  "supports_reasoning": true,
24534
24538
  "supports_response_schema": true,
24535
- "supports_tool_choice": true
24539
+ "supports_tool_choice": true,
24540
+ "supports_vision": true,
24541
+ "tool_use_system_prompt_tokens": 346
24536
24542
  },
24537
24543
  "anthropic.claude-haiku-4-5@20251001": {
24538
24544
  "cache_creation_input_token_cost": 1.25e-06,
24539
24545
  "cache_read_input_token_cost": 1e-07,
24540
24546
  "input_cost_per_token": 1e-06,
24541
- "litellm_provider": "bedrock",
24547
+ "litellm_provider": "bedrock_converse",
24542
24548
  "max_input_tokens": 200000,
24543
- "max_output_tokens": 8192,
24544
- "max_tokens": 8192,
24549
+ "max_output_tokens": 64000,
24550
+ "max_tokens": 64000,
24545
24551
  "mode": "chat",
24546
24552
  "output_cost_per_token": 5e-06,
24547
24553
  "source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
24548
24554
  "supports_assistant_prefill": true,
24555
+ "supports_computer_use": true,
24549
24556
  "supports_function_calling": true,
24550
24557
  "supports_pdf_input": true,
24551
24558
  "supports_prompt_caching": true,
24552
24559
  "supports_reasoning": true,
24553
24560
  "supports_response_schema": true,
24554
- "supports_tool_choice": true
24561
+ "supports_tool_choice": true,
24562
+ "supports_vision": true,
24563
+ "tool_use_system_prompt_tokens": 346
24555
24564
  },
24556
24565
  "apac.anthropic.claude-haiku-4-5-20251001-v1:0": {
24557
24566
  "cache_creation_input_token_cost": 1.375e-06,
24558
24567
  "cache_read_input_token_cost": 1.1e-07,
24559
24568
  "input_cost_per_token": 1.1e-06,
24560
- "litellm_provider": "bedrock",
24569
+ "litellm_provider": "bedrock_converse",
24561
24570
  "max_input_tokens": 200000,
24562
- "max_output_tokens": 8192,
24563
- "max_tokens": 8192,
24571
+ "max_output_tokens": 64000,
24572
+ "max_tokens": 64000,
24564
24573
  "mode": "chat",
24565
24574
  "output_cost_per_token": 5.5e-06,
24566
24575
  "source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
24567
24576
  "supports_assistant_prefill": true,
24577
+ "supports_computer_use": true,
24568
24578
  "supports_function_calling": true,
24569
24579
  "supports_pdf_input": true,
24570
24580
  "supports_prompt_caching": true,
24571
24581
  "supports_reasoning": true,
24572
24582
  "supports_response_schema": true,
24573
- "supports_tool_choice": true
24583
+ "supports_tool_choice": true,
24584
+ "supports_vision": true,
24585
+ "tool_use_system_prompt_tokens": 346
24574
24586
  },
24575
24587
  "claude-haiku-4-5-20251001": {
24576
24588
  "cache_creation_input_token_cost": 1.25e-06,
@@ -24619,20 +24631,23 @@
24619
24631
  "cache_read_input_token_cost": 1.1e-07,
24620
24632
  "input_cost_per_token": 1.1e-06,
24621
24633
  "deprecation_date": "2026-10-15",
24622
- "litellm_provider": "bedrock",
24634
+ "litellm_provider": "bedrock_converse",
24623
24635
  "max_input_tokens": 200000,
24624
- "max_output_tokens": 8192,
24625
- "max_tokens": 8192,
24636
+ "max_output_tokens": 64000,
24637
+ "max_tokens": 64000,
24626
24638
  "mode": "chat",
24627
24639
  "output_cost_per_token": 5.5e-06,
24628
24640
  "source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
24629
24641
  "supports_assistant_prefill": true,
24642
+ "supports_computer_use": true,
24630
24643
  "supports_function_calling": true,
24631
24644
  "supports_pdf_input": true,
24632
24645
  "supports_prompt_caching": true,
24633
24646
  "supports_reasoning": true,
24634
24647
  "supports_response_schema": true,
24635
- "supports_tool_choice": true
24648
+ "supports_tool_choice": true,
24649
+ "supports_vision": true,
24650
+ "tool_use_system_prompt_tokens": 346
24636
24651
  },
24637
24652
  "gemini-2.5-flash-image": {
24638
24653
  "cache_read_input_token_cost": 3e-08,
@@ -24689,6 +24704,7 @@
24689
24704
  "litellm_provider": "vertex_ai-language-models",
24690
24705
  "max_audio_length_hours": 8.4,
24691
24706
  "max_audio_per_prompt": 1,
24707
+ "supports_reasoning": false,
24692
24708
  "max_images_per_prompt": 3000,
24693
24709
  "max_input_tokens": 32768,
24694
24710
  "max_output_tokens": 32768,
@@ -24782,39 +24798,45 @@
24782
24798
  "cache_creation_input_token_cost": 1.375e-06,
24783
24799
  "cache_read_input_token_cost": 1.1e-07,
24784
24800
  "input_cost_per_token": 1.1e-06,
24785
- "litellm_provider": "bedrock",
24801
+ "litellm_provider": "bedrock_converse",
24786
24802
  "max_input_tokens": 200000,
24787
- "max_output_tokens": 8192,
24788
- "max_tokens": 8192,
24803
+ "max_output_tokens": 64000,
24804
+ "max_tokens": 64000,
24789
24805
  "mode": "chat",
24790
24806
  "output_cost_per_token": 5.5e-06,
24791
24807
  "source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
24792
24808
  "supports_assistant_prefill": true,
24809
+ "supports_computer_use": true,
24793
24810
  "supports_function_calling": true,
24794
24811
  "supports_pdf_input": true,
24795
24812
  "supports_prompt_caching": true,
24796
24813
  "supports_reasoning": true,
24797
24814
  "supports_response_schema": true,
24798
- "supports_tool_choice": true
24815
+ "supports_tool_choice": true,
24816
+ "supports_vision": true,
24817
+ "tool_use_system_prompt_tokens": 346
24799
24818
  },
24800
24819
  "us.anthropic.claude-haiku-4-5-20251001-v1:0": {
24801
24820
  "cache_creation_input_token_cost": 1.375e-06,
24802
24821
  "cache_read_input_token_cost": 1.1e-07,
24803
24822
  "input_cost_per_token": 1.1e-06,
24804
- "litellm_provider": "bedrock",
24823
+ "litellm_provider": "bedrock_converse",
24805
24824
  "max_input_tokens": 200000,
24806
- "max_output_tokens": 8192,
24807
- "max_tokens": 8192,
24825
+ "max_output_tokens": 64000,
24826
+ "max_tokens": 64000,
24808
24827
  "mode": "chat",
24809
24828
  "output_cost_per_token": 5.5e-06,
24810
24829
  "source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
24811
24830
  "supports_assistant_prefill": true,
24831
+ "supports_computer_use": true,
24812
24832
  "supports_function_calling": true,
24813
24833
  "supports_pdf_input": true,
24814
24834
  "supports_prompt_caching": true,
24815
24835
  "supports_reasoning": true,
24816
24836
  "supports_response_schema": true,
24817
- "supports_tool_choice": true
24837
+ "supports_tool_choice": true,
24838
+ "supports_vision": true,
24839
+ "tool_use_system_prompt_tokens": 346
24818
24840
  },
24819
24841
  "vertex_ai/claude-haiku-4-5@20251001": {
24820
24842
  "cache_creation_input_token_cost": 1.25e-06,
@@ -24882,12 +24904,13 @@
24882
24904
  "input_cost_per_token": 1.1e-06,
24883
24905
  "litellm_provider": "bedrock_converse",
24884
24906
  "max_input_tokens": 200000,
24885
- "max_output_tokens": 8192,
24886
- "max_tokens": 8192,
24907
+ "max_output_tokens": 64000,
24908
+ "max_tokens": 64000,
24887
24909
  "mode": "chat",
24888
24910
  "output_cost_per_token": 5.5e-06,
24889
24911
  "source": "https://aws.amazon.com/about-aws/whats-new/2025/10/claude-4-5-haiku-anthropic-amazon-bedrock",
24890
24912
  "supports_assistant_prefill": true,
24913
+ "supports_computer_use": true,
24891
24914
  "supports_function_calling": true,
24892
24915
  "supports_pdf_input": true,
24893
24916
  "supports_prompt_caching": true,
@@ -24903,14 +24926,16 @@
24903
24926
  "input_cost_per_token": 1.1e-06,
24904
24927
  "litellm_provider": "bedrock_converse",
24905
24928
  "max_input_tokens": 200000,
24906
- "max_output_tokens": 8192,
24907
- "max_tokens": 8192,
24929
+ "max_output_tokens": 64000,
24930
+ "max_tokens": 64000,
24908
24931
  "mode": "chat",
24909
24932
  "output_cost_per_token": 5.5e-06,
24910
24933
  "supports_assistant_prefill": true,
24934
+ "supports_computer_use": true,
24911
24935
  "supports_function_calling": true,
24912
24936
  "supports_pdf_input": true,
24913
24937
  "supports_prompt_caching": true,
24938
+ "supports_reasoning": true,
24914
24939
  "supports_response_schema": true,
24915
24940
  "supports_tool_choice": true,
24916
24941
  "supports_vision": true,
@@ -25276,7 +25301,7 @@
25276
25301
  "fal_ai/fal-ai/flux-pro/v1.1-ultra": {
25277
25302
  "litellm_provider": "fal_ai",
25278
25303
  "mode": "image_generation",
25279
- "output_cost_per_image": 0.0398,
25304
+ "output_cost_per_image": 0.06,
25280
25305
  "supported_endpoints": [
25281
25306
  "/v1/images/generations"
25282
25307
  ]
@@ -25709,5 +25734,2242 @@
25709
25734
  "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models",
25710
25735
  "supports_function_calling": true,
25711
25736
  "supports_tool_choice": true
25737
+ },
25738
+ "cohere/embed-v4.0": {
25739
+ "input_cost_per_token": 1.2e-07,
25740
+ "litellm_provider": "cohere",
25741
+ "max_input_tokens": 128000,
25742
+ "max_tokens": 128000,
25743
+ "mode": "embedding",
25744
+ "output_cost_per_token": 0.0,
25745
+ "output_vector_size": 1536,
25746
+ "supports_embedding_image_input": true
25747
+ },
25748
+ "gemini/veo-3.1-fast-generate-preview": {
25749
+ "litellm_provider": "gemini",
25750
+ "max_input_tokens": 1024,
25751
+ "max_tokens": 1024,
25752
+ "mode": "video_generation",
25753
+ "output_cost_per_second": 0.15,
25754
+ "source": "https://ai.google.dev/gemini-api/docs/video",
25755
+ "supported_modalities": [
25756
+ "text"
25757
+ ],
25758
+ "supported_output_modalities": [
25759
+ "video"
25760
+ ]
25761
+ },
25762
+ "gemini/veo-3.1-generate-preview": {
25763
+ "litellm_provider": "gemini",
25764
+ "max_input_tokens": 1024,
25765
+ "max_tokens": 1024,
25766
+ "mode": "video_generation",
25767
+ "output_cost_per_second": 0.4,
25768
+ "source": "https://ai.google.dev/gemini-api/docs/video",
25769
+ "supported_modalities": [
25770
+ "text"
25771
+ ],
25772
+ "supported_output_modalities": [
25773
+ "video"
25774
+ ]
25775
+ },
25776
+ "vertex_ai/veo-3.1-generate-preview": {
25777
+ "litellm_provider": "vertex_ai-video-models",
25778
+ "max_input_tokens": 1024,
25779
+ "max_tokens": 1024,
25780
+ "mode": "video_generation",
25781
+ "output_cost_per_second": 0.4,
25782
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/model-reference/veo",
25783
+ "supported_modalities": [
25784
+ "text"
25785
+ ],
25786
+ "supported_output_modalities": [
25787
+ "video"
25788
+ ]
25789
+ },
25790
+ "vertex_ai/veo-3.1-fast-generate-preview": {
25791
+ "litellm_provider": "vertex_ai-video-models",
25792
+ "max_input_tokens": 1024,
25793
+ "max_tokens": 1024,
25794
+ "mode": "video_generation",
25795
+ "output_cost_per_second": 0.15,
25796
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/model-reference/veo",
25797
+ "supported_modalities": [
25798
+ "text"
25799
+ ],
25800
+ "supported_output_modalities": [
25801
+ "video"
25802
+ ]
25803
+ },
25804
+ "moonshot/kimi-k2-thinking": {
25805
+ "cache_read_input_token_cost": 1.5e-07,
25806
+ "input_cost_per_token": 6e-07,
25807
+ "litellm_provider": "moonshot",
25808
+ "max_input_tokens": 262144,
25809
+ "max_output_tokens": 262144,
25810
+ "max_tokens": 262144,
25811
+ "mode": "chat",
25812
+ "output_cost_per_token": 2.5e-06,
25813
+ "source": "https://platform.moonshot.ai/docs/pricing/chat#generation-model-kimi-k2",
25814
+ "supports_function_calling": true,
25815
+ "supports_tool_choice": true,
25816
+ "supports_web_search": true
25817
+ },
25818
+ "mistral/magistral-medium-2509": {
25819
+ "input_cost_per_token": 2e-06,
25820
+ "litellm_provider": "mistral",
25821
+ "max_input_tokens": 40000,
25822
+ "max_output_tokens": 40000,
25823
+ "max_tokens": 40000,
25824
+ "mode": "chat",
25825
+ "output_cost_per_token": 5e-06,
25826
+ "source": "https://mistral.ai/news/magistral",
25827
+ "supports_assistant_prefill": true,
25828
+ "supports_function_calling": true,
25829
+ "supports_reasoning": true,
25830
+ "supports_response_schema": true,
25831
+ "supports_tool_choice": true
25832
+ },
25833
+ "openrouter/deepseek/deepseek-v3.2-exp": {
25834
+ "input_cost_per_token": 2e-07,
25835
+ "input_cost_per_token_cache_hit": 2e-08,
25836
+ "litellm_provider": "openrouter",
25837
+ "max_input_tokens": 163840,
25838
+ "max_output_tokens": 163840,
25839
+ "max_tokens": 8192,
25840
+ "mode": "chat",
25841
+ "output_cost_per_token": 4e-07,
25842
+ "supports_assistant_prefill": true,
25843
+ "supports_function_calling": true,
25844
+ "supports_prompt_caching": true,
25845
+ "supports_reasoning": false,
25846
+ "supports_tool_choice": true
25847
+ },
25848
+ "openrouter/minimax/minimax-m2": {
25849
+ "input_cost_per_token": 2.55e-07,
25850
+ "litellm_provider": "openrouter",
25851
+ "max_input_tokens": 204800,
25852
+ "max_output_tokens": 204800,
25853
+ "max_tokens": 32768,
25854
+ "mode": "chat",
25855
+ "output_cost_per_token": 1.02e-06,
25856
+ "supports_function_calling": true,
25857
+ "supports_prompt_caching": false,
25858
+ "supports_reasoning": true,
25859
+ "supports_tool_choice": true
25860
+ },
25861
+ "openrouter/z-ai/glm-4.6": {
25862
+ "input_cost_per_token": 4e-07,
25863
+ "litellm_provider": "openrouter",
25864
+ "max_input_tokens": 202800,
25865
+ "max_output_tokens": 131000,
25866
+ "max_tokens": 202800,
25867
+ "mode": "chat",
25868
+ "output_cost_per_token": 1.75e-06,
25869
+ "source": "https://openrouter.ai/z-ai/glm-4.6",
25870
+ "supports_function_calling": true,
25871
+ "supports_reasoning": true,
25872
+ "supports_tool_choice": true
25873
+ },
25874
+ "openrouter/z-ai/glm-4.6:exacto": {
25875
+ "input_cost_per_token": 4.5e-07,
25876
+ "litellm_provider": "openrouter",
25877
+ "max_input_tokens": 202800,
25878
+ "max_output_tokens": 131000,
25879
+ "max_tokens": 202800,
25880
+ "mode": "chat",
25881
+ "output_cost_per_token": 1.9e-06,
25882
+ "source": "https://openrouter.ai/z-ai/glm-4.6:exacto",
25883
+ "supports_function_calling": true,
25884
+ "supports_reasoning": true,
25885
+ "supports_tool_choice": true
25886
+ },
25887
+ "runwayml/gen4_turbo": {
25888
+ "litellm_provider": "runwayml",
25889
+ "mode": "video_generation",
25890
+ "output_cost_per_video_per_second": 0.05,
25891
+ "source": "https://docs.dev.runwayml.com/guides/pricing/",
25892
+ "supported_modalities": [
25893
+ "text",
25894
+ "image"
25895
+ ],
25896
+ "supported_output_modalities": [
25897
+ "video"
25898
+ ],
25899
+ "supported_resolutions": [
25900
+ "1280x720",
25901
+ "720x1280"
25902
+ ],
25903
+ "metadata": {
25904
+ "comment": "5 credits per second @ $0.01 per credit = $0.05 per second"
25905
+ }
25906
+ },
25907
+ "runwayml/gen4_aleph": {
25908
+ "litellm_provider": "runwayml",
25909
+ "mode": "video_generation",
25910
+ "output_cost_per_video_per_second": 0.15,
25911
+ "source": "https://docs.dev.runwayml.com/guides/pricing/",
25912
+ "supported_modalities": [
25913
+ "text",
25914
+ "image"
25915
+ ],
25916
+ "supported_output_modalities": [
25917
+ "video"
25918
+ ],
25919
+ "supported_resolutions": [
25920
+ "1280x720",
25921
+ "720x1280"
25922
+ ],
25923
+ "metadata": {
25924
+ "comment": "15 credits per second @ $0.01 per credit = $0.15 per second"
25925
+ }
25926
+ },
25927
+ "runwayml/gen3a_turbo": {
25928
+ "litellm_provider": "runwayml",
25929
+ "mode": "video_generation",
25930
+ "output_cost_per_video_per_second": 0.05,
25931
+ "source": "https://docs.dev.runwayml.com/guides/pricing/",
25932
+ "supported_modalities": [
25933
+ "text",
25934
+ "image"
25935
+ ],
25936
+ "supported_output_modalities": [
25937
+ "video"
25938
+ ],
25939
+ "supported_resolutions": [
25940
+ "1280x720",
25941
+ "720x1280"
25942
+ ],
25943
+ "metadata": {
25944
+ "comment": "5 credits per second @ $0.01 per credit = $0.05 per second"
25945
+ }
25946
+ },
25947
+ "runwayml/gen4_image": {
25948
+ "litellm_provider": "runwayml",
25949
+ "mode": "image_generation",
25950
+ "input_cost_per_image": 0.05,
25951
+ "output_cost_per_image": 0.05,
25952
+ "source": "https://docs.dev.runwayml.com/guides/pricing/",
25953
+ "supported_modalities": [
25954
+ "text",
25955
+ "image"
25956
+ ],
25957
+ "supported_output_modalities": [
25958
+ "image"
25959
+ ],
25960
+ "supported_resolutions": [
25961
+ "1280x720",
25962
+ "1920x1080"
25963
+ ],
25964
+ "metadata": {
25965
+ "comment": "5 credits per 720p image or 8 credits per 1080p image @ $0.01 per credit. Using 5 credits ($0.05) as base cost"
25966
+ }
25967
+ },
25968
+ "runwayml/gen4_image_turbo": {
25969
+ "litellm_provider": "runwayml",
25970
+ "mode": "image_generation",
25971
+ "input_cost_per_image": 0.02,
25972
+ "output_cost_per_image": 0.02,
25973
+ "source": "https://docs.dev.runwayml.com/guides/pricing/",
25974
+ "supported_modalities": [
25975
+ "text",
25976
+ "image"
25977
+ ],
25978
+ "supported_output_modalities": [
25979
+ "image"
25980
+ ],
25981
+ "supported_resolutions": [
25982
+ "1280x720",
25983
+ "1920x1080"
25984
+ ],
25985
+ "metadata": {
25986
+ "comment": "2 credits per image (any resolution) @ $0.01 per credit = $0.02 per image"
25987
+ }
25988
+ },
25989
+ "gpt-5.1": {
25990
+ "cache_read_input_token_cost": 1.25e-07,
25991
+ "cache_read_input_token_cost_priority": 2.5e-07,
25992
+ "input_cost_per_token": 1.25e-06,
25993
+ "input_cost_per_token_priority": 2.5e-06,
25994
+ "litellm_provider": "openai",
25995
+ "max_input_tokens": 272000,
25996
+ "max_output_tokens": 128000,
25997
+ "max_tokens": 128000,
25998
+ "mode": "chat",
25999
+ "output_cost_per_token": 1e-05,
26000
+ "output_cost_per_token_priority": 2e-05,
26001
+ "supported_endpoints": [
26002
+ "/v1/chat/completions",
26003
+ "/v1/responses"
26004
+ ],
26005
+ "supported_modalities": [
26006
+ "text",
26007
+ "image"
26008
+ ],
26009
+ "supported_output_modalities": [
26010
+ "text",
26011
+ "image"
26012
+ ],
26013
+ "supports_function_calling": true,
26014
+ "supports_native_streaming": true,
26015
+ "supports_parallel_function_calling": true,
26016
+ "supports_pdf_input": true,
26017
+ "supports_prompt_caching": true,
26018
+ "supports_reasoning": true,
26019
+ "supports_response_schema": true,
26020
+ "supports_system_messages": true,
26021
+ "supports_tool_choice": true,
26022
+ "supports_service_tier": true,
26023
+ "supports_vision": true
26024
+ },
26025
+ "gpt-5.1-2025-11-13": {
26026
+ "cache_read_input_token_cost": 1.25e-07,
26027
+ "cache_read_input_token_cost_priority": 2.5e-07,
26028
+ "input_cost_per_token": 1.25e-06,
26029
+ "input_cost_per_token_priority": 2.5e-06,
26030
+ "litellm_provider": "openai",
26031
+ "max_input_tokens": 272000,
26032
+ "max_output_tokens": 128000,
26033
+ "max_tokens": 128000,
26034
+ "mode": "chat",
26035
+ "output_cost_per_token": 1e-05,
26036
+ "output_cost_per_token_priority": 2e-05,
26037
+ "supported_endpoints": [
26038
+ "/v1/chat/completions",
26039
+ "/v1/responses"
26040
+ ],
26041
+ "supported_modalities": [
26042
+ "text",
26043
+ "image"
26044
+ ],
26045
+ "supported_output_modalities": [
26046
+ "text",
26047
+ "image"
26048
+ ],
26049
+ "supports_function_calling": true,
26050
+ "supports_native_streaming": true,
26051
+ "supports_parallel_function_calling": true,
26052
+ "supports_pdf_input": true,
26053
+ "supports_prompt_caching": true,
26054
+ "supports_reasoning": true,
26055
+ "supports_response_schema": true,
26056
+ "supports_system_messages": true,
26057
+ "supports_tool_choice": true,
26058
+ "supports_service_tier": true,
26059
+ "supports_vision": true
26060
+ },
26061
+ "gpt-5.1-chat-latest": {
26062
+ "cache_read_input_token_cost": 1.25e-07,
26063
+ "cache_read_input_token_cost_priority": 2.5e-07,
26064
+ "input_cost_per_token": 1.25e-06,
26065
+ "input_cost_per_token_priority": 2.5e-06,
26066
+ "litellm_provider": "openai",
26067
+ "max_input_tokens": 128000,
26068
+ "max_output_tokens": 16384,
26069
+ "max_tokens": 16384,
26070
+ "mode": "chat",
26071
+ "output_cost_per_token": 1e-05,
26072
+ "output_cost_per_token_priority": 2e-05,
26073
+ "supported_endpoints": [
26074
+ "/v1/chat/completions",
26075
+ "/v1/responses"
26076
+ ],
26077
+ "supported_modalities": [
26078
+ "text",
26079
+ "image"
26080
+ ],
26081
+ "supported_output_modalities": [
26082
+ "text",
26083
+ "image"
26084
+ ],
26085
+ "supports_function_calling": false,
26086
+ "supports_native_streaming": true,
26087
+ "supports_parallel_function_calling": false,
26088
+ "supports_pdf_input": true,
26089
+ "supports_prompt_caching": true,
26090
+ "supports_reasoning": true,
26091
+ "supports_response_schema": true,
26092
+ "supports_system_messages": true,
26093
+ "supports_tool_choice": false,
26094
+ "supports_vision": true
26095
+ },
26096
+ "gpt-5.1-codex": {
26097
+ "cache_read_input_token_cost": 1.25e-07,
26098
+ "cache_read_input_token_cost_priority": 2.5e-07,
26099
+ "input_cost_per_token": 1.25e-06,
26100
+ "input_cost_per_token_priority": 2.5e-06,
26101
+ "litellm_provider": "openai",
26102
+ "max_input_tokens": 272000,
26103
+ "max_output_tokens": 128000,
26104
+ "max_tokens": 128000,
26105
+ "mode": "responses",
26106
+ "output_cost_per_token": 1e-05,
26107
+ "output_cost_per_token_priority": 2e-05,
26108
+ "supported_endpoints": [
26109
+ "/v1/responses"
26110
+ ],
26111
+ "supported_modalities": [
26112
+ "text",
26113
+ "image"
26114
+ ],
26115
+ "supported_output_modalities": [
26116
+ "text"
26117
+ ],
26118
+ "supports_function_calling": true,
26119
+ "supports_native_streaming": true,
26120
+ "supports_parallel_function_calling": true,
26121
+ "supports_pdf_input": true,
26122
+ "supports_prompt_caching": true,
26123
+ "supports_reasoning": true,
26124
+ "supports_response_schema": true,
26125
+ "supports_system_messages": false,
26126
+ "supports_tool_choice": true,
26127
+ "supports_vision": true
26128
+ },
26129
+ "gpt-5.1-codex-mini": {
26130
+ "cache_read_input_token_cost": 2.5e-08,
26131
+ "cache_read_input_token_cost_priority": 4.5e-08,
26132
+ "input_cost_per_token": 2.5e-07,
26133
+ "input_cost_per_token_priority": 4.5e-07,
26134
+ "litellm_provider": "openai",
26135
+ "max_input_tokens": 272000,
26136
+ "max_output_tokens": 128000,
26137
+ "max_tokens": 128000,
26138
+ "mode": "responses",
26139
+ "output_cost_per_token": 2e-06,
26140
+ "output_cost_per_token_priority": 3.6e-06,
26141
+ "supported_endpoints": [
26142
+ "/v1/responses"
26143
+ ],
26144
+ "supported_modalities": [
26145
+ "text",
26146
+ "image"
26147
+ ],
26148
+ "supported_output_modalities": [
26149
+ "text"
26150
+ ],
26151
+ "supports_function_calling": true,
26152
+ "supports_native_streaming": true,
26153
+ "supports_parallel_function_calling": true,
26154
+ "supports_pdf_input": true,
26155
+ "supports_prompt_caching": true,
26156
+ "supports_reasoning": true,
26157
+ "supports_response_schema": true,
26158
+ "supports_system_messages": false,
26159
+ "supports_tool_choice": true,
26160
+ "supports_vision": true
26161
+ },
26162
+ "fal_ai/fal-ai/flux/schnell": {
26163
+ "litellm_provider": "fal_ai",
26164
+ "mode": "image_generation",
26165
+ "output_cost_per_image": 0.003,
26166
+ "supported_endpoints": [
26167
+ "/v1/images/generations"
26168
+ ]
26169
+ },
26170
+ "fal_ai/fal-ai/imagen4/preview/fast": {
26171
+ "litellm_provider": "fal_ai",
26172
+ "mode": "image_generation",
26173
+ "output_cost_per_image": 0.02,
26174
+ "supported_endpoints": [
26175
+ "/v1/images/generations"
26176
+ ]
26177
+ },
26178
+ "fal_ai/fal-ai/imagen4/preview/ultra": {
26179
+ "litellm_provider": "fal_ai",
26180
+ "mode": "image_generation",
26181
+ "output_cost_per_image": 0.06,
26182
+ "supported_endpoints": [
26183
+ "/v1/images/generations"
26184
+ ]
26185
+ },
26186
+ "voyage/voyage-3.5": {
26187
+ "input_cost_per_token": 6e-08,
26188
+ "litellm_provider": "voyage",
26189
+ "max_input_tokens": 32000,
26190
+ "max_tokens": 32000,
26191
+ "mode": "embedding",
26192
+ "output_cost_per_token": 0.0
26193
+ },
26194
+ "voyage/voyage-3.5-lite": {
26195
+ "input_cost_per_token": 2e-08,
26196
+ "litellm_provider": "voyage",
26197
+ "max_input_tokens": 32000,
26198
+ "max_tokens": 32000,
26199
+ "mode": "embedding",
26200
+ "output_cost_per_token": 0.0
26201
+ },
26202
+ "runwayml/eleven_multilingual_v2": {
26203
+ "litellm_provider": "runwayml",
26204
+ "mode": "audio_speech",
26205
+ "input_cost_per_character": 3e-07,
26206
+ "source": "https://docs.dev.runwayml.com/guides/pricing/",
26207
+ "metadata": {
26208
+ "comment": "Estimated cost based on standard TTS pricing. RunwayML uses ElevenLabs models."
26209
+ }
26210
+ },
26211
+ "fal_ai/fal-ai/flux-pro/v1.1": {
26212
+ "litellm_provider": "fal_ai",
26213
+ "mode": "image_generation",
26214
+ "output_cost_per_image": 0.04,
26215
+ "supported_endpoints": [
26216
+ "/v1/images/generations"
26217
+ ]
26218
+ },
26219
+ "fal_ai/fal-ai/bytedance/seedream/v3/text-to-image": {
26220
+ "litellm_provider": "fal_ai",
26221
+ "mode": "image_generation",
26222
+ "output_cost_per_image": 0.03,
26223
+ "supported_endpoints": [
26224
+ "/v1/images/generations"
26225
+ ]
26226
+ },
26227
+ "fal_ai/fal-ai/bytedance/dreamina/v3.1/text-to-image": {
26228
+ "litellm_provider": "fal_ai",
26229
+ "mode": "image_generation",
26230
+ "output_cost_per_image": 0.03,
26231
+ "supported_endpoints": [
26232
+ "/v1/images/generations"
26233
+ ]
26234
+ },
26235
+ "fal_ai/fal-ai/ideogram/v3": {
26236
+ "litellm_provider": "fal_ai",
26237
+ "mode": "image_generation",
26238
+ "output_cost_per_image": 0.06,
26239
+ "supported_endpoints": [
26240
+ "/v1/images/generations"
26241
+ ]
26242
+ },
26243
+ "vertex_ai/moonshotai/kimi-k2-thinking-maas": {
26244
+ "input_cost_per_token": 6e-07,
26245
+ "litellm_provider": "vertex_ai-moonshot_models",
26246
+ "max_input_tokens": 256000,
26247
+ "max_output_tokens": 256000,
26248
+ "max_tokens": 256000,
26249
+ "mode": "chat",
26250
+ "output_cost_per_token": 2.5e-06,
26251
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models",
26252
+ "supports_function_calling": true,
26253
+ "supports_tool_choice": true,
26254
+ "supports_web_search": true
26255
+ },
26256
+ "azure/eu/gpt-5-2025-08-07": {
26257
+ "cache_read_input_token_cost": 1.375e-07,
26258
+ "input_cost_per_token": 1.375e-06,
26259
+ "litellm_provider": "azure",
26260
+ "max_input_tokens": 272000,
26261
+ "max_output_tokens": 128000,
26262
+ "max_tokens": 128000,
26263
+ "mode": "chat",
26264
+ "output_cost_per_token": 1.1e-05,
26265
+ "supported_endpoints": [
26266
+ "/v1/chat/completions",
26267
+ "/v1/batch",
26268
+ "/v1/responses"
26269
+ ],
26270
+ "supported_modalities": [
26271
+ "text",
26272
+ "image"
26273
+ ],
26274
+ "supported_output_modalities": [
26275
+ "text"
26276
+ ],
26277
+ "supports_function_calling": true,
26278
+ "supports_native_streaming": true,
26279
+ "supports_parallel_function_calling": true,
26280
+ "supports_pdf_input": true,
26281
+ "supports_prompt_caching": true,
26282
+ "supports_reasoning": true,
26283
+ "supports_response_schema": true,
26284
+ "supports_system_messages": true,
26285
+ "supports_tool_choice": true,
26286
+ "supports_vision": true
26287
+ },
26288
+ "azure/eu/gpt-5-mini-2025-08-07": {
26289
+ "cache_read_input_token_cost": 2.75e-08,
26290
+ "input_cost_per_token": 2.75e-07,
26291
+ "litellm_provider": "azure",
26292
+ "max_input_tokens": 272000,
26293
+ "max_output_tokens": 128000,
26294
+ "max_tokens": 128000,
26295
+ "mode": "chat",
26296
+ "output_cost_per_token": 2.2e-06,
26297
+ "supported_endpoints": [
26298
+ "/v1/chat/completions",
26299
+ "/v1/batch",
26300
+ "/v1/responses"
26301
+ ],
26302
+ "supported_modalities": [
26303
+ "text",
26304
+ "image"
26305
+ ],
26306
+ "supported_output_modalities": [
26307
+ "text"
26308
+ ],
26309
+ "supports_function_calling": true,
26310
+ "supports_native_streaming": true,
26311
+ "supports_parallel_function_calling": true,
26312
+ "supports_pdf_input": true,
26313
+ "supports_prompt_caching": true,
26314
+ "supports_reasoning": true,
26315
+ "supports_response_schema": true,
26316
+ "supports_system_messages": true,
26317
+ "supports_tool_choice": true,
26318
+ "supports_vision": true
26319
+ },
26320
+ "azure/eu/gpt-5-nano-2025-08-07": {
26321
+ "cache_read_input_token_cost": 5.5e-09,
26322
+ "input_cost_per_token": 5.5e-08,
26323
+ "litellm_provider": "azure",
26324
+ "max_input_tokens": 272000,
26325
+ "max_output_tokens": 128000,
26326
+ "max_tokens": 128000,
26327
+ "mode": "chat",
26328
+ "output_cost_per_token": 4.4e-07,
26329
+ "supported_endpoints": [
26330
+ "/v1/chat/completions",
26331
+ "/v1/batch",
26332
+ "/v1/responses"
26333
+ ],
26334
+ "supported_modalities": [
26335
+ "text",
26336
+ "image"
26337
+ ],
26338
+ "supported_output_modalities": [
26339
+ "text"
26340
+ ],
26341
+ "supports_function_calling": true,
26342
+ "supports_native_streaming": true,
26343
+ "supports_parallel_function_calling": true,
26344
+ "supports_pdf_input": true,
26345
+ "supports_prompt_caching": true,
26346
+ "supports_reasoning": true,
26347
+ "supports_response_schema": true,
26348
+ "supports_system_messages": true,
26349
+ "supports_tool_choice": true,
26350
+ "supports_vision": true
26351
+ },
26352
+ "azure/us/gpt-4.1-2025-04-14": {
26353
+ "deprecation_date": "2026-11-04",
26354
+ "cache_read_input_token_cost": 5.5e-07,
26355
+ "input_cost_per_token": 2.2e-06,
26356
+ "input_cost_per_token_batches": 1.1e-06,
26357
+ "litellm_provider": "azure",
26358
+ "max_input_tokens": 1047576,
26359
+ "max_output_tokens": 32768,
26360
+ "max_tokens": 32768,
26361
+ "mode": "chat",
26362
+ "output_cost_per_token": 8.8e-06,
26363
+ "output_cost_per_token_batches": 4.4e-06,
26364
+ "supported_endpoints": [
26365
+ "/v1/chat/completions",
26366
+ "/v1/batch",
26367
+ "/v1/responses"
26368
+ ],
26369
+ "supported_modalities": [
26370
+ "text",
26371
+ "image"
26372
+ ],
26373
+ "supported_output_modalities": [
26374
+ "text"
26375
+ ],
26376
+ "supports_function_calling": true,
26377
+ "supports_native_streaming": true,
26378
+ "supports_parallel_function_calling": true,
26379
+ "supports_prompt_caching": true,
26380
+ "supports_response_schema": true,
26381
+ "supports_system_messages": true,
26382
+ "supports_tool_choice": true,
26383
+ "supports_vision": true,
26384
+ "supports_web_search": false
26385
+ },
26386
+ "azure/us/gpt-4.1-mini-2025-04-14": {
26387
+ "deprecation_date": "2026-11-04",
26388
+ "cache_read_input_token_cost": 1.1e-07,
26389
+ "input_cost_per_token": 4.4e-07,
26390
+ "input_cost_per_token_batches": 2.2e-07,
26391
+ "litellm_provider": "azure",
26392
+ "max_input_tokens": 1047576,
26393
+ "max_output_tokens": 32768,
26394
+ "max_tokens": 32768,
26395
+ "mode": "chat",
26396
+ "output_cost_per_token": 1.76e-06,
26397
+ "output_cost_per_token_batches": 8.8e-07,
26398
+ "supported_endpoints": [
26399
+ "/v1/chat/completions",
26400
+ "/v1/batch",
26401
+ "/v1/responses"
26402
+ ],
26403
+ "supported_modalities": [
26404
+ "text",
26405
+ "image"
26406
+ ],
26407
+ "supported_output_modalities": [
26408
+ "text"
26409
+ ],
26410
+ "supports_function_calling": true,
26411
+ "supports_native_streaming": true,
26412
+ "supports_parallel_function_calling": true,
26413
+ "supports_prompt_caching": true,
26414
+ "supports_response_schema": true,
26415
+ "supports_system_messages": true,
26416
+ "supports_tool_choice": true,
26417
+ "supports_vision": true,
26418
+ "supports_web_search": false
26419
+ },
26420
+ "azure/us/gpt-4.1-nano-2025-04-14": {
26421
+ "deprecation_date": "2026-11-04",
26422
+ "cache_read_input_token_cost": 2.5e-08,
26423
+ "input_cost_per_token": 1.1e-07,
26424
+ "input_cost_per_token_batches": 6e-08,
26425
+ "litellm_provider": "azure",
26426
+ "max_input_tokens": 1047576,
26427
+ "max_output_tokens": 32768,
26428
+ "max_tokens": 32768,
26429
+ "mode": "chat",
26430
+ "output_cost_per_token": 4.4e-07,
26431
+ "output_cost_per_token_batches": 2.2e-07,
26432
+ "supported_endpoints": [
26433
+ "/v1/chat/completions",
26434
+ "/v1/batch",
26435
+ "/v1/responses"
26436
+ ],
26437
+ "supported_modalities": [
26438
+ "text",
26439
+ "image"
26440
+ ],
26441
+ "supported_output_modalities": [
26442
+ "text"
26443
+ ],
26444
+ "supports_function_calling": true,
26445
+ "supports_native_streaming": true,
26446
+ "supports_parallel_function_calling": true,
26447
+ "supports_prompt_caching": true,
26448
+ "supports_response_schema": true,
26449
+ "supports_system_messages": true,
26450
+ "supports_tool_choice": true,
26451
+ "supports_vision": true
26452
+ },
26453
+ "azure/us/gpt-5-2025-08-07": {
26454
+ "cache_read_input_token_cost": 1.375e-07,
26455
+ "input_cost_per_token": 1.375e-06,
26456
+ "litellm_provider": "azure",
26457
+ "max_input_tokens": 272000,
26458
+ "max_output_tokens": 128000,
26459
+ "max_tokens": 128000,
26460
+ "mode": "chat",
26461
+ "output_cost_per_token": 1.1e-05,
26462
+ "supported_endpoints": [
26463
+ "/v1/chat/completions",
26464
+ "/v1/batch",
26465
+ "/v1/responses"
26466
+ ],
26467
+ "supported_modalities": [
26468
+ "text",
26469
+ "image"
26470
+ ],
26471
+ "supported_output_modalities": [
26472
+ "text"
26473
+ ],
26474
+ "supports_function_calling": true,
26475
+ "supports_native_streaming": true,
26476
+ "supports_parallel_function_calling": true,
26477
+ "supports_pdf_input": true,
26478
+ "supports_prompt_caching": true,
26479
+ "supports_reasoning": true,
26480
+ "supports_response_schema": true,
26481
+ "supports_system_messages": true,
26482
+ "supports_tool_choice": true,
26483
+ "supports_vision": true
26484
+ },
26485
+ "azure/us/gpt-5-mini-2025-08-07": {
26486
+ "cache_read_input_token_cost": 2.75e-08,
26487
+ "input_cost_per_token": 2.75e-07,
26488
+ "litellm_provider": "azure",
26489
+ "max_input_tokens": 272000,
26490
+ "max_output_tokens": 128000,
26491
+ "max_tokens": 128000,
26492
+ "mode": "chat",
26493
+ "output_cost_per_token": 2.2e-06,
26494
+ "supported_endpoints": [
26495
+ "/v1/chat/completions",
26496
+ "/v1/batch",
26497
+ "/v1/responses"
26498
+ ],
26499
+ "supported_modalities": [
26500
+ "text",
26501
+ "image"
26502
+ ],
26503
+ "supported_output_modalities": [
26504
+ "text"
26505
+ ],
26506
+ "supports_function_calling": true,
26507
+ "supports_native_streaming": true,
26508
+ "supports_parallel_function_calling": true,
26509
+ "supports_pdf_input": true,
26510
+ "supports_prompt_caching": true,
26511
+ "supports_reasoning": true,
26512
+ "supports_response_schema": true,
26513
+ "supports_system_messages": true,
26514
+ "supports_tool_choice": true,
26515
+ "supports_vision": true
26516
+ },
26517
+ "azure/us/gpt-5-nano-2025-08-07": {
26518
+ "cache_read_input_token_cost": 5.5e-09,
26519
+ "input_cost_per_token": 5.5e-08,
26520
+ "litellm_provider": "azure",
26521
+ "max_input_tokens": 272000,
26522
+ "max_output_tokens": 128000,
26523
+ "max_tokens": 128000,
26524
+ "mode": "chat",
26525
+ "output_cost_per_token": 4.4e-07,
26526
+ "supported_endpoints": [
26527
+ "/v1/chat/completions",
26528
+ "/v1/batch",
26529
+ "/v1/responses"
26530
+ ],
26531
+ "supported_modalities": [
26532
+ "text",
26533
+ "image"
26534
+ ],
26535
+ "supported_output_modalities": [
26536
+ "text"
26537
+ ],
26538
+ "supports_function_calling": true,
26539
+ "supports_native_streaming": true,
26540
+ "supports_parallel_function_calling": true,
26541
+ "supports_pdf_input": true,
26542
+ "supports_prompt_caching": true,
26543
+ "supports_reasoning": true,
26544
+ "supports_response_schema": true,
26545
+ "supports_system_messages": true,
26546
+ "supports_tool_choice": true,
26547
+ "supports_vision": true
26548
+ },
26549
+ "azure/us/o3-2025-04-16": {
26550
+ "deprecation_date": "2026-04-16",
26551
+ "cache_read_input_token_cost": 5.5e-07,
26552
+ "input_cost_per_token": 2.2e-06,
26553
+ "litellm_provider": "azure",
26554
+ "max_input_tokens": 200000,
26555
+ "max_output_tokens": 100000,
26556
+ "max_tokens": 100000,
26557
+ "mode": "chat",
26558
+ "output_cost_per_token": 8.8e-06,
26559
+ "supported_endpoints": [
26560
+ "/v1/chat/completions",
26561
+ "/v1/batch",
26562
+ "/v1/responses"
26563
+ ],
26564
+ "supported_modalities": [
26565
+ "text",
26566
+ "image"
26567
+ ],
26568
+ "supported_output_modalities": [
26569
+ "text"
26570
+ ],
26571
+ "supports_function_calling": true,
26572
+ "supports_parallel_function_calling": false,
26573
+ "supports_prompt_caching": true,
26574
+ "supports_reasoning": true,
26575
+ "supports_response_schema": true,
26576
+ "supports_tool_choice": true,
26577
+ "supports_vision": true
26578
+ },
26579
+ "azure/us/o4-mini-2025-04-16": {
26580
+ "cache_read_input_token_cost": 3.1e-07,
26581
+ "input_cost_per_token": 1.21e-06,
26582
+ "litellm_provider": "azure",
26583
+ "max_input_tokens": 200000,
26584
+ "max_output_tokens": 100000,
26585
+ "max_tokens": 100000,
26586
+ "mode": "chat",
26587
+ "output_cost_per_token": 4.84e-06,
26588
+ "supports_function_calling": true,
26589
+ "supports_parallel_function_calling": false,
26590
+ "supports_prompt_caching": true,
26591
+ "supports_reasoning": true,
26592
+ "supports_response_schema": true,
26593
+ "supports_tool_choice": true,
26594
+ "supports_vision": true
26595
+ },
26596
+ "fireworks_ai/accounts/fireworks/models/deepseek-v3p1-terminus": {
26597
+ "input_cost_per_token": 5.6e-07,
26598
+ "litellm_provider": "fireworks_ai",
26599
+ "max_input_tokens": 128000,
26600
+ "max_output_tokens": 8192,
26601
+ "max_tokens": 8192,
26602
+ "mode": "chat",
26603
+ "output_cost_per_token": 1.68e-06,
26604
+ "source": "https://fireworks.ai/pricing",
26605
+ "supports_response_schema": true,
26606
+ "supports_tool_choice": true
26607
+ },
26608
+ "fireworks_ai/accounts/fireworks/models/kimi-k2-thinking": {
26609
+ "input_cost_per_token": 6e-07,
26610
+ "litellm_provider": "fireworks_ai",
26611
+ "max_input_tokens": 262144,
26612
+ "max_output_tokens": 262144,
26613
+ "max_tokens": 262144,
26614
+ "mode": "chat",
26615
+ "output_cost_per_token": 2.5e-06,
26616
+ "source": "https://fireworks.ai/pricing",
26617
+ "supports_function_calling": true,
26618
+ "supports_response_schema": true,
26619
+ "supports_tool_choice": true,
26620
+ "supports_web_search": true
26621
+ },
26622
+ "gemini-3-pro-preview": {
26623
+ "cache_read_input_token_cost": 2e-07,
26624
+ "cache_read_input_token_cost_above_200k_tokens": 4e-07,
26625
+ "cache_creation_input_token_cost_above_200k_tokens": 2.5e-07,
26626
+ "input_cost_per_token": 2e-06,
26627
+ "input_cost_per_token_above_200k_tokens": 4e-06,
26628
+ "input_cost_per_token_batches": 1e-06,
26629
+ "litellm_provider": "vertex_ai-language-models",
26630
+ "max_audio_length_hours": 8.4,
26631
+ "max_audio_per_prompt": 1,
26632
+ "max_images_per_prompt": 3000,
26633
+ "max_input_tokens": 1048576,
26634
+ "max_output_tokens": 65535,
26635
+ "max_pdf_size_mb": 30,
26636
+ "max_tokens": 65535,
26637
+ "max_video_length": 1,
26638
+ "max_videos_per_prompt": 10,
26639
+ "mode": "chat",
26640
+ "output_cost_per_token": 1.2e-05,
26641
+ "output_cost_per_token_above_200k_tokens": 1.8e-05,
26642
+ "output_cost_per_token_batches": 6e-06,
26643
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
26644
+ "supported_endpoints": [
26645
+ "/v1/chat/completions",
26646
+ "/v1/completions",
26647
+ "/v1/batch"
26648
+ ],
26649
+ "supported_modalities": [
26650
+ "text",
26651
+ "image",
26652
+ "audio",
26653
+ "video"
26654
+ ],
26655
+ "supported_output_modalities": [
26656
+ "text"
26657
+ ],
26658
+ "supports_audio_input": true,
26659
+ "supports_function_calling": true,
26660
+ "supports_pdf_input": true,
26661
+ "supports_prompt_caching": true,
26662
+ "supports_reasoning": true,
26663
+ "supports_response_schema": true,
26664
+ "supports_system_messages": true,
26665
+ "supports_tool_choice": true,
26666
+ "supports_video_input": true,
26667
+ "supports_vision": true,
26668
+ "supports_web_search": true
26669
+ },
26670
+ "gemini/gemini-3-pro-preview": {
26671
+ "cache_read_input_token_cost": 2e-07,
26672
+ "cache_read_input_token_cost_above_200k_tokens": 4e-07,
26673
+ "input_cost_per_token": 2e-06,
26674
+ "input_cost_per_token_above_200k_tokens": 4e-06,
26675
+ "input_cost_per_token_batches": 1e-06,
26676
+ "litellm_provider": "gemini",
26677
+ "max_audio_length_hours": 8.4,
26678
+ "max_audio_per_prompt": 1,
26679
+ "max_images_per_prompt": 3000,
26680
+ "max_input_tokens": 1048576,
26681
+ "max_output_tokens": 65535,
26682
+ "max_pdf_size_mb": 30,
26683
+ "max_tokens": 65535,
26684
+ "max_video_length": 1,
26685
+ "max_videos_per_prompt": 10,
26686
+ "mode": "chat",
26687
+ "output_cost_per_token": 1.2e-05,
26688
+ "output_cost_per_token_above_200k_tokens": 1.8e-05,
26689
+ "output_cost_per_token_batches": 6e-06,
26690
+ "rpm": 2000,
26691
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
26692
+ "supported_endpoints": [
26693
+ "/v1/chat/completions",
26694
+ "/v1/completions",
26695
+ "/v1/batch"
26696
+ ],
26697
+ "supported_modalities": [
26698
+ "text",
26699
+ "image",
26700
+ "audio",
26701
+ "video"
26702
+ ],
26703
+ "supported_output_modalities": [
26704
+ "text"
26705
+ ],
26706
+ "supports_audio_input": true,
26707
+ "supports_function_calling": true,
26708
+ "supports_pdf_input": true,
26709
+ "supports_prompt_caching": true,
26710
+ "supports_reasoning": true,
26711
+ "supports_response_schema": true,
26712
+ "supports_system_messages": true,
26713
+ "supports_tool_choice": true,
26714
+ "supports_video_input": true,
26715
+ "supports_vision": true,
26716
+ "supports_web_search": true,
26717
+ "tpm": 800000
26718
+ },
26719
+ "vertex_ai/veo-3.0-fast-generate-001": {
26720
+ "litellm_provider": "vertex_ai-video-models",
26721
+ "max_input_tokens": 1024,
26722
+ "max_tokens": 1024,
26723
+ "mode": "video_generation",
26724
+ "output_cost_per_second": 0.15,
26725
+ "source": "https://ai.google.dev/gemini-api/docs/video",
26726
+ "supported_modalities": [
26727
+ "text"
26728
+ ],
26729
+ "supported_output_modalities": [
26730
+ "video"
26731
+ ]
26732
+ },
26733
+ "vertex_ai/veo-3.0-generate-001": {
26734
+ "litellm_provider": "vertex_ai-video-models",
26735
+ "max_input_tokens": 1024,
26736
+ "max_tokens": 1024,
26737
+ "mode": "video_generation",
26738
+ "output_cost_per_second": 0.4,
26739
+ "source": "https://ai.google.dev/gemini-api/docs/video",
26740
+ "supported_modalities": [
26741
+ "text"
26742
+ ],
26743
+ "supported_output_modalities": [
26744
+ "video"
26745
+ ]
26746
+ },
26747
+ "azure/gpt-audio-2025-08-28": {
26748
+ "input_cost_per_audio_token": 4e-05,
26749
+ "input_cost_per_token": 2.5e-06,
26750
+ "litellm_provider": "azure",
26751
+ "max_input_tokens": 128000,
26752
+ "max_output_tokens": 16384,
26753
+ "max_tokens": 16384,
26754
+ "mode": "chat",
26755
+ "output_cost_per_audio_token": 8e-05,
26756
+ "output_cost_per_token": 1e-05,
26757
+ "supported_endpoints": [
26758
+ "/v1/chat/completions"
26759
+ ],
26760
+ "supported_modalities": [
26761
+ "text",
26762
+ "audio"
26763
+ ],
26764
+ "supported_output_modalities": [
26765
+ "text",
26766
+ "audio"
26767
+ ],
26768
+ "supports_function_calling": true,
26769
+ "supports_native_streaming": true,
26770
+ "supports_parallel_function_calling": true,
26771
+ "supports_prompt_caching": false,
26772
+ "supports_reasoning": false,
26773
+ "supports_response_schema": false,
26774
+ "supports_system_messages": true,
26775
+ "supports_tool_choice": true,
26776
+ "supports_vision": false
26777
+ },
26778
+ "azure/gpt-audio-mini-2025-10-06": {
26779
+ "input_cost_per_audio_token": 1e-05,
26780
+ "input_cost_per_token": 6e-07,
26781
+ "litellm_provider": "azure",
26782
+ "max_input_tokens": 128000,
26783
+ "max_output_tokens": 16384,
26784
+ "max_tokens": 16384,
26785
+ "mode": "chat",
26786
+ "output_cost_per_audio_token": 2e-05,
26787
+ "output_cost_per_token": 2.4e-06,
26788
+ "supported_endpoints": [
26789
+ "/v1/chat/completions"
26790
+ ],
26791
+ "supported_modalities": [
26792
+ "text",
26793
+ "audio"
26794
+ ],
26795
+ "supported_output_modalities": [
26796
+ "text",
26797
+ "audio"
26798
+ ],
26799
+ "supports_function_calling": true,
26800
+ "supports_native_streaming": true,
26801
+ "supports_parallel_function_calling": true,
26802
+ "supports_prompt_caching": false,
26803
+ "supports_reasoning": false,
26804
+ "supports_response_schema": false,
26805
+ "supports_system_messages": true,
26806
+ "supports_tool_choice": true,
26807
+ "supports_vision": false
26808
+ },
26809
+ "azure/gpt-realtime-2025-08-28": {
26810
+ "cache_creation_input_audio_token_cost": 4e-06,
26811
+ "cache_read_input_token_cost": 4e-06,
26812
+ "input_cost_per_audio_token": 3.2e-05,
26813
+ "input_cost_per_image": 5e-06,
26814
+ "input_cost_per_token": 4e-06,
26815
+ "litellm_provider": "azure",
26816
+ "max_input_tokens": 32000,
26817
+ "max_output_tokens": 4096,
26818
+ "max_tokens": 4096,
26819
+ "mode": "chat",
26820
+ "output_cost_per_audio_token": 6.4e-05,
26821
+ "output_cost_per_token": 1.6e-05,
26822
+ "supported_endpoints": [
26823
+ "/v1/realtime"
26824
+ ],
26825
+ "supported_modalities": [
26826
+ "text",
26827
+ "image",
26828
+ "audio"
26829
+ ],
26830
+ "supported_output_modalities": [
26831
+ "text",
26832
+ "audio"
26833
+ ],
26834
+ "supports_audio_input": true,
26835
+ "supports_audio_output": true,
26836
+ "supports_function_calling": true,
26837
+ "supports_parallel_function_calling": true,
26838
+ "supports_system_messages": true,
26839
+ "supports_tool_choice": true
26840
+ },
26841
+ "azure/gpt-realtime-mini-2025-10-06": {
26842
+ "cache_creation_input_audio_token_cost": 3e-07,
26843
+ "cache_read_input_token_cost": 6e-08,
26844
+ "input_cost_per_audio_token": 1e-05,
26845
+ "input_cost_per_image": 8e-07,
26846
+ "input_cost_per_token": 6e-07,
26847
+ "litellm_provider": "azure",
26848
+ "max_input_tokens": 32000,
26849
+ "max_output_tokens": 4096,
26850
+ "max_tokens": 4096,
26851
+ "mode": "chat",
26852
+ "output_cost_per_audio_token": 2e-05,
26853
+ "output_cost_per_token": 2.4e-06,
26854
+ "supported_endpoints": [
26855
+ "/v1/realtime"
26856
+ ],
26857
+ "supported_modalities": [
26858
+ "text",
26859
+ "image",
26860
+ "audio"
26861
+ ],
26862
+ "supported_output_modalities": [
26863
+ "text",
26864
+ "audio"
26865
+ ],
26866
+ "supports_audio_input": true,
26867
+ "supports_audio_output": true,
26868
+ "supports_function_calling": true,
26869
+ "supports_parallel_function_calling": true,
26870
+ "supports_system_messages": true,
26871
+ "supports_tool_choice": true
26872
+ },
26873
+ "azure/gpt-4o-transcribe-diarize": {
26874
+ "input_cost_per_audio_token": 6e-06,
26875
+ "input_cost_per_token": 2.5e-06,
26876
+ "litellm_provider": "azure",
26877
+ "max_input_tokens": 16000,
26878
+ "max_output_tokens": 2000,
26879
+ "mode": "audio_transcription",
26880
+ "output_cost_per_token": 1e-05,
26881
+ "supported_endpoints": [
26882
+ "/v1/audio/transcriptions"
26883
+ ]
26884
+ },
26885
+ "azure/gpt-5.1-2025-11-13": {
26886
+ "cache_read_input_token_cost": 1.25e-07,
26887
+ "cache_read_input_token_cost_priority": 2.5e-07,
26888
+ "input_cost_per_token": 1.25e-06,
26889
+ "input_cost_per_token_priority": 2.5e-06,
26890
+ "litellm_provider": "azure",
26891
+ "max_input_tokens": 272000,
26892
+ "max_output_tokens": 128000,
26893
+ "max_tokens": 128000,
26894
+ "mode": "chat",
26895
+ "output_cost_per_token": 1e-05,
26896
+ "output_cost_per_token_priority": 2e-05,
26897
+ "supported_endpoints": [
26898
+ "/v1/chat/completions",
26899
+ "/v1/responses"
26900
+ ],
26901
+ "supported_modalities": [
26902
+ "text",
26903
+ "image"
26904
+ ],
26905
+ "supported_output_modalities": [
26906
+ "text",
26907
+ "image"
26908
+ ],
26909
+ "supports_function_calling": true,
26910
+ "supports_native_streaming": true,
26911
+ "supports_parallel_function_calling": true,
26912
+ "supports_pdf_input": true,
26913
+ "supports_prompt_caching": true,
26914
+ "supports_reasoning": true,
26915
+ "supports_response_schema": true,
26916
+ "supports_system_messages": true,
26917
+ "supports_tool_choice": true,
26918
+ "supports_service_tier": true,
26919
+ "supports_vision": true
26920
+ },
26921
+ "azure/gpt-5.1-chat-2025-11-13": {
26922
+ "cache_read_input_token_cost": 1.25e-07,
26923
+ "cache_read_input_token_cost_priority": 2.5e-07,
26924
+ "input_cost_per_token": 1.25e-06,
26925
+ "input_cost_per_token_priority": 2.5e-06,
26926
+ "litellm_provider": "azure",
26927
+ "max_input_tokens": 128000,
26928
+ "max_output_tokens": 16384,
26929
+ "max_tokens": 16384,
26930
+ "mode": "chat",
26931
+ "output_cost_per_token": 1e-05,
26932
+ "output_cost_per_token_priority": 2e-05,
26933
+ "supported_endpoints": [
26934
+ "/v1/chat/completions",
26935
+ "/v1/responses"
26936
+ ],
26937
+ "supported_modalities": [
26938
+ "text",
26939
+ "image"
26940
+ ],
26941
+ "supported_output_modalities": [
26942
+ "text",
26943
+ "image"
26944
+ ],
26945
+ "supports_function_calling": false,
26946
+ "supports_native_streaming": true,
26947
+ "supports_parallel_function_calling": false,
26948
+ "supports_pdf_input": true,
26949
+ "supports_prompt_caching": true,
26950
+ "supports_reasoning": true,
26951
+ "supports_response_schema": true,
26952
+ "supports_system_messages": true,
26953
+ "supports_tool_choice": false,
26954
+ "supports_vision": true
26955
+ },
26956
+ "azure/gpt-5.1-codex-2025-11-13": {
26957
+ "cache_read_input_token_cost": 1.25e-07,
26958
+ "cache_read_input_token_cost_priority": 2.5e-07,
26959
+ "input_cost_per_token": 1.25e-06,
26960
+ "input_cost_per_token_priority": 2.5e-06,
26961
+ "litellm_provider": "azure",
26962
+ "max_input_tokens": 272000,
26963
+ "max_output_tokens": 128000,
26964
+ "max_tokens": 128000,
26965
+ "mode": "responses",
26966
+ "output_cost_per_token": 1e-05,
26967
+ "output_cost_per_token_priority": 2e-05,
26968
+ "supported_endpoints": [
26969
+ "/v1/responses"
26970
+ ],
26971
+ "supported_modalities": [
26972
+ "text",
26973
+ "image"
26974
+ ],
26975
+ "supported_output_modalities": [
26976
+ "text"
26977
+ ],
26978
+ "supports_function_calling": true,
26979
+ "supports_native_streaming": true,
26980
+ "supports_parallel_function_calling": true,
26981
+ "supports_pdf_input": true,
26982
+ "supports_prompt_caching": true,
26983
+ "supports_reasoning": true,
26984
+ "supports_response_schema": true,
26985
+ "supports_system_messages": false,
26986
+ "supports_tool_choice": true,
26987
+ "supports_vision": true
26988
+ },
26989
+ "azure/gpt-5.1-codex-mini-2025-11-13": {
26990
+ "cache_read_input_token_cost": 2.5e-08,
26991
+ "cache_read_input_token_cost_priority": 4.5e-08,
26992
+ "input_cost_per_token": 2.5e-07,
26993
+ "input_cost_per_token_priority": 4.5e-07,
26994
+ "litellm_provider": "azure",
26995
+ "max_input_tokens": 272000,
26996
+ "max_output_tokens": 128000,
26997
+ "max_tokens": 128000,
26998
+ "mode": "responses",
26999
+ "output_cost_per_token": 2e-06,
27000
+ "output_cost_per_token_priority": 3.6e-06,
27001
+ "supported_endpoints": [
27002
+ "/v1/responses"
27003
+ ],
27004
+ "supported_modalities": [
27005
+ "text",
27006
+ "image"
27007
+ ],
27008
+ "supported_output_modalities": [
27009
+ "text"
27010
+ ],
27011
+ "supports_function_calling": true,
27012
+ "supports_native_streaming": true,
27013
+ "supports_parallel_function_calling": true,
27014
+ "supports_pdf_input": true,
27015
+ "supports_prompt_caching": true,
27016
+ "supports_reasoning": true,
27017
+ "supports_response_schema": true,
27018
+ "supports_system_messages": false,
27019
+ "supports_tool_choice": true,
27020
+ "supports_vision": true
27021
+ },
27022
+ "azure/eu/gpt-5.1": {
27023
+ "cache_read_input_token_cost": 1.4e-07,
27024
+ "input_cost_per_token": 1.38e-06,
27025
+ "litellm_provider": "azure",
27026
+ "max_input_tokens": 272000,
27027
+ "max_output_tokens": 128000,
27028
+ "max_tokens": 128000,
27029
+ "mode": "chat",
27030
+ "output_cost_per_token": 1.1e-05,
27031
+ "supported_endpoints": [
27032
+ "/v1/chat/completions",
27033
+ "/v1/batch",
27034
+ "/v1/responses"
27035
+ ],
27036
+ "supported_modalities": [
27037
+ "text",
27038
+ "image"
27039
+ ],
27040
+ "supported_output_modalities": [
27041
+ "text",
27042
+ "image"
27043
+ ],
27044
+ "supports_function_calling": true,
27045
+ "supports_native_streaming": true,
27046
+ "supports_parallel_function_calling": true,
27047
+ "supports_pdf_input": true,
27048
+ "supports_prompt_caching": true,
27049
+ "supports_reasoning": true,
27050
+ "supports_response_schema": true,
27051
+ "supports_system_messages": true,
27052
+ "supports_tool_choice": true,
27053
+ "supports_vision": true
27054
+ },
27055
+ "azure/eu/gpt-5.1-chat": {
27056
+ "cache_read_input_token_cost": 1.4e-07,
27057
+ "input_cost_per_token": 1.38e-06,
27058
+ "litellm_provider": "azure",
27059
+ "max_input_tokens": 272000,
27060
+ "max_output_tokens": 128000,
27061
+ "max_tokens": 128000,
27062
+ "mode": "chat",
27063
+ "output_cost_per_token": 1.1e-05,
27064
+ "supported_endpoints": [
27065
+ "/v1/chat/completions",
27066
+ "/v1/batch",
27067
+ "/v1/responses"
27068
+ ],
27069
+ "supported_modalities": [
27070
+ "text",
27071
+ "image"
27072
+ ],
27073
+ "supported_output_modalities": [
27074
+ "text",
27075
+ "image"
27076
+ ],
27077
+ "supports_function_calling": true,
27078
+ "supports_native_streaming": true,
27079
+ "supports_parallel_function_calling": true,
27080
+ "supports_pdf_input": true,
27081
+ "supports_prompt_caching": true,
27082
+ "supports_reasoning": true,
27083
+ "supports_response_schema": true,
27084
+ "supports_system_messages": true,
27085
+ "supports_tool_choice": true,
27086
+ "supports_vision": true
27087
+ },
27088
+ "azure/eu/gpt-5.1-codex": {
27089
+ "cache_read_input_token_cost": 1.4e-07,
27090
+ "input_cost_per_token": 1.38e-06,
27091
+ "litellm_provider": "azure",
27092
+ "max_input_tokens": 272000,
27093
+ "max_output_tokens": 128000,
27094
+ "max_tokens": 128000,
27095
+ "mode": "responses",
27096
+ "output_cost_per_token": 1.1e-05,
27097
+ "supported_endpoints": [
27098
+ "/v1/responses"
27099
+ ],
27100
+ "supported_modalities": [
27101
+ "text",
27102
+ "image"
27103
+ ],
27104
+ "supported_output_modalities": [
27105
+ "text"
27106
+ ],
27107
+ "supports_function_calling": true,
27108
+ "supports_native_streaming": true,
27109
+ "supports_parallel_function_calling": true,
27110
+ "supports_pdf_input": true,
27111
+ "supports_prompt_caching": true,
27112
+ "supports_reasoning": true,
27113
+ "supports_response_schema": true,
27114
+ "supports_system_messages": false,
27115
+ "supports_tool_choice": true,
27116
+ "supports_vision": true
27117
+ },
27118
+ "azure/eu/gpt-5.1-codex-mini": {
27119
+ "cache_read_input_token_cost": 2.8e-08,
27120
+ "input_cost_per_token": 2.75e-07,
27121
+ "litellm_provider": "azure",
27122
+ "max_input_tokens": 272000,
27123
+ "max_output_tokens": 128000,
27124
+ "max_tokens": 128000,
27125
+ "mode": "responses",
27126
+ "output_cost_per_token": 2.2e-06,
27127
+ "supported_endpoints": [
27128
+ "/v1/responses"
27129
+ ],
27130
+ "supported_modalities": [
27131
+ "text",
27132
+ "image"
27133
+ ],
27134
+ "supported_output_modalities": [
27135
+ "text"
27136
+ ],
27137
+ "supports_function_calling": true,
27138
+ "supports_native_streaming": true,
27139
+ "supports_parallel_function_calling": true,
27140
+ "supports_pdf_input": true,
27141
+ "supports_prompt_caching": true,
27142
+ "supports_reasoning": true,
27143
+ "supports_response_schema": true,
27144
+ "supports_system_messages": false,
27145
+ "supports_tool_choice": true,
27146
+ "supports_vision": true
27147
+ },
27148
+ "azure/global/gpt-5.1": {
27149
+ "cache_read_input_token_cost": 1.25e-07,
27150
+ "input_cost_per_token": 1.25e-06,
27151
+ "litellm_provider": "azure",
27152
+ "max_input_tokens": 272000,
27153
+ "max_output_tokens": 128000,
27154
+ "max_tokens": 128000,
27155
+ "mode": "chat",
27156
+ "output_cost_per_token": 1e-05,
27157
+ "supported_endpoints": [
27158
+ "/v1/chat/completions",
27159
+ "/v1/batch",
27160
+ "/v1/responses"
27161
+ ],
27162
+ "supported_modalities": [
27163
+ "text",
27164
+ "image"
27165
+ ],
27166
+ "supported_output_modalities": [
27167
+ "text",
27168
+ "image"
27169
+ ],
27170
+ "supports_function_calling": true,
27171
+ "supports_native_streaming": true,
27172
+ "supports_parallel_function_calling": true,
27173
+ "supports_pdf_input": true,
27174
+ "supports_prompt_caching": true,
27175
+ "supports_reasoning": true,
27176
+ "supports_response_schema": true,
27177
+ "supports_system_messages": true,
27178
+ "supports_tool_choice": true,
27179
+ "supports_vision": true
27180
+ },
27181
+ "azure/global/gpt-5.1-chat": {
27182
+ "cache_read_input_token_cost": 1.25e-07,
27183
+ "input_cost_per_token": 1.25e-06,
27184
+ "litellm_provider": "azure",
27185
+ "max_input_tokens": 272000,
27186
+ "max_output_tokens": 128000,
27187
+ "max_tokens": 128000,
27188
+ "mode": "chat",
27189
+ "output_cost_per_token": 1e-05,
27190
+ "supported_endpoints": [
27191
+ "/v1/chat/completions",
27192
+ "/v1/batch",
27193
+ "/v1/responses"
27194
+ ],
27195
+ "supported_modalities": [
27196
+ "text",
27197
+ "image"
27198
+ ],
27199
+ "supported_output_modalities": [
27200
+ "text",
27201
+ "image"
27202
+ ],
27203
+ "supports_function_calling": true,
27204
+ "supports_native_streaming": true,
27205
+ "supports_parallel_function_calling": true,
27206
+ "supports_pdf_input": true,
27207
+ "supports_prompt_caching": true,
27208
+ "supports_reasoning": true,
27209
+ "supports_response_schema": true,
27210
+ "supports_system_messages": true,
27211
+ "supports_tool_choice": true,
27212
+ "supports_vision": true
27213
+ },
27214
+ "azure/global/gpt-5.1-codex": {
27215
+ "cache_read_input_token_cost": 1.25e-07,
27216
+ "input_cost_per_token": 1.25e-06,
27217
+ "litellm_provider": "azure",
27218
+ "max_input_tokens": 272000,
27219
+ "max_output_tokens": 128000,
27220
+ "max_tokens": 128000,
27221
+ "mode": "responses",
27222
+ "output_cost_per_token": 1e-05,
27223
+ "supported_endpoints": [
27224
+ "/v1/responses"
27225
+ ],
27226
+ "supported_modalities": [
27227
+ "text",
27228
+ "image"
27229
+ ],
27230
+ "supported_output_modalities": [
27231
+ "text"
27232
+ ],
27233
+ "supports_function_calling": true,
27234
+ "supports_native_streaming": true,
27235
+ "supports_parallel_function_calling": true,
27236
+ "supports_pdf_input": true,
27237
+ "supports_prompt_caching": true,
27238
+ "supports_reasoning": true,
27239
+ "supports_response_schema": true,
27240
+ "supports_system_messages": false,
27241
+ "supports_tool_choice": true,
27242
+ "supports_vision": true
27243
+ },
27244
+ "azure/global/gpt-5.1-codex-mini": {
27245
+ "cache_read_input_token_cost": 2.5e-08,
27246
+ "input_cost_per_token": 2.5e-07,
27247
+ "litellm_provider": "azure",
27248
+ "max_input_tokens": 272000,
27249
+ "max_output_tokens": 128000,
27250
+ "max_tokens": 128000,
27251
+ "mode": "responses",
27252
+ "output_cost_per_token": 2e-06,
27253
+ "supported_endpoints": [
27254
+ "/v1/responses"
27255
+ ],
27256
+ "supported_modalities": [
27257
+ "text",
27258
+ "image"
27259
+ ],
27260
+ "supported_output_modalities": [
27261
+ "text"
27262
+ ],
27263
+ "supports_function_calling": true,
27264
+ "supports_native_streaming": true,
27265
+ "supports_parallel_function_calling": true,
27266
+ "supports_pdf_input": true,
27267
+ "supports_prompt_caching": true,
27268
+ "supports_reasoning": true,
27269
+ "supports_response_schema": true,
27270
+ "supports_system_messages": false,
27271
+ "supports_tool_choice": true,
27272
+ "supports_vision": true
27273
+ },
27274
+ "azure/gpt-5.1": {
27275
+ "cache_read_input_token_cost": 1.25e-07,
27276
+ "input_cost_per_token": 1.25e-06,
27277
+ "litellm_provider": "azure",
27278
+ "max_input_tokens": 272000,
27279
+ "max_output_tokens": 128000,
27280
+ "max_tokens": 128000,
27281
+ "mode": "chat",
27282
+ "output_cost_per_token": 1e-05,
27283
+ "supported_endpoints": [
27284
+ "/v1/chat/completions",
27285
+ "/v1/batch",
27286
+ "/v1/responses"
27287
+ ],
27288
+ "supported_modalities": [
27289
+ "text",
27290
+ "image"
27291
+ ],
27292
+ "supported_output_modalities": [
27293
+ "text",
27294
+ "image"
27295
+ ],
27296
+ "supports_function_calling": true,
27297
+ "supports_native_streaming": true,
27298
+ "supports_parallel_function_calling": true,
27299
+ "supports_pdf_input": true,
27300
+ "supports_prompt_caching": true,
27301
+ "supports_reasoning": true,
27302
+ "supports_response_schema": true,
27303
+ "supports_system_messages": true,
27304
+ "supports_tool_choice": true,
27305
+ "supports_vision": true
27306
+ },
27307
+ "azure/gpt-5.1-chat": {
27308
+ "cache_read_input_token_cost": 1.25e-07,
27309
+ "input_cost_per_token": 1.25e-06,
27310
+ "litellm_provider": "azure",
27311
+ "max_input_tokens": 272000,
27312
+ "max_output_tokens": 128000,
27313
+ "max_tokens": 128000,
27314
+ "mode": "chat",
27315
+ "output_cost_per_token": 1e-05,
27316
+ "supported_endpoints": [
27317
+ "/v1/chat/completions",
27318
+ "/v1/batch",
27319
+ "/v1/responses"
27320
+ ],
27321
+ "supported_modalities": [
27322
+ "text",
27323
+ "image"
27324
+ ],
27325
+ "supported_output_modalities": [
27326
+ "text",
27327
+ "image"
27328
+ ],
27329
+ "supports_function_calling": true,
27330
+ "supports_native_streaming": true,
27331
+ "supports_parallel_function_calling": true,
27332
+ "supports_pdf_input": true,
27333
+ "supports_prompt_caching": true,
27334
+ "supports_reasoning": true,
27335
+ "supports_response_schema": true,
27336
+ "supports_system_messages": true,
27337
+ "supports_tool_choice": true,
27338
+ "supports_vision": true
27339
+ },
27340
+ "azure/gpt-5.1-codex": {
27341
+ "cache_read_input_token_cost": 1.25e-07,
27342
+ "input_cost_per_token": 1.25e-06,
27343
+ "litellm_provider": "azure",
27344
+ "max_input_tokens": 272000,
27345
+ "max_output_tokens": 128000,
27346
+ "max_tokens": 128000,
27347
+ "mode": "responses",
27348
+ "output_cost_per_token": 1e-05,
27349
+ "supported_endpoints": [
27350
+ "/v1/responses"
27351
+ ],
27352
+ "supported_modalities": [
27353
+ "text",
27354
+ "image"
27355
+ ],
27356
+ "supported_output_modalities": [
27357
+ "text"
27358
+ ],
27359
+ "supports_function_calling": true,
27360
+ "supports_native_streaming": true,
27361
+ "supports_parallel_function_calling": true,
27362
+ "supports_pdf_input": true,
27363
+ "supports_prompt_caching": true,
27364
+ "supports_reasoning": true,
27365
+ "supports_response_schema": true,
27366
+ "supports_system_messages": false,
27367
+ "supports_tool_choice": true,
27368
+ "supports_vision": true
27369
+ },
27370
+ "azure/gpt-5.1-codex-mini": {
27371
+ "cache_read_input_token_cost": 2.5e-08,
27372
+ "input_cost_per_token": 2.5e-07,
27373
+ "litellm_provider": "azure",
27374
+ "max_input_tokens": 272000,
27375
+ "max_output_tokens": 128000,
27376
+ "max_tokens": 128000,
27377
+ "mode": "responses",
27378
+ "output_cost_per_token": 2e-06,
27379
+ "supported_endpoints": [
27380
+ "/v1/responses"
27381
+ ],
27382
+ "supported_modalities": [
27383
+ "text",
27384
+ "image"
27385
+ ],
27386
+ "supported_output_modalities": [
27387
+ "text"
27388
+ ],
27389
+ "supports_function_calling": true,
27390
+ "supports_native_streaming": true,
27391
+ "supports_parallel_function_calling": true,
27392
+ "supports_pdf_input": true,
27393
+ "supports_prompt_caching": true,
27394
+ "supports_reasoning": true,
27395
+ "supports_response_schema": true,
27396
+ "supports_system_messages": false,
27397
+ "supports_tool_choice": true,
27398
+ "supports_vision": true
27399
+ },
27400
+ "azure/us/gpt-5.1": {
27401
+ "cache_read_input_token_cost": 1.4e-07,
27402
+ "input_cost_per_token": 1.38e-06,
27403
+ "litellm_provider": "azure",
27404
+ "max_input_tokens": 272000,
27405
+ "max_output_tokens": 128000,
27406
+ "max_tokens": 128000,
27407
+ "mode": "chat",
27408
+ "output_cost_per_token": 1.1e-05,
27409
+ "supported_endpoints": [
27410
+ "/v1/chat/completions",
27411
+ "/v1/batch",
27412
+ "/v1/responses"
27413
+ ],
27414
+ "supported_modalities": [
27415
+ "text",
27416
+ "image"
27417
+ ],
27418
+ "supported_output_modalities": [
27419
+ "text",
27420
+ "image"
27421
+ ],
27422
+ "supports_function_calling": true,
27423
+ "supports_native_streaming": true,
27424
+ "supports_parallel_function_calling": true,
27425
+ "supports_pdf_input": true,
27426
+ "supports_prompt_caching": true,
27427
+ "supports_reasoning": true,
27428
+ "supports_response_schema": true,
27429
+ "supports_system_messages": true,
27430
+ "supports_tool_choice": true,
27431
+ "supports_vision": true
27432
+ },
27433
+ "azure/us/gpt-5.1-chat": {
27434
+ "cache_read_input_token_cost": 1.4e-07,
27435
+ "input_cost_per_token": 1.38e-06,
27436
+ "litellm_provider": "azure",
27437
+ "max_input_tokens": 272000,
27438
+ "max_output_tokens": 128000,
27439
+ "max_tokens": 128000,
27440
+ "mode": "chat",
27441
+ "output_cost_per_token": 1.1e-05,
27442
+ "supported_endpoints": [
27443
+ "/v1/chat/completions",
27444
+ "/v1/batch",
27445
+ "/v1/responses"
27446
+ ],
27447
+ "supported_modalities": [
27448
+ "text",
27449
+ "image"
27450
+ ],
27451
+ "supported_output_modalities": [
27452
+ "text",
27453
+ "image"
27454
+ ],
27455
+ "supports_function_calling": true,
27456
+ "supports_native_streaming": true,
27457
+ "supports_parallel_function_calling": true,
27458
+ "supports_pdf_input": true,
27459
+ "supports_prompt_caching": true,
27460
+ "supports_reasoning": true,
27461
+ "supports_response_schema": true,
27462
+ "supports_system_messages": true,
27463
+ "supports_tool_choice": true,
27464
+ "supports_vision": true
27465
+ },
27466
+ "azure/us/gpt-5.1-codex": {
27467
+ "cache_read_input_token_cost": 1.4e-07,
27468
+ "input_cost_per_token": 1.38e-06,
27469
+ "litellm_provider": "azure",
27470
+ "max_input_tokens": 272000,
27471
+ "max_output_tokens": 128000,
27472
+ "max_tokens": 128000,
27473
+ "mode": "responses",
27474
+ "output_cost_per_token": 1.1e-05,
27475
+ "supported_endpoints": [
27476
+ "/v1/responses"
27477
+ ],
27478
+ "supported_modalities": [
27479
+ "text",
27480
+ "image"
27481
+ ],
27482
+ "supported_output_modalities": [
27483
+ "text"
27484
+ ],
27485
+ "supports_function_calling": true,
27486
+ "supports_native_streaming": true,
27487
+ "supports_parallel_function_calling": true,
27488
+ "supports_pdf_input": true,
27489
+ "supports_prompt_caching": true,
27490
+ "supports_reasoning": true,
27491
+ "supports_response_schema": true,
27492
+ "supports_system_messages": false,
27493
+ "supports_tool_choice": true,
27494
+ "supports_vision": true
27495
+ },
27496
+ "azure/us/gpt-5.1-codex-mini": {
27497
+ "cache_read_input_token_cost": 2.8e-08,
27498
+ "input_cost_per_token": 2.75e-07,
27499
+ "litellm_provider": "azure",
27500
+ "max_input_tokens": 272000,
27501
+ "max_output_tokens": 128000,
27502
+ "max_tokens": 128000,
27503
+ "mode": "responses",
27504
+ "output_cost_per_token": 2.2e-06,
27505
+ "supported_endpoints": [
27506
+ "/v1/responses"
27507
+ ],
27508
+ "supported_modalities": [
27509
+ "text",
27510
+ "image"
27511
+ ],
27512
+ "supported_output_modalities": [
27513
+ "text"
27514
+ ],
27515
+ "supports_function_calling": true,
27516
+ "supports_native_streaming": true,
27517
+ "supports_parallel_function_calling": true,
27518
+ "supports_pdf_input": true,
27519
+ "supports_prompt_caching": true,
27520
+ "supports_reasoning": true,
27521
+ "supports_response_schema": true,
27522
+ "supports_system_messages": false,
27523
+ "supports_tool_choice": true,
27524
+ "supports_vision": true
27525
+ },
27526
+ "vertex_ai/gemini-3-pro-preview": {
27527
+ "cache_read_input_token_cost": 2e-07,
27528
+ "cache_read_input_token_cost_above_200k_tokens": 4e-07,
27529
+ "cache_creation_input_token_cost_above_200k_tokens": 2.5e-07,
27530
+ "input_cost_per_token": 2e-06,
27531
+ "input_cost_per_token_above_200k_tokens": 4e-06,
27532
+ "input_cost_per_token_batches": 1e-06,
27533
+ "litellm_provider": "vertex_ai",
27534
+ "max_audio_length_hours": 8.4,
27535
+ "max_audio_per_prompt": 1,
27536
+ "max_images_per_prompt": 3000,
27537
+ "max_input_tokens": 1048576,
27538
+ "max_output_tokens": 65535,
27539
+ "max_pdf_size_mb": 30,
27540
+ "max_tokens": 65535,
27541
+ "max_video_length": 1,
27542
+ "max_videos_per_prompt": 10,
27543
+ "mode": "chat",
27544
+ "output_cost_per_token": 1.2e-05,
27545
+ "output_cost_per_token_above_200k_tokens": 1.8e-05,
27546
+ "output_cost_per_token_batches": 6e-06,
27547
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
27548
+ "supported_endpoints": [
27549
+ "/v1/chat/completions",
27550
+ "/v1/completions",
27551
+ "/v1/batch"
27552
+ ],
27553
+ "supported_modalities": [
27554
+ "text",
27555
+ "image",
27556
+ "audio",
27557
+ "video"
27558
+ ],
27559
+ "supported_output_modalities": [
27560
+ "text"
27561
+ ],
27562
+ "supports_audio_input": true,
27563
+ "supports_function_calling": true,
27564
+ "supports_pdf_input": true,
27565
+ "supports_prompt_caching": true,
27566
+ "supports_reasoning": true,
27567
+ "supports_response_schema": true,
27568
+ "supports_system_messages": true,
27569
+ "supports_tool_choice": true,
27570
+ "supports_video_input": true,
27571
+ "supports_vision": true,
27572
+ "supports_web_search": true
27573
+ },
27574
+ "vertex_ai/gemini-2.5-flash-image": {
27575
+ "cache_read_input_token_cost": 3e-08,
27576
+ "input_cost_per_audio_token": 1e-06,
27577
+ "input_cost_per_token": 3e-07,
27578
+ "litellm_provider": "vertex_ai-language-models",
27579
+ "max_audio_length_hours": 8.4,
27580
+ "max_audio_per_prompt": 1,
27581
+ "max_images_per_prompt": 3000,
27582
+ "max_input_tokens": 32768,
27583
+ "max_output_tokens": 32768,
27584
+ "max_tokens": 32768,
27585
+ "max_pdf_size_mb": 30,
27586
+ "max_video_length": 1,
27587
+ "max_videos_per_prompt": 10,
27588
+ "mode": "image_generation",
27589
+ "output_cost_per_image": 0.039,
27590
+ "output_cost_per_reasoning_token": 2.5e-06,
27591
+ "output_cost_per_token": 2.5e-06,
27592
+ "rpm": 100000,
27593
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/multimodal/image-generation#edit-an-image",
27594
+ "supported_endpoints": [
27595
+ "/v1/chat/completions",
27596
+ "/v1/completions",
27597
+ "/v1/batch"
27598
+ ],
27599
+ "supported_modalities": [
27600
+ "text",
27601
+ "image",
27602
+ "audio",
27603
+ "video"
27604
+ ],
27605
+ "supported_output_modalities": [
27606
+ "text",
27607
+ "image"
27608
+ ],
27609
+ "supports_audio_output": false,
27610
+ "supports_function_calling": true,
27611
+ "supports_parallel_function_calling": true,
27612
+ "supports_pdf_input": true,
27613
+ "supports_prompt_caching": true,
27614
+ "supports_response_schema": true,
27615
+ "supports_system_messages": true,
27616
+ "supports_tool_choice": true,
27617
+ "supports_url_context": true,
27618
+ "supports_vision": true,
27619
+ "supports_web_search": false,
27620
+ "tpm": 8000000
27621
+ },
27622
+ "vertex_ai/imagen-3.0-capability-001": {
27623
+ "litellm_provider": "vertex_ai-image-models",
27624
+ "mode": "image_generation",
27625
+ "output_cost_per_image": 0.04,
27626
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/image/edit-insert-objects"
27627
+ },
27628
+ "cerebras/gpt-oss-120b": {
27629
+ "input_cost_per_token": 2.5e-07,
27630
+ "litellm_provider": "cerebras",
27631
+ "max_input_tokens": 131072,
27632
+ "max_output_tokens": 32768,
27633
+ "max_tokens": 32768,
27634
+ "mode": "chat",
27635
+ "output_cost_per_token": 6.9e-07,
27636
+ "source": "https://www.cerebras.ai/blog/openai-gpt-oss-120b-runs-fastest-on-cerebras",
27637
+ "supports_function_calling": true,
27638
+ "supports_parallel_function_calling": true,
27639
+ "supports_reasoning": true,
27640
+ "supports_response_schema": true,
27641
+ "supports_tool_choice": true
27642
+ },
27643
+ "gemini-3-pro-image-preview": {
27644
+ "input_cost_per_image": 0.0011,
27645
+ "input_cost_per_token": 2e-06,
27646
+ "input_cost_per_token_batches": 1e-06,
27647
+ "litellm_provider": "vertex_ai-language-models",
27648
+ "max_input_tokens": 65536,
27649
+ "max_output_tokens": 32768,
27650
+ "max_tokens": 65536,
27651
+ "mode": "image_generation",
27652
+ "output_cost_per_image": 0.134,
27653
+ "output_cost_per_token": 1.2e-05,
27654
+ "output_cost_per_token_batches": 6e-06,
27655
+ "source": "https://ai.google.dev/gemini-api/docs/pricing",
27656
+ "supported_endpoints": [
27657
+ "/v1/chat/completions",
27658
+ "/v1/completions",
27659
+ "/v1/batch"
27660
+ ],
27661
+ "supported_modalities": [
27662
+ "text",
27663
+ "image"
27664
+ ],
27665
+ "supported_output_modalities": [
27666
+ "text",
27667
+ "image"
27668
+ ],
27669
+ "supports_function_calling": false,
27670
+ "supports_prompt_caching": true,
27671
+ "supports_response_schema": true,
27672
+ "supports_system_messages": true,
27673
+ "supports_vision": true,
27674
+ "supports_web_search": true
27675
+ },
27676
+ "gemini/gemini-3-pro-image-preview": {
27677
+ "input_cost_per_image": 0.0011,
27678
+ "input_cost_per_token": 2e-06,
27679
+ "input_cost_per_token_batches": 1e-06,
27680
+ "litellm_provider": "gemini",
27681
+ "max_input_tokens": 65536,
27682
+ "max_output_tokens": 32768,
27683
+ "max_tokens": 65536,
27684
+ "mode": "image_generation",
27685
+ "output_cost_per_image": 0.134,
27686
+ "output_cost_per_token": 1.2e-05,
27687
+ "rpm": 1000,
27688
+ "tpm": 4000000,
27689
+ "output_cost_per_token_batches": 6e-06,
27690
+ "source": "https://ai.google.dev/gemini-api/docs/pricing",
27691
+ "supported_endpoints": [
27692
+ "/v1/chat/completions",
27693
+ "/v1/completions",
27694
+ "/v1/batch"
27695
+ ],
27696
+ "supported_modalities": [
27697
+ "text",
27698
+ "image"
27699
+ ],
27700
+ "supported_output_modalities": [
27701
+ "text",
27702
+ "image"
27703
+ ],
27704
+ "supports_function_calling": false,
27705
+ "supports_prompt_caching": true,
27706
+ "supports_response_schema": true,
27707
+ "supports_system_messages": true,
27708
+ "supports_vision": true,
27709
+ "supports_web_search": true
27710
+ },
27711
+ "openrouter/google/gemini-3-pro-preview": {
27712
+ "cache_read_input_token_cost": 2e-07,
27713
+ "cache_read_input_token_cost_above_200k_tokens": 4e-07,
27714
+ "cache_creation_input_token_cost_above_200k_tokens": 2.5e-07,
27715
+ "input_cost_per_token": 2e-06,
27716
+ "input_cost_per_token_above_200k_tokens": 4e-06,
27717
+ "input_cost_per_token_batches": 1e-06,
27718
+ "litellm_provider": "openrouter",
27719
+ "max_audio_length_hours": 8.4,
27720
+ "max_audio_per_prompt": 1,
27721
+ "max_images_per_prompt": 3000,
27722
+ "max_input_tokens": 1048576,
27723
+ "max_output_tokens": 65535,
27724
+ "max_pdf_size_mb": 30,
27725
+ "max_tokens": 65535,
27726
+ "max_video_length": 1,
27727
+ "max_videos_per_prompt": 10,
27728
+ "mode": "chat",
27729
+ "output_cost_per_token": 1.2e-05,
27730
+ "output_cost_per_token_above_200k_tokens": 1.8e-05,
27731
+ "output_cost_per_token_batches": 6e-06,
27732
+ "supported_endpoints": [
27733
+ "/v1/chat/completions",
27734
+ "/v1/completions",
27735
+ "/v1/batch"
27736
+ ],
27737
+ "supported_modalities": [
27738
+ "text",
27739
+ "image",
27740
+ "audio",
27741
+ "video"
27742
+ ],
27743
+ "supported_output_modalities": [
27744
+ "text"
27745
+ ],
27746
+ "supports_audio_input": true,
27747
+ "supports_function_calling": true,
27748
+ "supports_pdf_input": true,
27749
+ "supports_prompt_caching": true,
27750
+ "supports_reasoning": true,
27751
+ "supports_response_schema": true,
27752
+ "supports_system_messages": true,
27753
+ "supports_tool_choice": true,
27754
+ "supports_video_input": true,
27755
+ "supports_vision": true,
27756
+ "supports_web_search": true
27757
+ },
27758
+ "together_ai/zai-org/GLM-4.6": {
27759
+ "input_cost_per_token": 6e-07,
27760
+ "litellm_provider": "together_ai",
27761
+ "max_input_tokens": 200000,
27762
+ "max_output_tokens": 200000,
27763
+ "max_tokens": 200000,
27764
+ "mode": "chat",
27765
+ "output_cost_per_token": 2.2e-06,
27766
+ "source": "https://www.together.ai/models/glm-4-6",
27767
+ "supports_function_calling": true,
27768
+ "supports_parallel_function_calling": true,
27769
+ "supports_reasoning": true,
27770
+ "supports_tool_choice": true
27771
+ },
27772
+ "vertex_ai/gemini-3-pro-image-preview": {
27773
+ "input_cost_per_image": 0.0011,
27774
+ "input_cost_per_token": 2e-06,
27775
+ "input_cost_per_token_batches": 1e-06,
27776
+ "litellm_provider": "vertex_ai-language-models",
27777
+ "max_input_tokens": 65536,
27778
+ "max_output_tokens": 32768,
27779
+ "max_tokens": 65536,
27780
+ "mode": "image_generation",
27781
+ "output_cost_per_image": 0.134,
27782
+ "output_cost_per_token": 1.2e-05,
27783
+ "output_cost_per_token_batches": 6e-06,
27784
+ "source": "https://docs.cloud.google.com/vertex-ai/generative-ai/docs/models/gemini/3-pro-image"
27785
+ },
27786
+ "xai/grok-4-1-fast": {
27787
+ "cache_read_input_token_cost": 5e-08,
27788
+ "input_cost_per_token": 2e-07,
27789
+ "input_cost_per_token_above_128k_tokens": 4e-07,
27790
+ "litellm_provider": "xai",
27791
+ "max_input_tokens": 2000000.0,
27792
+ "max_output_tokens": 2000000.0,
27793
+ "max_tokens": 2000000.0,
27794
+ "mode": "chat",
27795
+ "output_cost_per_token": 5e-07,
27796
+ "output_cost_per_token_above_128k_tokens": 1e-06,
27797
+ "source": "https://docs.x.ai/docs/models/grok-4-1-fast-reasoning",
27798
+ "supports_audio_input": true,
27799
+ "supports_function_calling": true,
27800
+ "supports_reasoning": true,
27801
+ "supports_response_schema": true,
27802
+ "supports_tool_choice": true,
27803
+ "supports_vision": true,
27804
+ "supports_web_search": true
27805
+ },
27806
+ "xai/grok-4-1-fast-reasoning": {
27807
+ "cache_read_input_token_cost": 5e-08,
27808
+ "input_cost_per_token": 2e-07,
27809
+ "input_cost_per_token_above_128k_tokens": 4e-07,
27810
+ "litellm_provider": "xai",
27811
+ "max_input_tokens": 2000000.0,
27812
+ "max_output_tokens": 2000000.0,
27813
+ "max_tokens": 2000000.0,
27814
+ "mode": "chat",
27815
+ "output_cost_per_token": 5e-07,
27816
+ "output_cost_per_token_above_128k_tokens": 1e-06,
27817
+ "source": "https://docs.x.ai/docs/models/grok-4-1-fast-reasoning",
27818
+ "supports_audio_input": true,
27819
+ "supports_function_calling": true,
27820
+ "supports_reasoning": true,
27821
+ "supports_response_schema": true,
27822
+ "supports_tool_choice": true,
27823
+ "supports_vision": true,
27824
+ "supports_web_search": true
27825
+ },
27826
+ "xai/grok-4-1-fast-reasoning-latest": {
27827
+ "cache_read_input_token_cost": 5e-08,
27828
+ "input_cost_per_token": 2e-07,
27829
+ "input_cost_per_token_above_128k_tokens": 4e-07,
27830
+ "litellm_provider": "xai",
27831
+ "max_input_tokens": 2000000.0,
27832
+ "max_output_tokens": 2000000.0,
27833
+ "max_tokens": 2000000.0,
27834
+ "mode": "chat",
27835
+ "output_cost_per_token": 5e-07,
27836
+ "output_cost_per_token_above_128k_tokens": 1e-06,
27837
+ "source": "https://docs.x.ai/docs/models/grok-4-1-fast-reasoning",
27838
+ "supports_audio_input": true,
27839
+ "supports_function_calling": true,
27840
+ "supports_reasoning": true,
27841
+ "supports_response_schema": true,
27842
+ "supports_tool_choice": true,
27843
+ "supports_vision": true,
27844
+ "supports_web_search": true
27845
+ },
27846
+ "xai/grok-4-1-fast-non-reasoning": {
27847
+ "cache_read_input_token_cost": 5e-08,
27848
+ "input_cost_per_token": 2e-07,
27849
+ "input_cost_per_token_above_128k_tokens": 4e-07,
27850
+ "litellm_provider": "xai",
27851
+ "max_input_tokens": 2000000.0,
27852
+ "max_output_tokens": 2000000.0,
27853
+ "max_tokens": 2000000.0,
27854
+ "mode": "chat",
27855
+ "output_cost_per_token": 5e-07,
27856
+ "output_cost_per_token_above_128k_tokens": 1e-06,
27857
+ "source": "https://docs.x.ai/docs/models/grok-4-1-fast-non-reasoning",
27858
+ "supports_audio_input": true,
27859
+ "supports_function_calling": true,
27860
+ "supports_response_schema": true,
27861
+ "supports_tool_choice": true,
27862
+ "supports_vision": true,
27863
+ "supports_web_search": true
27864
+ },
27865
+ "xai/grok-4-1-fast-non-reasoning-latest": {
27866
+ "cache_read_input_token_cost": 5e-08,
27867
+ "input_cost_per_token": 2e-07,
27868
+ "input_cost_per_token_above_128k_tokens": 4e-07,
27869
+ "litellm_provider": "xai",
27870
+ "max_input_tokens": 2000000.0,
27871
+ "max_output_tokens": 2000000.0,
27872
+ "max_tokens": 2000000.0,
27873
+ "mode": "chat",
27874
+ "output_cost_per_token": 5e-07,
27875
+ "output_cost_per_token_above_128k_tokens": 1e-06,
27876
+ "source": "https://docs.x.ai/docs/models/grok-4-1-fast-non-reasoning",
27877
+ "supports_audio_input": true,
27878
+ "supports_function_calling": true,
27879
+ "supports_response_schema": true,
27880
+ "supports_tool_choice": true,
27881
+ "supports_vision": true,
27882
+ "supports_web_search": true
27883
+ },
27884
+ "anthropic.claude-sonnet-4-5-20250929-v1:0": {
27885
+ "cache_creation_input_token_cost": 3.75e-06,
27886
+ "cache_read_input_token_cost": 3e-07,
27887
+ "input_cost_per_token": 3e-06,
27888
+ "input_cost_per_token_above_200k_tokens": 6e-06,
27889
+ "output_cost_per_token_above_200k_tokens": 2.25e-05,
27890
+ "cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
27891
+ "cache_read_input_token_cost_above_200k_tokens": 6e-07,
27892
+ "litellm_provider": "bedrock_converse",
27893
+ "max_input_tokens": 200000,
27894
+ "max_output_tokens": 64000,
27895
+ "max_tokens": 64000,
27896
+ "mode": "chat",
27897
+ "output_cost_per_token": 1.5e-05,
27898
+ "search_context_cost_per_query": {
27899
+ "search_context_size_high": 0.01,
27900
+ "search_context_size_low": 0.01,
27901
+ "search_context_size_medium": 0.01
27902
+ },
27903
+ "supports_assistant_prefill": true,
27904
+ "supports_computer_use": true,
27905
+ "supports_function_calling": true,
27906
+ "supports_pdf_input": true,
27907
+ "supports_prompt_caching": true,
27908
+ "supports_reasoning": true,
27909
+ "supports_response_schema": true,
27910
+ "supports_tool_choice": true,
27911
+ "supports_vision": true,
27912
+ "tool_use_system_prompt_tokens": 159
27913
+ },
27914
+ "bedrock/us-gov-east-1/claude-sonnet-4-5-20250929-v1:0": {
27915
+ "input_cost_per_token": 3.3e-06,
27916
+ "litellm_provider": "bedrock",
27917
+ "max_input_tokens": 200000,
27918
+ "max_output_tokens": 4096,
27919
+ "max_tokens": 4096,
27920
+ "mode": "chat",
27921
+ "output_cost_per_token": 1.65e-05,
27922
+ "supports_assistant_prefill": true,
27923
+ "supports_computer_use": true,
27924
+ "supports_function_calling": true,
27925
+ "supports_pdf_input": true,
27926
+ "supports_prompt_caching": true,
27927
+ "supports_reasoning": true,
27928
+ "supports_response_schema": true,
27929
+ "supports_tool_choice": true,
27930
+ "supports_vision": true
27931
+ },
27932
+ "bedrock/us-gov-west-1/claude-sonnet-4-5-20250929-v1:0": {
27933
+ "input_cost_per_token": 3.3e-06,
27934
+ "litellm_provider": "bedrock",
27935
+ "max_input_tokens": 200000,
27936
+ "max_output_tokens": 4096,
27937
+ "max_tokens": 4096,
27938
+ "mode": "chat",
27939
+ "output_cost_per_token": 1.65e-05,
27940
+ "supports_assistant_prefill": true,
27941
+ "supports_computer_use": true,
27942
+ "supports_function_calling": true,
27943
+ "supports_pdf_input": true,
27944
+ "supports_prompt_caching": true,
27945
+ "supports_reasoning": true,
27946
+ "supports_response_schema": true,
27947
+ "supports_tool_choice": true,
27948
+ "supports_vision": true
27949
+ },
27950
+ "claude-sonnet-4-5-20250929-v1:0": {
27951
+ "cache_creation_input_token_cost": 3.75e-06,
27952
+ "cache_read_input_token_cost": 3e-07,
27953
+ "input_cost_per_token": 3e-06,
27954
+ "input_cost_per_token_above_200k_tokens": 6e-06,
27955
+ "output_cost_per_token_above_200k_tokens": 2.25e-05,
27956
+ "cache_creation_input_token_cost_above_200k_tokens": 7.5e-06,
27957
+ "cache_read_input_token_cost_above_200k_tokens": 6e-07,
27958
+ "litellm_provider": "bedrock",
27959
+ "max_input_tokens": 200000,
27960
+ "max_output_tokens": 64000,
27961
+ "max_tokens": 64000,
27962
+ "mode": "chat",
27963
+ "output_cost_per_token": 1.5e-05,
27964
+ "supports_assistant_prefill": true,
27965
+ "supports_computer_use": true,
27966
+ "supports_function_calling": true,
27967
+ "supports_pdf_input": true,
27968
+ "supports_prompt_caching": true,
27969
+ "supports_reasoning": true,
27970
+ "supports_response_schema": true,
27971
+ "supports_tool_choice": true,
27972
+ "supports_vision": true,
27973
+ "tool_use_system_prompt_tokens": 159
25712
27974
  }
25713
27975
  }