@pydantic/genai-prices 0.0.43 → 0.0.45
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/cli.js +3290 -397
- package/dist/index.cjs +4 -4
- package/dist/index.js +3167 -274
- package/package.json +1 -1
package/dist/index.cjs
CHANGED
|
@@ -1,10 +1,10 @@
|
|
|
1
|
-
"use strict";Object.defineProperty(exports,Symbol.toStringTag,{value:"Module"});const
|
|
2
|
-
`,match:{or:[{starts_with:"claude-2"},{contains:"claude-v2"}]},context_window:2e5,prices:{input_mtok:8,output_mtok:24}},{id:"claude-3-5-haiku-latest",name:"Claude Haiku 3.5",description:"Fastest, most cost-effective model",match:{or:[{starts_with:"claude-3-5-haiku"},{starts_with:"claude-3.5-haiku"}]},context_window:2e5,prices:{input_mtok:.8,cache_write_mtok:1,cache_read_mtok:.08,output_mtok:4}},{id:"claude-3-5-sonnet",name:"Claude Sonnet 3.5",description:"Claude 3.5 Sonnet is an ideal balance of intelligence and speed for enterprise workloads. Maximum utility at a lower price, dependable, balanced for scaled deployments.",match:{or:[{starts_with:"claude-3-5-sonnet"},{starts_with:"claude-3.5-sonnet"}]},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3-7-sonnet-latest",name:"Claude Sonnet 3.7",description:"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities.",match:{or:[{starts_with:"claude-3-7-sonnet"},{starts_with:"claude-3.7-sonnet"},{starts_with:"claude-sonnet-3.7"},{starts_with:"claude-sonnet-3-7"}]},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3-haiku",name:"Claude Haiku 3",description:"Fastest, most cost-effective model",match:{starts_with:"claude-3-haiku"},context_window:2e5,prices:{input_mtok:.25,cache_write_mtok:.3,cache_read_mtok:.03,output_mtok:1.25}},{id:"claude-3-opus-latest",name:"Claude Opus 3",description:"Claude 3 Opus was Anthropic's most powerful model for highly complex tasks. It boasts top-level performance, intelligence, fluency, and understanding.",match:{starts_with:"claude-3-opus"},context_window:2e5,prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-3-sonnet",name:"Claude 3 Sonnet",description:"Claude 3 Sonnet is an ideal balance of intelligence and speed for enterprise workloads. Maximum utility at a lower price, dependable, balanced for scaled deployments.",match:{starts_with:"claude-3-sonnet"},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-haiku-4-5",name:"Claude Haiku 4.5",description:"Fastest and most intelligent Haiku model",match:{or:[{starts_with:"claude-haiku-4-5"},{starts_with:"claude-haiku-4.5"},{starts_with:"claude-4-5-haiku"},{starts_with:"claude-4.5-haiku"}]},context_window:2e5,prices:{input_mtok:1,cache_write_mtok:1.25,cache_read_mtok:.1,output_mtok:5}},{id:"claude-instant-1",description:"Retired, here to match price sources",match:{equals:"claude-instant-1"},prices:{input_mtok:1.63,output_mtok:55.1}},{id:"claude-instant-1.2",description:"Retired, here to match price sources",match:{equals:"claude-instant-1.2"},prices:{input_mtok:1.63,output_mtok:5.51}},{id:"claude-opus-4-0",name:"Claude Opus 4",description:"Most intelligent model for complex tasks",match:{or:[{starts_with:"claude-opus-4-0"},{starts_with:"claude-4-opus"},{equals:"claude-opus-4"},{equals:"claude-opus-4-20250514"}]},context_window:2e5,prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-opus-4-1",name:"Claude Opus 4.1",description:"Most intelligent model for complex tasks",match:{or:[{starts_with:"claude-opus-4-1"},{starts_with:"claude-opus-4.1"}]},context_window:2e5,prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-sonnet-4-0",name:"Claude Sonnet 4",description:"Optimal balance of intelligence, cost, and speed",match:{or:[{starts_with:"claude-sonnet-4-2025"},{starts_with:"claude-sonnet-4-0"},{starts_with:"claude-sonnet-4@"},{equals:"claude-sonnet-4"},{starts_with:"claude-4-sonnet"}]},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-sonnet-4-5",name:"Claude Sonnet 4.5",description:"Most intelligent model for building agents and coding",match:{or:[{starts_with:"claude-sonnet-4-5"},{starts_with:"claude-sonnet-4.5"}]},context_window:1e6,prices:{input_mtok:{base:3,tiers:[{start:2e5,price:6}]},cache_write_mtok:{base:3.75,tiers:[{start:2e5,price:7.5}]},cache_read_mtok:{base:.3,tiers:[{start:2e5,price:.6}]},output_mtok:{base:15,tiers:[{start:2e5,price:22.5}]}}},{id:"claude-v1",description:"Retired, here to match price sources",match:{equals:"claude-v1"},prices:{input_mtok:8,output_mtok:24}}]},{id:"avian",name:"Avian",pricing_urls:["https://avian.io/pricing/"],api_pattern:"https://api\\.avian\\.io",models:[{id:"Meta-Llama-3.1-405B-Instruct",match:{equals:"Meta-Llama-3.1-405B-Instruct"},prices:{input_mtok:1.5,output_mtok:1.5}},{id:"Meta-Llama-3.1-70B-Instruct",match:{equals:"Meta-Llama-3.1-70B-Instruct"},prices:{input_mtok:.45,output_mtok:.45}},{id:"Meta-Llama-3.1-8B-Instruct",match:{equals:"Meta-Llama-3.1-8B-Instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"Meta-Llama-3.3-70B-Instruct",match:{equals:"Meta-Llama-3.3-70B-Instruct"},prices:{input_mtok:.45,output_mtok:.45}}]},{id:"aws",name:"AWS Bedrock",pricing_urls:["https://aws.amazon.com/bedrock/pricing/"],api_pattern:"https://bedrock-runtime\\.[a-z0-9-]+\\.amazonaws\\.com/",provider_match:{contains:"bedrock"},extractors:[{api_flavor:"default",root:"usage",model_path:"model",mappings:[{path:"inputTokens",dest:"input_tokens",required:!0},{path:"outputTokens",dest:"output_tokens",required:!0}]},{api_flavor:"anthropic",root:"usage",model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:"cache_creation_input_tokens",dest:"input_tokens",required:!1},{path:"cache_read_input_tokens",dest:"input_tokens",required:!1},{path:"cache_creation_input_tokens",dest:"cache_write_tokens",required:!1},{path:"cache_read_input_tokens",dest:"cache_read_tokens",required:!1},{path:"output_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"amazon.nova-lite-v1:0",name:"Nova Lite",description:"Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text output. Amazon Nova Lite can handle real-time customer interactions, document analysis, and visual question-answering tasks with high accuracy.",match:{contains:"nova-lite"},prices:{input_mtok:.06,cache_read_mtok:.015,output_mtok:.24}},{id:"amazon.nova-micro-v1:0",name:"Nova Micro",description:"Amazon Nova Micro 1.0 is a text-only model that delivers the lowest latency responses in the Amazon Nova family of models at a very low cost. With a context length of 128K tokens and optimized for speed and cost, Amazon Nova Micro excels at tasks such as text summarization, translation, content classification, interactive chat, and brainstorming. It has simple mathematical reasoning and coding abilities.",match:{contains:"nova-micro"},prices:{input_mtok:.035,cache_read_mtok:.00875,output_mtok:.14}},{id:"amazon.nova-premier-v1:0",name:"Nova Premier",match:{contains:"nova-premier"},prices:{input_mtok:2.5,cache_read_mtok:.625,output_mtok:12.5}},{id:"amazon.nova-pro-v1:0",name:"Nova Pro",description:"Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks. As of December 2024, it achieves state-of-the-art performance on key benchmarks including visual question answering (TextVQA) and video understanding (VATEX).",match:{contains:"nova-pro"},prices:{input_mtok:.8,cache_read_mtok:.2,output_mtok:3.2}},{id:"amazon.nova-sonic-v1:0",name:"Nova Sonic",match:{contains:"nova-sonic"},prices:{input_mtok:.06,output_mtok:.24,input_audio_mtok:3.4,output_audio_mtok:13.6}},{id:"amazon.titan-embed-text-v1",name:"Titan Embeddings G1 - Text",match:{contains:"titan-embed-text"},prices:{input_mtok:.1}},{id:"amazon.titan-text-express-v1",name:"Titan Text G1 - Express",match:{contains:"titan-text-express"},prices:{input_mtok:.2,output_mtok:.6}},{id:"amazon.titan-text-lite-v1",name:"Titan Text G1 - Lite",match:{contains:"titan-text-lite"},prices:{input_mtok:.15,output_mtok:.2}},{id:"deepseek.r1-v1:0",name:"DeepSeek-R1",match:{contains:"r1"},prices:{input_mtok:1.35,output_mtok:5.4}},{id:"global.anthropic.claude-haiku-4-5-20251001-v1:0",match:{starts_with:"global.anthropic.claude-haiku-4-5-20251001-v1"},prices:{input_mtok:1,cache_write_mtok:1.25,cache_read_mtok:.1,output_mtok:5}},{id:"global.anthropic.claude-sonnet-4-20250514-v1:0",match:{starts_with:"global.anthropic.claude-sonnet-4-20250514-v1"},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"global.anthropic.claude-sonnet-4-5-20250929-v1:0",match:{starts_with:"global.anthropic.claude-sonnet-4-5-20250929-v1"},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"meta.llama3-1-70b-instruct-v1:0",name:"Llama 3.1 70B Instruct",match:{contains:"llama3-1-70b-instruct"},prices:{input_mtok:.72,output_mtok:.72}},{id:"meta.llama3-1-8b-instruct-v1:0",name:"Llama 3.1 8B Instruct",match:{contains:"llama3-1-8b-instruct"},prices:{input_mtok:.22,output_mtok:.22}},{id:"meta.llama3-2-11b-instruct-v1:0",name:"Llama 3.2 11B Instruct",match:{contains:"llama3-2-11b-instruct"},prices:{input_mtok:.16,output_mtok:.16}},{id:"meta.llama3-2-1b-instruct-v1:0",name:"Llama 3.2 1B Instruct",match:{contains:"llama3-2-1b-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"meta.llama3-2-3b-instruct-v1:0",name:"Llama 3.2 3B Instruct",match:{contains:"llama3-2-3b-instruct"},prices:{input_mtok:.15,output_mtok:.15}},{id:"meta.llama3-2-90b-instruct-v1:0",name:"Llama 3.2 90B Instruct",match:{contains:"llama3-2-90b-instruct"},prices:{input_mtok:.72,output_mtok:.72}},{id:"meta.llama3-3-70b-instruct-v1:0",name:"Llama 3.3 70B Instruct",match:{contains:"llama3-3-70b-instruct"},prices:{input_mtok:.72,output_mtok:.72}},{id:"meta.llama3-70b-instruct-v1:0",name:"Llama 3 70B Instruct",match:{contains:"llama3-70b-instruct"},prices:{input_mtok:2.65,output_mtok:3.5}},{id:"meta.llama3-8b-instruct-v1:0",name:"Llama 3 8B Instruct",match:{contains:"llama3-8b-instruct"},prices:{input_mtok:.3,output_mtok:.6}},{id:"meta.llama4-maverick-17b-instruct-v1:0",name:"Llama 4 Maverick 17B Instruct",match:{contains:"llama4-maverick-17b-instruct"},prices:{input_mtok:.24,output_mtok:.97}},{id:"meta.llama4-scout-17b-instruct-v1:0",name:"Llama 4 Scout 17B Instruct",match:{contains:"llama4-scout-17b-instruct"},prices:{input_mtok:.17,output_mtok:.66}},{id:"mistral.mistral-7b-instruct-v0:2",name:"Mistral 7B Instruct",match:{contains:"mistral-7b-instruct"},prices:{input_mtok:.15,output_mtok:.2}},{id:"mistral.mistral-large-2402-v1:0",name:"Mistral Large (24.02)",match:{contains:"mistral-large-2402"},prices:{input_mtok:4,output_mtok:12}},{id:"mistral.mistral-small-2402-v1:0",name:"Mistral Small (24.02)",match:{contains:"mistral-small-2402"},prices:{input_mtok:1,output_mtok:3}},{id:"mistral.mixtral-8x7b-instruct-v0:1",name:"Mixtral 8x7B Instruct",match:{contains:"mixtral-8x7b-instruct"},prices:{input_mtok:.45,output_mtok:.7}},{id:"mistral.pixtral-large-2502-v1:0",name:"Pixtral Large (25.02)",match:{contains:"pixtral-large-2502"},prices:{input_mtok:2,output_mtok:6}},{id:"openai.gpt-oss-120b-1:0",name:"gpt-oss-120b",match:{contains:"gpt-oss-120b"},prices:{input_mtok:.15,output_mtok:.6}},{id:"openai.gpt-oss-20b-1:0",name:"gpt-oss-20b",match:{contains:"gpt-oss-20b"},prices:{input_mtok:.07,output_mtok:.3}},{id:"qwen.qwen3-32b-v1:0",name:"Qwen3 32B (dense)",match:{contains:"qwen3-32b"},prices:{input_mtok:.15,output_mtok:.6}},{id:"qwen.qwen3-coder-30b-a3b-v1:0",name:"Qwen3-Coder-30B-A3B-Instruct",match:{contains:"qwen3-coder-30b-a3b"},prices:{input_mtok:.15,output_mtok:.6}},{id:"regional.anthropic.claude-3-5-haiku-20241022-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"au.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"apac.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"eu.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"us-gov.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"jp.anthropic.claude-3-5-haiku-20241022-v1"}]},prices:{input_mtok:.8,cache_write_mtok:1,cache_read_mtok:.08,output_mtok:4}},{id:"regional.anthropic.claude-3-5-sonnet-20240620-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"au.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"apac.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"eu.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"us-gov.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"jp.anthropic.claude-3-5-sonnet-20240620-v1"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-3-5-sonnet-20241022-v2:0",match:{or:[{starts_with:"us.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"au.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"apac.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"eu.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"us-gov.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"jp.anthropic.claude-3-5-sonnet-20241022-v2"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-3-7-sonnet-20250219-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"au.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"apac.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"eu.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"us-gov.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"jp.anthropic.claude-3-7-sonnet-20250219-v1"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-3-haiku-20240307-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"au.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"apac.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"eu.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"us-gov.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"jp.anthropic.claude-3-haiku-20240307-v1"}]},prices:{input_mtok:.25,output_mtok:1.25}},{id:"regional.anthropic.claude-3-opus-20240229-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-opus-20240229-v1"},{starts_with:"au.anthropic.claude-3-opus-20240229-v1"},{starts_with:"apac.anthropic.claude-3-opus-20240229-v1"},{starts_with:"eu.anthropic.claude-3-opus-20240229-v1"},{starts_with:"us-gov.anthropic.claude-3-opus-20240229-v1"},{starts_with:"jp.anthropic.claude-3-opus-20240229-v1"}]},prices:{input_mtok:15,output_mtok:75}},{id:"regional.anthropic.claude-3-sonnet-20240229-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"au.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"apac.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"eu.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"us-gov.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"jp.anthropic.claude-3-sonnet-20240229-v1"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-haiku-4-5-20251001-v1:0",match:{or:[{starts_with:"us.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"au.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"apac.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"eu.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"us-gov.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"jp.anthropic.claude-haiku-4-5-20251001-v1"}]},prices:{input_mtok:1.1,cache_write_mtok:1.375,cache_read_mtok:.11,output_mtok:5.5}},{id:"regional.anthropic.claude-opus-4-1-20250805-v1:0",match:{or:[{starts_with:"us.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"au.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"apac.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"eu.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"us-gov.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"jp.anthropic.claude-opus-4-1-20250805-v1"}]},prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"regional.anthropic.claude-opus-4-20250514-v1:0",match:{or:[{starts_with:"us.anthropic.claude-opus-4-20250514-v1"},{starts_with:"au.anthropic.claude-opus-4-20250514-v1"},{starts_with:"apac.anthropic.claude-opus-4-20250514-v1"},{starts_with:"eu.anthropic.claude-opus-4-20250514-v1"},{starts_with:"us-gov.anthropic.claude-opus-4-20250514-v1"},{starts_with:"jp.anthropic.claude-opus-4-20250514-v1"}]},prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"regional.anthropic.claude-sonnet-4-20250514-v1:0",match:{or:[{starts_with:"us.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"au.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"apac.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"eu.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"us-gov.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"jp.anthropic.claude-sonnet-4-20250514-v1"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-sonnet-4-5-20250929-v1:0",match:{or:[{starts_with:"us.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"au.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"apac.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"eu.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"us-gov.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"jp.anthropic.claude-sonnet-4-5-20250929-v1"}]},prices:{input_mtok:3.3,cache_write_mtok:4.125,cache_read_mtok:.33,output_mtok:16.5}}]},{id:"azure",name:"Microsoft Azure",pricing_urls:["https://azure.microsoft.com/en-us/pricing/details/cognitive-services/openai-service/#pricing"],api_pattern:"(https?://)?([^.]*\\.)?(?:openai\\.azure\\.com|azure-api\\.net|cognitiveservices\\.azure\\.com)",price_comments:'These are prices for "*-Global" models, prices for "Regional" models are often slightly higher. Retired models are listed at https://learn.microsoft.com/th-th/azure/ai-foundry/openai/concepts/legacy-models',models:[{id:"ada",match:{or:[{equals:"ada"},{equals:"text-embedding-ada"},{equals:"text-embedding-ada-002"},{equals:"text-embedding-ada-002-v2"}]},prices:{input_mtok:.1}},{id:"babbage",match:{or:[{equals:"babbage"},{equals:"babbage-002"}]},prices:{input_mtok:.4}},{id:"curie",match:{or:[{equals:"curie"},{equals:"text-curie"},{equals:"text-curie-001"}]},prices:{input_mtok:2}},{id:"davinci",match:{or:[{equals:"davinci"},{equals:"davinci-002"},{equals:"text-davinci"},{equals:"text-davinci-002"}]},prices:{input_mtok:2}},{id:"gpt-3.5-turbo",match:{or:[{equals:"gpt-3.5-turbo"},{equals:"gpt-3.5-turbo-0301"},{equals:"gpt-3.5-turbo-0613"},{equals:"gpt-3.5-turbo-instruct"},{equals:"gpt-3.5-turbo-instruct-0914"}]},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-3.5-turbo-0125",match:{equals:"gpt-3.5-turbo-0125"},prices:{input_mtok:.5,output_mtok:1.5}},{id:"gpt-3.5-turbo-1106",match:{equals:"gpt-3.5-turbo-1106"},prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo-16k-0613",match:{equals:"gpt-3.5-turbo-16k-0613"},prices:{input_mtok:3,output_mtok:4}},{id:"gpt-35-16k",match:{equals:"gpt-35-16k"},prices:{input_mtok:3,output_mtok:4}},{id:"gpt-35-turbo",match:{or:[{equals:"gpt-35-turbo"},{equals:"gpt-35-turbo-0613"},{equals:"gpt-35-turbo-1106"}]},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-35-turbo-16k",match:{or:[{equals:"gpt-35-turbo-16k"},{equals:"gpt-35-turbo-16k-0613"}]},prices:{input_mtok:3,output_mtok:4}},{id:"gpt-4",match:{or:[{equals:"gpt-4"},{equals:"gpt-4-0314"},{equals:"gpt-4-0613"}]},prices:{input_mtok:30,output_mtok:60}},{id:"gpt-4-0125-preview",match:{equals:"gpt-4-0125-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-1106-preview",match:{equals:"gpt-4-1106-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-1106-vision-preview",match:{equals:"gpt-4-1106-vision-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-32k",match:{or:[{equals:"gpt-4-32k"},{equals:"gpt-4-32k-0314"},{equals:"gpt-4-32k-0613"}]},prices:{input_mtok:60,output_mtok:120}},{id:"gpt-4-preview-1106",match:{equals:"gpt-4-preview-1106"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-turbo",match:{or:[{equals:"gpt-4-turbo"},{equals:"gpt-4-turbo-0125-preview"},{equals:"gpt-4-turbo-2024-04-09"},{equals:"gpt-4-turbo-preview"}]},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-vision",match:{or:[{equals:"gpt-4-vision"},{equals:"gpt-4-vision-preview"}]},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4.1",match:{or:[{equals:"gpt-4.1"},{equals:"gpt-4.1-2025-04-14"}]},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"gpt-4.1-mini",match:{or:[{equals:"gpt-4.1-mini"},{equals:"gpt-4.1-mini-2025-04-14"}]},prices:{input_mtok:.4,cache_read_mtok:.1,output_mtok:1.6}},{id:"gpt-4.1-nano",match:{or:[{equals:"gpt-4.1-nano"},{equals:"gpt-4.1-nano-2025-04-14"}]},prices:{input_mtok:.1,cache_read_mtok:.03,output_mtok:.4}},{id:"gpt-4o-2024-0513",match:{or:[{equals:"gpt-4o-2024-05-13"},{equals:"gpt-4o-2024-0513"}]},prices:{input_mtok:5,output_mtok:15}},{id:"gpt-4o-2024-08-06",match:{equals:"gpt-4o-2024-08-06"},prices:{input_mtok:2.5,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-4o-2024-1120",match:{or:[{equals:"gpt-4o-2024-1120"},{equals:"gpt-4o-2024-11-20"}]},prices:{input_mtok:2.5,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-4o-mini",match:{or:[{equals:"gpt-4o-mini"},{equals:"gpt-4o-mini-0718"},{starts_with:"gpt-4o-mini-audio"}]},context_window:128e3,prices:{input_mtok:.15,cache_read_mtok:.075,output_mtok:.6,input_audio_mtok:10,output_audio_mtok:20}},{id:"gpt-4o-mini-realtime",match:{starts_with:"gpt-4o-mini-realtime"},prices:{input_mtok:.6,cache_read_mtok:.3,output_mtok:2.4,input_audio_mtok:10,cache_audio_read_mtok:.3,output_audio_mtok:20}},{id:"gpt-4o-realtime",match:{starts_with:"gpt-4o-realtime"},prices:{input_mtok:5,cache_read_mtok:2.5,output_mtok:20,input_audio_mtok:40,cache_audio_read_mtok:2.5,output_audio_mtok:80}},{id:"gpt-5",name:"GPT-5",description:"GPT-5 is OpenAI's flagship model for coding, reasoning, and agentic tasks across domains.",match:{or:[{equals:"gpt-5"},{equals:"gpt-5-2025-08-07"}]},context_window:4e5,prices:{input_mtok:1.25,cache_read_mtok:.125,output_mtok:10}},{id:"gpt-5-mini",name:"GPT-5 mini",description:"GPT-5 mini is a faster, more cost-efficient version of GPT-5. It's great for well-defined tasks and precise prompts.",match:{or:[{equals:"gpt-5-mini"},{equals:"gpt-5-mini-2025-08-07"}]},context_window:4e5,prices:{input_mtok:.25,cache_read_mtok:.025,output_mtok:2}},{id:"gpt-5-nano",name:"GPT-5 nano",description:"GPT-5 Nano is OpenAI's fastest, cheapest version of GPT-5. It's great for summarization and classification tasks.",match:{or:[{equals:"gpt-5-nano"},{equals:"gpt-5-nano-2025-04-14"}]},context_window:4e5,prices:{input_mtok:.05,cache_read_mtok:.005,output_mtok:.4}},{id:"gpt35",match:{equals:"gpt35"},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt4-turbo-preview",match:{equals:"gpt4-turbo-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"mai-ds-r1:free",name:"MAI DS R1 (free)",description:"MAI-DS-R1 is a post-trained variant of DeepSeek-R1 developed by the Microsoft AI team to improve the model's responsiveness on previously blocked topics while enhancing its safety profile. Built on top of DeepSeek-R1's reasoning foundation, it integrates 110k examples from the Tulu-3 SFT dataset and 350k internally curated multilingual safety-alignment samples. The model retains strong reasoning, coding, and problem-solving capabilities, while unblocking a wide range of prompts previously restricted in R1.",match:{equals:"mai-ds-r1:free"},prices:{}},{id:"o1",match:{or:[{equals:"o1"},{equals:"o1-2024-12-17"},{equals:"o1-preview"},{equals:"o1-preview-2024-09-12"}]},prices:{input_mtok:15,cache_read_mtok:7.5,output_mtok:60}},{id:"o1-mini",match:{or:[{equals:"o1-mini"},{equals:"o1-mini-2024-09-12"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o3-2025-04-16",match:{or:[{equals:"o3"},{equals:"o3-2025-04-16"}]},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"o3-mini",match:{or:[{equals:"o3-mini"},{equals:"o3-mini-2025-01-31"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o4-mini",match:{or:[{contains:"o4-mini"},{contains:"o4-mini-2025-04-16"}]},prices:{input_mtok:1.1,cache_read_mtok:.28,output_mtok:4.4}},{id:"phi-3-medium-128k-instruct",name:"Phi-3 Medium 128K Instruct",description:"Phi-3 128K Medium is a powerful 14-billion parameter model designed for advanced language understanding, reasoning, and instruction following. Optimized through supervised fine-tuning and preference adjustments, it excels in tasks involving common sense, mathematics, logical reasoning, and code processing.",match:{equals:"phi-3-medium-128k-instruct"},prices:{input_mtok:1,output_mtok:1}},{id:"phi-3-mini-128k-instruct",name:"Phi-3 Mini 128K Instruct",description:"Phi-3 Mini is a powerful 3.8B parameter model designed for advanced language understanding, reasoning, and instruction following. Optimized through supervised fine-tuning and preference adjustments, it excels in tasks involving common sense, mathematics, logical reasoning, and code processing.",match:{equals:"phi-3-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"phi-3.5-mini-128k-instruct",name:"Phi-3.5 Mini 128K Instruct",description:"Phi-3.5 models are lightweight, state-of-the-art open models. These models were trained with Phi-3 datasets that include both synthetic data and the filtered, publicly available websites data, with a focus on high quality and reasoning-dense properties. Phi-3.5 Mini uses 3.8B parameters, and is a dense decoder-only transformer model using the same tokenizer as Phi-3 Mini.",match:{equals:"phi-3.5-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"phi-4",name:"Phi 4",description:"Microsoft Research Phi-4 is designed to perform well in complex reasoning tasks and can operate efficiently in situations with limited memory or where quick responses are needed.",match:{equals:"phi-4"},prices:{input_mtok:.07,output_mtok:.14}},{id:"phi-4-multimodal-instruct",name:"Phi 4 Multimodal Instruct",description:"Phi-4 Multimodal Instruct is a versatile 5.6B parameter foundation model that combines advanced reasoning and instruction-following capabilities across both text and visual inputs, providing accurate text outputs. The unified architecture enables efficient, low-latency inference, suitable for edge and mobile deployments. Phi-4 Multimodal Instruct supports text inputs in multiple languages including Arabic, Chinese, English, French, German, Japanese, Spanish, and more, with visual input optimized primarily for English. It delivers impressive performance on multimodal tasks involving mathematical, scientific, and document reasoning, providing developers and enterprises a powerful yet compact model for sophisticated interactive applications. For more information, see the Phi-4 Multimodal blog post.",match:{equals:"phi-4-multimodal-instruct"},prices:{input_mtok:.05,output_mtok:.1}},{id:"phi-4-reasoning-plus",name:"Phi 4 Reasoning Plus",description:"Phi-4-reasoning-plus is an enhanced 14B parameter model from Microsoft, fine-tuned from Phi-4 with additional reinforcement learning to boost accuracy on math, science, and code reasoning tasks. It uses the same dense decoder-only transformer architecture as Phi-4, but generates longer, more comprehensive outputs structured into a step-by-step reasoning trace and final answer.",match:{equals:"phi-4-reasoning-plus"},prices:{input_mtok:.07,output_mtok:.35}},{id:"phi-4-reasoning-plus:free",name:"Phi 4 Reasoning Plus (free)",description:"Phi-4-reasoning-plus is an enhanced 14B parameter model from Microsoft, fine-tuned from Phi-4 with additional reinforcement learning to boost accuracy on math, science, and code reasoning tasks. It uses the same dense decoder-only transformer architecture as Phi-4, but generates longer, more comprehensive outputs structured into a step-by-step reasoning trace and final answer.",match:{equals:"phi-4-reasoning-plus:free"},prices:{}},{id:"phi-4-reasoning:free",name:"Phi 4 Reasoning (free)",description:"Phi-4-reasoning is a 14B parameter dense decoder-only transformer developed by Microsoft, fine-tuned from Phi-4 to enhance complex reasoning capabilities. It uses a combination of supervised fine-tuning on chain-of-thought traces and reinforcement learning, targeting math, science, and code reasoning tasks. With a 32k context window and high inference efficiency, it is optimized for structured responses in a two-part format: reasoning trace followed by a final solution.",match:{equals:"phi-4-reasoning:free"},prices:{}},{id:"text-embedding-3-large",match:{equals:"text-embedding-3-large"},prices:{input_mtok:.13}},{id:"text-embedding-3-small",match:{equals:"text-embedding-3-small"},prices:{input_mtok:.02}},{id:"wizardlm-2-8x22b",name:"WizardLM-2 8x22B",description:"WizardLM-2 8x22B is Microsoft AI's most advanced Wizard model. It demonstrates highly competitive performance compared to leading proprietary models, and it consistently outperforms all existing state-of-the-art opensource models.",match:{equals:"wizardlm-2-8x22b"},prices:{input_mtok:.48,output_mtok:.48}}]},{id:"cerebras",name:"Cerebras",pricing_urls:["https://www.cerebras.ai/pricing#pricing","https://inference-docs.cerebras.ai/models/openai-oss"],api_pattern:"https://api\\.cerebras\\.ai",model_match:{contains:"cerebras"},provider_match:{contains:"cerebras"},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"gpt-oss-120b",name:"GPT-OSS 120B",description:"OpenAI's flagship open source model, built on a Mixture-of-Experts (MoE) architecture with 120 billion parameters and 128 experts. Delivers frontier reasoning capabilities with record-breaking inference speeds on Cerebras hardware (~3,000 tokens/second).",match:{or:[{equals:"gpt-oss-120b"},{starts_with:"cerebras/gpt-oss-120b"},{starts_with:"cerebras:gpt-oss-120b"}]},context_window:131072,price_comments:"Developer tier pricing. Free tier: 65k context, Paid tier: 131k context.",prices:{input_mtok:.35,output_mtok:.75}},{id:"llama-3.3-70b",name:"Llama 3.3 70B",description:"Meta's enhanced 70B model delivering 405B-level accuracy. Optimized for chat, coding, instruction following, mathematics, and reasoning with high-speed inference on Cerebras hardware (~2,100 tokens/second).",match:{or:[{equals:"llama-3.3-70b"},{starts_with:"cerebras/llama-3.3-70b"},{starts_with:"cerebras:llama-3.3-70b"}]},context_window:128e3,price_comments:"Developer tier pricing. Free tier: 65k context, Paid tier: 128k context.",prices:{input_mtok:.85,output_mtok:1.2}},{id:"llama3.1-8b",name:"Llama 3.1 8B",description:"Meta's Llama 3.1 8B model for general-purpose tasks including chat, coding, and instruction following. Optimized for fast inference on Cerebras hardware (~2,200 tokens/second).",match:{or:[{equals:"llama3.1-8b"},{starts_with:"cerebras/llama3.1-8b"},{starts_with:"cerebras:llama3.1-8b"}]},context_window:32768,price_comments:"Developer tier pricing. Free tier: 8k context, Paid tier: 32k context.",prices:{input_mtok:.1,output_mtok:.1}},{id:"qwen-3-32b",name:"Qwen 3 32B",description:"Qwen's 32B parameter model with enhanced reasoning and coding capabilities. Supports both standard and reasoning modes for complex tasks, with fast inference speeds on Cerebras hardware (~2,600 tokens/second).",match:{or:[{equals:"qwen-3-32b"},{starts_with:"cerebras/qwen-3-32b"},{starts_with:"cerebras:qwen-3-32b"}]},context_window:131072,price_comments:"Developer tier pricing. Free tier: 65k context, Paid tier: 131k context.",prices:{input_mtok:.4,output_mtok:.8}}]},{id:"cohere",name:"Cohere",pricing_urls:["https://cohere.com/pricing"],api_pattern:"https://api\\.cohere\\.ai",model_match:{starts_with:"command-"},provider_match:{contains:"cohere"},extractors:[{api_flavor:"default",root:["usage","billed_units"],model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:"output_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"command",name:"Command",description:"Command is an instruction-following conversational model that performs language tasks with high quality, more reliably and with a longer context than our base generative models.",match:{equals:"command"},prices:{input_mtok:1,output_mtok:2}},{id:"command-a",name:"Command A",description:`Command A is an open-weights 111B parameter model with a 256k context window focused on delivering great performance across agentic, multilingual, and coding use cases.
|
|
1
|
+
"use strict";Object.defineProperty(exports,Symbol.toStringTag,{value:"Module"});const B=[{id:"anthropic",name:"Anthropic",pricing_urls:["https://www.anthropic.com/pricing#api"],api_pattern:"https://api\\.anthropic\\.com",model_match:{contains:"claude"},provider_match:{contains:"anthropic"},extractors:[{api_flavor:"default",root:"usage",model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:"cache_creation_input_tokens",dest:"input_tokens",required:!1},{path:"cache_read_input_tokens",dest:"input_tokens",required:!1},{path:"cache_creation_input_tokens",dest:"cache_write_tokens",required:!1},{path:"cache_read_input_tokens",dest:"cache_read_tokens",required:!1},{path:"output_tokens",dest:"output_tokens",required:!0}]},{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:"cached_tokens",dest:"cache_read_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"claude-2",name:"Claude 2.0 / 2.1",description:`Claude 2 is Anthropic's previous generation model, offering reliable performance for various tasks. This includes Claude 2.0 and Claude 2.1.
|
|
2
|
+
`,match:{or:[{starts_with:"claude-2"},{contains:"claude-v2"}]},context_window:2e5,prices:{input_mtok:8,output_mtok:24}},{id:"claude-3-5-haiku-latest",name:"Claude Haiku 3.5",description:"Fastest, most cost-effective model",match:{or:[{starts_with:"claude-3-5-haiku"},{starts_with:"claude-3.5-haiku"}]},context_window:2e5,prices:{input_mtok:.8,cache_write_mtok:1,cache_read_mtok:.08,output_mtok:4}},{id:"claude-3-5-sonnet",name:"Claude Sonnet 3.5",description:"Claude 3.5 Sonnet is an ideal balance of intelligence and speed for enterprise workloads. Maximum utility at a lower price, dependable, balanced for scaled deployments.",match:{or:[{starts_with:"claude-3-5-sonnet"},{starts_with:"claude-3.5-sonnet"}]},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3-7-sonnet-latest",name:"Claude Sonnet 3.7",description:"Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities.",match:{or:[{starts_with:"claude-3-7-sonnet"},{starts_with:"claude-3.7-sonnet"},{starts_with:"claude-sonnet-3.7"},{starts_with:"claude-sonnet-3-7"}]},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3-haiku",name:"Claude Haiku 3",description:"Fastest, most cost-effective model",match:{starts_with:"claude-3-haiku"},context_window:2e5,prices:{input_mtok:.25,cache_write_mtok:.3,cache_read_mtok:.03,output_mtok:1.25}},{id:"claude-3-opus-latest",name:"Claude Opus 3",description:"Claude 3 Opus was Anthropic's most powerful model for highly complex tasks. It boasts top-level performance, intelligence, fluency, and understanding.",match:{starts_with:"claude-3-opus"},context_window:2e5,prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-3-sonnet",name:"Claude 3 Sonnet",description:"Claude 3 Sonnet is an ideal balance of intelligence and speed for enterprise workloads. Maximum utility at a lower price, dependable, balanced for scaled deployments.",match:{starts_with:"claude-3-sonnet"},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-haiku-4-5",name:"Claude Haiku 4.5",description:"Fastest and most intelligent Haiku model",match:{or:[{starts_with:"claude-haiku-4-5"},{starts_with:"claude-haiku-4.5"},{starts_with:"claude-4-5-haiku"},{starts_with:"claude-4.5-haiku"}]},context_window:2e5,prices:{input_mtok:1,cache_write_mtok:1.25,cache_read_mtok:.1,output_mtok:5}},{id:"claude-instant-1",description:"Retired, here to match price sources",match:{equals:"claude-instant-1"},prices:{input_mtok:1.63,output_mtok:55.1}},{id:"claude-instant-1.2",description:"Retired, here to match price sources",match:{equals:"claude-instant-1.2"},prices:{input_mtok:1.63,output_mtok:5.51}},{id:"claude-opus-4-0",name:"Claude Opus 4",description:"Most intelligent model for complex tasks",match:{or:[{starts_with:"claude-opus-4-0"},{starts_with:"claude-4-opus"},{equals:"claude-opus-4"},{equals:"claude-opus-4-20250514"}]},context_window:2e5,prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-opus-4-1",name:"Claude Opus 4.1",description:"Most intelligent model for complex tasks",match:{or:[{starts_with:"claude-opus-4-1"},{starts_with:"claude-opus-4.1"}]},context_window:2e5,prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-opus-4-5",name:"Claude Opus 4.5",description:"Premium model combining maximum intelligence with practical performance",match:{or:[{starts_with:"claude-opus-4-5"},{starts_with:"claude-opus-4.5"},{starts_with:"claude-4-5-opus"},{starts_with:"claude-4.5-opus"}]},context_window:2e5,prices:{input_mtok:5,cache_write_mtok:6.25,cache_read_mtok:.5,output_mtok:25}},{id:"claude-sonnet-4-0",name:"Claude Sonnet 4",description:"Optimal balance of intelligence, cost, and speed",match:{or:[{starts_with:"claude-sonnet-4-2025"},{starts_with:"claude-sonnet-4-0"},{starts_with:"claude-sonnet-4@"},{equals:"claude-sonnet-4"},{starts_with:"claude-4-sonnet"}]},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-sonnet-4-5",name:"Claude Sonnet 4.5",description:"Most intelligent model for building agents and coding",match:{or:[{starts_with:"claude-sonnet-4-5"},{starts_with:"claude-sonnet-4.5"}]},context_window:1e6,prices:{input_mtok:{base:3,tiers:[{start:2e5,price:6}]},cache_write_mtok:{base:3.75,tiers:[{start:2e5,price:7.5}]},cache_read_mtok:{base:.3,tiers:[{start:2e5,price:.6}]},output_mtok:{base:15,tiers:[{start:2e5,price:22.5}]}}},{id:"claude-v1",description:"Retired, here to match price sources",match:{equals:"claude-v1"},prices:{input_mtok:8,output_mtok:24}}]},{id:"avian",name:"Avian",pricing_urls:["https://avian.io/pricing/"],api_pattern:"https://api\\.avian\\.io",models:[{id:"Meta-Llama-3.1-405B-Instruct",match:{equals:"Meta-Llama-3.1-405B-Instruct"},prices:{input_mtok:1.5,output_mtok:1.5}},{id:"Meta-Llama-3.1-70B-Instruct",match:{equals:"Meta-Llama-3.1-70B-Instruct"},prices:{input_mtok:.45,output_mtok:.45}},{id:"Meta-Llama-3.1-8B-Instruct",match:{equals:"Meta-Llama-3.1-8B-Instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"Meta-Llama-3.3-70B-Instruct",match:{equals:"Meta-Llama-3.3-70B-Instruct"},prices:{input_mtok:.45,output_mtok:.45}}]},{id:"aws",name:"AWS Bedrock",pricing_urls:["https://aws.amazon.com/bedrock/pricing/"],api_pattern:"https://bedrock-runtime\\.[a-z0-9-]+\\.amazonaws\\.com/",provider_match:{contains:"bedrock"},extractors:[{api_flavor:"default",root:"usage",model_path:"model",mappings:[{path:"inputTokens",dest:"input_tokens",required:!0},{path:"outputTokens",dest:"output_tokens",required:!0}]},{api_flavor:"anthropic",root:"usage",model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:"cache_creation_input_tokens",dest:"input_tokens",required:!1},{path:"cache_read_input_tokens",dest:"input_tokens",required:!1},{path:"cache_creation_input_tokens",dest:"cache_write_tokens",required:!1},{path:"cache_read_input_tokens",dest:"cache_read_tokens",required:!1},{path:"output_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"amazon.nova-lite-v1:0",name:"Nova Lite",description:"Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text output. Amazon Nova Lite can handle real-time customer interactions, document analysis, and visual question-answering tasks with high accuracy.",match:{contains:"nova-lite"},prices:{input_mtok:.06,cache_read_mtok:.015,output_mtok:.24}},{id:"amazon.nova-micro-v1:0",name:"Nova Micro",description:"Amazon Nova Micro 1.0 is a text-only model that delivers the lowest latency responses in the Amazon Nova family of models at a very low cost. With a context length of 128K tokens and optimized for speed and cost, Amazon Nova Micro excels at tasks such as text summarization, translation, content classification, interactive chat, and brainstorming. It has simple mathematical reasoning and coding abilities.",match:{contains:"nova-micro"},prices:{input_mtok:.035,cache_read_mtok:.00875,output_mtok:.14}},{id:"amazon.nova-premier-v1:0",name:"Nova Premier",match:{contains:"nova-premier"},prices:{input_mtok:2.5,cache_read_mtok:.625,output_mtok:12.5}},{id:"amazon.nova-pro-v1:0",name:"Nova Pro",description:"Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks. As of December 2024, it achieves state-of-the-art performance on key benchmarks including visual question answering (TextVQA) and video understanding (VATEX).",match:{contains:"nova-pro"},prices:{input_mtok:.8,cache_read_mtok:.2,output_mtok:3.2}},{id:"amazon.nova-sonic-v1:0",name:"Nova Sonic",match:{contains:"nova-sonic"},prices:{input_mtok:.06,output_mtok:.24,input_audio_mtok:3.4,output_audio_mtok:13.6}},{id:"amazon.titan-embed-text-v1",name:"Titan Embeddings G1 - Text",match:{contains:"titan-embed-text"},prices:{input_mtok:.1}},{id:"amazon.titan-text-express-v1",name:"Titan Text G1 - Express",match:{contains:"titan-text-express"},prices:{input_mtok:.2,output_mtok:.6}},{id:"amazon.titan-text-lite-v1",name:"Titan Text G1 - Lite",match:{contains:"titan-text-lite"},prices:{input_mtok:.15,output_mtok:.2}},{id:"deepseek.r1-v1:0",name:"DeepSeek-R1",match:{contains:"r1"},prices:{input_mtok:1.35,output_mtok:5.4}},{id:"global.anthropic.claude-haiku-4-5-20251001-v1:0",match:{starts_with:"global.anthropic.claude-haiku-4-5-20251001-v1"},prices:{input_mtok:1,cache_write_mtok:1.25,cache_read_mtok:.1,output_mtok:5}},{id:"global.anthropic.claude-sonnet-4-20250514-v1:0",match:{starts_with:"global.anthropic.claude-sonnet-4-20250514-v1"},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"global.anthropic.claude-sonnet-4-5-20250929-v1:0",match:{starts_with:"global.anthropic.claude-sonnet-4-5-20250929-v1"},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"meta.llama3-1-70b-instruct-v1:0",name:"Llama 3.1 70B Instruct",match:{contains:"llama3-1-70b-instruct"},prices:{input_mtok:.72,output_mtok:.72}},{id:"meta.llama3-1-8b-instruct-v1:0",name:"Llama 3.1 8B Instruct",match:{contains:"llama3-1-8b-instruct"},prices:{input_mtok:.22,output_mtok:.22}},{id:"meta.llama3-2-11b-instruct-v1:0",name:"Llama 3.2 11B Instruct",match:{contains:"llama3-2-11b-instruct"},prices:{input_mtok:.16,output_mtok:.16}},{id:"meta.llama3-2-1b-instruct-v1:0",name:"Llama 3.2 1B Instruct",match:{contains:"llama3-2-1b-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"meta.llama3-2-3b-instruct-v1:0",name:"Llama 3.2 3B Instruct",match:{contains:"llama3-2-3b-instruct"},prices:{input_mtok:.15,output_mtok:.15}},{id:"meta.llama3-2-90b-instruct-v1:0",name:"Llama 3.2 90B Instruct",match:{contains:"llama3-2-90b-instruct"},prices:{input_mtok:.72,output_mtok:.72}},{id:"meta.llama3-3-70b-instruct-v1:0",name:"Llama 3.3 70B Instruct",match:{contains:"llama3-3-70b-instruct"},prices:{input_mtok:.72,output_mtok:.72}},{id:"meta.llama3-70b-instruct-v1:0",name:"Llama 3 70B Instruct",match:{contains:"llama3-70b-instruct"},prices:{input_mtok:2.65,output_mtok:3.5}},{id:"meta.llama3-8b-instruct-v1:0",name:"Llama 3 8B Instruct",match:{contains:"llama3-8b-instruct"},prices:{input_mtok:.3,output_mtok:.6}},{id:"meta.llama4-maverick-17b-instruct-v1:0",name:"Llama 4 Maverick 17B Instruct",match:{contains:"llama4-maverick-17b-instruct"},prices:{input_mtok:.24,output_mtok:.97}},{id:"meta.llama4-scout-17b-instruct-v1:0",name:"Llama 4 Scout 17B Instruct",match:{contains:"llama4-scout-17b-instruct"},prices:{input_mtok:.17,output_mtok:.66}},{id:"mistral.mistral-7b-instruct-v0:2",name:"Mistral 7B Instruct",match:{contains:"mistral-7b-instruct"},prices:{input_mtok:.15,output_mtok:.2}},{id:"mistral.mistral-large-2402-v1:0",name:"Mistral Large (24.02)",match:{contains:"mistral-large-2402"},prices:{input_mtok:4,output_mtok:12}},{id:"mistral.mistral-small-2402-v1:0",name:"Mistral Small (24.02)",match:{contains:"mistral-small-2402"},prices:{input_mtok:1,output_mtok:3}},{id:"mistral.mixtral-8x7b-instruct-v0:1",name:"Mixtral 8x7B Instruct",match:{contains:"mixtral-8x7b-instruct"},prices:{input_mtok:.45,output_mtok:.7}},{id:"mistral.pixtral-large-2502-v1:0",name:"Pixtral Large (25.02)",match:{contains:"pixtral-large-2502"},prices:{input_mtok:2,output_mtok:6}},{id:"openai.gpt-oss-120b-1:0",name:"gpt-oss-120b",match:{contains:"gpt-oss-120b"},prices:{input_mtok:.15,output_mtok:.6}},{id:"openai.gpt-oss-20b-1:0",name:"gpt-oss-20b",match:{contains:"gpt-oss-20b"},prices:{input_mtok:.07,output_mtok:.3}},{id:"qwen.qwen3-32b-v1:0",name:"Qwen3 32B (dense)",match:{contains:"qwen3-32b"},prices:{input_mtok:.15,output_mtok:.6}},{id:"qwen.qwen3-coder-30b-a3b-v1:0",name:"Qwen3-Coder-30B-A3B-Instruct",match:{contains:"qwen3-coder-30b-a3b"},prices:{input_mtok:.15,output_mtok:.6}},{id:"regional.anthropic.claude-3-5-haiku-20241022-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"au.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"apac.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"eu.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"us-gov.anthropic.claude-3-5-haiku-20241022-v1"},{starts_with:"jp.anthropic.claude-3-5-haiku-20241022-v1"}]},prices:{input_mtok:.8,cache_write_mtok:1,cache_read_mtok:.08,output_mtok:4}},{id:"regional.anthropic.claude-3-5-sonnet-20240620-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"au.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"apac.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"eu.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"us-gov.anthropic.claude-3-5-sonnet-20240620-v1"},{starts_with:"jp.anthropic.claude-3-5-sonnet-20240620-v1"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-3-5-sonnet-20241022-v2:0",match:{or:[{starts_with:"us.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"au.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"apac.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"eu.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"us-gov.anthropic.claude-3-5-sonnet-20241022-v2"},{starts_with:"jp.anthropic.claude-3-5-sonnet-20241022-v2"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-3-7-sonnet-20250219-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"au.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"apac.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"eu.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"us-gov.anthropic.claude-3-7-sonnet-20250219-v1"},{starts_with:"jp.anthropic.claude-3-7-sonnet-20250219-v1"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-3-haiku-20240307-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"au.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"apac.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"eu.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"us-gov.anthropic.claude-3-haiku-20240307-v1"},{starts_with:"jp.anthropic.claude-3-haiku-20240307-v1"}]},prices:{input_mtok:.25,output_mtok:1.25}},{id:"regional.anthropic.claude-3-opus-20240229-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-opus-20240229-v1"},{starts_with:"au.anthropic.claude-3-opus-20240229-v1"},{starts_with:"apac.anthropic.claude-3-opus-20240229-v1"},{starts_with:"eu.anthropic.claude-3-opus-20240229-v1"},{starts_with:"us-gov.anthropic.claude-3-opus-20240229-v1"},{starts_with:"jp.anthropic.claude-3-opus-20240229-v1"}]},prices:{input_mtok:15,output_mtok:75}},{id:"regional.anthropic.claude-3-sonnet-20240229-v1:0",match:{or:[{starts_with:"us.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"au.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"apac.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"eu.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"us-gov.anthropic.claude-3-sonnet-20240229-v1"},{starts_with:"jp.anthropic.claude-3-sonnet-20240229-v1"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-haiku-4-5-20251001-v1:0",match:{or:[{starts_with:"us.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"au.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"apac.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"eu.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"us-gov.anthropic.claude-haiku-4-5-20251001-v1"},{starts_with:"jp.anthropic.claude-haiku-4-5-20251001-v1"}]},prices:{input_mtok:1.1,cache_write_mtok:1.375,cache_read_mtok:.11,output_mtok:5.5}},{id:"regional.anthropic.claude-opus-4-1-20250805-v1:0",match:{or:[{starts_with:"us.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"au.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"apac.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"eu.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"us-gov.anthropic.claude-opus-4-1-20250805-v1"},{starts_with:"jp.anthropic.claude-opus-4-1-20250805-v1"}]},prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"regional.anthropic.claude-opus-4-20250514-v1:0",match:{or:[{starts_with:"us.anthropic.claude-opus-4-20250514-v1"},{starts_with:"au.anthropic.claude-opus-4-20250514-v1"},{starts_with:"apac.anthropic.claude-opus-4-20250514-v1"},{starts_with:"eu.anthropic.claude-opus-4-20250514-v1"},{starts_with:"us-gov.anthropic.claude-opus-4-20250514-v1"},{starts_with:"jp.anthropic.claude-opus-4-20250514-v1"}]},prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"regional.anthropic.claude-sonnet-4-20250514-v1:0",match:{or:[{starts_with:"us.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"au.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"apac.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"eu.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"us-gov.anthropic.claude-sonnet-4-20250514-v1"},{starts_with:"jp.anthropic.claude-sonnet-4-20250514-v1"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"regional.anthropic.claude-sonnet-4-5-20250929-v1:0",match:{or:[{starts_with:"us.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"au.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"apac.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"eu.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"us-gov.anthropic.claude-sonnet-4-5-20250929-v1"},{starts_with:"jp.anthropic.claude-sonnet-4-5-20250929-v1"}]},prices:{input_mtok:3.3,cache_write_mtok:4.125,cache_read_mtok:.33,output_mtok:16.5}}]},{id:"azure",name:"Microsoft Azure",pricing_urls:["https://azure.microsoft.com/en-us/pricing/details/cognitive-services/openai-service/#pricing"],api_pattern:"(https?://)?([^.]*\\.)?(?:openai\\.azure\\.com|azure-api\\.net|cognitiveservices\\.azure\\.com)",price_comments:'These are prices for "*-Global" models, prices for "Regional" models are often slightly higher. Retired models are listed at https://learn.microsoft.com/th-th/azure/ai-foundry/openai/concepts/legacy-models',extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]},{api_flavor:"responses",root:"usage",model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:["input_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:"output_tokens",dest:"output_tokens",required:!0}]},{api_flavor:"embeddings",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0}]},{api_flavor:"anthropic",root:"usage",model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:"cache_creation_input_tokens",dest:"input_tokens",required:!1},{path:"cache_read_input_tokens",dest:"input_tokens",required:!1},{path:"cache_creation_input_tokens",dest:"cache_write_tokens",required:!1},{path:"cache_read_input_tokens",dest:"cache_read_tokens",required:!1},{path:"output_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"ada",match:{or:[{equals:"ada"},{equals:"text-embedding-ada"},{equals:"text-embedding-ada-002"},{equals:"text-embedding-ada-002-v2"}]},prices:{input_mtok:.1}},{id:"babbage",match:{or:[{equals:"babbage"},{equals:"babbage-002"}]},prices:{input_mtok:.4}},{id:"curie",match:{or:[{equals:"curie"},{equals:"text-curie"},{equals:"text-curie-001"}]},prices:{input_mtok:2}},{id:"davinci",match:{or:[{equals:"davinci"},{equals:"davinci-002"},{equals:"text-davinci"},{equals:"text-davinci-002"}]},prices:{input_mtok:2}},{id:"gpt-3.5-turbo",match:{or:[{equals:"gpt-3.5-turbo"},{equals:"gpt-3.5-turbo-0301"},{equals:"gpt-3.5-turbo-0613"},{equals:"gpt-3.5-turbo-instruct"},{equals:"gpt-3.5-turbo-instruct-0914"}]},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-3.5-turbo-0125",match:{equals:"gpt-3.5-turbo-0125"},prices:{input_mtok:.5,output_mtok:1.5}},{id:"gpt-3.5-turbo-1106",match:{equals:"gpt-3.5-turbo-1106"},prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo-16k-0613",match:{equals:"gpt-3.5-turbo-16k-0613"},prices:{input_mtok:3,output_mtok:4}},{id:"gpt-35-16k",match:{equals:"gpt-35-16k"},prices:{input_mtok:3,output_mtok:4}},{id:"gpt-35-turbo",match:{or:[{equals:"gpt-35-turbo"},{equals:"gpt-35-turbo-0613"},{equals:"gpt-35-turbo-1106"}]},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-35-turbo-16k",match:{or:[{equals:"gpt-35-turbo-16k"},{equals:"gpt-35-turbo-16k-0613"}]},prices:{input_mtok:3,output_mtok:4}},{id:"gpt-4",match:{or:[{equals:"gpt-4"},{equals:"gpt-4-0314"},{equals:"gpt-4-0613"}]},prices:{input_mtok:30,output_mtok:60}},{id:"gpt-4-0125-preview",match:{equals:"gpt-4-0125-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-1106-preview",match:{equals:"gpt-4-1106-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-1106-vision-preview",match:{equals:"gpt-4-1106-vision-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-32k",match:{or:[{equals:"gpt-4-32k"},{equals:"gpt-4-32k-0314"},{equals:"gpt-4-32k-0613"}]},prices:{input_mtok:60,output_mtok:120}},{id:"gpt-4-preview-1106",match:{equals:"gpt-4-preview-1106"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-turbo",match:{or:[{equals:"gpt-4-turbo"},{equals:"gpt-4-turbo-0125-preview"},{equals:"gpt-4-turbo-2024-04-09"},{equals:"gpt-4-turbo-preview"}]},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-vision",match:{or:[{equals:"gpt-4-vision"},{equals:"gpt-4-vision-preview"}]},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4.1",match:{or:[{equals:"gpt-4.1"},{equals:"gpt-4.1-2025-04-14"}]},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"gpt-4.1-mini",match:{or:[{equals:"gpt-4.1-mini"},{equals:"gpt-4.1-mini-2025-04-14"}]},prices:{input_mtok:.4,cache_read_mtok:.1,output_mtok:1.6}},{id:"gpt-4.1-nano",match:{or:[{equals:"gpt-4.1-nano"},{equals:"gpt-4.1-nano-2025-04-14"}]},prices:{input_mtok:.1,cache_read_mtok:.03,output_mtok:.4}},{id:"gpt-4o-2024-0513",match:{or:[{equals:"gpt-4o-2024-05-13"},{equals:"gpt-4o-2024-0513"}]},prices:{input_mtok:5,output_mtok:15}},{id:"gpt-4o-2024-08-06",match:{equals:"gpt-4o-2024-08-06"},prices:{input_mtok:2.5,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-4o-2024-1120",match:{or:[{equals:"gpt-4o-2024-1120"},{equals:"gpt-4o-2024-11-20"}]},prices:{input_mtok:2.5,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-4o-mini",match:{or:[{equals:"gpt-4o-mini"},{equals:"gpt-4o-mini-0718"},{starts_with:"gpt-4o-mini-audio"}]},context_window:128e3,prices:{input_mtok:.15,cache_read_mtok:.075,output_mtok:.6,input_audio_mtok:10,output_audio_mtok:20}},{id:"gpt-4o-mini-realtime",match:{starts_with:"gpt-4o-mini-realtime"},prices:{input_mtok:.6,cache_read_mtok:.3,output_mtok:2.4,input_audio_mtok:10,cache_audio_read_mtok:.3,output_audio_mtok:20}},{id:"gpt-4o-realtime",match:{starts_with:"gpt-4o-realtime"},prices:{input_mtok:5,cache_read_mtok:2.5,output_mtok:20,input_audio_mtok:40,cache_audio_read_mtok:2.5,output_audio_mtok:80}},{id:"gpt-5",name:"GPT-5",description:"GPT-5 is OpenAI's flagship model for coding, reasoning, and agentic tasks across domains.",match:{or:[{equals:"gpt-5"},{equals:"gpt-5-2025-08-07"}]},context_window:4e5,prices:{input_mtok:1.25,cache_read_mtok:.125,output_mtok:10}},{id:"gpt-5-mini",name:"GPT-5 mini",description:"GPT-5 mini is a faster, more cost-efficient version of GPT-5. It's great for well-defined tasks and precise prompts.",match:{or:[{equals:"gpt-5-mini"},{equals:"gpt-5-mini-2025-08-07"}]},context_window:4e5,prices:{input_mtok:.25,cache_read_mtok:.025,output_mtok:2}},{id:"gpt-5-nano",name:"GPT-5 nano",description:"GPT-5 Nano is OpenAI's fastest, cheapest version of GPT-5. It's great for summarization and classification tasks.",match:{or:[{equals:"gpt-5-nano"},{equals:"gpt-5-nano-2025-04-14"}]},context_window:4e5,prices:{input_mtok:.05,cache_read_mtok:.005,output_mtok:.4}},{id:"gpt35",match:{equals:"gpt35"},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt4-turbo-preview",match:{equals:"gpt4-turbo-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"mai-ds-r1:free",name:"MAI DS R1 (free)",description:"MAI-DS-R1 is a post-trained variant of DeepSeek-R1 developed by the Microsoft AI team to improve the model's responsiveness on previously blocked topics while enhancing its safety profile. Built on top of DeepSeek-R1's reasoning foundation, it integrates 110k examples from the Tulu-3 SFT dataset and 350k internally curated multilingual safety-alignment samples. The model retains strong reasoning, coding, and problem-solving capabilities, while unblocking a wide range of prompts previously restricted in R1.",match:{equals:"mai-ds-r1:free"},prices:{}},{id:"o1",match:{or:[{equals:"o1"},{equals:"o1-2024-12-17"},{equals:"o1-preview"},{equals:"o1-preview-2024-09-12"}]},prices:{input_mtok:15,cache_read_mtok:7.5,output_mtok:60}},{id:"o1-mini",match:{or:[{equals:"o1-mini"},{equals:"o1-mini-2024-09-12"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o3-2025-04-16",match:{or:[{equals:"o3"},{equals:"o3-2025-04-16"}]},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"o3-mini",match:{or:[{equals:"o3-mini"},{equals:"o3-mini-2025-01-31"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o4-mini",match:{or:[{contains:"o4-mini"},{contains:"o4-mini-2025-04-16"}]},prices:{input_mtok:1.1,cache_read_mtok:.28,output_mtok:4.4}},{id:"phi-3-medium-128k-instruct",name:"Phi-3 Medium 128K Instruct",description:"Phi-3 128K Medium is a powerful 14-billion parameter model designed for advanced language understanding, reasoning, and instruction following. Optimized through supervised fine-tuning and preference adjustments, it excels in tasks involving common sense, mathematics, logical reasoning, and code processing.",match:{equals:"phi-3-medium-128k-instruct"},prices:{input_mtok:1,output_mtok:1}},{id:"phi-3-mini-128k-instruct",name:"Phi-3 Mini 128K Instruct",description:"Phi-3 Mini is a powerful 3.8B parameter model designed for advanced language understanding, reasoning, and instruction following. Optimized through supervised fine-tuning and preference adjustments, it excels in tasks involving common sense, mathematics, logical reasoning, and code processing.",match:{equals:"phi-3-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"phi-3.5-mini-128k-instruct",name:"Phi-3.5 Mini 128K Instruct",description:"Phi-3.5 models are lightweight, state-of-the-art open models. These models were trained with Phi-3 datasets that include both synthetic data and the filtered, publicly available websites data, with a focus on high quality and reasoning-dense properties. Phi-3.5 Mini uses 3.8B parameters, and is a dense decoder-only transformer model using the same tokenizer as Phi-3 Mini.",match:{equals:"phi-3.5-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"phi-4",name:"Phi 4",description:"Microsoft Research Phi-4 is designed to perform well in complex reasoning tasks and can operate efficiently in situations with limited memory or where quick responses are needed.",match:{equals:"phi-4"},prices:{input_mtok:.07,output_mtok:.14}},{id:"phi-4-multimodal-instruct",name:"Phi 4 Multimodal Instruct",description:"Phi-4 Multimodal Instruct is a versatile 5.6B parameter foundation model that combines advanced reasoning and instruction-following capabilities across both text and visual inputs, providing accurate text outputs. The unified architecture enables efficient, low-latency inference, suitable for edge and mobile deployments. Phi-4 Multimodal Instruct supports text inputs in multiple languages including Arabic, Chinese, English, French, German, Japanese, Spanish, and more, with visual input optimized primarily for English. It delivers impressive performance on multimodal tasks involving mathematical, scientific, and document reasoning, providing developers and enterprises a powerful yet compact model for sophisticated interactive applications. For more information, see the Phi-4 Multimodal blog post.",match:{equals:"phi-4-multimodal-instruct"},prices:{input_mtok:.05,output_mtok:.1}},{id:"phi-4-reasoning-plus",name:"Phi 4 Reasoning Plus",description:"Phi-4-reasoning-plus is an enhanced 14B parameter model from Microsoft, fine-tuned from Phi-4 with additional reinforcement learning to boost accuracy on math, science, and code reasoning tasks. It uses the same dense decoder-only transformer architecture as Phi-4, but generates longer, more comprehensive outputs structured into a step-by-step reasoning trace and final answer.",match:{equals:"phi-4-reasoning-plus"},prices:{input_mtok:.07,output_mtok:.35}},{id:"phi-4-reasoning-plus:free",name:"Phi 4 Reasoning Plus (free)",description:"Phi-4-reasoning-plus is an enhanced 14B parameter model from Microsoft, fine-tuned from Phi-4 with additional reinforcement learning to boost accuracy on math, science, and code reasoning tasks. It uses the same dense decoder-only transformer architecture as Phi-4, but generates longer, more comprehensive outputs structured into a step-by-step reasoning trace and final answer.",match:{equals:"phi-4-reasoning-plus:free"},prices:{}},{id:"phi-4-reasoning:free",name:"Phi 4 Reasoning (free)",description:"Phi-4-reasoning is a 14B parameter dense decoder-only transformer developed by Microsoft, fine-tuned from Phi-4 to enhance complex reasoning capabilities. It uses a combination of supervised fine-tuning on chain-of-thought traces and reinforcement learning, targeting math, science, and code reasoning tasks. With a 32k context window and high inference efficiency, it is optimized for structured responses in a two-part format: reasoning trace followed by a final solution.",match:{equals:"phi-4-reasoning:free"},prices:{}},{id:"text-embedding-3-large",match:{equals:"text-embedding-3-large"},prices:{input_mtok:.13}},{id:"text-embedding-3-small",match:{equals:"text-embedding-3-small"},prices:{input_mtok:.02}},{id:"wizardlm-2-8x22b",name:"WizardLM-2 8x22B",description:"WizardLM-2 8x22B is Microsoft AI's most advanced Wizard model. It demonstrates highly competitive performance compared to leading proprietary models, and it consistently outperforms all existing state-of-the-art opensource models.",match:{equals:"wizardlm-2-8x22b"},prices:{input_mtok:.48,output_mtok:.48}}]},{id:"cerebras",name:"Cerebras",pricing_urls:["https://www.cerebras.ai/pricing#pricing","https://inference-docs.cerebras.ai/models/openai-oss"],api_pattern:"https://api\\.cerebras\\.ai",model_match:{contains:"cerebras"},provider_match:{contains:"cerebras"},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"gpt-oss-120b",name:"GPT-OSS 120B",description:"OpenAI's flagship open source model, built on a Mixture-of-Experts (MoE) architecture with 120 billion parameters and 128 experts. Delivers frontier reasoning capabilities with record-breaking inference speeds on Cerebras hardware (~3,000 tokens/second).",match:{or:[{equals:"gpt-oss-120b"},{starts_with:"cerebras/gpt-oss-120b"},{starts_with:"cerebras:gpt-oss-120b"}]},context_window:131072,price_comments:"Developer tier pricing. Free tier: 65k context, Paid tier: 131k context.",prices:{input_mtok:.35,output_mtok:.75}},{id:"llama-3.3-70b",name:"Llama 3.3 70B",description:"Meta's enhanced 70B model delivering 405B-level accuracy. Optimized for chat, coding, instruction following, mathematics, and reasoning with high-speed inference on Cerebras hardware (~2,100 tokens/second).",match:{or:[{equals:"llama-3.3-70b"},{starts_with:"cerebras/llama-3.3-70b"},{starts_with:"cerebras:llama-3.3-70b"}]},context_window:128e3,price_comments:"Developer tier pricing. Free tier: 65k context, Paid tier: 128k context.",prices:{input_mtok:.85,output_mtok:1.2}},{id:"llama3.1-8b",name:"Llama 3.1 8B",description:"Meta's Llama 3.1 8B model for general-purpose tasks including chat, coding, and instruction following. Optimized for fast inference on Cerebras hardware (~2,200 tokens/second).",match:{or:[{equals:"llama3.1-8b"},{starts_with:"cerebras/llama3.1-8b"},{starts_with:"cerebras:llama3.1-8b"}]},context_window:32768,price_comments:"Developer tier pricing. Free tier: 8k context, Paid tier: 32k context.",prices:{input_mtok:.1,output_mtok:.1}},{id:"qwen-3-32b",name:"Qwen 3 32B",description:"Qwen's 32B parameter model with enhanced reasoning and coding capabilities. Supports both standard and reasoning modes for complex tasks, with fast inference speeds on Cerebras hardware (~2,600 tokens/second).",match:{or:[{equals:"qwen-3-32b"},{starts_with:"cerebras/qwen-3-32b"},{starts_with:"cerebras:qwen-3-32b"}]},context_window:131072,price_comments:"Developer tier pricing. Free tier: 65k context, Paid tier: 131k context.",prices:{input_mtok:.4,output_mtok:.8}}]},{id:"cohere",name:"Cohere",pricing_urls:["https://cohere.com/pricing"],api_pattern:"https://api\\.cohere\\.ai",model_match:{starts_with:"command-"},provider_match:{contains:"cohere"},extractors:[{api_flavor:"default",root:["usage","billed_units"],model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:"output_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"command",name:"Command",description:"Command is an instruction-following conversational model that performs language tasks with high quality, more reliably and with a longer context than our base generative models.",match:{equals:"command"},prices:{input_mtok:1,output_mtok:2}},{id:"command-a",name:"Command A",description:`Command A is an open-weights 111B parameter model with a 256k context window focused on delivering great performance across agentic, multilingual, and coding use cases.
|
|
3
3
|
Compared to other leading proprietary and open-weights models Command A delivers maximum performance with minimum hardware costs, excelling on business-critical agentic and multilingual tasks.`,match:{starts_with:"command-a"},prices:{input_mtok:2.5,output_mtok:10}},{id:"command-r",name:"Command R",description:"Command-R is a 35B parameter model that performs conversational language tasks at a higher quality, more reliably, and with a longer context than previous models. It can be used for complex workflows like code generation, retrieval augmented generation (RAG), tool use, and agents.",match:{or:[{equals:"command-r"},{equals:"command-r-08-2024"}]},prices:{input_mtok:.15,output_mtok:.6}},{id:"command-r-plus",name:"Command R+",description:"Command R+ is a new, 104B-parameter LLM from Cohere. It's useful for roleplay, general consumer usecases, and Retrieval Augmented Generation (RAG).",match:{or:[{equals:"command-r-plus"},{equals:"command-r-plus-08-2024"}]},prices:{input_mtok:2.5,output_mtok:10}},{id:"command-r7b",name:"Command R7B",description:"Command R7B (12-2024) is a small, fast update of the Command R+ model, delivered in December 2024. It excels at RAG, tool use, agents, and similar tasks requiring complex reasoning and multiple steps.",match:{or:[{equals:"command-r7b"},{equals:"command-r7b-12-2024"}]},prices:{input_mtok:.0375,output_mtok:.15}}]},{id:"deepseek",name:"Deepseek",pricing_urls:["https://api-docs.deepseek.com/quick_start/pricing"],api_pattern:"https://api\\.deepseek\\.com",price_comments:'Deepseek off-peak pricing applies "UTC 16:30-00:30" so we switch it around and use the off-peak pricing as the default (first) price then the second price with a constraint is the "standard" pricing that applies "UTC 00:30-16:30".',model_match:{contains:"deepseek"},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"deepseek-chat",name:"DeepSeek Chat",description:"DeepSeek-V3 is the latest model from the DeepSeek team, building upon the instruction following and coding abilities of the previous versions. Pre-trained on nearly 15 trillion tokens, the reported evaluations reveal that the model outperforms other open-source models and rivals leading closed-source models.",match:{or:[{starts_with:"deepseek-chat"},{equals:"deepseek-chat-v3-0324"}]},context_window:64e3,prices:[{prices:{input_mtok:.135,cache_read_mtok:.035,output_mtok:.55}},{constraint:{start_time:"00:30:00Z",end_time:"16:30:00Z",type:"time_of_date"},prices:{input_mtok:.27,cache_read_mtok:.07,output_mtok:1.1}}]},{id:"deepseek-reasoner",name:"Deepseek R1",description:"DeepSeek R1 is here: Performance on par with OpenAI o1, but open-sourced and with fully open reasoning tokens. It's 671B parameters in size, with 37B active in an inference pass.",match:{or:[{equals:"deepseek-reasoner"},{starts_with:"deepseek-r1"},{equals:"deepseek-r1-0528"}]},context_window:64e3,prices:[{prices:{input_mtok:.135,cache_read_mtok:.035,output_mtok:.55}},{constraint:{start_time:"00:30:00Z",end_time:"16:30:00Z",type:"time_of_date"},prices:{input_mtok:.55,cache_read_mtok:.14,output_mtok:2.19}}]}]},{id:"fireworks",name:"Fireworks",pricing_urls:["https://fireworks.ai/pricing"],api_pattern:"https://api\\.fireworks\\.ai",model_match:{starts_with:"accounts/fireworks/models/"},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"deepseek-r1-0528",name:"DeepSeek R1 0528",description:"The updated DeepSeek-R1-0528 model delivers major improvements in reasoning, inference, and accuracy through enhanced post-training optimization and greater computational resources. It now performs at a level approaching top-tier models like O3 and Gemini 2.5 Pro, with notable gains in complex tasks such as math and programming.",match:{equals:"accounts/fireworks/models/deepseek-r1-0528"},context_window:16e4,prices:{input_mtok:3,output_mtok:8}},{id:"deepseek-v3-0324",name:"Deepseek V3 03-24",description:"A strong Mixture-of-Experts (MoE) language model with 671B total parameters with 37B activated for each token from Deepseek. Updated checkpoint.",match:{equals:"accounts/fireworks/models/deepseek-v3-0324"},context_window:16e4,price_comments:`docs give just one price - "Pricing Per 1M Tokens", we assume that's input and output`,prices:{input_mtok:.9,output_mtok:.9}},{id:"gemma-3-27b-it",name:"Gemma 3 27B Instruct",match:{equals:"accounts/fireworks/models/gemma-3-27b-it"},context_window:131e3,price_comments:`docs give just one price - "Pricing Per 1M Tokens", we assume that's input and output`,prices:{input_mtok:.1,output_mtok:.1}},{id:"llama-v3p1-8b-instruct",name:"Llama 3.1 8B Instruct",description:"The Meta Llama 3.1 collection of multilingual large language models (LLMs) is a collection of pretrained and instruction tuned generative models in 8B, 70B and 405B sizes. The Llama 3.1 instruction tuned text only models (8B, 70B, 405B) are optimized for multilingual dialogue use cases and outperform many of the available open source and closed chat models on common industry benchmarks.",match:{equals:"accounts/fireworks/models/llama-v3p1-8b-instruct"},context_window:131e3,price_comments:`docs give just one price - "Pricing Per 1M Tokens", we assume that's input and output`,prices:{input_mtok:.2,output_mtok:.2}},{id:"llama4-maverick-instruct-basic",name:"Llama 4 Maverick Instruct (Basic)",description:"The Meta Llama 3.1 collection of multilingual large language models (LLMs) is a collection of pretrained and instruction tuned generative models in 8B, 70B and 405B sizes. The Llama 3.1 instruction tuned text only models (8B, 70B, 405B) are optimized for multilingual dialogue use cases and outperform many of the available open source and closed chat models on common industry benchmarks.",match:{equals:"accounts/fireworks/models/llama4-maverick-instruct-basic"},context_window:1e6,prices:{input_mtok:.22,output_mtok:.88}},{id:"qwen2p5-vl-72b-instruct",name:"Qwen2.5-VL 72B Instruct",description:"Latest Qwen's VLM model",match:{equals:"accounts/fireworks/models/qwen2p5-vl-72b-instruct"},context_window:128e3,price_comments:`docs give just one price - "Pricing Per 1M Tokens", we assume that's input and output`,prices:{input_mtok:.9,output_mtok:.9}},{id:"qwen3-235b-a22b",name:"Qwen3 235B-A22B",description:'Qwen3 is the latest evolution in the Qwen LLM series, featuring both dense and MoE models with major advancements in reasoning, agent capabilities, multilingual support, and instruction following. It uniquely allows seamless switching between "thinking" (for complex logic, math, coding) and "non-thinking" modes (for fast, general dialogue), delivering strong performance across tasks.',match:{equals:"accounts/fireworks/models/qwen3-235b-a22b"},context_window:128e3,prices:{input_mtok:.22,output_mtok:.88}}]},{id:"google",name:"Google",pricing_urls:["https://ai.google.dev/gemini-api/docs/pricing","https://cloud.google.com/vertex-ai/generative-ai/pricing"],api_pattern:"https://(.*\\.)?googleapis\\.com",model_match:{contains:"gemini"},provider_match:{or:[{contains:"google"},{contains:"vertex"},{contains:"gemini"}]},extractors:[{api_flavor:"default",root:"usageMetadata",model_path:"modelVersion",mappings:[{path:"promptTokenCount",dest:"input_tokens",required:!1},{path:"cachedContentTokenCount",dest:"cache_read_tokens",required:!1},{path:["cacheTokensDetails",{type:"array-match",field:"modality",match:{equals:"AUDIO"}},"tokenCount"],dest:"cache_audio_read_tokens",required:!1},{path:["promptTokensDetails",{type:"array-match",field:"modality",match:{equals:"AUDIO"}},"tokenCount"],dest:"input_audio_tokens",required:!1},{path:["candidatesTokensDetails",{type:"array-match",field:"modality",match:{equals:"AUDIO"}},"tokenCount"],dest:"output_audio_tokens",required:!1},{path:"candidatesTokenCount",dest:"output_tokens",required:!1},{path:"thoughtsTokenCount",dest:"output_tokens",required:!1},{path:"toolUsePromptTokenCount",dest:"output_tokens",required:!1}]},{api_flavor:"anthropic",root:"usage",model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:"cache_creation_input_tokens",dest:"input_tokens",required:!1},{path:"cache_read_input_tokens",dest:"input_tokens",required:!1},{path:"cache_creation_input_tokens",dest:"cache_write_tokens",required:!1},{path:"cache_read_input_tokens",dest:"cache_read_tokens",required:!1},{path:"output_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"claude-3-5-haiku",match:{contains:"claude-3-5-haiku"},context_window:2e5,prices:{input_mtok:.8,cache_write_mtok:1,cache_read_mtok:.08,output_mtok:4}},{id:"claude-3-5-sonnet",match:{contains:"claude-3-5-sonnet"},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3-7-sonnet",match:{contains:"claude-3-7-sonnet"},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3-haiku",match:{contains:"claude-3-haiku"},context_window:2e5,prices:{input_mtok:.25,cache_write_mtok:.3,cache_read_mtok:.03,output_mtok:1.25}},{id:"claude-3-opus",match:{contains:"claude-3-opus"},prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-4-opus",match:{or:[{contains:"claude-4-opus"},{contains:"claude-opus-4"}]},context_window:2e5,prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-4-sonnet",match:{or:[{contains:"claude-4-sonnet"},{contains:"claude-sonnet-4"}]},context_window:2e5,prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"gemini-1.0-pro-vision-001",name:"gemini 1.0 pro vision",description:"Google's first-generation advanced multimodal model that can understand text, code, and images. It provides strong reasoning capabilities and follows instructions effectively.",match:{equals:"gemini-1.0-pro-vision-001"},context_window:32768,price_comments:"I can't find anything about this model or it's pricing, so trusting the original source",prices:{input_mtok:.125,output_mtok:.375}},{id:"gemini-1.5-flash",name:"gemini 1.5 flash",description:"A faster, more cost-effective variant of Gemini 1.5 that maintains strong capabilities while optimizing for performance and cost efficiency. Suitable for production deployments requiring high throughput.",match:{contains:"gemini-1.5-flash"},context_window:1e6,prices:{input_mtok:{base:.075,tiers:[{start:128e3,price:.15}]},cache_read_mtok:{base:.01875,tiers:[{start:128e3,price:.0375}]},output_mtok:{base:.3,tiers:[{start:128e3,price:.6}]}}},{id:"gemini-1.5-pro",name:"gemini 1.5 Pro",description:"Google's most capable multimodal model with an extremely long context window of up to 1 million tokens. It excels at complex reasoning, long-form content processing, and multimodal understanding.",match:{contains:"gemini-1.5-pro"},context_window:1e6,prices:{input_mtok:{base:1.25,tiers:[{start:128e3,price:2.5}]},output_mtok:{base:5,tiers:[{start:128e3,price:10}]}}},{id:"gemini-2.0-flash",name:"gemini 2.0 flash",description:"The newest generation of Google's Gemini models, featuring improved reasoning, instruction following, and factual accuracy, with the Flash variant optimized for cost-efficiency and performance.",match:{or:[{contains:"gemini-2.0-flash"},{equals:"gemini-2.0-flash-lite-001"},{equals:"gemini-2.0-flash-001"},{equals:"gemini-2.0-flash-exp:free"}]},context_window:1e6,prices:{input_mtok:.1,cache_read_mtok:{base:.025,tiers:[{start:1e6,price:.175}]},output_mtok:.4,input_audio_mtok:.7}},{id:"gemini-2.0-flash-lite",name:"gemini 2.0 flash lite",description:"A lighter, more cost-effective version of Gemini 2.0 Flash, designed for applications requiring high efficiency while maintaining good performance. Ideal for high-volume, cost-sensitive deployments.",match:{contains:"gemini-2.0-flash-lite"},context_window:1e6,prices:{input_mtok:.075,output_mtok:.3}},{id:"gemini-2.5-flash",name:"Gemini 2.5 Flash",description:`Gemini 2.5 Flash is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks. It includes built-in "thinking" capabilities, enabling it to provide responses with greater accuracy and nuanced context handling.`,match:{or:[{equals:"gemini-2.5-flash"},{equals:"gemini-2.5-flash-latest"},{equals:"gemini-2.5-flash-preview-09-2025"}]},prices:{input_mtok:.3,cache_read_mtok:.03,output_mtok:2.5,input_audio_mtok:1,cache_audio_read_mtok:.1}},{id:"gemini-2.5-flash-image",name:"Gemini 2.5 Flash Image",description:"Google's specialized image generation model optimized for fast, high-quality image generation. Outputs images at 1024x1024 resolution, with each image consuming 1290 output tokens.",match:{or:[{equals:"gemini-2.5-flash-image"},{equals:"gemini-2.5-flash-image-preview"}]},context_window:1e6,price_comments:"See https://ai.google.dev/gemini-api/docs/pricing#gemini-2.5-flash-image. Image output is priced at $30 per 1M tokens, with each 1024x1024 image = 1290 tokens = $0.039/image. Cache pricing is not available for this model.",prices:{input_mtok:.3,output_mtok:30}},{id:"gemini-2.5-flash-lite",name:"Gemini 2.5 Flash Lite",description:'Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency. It offers improved throughput, faster token generation, and better performance across common benchmarks compared to earlier Flash models. By default, "thinking" (i.e. multi-pass reasoning) is disabled to prioritize speed, but developers can enable it via the Reasoning API parameter to selectively trade off cost for intelligence.',match:{or:[{equals:"gemini-2.5-flash-lite"},{starts_with:"gemini-2.5-flash-lite-preview"}]},context_window:1e6,prices:{input_mtok:.1,cache_read_mtok:.01,output_mtok:.4,input_audio_mtok:.3,cache_audio_read_mtok:.03}},{id:"gemini-2.5-flash-preview",name:"Gemini 2.5 Flash Preview 05-20",description:`Gemini 2.5 Flash May 20th Checkpoint is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks. It includes built-in "thinking" capabilities, enabling it to provide responses with greater accuracy and nuanced context handling.`,match:{or:[{contains:"gemini-2.5-flash-preview-05-20"},{contains:"gemini-2.5-flash-preview-04-17"},{equals:"gemini-2.5-flash-preview-05-20:thinking"},{equals:"gemini-2.5-flash-preview"},{equals:"gemini-2.5-flash-preview:thinking"}]},price_comments:"from https://cloud.google.com/vertex-ai/generative-ai/pricing should be retired 2025-07-15",prices:{input_mtok:.15,output_mtok:.6}},{id:"gemini-2.5-pro",name:"Gemini 2.5 Pro",description:`Gemini 2.5 Pro is Google's state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs "thinking" capabilities, enabling it to reason through responses with enhanced accuracy and nuanced context handling. Gemini 2.5 Pro achieves top-tier performance on multiple benchmarks, including first-place positioning on the LMArena leaderboard, reflecting superior human-preference alignment and complex problem-solving abilities.`,match:{starts_with:"gemini-2.5-pro"},price_comments:"See https://ai.google.dev/gemini-api/docs/pricing#gemini-2.5-pro",prices:{input_mtok:{base:1.25,tiers:[{start:2e5,price:2.5}]},cache_read_mtok:{base:.125,tiers:[{start:2e5,price:.25}]},output_mtok:{base:10,tiers:[{start:2e5,price:15}]}}},{id:"gemini-3-pro-preview",name:"Gemini 3 Pro Preview",description:"The best model in the world for multimodal understanding, and our most powerful agentic and vibe-coding model yet.",match:{starts_with:"gemini-3-pro-preview"},prices:{input_mtok:{base:2,tiers:[{start:2e5,price:4}]},cache_read_mtok:{base:.2,tiers:[{start:2e5,price:.4}]},output_mtok:{base:12,tiers:[{start:2e5,price:18}]}}},{id:"gemini-embedding-001",match:{equals:"gemini-embedding-001"},prices:{input_mtok:.15}},{id:"gemini-flash-1.5",name:"Gemini 1.5 Flash",description:"Gemini 1.5 Flash is a foundation model that performs well at a variety of multimodal tasks such as visual understanding, classification, summarization, and creating content from image, audio and video. It's adept at processing visual and text inputs such as photographs, documents, infographics, and screenshots.",match:{equals:"gemini-flash-1.5"},price_comments:"See https://ai.google.dev/gemini-api/docs/pricing#gemini-1.5-flash",prices:{input_mtok:{base:.075,tiers:[{start:128e3,price:.15}]},cache_read_mtok:{base:.01875,tiers:[{start:128e3,price:.0375}]},output_mtok:{base:.3,tiers:[{start:128e3,price:.6}]}}},{id:"gemini-flash-1.5-8b",name:"gemini 1.5 flash",description:"A faster, more cost-effective variant of Gemini 1.5 that maintains strong capabilities while optimizing for performance and cost efficiency. Suitable for production deployments requiring high throughput.",match:{equals:"gemini-flash-1.5-8b"},context_window:1e6,price_comments:"See https://ai.google.dev/gemini-api/docs/pricing#gemini-1.5-flash-8b",prices:{input_mtok:{base:.0375,tiers:[{start:128e3,price:.075}]},cache_read_mtok:{base:.01,tiers:[{start:128e3,price:.02}]},output_mtok:{base:.15,tiers:[{start:128e3,price:.3}]}}},{id:"gemini-live-2.5-flash-preview",match:{or:[{starts_with:"gemini-live-2.5-flash-preview"},{starts_with:"gemini-2.5-flash-native-audio-preview"}]},prices:{input_mtok:.5,output_mtok:2,input_audio_mtok:3,output_audio_mtok:12}},{id:"gemini-pro",name:"gemini 1.0 pro",description:"Google's first-generation advanced multimodal model that can understand text, code, and images. It provides strong reasoning capabilities and follows instructions effectively.",match:{or:[{equals:"gemini-pro"},{equals:"gemini-1.0-pro"}]},context_window:32768,price_comments:"I can't find anything so trusting these prices, not sure the model still exists",prices:{input_mtok:.125,output_mtok:.375}},{id:"gemini-pro-1.5",name:"Gemini 1.5 Pro",description:"Google's latest multimodal model, supports image and video[0] in text or chat prompts.",match:{equals:"gemini-pro-1.5"},context_window:2e6,price_comments:"See https://ai.google.dev/gemini-api/docs/pricing#gemini-1.5-pro",prices:{input_mtok:{base:1.25,tiers:[{start:128e3,price:2.5}]},cache_read_mtok:{base:.3125,tiers:[{start:128e3,price:.625}]},output_mtok:{base:5,tiers:[{start:128e3,price:10}]}}},{id:"gemma-3",name:"Gemma 3 (free)",description:"Lightweight, state-of the art, open model built from the same technology that powers our Gemini models.",match:{or:[{starts_with:"gemma-3-"},{equals:"gemma-3"}]},prices:{}},{id:"gemma-3n",name:"Gemma 3n (free)",description:"Our open model built for efficient performance on everyday devices like mobile phones, laptops, and tablets.",match:{or:[{starts_with:"gemma-3n"}]},prices:{}}]},{id:"groq",name:"Groq",pricing_urls:["https://groq.com/pricing/"],api_pattern:"https://api\\.groq\\.com",extractors:[{api_flavor:"default",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"deepseek-r1-distill-llama-70b",name:"DeepSeek R1 Distill Llama 70B",match:{equals:"deepseek-r1-distill-llama-70b"},context_window:131072,prices:{input_mtok:.75,output_mtok:.99}},{id:"gemma-7b-it",match:{equals:"gemma-7b-it"},prices:{input_mtok:.07,output_mtok:.07}},{id:"gemma2-9b-it",name:"Gemma 2 9B 8k",match:{or:[{equals:"gemma2-9b-it"},{equals:"gemma2-9b"}]},prices:{input_mtok:.2,output_mtok:.2}},{id:"llama-3.1-405b-reasoning",match:{equals:"llama-3.1-405b-reasoning"},prices:{input_mtok:.59,output_mtok:.79}},{id:"llama-3.1-70b-versatile",match:{equals:"llama-3.1-70b-versatile"},prices:{input_mtok:.59,output_mtok:.79}},{id:"llama-3.1-8b-instant",name:"Llama 3.1 8B Instant 128k",match:{equals:"llama-3.1-8b-instant"},prices:{input_mtok:.05,output_mtok:.08}},{id:"llama-3.2-11b-text-preview",match:{equals:"llama-3.2-11b-text-preview"},prices:{input_mtok:.18,output_mtok:.18}},{id:"llama-3.2-11b-vision-preview",match:{equals:"llama-3.2-11b-vision-preview"},prices:{input_mtok:.18,output_mtok:.18}},{id:"llama-3.2-1b-preview",match:{equals:"llama-3.2-1b-preview"},prices:{input_mtok:.04,output_mtok:.04}},{id:"llama-3.2-3b-preview",match:{equals:"llama-3.2-3b-preview"},prices:{input_mtok:.06,output_mtok:.06}},{id:"llama-3.2-90b-text-preview",match:{equals:"llama-3.2-90b-text-preview"},prices:{input_mtok:.9,output_mtok:.9}},{id:"llama-3.2-90b-vision-preview",match:{equals:"llama-3.2-90b-vision-preview"},prices:{input_mtok:.9,output_mtok:.9}},{id:"llama-3.3-70b-specdec",match:{equals:"llama-3.3-70b-specdec"},prices:{input_mtok:.59,output_mtok:.99}},{id:"llama-3.3-70b-versatile",name:"Llama 3.3 70B Versatile 128k",match:{equals:"llama-3.3-70b-versatile"},prices:{input_mtok:.59,output_mtok:.79}},{id:"llama-guard-3-8b",match:{equals:"llama-guard-3-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"llama2-70b-4096",match:{equals:"llama2-70b-4096"},prices:{input_mtok:.7,output_mtok:.8}},{id:"llama3-70b-8192",match:{equals:"llama3-70b-8192"},prices:{input_mtok:.59,output_mtok:.79}},{id:"llama3-8b-8192",match:{equals:"llama3-8b-8192"},prices:{input_mtok:.05,output_mtok:.08}},{id:"llama3-groq-70b-8192-tool-use-preview",match:{equals:"llama3-groq-70b-8192-tool-use-preview"},prices:{input_mtok:.89,output_mtok:.89}},{id:"llama3-groq-8b-8192-tool-use-preview",match:{equals:"llama3-groq-8b-8192-tool-use-preview"},prices:{input_mtok:.19,output_mtok:.19}},{id:"meta-llama/llama-4-maverick-17b-128e-instruct",name:"Llama 4 Maverick 17B 128E",match:{equals:"meta-llama/llama-4-maverick-17b-128e-instruct"},context_window:131072,prices:{input_mtok:.2,output_mtok:.6}},{id:"meta-llama/llama-4-scout-17b-16e-instruct",name:"Llama 4 Scout (17Bx16E) 128k",match:{equals:"meta-llama/llama-4-scout-17b-16e-instruct"},prices:{input_mtok:.11,output_mtok:.34}},{id:"meta-llama/llama-guard-4-12b",name:"Llama Guard 4 12B",match:{equals:"meta-llama/llama-guard-4-12b"},context_window:131072,prices:{input_mtok:.2,output_mtok:.2}},{id:"mistral-saba-24b",match:{equals:"mistral-saba-24b"},prices:{input_mtok:.79,output_mtok:.79}},{id:"mixtral-8x7b-32768",match:{equals:"mixtral-8x7b-32768"},prices:{input_mtok:.24,output_mtok:.24}},{id:"moonshotai/kimi-k2-instruct",name:"Kimi K2 1T 128k",match:{or:[{equals:"moonshotai/kimi-k2-instruct"},{equals:"moonshotai/kimi-k2-instruct-0905"}]},context_window:131072,prices:{input_mtok:1,cache_read_mtok:.5,output_mtok:3}},{id:"openai/gpt-oss-120b",description:`GPT-OSS 120B is OpenAI's flagship open source model, built on a Mixture-of-Experts (MoE) architecture with
|
|
4
4
|
120 billion parameters and 128 experts.
|
|
5
5
|
`,match:{or:[{equals:"openai/gpt-oss-120b"},{equals:"openai/gpt-oss-safeguard-20b"}]},context_window:131072,prices:{input_mtok:.15,cache_read_mtok:.075,output_mtok:.6}},{id:"openai/gpt-oss-20b",description:`GPT-OSS 20B is OpenAI's flagship open source model, built on a Mixture-of-Experts (MoE) architecture with
|
|
6
6
|
20 billion parameters and 32 experts.
|
|
7
|
-
`,match:{equals:"openai/gpt-oss-20b"},context_window:131072,prices:{input_mtok:.075,cache_read_mtok:.0375,output_mtok:.3}},{id:"qwen/qwen3-32b",name:"Qwen3 32B 131k",match:{equals:"qwen/qwen3-32b"},prices:{input_mtok:.29,output_mtok:.59}}]},{id:"mistral",name:"Mistral",pricing_urls:["https://mistral.ai/pricing#api-pricing"],api_pattern:"https://api\\.mistral\\.ai",model_match:{regex:"(?:mi|code|dev|magi|mini)stral"},provider_match:{starts_with:"mistral"},extractors:[{api_flavor:"default",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"codestral",name:"Codestral",description:"Mistral's cutting-edge language model for coding. Codestral specializes in low-latency, high-frequency tasks such as fill-in-the-middle (FIM), code correction and test generation.",match:{or:[{equals:"codestral-latest"},{equals:"codestral-2501"}]},prices:{input_mtok:.3,output_mtok:.9}},{id:"devstral-small",name:"Devstral Small",description:"Devstral-Small-2505 is a 24B parameter agentic LLM fine-tuned from Mistral-Small-3.1, jointly developed by Mistral AI and All Hands AI for advanced software engineering tasks. It is optimized for codebase exploration, multi-file editing, and integration into coding agents, achieving state-of-the-art results on SWE-Bench Verified (46.8%).",match:{equals:"devstral-small"},prices:{input_mtok:.06,output_mtok:.12}},{id:"devstral-small:free",name:"Devstral Small (free)",description:"Devstral-Small-2505 is a 24B parameter agentic LLM fine-tuned from Mistral-Small-3.1, jointly developed by Mistral AI and All Hands AI for advanced software engineering tasks. It is optimized for codebase exploration, multi-file editing, and integration into coding agents, achieving state-of-the-art results on SWE-Bench Verified (46.8%).",match:{equals:"devstral-small:free"},prices:{}},{id:"magistral-medium",name:"Magistral Medium",description:"Magistral is Mistral's first reasoning model. It is ideal for general purpose use requiring longer thought processing and better accuracy than with non-reasoning LLMs. From legal research and financial forecasting to software development and creative storytelling — this model solves multi-step challenges where transparency and precision are critical.",match:{or:[{starts_with:"magistral-medium"}]},prices:{input_mtok:2,output_mtok:5}},{id:"magistral-small",name:"Magistral Small",description:"Magistral Small is a 24B parameter instruction-tuned model based on Mistral-Small-3.1 (2503), enhanced through supervised fine-tuning on traces from Magistral Medium and further refined via reinforcement learning. It is optimized for reasoning and supports a wide multilingual range, including over 20 languages.",match:{starts_with:"magistral-small-"},prices:{input_mtok:.5,output_mtok:1.5}},{id:"ministral-3b",name:"Ministral 3B",description:"Ministral 3B is a 3B parameter model optimized for on-device and edge computing. It excels in knowledge, commonsense reasoning, and function-calling, outperforming larger models like Mistral 7B on most benchmarks. Supporting up to 128k context length, it's ideal for orchestrating agentic workflows and specialist tasks with efficient inference.",match:{equals:"ministral-3b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"ministral-8b",name:"Ministral 8B 24.10",description:"Ministral 8B is an 8B parameter model featuring a unique interleaved sliding-window attention pattern for faster, memory-efficient inference. Designed for edge use cases, it supports up to 128k context length and excels in knowledge and reasoning tasks. It outperforms peers in the sub-10B category, making it perfect for low-latency, privacy-first applications.",match:{starts_with:"ministral-8b"},prices:{input_mtok:.1,output_mtok:1}},{id:"mistral-7b",name:"Mistral 7B",match:{or:[{equals:"mistral-7b"},{equals:"open-mistral-7b"}]},prices:{input_mtok:.25,output_mtok:.25}},{id:"mistral-embed",match:{equals:"mistral-embed"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistral-large",name:"Mistral Large",description:"This is Mistral AI's flagship model, Mistral Large 2 (version `mistral-large-2407`). It's a proprietary weights-available model and excels at reasoning, code, JSON, chat, and more. Read the launch announcement here.",match:{or:[{equals:"mistral-large"},{equals:"mistral-large-latest"},{equals:"mistral-large-2407"},{equals:"mistral-large-2411"}]},prices:{input_mtok:2,output_mtok:6}},{id:"mistral-medium-3",name:"Mistral Medium 3",description:"Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost. It balances state-of-the-art reasoning and multimodal performance with 8× lower cost compared to traditional large models, making it suitable for scalable deployments across professional and industrial use cases.",match:{starts_with:"mistral-medium"},prices:{input_mtok:.4,output_mtok:2}},{id:"mistral-nemo",name:"Mistral NeMo",description:"A 12B parameter model with a 128k token context length built by Mistral in collaboration with NVIDIA.",match:{or:[{equals:"mistral-nemo"},{equals:"open-mistral-nemo"}]},prices:{input_mtok:.15,output_mtok:.15}},{id:"mistral-nemo:free",name:"Mistral Nemo (free)",description:"A 12B parameter model with a 128k token context length built by Mistral in collaboration with NVIDIA.",match:{equals:"mistral-nemo:free"},prices:{}},{id:"mistral-saba",name:"Mistral Saba",description:"Mistral Saba is a 24B-parameter language model specifically designed for the Middle East and South Asia, delivering accurate and contextually relevant responses while maintaining efficient performance. Trained on curated regional datasets, it supports multiple Indian-origin languages—including Tamil and Malayalam—alongside Arabic. This makes it a versatile option for a range of regional and multilingual applications. Read more at the blog post here",match:{or:[{equals:"mistral-saba"},{equals:"mistral-saba-latest"}]},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistral-small",name:"Mistral Small",description:"With 22 billion parameters, Mistral Small v24.09 offers a convenient mid-point between (Mistral NeMo 12B)[/mistralai/mistral-nemo] and (Mistral Large 2)[/mistralai/mistral-large], providing a cost-effective solution that can be deployed across various platforms and environments. It has better reasoning, exhibits more capabilities, can produce and reason about code, and is multiligual, supporting English, French, German, Italian, and Spanish.",match:{starts_with:"mistral-small"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistral-small-24b-instruct-2501",name:"Mistral Small 3",description:"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks. Released under the Apache 2.0 license, it features both pre-trained and instruction-tuned versions designed for efficient local deployment.",match:{equals:"mistral-small-24b-instruct-2501"},price_comments:"Can't find pricing on this model, so just trusting open router",prices:{input_mtok:.05,output_mtok:.08}},{id:"mistral-small-24b-instruct-2501:free",name:"Mistral Small 3 (free)",description:"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks. Released under the Apache 2.0 license, it features both pre-trained and instruction-tuned versions designed for efficient local deployment.",match:{equals:"mistral-small-24b-instruct-2501:free"},prices:{}},{id:"mistral-small-latest",name:"Mistral Small 3.2",description:"SOTA. Multimodal. Multilingual. Apache 2.0.",match:{equals:"mistral-small-latest"},prices:{input_mtok:.1,output_mtok:.3}},{id:"mistral-tiny",name:"Mistral Tiny",description:"Note: This model is being deprecated. Recommended replacement is the newer Ministral 8B",match:{equals:"mistral-tiny"},prices:{input_mtok:.25,output_mtok:.25}},{id:"mixtral-8x22b-instruct",name:"Mixtral 8x22B Instruct",description:`Mistral's official instruct fine-tuned version of Mixtral 8x22B. It uses 39B active parameters out of 141B, offering unparalleled cost efficiency for its size. Its strengths include:
|
|
7
|
+
`,match:{equals:"openai/gpt-oss-20b"},context_window:131072,prices:{input_mtok:.075,cache_read_mtok:.0375,output_mtok:.3}},{id:"qwen/qwen3-32b",name:"Qwen3 32B 131k",match:{equals:"qwen/qwen3-32b"},prices:{input_mtok:.29,output_mtok:.59}}]},{id:"huggingface_cerebras",name:"HuggingFace (cerebras)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/cerebras",provider_match:{and:[{contains:"huggingface"},{contains:"cerebras"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"Qwen/Qwen3-235B-A22B-Instruct-2507",name:"Qwen3-235B-A22B-Instruct-2507",match:{equals:"Qwen/Qwen3-235B-A22B-Instruct-2507"},prices:{input_mtok:.6,output_mtok:1.2}},{id:"Qwen/Qwen3-32B",name:"Qwen3-32B",match:{equals:"Qwen/Qwen3-32B"},prices:{input_mtok:.4,output_mtok:.8}},{id:"meta-llama/Llama-3.1-8B-Instruct",name:"Llama-3.1-8B-Instruct",match:{equals:"meta-llama/Llama-3.1-8B-Instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"meta-llama/Llama-3.3-70B-Instruct",name:"Llama-3.3-70B-Instruct",match:{equals:"meta-llama/Llama-3.3-70B-Instruct"},prices:{input_mtok:.85,output_mtok:1.2}},{id:"openai/gpt-oss-120b",name:"gpt-oss-120b",match:{equals:"openai/gpt-oss-120b"},prices:{input_mtok:.25,output_mtok:.69}}]},{id:"huggingface_fireworks-ai",name:"HuggingFace (fireworks-ai)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/fireworks-ai",provider_match:{and:[{contains:"huggingface"},{contains:"fireworks-ai"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"Qwen/Qwen2.5-VL-32B-Instruct",name:"Qwen2.5-VL-32B-Instruct",match:{equals:"Qwen/Qwen2.5-VL-32B-Instruct"},context_window:128e3,prices:{input_mtok:.22,output_mtok:.88}},{id:"Qwen/Qwen3-235B-A22B",name:"Qwen3-235B-A22B",match:{or:[{equals:"Qwen/Qwen3-235B-A22B"},{equals:"Qwen/Qwen3-235B-A22B-Instruct-2507"}]},context_window:131072,prices:{input_mtok:.22,output_mtok:.88}},{id:"Qwen/Qwen3-30B-A3B",name:"Qwen3-30B-A3B",match:{equals:"Qwen/Qwen3-30B-A3B"},context_window:131072,prices:{input_mtok:.15,output_mtok:.6}},{id:"Qwen/Qwen3-Coder-480B-A35B-Instruct",name:"Qwen3-Coder-480B-A35B-Instruct",match:{equals:"Qwen/Qwen3-Coder-480B-A35B-Instruct"},context_window:262144,prices:{input_mtok:.45,output_mtok:1.8}},{id:"SentientAGI/Dobby-Unhinged-Llama-3.3-70B",name:"Dobby-Unhinged-Llama-3.3-70B",match:{equals:"SentientAGI/Dobby-Unhinged-Llama-3.3-70B"},context_window:131072,prices:{input_mtok:.9,output_mtok:.9}},{id:"deepseek-ai/DeepSeek-R1-0528",name:"DeepSeek-R1-0528",match:{equals:"deepseek-ai/DeepSeek-R1-0528"},context_window:163840,prices:{input_mtok:3,output_mtok:8}},{id:"deepseek-ai/DeepSeek-V3-0324",name:"DeepSeek-V3-0324",match:{equals:"deepseek-ai/DeepSeek-V3-0324"},context_window:163840,prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/Llama-3.1-405B-Instruct",name:"Llama-3.1-405B-Instruct",match:{equals:"meta-llama/Llama-3.1-405B-Instruct"},context_window:131072,prices:{input_mtok:3,output_mtok:3}},{id:"meta-llama/Llama-3.1-70B-Instruct",name:"Llama-3.1-70B-Instruct",match:{equals:"meta-llama/Llama-3.1-70B-Instruct"},context_window:131072,prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/Llama-3.1-8B-Instruct",name:"Llama-3.1-8B-Instruct",match:{equals:"meta-llama/Llama-3.1-8B-Instruct"},context_window:131072,prices:{input_mtok:.2,output_mtok:.2}},{id:"meta-llama/Llama-3.3-70B-Instruct",name:"Llama-3.3-70B-Instruct",match:{equals:"meta-llama/Llama-3.3-70B-Instruct"},context_window:131072,prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/Llama-4-Maverick-17B-128E-Instruct",name:"Llama-4-Maverick-17B-128E-Instruct",match:{equals:"meta-llama/Llama-4-Maverick-17B-128E-Instruct"},context_window:1048576,prices:{input_mtok:.22,output_mtok:.88}},{id:"meta-llama/Llama-4-Scout-17B-16E-Instruct",name:"Llama-4-Scout-17B-16E-Instruct",match:{equals:"meta-llama/Llama-4-Scout-17B-16E-Instruct"},context_window:1048576,prices:{input_mtok:.15,output_mtok:.6}},{id:"moonshotai/Kimi-K2-Instruct",name:"Kimi-K2-Instruct",match:{equals:"moonshotai/Kimi-K2-Instruct"},context_window:131072,prices:{input_mtok:.6,output_mtok:2.5}},{id:"openai/gpt-oss-120b",name:"gpt-oss-120b",match:{equals:"openai/gpt-oss-120b"},context_window:131072,prices:{input_mtok:.15,output_mtok:.6}},{id:"openai/gpt-oss-20b",name:"gpt-oss-20b",match:{equals:"openai/gpt-oss-20b"},context_window:131072,prices:{input_mtok:.05,output_mtok:.2}},{id:"zai-org/GLM-4.5",name:"GLM-4.5",match:{equals:"zai-org/GLM-4.5"},context_window:131072,prices:{input_mtok:.55,output_mtok:2.19}}]},{id:"huggingface_groq",name:"HuggingFace (groq)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/groq",provider_match:{and:[{contains:"huggingface"},{contains:"groq"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"Qwen/Qwen3-32B",name:"Qwen3-32B",match:{equals:"Qwen/Qwen3-32B"},context_window:131072,prices:{input_mtok:.29,output_mtok:.59}},{id:"meta-llama/Llama-3.3-70B-Instruct",name:"Llama-3.3-70B-Instruct",match:{equals:"meta-llama/Llama-3.3-70B-Instruct"},context_window:131072,prices:{input_mtok:.59,output_mtok:.79}},{id:"meta-llama/Llama-4-Maverick-17B-128E-Instruct",name:"Llama-4-Maverick-17B-128E-Instruct",match:{equals:"meta-llama/Llama-4-Maverick-17B-128E-Instruct"},context_window:131072,prices:{input_mtok:.2,output_mtok:.6}},{id:"meta-llama/Llama-4-Scout-17B-16E-Instruct",name:"Llama-4-Scout-17B-16E-Instruct",match:{equals:"meta-llama/Llama-4-Scout-17B-16E-Instruct"},context_window:131072,prices:{input_mtok:.11,output_mtok:.34}},{id:"meta-llama/Llama-Guard-4-12B",name:"Llama-Guard-4-12B",match:{equals:"meta-llama/Llama-Guard-4-12B"},context_window:131072,prices:{input_mtok:.2,output_mtok:.2}},{id:"openai/gpt-oss-120b",name:"gpt-oss-120b",match:{equals:"openai/gpt-oss-120b"},context_window:131072,prices:{input_mtok:.15,output_mtok:.75}},{id:"openai/gpt-oss-20b",name:"gpt-oss-20b",match:{equals:"openai/gpt-oss-20b"},context_window:131072,prices:{input_mtok:.1,output_mtok:.5}}]},{id:"huggingface_hyperbolic",name:"HuggingFace (hyperbolic)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/hyperbolic",provider_match:{and:[{contains:"huggingface"},{contains:"hyperbolic"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"Qwen/QwQ-32B",name:"QwQ-32B",match:{equals:"Qwen/QwQ-32B"},context_window:131072,prices:{input_mtok:.4,output_mtok:.4}},{id:"Qwen/Qwen2.5-72B-Instruct",name:"Qwen2.5-72B-Instruct",match:{equals:"Qwen/Qwen2.5-72B-Instruct"},context_window:131072,prices:{input_mtok:.4,output_mtok:.4}},{id:"Qwen/Qwen2.5-Coder-32B-Instruct",name:"Qwen2.5-Coder-32B-Instruct",match:{equals:"Qwen/Qwen2.5-Coder-32B-Instruct"},context_window:32768,prices:{input_mtok:.2,output_mtok:.2}},{id:"Qwen/Qwen2.5-VL-72B-Instruct",name:"Qwen2.5-VL-72B-Instruct",match:{equals:"Qwen/Qwen2.5-VL-72B-Instruct"},context_window:32768,prices:{input_mtok:.6,output_mtok:.6}},{id:"Qwen/Qwen2.5-VL-7B-Instruct",name:"Qwen2.5-VL-7B-Instruct",match:{equals:"Qwen/Qwen2.5-VL-7B-Instruct"},context_window:32768,prices:{input_mtok:.2,output_mtok:.2}},{id:"Qwen/Qwen3-235B-A22B-Instruct-2507",name:"Qwen3-235B-A22B-Instruct-2507",match:{equals:"Qwen/Qwen3-235B-A22B-Instruct-2507"},context_window:262144,prices:{input_mtok:2,output_mtok:2}},{id:"Qwen/Qwen3-Coder-480B-A35B-Instruct",name:"Qwen3-Coder-480B-A35B-Instruct",match:{equals:"Qwen/Qwen3-Coder-480B-A35B-Instruct"},context_window:262144,prices:{input_mtok:2,output_mtok:2}},{id:"Qwen/Qwen3-Next-80B-A3B-Instruct",name:"Qwen3-Next-80B-A3B-Instruct",match:{equals:"Qwen/Qwen3-Next-80B-A3B-Instruct"},context_window:262144,prices:{input_mtok:.3,output_mtok:.3}},{id:"Qwen/Qwen3-Next-80B-A3B-Thinking",name:"Qwen3-Next-80B-A3B-Thinking",match:{equals:"Qwen/Qwen3-Next-80B-A3B-Thinking"},context_window:262144,prices:{input_mtok:.3,output_mtok:.3}},{id:"deepseek-ai/DeepSeek-R1",name:"DeepSeek-R1",match:{equals:"deepseek-ai/DeepSeek-R1"},context_window:163840,prices:{input_mtok:2,output_mtok:2}},{id:"deepseek-ai/DeepSeek-R1-0528",name:"DeepSeek-R1-0528",match:{equals:"deepseek-ai/DeepSeek-R1-0528"},context_window:163840,prices:{input_mtok:3,output_mtok:3}},{id:"deepseek-ai/DeepSeek-V3-0324",name:"DeepSeek-V3-0324",match:{equals:"deepseek-ai/DeepSeek-V3-0324"},context_window:163840,prices:{input_mtok:1.25,output_mtok:1.25}},{id:"meta-llama/Llama-3.1-70B-Instruct",name:"Llama-3.1-70B-Instruct",match:{equals:"meta-llama/Llama-3.1-70B-Instruct"},context_window:131072,prices:{input_mtok:.4,output_mtok:.4}},{id:"meta-llama/Llama-3.1-8B-Instruct",name:"Llama-3.1-8B-Instruct",match:{equals:"meta-llama/Llama-3.1-8B-Instruct"},context_window:131072,prices:{input_mtok:.1,output_mtok:.1}},{id:"meta-llama/Llama-3.2-3B-Instruct",name:"Llama-3.2-3B-Instruct",match:{equals:"meta-llama/Llama-3.2-3B-Instruct"},context_window:131072,prices:{input_mtok:.1,output_mtok:.1}},{id:"meta-llama/Llama-3.3-70B-Instruct",name:"Llama-3.3-70B-Instruct",match:{equals:"meta-llama/Llama-3.3-70B-Instruct"},context_window:131072,prices:{input_mtok:.4,output_mtok:.4}},{id:"meta-llama/Meta-Llama-3-70B-Instruct",name:"Meta-Llama-3-70B-Instruct",match:{equals:"meta-llama/Meta-Llama-3-70B-Instruct"},context_window:8192,prices:{input_mtok:.4,output_mtok:.4}},{id:"openai/gpt-oss-120b",name:"gpt-oss-120b",match:{equals:"openai/gpt-oss-120b"},context_window:131072,prices:{input_mtok:.3,output_mtok:.3}},{id:"openai/gpt-oss-20b",name:"gpt-oss-20b",match:{equals:"openai/gpt-oss-20b"},context_window:131072,prices:{input_mtok:.1,output_mtok:.1}}]},{id:"huggingface_nebius",name:"HuggingFace (nebius)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/nebius",provider_match:{and:[{contains:"huggingface"},{contains:"nebius"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"NousResearch/Hermes-4-405B",name:"Hermes-4-405B",match:{equals:"NousResearch/Hermes-4-405B"},context_window:131072,prices:{input_mtok:1,output_mtok:3}},{id:"NousResearch/Hermes-4-70B",name:"Hermes-4-70B",match:{equals:"NousResearch/Hermes-4-70B"},context_window:131072,prices:{input_mtok:.13,output_mtok:.4}},{id:"Qwen/Qwen2.5-Coder-7B",name:"Qwen2.5-Coder-7B",match:{equals:"Qwen/Qwen2.5-Coder-7B"},context_window:32768,prices:{input_mtok:.03,output_mtok:.09}},{id:"Qwen/Qwen2.5-VL-72B-Instruct",name:"Qwen2.5-VL-72B-Instruct",match:{equals:"Qwen/Qwen2.5-VL-72B-Instruct"},context_window:32e3,prices:{input_mtok:.25,output_mtok:.75}},{id:"Qwen/Qwen3-235B-A22B-Instruct-2507",name:"Qwen3-235B-A22B-Instruct-2507",match:{equals:"Qwen/Qwen3-235B-A22B-Instruct-2507"},context_window:262144,prices:{input_mtok:.2,output_mtok:.6}},{id:"Qwen/Qwen3-30B-A3B-Instruct-2507",name:"Qwen3-30B-A3B-Instruct-2507",match:{equals:"Qwen/Qwen3-30B-A3B-Instruct-2507"},context_window:262144,prices:{input_mtok:.1,output_mtok:.3}},{id:"Qwen/Qwen3-30B-A3B-Thinking-2507",name:"Qwen3-30B-A3B-Thinking-2507",match:{equals:"Qwen/Qwen3-30B-A3B-Thinking-2507"},context_window:262144,prices:{input_mtok:.1,output_mtok:.3}},{id:"Qwen/Qwen3-32B",name:"Qwen3-32B",match:{equals:"Qwen/Qwen3-32B"},context_window:40960,prices:{input_mtok:.1,output_mtok:.3}},{id:"Qwen/Qwen3-Coder-30B-A3B-Instruct",name:"Qwen3-Coder-30B-A3B-Instruct",match:{equals:"Qwen/Qwen3-Coder-30B-A3B-Instruct"},context_window:262144,prices:{input_mtok:.1,output_mtok:.3}},{id:"Qwen/Qwen3-Coder-480B-A35B-Instruct",name:"Qwen3-Coder-480B-A35B-Instruct",match:{equals:"Qwen/Qwen3-Coder-480B-A35B-Instruct"},context_window:262144,prices:{input_mtok:.4,output_mtok:1.8}},{id:"deepseek-ai/DeepSeek-R1-0528",name:"DeepSeek-R1-0528",match:{equals:"deepseek-ai/DeepSeek-R1-0528"},context_window:163840,prices:{input_mtok:.8,output_mtok:2.4}},{id:"deepseek-ai/DeepSeek-V3-0324",name:"DeepSeek-V3-0324",match:{equals:"deepseek-ai/DeepSeek-V3-0324"},context_window:32768,prices:{input_mtok:.75,output_mtok:2.25}},{id:"google/gemma-2-2b-it",name:"gemma-2-2b-it",match:{equals:"google/gemma-2-2b-it"},context_window:8192,prices:{input_mtok:.02,output_mtok:.06}},{id:"google/gemma-2-9b-it",name:"gemma-2-9b-it",match:{equals:"google/gemma-2-9b-it"},context_window:8192,prices:{input_mtok:.03,output_mtok:.09}},{id:"google/gemma-3-27b-it",name:"gemma-3-27b-it",match:{equals:"google/gemma-3-27b-it"},context_window:11e4,prices:{input_mtok:.2,output_mtok:.6}},{id:"meta-llama/Llama-3.1-8B-Instruct",name:"Llama-3.1-8B-Instruct",match:{equals:"meta-llama/Llama-3.1-8B-Instruct"},context_window:131072,prices:{input_mtok:.03,output_mtok:.09}},{id:"meta-llama/Llama-3.3-70B-Instruct",name:"Llama-3.3-70B-Instruct",match:{equals:"meta-llama/Llama-3.3-70B-Instruct"},context_window:131072,prices:{input_mtok:.25,output_mtok:.75}},{id:"moonshotai/Kimi-K2-Instruct",name:"Kimi-K2-Instruct",match:{equals:"moonshotai/Kimi-K2-Instruct"},context_window:131072,prices:{input_mtok:.5,output_mtok:2.4}},{id:"nvidia/Llama-3_1-Nemotron-Ultra-253B-v1",name:"Llama-3_1-Nemotron-Ultra-253B-v1",match:{equals:"nvidia/Llama-3_1-Nemotron-Ultra-253B-v1"},context_window:131072,prices:{input_mtok:.6,output_mtok:1.8}},{id:"nvidia/NVIDIA-Nemotron-Nano-12B-v2",name:"NVIDIA-Nemotron-Nano-12B-v2",match:{equals:"nvidia/NVIDIA-Nemotron-Nano-12B-v2"},context_window:131072,prices:{input_mtok:.07,output_mtok:.2}},{id:"openai/gpt-oss-120b",name:"gpt-oss-120b",match:{equals:"openai/gpt-oss-120b"},context_window:131072,prices:{input_mtok:.15,output_mtok:.6}},{id:"openai/gpt-oss-20b",name:"gpt-oss-20b",match:{equals:"openai/gpt-oss-20b"},context_window:131072,prices:{input_mtok:.05,output_mtok:.2}},{id:"zai-org/GLM-4.5",name:"GLM-4.5",match:{equals:"zai-org/GLM-4.5"},context_window:131072,prices:{input_mtok:.6,output_mtok:2.2}},{id:"zai-org/GLM-4.5-Air",name:"GLM-4.5-Air",match:{equals:"zai-org/GLM-4.5-Air"},context_window:131072,prices:{input_mtok:.2,output_mtok:1.2}}]},{id:"huggingface_novita",name:"HuggingFace (novita)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/novita",provider_match:{and:[{contains:"huggingface"},{contains:"novita"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"MiniMaxAI/MiniMax-M1-80k",name:"MiniMax-M1-80k",match:{equals:"MiniMaxAI/MiniMax-M1-80k"},context_window:1e6,prices:{input_mtok:.44,output_mtok:1.76}},{id:"MiniMaxAI/MiniMax-M2",name:"MiniMax-M2",match:{equals:"MiniMaxAI/MiniMax-M2"},context_window:204800,prices:{input_mtok:.24,output_mtok:.96}},{id:"NousResearch/Hermes-2-Pro-Llama-3-8B",name:"Hermes-2-Pro-Llama-3-8B",match:{equals:"NousResearch/Hermes-2-Pro-Llama-3-8B"},context_window:8192,prices:{input_mtok:.14,output_mtok:.14}},{id:"Qwen/Qwen2.5-72B-Instruct",name:"Qwen2.5-72B-Instruct",match:{equals:"Qwen/Qwen2.5-72B-Instruct"},context_window:32e3,prices:{input_mtok:.304,output_mtok:.32}},{id:"Qwen/Qwen3-235B-A22B",name:"Qwen3-235B-A22B",match:{equals:"Qwen/Qwen3-235B-A22B"},context_window:40960,prices:{input_mtok:.16,output_mtok:.64}},{id:"Qwen/Qwen3-235B-A22B-Instruct-2507",name:"Qwen3-235B-A22B-Instruct-2507",match:{equals:"Qwen/Qwen3-235B-A22B-Instruct-2507"},context_window:131072,prices:{input_mtok:.072,output_mtok:.464}},{id:"Qwen/Qwen3-235B-A22B-Thinking-2507",name:"Qwen3-235B-A22B-Thinking-2507",match:{equals:"Qwen/Qwen3-235B-A22B-Thinking-2507"},context_window:131072,prices:{input_mtok:.24,output_mtok:2.4}},{id:"Qwen/Qwen3-30B-A3B",name:"Qwen3-30B-A3B",match:{equals:"Qwen/Qwen3-30B-A3B"},context_window:40960,prices:{input_mtok:.072,output_mtok:.36}},{id:"Qwen/Qwen3-32B",name:"Qwen3-32B",match:{equals:"Qwen/Qwen3-32B"},context_window:40960,prices:{input_mtok:.08,output_mtok:.36}},{id:"Qwen/Qwen3-Coder-480B-A35B-Instruct",name:"Qwen3-Coder-480B-A35B-Instruct",match:{equals:"Qwen/Qwen3-Coder-480B-A35B-Instruct"},context_window:262144,prices:{input_mtok:.232,output_mtok:.96}},{id:"Qwen/Qwen3-Next-80B-A3B-Instruct",name:"Qwen3-Next-80B-A3B-Instruct",match:{equals:"Qwen/Qwen3-Next-80B-A3B-Instruct"},context_window:131072,prices:{input_mtok:.12,output_mtok:1.2}},{id:"Qwen/Qwen3-Next-80B-A3B-Thinking",name:"Qwen3-Next-80B-A3B-Thinking",match:{equals:"Qwen/Qwen3-Next-80B-A3B-Thinking"},context_window:131072,prices:{input_mtok:.12,output_mtok:1.2}},{id:"Qwen/Qwen3-VL-235B-A22B-Instruct",name:"Qwen3-VL-235B-A22B-Instruct",match:{equals:"Qwen/Qwen3-VL-235B-A22B-Instruct"},context_window:131072,prices:{input_mtok:.24,output_mtok:1.2}},{id:"Qwen/Qwen3-VL-235B-A22B-Thinking",name:"Qwen3-VL-235B-A22B-Thinking",match:{equals:"Qwen/Qwen3-VL-235B-A22B-Thinking"},context_window:131072,prices:{input_mtok:.784,output_mtok:3.16}},{id:"Qwen/Qwen3-VL-30B-A3B-Instruct",name:"Qwen3-VL-30B-A3B-Instruct",match:{equals:"Qwen/Qwen3-VL-30B-A3B-Instruct"},context_window:131072,prices:{input_mtok:.16,output_mtok:.56}},{id:"Qwen/Qwen3-VL-30B-A3B-Thinking",name:"Qwen3-VL-30B-A3B-Thinking",match:{equals:"Qwen/Qwen3-VL-30B-A3B-Thinking"},context_window:131072,prices:{input_mtok:.16,output_mtok:.8}},{id:"Qwen/Qwen3-VL-8B-Instruct",name:"Qwen3-VL-8B-Instruct",match:{equals:"Qwen/Qwen3-VL-8B-Instruct"},context_window:131072,prices:{input_mtok:.064,output_mtok:.4}},{id:"Sao10K/L3-70B-Euryale-v2.1",name:"L3-70B-Euryale-v2.1",match:{equals:"Sao10K/L3-70B-Euryale-v2.1"},context_window:8192,prices:{input_mtok:1.48,output_mtok:1.48}},{id:"Sao10K/L3-8B-Lunaris-v1",name:"L3-8B-Lunaris-v1",match:{equals:"Sao10K/L3-8B-Lunaris-v1"},context_window:8192,prices:{input_mtok:.05,output_mtok:.05}},{id:"Sao10K/L3-8B-Stheno-v3.2",name:"L3-8B-Stheno-v3.2",match:{equals:"Sao10K/L3-8B-Stheno-v3.2"},context_window:8192,prices:{input_mtok:.05,output_mtok:.05}},{id:"alpindale/WizardLM-2-8x22B",name:"WizardLM-2-8x22B",match:{equals:"alpindale/WizardLM-2-8x22B"},context_window:65535,prices:{input_mtok:.496,output_mtok:.496}},{id:"baichuan-inc/Baichuan-M2-32B",name:"Baichuan-M2-32B",match:{equals:"baichuan-inc/Baichuan-M2-32B"},context_window:131072,prices:{input_mtok:.056,output_mtok:.056}},{id:"baidu/ERNIE-4.5-21B-A3B-PT",name:"ERNIE-4.5-21B-A3B-PT",match:{equals:"baidu/ERNIE-4.5-21B-A3B-PT"},context_window:12e4,prices:{input_mtok:.056,output_mtok:.224}},{id:"baidu/ERNIE-4.5-300B-A47B-Base-PT",name:"ERNIE-4.5-300B-A47B-Base-PT",match:{equals:"baidu/ERNIE-4.5-300B-A47B-Base-PT"},context_window:123e3,prices:{input_mtok:.224,output_mtok:.88}},{id:"baidu/ERNIE-4.5-VL-28B-A3B-PT",name:"ERNIE-4.5-VL-28B-A3B-PT",match:{equals:"baidu/ERNIE-4.5-VL-28B-A3B-PT"},context_window:3e4,prices:{input_mtok:.112,output_mtok:.448}},{id:"baidu/ERNIE-4.5-VL-424B-A47B-Base-PT",name:"ERNIE-4.5-VL-424B-A47B-Base-PT",match:{equals:"baidu/ERNIE-4.5-VL-424B-A47B-Base-PT"},context_window:123e3,prices:{input_mtok:.336,output_mtok:1}},{id:"deepseek-ai/DeepSeek-Prover-V2-671B",name:"DeepSeek-Prover-V2-671B",match:{equals:"deepseek-ai/DeepSeek-Prover-V2-671B"},context_window:16e4,prices:{input_mtok:.56,output_mtok:2}},{id:"deepseek-ai/DeepSeek-R1",name:"DeepSeek-R1",match:{or:[{equals:"deepseek-ai/DeepSeek-R1"},{equals:"deepseek-ai/DeepSeek-R1-0528"}]},context_window:64e3,prices:{input_mtok:.56,output_mtok:2}},{id:"deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",name:"DeepSeek-R1-0528-Qwen3-8B",match:{equals:"deepseek-ai/DeepSeek-R1-0528-Qwen3-8B"},context_window:128e3,prices:{input_mtok:.06,output_mtok:.09}},{id:"deepseek-ai/DeepSeek-R1-Distill-Llama-70B",name:"DeepSeek-R1-Distill-Llama-70B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Llama-70B"},context_window:8192,prices:{input_mtok:.64,output_mtok:.64}},{id:"deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",name:"DeepSeek-R1-Distill-Qwen-14B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Qwen-14B"},context_window:32768,prices:{input_mtok:.15,output_mtok:.15}},{id:"deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",name:"DeepSeek-R1-Distill-Qwen-32B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"},context_window:64e3,prices:{input_mtok:.24,output_mtok:.24}},{id:"deepseek-ai/DeepSeek-V3",name:"DeepSeek-V3",match:{equals:"deepseek-ai/DeepSeek-V3"},context_window:64e3,prices:{input_mtok:.32,output_mtok:1.04}},{id:"deepseek-ai/DeepSeek-V3-0324",name:"DeepSeek-V3-0324",match:{equals:"deepseek-ai/DeepSeek-V3-0324"},context_window:163840,prices:{input_mtok:.216,output_mtok:.896}},{id:"deepseek-ai/DeepSeek-V3.1",name:"DeepSeek-V3.1",match:{or:[{equals:"deepseek-ai/DeepSeek-V3.1"},{equals:"deepseek-ai/DeepSeek-V3.1-Terminus"}]},context_window:131072,prices:{input_mtok:.216,output_mtok:.8}},{id:"deepseek-ai/DeepSeek-V3.2-Exp",name:"DeepSeek-V3.2-Exp",match:{equals:"deepseek-ai/DeepSeek-V3.2-Exp"},context_window:163840,prices:{input_mtok:.216,output_mtok:.328}},{id:"meta-llama/Llama-3.1-8B-Instruct",name:"Llama-3.1-8B-Instruct",match:{equals:"meta-llama/Llama-3.1-8B-Instruct"},context_window:16384,prices:{input_mtok:.02,output_mtok:.05}},{id:"meta-llama/Llama-3.2-3B-Instruct",name:"Llama-3.2-3B-Instruct",match:{equals:"meta-llama/Llama-3.2-3B-Instruct"},context_window:32768,prices:{input_mtok:.024,output_mtok:.04}},{id:"meta-llama/Llama-3.3-70B-Instruct",name:"Llama-3.3-70B-Instruct",match:{equals:"meta-llama/Llama-3.3-70B-Instruct"},context_window:131072,prices:{input_mtok:.104,output_mtok:.312}},{id:"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",name:"Llama-4-Maverick-17B-128E-Instruct-FP8",match:{equals:"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8"},context_window:1048576,prices:{input_mtok:.136,output_mtok:.68}},{id:"meta-llama/Llama-4-Scout-17B-16E-Instruct",name:"Llama-4-Scout-17B-16E-Instruct",match:{equals:"meta-llama/Llama-4-Scout-17B-16E-Instruct"},context_window:131072,prices:{input_mtok:.08,output_mtok:.4}},{id:"meta-llama/Meta-Llama-3-70B-Instruct",name:"Meta-Llama-3-70B-Instruct",match:{equals:"meta-llama/Meta-Llama-3-70B-Instruct"},context_window:8192,prices:{input_mtok:.51,output_mtok:.74}},{id:"meta-llama/Meta-Llama-3-8B-Instruct",name:"Meta-Llama-3-8B-Instruct",match:{equals:"meta-llama/Meta-Llama-3-8B-Instruct"},context_window:8192,prices:{input_mtok:.032,output_mtok:.032}},{id:"moonshotai/Kimi-K2-Instruct",name:"Kimi-K2-Instruct",match:{equals:"moonshotai/Kimi-K2-Instruct"},context_window:131072,prices:{input_mtok:.456,output_mtok:1.84}},{id:"moonshotai/Kimi-K2-Instruct-0905",name:"Kimi-K2-Instruct-0905",match:{equals:"moonshotai/Kimi-K2-Instruct-0905"},context_window:262144,prices:{input_mtok:.48,output_mtok:2}},{id:"moonshotai/Kimi-K2-Thinking",name:"Kimi-K2-Thinking",match:{equals:"moonshotai/Kimi-K2-Thinking"},context_window:262144,prices:{input_mtok:.48,output_mtok:2}},{id:"openai/gpt-oss-120b",name:"gpt-oss-120b",match:{equals:"openai/gpt-oss-120b"},context_window:131072,prices:{input_mtok:.04,output_mtok:.2}},{id:"openai/gpt-oss-20b",name:"gpt-oss-20b",match:{equals:"openai/gpt-oss-20b"},context_window:131072,prices:{input_mtok:.032,output_mtok:.12}},{id:"zai-org/GLM-4-32B-0414",name:"GLM-4-32B-0414",match:{equals:"zai-org/GLM-4-32B-0414"},context_window:32e3,prices:{input_mtok:.55,output_mtok:1.66}},{id:"zai-org/GLM-4.1V-9B-Thinking",name:"GLM-4.1V-9B-Thinking",match:{equals:"zai-org/GLM-4.1V-9B-Thinking"},context_window:65536,prices:{input_mtok:.028,output_mtok:.1104}},{id:"zai-org/GLM-4.5",name:"GLM-4.5",match:{equals:"zai-org/GLM-4.5"},context_window:131072,prices:{input_mtok:.48,output_mtok:1.76}},{id:"zai-org/GLM-4.5-Air",name:"GLM-4.5-Air",match:{equals:"zai-org/GLM-4.5-Air"},context_window:131072,prices:{input_mtok:.104,output_mtok:.68}},{id:"zai-org/GLM-4.5V",name:"GLM-4.5V",match:{equals:"zai-org/GLM-4.5V"},context_window:65536,prices:{input_mtok:.48,output_mtok:1.44}},{id:"zai-org/GLM-4.6",name:"GLM-4.6",match:{equals:"zai-org/GLM-4.6"},context_window:204800,prices:{input_mtok:.48,output_mtok:1.76}}]},{id:"huggingface_nscale",name:"HuggingFace (nscale)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/nscale",provider_match:{and:[{contains:"huggingface"},{contains:"nscale"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"Qwen/QwQ-32B",name:"QwQ-32B",match:{equals:"Qwen/QwQ-32B"},context_window:131072,prices:{input_mtok:.18,output_mtok:.2}},{id:"Qwen/Qwen2.5-Coder-32B-Instruct",name:"Qwen2.5-Coder-32B-Instruct",match:{equals:"Qwen/Qwen2.5-Coder-32B-Instruct"},context_window:131072,prices:{input_mtok:.06,output_mtok:.2}},{id:"Qwen/Qwen2.5-Coder-3B-Instruct",name:"Qwen2.5-Coder-3B-Instruct",match:{equals:"Qwen/Qwen2.5-Coder-3B-Instruct"},context_window:32768,prices:{input_mtok:.01,output_mtok:.03}},{id:"Qwen/Qwen2.5-Coder-7B-Instruct",name:"Qwen2.5-Coder-7B-Instruct",match:{equals:"Qwen/Qwen2.5-Coder-7B-Instruct"},context_window:131072,prices:{input_mtok:.01,output_mtok:.03}},{id:"Qwen/Qwen3-14B",name:"Qwen3-14B",match:{equals:"Qwen/Qwen3-14B"},context_window:40960,prices:{input_mtok:.07,output_mtok:.2}},{id:"Qwen/Qwen3-235B-A22B",name:"Qwen3-235B-A22B",match:{or:[{equals:"Qwen/Qwen3-235B-A22B"},{equals:"Qwen/Qwen3-235B-A22B-Instruct-2507"}]},context_window:32e3,prices:{input_mtok:.2,output_mtok:.6}},{id:"Qwen/Qwen3-32B",name:"Qwen3-32B",match:{equals:"Qwen/Qwen3-32B"},context_window:40960,prices:{input_mtok:.08,output_mtok:.25}},{id:"Qwen/Qwen3-4B-Instruct-2507",name:"Qwen3-4B-Instruct-2507",match:{equals:"Qwen/Qwen3-4B-Instruct-2507"},context_window:262144,prices:{input_mtok:.01,output_mtok:.03}},{id:"Qwen/Qwen3-4B-Thinking-2507",name:"Qwen3-4B-Thinking-2507",match:{equals:"Qwen/Qwen3-4B-Thinking-2507"},context_window:262144,prices:{input_mtok:.01,output_mtok:.03}},{id:"Qwen/Qwen3-8B",name:"Qwen3-8B",match:{equals:"Qwen/Qwen3-8B"},context_window:40960,prices:{input_mtok:.07,output_mtok:.18}},{id:"deepseek-ai/DeepSeek-R1-Distill-Llama-70B",name:"DeepSeek-R1-Distill-Llama-70B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Llama-70B"},context_window:131072,prices:{input_mtok:.75,output_mtok:.75}},{id:"deepseek-ai/DeepSeek-R1-Distill-Llama-8B",name:"DeepSeek-R1-Distill-Llama-8B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Llama-8B"},context_window:131072,prices:{input_mtok:.05,output_mtok:.05}},{id:"deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",name:"DeepSeek-R1-Distill-Qwen-1.5B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B"},context_window:131072,prices:{input_mtok:.1,output_mtok:.1}},{id:"deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",name:"DeepSeek-R1-Distill-Qwen-14B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Qwen-14B"},context_window:131072,prices:{input_mtok:.2,output_mtok:.2}},{id:"deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",name:"DeepSeek-R1-Distill-Qwen-32B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"},context_window:131072,prices:{input_mtok:.3,output_mtok:.3}},{id:"deepseek-ai/DeepSeek-R1-Distill-Qwen-7B",name:"DeepSeek-R1-Distill-Qwen-7B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Qwen-7B"},context_window:131072,prices:{input_mtok:.15,output_mtok:.15}},{id:"meta-llama/Llama-3.1-8B-Instruct",name:"Llama-3.1-8B-Instruct",match:{equals:"meta-llama/Llama-3.1-8B-Instruct"},context_window:131072,prices:{input_mtok:.06,output_mtok:.06}},{id:"meta-llama/Llama-3.3-70B-Instruct",name:"Llama-3.3-70B-Instruct",match:{equals:"meta-llama/Llama-3.3-70B-Instruct"},context_window:131072,prices:{input_mtok:.4,output_mtok:.4}},{id:"meta-llama/Llama-4-Scout-17B-16E-Instruct",name:"Llama-4-Scout-17B-16E-Instruct",match:{equals:"meta-llama/Llama-4-Scout-17B-16E-Instruct"},context_window:89e4,prices:{input_mtok:.09,output_mtok:.29}},{id:"openai/gpt-oss-120b",name:"gpt-oss-120b",match:{equals:"openai/gpt-oss-120b"},context_window:131072,prices:{input_mtok:.1,output_mtok:.4}},{id:"openai/gpt-oss-20b",name:"gpt-oss-20b",match:{equals:"openai/gpt-oss-20b"},context_window:131072,prices:{input_mtok:.05,output_mtok:.2}}]},{id:"huggingface_publicai",name:"HuggingFace (publicai)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/publicai",provider_match:{and:[{contains:"huggingface"},{contains:"publicai"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"aisingapore/Gemma-SEA-LION-v4-27B-IT",name:"Gemma-SEA-LION-v4-27B-IT",match:{equals:"aisingapore/Gemma-SEA-LION-v4-27B-IT"},prices:{}},{id:"swiss-ai/Apertus-70B-Instruct-2509",name:"Apertus-70B-Instruct-2509",match:{equals:"swiss-ai/Apertus-70B-Instruct-2509"},prices:{}},{id:"swiss-ai/Apertus-8B-Instruct-2509",name:"Apertus-8B-Instruct-2509",match:{equals:"swiss-ai/Apertus-8B-Instruct-2509"},prices:{}}]},{id:"huggingface_sambanova",name:"HuggingFace (sambanova)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/sambanova",provider_match:{and:[{contains:"huggingface"},{contains:"sambanova"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"Qwen/Qwen3-32B",name:"Qwen3-32B",match:{equals:"Qwen/Qwen3-32B"},context_window:32768,prices:{input_mtok:.4,output_mtok:.8}},{id:"deepseek-ai/DeepSeek-R1-0528",name:"DeepSeek-R1-0528",match:{equals:"deepseek-ai/DeepSeek-R1-0528"},context_window:131072,prices:{input_mtok:5,output_mtok:7}},{id:"deepseek-ai/DeepSeek-R1-Distill-Llama-70B",name:"DeepSeek-R1-Distill-Llama-70B",match:{equals:"deepseek-ai/DeepSeek-R1-Distill-Llama-70B"},context_window:131072,prices:{input_mtok:.7,output_mtok:1.4}},{id:"deepseek-ai/DeepSeek-V3-0324",name:"DeepSeek-V3-0324",match:{equals:"deepseek-ai/DeepSeek-V3-0324"},context_window:131072,prices:{input_mtok:3,output_mtok:4.5}},{id:"meta-llama/Llama-3.1-8B-Instruct",name:"Llama-3.1-8B-Instruct",match:{equals:"meta-llama/Llama-3.1-8B-Instruct"},context_window:16384,prices:{input_mtok:.1,output_mtok:.2}},{id:"meta-llama/Llama-3.3-70B-Instruct",name:"Llama-3.3-70B-Instruct",match:{equals:"meta-llama/Llama-3.3-70B-Instruct"},context_window:131072,prices:{input_mtok:.6,output_mtok:1.2}},{id:"meta-llama/Llama-4-Maverick-17B-128E-Instruct",name:"Llama-4-Maverick-17B-128E-Instruct",match:{equals:"meta-llama/Llama-4-Maverick-17B-128E-Instruct"},context_window:131072,prices:{input_mtok:.63,output_mtok:1.8}},{id:"tokyotech-llm/Llama-3.3-Swallow-70B-Instruct-v0.4",name:"Llama-3.3-Swallow-70B-Instruct-v0.4",match:{equals:"tokyotech-llm/Llama-3.3-Swallow-70B-Instruct-v0.4"},context_window:131072,prices:{input_mtok:.6,output_mtok:1.2}}]},{id:"huggingface_together",name:"HuggingFace (together)",pricing_urls:["https://router.huggingface.co/v1/models","https://huggingface.co/inference/models"],api_pattern:"https://router\\.huggingface\\.co/together",provider_match:{and:[{contains:"huggingface"},{contains:"together"}]},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"Qwen/Qwen2.5-72B-Instruct",name:"Qwen2.5-72B-Instruct",match:{equals:"Qwen/Qwen2.5-72B-Instruct"},context_window:131072,prices:{input_mtok:1.2,output_mtok:1.2}},{id:"Qwen/Qwen2.5-7B-Instruct",name:"Qwen2.5-7B-Instruct",match:{equals:"Qwen/Qwen2.5-7B-Instruct"},context_window:32768,prices:{input_mtok:.3,output_mtok:.3}},{id:"Qwen/Qwen3-235B-A22B",name:"Qwen3-235B-A22B",match:{or:[{equals:"Qwen/Qwen3-235B-A22B"},{equals:"Qwen/Qwen3-235B-A22B-FP8"},{equals:"Qwen/Qwen3-235B-A22B-Instruct-2507"}]},context_window:40960,prices:{input_mtok:.2,output_mtok:.6}},{id:"Qwen/Qwen3-Coder-480B-A35B-Instruct",name:"Qwen3-Coder-480B-A35B-Instruct",match:{or:[{equals:"Qwen/Qwen3-Coder-480B-A35B-Instruct"},{equals:"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8"}]},context_window:262144,prices:{input_mtok:2,output_mtok:2}},{id:"Qwen/Qwen3-Next-80B-A3B-Instruct",name:"Qwen3-Next-80B-A3B-Instruct",match:{equals:"Qwen/Qwen3-Next-80B-A3B-Instruct"},context_window:262144,prices:{input_mtok:.15,output_mtok:1.5}},{id:"Qwen/Qwen3-Next-80B-A3B-Thinking",name:"Qwen3-Next-80B-A3B-Thinking",match:{equals:"Qwen/Qwen3-Next-80B-A3B-Thinking"},context_window:262144,prices:{input_mtok:.15,output_mtok:1.5}},{id:"deepcogito/cogito-671b-v2.1",name:"cogito-671b-v2.1",match:{or:[{equals:"deepcogito/cogito-671b-v2.1"},{equals:"deepcogito/cogito-671b-v2.1-FP8"}]},context_window:163840,prices:{input_mtok:1.25,output_mtok:1.25}},{id:"deepcogito/cogito-v2-preview-llama-109B-MoE",name:"cogito-v2-preview-llama-109B-MoE",match:{equals:"deepcogito/cogito-v2-preview-llama-109B-MoE"},context_window:32767,prices:{input_mtok:.18000000000000002,output_mtok:.5900000000000001}},{id:"deepcogito/cogito-v2-preview-llama-405B",name:"cogito-v2-preview-llama-405B",match:{equals:"deepcogito/cogito-v2-preview-llama-405B"},context_window:32768,prices:{input_mtok:3.5,output_mtok:3.5}},{id:"deepcogito/cogito-v2-preview-llama-70B",name:"cogito-v2-preview-llama-70B",match:{equals:"deepcogito/cogito-v2-preview-llama-70B"},context_window:32768,prices:{input_mtok:.88,output_mtok:.88}},{id:"deepseek-ai/DeepSeek-R1",name:"DeepSeek-R1",match:{or:[{equals:"deepseek-ai/DeepSeek-R1"},{equals:"deepseek-ai/DeepSeek-R1-0528"}]},context_window:163840,prices:{input_mtok:3,output_mtok:7}},{id:"deepseek-ai/DeepSeek-V3",name:"DeepSeek-V3",match:{or:[{equals:"deepseek-ai/DeepSeek-V3"},{equals:"deepseek-ai/DeepSeek-V3-0324"}]},context_window:131072,prices:{input_mtok:1.25,output_mtok:1.25}},{id:"deepseek-ai/DeepSeek-V3.1",name:"DeepSeek-V3.1",match:{equals:"deepseek-ai/DeepSeek-V3.1"},context_window:131072,prices:{input_mtok:.6,output_mtok:1.7}},{id:"marin-community/marin-8b-instruct",name:"marin-8b-instruct",match:{equals:"marin-community/marin-8b-instruct"},context_window:4096,prices:{input_mtok:.18000000000000002,output_mtok:.18000000000000002}},{id:"meta-llama/Llama-3.2-3B-Instruct",name:"Llama-3.2-3B-Instruct",match:{equals:"meta-llama/Llama-3.2-3B-Instruct"},context_window:131072,prices:{input_mtok:.060000000000000005,output_mtok:.060000000000000005}},{id:"meta-llama/Llama-3.3-70B-Instruct",name:"Llama-3.3-70B-Instruct",match:{equals:"meta-llama/Llama-3.3-70B-Instruct"},context_window:131072,prices:{input_mtok:.88,output_mtok:.88}},{id:"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",name:"Llama-4-Maverick-17B-128E-Instruct-FP8",match:{equals:"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8"},context_window:1048576,prices:{input_mtok:.27,output_mtok:.85}},{id:"meta-llama/Llama-4-Scout-17B-16E-Instruct",name:"Llama-4-Scout-17B-16E-Instruct",match:{equals:"meta-llama/Llama-4-Scout-17B-16E-Instruct"},context_window:1048576,prices:{input_mtok:.18000000000000002,output_mtok:.5900000000000001}},{id:"meta-llama/Meta-Llama-3-70B-Instruct",name:"Meta-Llama-3-70B-Instruct",match:{equals:"meta-llama/Meta-Llama-3-70B-Instruct"},context_window:8192,prices:{input_mtok:.88,output_mtok:.88}},{id:"moonshotai/Kimi-K2-Instruct",name:"Kimi-K2-Instruct",match:{or:[{equals:"moonshotai/Kimi-K2-Instruct"},{equals:"moonshotai/Kimi-K2-Instruct-0905"}]},context_window:131072,prices:{input_mtok:1,output_mtok:3}},{id:"moonshotai/Kimi-K2-Thinking",name:"Kimi-K2-Thinking",match:{equals:"moonshotai/Kimi-K2-Thinking"},context_window:262144,prices:{input_mtok:1.2,output_mtok:4}},{id:"openai/gpt-oss-120b",name:"gpt-oss-120b",match:{equals:"openai/gpt-oss-120b"},context_window:131072,prices:{input_mtok:.15,output_mtok:.6}},{id:"openai/gpt-oss-20b",name:"gpt-oss-20b",match:{equals:"openai/gpt-oss-20b"},context_window:131072,prices:{input_mtok:.05,output_mtok:.2}},{id:"zai-org/GLM-4.5-Air-FP8",name:"GLM-4.5-Air-FP8",match:{equals:"zai-org/GLM-4.5-Air-FP8"},context_window:131072,prices:{input_mtok:.2,output_mtok:1.1}}]},{id:"mistral",name:"Mistral",pricing_urls:["https://mistral.ai/pricing#api-pricing"],api_pattern:"https://api\\.mistral\\.ai",model_match:{regex:"(?:mi|code|dev|magi|mini)stral"},provider_match:{starts_with:"mistral"},extractors:[{api_flavor:"default",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"codestral",name:"Codestral",description:"Mistral's cutting-edge language model for coding. Codestral specializes in low-latency, high-frequency tasks such as fill-in-the-middle (FIM), code correction and test generation.",match:{or:[{equals:"codestral-latest"},{equals:"codestral-2501"}]},prices:{input_mtok:.3,output_mtok:.9}},{id:"devstral-small",name:"Devstral Small",description:"Devstral-Small-2505 is a 24B parameter agentic LLM fine-tuned from Mistral-Small-3.1, jointly developed by Mistral AI and All Hands AI for advanced software engineering tasks. It is optimized for codebase exploration, multi-file editing, and integration into coding agents, achieving state-of-the-art results on SWE-Bench Verified (46.8%).",match:{equals:"devstral-small"},prices:{input_mtok:.06,output_mtok:.12}},{id:"devstral-small:free",name:"Devstral Small (free)",description:"Devstral-Small-2505 is a 24B parameter agentic LLM fine-tuned from Mistral-Small-3.1, jointly developed by Mistral AI and All Hands AI for advanced software engineering tasks. It is optimized for codebase exploration, multi-file editing, and integration into coding agents, achieving state-of-the-art results on SWE-Bench Verified (46.8%).",match:{equals:"devstral-small:free"},prices:{}},{id:"magistral-medium",name:"Magistral Medium",description:"Magistral is Mistral's first reasoning model. It is ideal for general purpose use requiring longer thought processing and better accuracy than with non-reasoning LLMs. From legal research and financial forecasting to software development and creative storytelling — this model solves multi-step challenges where transparency and precision are critical.",match:{or:[{starts_with:"magistral-medium"}]},prices:{input_mtok:2,output_mtok:5}},{id:"magistral-small",name:"Magistral Small",description:"Magistral Small is a 24B parameter instruction-tuned model based on Mistral-Small-3.1 (2503), enhanced through supervised fine-tuning on traces from Magistral Medium and further refined via reinforcement learning. It is optimized for reasoning and supports a wide multilingual range, including over 20 languages.",match:{starts_with:"magistral-small-"},prices:{input_mtok:.5,output_mtok:1.5}},{id:"ministral-3b",name:"Ministral 3B",description:"Ministral 3B is a 3B parameter model optimized for on-device and edge computing. It excels in knowledge, commonsense reasoning, and function-calling, outperforming larger models like Mistral 7B on most benchmarks. Supporting up to 128k context length, it's ideal for orchestrating agentic workflows and specialist tasks with efficient inference.",match:{equals:"ministral-3b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"ministral-8b",name:"Ministral 8B 24.10",description:"Ministral 8B is an 8B parameter model featuring a unique interleaved sliding-window attention pattern for faster, memory-efficient inference. Designed for edge use cases, it supports up to 128k context length and excels in knowledge and reasoning tasks. It outperforms peers in the sub-10B category, making it perfect for low-latency, privacy-first applications.",match:{starts_with:"ministral-8b"},prices:{input_mtok:.1,output_mtok:1}},{id:"mistral-7b",name:"Mistral 7B",match:{or:[{equals:"mistral-7b"},{equals:"open-mistral-7b"}]},prices:{input_mtok:.25,output_mtok:.25}},{id:"mistral-embed",match:{equals:"mistral-embed"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistral-large",name:"Mistral Large",description:"This is Mistral AI's flagship model, Mistral Large 2 (version `mistral-large-2407`). It's a proprietary weights-available model and excels at reasoning, code, JSON, chat, and more. Read the launch announcement here.",match:{or:[{equals:"mistral-large"},{equals:"mistral-large-latest"},{equals:"mistral-large-2407"},{equals:"mistral-large-2411"}]},prices:{input_mtok:2,output_mtok:6}},{id:"mistral-medium-3",name:"Mistral Medium 3",description:"Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost. It balances state-of-the-art reasoning and multimodal performance with 8× lower cost compared to traditional large models, making it suitable for scalable deployments across professional and industrial use cases.",match:{starts_with:"mistral-medium"},prices:{input_mtok:.4,output_mtok:2}},{id:"mistral-nemo",name:"Mistral NeMo",description:"A 12B parameter model with a 128k token context length built by Mistral in collaboration with NVIDIA.",match:{or:[{equals:"mistral-nemo"},{equals:"open-mistral-nemo"}]},prices:{input_mtok:.15,output_mtok:.15}},{id:"mistral-nemo:free",name:"Mistral Nemo (free)",description:"A 12B parameter model with a 128k token context length built by Mistral in collaboration with NVIDIA.",match:{equals:"mistral-nemo:free"},prices:{}},{id:"mistral-saba",name:"Mistral Saba",description:"Mistral Saba is a 24B-parameter language model specifically designed for the Middle East and South Asia, delivering accurate and contextually relevant responses while maintaining efficient performance. Trained on curated regional datasets, it supports multiple Indian-origin languages—including Tamil and Malayalam—alongside Arabic. This makes it a versatile option for a range of regional and multilingual applications. Read more at the blog post here",match:{or:[{equals:"mistral-saba"},{equals:"mistral-saba-latest"}]},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistral-small",name:"Mistral Small",description:"With 22 billion parameters, Mistral Small v24.09 offers a convenient mid-point between (Mistral NeMo 12B)[/mistralai/mistral-nemo] and (Mistral Large 2)[/mistralai/mistral-large], providing a cost-effective solution that can be deployed across various platforms and environments. It has better reasoning, exhibits more capabilities, can produce and reason about code, and is multiligual, supporting English, French, German, Italian, and Spanish.",match:{starts_with:"mistral-small"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistral-small-24b-instruct-2501",name:"Mistral Small 3",description:"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks. Released under the Apache 2.0 license, it features both pre-trained and instruction-tuned versions designed for efficient local deployment.",match:{equals:"mistral-small-24b-instruct-2501"},price_comments:"Can't find pricing on this model, so just trusting open router",prices:{input_mtok:.05,output_mtok:.08}},{id:"mistral-small-24b-instruct-2501:free",name:"Mistral Small 3 (free)",description:"Mistral Small 3 is a 24B-parameter language model optimized for low-latency performance across common AI tasks. Released under the Apache 2.0 license, it features both pre-trained and instruction-tuned versions designed for efficient local deployment.",match:{equals:"mistral-small-24b-instruct-2501:free"},prices:{}},{id:"mistral-small-latest",name:"Mistral Small 3.2",description:"SOTA. Multimodal. Multilingual. Apache 2.0.",match:{equals:"mistral-small-latest"},prices:{input_mtok:.1,output_mtok:.3}},{id:"mistral-tiny",name:"Mistral Tiny",description:"Note: This model is being deprecated. Recommended replacement is the newer Ministral 8B",match:{equals:"mistral-tiny"},prices:{input_mtok:.25,output_mtok:.25}},{id:"mixtral-8x22b-instruct",name:"Mixtral 8x22B Instruct",description:`Mistral's official instruct fine-tuned version of Mixtral 8x22B. It uses 39B active parameters out of 141B, offering unparalleled cost efficiency for its size. Its strengths include:
|
|
8
8
|
- strong math, coding, and reasoning
|
|
9
9
|
- large context length (64k)
|
|
10
|
-
- fluency in English, French, Italian, German, and Spanish`,match:{equals:"mixtral-8x22b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"mixtral-8x7b",name:"Mixtral 8x7B",match:{or:[{starts_with:"mixtral-8x7b"},{equals:"open-mixtral-8x7b"}]},prices:{input_mtok:.7,output_mtok:.7}},{id:"pixtral-12b",name:"Pixtral 12B",description:"The first multi-modal, text+image-to-text model from Mistral AI. Its weights were launched via torrent: https://x.com/mistralai/status/1833758285167722836.",match:{or:[{equals:"pixtral-12b"},{equals:"pixtral-12b-latest"}]},prices:{input_mtok:.15,output_mtok:.15}},{id:"pixtral-large",name:"Pixtral Large 2411",description:"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of Mistral Large 2. The model is able to understand documents, charts and natural images.",match:{or:[{equals:"pixtral-large-latest"},{equals:"pixtral-large-2411"}]},prices:{input_mtok:2,output_mtok:6}}]},{id:"novita",name:"Novita",pricing_urls:["https://novita.ai/pricing"],api_pattern:"https://api\\.novita\\.ai",models:[{id:"Sao10K/L3-8B-Stheno-v3.2",match:{equals:"Sao10K/L3-8B-Stheno-v3.2"},prices:{input_mtok:.05,output_mtok:.05}},{id:"cognitivecomputations/dolphin-mixtral-8x22b",match:{equals:"cognitivecomputations/dolphin-mixtral-8x22b"},prices:{input_mtok:.9,output_mtok:.9}},{id:"deepseek/deepseek-r1",match:{equals:"deepseek/deepseek-r1"},prices:{input_mtok:4,output_mtok:4}},{id:"deepseek/deepseek-r1-distill-llama-70b",match:{equals:"deepseek/deepseek-r1-distill-llama-70b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"deepseek/deepseek-r1-distill-llama-8b",match:{equals:"deepseek/deepseek-r1-distill-llama-8b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"deepseek/deepseek-r1-distill-qwen-14b",match:{equals:"deepseek/deepseek-r1-distill-qwen-14b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"deepseek/deepseek-r1-distill-qwen-32b",match:{equals:"deepseek/deepseek-r1-distill-qwen-32b"},prices:{input_mtok:.3,output_mtok:.3}},{id:"deepseek/deepseek_v3",match:{equals:"deepseek/deepseek_v3"},prices:{input_mtok:.89,output_mtok:.89}},{id:"google/gemma-2-9b-it",match:{equals:"google/gemma-2-9b-it"},prices:{input_mtok:.08,output_mtok:.08}},{id:"gryphe/mythomax-l2-13b",match:{equals:"gryphe/mythomax-l2-13b"},prices:{input_mtok:.09,output_mtok:.09}},{id:"jondurbin/airoboros-l2-70b",match:{equals:"jondurbin/airoboros-l2-70b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"meta-llama/llama-3-70b-instruct",match:{equals:"meta-llama/llama-3-70b-instruct"},prices:{input_mtok:.51,output_mtok:.74}},{id:"meta-llama/llama-3-8b-instruct",match:{equals:"meta-llama/llama-3-8b-instruct"},prices:{input_mtok:.04,output_mtok:.04}},{id:"meta-llama/llama-3.1-70b-instruct",match:{equals:"meta-llama/llama-3.1-70b-instruct"},prices:{input_mtok:.34,output_mtok:.39}},{id:"meta-llama/llama-3.1-8b-instruct",match:{or:[{equals:"meta-llama/llama-3.1-8b-instruct"},{equals:"meta-llama/llama-3.1-8b-instruct-max"}]},prices:{input_mtok:.05,output_mtok:.05}},{id:"meta-llama/llama-3.1-8b-instruct-bf16",match:{equals:"meta-llama/llama-3.1-8b-instruct-bf16"},prices:{input_mtok:.06,output_mtok:.06}},{id:"meta-llama/llama-3.2-11b-vision-instruct",match:{equals:"meta-llama/llama-3.2-11b-vision-instruct"},prices:{input_mtok:.06,output_mtok:.06}},{id:"meta-llama/llama-3.2-1b-instruct",match:{equals:"meta-llama/llama-3.2-1b-instruct"},prices:{input_mtok:.02,output_mtok:.02}},{id:"meta-llama/llama-3.2-3b-instruct",match:{equals:"meta-llama/llama-3.2-3b-instruct"},prices:{input_mtok:.03,output_mtok:.05}},{id:"meta-llama/llama-3.3-70b-instruct",match:{equals:"meta-llama/llama-3.3-70b-instruct"},prices:{input_mtok:.39,output_mtok:.39}},{id:"microsoft/wizardlm-2-8x22b",match:{equals:"microsoft/wizardlm-2-8x22b"},prices:{input_mtok:.62,output_mtok:.62}},{id:"mistralai/mistral-7b-instruct",match:{equals:"mistralai/mistral-7b-instruct"},prices:{input_mtok:.059,output_mtok:.059}},{id:"mistralai/mistral-nemo",match:{equals:"mistralai/mistral-nemo"},prices:{input_mtok:.17,output_mtok:.17}},{id:"nousresearch/hermes-2-pro-llama-3-8b",match:{equals:"nousresearch/hermes-2-pro-llama-3-8b"},prices:{input_mtok:.14,output_mtok:.14}},{id:"nousresearch/nous-hermes-llama2-13b",match:{equals:"nousresearch/nous-hermes-llama2-13b"},prices:{input_mtok:.17,output_mtok:.17}},{id:"openchat/openchat-7b",match:{equals:"openchat/openchat-7b"},prices:{input_mtok:.06,output_mtok:.06}},{id:"qwen/qwen-2-7b-instruct",match:{equals:"qwen/qwen-2-7b-instruct"},prices:{input_mtok:.054,output_mtok:.054}},{id:"qwen/qwen-2-vl-72b-instruct",match:{equals:"qwen/qwen-2-vl-72b-instruct"},prices:{input_mtok:.45,output_mtok:.45}},{id:"qwen/qwen-2.5-72b-instruct",match:{equals:"qwen/qwen-2.5-72b-instruct"},prices:{input_mtok:.38,output_mtok:.4}},{id:"sao10k/l3-70b-euryale-v2.1",match:{equals:"sao10k/l3-70b-euryale-v2.1"},prices:{input_mtok:1.48,output_mtok:1.48}},{id:"sao10k/l3-8b-lunaris",match:{equals:"sao10k/l3-8b-lunaris"},prices:{input_mtok:.05,output_mtok:.05}},{id:"sao10k/l31-70b-euryale-v2.2",match:{equals:"sao10k/l31-70b-euryale-v2.2"},prices:{input_mtok:1.48,output_mtok:1.48}},{id:"sophosympatheia/midnight-rose-70b",match:{equals:"sophosympatheia/midnight-rose-70b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"teknium/openhermes-2.5-mistral-7b",match:{equals:"teknium/openhermes-2.5-mistral-7b"},prices:{input_mtok:.17,output_mtok:.17}}]},{id:"openai",name:"OpenAI",pricing_urls:["https://platform.openai.com/docs/pricing","https://openai.com/api/pricing/","https://platform.openai.com/docs/models","https://help.openai.com/en/articles/7127956-how-much-does-gpt-4-cost"],api_pattern:"https://api\\.openai\\.com",model_match:{or:[{starts_with:"gpt-"},{regex:"^o[134]"}]},provider_match:{contains:"openai"},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]},{api_flavor:"responses",root:"usage",model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:["input_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:"output_tokens",dest:"output_tokens",required:!0}]},{api_flavor:"embeddings",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0}]}],models:[{id:"ada",match:{or:[{equals:"ada"},{equals:"text-ada-001"}]},prices:{input_mtok:.4,output_mtok:.4}},{id:"babbage",match:{equals:"babbage"},prices:{input_mtok:.5,output_mtok:.5}},{id:"chatgpt-4o-latest",name:"ChatGPT-4o",description:"OpenAI ChatGPT 4o is continually updated by OpenAI to point to the current version of GPT-4o used by ChatGPT. It therefore differs slightly from the API version of GPT-4o in that it has additional RLHF. It is intended for research and evaluation.",match:{equals:"chatgpt-4o-latest"},prices:{input_mtok:5,output_mtok:15}},{id:"codex-mini",name:"Codex Mini",description:"codex-mini-latest is a fine-tuned version of o4-mini specifically for use in Codex CLI. For direct use in the API, we recommend starting with gpt-4.1.",match:{or:[{equals:"codex-mini"},{equals:"codex-mini-latest"}]},prices:{input_mtok:1.5,cache_read_mtok:.375,output_mtok:6}},{id:"computer-use",name:"Computer use",match:{starts_with:"computer-use"},prices:{input_mtok:3,output_mtok:12}},{id:"curie",match:{or:[{equals:"curie"},{equals:"text-curie-001"}]},prices:{input_mtok:2,output_mtok:2}},{id:"davinci",match:{or:[{equals:"davinci"},{equals:"text-davinci-001"}]},prices:{input_mtok:20,output_mtok:20}},{id:"ft:gpt-3.5-turbo-",description:"GPT-3.5 Turbo fine tuned.",match:{starts_with:"ft:gpt-3.5-turbo"},prices:{input_mtok:3,output_mtok:6}},{id:"ft:gpt-4o",description:"GPT-4o fine tuned.",match:{starts_with:"ft:gpt-4o-2024-"},prices:{input_mtok:3.75,output_mtok:15}},{id:"ft:gpt-4o-mini",description:"GPT-4o Mini fine tuned.",match:{starts_with:"ft:gpt-4o-mini-2024-"},prices:{input_mtok:.3,output_mtok:1.2}},{id:"gpt-3.5-0301",match:{or:[{equals:"gpt-3.5-turbo-0301"},{equals:"gpt-3.5-0301"}]},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-3.5-turbo",name:"gpt 3.5 turbo",description:"GPT-3.5 Turbo offers a balance between cost and performance.",match:{or:[{equals:"gpt-3.5-turbo"},{equals:"gpt-35-turbo"},{equals:"gpt-3.5-turbo-0125"}]},context_window:16385,prices:{input_mtok:.5,output_mtok:1.5}},{id:"gpt-3.5-turbo-0613",match:{equals:"gpt-3.5-turbo-0613"},context_window:16385,prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-3.5-turbo-1106",match:{equals:"gpt-3.5-turbo-1106"},context_window:16385,prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo-16k",name:"GPT-3.5 Turbo 16k",description:"This model offers four times the context length of gpt-3.5-turbo, allowing it to support approximately 20 pages of text in a single request at a higher cost. Training data: up to Sep 2021.",match:{or:[{equals:"gpt-3.5-turbo-16k"},{equals:"gpt-3.5-turbo-16k-0613"},{equals:"gpt-35-turbo-16k-0613"},{equals:"gpt-35-turbo-16k"}]},context_window:16385,prices:{input_mtok:3,output_mtok:4}},{id:"gpt-3.5-turbo-instruct",name:"gpt 3.5 turbo instruct",description:"GPT-3.5 Turbo offers a balance between cost and performance.",match:{or:[{starts_with:"gpt-3.5-turbo-instruct"},{equals:"gpt-3.5-turbo-instruct-0914"}]},context_window:16385,prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-4",name:"gpt 4",description:"GPT-4 is the latest and most advanced model in the GPT series, demonstrating sophisticated capabilities in complex reasoning, theory of mind, and narrative understanding.",match:{or:[{equals:"gpt-4"},{equals:"gpt-4-0314"},{equals:"gpt-4-0613"},{starts_with:"ft:gpt-4-0"}]},context_window:8192,prices:{input_mtok:30,output_mtok:60}},{id:"gpt-4-32k",name:"gpt 4",description:"GPT-4 is the latest and most advanced model in the GPT series, demonstrating sophisticated capabilities in complex reasoning, theory of mind, and narrative understanding.",match:{or:[{equals:"gpt-4-32k"},{equals:"gpt-4-32k-0314"},{equals:"gpt-4-32k-0613"}]},context_window:32e3,price_comments:"see https://help.openai.com/en/articles/7127956-how-much-does-gpt-4-cost",prices:{input_mtok:60,output_mtok:120}},{id:"gpt-4-turbo",name:"gpt 4 turbo",description:"GPT-4 Turbo offers a balance between cost and performance.",match:{or:[{equals:"gpt-4-turbo"},{equals:"gpt-4-turbo-2024-04-09"},{equals:"gpt-4-turbo-0125-preview"},{equals:"gpt-4-0125-preview"},{equals:"gpt-4-1106-preview"},{equals:"gpt-4-turbo-preview"}]},context_window:128e3,prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-vision-preview",name:"gpt 4 vision",description:"GPT-4 Vision is a model that offers a balance between cost and performance.",match:{or:[{equals:"gpt-4-vision-preview"},{equals:"gpt-4-1106-vision-preview"}]},context_window:128e3,prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4.1",name:"gpt 4.1",description:"GPT-4.1 is OpenAI's latest flagship model, offering major improvements in coding, instruction following, and long context understanding with up to 1 million tokens of context.",match:{or:[{equals:"gpt-4.1"},{equals:"gpt-4.1-2025-04-14"}]},context_window:1e6,prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"gpt-4.1-mini",name:"gpt 4.1 mini",description:"GPT-4.1 Mini is a significant leap in small model performance, matching or exceeding GPT-4o in many benchmarks while reducing latency by nearly half and cost by 83%.",match:{or:[{equals:"gpt-4.1-mini"},{equals:"gpt-4.1-mini-2025-04-14"}]},context_window:1e6,prices:{input_mtok:.4,cache_read_mtok:.1,output_mtok:1.6}},{id:"gpt-4.1-nano",name:"gpt 4.1 nano",description:"GPT-4.1 Nano is OpenAI's fastest and cheapest model, delivering exceptional performance for its size with a 1 million token context window, ideal for classification and autocompletion tasks.",match:{or:[{equals:"gpt-4.1-nano"},{equals:"gpt-4.1-nano-2025-04-14"}]},context_window:1e6,prices:{input_mtok:.1,cache_read_mtok:.025,output_mtok:.4}},{id:"gpt-4.5-preview",name:"GPT-4.5 (Preview)",description:"GPT-4.5 (Preview) is a research preview of OpenAI's latest language model, designed to advance capabilities in reasoning, creativity, and multi-turn conversation. It builds on previous iterations with improvements in world knowledge, contextual coherence, and the ability to follow user intent more effectively.",match:{starts_with:"gpt-4.5-preview"},prices:{input_mtok:75,cache_read_mtok:37.5,output_mtok:150}},{id:"gpt-4o",name:"gpt 4o",description:"GPT-4 Optimized (GPT-4o) is designed for high performance in reasoning, creativity, and technical tasks while maintaining consistent output quality.",match:{or:[{equals:"gpt-4o"},{equals:"gpt-4o-2024-05-13"},{equals:"gpt-4o-2024-08-06"},{equals:"gpt-4o-2024-11-20"}]},context_window:128e3,prices:{input_mtok:2.5,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-4o-audio-preview",name:"gpt 4o audio preview",description:"Audio model for gpt-4o",match:{starts_with:"gpt-4o-audio-preview"},context_window:128e3,prices:{output_mtok:10,input_audio_mtok:2.5}},{id:"gpt-4o-mini",name:"gpt 4o mini",description:"GPT-4o Mini is a cost-optimized variant of GPT-4o, designed for high-efficiency processing while maintaining strong performance. It excels in rapid inference and resource-efficient operations, making it ideal for production deployments requiring a balance of cost and capability.",match:{or:[{equals:"gpt-4o-mini"},{equals:"gpt-4o-mini-2024-07-18"},{equals:"gpt-4o-mini-search-preview"},{equals:"gpt-4o-mini-search-preview-2025-03-11"}]},context_window:128e3,prices:{input_mtok:.15,cache_read_mtok:.075,output_mtok:.6}},{id:"gpt-4o-mini-2024-07-18.ft-",description:"GPT-4o Mini fine tuned.",match:{starts_with:"gpt-4o-mini-2024-07-18.ft-"},prices:{input_mtok:.3,output_mtok:1.2}},{id:"gpt-4o-mini-audio-preview",name:"gpt 4o mini audio preview",description:"Audio model for gpt-4o mini",match:{starts_with:"gpt-4o-mini-audio"},prices:{output_mtok:.6,input_audio_mtok:.15}},{id:"gpt-4o-mini-realtime-preview",match:{starts_with:"gpt-4o-mini-realtime"},prices:{input_mtok:.6,cache_read_mtok:.3,output_mtok:2.4,input_audio_mtok:10,cache_audio_read_mtok:.3,output_audio_mtok:20}},{id:"gpt-4o-mini-transcribe",match:{equals:"gpt-4o-mini-transcribe"},prices:{input_mtok:1.25,output_mtok:5,input_audio_mtok:3}},{id:"gpt-4o-mini-tts",match:{equals:"gpt-4o-mini-tts"},prices:{input_mtok:.6,output_audio_mtok:12}},{id:"gpt-4o-realtime-preview",match:{starts_with:"gpt-4o-realtime"},prices:{input_mtok:5,cache_read_mtok:2.5,output_mtok:20,input_audio_mtok:40,cache_audio_read_mtok:2.5,output_audio_mtok:80}},{id:"gpt-4o-search-preview",name:"GPT-4o Search Preview",description:"GPT-4o Search Previewis a specialized model for web search in Chat Completions. It is trained to understand and execute web search queries.",match:{or:[{equals:"gpt-4o-search-preview"},{equals:"gpt-4o-search-preview-2025-03-11"}]},prices:{input_mtok:2.5,output_mtok:10}},{id:"gpt-4o-transcribe",match:{or:[{equals:"gpt-4o-transcribe"},{equals:"gpt-4o-transcribe-diarize"}]},prices:{input_mtok:2.5,output_mtok:10,input_audio_mtok:6}},{id:"gpt-4o:extended",name:"GPT-4o (extended)",description:`GPT-4o ("o" for "omni") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of GPT-4 Turbo while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.`,match:{equals:"gpt-4o:extended"},prices:{input_mtok:6,output_mtok:18}},{id:"gpt-5",name:"GPT-5",description:"GPT-5 is OpenAI's flagship model for coding, reasoning, and agentic tasks across domains.",match:{or:[{equals:"gpt-5"},{equals:"gpt-5-2025-08-07"},{equals:"gpt-5-chat"},{equals:"gpt-5-chat-latest"},{equals:"gpt-5-codex"}]},context_window:4e5,prices:{input_mtok:1.25,cache_read_mtok:.125,output_mtok:10}},{id:"gpt-5-image",match:{equals:"gpt-5-image"},price_comments:"Seen on OpenRouter before OpenAI",prices:{input_mtok:10,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-5-image-mini",match:{equals:"gpt-5-image-mini"},price_comments:"Seen on OpenRouter before OpenAI",prices:{input_mtok:2.5,cache_read_mtok:.25,output_mtok:2}},{id:"gpt-5-mini",name:"GPT-5 mini",description:"GPT-5 mini is a faster, more cost-efficient version of GPT-5. It's great for well-defined tasks and precise prompts.",match:{or:[{equals:"gpt-5-mini"},{equals:"gpt-5-mini-2025-08-07"}]},context_window:4e5,prices:{input_mtok:.25,cache_read_mtok:.025,output_mtok:2}},{id:"gpt-5-nano",name:"GPT-5 nano",description:"GPT-5 Nano is OpenAI's fastest, cheapest version of GPT-5. It's great for summarization and classification tasks.",match:{or:[{equals:"gpt-5-nano"},{starts_with:"gpt-5-nano-"}]},context_window:4e5,prices:{input_mtok:.05,cache_read_mtok:.005,output_mtok:.4}},{id:"gpt-5-pro",match:{or:[{equals:"gpt-5-pro"},{equals:"gpt-5-pro-2025-10-06"}]},context_window:4e5,prices:{input_mtok:15,output_mtok:120}},{id:"gpt-5.1",name:"GPT-5.1",description:"The best model for coding and agentic tasks across industries",match:{or:[{equals:"gpt-5.1"},{equals:"gpt-5.1-2025-11-13"},{equals:"gpt-5.1-codex"},{equals:"gpt-5.1-chat-latest"}]},context_window:4e5,prices:{input_mtok:1.25,cache_read_mtok:.125,output_mtok:10}},{id:"gpt-5.1-codex-mini",name:"GPT-5.1 Codex Mini",match:{or:[{equals:"gpt-5.1-codex-mini"},{equals:"gpt-5.1-mini"}]},context_window:4e5,prices:{input_mtok:.25,cache_read_mtok:.025,output_mtok:2}},{id:"gpt-realtime",match:{or:[{equals:"gpt-realtime"},{equals:"gpt-realtime-2025-08-28"}]},price_comments:"Missing image token prices which we don't support yet",prices:{input_mtok:4,cache_read_mtok:.4,output_mtok:16,input_audio_mtok:32,cache_audio_read_mtok:.4,output_audio_mtok:64}},{id:"gpt-realtime-mini",match:{equals:"gpt-realtime-mini"},price_comments:"Missing image token prices which we don't support yet",prices:{input_mtok:.6,cache_read_mtok:.06,output_mtok:2.4,input_audio_mtok:10,cache_audio_read_mtok:.3,output_audio_mtok:20}},{id:"moderation",description:"All OpenAI moderation models and endpoints are free of charge",match:{contains:"moderation"},prices:{}},{id:"o1",name:"o1",description:"O1 is a model that offers a balance between cost and performance.",match:{or:[{equals:"o1"},{equals:"o1-2024-12-17"},{equals:"o1-preview"},{equals:"o1-preview-2024-09-12"}]},context_window:128e3,prices:{input_mtok:15,cache_read_mtok:7.5,output_mtok:60}},{id:"o1-mini",name:"o1 mini",description:"O1 Mini is a model that offers a balance between cost and performance.",match:{or:[{equals:"o1-mini"},{equals:"o1-mini-2024-09-12"}]},context_window:128e3,prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o1-pro",name:"o1-pro",description:"The o1 series of models are trained with reinforcement learning to think before they answer and perform complex reasoning. The o1-pro model uses more compute to think harder and provide consistently better answers.",match:{or:[{equals:"o1-pro"},{equals:"o1-pro-2025-03-19"}]},prices:{input_mtok:150,output_mtok:600}},{id:"o3",name:"o3",description:"o3 is a well-rounded and powerful model across domains. It sets a new standard for math, science, coding, and visual reasoning tasks. It also excels at technical writing and instruction-following. Use it to think through multi-step problems that involve analysis across text, code, and images. Note that BYOK is required for this model. Set up here: https://openrouter.ai/settings/integrations",match:{or:[{equals:"o3"},{equals:"o3-2025-04-16"}]},prices:[{prices:{input_mtok:10,cache_read_mtok:.5,output_mtok:40}},{constraint:{start_date:"2025-06-10",type:"start_date"},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}}]},{id:"o3-deep-research",match:{or:[{equals:"o3-deep-research"},{equals:"o3-deep-research-2025-06-26"}]},prices:{input_mtok:10,cache_read_mtok:2.5,output_mtok:40}},{id:"o3-mini",name:"o3 Mini",description:"OpenAI o3-mini is a cost-efficient language model optimized for STEM reasoning tasks, particularly excelling in science, mathematics, and coding.",match:{or:[{equals:"o3-mini"},{equals:"o3-mini-2025-01-31"},{equals:"o3-mini-high"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o3-pro",name:"o3 Pro",description:"The o-series of models are trained with reinforcement learning to think before they answer and perform complex reasoning. The o3-pro model uses more compute to think harder and provide consistently better answers.",match:{or:[{equals:"o3-pro"},{equals:"o3-pro-2025-06-10"}]},prices:{input_mtok:20,output_mtok:80}},{id:"o4-mini",name:"o4 Mini High",description:"OpenAI o4-mini-high is the same model as o4-mini with reasoning_effort set to high.",match:{or:[{equals:"o4-mini-2025-04-16"},{equals:"o4-mini-high"},{equals:"o4-mini"}]},prices:{input_mtok:1.1,cache_read_mtok:.275,output_mtok:4.4}},{id:"o4-mini-deep-research",match:{or:[{equals:"o4-mini-deep-research"},{equals:"o4-mini-deep-research-2025-06-26"}]},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"text-davinci-002",match:{equals:"text-davinci-002"},prices:{input_mtok:20,output_mtok:20}},{id:"text-davinci-003",match:{equals:"text-davinci-003"},prices:{input_mtok:20,output_mtok:20}},{id:"text-embedding-3-large",name:"text embedding 3",description:"Text Embedding 3 is a model that offers a balance between cost and performance.",match:{equals:"text-embedding-3-large"},context_window:3072,prices:{input_mtok:.13}},{id:"text-embedding-3-small",name:"text embedding 3",description:"Text Embedding 3 is a model that offers a balance between cost and performance.",match:{equals:"text-embedding-3-small"},context_window:3072,prices:{input_mtok:.02}},{id:"text-embedding-ada-002",name:"text embedding ada",description:"Text Embedding Ada is a model that offers a balance between cost and performance.",match:{or:[{equals:"text-embedding-ada"},{equals:"text-embedding-ada-002"},{equals:"text-embedding-ada-002-v2"}]},context_window:1536,prices:{input_mtok:.1}}]},{id:"openrouter",name:"OpenRouter",pricing_urls:["https://openrouter.ai/models"],api_pattern:"https://(api\\.)?openrouter\\.ai",models:[{id:"01-ai/yi-large",match:{equals:"01-ai/yi-large"},prices:{input_mtok:3,output_mtok:3}},{id:"aetherwiing/mn-starcannon-12b",match:{equals:"aetherwiing/mn-starcannon-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"agentica-org/deepcoder-14b-preview:free",match:{equals:"agentica-org/deepcoder-14b-preview:free"},prices:{}},{id:"ai21/jamba-1-5-large",match:{equals:"ai21/jamba-1-5-large"},prices:{input_mtok:2,output_mtok:8}},{id:"ai21/jamba-1-5-mini",match:{equals:"ai21/jamba-1-5-mini"},prices:{input_mtok:.2,output_mtok:.4}},{id:"ai21/jamba-1.6-large",match:{equals:"ai21/jamba-1.6-large"},prices:{input_mtok:2,output_mtok:8}},{id:"ai21/jamba-1.6-mini",match:{equals:"ai21/jamba-1.6-mini"},prices:{input_mtok:.2,output_mtok:.4}},{id:"ai21/jamba-instruct",match:{equals:"ai21/jamba-instruct"},prices:{input_mtok:.5,output_mtok:.7}},{id:"aion-1.0",name:"Aion-1.0",match:{equals:"aion-1.0"},prices:{input_mtok:4,output_mtok:8}},{id:"aion-1.0-mini",name:"Aion-1.0-Mini",match:{equals:"aion-1.0-mini"},prices:{input_mtok:.7,output_mtok:1.4}},{id:"aion-labs/aion-1.0",match:{equals:"aion-labs/aion-1.0"},prices:{input_mtok:4,output_mtok:8}},{id:"aion-labs/aion-1.0-mini",match:{equals:"aion-labs/aion-1.0-mini"},prices:{input_mtok:.7,output_mtok:1.4}},{id:"aion-labs/aion-rp-llama-3.1-8b",match:{equals:"aion-labs/aion-rp-llama-3.1-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"aion-rp-llama-3.1-8b",name:"Aion-RP 1.0 (8B)",match:{equals:"aion-rp-llama-3.1-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"alfredpros/codellama-7b-instruct-solidity",match:{equals:"alfredpros/codellama-7b-instruct-solidity"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"all-hands/openhands-lm-32b-v0.1",match:{equals:"all-hands/openhands-lm-32b-v0.1"},prices:{input_mtok:2.6,output_mtok:3.4}},{id:"allenai/molmo-7b-d:free",match:{equals:"allenai/molmo-7b-d:free"},prices:{}},{id:"alpindale/goliath-120b",match:{equals:"alpindale/goliath-120b"},prices:{input_mtok:6.5625,output_mtok:9.375}},{id:"alpindale/magnum-72b",match:{equals:"alpindale/magnum-72b"},prices:{input_mtok:1.5,output_mtok:2.25}},{id:"amazon/nova-lite-v1",match:{equals:"amazon/nova-lite-v1"},prices:{input_mtok:.06,output_mtok:.24}},{id:"amazon/nova-micro-v1",match:{equals:"amazon/nova-micro-v1"},prices:{input_mtok:.035,output_mtok:.14}},{id:"amazon/nova-pro-v1",match:{equals:"amazon/nova-pro-v1"},prices:{input_mtok:.8,output_mtok:3.2}},{id:"anthracite-org/magnum-v2-72b",match:{equals:"anthracite-org/magnum-v2-72b"},prices:{input_mtok:3,output_mtok:3}},{id:"anthracite-org/magnum-v4-72b",match:{equals:"anthracite-org/magnum-v4-72b"},prices:{input_mtok:1.5,output_mtok:2.25}},{id:"anthropic/claude-2",match:{or:[{equals:"anthropic/claude-2"},{equals:"anthropic/claude-2.0"},{equals:"anthropic/claude-2.0:beta"},{equals:"anthropic/claude-2.1"},{equals:"anthropic/claude-2.1:beta"},{equals:"anthropic/claude-2:beta"}]},prices:{input_mtok:8,output_mtok:24}},{id:"anthropic/claude-3-haiku",match:{or:[{equals:"anthropic/claude-3-haiku"},{equals:"anthropic/claude-3-haiku:beta"}]},prices:{input_mtok:.25,output_mtok:1.25}},{id:"anthropic/claude-3-opus",match:{or:[{equals:"anthropic/claude-3-opus"},{equals:"anthropic/claude-3-opus:beta"}]},prices:{input_mtok:15,output_mtok:75}},{id:"anthropic/claude-3-sonnet",match:{or:[{equals:"anthropic/claude-3-sonnet"},{equals:"anthropic/claude-3-sonnet:beta"}]},prices:{input_mtok:3,output_mtok:15}},{id:"anthropic/claude-3.5-haiku",match:{or:[{equals:"anthropic/claude-3.5-haiku"},{equals:"anthropic/claude-3.5-haiku-20241022"},{equals:"anthropic/claude-3.5-haiku-20241022:beta"},{equals:"anthropic/claude-3.5-haiku:beta"}]},prices:{input_mtok:.8,output_mtok:4}},{id:"anthropic/claude-3.5-sonnet",match:{or:[{equals:"anthropic/claude-3.5-sonnet"},{equals:"anthropic/claude-3.5-sonnet-20240620"},{equals:"anthropic/claude-3.5-sonnet-20240620:beta"},{equals:"anthropic/claude-3.5-sonnet:beta"}]},prices:{input_mtok:3,output_mtok:15}},{id:"anthropic/claude-3.7-sonnet",match:{or:[{equals:"anthropic/claude-3.7-sonnet"},{equals:"anthropic/claude-3.7-sonnet:beta"},{equals:"anthropic/claude-3.7-sonnet:thinking"}]},prices:{input_mtok:3,output_mtok:15}},{id:"anubis-pro-105b-v1",name:"Anubis Pro 105B V1",match:{equals:"anubis-pro-105b-v1"},prices:{input_mtok:.8,output_mtok:1}},{id:"arcee-blitz",name:"Arcee Blitz",match:{equals:"arcee-blitz"},prices:{input_mtok:.45,output_mtok:.75}},{id:"arliai/qwq-32b-arliai-rpr-v1:free",match:{equals:"arliai/qwq-32b-arliai-rpr-v1:free"},prices:{}},{id:"bytedance-research/ui-tars-72b:free",match:{equals:"bytedance-research/ui-tars-72b:free"},prices:{}},{id:"caller-large",name:"Caller Large",match:{equals:"caller-large"},prices:{input_mtok:.55,output_mtok:.85}},{id:"chatgpt-4o-latest",name:"ChatGPT-4o",match:{equals:"chatgpt-4o-latest"},prices:{input_mtok:5,output_mtok:15}},{id:"claude-2",name:"Claude v2",match:{or:[{equals:"claude-2"},{equals:"claude-2.0"},{equals:"claude-2.0:beta"},{equals:"claude-2.1"},{equals:"claude-2.1:beta"},{equals:"claude-2:beta"}]},prices:{input_mtok:8,output_mtok:24}},{id:"claude-3-haiku",name:"Claude 3 Haiku",match:{or:[{equals:"claude-3-haiku"},{equals:"claude-3-haiku:beta"}]},prices:{input_mtok:.25,cache_write_mtok:.3,cache_read_mtok:.03,output_mtok:1.25}},{id:"claude-3-opus",name:"Claude 3 Opus",match:{or:[{equals:"claude-3-opus"},{equals:"claude-3-opus:beta"}]},prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-3-sonnet",name:"Claude 3 Sonnet",match:{or:[{equals:"claude-3-sonnet"},{equals:"claude-3-sonnet:beta"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3.5-haiku",name:"Claude 3.5 Haiku",match:{or:[{equals:"claude-3.5-haiku"},{equals:"claude-3.5-haiku-20241022"},{equals:"claude-3.5-haiku-20241022:beta"},{equals:"claude-3.5-haiku:beta"}]},prices:{input_mtok:.8,cache_write_mtok:1,cache_read_mtok:.08,output_mtok:4}},{id:"claude-3.5-sonnet",name:"Claude 3.5 Sonnet",match:{or:[{equals:"claude-3.5-sonnet"},{equals:"claude-3.5-sonnet-20240620"},{equals:"claude-3.5-sonnet-20240620:beta"},{equals:"claude-3.5-sonnet:beta"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3.7-sonnet",name:"Claude 3.7 Sonnet",match:{or:[{equals:"claude-3.7-sonnet"},{equals:"claude-3.7-sonnet:beta"},{equals:"claude-3.7-sonnet:thinking"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-opus-4",name:"Claude Opus 4",match:{equals:"claude-opus-4"},prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-sonnet-4",name:"Claude Sonnet 4",match:{equals:"claude-sonnet-4"},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"codellama-7b-instruct-solidity",name:"CodeLLaMa 7B Instruct Solidity",match:{equals:"codellama-7b-instruct-solidity"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"coder-large",name:"Coder Large",match:{equals:"coder-large"},prices:{input_mtok:.5,output_mtok:.8}},{id:"codestral-2501",name:"Codestral 2501",match:{equals:"codestral-2501"},prices:{input_mtok:.3,output_mtok:.9}},{id:"codex-mini",name:"Codex Mini",match:{equals:"codex-mini"},prices:{input_mtok:1.5,cache_read_mtok:.375,output_mtok:6}},{id:"cognitivecomputations/dolphin-mixtral-8x22b",match:{equals:"cognitivecomputations/dolphin-mixtral-8x22b"},prices:{input_mtok:.9,output_mtok:.9}},{id:"cognitivecomputations/dolphin-mixtral-8x7b",match:{equals:"cognitivecomputations/dolphin-mixtral-8x7b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"cognitivecomputations/dolphin3.0-mistral-24b:free",match:{equals:"cognitivecomputations/dolphin3.0-mistral-24b:free"},prices:{}},{id:"cognitivecomputations/dolphin3.0-r1-mistral-24b:free",match:{equals:"cognitivecomputations/dolphin3.0-r1-mistral-24b:free"},prices:{}},{id:"cohere/command",match:{equals:"cohere/command"},prices:{input_mtok:1,output_mtok:2}},{id:"cohere/command-a",match:{equals:"cohere/command-a"},prices:{input_mtok:2.5,output_mtok:10}},{id:"cohere/command-r",match:{or:[{equals:"cohere/command-r"},{equals:"cohere/command-r-03-2024"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"cohere/command-r-08-2024",match:{equals:"cohere/command-r-08-2024"},prices:{input_mtok:.15,output_mtok:.6}},{id:"cohere/command-r-plus",match:{or:[{equals:"cohere/command-r-plus"},{equals:"cohere/command-r-plus-04-2024"}]},prices:{input_mtok:3,output_mtok:15}},{id:"cohere/command-r-plus-08-2024",match:{equals:"cohere/command-r-plus-08-2024"},prices:{input_mtok:2.5,output_mtok:10}},{id:"cohere/command-r7b-12-2024",match:{equals:"cohere/command-r7b-12-2024"},prices:{input_mtok:.0375,output_mtok:.15}},{id:"command",name:"Command",match:{equals:"command"},prices:{input_mtok:1,output_mtok:2}},{id:"command-a",name:"Command A",match:{equals:"command-a"},prices:{input_mtok:2.5,output_mtok:10}},{id:"command-r",name:"Command R",match:{or:[{equals:"command-r"},{equals:"command-r-03-2024"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"command-r-08-2024",name:"Command R (08-2024)",match:{equals:"command-r-08-2024"},prices:{input_mtok:.15,output_mtok:.6}},{id:"command-r-plus",name:"Command R+",match:{or:[{equals:"command-r-plus"},{equals:"command-r-plus-04-2024"}]},prices:{input_mtok:3,output_mtok:15}},{id:"command-r-plus-08-2024",name:"Command R+ (08-2024)",match:{equals:"command-r-plus-08-2024"},prices:{input_mtok:2.5,output_mtok:10}},{id:"command-r7b-12-2024",name:"Command R7B (12-2024)",match:{equals:"command-r7b-12-2024"},prices:{input_mtok:.0375,output_mtok:.15}},{id:"deepcoder-14b-preview:free",name:"Deepcoder 14B Preview (free)",match:{equals:"deepcoder-14b-preview:free"},prices:{}},{id:"deephermes-3-llama-3-8b-preview:free",name:"DeepHermes 3 Llama 3 8B Preview (free)",match:{equals:"deephermes-3-llama-3-8b-preview:free"},prices:{}},{id:"deepseek-chat",name:"DeepSeek V3",match:{equals:"deepseek-chat"},prices:{input_mtok:.38,output_mtok:.89}},{id:"deepseek-chat-v3-0324",name:"DeepSeek V3 0324",match:{equals:"deepseek-chat-v3-0324"},prices:{input_mtok:.3,output_mtok:.88}},{id:"deepseek-chat-v3-0324:free",name:"DeepSeek V3 0324 (free)",match:{equals:"deepseek-chat-v3-0324:free"},prices:{}},{id:"deepseek-chat:free",name:"DeepSeek V3 (free)",match:{equals:"deepseek-chat:free"},prices:{}},{id:"deepseek-prover-v2",name:"DeepSeek Prover V2",match:{equals:"deepseek-prover-v2"},prices:{input_mtok:.5,output_mtok:2.18}},{id:"deepseek-r1",name:"R1",match:{equals:"deepseek-r1"},prices:{input_mtok:.45,output_mtok:2.15}},{id:"deepseek-r1-0528",name:"R1 0528",match:{equals:"deepseek-r1-0528"},prices:{input_mtok:.5,output_mtok:2.15}},{id:"deepseek-r1-0528-qwen3-8b",name:"Deepseek R1 0528 Qwen3 8B",match:{equals:"deepseek-r1-0528-qwen3-8b"},prices:{input_mtok:.05,output_mtok:.1}},{id:"deepseek-r1-0528-qwen3-8b:free",name:"Deepseek R1 0528 Qwen3 8B (free)",match:{equals:"deepseek-r1-0528-qwen3-8b:free"},prices:{}},{id:"deepseek-r1-0528:free",name:"R1 0528 (free)",match:{equals:"deepseek-r1-0528:free"},prices:{}},{id:"deepseek-r1-distill-llama-70b",name:"R1 Distill Llama 70B",match:{equals:"deepseek-r1-distill-llama-70b"},prices:{input_mtok:.1,output_mtok:.4}},{id:"deepseek-r1-distill-llama-70b:free",name:"R1 Distill Llama 70B (free)",match:{equals:"deepseek-r1-distill-llama-70b:free"},prices:{}},{id:"deepseek-r1-distill-llama-8b",name:"R1 Distill Llama 8B",match:{equals:"deepseek-r1-distill-llama-8b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"deepseek-r1-distill-qwen-1.5b",name:"R1 Distill Qwen 1.5B",match:{equals:"deepseek-r1-distill-qwen-1.5b"},prices:{input_mtok:.18,output_mtok:.18}},{id:"deepseek-r1-distill-qwen-14b",name:"R1 Distill Qwen 14B",match:{equals:"deepseek-r1-distill-qwen-14b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"deepseek-r1-distill-qwen-14b:free",name:"R1 Distill Qwen 14B (free)",match:{equals:"deepseek-r1-distill-qwen-14b:free"},prices:{}},{id:"deepseek-r1-distill-qwen-32b",name:"R1 Distill Qwen 32B",match:{equals:"deepseek-r1-distill-qwen-32b"},prices:{input_mtok:.12,output_mtok:.18}},{id:"deepseek-r1-distill-qwen-32b:free",name:"R1 Distill Qwen 32B (free)",match:{equals:"deepseek-r1-distill-qwen-32b:free"},prices:{}},{id:"deepseek-r1-distill-qwen-7b",name:"R1 Distill Qwen 7B",match:{equals:"deepseek-r1-distill-qwen-7b"},prices:{input_mtok:.1,output_mtok:.2}},{id:"deepseek-r1:free",name:"R1 (free)",match:{equals:"deepseek-r1:free"},prices:{}},{id:"deepseek-r1t-chimera:free",name:"DeepSeek R1T Chimera (free)",match:{equals:"deepseek-r1t-chimera:free"},prices:{}},{id:"deepseek-v3-base:free",name:"DeepSeek V3 Base (free)",match:{equals:"deepseek-v3-base:free"},prices:{}},{id:"deepseek-v3.1-terminus",name:"DeepSeek V3.1 Terminus",match:{equals:"deepseek-v3.1-terminus"},context_window:163840,prices:{input_mtok:.23,output_mtok:.9}},{id:"deepseek/deepseek-chat",match:{equals:"deepseek/deepseek-chat"},prices:{input_mtok:.38,output_mtok:.89}},{id:"deepseek/deepseek-chat-v3-0324",match:{equals:"deepseek/deepseek-chat-v3-0324"},prices:{input_mtok:.27,output_mtok:1.1}},{id:"deepseek/deepseek-chat-v3-0324:free",match:{equals:"deepseek/deepseek-chat-v3-0324:free"},prices:{}},{id:"deepseek/deepseek-chat-v3.1",name:"DeepSeek Chat V3.1",match:{equals:"deepseek/deepseek-chat-v3.1"},context_window:163840,prices:{input_mtok:.2,output_mtok:.8}},{id:"deepseek/deepseek-chat:free",match:{equals:"deepseek/deepseek-chat:free"},prices:{}},{id:"deepseek/deepseek-r1",match:{equals:"deepseek/deepseek-r1"},prices:{input_mtok:.5,output_mtok:3}},{id:"deepseek/deepseek-r1-distill-llama-70b",match:{equals:"deepseek/deepseek-r1-distill-llama-70b"},prices:{input_mtok:.1,output_mtok:.4}},{id:"deepseek/deepseek-r1-distill-llama-70b:free",match:{equals:"deepseek/deepseek-r1-distill-llama-70b:free"},prices:{}},{id:"deepseek/deepseek-r1-distill-llama-8b",match:{equals:"deepseek/deepseek-r1-distill-llama-8b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"deepseek/deepseek-r1-distill-qwen-1.5b",match:{equals:"deepseek/deepseek-r1-distill-qwen-1.5b"},prices:{input_mtok:.18,output_mtok:.18}},{id:"deepseek/deepseek-r1-distill-qwen-14b",match:{equals:"deepseek/deepseek-r1-distill-qwen-14b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"deepseek/deepseek-r1-distill-qwen-14b:free",match:{equals:"deepseek/deepseek-r1-distill-qwen-14b:free"},prices:{}},{id:"deepseek/deepseek-r1-distill-qwen-32b",match:{equals:"deepseek/deepseek-r1-distill-qwen-32b"},prices:{input_mtok:.12,output_mtok:.18}},{id:"deepseek/deepseek-r1-distill-qwen-32b:free",match:{equals:"deepseek/deepseek-r1-distill-qwen-32b:free"},prices:{}},{id:"deepseek/deepseek-r1-zero:free",match:{equals:"deepseek/deepseek-r1-zero:free"},prices:{}},{id:"deepseek/deepseek-r1:free",match:{equals:"deepseek/deepseek-r1:free"},prices:{}},{id:"deepseek/deepseek-v3-base:free",match:{equals:"deepseek/deepseek-v3-base:free"},prices:{}},{id:"deepseek/deepseek-v3.2-exp",name:"DeepSeek V3.2 Experimental",match:{equals:"deepseek/deepseek-v3.2-exp"},prices:{input_mtok:.27,output_mtok:.4}},{id:"devstral-small",name:"Devstral Small",match:{equals:"devstral-small"},prices:{input_mtok:.06,output_mtok:.12}},{id:"devstral-small:free",name:"Devstral Small (free)",match:{equals:"devstral-small:free"},prices:{}},{id:"dobby-mini-unhinged-plus-llama-3.1-8b",name:"Dobby Mini Plus Llama 3.1 8B",match:{equals:"dobby-mini-unhinged-plus-llama-3.1-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"dolphin-mixtral-8x22b",name:"Dolphin 2.9.2 Mixtral 8x22B 🐬",match:{equals:"dolphin-mixtral-8x22b"},prices:{input_mtok:.9,output_mtok:.9}},{id:"dolphin3.0-mistral-24b:free",name:"Dolphin3.0 Mistral 24B (free)",match:{equals:"dolphin3.0-mistral-24b:free"},prices:{}},{id:"dolphin3.0-r1-mistral-24b:free",name:"Dolphin3.0 R1 Mistral 24B (free)",match:{equals:"dolphin3.0-r1-mistral-24b:free"},prices:{}},{id:"eleutherai/llemma_7b",match:{equals:"eleutherai/llemma_7b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"eva-llama-3.33-70b",name:"EVA Llama 3.33 70B",match:{equals:"eva-llama-3.33-70b"},prices:{input_mtok:4,output_mtok:6}},{id:"eva-qwen-2.5-32b",name:"EVA Qwen2.5 32B",match:{equals:"eva-qwen-2.5-32b"},prices:{input_mtok:2.6,output_mtok:3.4}},{id:"eva-qwen-2.5-72b",name:"EVA Qwen2.5 72B",match:{equals:"eva-qwen-2.5-72b"},prices:{input_mtok:4,output_mtok:6}},{id:"eva-unit-01/eva-llama-3.33-70b",match:{equals:"eva-unit-01/eva-llama-3.33-70b"},prices:{input_mtok:4,output_mtok:6}},{id:"eva-unit-01/eva-qwen-2.5-32b",match:{equals:"eva-unit-01/eva-qwen-2.5-32b"},prices:{input_mtok:2.6,output_mtok:3.4}},{id:"eva-unit-01/eva-qwen-2.5-72b",match:{equals:"eva-unit-01/eva-qwen-2.5-72b"},prices:{input_mtok:.9,output_mtok:1.2}},{id:"featherless/qwerky-72b:free",match:{equals:"featherless/qwerky-72b:free"},prices:{}},{id:"fimbulvetr-11b-v2",name:"Fimbulvetr 11B v2",match:{equals:"fimbulvetr-11b-v2"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"gemini-2.0-flash-001",name:"Gemini 2.0 Flash",match:{equals:"gemini-2.0-flash-001"},prices:{input_mtok:.1,cache_write_mtok:.1833,cache_read_mtok:.025,output_mtok:.4}},{id:"gemini-2.0-flash-exp:free",name:"Gemini 2.0 Flash Experimental (free)",match:{equals:"gemini-2.0-flash-exp:free"},prices:{}},{id:"gemini-2.0-flash-lite-001",name:"Gemini 2.0 Flash Lite",match:{equals:"gemini-2.0-flash-lite-001"},prices:{input_mtok:.075,output_mtok:.3}},{id:"gemini-2.5-flash",name:"Gemini 2.5 Flash",match:{or:[{equals:"gemini-2.5-flash"},{equals:"google/gemini-2.5-flash"}]},prices:{input_mtok:.3,cache_write_mtok:.3833,cache_read_mtok:.075,output_mtok:2.5}},{id:"gemini-2.5-flash-lite-preview-06-17",name:"Gemini 2.5 Flash Lite Preview 06-17",match:{equals:"gemini-2.5-flash-lite-preview-06-17"},prices:{input_mtok:.1,output_mtok:.4}},{id:"gemini-2.5-flash-preview",name:"Gemini 2.5 Flash Preview 04-17",match:{or:[{equals:"gemini-2.5-flash-preview"},{equals:"gemini-2.5-flash-preview-05-20"}]},prices:{input_mtok:.15,cache_write_mtok:.2333,cache_read_mtok:.0375,output_mtok:.6}},{id:"gemini-2.5-flash-preview-05-20:thinking",name:"Gemini 2.5 Flash Preview 05-20 (thinking)",match:{equals:"gemini-2.5-flash-preview-05-20:thinking"},prices:{input_mtok:.15,cache_write_mtok:.2333,cache_read_mtok:.0375,output_mtok:3.5}},{id:"gemini-2.5-flash-preview:thinking",name:"Gemini 2.5 Flash Preview 04-17 (thinking)",match:{equals:"gemini-2.5-flash-preview:thinking"},prices:{input_mtok:.15,cache_write_mtok:.2333,cache_read_mtok:.0375,output_mtok:3.5}},{id:"gemini-2.5-pro",name:"Gemini 2.5 Pro",match:{or:[{equals:"gemini-2.5-pro"},{equals:"gemini-2.5-pro-preview"},{equals:"gemini-2.5-pro-preview-05-06"},{equals:"google/gemini-2.5-pro"},{equals:"google/gemini-2.5-pro-preview"},{equals:"google/gemini-2.5-pro-preview-05-06"}]},prices:{input_mtok:1.25,cache_write_mtok:1.625,cache_read_mtok:.31,output_mtok:10}},{id:"gemini-2.5-pro-exp-03-25",name:"Gemini 2.5 Pro Experimental",match:{equals:"gemini-2.5-pro-exp-03-25"},prices:{}},{id:"gemini-flash-1.5",name:"Gemini 1.5 Flash",match:{equals:"gemini-flash-1.5"},prices:{input_mtok:.075,cache_write_mtok:.1583,cache_read_mtok:.01875,output_mtok:.3}},{id:"gemini-flash-1.5-8b",name:"Gemini 1.5 Flash 8B",match:{equals:"gemini-flash-1.5-8b"},prices:{input_mtok:.0375,cache_write_mtok:.0583,cache_read_mtok:.01,output_mtok:.15}},{id:"gemini-pro-1.5",name:"Gemini 1.5 Pro",match:{equals:"gemini-pro-1.5"},prices:{input_mtok:1.25,output_mtok:5}},{id:"gemma-2-27b-it",name:"Gemma 2 27B",match:{equals:"gemma-2-27b-it"},prices:{input_mtok:.8,output_mtok:.8}},{id:"gemma-2-9b-it",name:"Gemma 2 9B",match:{equals:"gemma-2-9b-it"},prices:{input_mtok:.2,output_mtok:.2}},{id:"gemma-2-9b-it:free",name:"Gemma 2 9B (free)",match:{equals:"gemma-2-9b-it:free"},prices:{}},{id:"gemma-3-12b-it",name:"Gemma 3 12B",match:{equals:"gemma-3-12b-it"},prices:{input_mtok:.05,output_mtok:.1}},{id:"gemma-3-12b-it:free",name:"Gemma 3 12B (free)",match:{equals:"gemma-3-12b-it:free"},prices:{}},{id:"gemma-3-27b-it",name:"Gemma 3 27B",match:{equals:"gemma-3-27b-it"},prices:{input_mtok:.1,output_mtok:.2}},{id:"gemma-3-27b-it:free",name:"Gemma 3 27B (free)",match:{equals:"gemma-3-27b-it:free"},prices:{}},{id:"gemma-3-4b-it",name:"Gemma 3 4B",match:{equals:"gemma-3-4b-it"},prices:{input_mtok:.02,output_mtok:.04}},{id:"gemma-3-4b-it:free",name:"Gemma 3 4B (free)",match:{equals:"gemma-3-4b-it:free"},prices:{}},{id:"gemma-3n-e4b-it:free",name:"Gemma 3n 4B (free)",match:{equals:"gemma-3n-e4b-it:free"},prices:{}},{id:"glm-4-32b",name:"GLM 4 32B",match:{equals:"glm-4-32b"},prices:{input_mtok:.24,output_mtok:.24}},{id:"glm-4-32b:free",name:"GLM 4 32B (free)",match:{equals:"glm-4-32b:free"},prices:{}},{id:"glm-z1-32b",name:"GLM Z1 32B",match:{equals:"glm-z1-32b"},prices:{input_mtok:.24,output_mtok:.24}},{id:"glm-z1-32b:free",name:"GLM Z1 32B (free)",match:{equals:"glm-z1-32b:free"},prices:{}},{id:"glm-z1-rumination-32b",name:"GLM Z1 Rumination 32B",match:{equals:"glm-z1-rumination-32b"},prices:{input_mtok:.24,output_mtok:.24}},{id:"goliath-120b",name:"Goliath 120B",match:{equals:"goliath-120b"},prices:{input_mtok:10,output_mtok:12.5}},{id:"google/gemini-2.0-flash-001",match:{equals:"google/gemini-2.0-flash-001"},prices:{input_mtok:.1,output_mtok:.4}},{id:"google/gemini-2.0-flash-exp:free",match:{equals:"google/gemini-2.0-flash-exp:free"},prices:{}},{id:"google/gemini-2.0-flash-lite-001",match:{equals:"google/gemini-2.0-flash-lite-001"},prices:{input_mtok:.075,output_mtok:.3}},{id:"google/gemini-2.0-flash-thinking-exp-1219:free",match:{equals:"google/gemini-2.0-flash-thinking-exp-1219:free"},prices:{}},{id:"google/gemini-2.0-flash-thinking-exp:free",match:{equals:"google/gemini-2.0-flash-thinking-exp:free"},prices:{}},{id:"google/gemini-2.5-flash-image",name:"Gemini 2.5 Flash Image (Nano Banana)",match:{or:[{equals:"google/gemini-2.5-flash-image"},{equals:"google/gemini-2.5-flash-image-preview"}]},prices:{input_mtok:.3,output_mtok:2.5}},{id:"google/gemini-2.5-flash-lite",name:"Gemini 2.5 Flash Lite",match:{equals:"google/gemini-2.5-flash-lite"},prices:{input_mtok:.1,cache_write_mtok:.183,cache_read_mtok:.025,output_mtok:.4}},{id:"google/gemini-2.5-flash-lite-preview-09-2025",name:"Gemini 2.5 Flash Lite Preview 09-2025",match:{equals:"google/gemini-2.5-flash-lite-preview-09-2025"},prices:{input_mtok:.1,output_mtok:.4}},{id:"google/gemini-2.5-flash-preview",match:{equals:"google/gemini-2.5-flash-preview"},prices:{input_mtok:.15,output_mtok:.6}},{id:"google/gemini-2.5-flash-preview-09-2025",name:"Gemini 2.5 Flash Preview 09-2025",match:{equals:"google/gemini-2.5-flash-preview-09-2025"},prices:{input_mtok:.3,cache_write_mtok:.383,cache_read_mtok:.075,output_mtok:2.5}},{id:"google/gemini-2.5-flash-preview:thinking",match:{equals:"google/gemini-2.5-flash-preview:thinking"},prices:{input_mtok:.15,output_mtok:3.5}},{id:"google/gemini-2.5-pro-exp-03-25:free",match:{equals:"google/gemini-2.5-pro-exp-03-25:free"},prices:{}},{id:"google/gemini-2.5-pro-preview-03-25",match:{equals:"google/gemini-2.5-pro-preview-03-25"},prices:{input_mtok:1.25,output_mtok:10}},{id:"google/gemini-flash-1.5",match:{equals:"google/gemini-flash-1.5"},prices:{input_mtok:.075,output_mtok:.3}},{id:"google/gemini-flash-1.5-8b",match:{equals:"google/gemini-flash-1.5-8b"},prices:{input_mtok:.0375,output_mtok:.15}},{id:"google/gemini-flash-1.5-8b-exp",match:{equals:"google/gemini-flash-1.5-8b-exp"},prices:{}},{id:"google/gemini-pro",match:{or:[{equals:"google/gemini-pro"},{equals:"google/gemini-pro-vision"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"google/gemini-pro-1.5",match:{equals:"google/gemini-pro-1.5"},prices:{input_mtok:1.25,output_mtok:5}},{id:"google/gemma-2-27b-it",match:{equals:"google/gemma-2-27b-it"},prices:{input_mtok:.8,output_mtok:.8}},{id:"google/gemma-2-9b-it",match:{equals:"google/gemma-2-9b-it"},prices:{input_mtok:.07,output_mtok:.07}},{id:"google/gemma-2-9b-it:free",match:{equals:"google/gemma-2-9b-it:free"},prices:{}},{id:"google/gemma-3-12b-it",match:{equals:"google/gemma-3-12b-it"},prices:{input_mtok:.05,output_mtok:.1}},{id:"google/gemma-3-12b-it:free",match:{equals:"google/gemma-3-12b-it:free"},prices:{}},{id:"google/gemma-3-1b-it:free",match:{equals:"google/gemma-3-1b-it:free"},prices:{}},{id:"google/gemma-3-27b-it",match:{equals:"google/gemma-3-27b-it"},prices:{input_mtok:.1,output_mtok:.2}},{id:"google/gemma-3-27b-it:free",match:{equals:"google/gemma-3-27b-it:free"},prices:{}},{id:"google/gemma-3-4b-it",match:{equals:"google/gemma-3-4b-it"},prices:{input_mtok:.02,output_mtok:.04}},{id:"google/gemma-3-4b-it:free",match:{equals:"google/gemma-3-4b-it:free"},prices:{}},{id:"google/learnlm-1.5-pro-experimental:free",match:{equals:"google/learnlm-1.5-pro-experimental:free"},prices:{}},{id:"google/palm-2-chat-bison",match:{or:[{equals:"google/palm-2-chat-bison"},{equals:"google/palm-2-chat-bison-32k"}]},prices:{input_mtok:1,output_mtok:2}},{id:"google/palm-2-codechat-bison",match:{or:[{equals:"google/palm-2-codechat-bison"},{equals:"google/palm-2-codechat-bison-32k"}]},prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo",name:"GPT-3.5 Turbo",match:{or:[{equals:"gpt-3.5-turbo"},{equals:"gpt-3.5-turbo-0125"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"gpt-3.5-turbo-0613",name:"GPT-3.5 Turbo (older v0613)",match:{equals:"gpt-3.5-turbo-0613"},prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo-1106",name:"GPT-3.5 Turbo 16k (older v1106)",match:{equals:"gpt-3.5-turbo-1106"},prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo-16k",name:"GPT-3.5 Turbo 16k",match:{equals:"gpt-3.5-turbo-16k"},prices:{input_mtok:3,output_mtok:4}},{id:"gpt-3.5-turbo-instruct",name:"GPT-3.5 Turbo Instruct",match:{equals:"gpt-3.5-turbo-instruct"},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-4",name:"GPT-4",match:{or:[{equals:"gpt-4"},{equals:"gpt-4-0314"}]},prices:{input_mtok:30,output_mtok:60}},{id:"gpt-4-1106-preview",name:"GPT-4 Turbo (older v1106)",match:{equals:"gpt-4-1106-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-turbo",name:"GPT-4 Turbo",match:{or:[{equals:"gpt-4-turbo"},{equals:"gpt-4-turbo-preview"}]},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4.1",name:"GPT-4.1",match:{equals:"gpt-4.1"},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"gpt-4.1-mini",name:"GPT-4.1 Mini",match:{equals:"gpt-4.1-mini"},prices:{input_mtok:.4,cache_read_mtok:.1,output_mtok:1.6}},{id:"gpt-4.1-nano",name:"GPT-4.1 Nano",match:{equals:"gpt-4.1-nano"},prices:{input_mtok:.1,cache_read_mtok:.025,output_mtok:.4}},{id:"gpt-4.5-preview",name:"GPT-4.5 (Preview)",match:{equals:"gpt-4.5-preview"},prices:{input_mtok:75,cache_read_mtok:37.5,output_mtok:150}},{id:"gpt-4o",name:"GPT-4o",match:{or:[{equals:"gpt-4o"},{equals:"gpt-4o-2024-08-06"},{equals:"gpt-4o-2024-11-20"}]},prices:{input_mtok:2.5,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-4o-2024-05-13",name:"GPT-4o (2024-05-13)",match:{equals:"gpt-4o-2024-05-13"},prices:{input_mtok:5,output_mtok:15}},{id:"gpt-4o-mini",name:"GPT-4o-mini",match:{or:[{equals:"gpt-4o-mini"},{equals:"gpt-4o-mini-2024-07-18"}]},prices:{input_mtok:.15,cache_read_mtok:.075,output_mtok:.6}},{id:"gpt-4o-mini-search-preview",name:"GPT-4o-mini Search Preview",match:{equals:"gpt-4o-mini-search-preview"},prices:{input_mtok:.15,output_mtok:.6}},{id:"gpt-4o-search-preview",name:"GPT-4o Search Preview",match:{equals:"gpt-4o-search-preview"},prices:{input_mtok:2.5,output_mtok:10}},{id:"gpt-4o:extended",name:"GPT-4o (extended)",match:{equals:"gpt-4o:extended"},prices:{input_mtok:6,output_mtok:18}},{id:"grok-2-1212",name:"Grok 2 1212",match:{equals:"grok-2-1212"},prices:{input_mtok:2,output_mtok:10}},{id:"grok-2-vision-1212",name:"Grok 2 Vision 1212",match:{equals:"grok-2-vision-1212"},prices:{input_mtok:2,output_mtok:10}},{id:"grok-3",name:"Grok 3",match:{or:[{equals:"grok-3"},{equals:"grok-3-beta"}]},prices:{input_mtok:3,cache_read_mtok:.75,output_mtok:15}},{id:"grok-3-mini",name:"Grok 3 Mini",match:{or:[{equals:"grok-3-mini"},{equals:"grok-3-mini-beta"}]},prices:{input_mtok:.3,cache_read_mtok:.075,output_mtok:.5}},{id:"grok-beta",name:"Grok Beta",match:{equals:"grok-beta"},prices:{input_mtok:5,output_mtok:15}},{id:"grok-vision-beta",name:"Grok Vision Beta",match:{equals:"grok-vision-beta"},prices:{input_mtok:5,output_mtok:15}},{id:"gryphe/mythomax-l2-13b",match:{equals:"gryphe/mythomax-l2-13b"},prices:{input_mtok:.065,output_mtok:.065}},{id:"hermes-2-pro-llama-3-8b",name:"Hermes 2 Pro - Llama-3 8B",match:{equals:"hermes-2-pro-llama-3-8b"},prices:{input_mtok:.025,output_mtok:.04}},{id:"hermes-3-llama-3.1-405b",name:"Hermes 3 405B Instruct",match:{equals:"hermes-3-llama-3.1-405b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"hermes-3-llama-3.1-70b",name:"Hermes 3 70B Instruct",match:{equals:"hermes-3-llama-3.1-70b"},prices:{input_mtok:.12,output_mtok:.3}},{id:"huggingfaceh4/zephyr-7b-beta:free",match:{equals:"huggingfaceh4/zephyr-7b-beta:free"},prices:{}},{id:"infermatic/mn-inferor-12b",match:{equals:"infermatic/mn-inferor-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"inflection-3-pi",name:"Inflection 3 Pi",match:{equals:"inflection-3-pi"},prices:{input_mtok:2.5,output_mtok:10}},{id:"inflection-3-productivity",name:"Inflection 3 Productivity",match:{equals:"inflection-3-productivity"},prices:{input_mtok:2.5,output_mtok:10}},{id:"inflection/inflection-3-pi",match:{equals:"inflection/inflection-3-pi"},prices:{input_mtok:2.5,output_mtok:10}},{id:"inflection/inflection-3-productivity",match:{equals:"inflection/inflection-3-productivity"},prices:{input_mtok:2.5,output_mtok:10}},{id:"internvl3-14b:free",name:"InternVL3 14B (free)",match:{equals:"internvl3-14b:free"},prices:{}},{id:"internvl3-2b:free",name:"InternVL3 2B (free)",match:{equals:"internvl3-2b:free"},prices:{}},{id:"jamba-1.6-large",name:"Jamba 1.6 Large",match:{equals:"jamba-1.6-large"},prices:{input_mtok:2,output_mtok:8}},{id:"jamba-1.6-mini",name:"Jamba Mini 1.6",match:{equals:"jamba-1.6-mini"},prices:{input_mtok:.2,output_mtok:.4}},{id:"jondurbin/airoboros-l2-70b",match:{equals:"jondurbin/airoboros-l2-70b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"kimi-dev-72b:free",name:"Kimi Dev 72b (free)",match:{equals:"kimi-dev-72b:free"},prices:{}},{id:"kimi-vl-a3b-thinking:free",name:"Kimi VL A3B Thinking (free)",match:{equals:"kimi-vl-a3b-thinking:free"},prices:{}},{id:"l3-euryale-70b",name:"Llama 3 Euryale 70B v2.1",match:{equals:"l3-euryale-70b"},prices:{input_mtok:1.48,output_mtok:1.48}},{id:"l3-lunaris-8b",name:"Llama 3 8B Lunaris",match:{equals:"l3-lunaris-8b"},prices:{input_mtok:.02,output_mtok:.05}},{id:"l3.1-euryale-70b",name:"Llama 3.1 Euryale 70B v2.2",match:{equals:"l3.1-euryale-70b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"l3.3-euryale-70b",name:"Llama 3.3 Euryale 70B",match:{equals:"l3.3-euryale-70b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"latitudegames/wayfarer-large-70b-llama-3.3",match:{equals:"latitudegames/wayfarer-large-70b-llama-3.3"},prices:{input_mtok:.8,output_mtok:.9}},{id:"lfm-3b",name:"LFM 3B",match:{equals:"lfm-3b"},prices:{input_mtok:.02,output_mtok:.02}},{id:"lfm-40b",name:"LFM 40B MoE",match:{equals:"lfm-40b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"lfm-7b",name:"LFM 7B",match:{equals:"lfm-7b"},prices:{input_mtok:.01,output_mtok:.01}},{id:"liquid/lfm-3b",match:{equals:"liquid/lfm-3b"},prices:{input_mtok:.02,output_mtok:.02}},{id:"liquid/lfm-40b",match:{equals:"liquid/lfm-40b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"liquid/lfm-7b",match:{equals:"liquid/lfm-7b"},prices:{input_mtok:.01,output_mtok:.01}},{id:"llama-3-70b-instruct",name:"Llama 3 70B Instruct",match:{equals:"llama-3-70b-instruct"},prices:{input_mtok:.3,output_mtok:.4}},{id:"llama-3-8b-instruct",name:"Llama 3 8B Instruct",match:{equals:"llama-3-8b-instruct"},prices:{input_mtok:.03,output_mtok:.06}},{id:"llama-3-lumimaid-70b",name:"Llama 3 Lumimaid 70B",match:{equals:"llama-3-lumimaid-70b"},prices:{input_mtok:4,output_mtok:6}},{id:"llama-3-lumimaid-8b",name:"Llama 3 Lumimaid 8B",match:{equals:"llama-3-lumimaid-8b"},prices:{input_mtok:.2,output_mtok:1.25}},{id:"llama-3.1-405b",name:"Llama 3.1 405B (base)",match:{equals:"llama-3.1-405b"},prices:{input_mtok:2,output_mtok:2}},{id:"llama-3.1-405b-instruct",name:"Llama 3.1 405B Instruct",match:{equals:"llama-3.1-405b-instruct"},prices:{input_mtok:.8,output_mtok:.8}},{id:"llama-3.1-70b-instruct",name:"Llama 3.1 70B Instruct",match:{equals:"llama-3.1-70b-instruct"},prices:{input_mtok:.1,output_mtok:.28}},{id:"llama-3.1-8b-instruct",name:"Llama 3.1 8B Instruct",match:{equals:"llama-3.1-8b-instruct"},prices:{input_mtok:.016,output_mtok:.029}},{id:"llama-3.1-8b-instruct:free",name:"Llama 3.1 8B Instruct (free)",match:{equals:"llama-3.1-8b-instruct:free"},prices:{}},{id:"llama-3.1-lumimaid-70b",name:"Lumimaid v0.2 70B",match:{equals:"llama-3.1-lumimaid-70b"},prices:{input_mtok:2.5,output_mtok:3}},{id:"llama-3.1-lumimaid-8b",name:"Lumimaid v0.2 8B",match:{equals:"llama-3.1-lumimaid-8b"},prices:{input_mtok:.2,output_mtok:1.25}},{id:"llama-3.1-nemotron-70b-instruct",name:"Llama 3.1 Nemotron 70B Instruct",match:{equals:"llama-3.1-nemotron-70b-instruct"},prices:{input_mtok:.12,output_mtok:.3}},{id:"llama-3.1-nemotron-ultra-253b-v1",name:"Llama 3.1 Nemotron Ultra 253B v1",match:{equals:"llama-3.1-nemotron-ultra-253b-v1"},prices:{input_mtok:.6,output_mtok:1.8}},{id:"llama-3.1-nemotron-ultra-253b-v1:free",name:"Llama 3.1 Nemotron Ultra 253B v1 (free)",match:{equals:"llama-3.1-nemotron-ultra-253b-v1:free"},prices:{}},{id:"llama-3.1-sonar-large-128k-online",name:"Llama 3.1 Sonar 70B Online",match:{equals:"llama-3.1-sonar-large-128k-online"},prices:{input_mtok:1,output_mtok:1}},{id:"llama-3.1-sonar-small-128k-online",name:"Llama 3.1 Sonar 8B Online",match:{equals:"llama-3.1-sonar-small-128k-online"},prices:{input_mtok:.2,output_mtok:.2}},{id:"llama-3.2-11b-vision-instruct",name:"Llama 3.2 11B Vision Instruct",match:{equals:"llama-3.2-11b-vision-instruct"},prices:{input_mtok:.049,output_mtok:.049}},{id:"llama-3.2-11b-vision-instruct:free",name:"Llama 3.2 11B Vision Instruct (free)",match:{equals:"llama-3.2-11b-vision-instruct:free"},prices:{}},{id:"llama-3.2-1b-instruct",name:"Llama 3.2 1B Instruct",match:{equals:"llama-3.2-1b-instruct"},prices:{input_mtok:.005,output_mtok:.01}},{id:"llama-3.2-1b-instruct:free",name:"Llama 3.2 1B Instruct (free)",match:{equals:"llama-3.2-1b-instruct:free"},prices:{}},{id:"llama-3.2-3b-instruct",name:"Llama 3.2 3B Instruct",match:{equals:"llama-3.2-3b-instruct"},prices:{input_mtok:.01,output_mtok:.02}},{id:"llama-3.2-3b-instruct:free",name:"Llama 3.2 3B Instruct (free)",match:{equals:"llama-3.2-3b-instruct:free"},prices:{}},{id:"llama-3.2-90b-vision-instruct",name:"Llama 3.2 90B Vision Instruct",match:{equals:"llama-3.2-90b-vision-instruct"},prices:{input_mtok:1.2,output_mtok:1.2}},{id:"llama-3.3-70b-instruct",name:"Llama 3.3 70B Instruct",match:{equals:"llama-3.3-70b-instruct"},prices:{input_mtok:.05,output_mtok:.24}},{id:"llama-3.3-70b-instruct:free",name:"Llama 3.3 70B Instruct (free)",match:{equals:"llama-3.3-70b-instruct:free"},prices:{}},{id:"llama-3.3-8b-instruct:free",name:"Llama 3.3 8B Instruct (free)",match:{equals:"llama-3.3-8b-instruct:free"},prices:{}},{id:"llama-3.3-nemotron-super-49b-v1",name:"Llama 3.3 Nemotron Super 49B v1",match:{equals:"llama-3.3-nemotron-super-49b-v1"},prices:{input_mtok:.13,output_mtok:.4}},{id:"llama-3.3-nemotron-super-49b-v1:free",name:"Llama 3.3 Nemotron Super 49B v1 (free)",match:{equals:"llama-3.3-nemotron-super-49b-v1:free"},prices:{}},{id:"llama-4-maverick",name:"Llama 4 Maverick",match:{equals:"llama-4-maverick"},prices:{input_mtok:.15,output_mtok:.6}},{id:"llama-4-maverick:free",name:"Llama 4 Maverick (free)",match:{equals:"llama-4-maverick:free"},prices:{}},{id:"llama-4-scout",name:"Llama 4 Scout",match:{equals:"llama-4-scout"},prices:{input_mtok:.08,output_mtok:.3}},{id:"llama-4-scout:free",name:"Llama 4 Scout (free)",match:{equals:"llama-4-scout:free"},prices:{}},{id:"llama-guard-2-8b",name:"LlamaGuard 2 8B",match:{equals:"llama-guard-2-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"llama-guard-3-8b",name:"Llama Guard 3 8B",match:{equals:"llama-guard-3-8b"},prices:{input_mtok:.02,output_mtok:.06}},{id:"llama-guard-4-12b",name:"Llama Guard 4 12B",match:{equals:"llama-guard-4-12b"},prices:{input_mtok:.05,output_mtok:.05}},{id:"llama3.1-typhoon2-70b-instruct",name:"Typhoon2 70B Instruct",match:{equals:"llama3.1-typhoon2-70b-instruct"},prices:{input_mtok:.88,output_mtok:.88}},{id:"llemma_7b",name:"Llemma 7b",match:{equals:"llemma_7b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"maestro-reasoning",name:"Maestro Reasoning",match:{equals:"maestro-reasoning"},prices:{input_mtok:.9,output_mtok:3.3}},{id:"magistral-medium-2506",name:"Magistral Medium 2506",match:{or:[{equals:"magistral-medium-2506"},{equals:"magistral-medium-2506:thinking"}]},prices:{input_mtok:2,output_mtok:5}},{id:"magistral-small-2506",name:"Magistral Small 2506",match:{equals:"magistral-small-2506"},prices:{input_mtok:.5,output_mtok:1.5}},{id:"magnum-72b",name:"Magnum 72B",match:{equals:"magnum-72b"},prices:{input_mtok:4,output_mtok:6}},{id:"magnum-v2-72b",name:"Magnum v2 72B",match:{equals:"magnum-v2-72b"},prices:{input_mtok:3,output_mtok:3}},{id:"magnum-v4-72b",name:"Magnum v4 72B",match:{equals:"magnum-v4-72b"},prices:{input_mtok:2.5,output_mtok:3}},{id:"mai-ds-r1:free",name:"MAI DS R1 (free)",match:{equals:"mai-ds-r1:free"},prices:{}},{id:"mancer/weaver",match:{equals:"mancer/weaver"},prices:{input_mtok:1.125,output_mtok:1.125}},{id:"mercury-coder-small-beta",name:"Mercury Coder Small Beta",match:{equals:"mercury-coder-small-beta"},prices:{input_mtok:.25,output_mtok:1}},{id:"meta-llama/llama-2-13b-chat",match:{equals:"meta-llama/llama-2-13b-chat"},prices:{input_mtok:.22,output_mtok:.22}},{id:"meta-llama/llama-2-70b-chat",match:{equals:"meta-llama/llama-2-70b-chat"},prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/llama-3-70b-instruct",match:{equals:"meta-llama/llama-3-70b-instruct"},prices:{input_mtok:.3,output_mtok:.4}},{id:"meta-llama/llama-3-8b-instruct",match:{equals:"meta-llama/llama-3-8b-instruct"},prices:{input_mtok:.03,output_mtok:.06}},{id:"meta-llama/llama-3.1-405b",match:{equals:"meta-llama/llama-3.1-405b"},prices:{input_mtok:2,output_mtok:2}},{id:"meta-llama/llama-3.1-405b-instruct",match:{equals:"meta-llama/llama-3.1-405b-instruct"},prices:{input_mtok:.8,output_mtok:.8}},{id:"meta-llama/llama-3.1-405b:free",match:{equals:"meta-llama/llama-3.1-405b:free"},prices:{}},{id:"meta-llama/llama-3.1-70b-instruct",match:{equals:"meta-llama/llama-3.1-70b-instruct"},prices:{input_mtok:.119,output_mtok:.39}},{id:"meta-llama/llama-3.1-8b-instruct",match:{equals:"meta-llama/llama-3.1-8b-instruct"},prices:{input_mtok:.02,output_mtok:.03}},{id:"meta-llama/llama-3.1-8b-instruct:free",match:{equals:"meta-llama/llama-3.1-8b-instruct:free"},prices:{}},{id:"meta-llama/llama-3.2-11b-vision-instruct",match:{equals:"meta-llama/llama-3.2-11b-vision-instruct"},prices:{input_mtok:.049,output_mtok:.049}},{id:"meta-llama/llama-3.2-11b-vision-instruct:free",match:{equals:"meta-llama/llama-3.2-11b-vision-instruct:free"},prices:{}},{id:"meta-llama/llama-3.2-1b-instruct",match:{equals:"meta-llama/llama-3.2-1b-instruct"},prices:{input_mtok:.01,output_mtok:.01}},{id:"meta-llama/llama-3.2-1b-instruct:free",match:{equals:"meta-llama/llama-3.2-1b-instruct:free"},prices:{}},{id:"meta-llama/llama-3.2-3b-instruct",match:{equals:"meta-llama/llama-3.2-3b-instruct"},prices:{input_mtok:.015,output_mtok:.025}},{id:"meta-llama/llama-3.2-3b-instruct:free",match:{equals:"meta-llama/llama-3.2-3b-instruct:free"},prices:{}},{id:"meta-llama/llama-3.2-90b-vision-instruct",match:{equals:"meta-llama/llama-3.2-90b-vision-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/llama-3.3-70b-instruct",match:{equals:"meta-llama/llama-3.3-70b-instruct"},prices:{input_mtok:.1,output_mtok:.25}},{id:"meta-llama/llama-3.3-70b-instruct:free",match:{equals:"meta-llama/llama-3.3-70b-instruct:free"},prices:{}},{id:"meta-llama/llama-4-maverick",match:{equals:"meta-llama/llama-4-maverick"},prices:{input_mtok:.17,output_mtok:.85}},{id:"meta-llama/llama-4-maverick:free",match:{equals:"meta-llama/llama-4-maverick:free"},prices:{}},{id:"meta-llama/llama-4-scout",match:{equals:"meta-llama/llama-4-scout"},prices:{input_mtok:.08,output_mtok:.3}},{id:"meta-llama/llama-4-scout:free",match:{equals:"meta-llama/llama-4-scout:free"},prices:{}},{id:"meta-llama/llama-guard-2-8b",match:{equals:"meta-llama/llama-guard-2-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"meta-llama/llama-guard-3-8b",match:{equals:"meta-llama/llama-guard-3-8b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"microsoft/phi-3-medium-128k-instruct",match:{equals:"microsoft/phi-3-medium-128k-instruct"},prices:{input_mtok:1,output_mtok:1}},{id:"microsoft/phi-3-mini-128k-instruct",match:{equals:"microsoft/phi-3-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"microsoft/phi-3.5-mini-128k-instruct",match:{equals:"microsoft/phi-3.5-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"microsoft/phi-4",match:{equals:"microsoft/phi-4"},prices:{input_mtok:.07,output_mtok:.14}},{id:"microsoft/phi-4-multimodal-instruct",match:{equals:"microsoft/phi-4-multimodal-instruct"},prices:{input_mtok:.05,output_mtok:.1}},{id:"microsoft/wizardlm-2-7b",match:{equals:"microsoft/wizardlm-2-7b"},prices:{input_mtok:.07,output_mtok:.07}},{id:"microsoft/wizardlm-2-8x22b",match:{equals:"microsoft/wizardlm-2-8x22b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"midnight-rose-70b",name:"Midnight Rose 70B",match:{equals:"midnight-rose-70b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"minimax-01",name:"MiniMax-01",match:{equals:"minimax-01"},prices:{input_mtok:.2,output_mtok:1.1}},{id:"minimax-m1",name:"MiniMax M1",match:{equals:"minimax-m1"},prices:{input_mtok:.3,output_mtok:1.65}},{id:"minimax-m1:extended",name:"MiniMax M1 (extended)",match:{equals:"minimax-m1:extended"},prices:{input_mtok:.55,output_mtok:2.2}},{id:"minimax/minimax-01",match:{equals:"minimax/minimax-01"},prices:{input_mtok:.2,output_mtok:1.1}},{id:"ministral-3b",name:"Ministral 3B",match:{equals:"ministral-3b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"ministral-8b",name:"Ministral 8B",match:{equals:"ministral-8b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistral-7b-instruct",name:"Mistral 7B Instruct",match:{or:[{equals:"mistral-7b-instruct"},{equals:"mistral-7b-instruct-v0.3"}]},prices:{input_mtok:.028,output_mtok:.054}},{id:"mistral-7b-instruct-v0.1",name:"Mistral 7B Instruct v0.1",match:{equals:"mistral-7b-instruct-v0.1"},prices:{input_mtok:.11,output_mtok:.19}},{id:"mistral-7b-instruct-v0.2",name:"Mistral 7B Instruct v0.2",match:{equals:"mistral-7b-instruct-v0.2"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistral-7b-instruct:free",name:"Mistral 7B Instruct (free)",match:{equals:"mistral-7b-instruct:free"},prices:{}},{id:"mistral-large",name:"Mistral Large",match:{or:[{equals:"mistral-large"},{equals:"mistral-large-2407"},{equals:"mistral-large-2411"}]},prices:{input_mtok:2,output_mtok:6}},{id:"mistral-medium",name:"Mistral Medium",match:{equals:"mistral-medium"},prices:{input_mtok:2.75,output_mtok:8.1}},{id:"mistral-medium-3",name:"Mistral Medium 3",match:{equals:"mistral-medium-3"},prices:{input_mtok:.4,output_mtok:2}},{id:"mistral-nemo",name:"Mistral Nemo",match:{equals:"mistral-nemo"},prices:{input_mtok:.01,output_mtok:.019}},{id:"mistral-nemo:free",name:"Mistral Nemo (free)",match:{equals:"mistral-nemo:free"},prices:{}},{id:"mistral-saba",name:"Saba",match:{equals:"mistral-saba"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistral-small",name:"Mistral Small",match:{equals:"mistral-small"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistral-small-24b-instruct-2501",name:"Mistral Small 3",match:{equals:"mistral-small-24b-instruct-2501"},prices:{input_mtok:.05,output_mtok:.09}},{id:"mistral-small-24b-instruct-2501:free",name:"Mistral Small 3 (free)",match:{equals:"mistral-small-24b-instruct-2501:free"},prices:{}},{id:"mistral-small-3.1-24b-instruct",name:"Mistral Small 3.1 24B",match:{equals:"mistral-small-3.1-24b-instruct"},prices:{input_mtok:.05,output_mtok:.15}},{id:"mistral-small-3.1-24b-instruct:free",name:"Mistral Small 3.1 24B (free)",match:{equals:"mistral-small-3.1-24b-instruct:free"},prices:{}},{id:"mistral-small-3.2-24b-instruct:free",name:"Mistral Small 3.2 24B (free)",match:{equals:"mistral-small-3.2-24b-instruct:free"},prices:{}},{id:"mistral-tiny",name:"Mistral Tiny",match:{equals:"mistral-tiny"},prices:{input_mtok:.25,output_mtok:.25}},{id:"mistral/ministral-8b",match:{equals:"mistral/ministral-8b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistralai/codestral-2501",match:{equals:"mistralai/codestral-2501"},prices:{input_mtok:.3,output_mtok:.9}},{id:"mistralai/codestral-mamba",match:{equals:"mistralai/codestral-mamba"},prices:{input_mtok:.25,output_mtok:.25}},{id:"mistralai/ministral-3b",match:{equals:"mistralai/ministral-3b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"mistralai/ministral-8b",match:{equals:"mistralai/ministral-8b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistralai/mistral-7b-instruct",match:{or:[{equals:"mistralai/mistral-7b-instruct"},{equals:"mistralai/mistral-7b-instruct-v0.3"}]},prices:{input_mtok:.029,output_mtok:.059}},{id:"mistralai/mistral-7b-instruct-v0.1",match:{equals:"mistralai/mistral-7b-instruct-v0.1"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/mistral-7b-instruct-v0.2",match:{equals:"mistralai/mistral-7b-instruct-v0.2"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/mistral-7b-instruct:free",match:{equals:"mistralai/mistral-7b-instruct:free"},prices:{}},{id:"mistralai/mistral-large",match:{or:[{equals:"mistralai/mistral-large"},{equals:"mistralai/mistral-large-2407"},{equals:"mistralai/mistral-large-2411"}]},prices:{input_mtok:2,output_mtok:6}},{id:"mistralai/mistral-medium",match:{equals:"mistralai/mistral-medium"},prices:{input_mtok:2.75,output_mtok:8.1}},{id:"mistralai/mistral-nemo",match:{equals:"mistralai/mistral-nemo"},prices:{input_mtok:.035,output_mtok:.08}},{id:"mistralai/mistral-nemo:free",match:{equals:"mistralai/mistral-nemo:free"},prices:{}},{id:"mistralai/mistral-saba",match:{equals:"mistralai/mistral-saba"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistralai/mistral-small",match:{equals:"mistralai/mistral-small"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistralai/mistral-small-24b-instruct-2501",match:{equals:"mistralai/mistral-small-24b-instruct-2501"},prices:{input_mtok:.07,output_mtok:.14}},{id:"mistralai/mistral-small-24b-instruct-2501:free",match:{equals:"mistralai/mistral-small-24b-instruct-2501:free"},prices:{}},{id:"mistralai/mistral-small-3.1-24b-instruct",match:{equals:"mistralai/mistral-small-3.1-24b-instruct"},prices:{input_mtok:.1,output_mtok:.3}},{id:"mistralai/mistral-small-3.1-24b-instruct:free",match:{equals:"mistralai/mistral-small-3.1-24b-instruct:free"},prices:{}},{id:"mistralai/mistral-tiny",match:{equals:"mistralai/mistral-tiny"},prices:{input_mtok:.25,output_mtok:.25}},{id:"mistralai/mixtral-8x22b-instruct",match:{equals:"mistralai/mixtral-8x22b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"mistralai/mixtral-8x7b-instruct",match:{equals:"mistralai/mixtral-8x7b-instruct"},prices:{input_mtok:.24,output_mtok:.24}},{id:"mistralai/pixtral-12b",match:{equals:"mistralai/pixtral-12b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistralai/pixtral-large-2411",match:{equals:"mistralai/pixtral-large-2411"},prices:{input_mtok:2,output_mtok:6}},{id:"mixtral-8x22b-instruct",name:"Mixtral 8x22B Instruct",match:{equals:"mixtral-8x22b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"mixtral-8x7b-instruct",name:"Mixtral 8x7B Instruct",match:{equals:"mixtral-8x7b-instruct"},prices:{input_mtok:.08,output_mtok:.24}},{id:"mn-celeste-12b",name:"Mistral Nemo 12B Celeste",match:{equals:"mn-celeste-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"mn-inferor-12b",name:"Mistral Nemo Inferor 12B",match:{equals:"mn-inferor-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"mn-starcannon-12b",name:"Starcannon 12B",match:{equals:"mn-starcannon-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"moonshotai/kimi-vl-a3b-thinking:free",match:{equals:"moonshotai/kimi-vl-a3b-thinking:free"},prices:{}},{id:"moonshotai/moonlight-16b-a3b-instruct:free",match:{equals:"moonshotai/moonlight-16b-a3b-instruct:free"},prices:{}},{id:"mythalion-13b",name:"Mythalion 13B",match:{equals:"mythalion-13b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"mythomax-l2-13b",name:"MythoMax 13B",match:{equals:"mythomax-l2-13b"},prices:{input_mtok:.065,output_mtok:.065}},{id:"neversleep/llama-3-lumimaid-70b",match:{equals:"neversleep/llama-3-lumimaid-70b"},prices:{input_mtok:3.375,output_mtok:4.5}},{id:"neversleep/llama-3-lumimaid-8b",match:{or:[{equals:"neversleep/llama-3-lumimaid-8b"},{equals:"neversleep/llama-3-lumimaid-8b:extended"}]},prices:{input_mtok:.09375,output_mtok:.75}},{id:"neversleep/llama-3.1-lumimaid-70b",match:{equals:"neversleep/llama-3.1-lumimaid-70b"},prices:{input_mtok:1.5,output_mtok:2.25}},{id:"neversleep/llama-3.1-lumimaid-8b",match:{equals:"neversleep/llama-3.1-lumimaid-8b"},prices:{input_mtok:.09375,output_mtok:.75}},{id:"neversleep/noromaid-20b",match:{equals:"neversleep/noromaid-20b"},prices:{input_mtok:.75,output_mtok:1.5}},{id:"noromaid-20b",name:"Noromaid 20B",match:{equals:"noromaid-20b"},prices:{input_mtok:1.25,output_mtok:2}},{id:"nothingiisreal/mn-celeste-12b",match:{equals:"nothingiisreal/mn-celeste-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"nous-hermes-2-mixtral-8x7b-dpo",name:"Hermes 2 Mixtral 8x7B DPO",match:{equals:"nous-hermes-2-mixtral-8x7b-dpo"},prices:{input_mtok:.6,output_mtok:.6}},{id:"nousresearch/deephermes-3-llama-3-8b-preview:free",match:{equals:"nousresearch/deephermes-3-llama-3-8b-preview:free"},prices:{}},{id:"nousresearch/hermes-2-pro-llama-3-8b",match:{equals:"nousresearch/hermes-2-pro-llama-3-8b"},prices:{input_mtok:.025,output_mtok:.04}},{id:"nousresearch/hermes-3-llama-3.1-405b",match:{equals:"nousresearch/hermes-3-llama-3.1-405b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"nousresearch/hermes-3-llama-3.1-70b",match:{equals:"nousresearch/hermes-3-llama-3.1-70b"},prices:{input_mtok:.12,output_mtok:.3}},{id:"nousresearch/nous-hermes-2-mixtral-8x7b-dpo",match:{equals:"nousresearch/nous-hermes-2-mixtral-8x7b-dpo"},prices:{input_mtok:.6,output_mtok:.6}},{id:"nousresearch/nous-hermes-llama2-13b",match:{equals:"nousresearch/nous-hermes-llama2-13b"},prices:{input_mtok:.18,output_mtok:.18}},{id:"nova-lite-v1",name:"Nova Lite 1.0",match:{equals:"nova-lite-v1"},prices:{input_mtok:.06,output_mtok:.24}},{id:"nova-micro-v1",name:"Nova Micro 1.0",match:{equals:"nova-micro-v1"},prices:{input_mtok:.035,output_mtok:.14}},{id:"nova-pro-v1",name:"Nova Pro 1.0",match:{equals:"nova-pro-v1"},prices:{input_mtok:.8,output_mtok:3.2}},{id:"nvidia/llama-3.1-nemotron-70b-instruct",match:{equals:"nvidia/llama-3.1-nemotron-70b-instruct"},prices:{input_mtok:.12,output_mtok:.3}},{id:"nvidia/llama-3.1-nemotron-70b-instruct:free",match:{equals:"nvidia/llama-3.1-nemotron-70b-instruct:free"},prices:{}},{id:"nvidia/llama-3.1-nemotron-nano-8b-v1:free",match:{equals:"nvidia/llama-3.1-nemotron-nano-8b-v1:free"},prices:{}},{id:"nvidia/llama-3.1-nemotron-ultra-253b-v1:free",match:{equals:"nvidia/llama-3.1-nemotron-ultra-253b-v1:free"},prices:{}},{id:"nvidia/llama-3.3-nemotron-super-49b-v1:free",match:{equals:"nvidia/llama-3.3-nemotron-super-49b-v1:free"},prices:{}},{id:"o1",name:"o1",match:{or:[{equals:"o1"},{equals:"o1-preview"},{equals:"o1-preview-2024-09-12"}]},prices:{input_mtok:15,cache_read_mtok:7.5,output_mtok:60}},{id:"o1-mini",name:"o1-mini",match:{or:[{equals:"o1-mini"},{equals:"o1-mini-2024-09-12"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o1-pro",name:"o1-pro",match:{equals:"o1-pro"},prices:{input_mtok:150,output_mtok:600}},{id:"o3",name:"o3",match:{equals:"o3"},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"o3-mini",name:"o3 Mini",match:{or:[{equals:"o3-mini"},{equals:"o3-mini-high"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o3-pro",name:"o3 Pro",match:{equals:"o3-pro"},prices:{input_mtok:20,output_mtok:80}},{id:"o4-mini",name:"o4 Mini",match:{or:[{equals:"o4-mini"},{equals:"o4-mini-high"}]},prices:{input_mtok:1.1,cache_read_mtok:.275,output_mtok:4.4}},{id:"open-r1/olympiccoder-32b:free",match:{equals:"open-r1/olympiccoder-32b:free"},prices:{}},{id:"open-r1/olympiccoder-7b:free",match:{equals:"open-r1/olympiccoder-7b:free"},prices:{}},{id:"openai/chatgpt-4o-latest",match:{equals:"openai/chatgpt-4o-latest"},prices:{input_mtok:5,output_mtok:15}},{id:"openai/gpt-3.5-turbo",match:{or:[{equals:"openai/gpt-3.5-turbo"},{equals:"openai/gpt-3.5-turbo-0125"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"openai/gpt-3.5-turbo-0613",match:{equals:"openai/gpt-3.5-turbo-0613"},prices:{input_mtok:1,output_mtok:2}},{id:"openai/gpt-3.5-turbo-1106",match:{equals:"openai/gpt-3.5-turbo-1106"},prices:{input_mtok:1,output_mtok:2}},{id:"openai/gpt-3.5-turbo-16k",match:{equals:"openai/gpt-3.5-turbo-16k"},prices:{input_mtok:3,output_mtok:4}},{id:"openai/gpt-3.5-turbo-instruct",match:{equals:"openai/gpt-3.5-turbo-instruct"},prices:{input_mtok:1.5,output_mtok:2}},{id:"openai/gpt-4",match:{or:[{equals:"openai/gpt-4"},{equals:"openai/gpt-4-0314"}]},prices:{input_mtok:30,output_mtok:60}},{id:"openai/gpt-4-1106-preview",match:{equals:"openai/gpt-4-1106-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"openai/gpt-4-32k",match:{or:[{equals:"openai/gpt-4-32k"},{equals:"openai/gpt-4-32k-0314"}]},prices:{input_mtok:60,output_mtok:120}},{id:"openai/gpt-4-turbo",match:{or:[{equals:"openai/gpt-4-turbo"},{equals:"openai/gpt-4-turbo-preview"}]},prices:{input_mtok:10,output_mtok:30}},{id:"openai/gpt-4.1",match:{equals:"openai/gpt-4.1"},prices:{input_mtok:2,output_mtok:8}},{id:"openai/gpt-4.1-mini",match:{equals:"openai/gpt-4.1-mini"},prices:{input_mtok:.4,output_mtok:1.6}},{id:"openai/gpt-4.1-nano",match:{equals:"openai/gpt-4.1-nano"},prices:{input_mtok:.1,output_mtok:.4}},{id:"openai/gpt-4.5-preview",match:{equals:"openai/gpt-4.5-preview"},prices:{input_mtok:75,output_mtok:150}},{id:"openai/gpt-4o",match:{or:[{equals:"openai/gpt-4o"},{equals:"openai/gpt-4o-2024-08-06"},{equals:"openai/gpt-4o-2024-11-20"},{equals:"openai/gpt-4o-search-preview"}]},prices:{input_mtok:2.5,output_mtok:10}},{id:"openai/gpt-4o-2024-05-13",match:{equals:"openai/gpt-4o-2024-05-13"},prices:{input_mtok:5,output_mtok:15}},{id:"openai/gpt-4o-mini",match:{or:[{equals:"openai/gpt-4o-mini"},{equals:"openai/gpt-4o-mini-2024-07-18"},{equals:"openai/gpt-4o-mini-search-preview"}]},prices:{input_mtok:.15,output_mtok:.6}},{id:"openai/gpt-4o:extended",match:{equals:"openai/gpt-4o:extended"},prices:{input_mtok:6,output_mtok:18}},{id:"openai/o1",match:{or:[{equals:"openai/o1"},{equals:"openai/o1-preview"},{equals:"openai/o1-preview-2024-09-12"}]},prices:{input_mtok:15,output_mtok:60}},{id:"openai/o1-mini",match:{or:[{equals:"openai/o1-mini"},{equals:"openai/o1-mini-2024-09-12"}]},prices:{input_mtok:1.1,output_mtok:4.4}},{id:"openai/o1-pro",match:{equals:"openai/o1-pro"},prices:{input_mtok:150,output_mtok:600}},{id:"openai/o3",match:{equals:"openai/o3"},prices:{input_mtok:10,output_mtok:40}},{id:"openai/o3-mini",match:{or:[{equals:"openai/o3-mini"},{equals:"openai/o3-mini-high"}]},prices:{input_mtok:1.1,output_mtok:4.4}},{id:"openai/o4-mini",match:{or:[{equals:"openai/o4-mini"},{equals:"openai/o4-mini-high"}]},prices:{input_mtok:1.1,output_mtok:4.4}},{id:"openchat/openchat-7b",match:{equals:"openchat/openchat-7b"},prices:{input_mtok:.07,output_mtok:.07}},{id:"openhands-lm-32b-v0.1",name:"OpenHands LM 32B V0.1",match:{equals:"openhands-lm-32b-v0.1"},prices:{input_mtok:2.6,output_mtok:3.4}},{id:"perplexity/llama-3.1-sonar-large-128k-online",match:{equals:"perplexity/llama-3.1-sonar-large-128k-online"},prices:{input_mtok:1,output_mtok:1}},{id:"perplexity/llama-3.1-sonar-small-128k-online",match:{equals:"perplexity/llama-3.1-sonar-small-128k-online"},prices:{input_mtok:.2,output_mtok:.2}},{id:"perplexity/r1-1776",match:{equals:"perplexity/r1-1776"},prices:{input_mtok:2,output_mtok:8}},{id:"perplexity/sonar",match:{equals:"perplexity/sonar"},prices:{input_mtok:1,output_mtok:1}},{id:"perplexity/sonar-deep-research",match:{equals:"perplexity/sonar-deep-research"},prices:{input_mtok:2,output_mtok:8}},{id:"perplexity/sonar-pro",match:{equals:"perplexity/sonar-pro"},prices:{input_mtok:3,output_mtok:15}},{id:"perplexity/sonar-reasoning",match:{equals:"perplexity/sonar-reasoning"},prices:{input_mtok:1,output_mtok:5}},{id:"perplexity/sonar-reasoning-pro",match:{equals:"perplexity/sonar-reasoning-pro"},prices:{input_mtok:2,output_mtok:8}},{id:"phi-3-medium-128k-instruct",name:"Phi-3 Medium 128K Instruct",match:{equals:"phi-3-medium-128k-instruct"},prices:{input_mtok:1,output_mtok:1}},{id:"phi-3-mini-128k-instruct",name:"Phi-3 Mini 128K Instruct",match:{equals:"phi-3-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"phi-3.5-mini-128k-instruct",name:"Phi-3.5 Mini 128K Instruct",match:{equals:"phi-3.5-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"phi-4",name:"Phi 4",match:{equals:"phi-4"},prices:{input_mtok:.07,output_mtok:.14}},{id:"phi-4-multimodal-instruct",name:"Phi 4 Multimodal Instruct",match:{equals:"phi-4-multimodal-instruct"},prices:{input_mtok:.05,output_mtok:.1}},{id:"phi-4-reasoning-plus",name:"Phi 4 Reasoning Plus",match:{equals:"phi-4-reasoning-plus"},prices:{input_mtok:.07,output_mtok:.35}},{id:"phi-4-reasoning-plus:free",name:"Phi 4 Reasoning Plus (free)",match:{equals:"phi-4-reasoning-plus:free"},prices:{}},{id:"phi-4-reasoning:free",name:"Phi 4 Reasoning (free)",match:{equals:"phi-4-reasoning:free"},prices:{}},{id:"pixtral-12b",name:"Pixtral 12B",match:{equals:"pixtral-12b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"pixtral-large-2411",name:"Pixtral Large 2411",match:{equals:"pixtral-large-2411"},prices:{input_mtok:2,output_mtok:6}},{id:"pygmalionai/mythalion-13b",match:{equals:"pygmalionai/mythalion-13b"},prices:{input_mtok:.5625,output_mtok:1.125}},{id:"qwen-2-72b-instruct",name:"Qwen 2 72B Instruct",match:{equals:"qwen-2-72b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"qwen-2.5-72b-instruct",name:"Qwen2.5 72B Instruct",match:{equals:"qwen-2.5-72b-instruct"},prices:{input_mtok:.12,output_mtok:.39}},{id:"qwen-2.5-72b-instruct:free",name:"Qwen2.5 72B Instruct (free)",match:{equals:"qwen-2.5-72b-instruct:free"},prices:{}},{id:"qwen-2.5-7b-instruct",name:"Qwen2.5 7B Instruct",match:{equals:"qwen-2.5-7b-instruct"},prices:{input_mtok:.04,output_mtok:.1}},{id:"qwen-2.5-coder-32b-instruct",name:"Qwen2.5 Coder 32B Instruct",match:{equals:"qwen-2.5-coder-32b-instruct"},prices:{input_mtok:.06,output_mtok:.15}},{id:"qwen-2.5-coder-32b-instruct:free",name:"Qwen2.5 Coder 32B Instruct (free)",match:{equals:"qwen-2.5-coder-32b-instruct:free"},prices:{}},{id:"qwen-2.5-vl-7b-instruct",name:"Qwen2.5-VL 7B Instruct",match:{equals:"qwen-2.5-vl-7b-instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwen-max",name:"Qwen-Max",match:{equals:"qwen-max"},prices:{input_mtok:1.6,cache_read_mtok:.64,output_mtok:6.4}},{id:"qwen-plus",name:"Qwen-Plus",match:{equals:"qwen-plus"},prices:{input_mtok:.4,cache_read_mtok:.16,output_mtok:1.2}},{id:"qwen-turbo",name:"Qwen-Turbo",match:{equals:"qwen-turbo"},prices:{input_mtok:.05,cache_read_mtok:.02,output_mtok:.2}},{id:"qwen-vl-max",name:"Qwen VL Max",match:{equals:"qwen-vl-max"},prices:{input_mtok:.8,output_mtok:3.2}},{id:"qwen-vl-plus",name:"Qwen VL Plus",match:{equals:"qwen-vl-plus"},prices:{input_mtok:.21,output_mtok:.63}},{id:"qwen/qwen-2-72b-instruct",match:{equals:"qwen/qwen-2-72b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"qwen/qwen-2.5-72b-instruct",match:{equals:"qwen/qwen-2.5-72b-instruct"},prices:{input_mtok:.12,output_mtok:.39}},{id:"qwen/qwen-2.5-72b-instruct:free",match:{equals:"qwen/qwen-2.5-72b-instruct:free"},prices:{}},{id:"qwen/qwen-2.5-7b-instruct",match:{equals:"qwen/qwen-2.5-7b-instruct"},prices:{input_mtok:.05,output_mtok:.1}},{id:"qwen/qwen-2.5-7b-instruct:free",match:{equals:"qwen/qwen-2.5-7b-instruct:free"},prices:{}},{id:"qwen/qwen-2.5-coder-32b-instruct",match:{equals:"qwen/qwen-2.5-coder-32b-instruct"},prices:{input_mtok:.07,output_mtok:.15}},{id:"qwen/qwen-2.5-coder-32b-instruct:free",match:{equals:"qwen/qwen-2.5-coder-32b-instruct:free"},prices:{}},{id:"qwen/qwen-2.5-vl-72b-instruct",match:{equals:"qwen/qwen-2.5-vl-72b-instruct"},prices:{input_mtok:.6,output_mtok:.6}},{id:"qwen/qwen-2.5-vl-7b-instruct",match:{equals:"qwen/qwen-2.5-vl-7b-instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwen/qwen-2.5-vl-7b-instruct:free",match:{equals:"qwen/qwen-2.5-vl-7b-instruct:free"},prices:{}},{id:"qwen/qwen-max",match:{equals:"qwen/qwen-max"},prices:{input_mtok:1.6,output_mtok:6.4}},{id:"qwen/qwen-plus",match:{equals:"qwen/qwen-plus"},prices:{input_mtok:.4,output_mtok:1.2}},{id:"qwen/qwen-turbo",match:{equals:"qwen/qwen-turbo"},prices:{input_mtok:.05,output_mtok:.2}},{id:"qwen/qwen-vl-max",match:{equals:"qwen/qwen-vl-max"},prices:{input_mtok:.8,output_mtok:3.2}},{id:"qwen/qwen-vl-plus",match:{equals:"qwen/qwen-vl-plus"},prices:{input_mtok:.21,output_mtok:.63}},{id:"qwen/qwen2.5-coder-7b-instruct",match:{equals:"qwen/qwen2.5-coder-7b-instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwen/qwen2.5-vl-32b-instruct",match:{equals:"qwen/qwen2.5-vl-32b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"qwen/qwen2.5-vl-32b-instruct:free",match:{equals:"qwen/qwen2.5-vl-32b-instruct:free"},prices:{}},{id:"qwen/qwen2.5-vl-3b-instruct:free",match:{equals:"qwen/qwen2.5-vl-3b-instruct:free"},prices:{}},{id:"qwen/qwen2.5-vl-72b-instruct",match:{equals:"qwen/qwen2.5-vl-72b-instruct"},prices:{input_mtok:.7,output_mtok:.7}},{id:"qwen/qwen2.5-vl-72b-instruct:free",match:{equals:"qwen/qwen2.5-vl-72b-instruct:free"},prices:{}},{id:"qwen/qwq-32b",match:{equals:"qwen/qwq-32b"},prices:{input_mtok:.15,output_mtok:.2}},{id:"qwen/qwq-32b-preview",match:{equals:"qwen/qwq-32b-preview"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwen/qwq-32b-preview:free",match:{equals:"qwen/qwq-32b-preview:free"},prices:{}},{id:"qwen/qwq-32b:free",match:{equals:"qwen/qwq-32b:free"},prices:{}},{id:"qwen2.5-vl-32b-instruct",name:"Qwen2.5 VL 32B Instruct",match:{equals:"qwen2.5-vl-32b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"qwen2.5-vl-32b-instruct:free",name:"Qwen2.5 VL 32B Instruct (free)",match:{equals:"qwen2.5-vl-32b-instruct:free"},prices:{}},{id:"qwen2.5-vl-72b-instruct",name:"Qwen2.5 VL 72B Instruct",match:{equals:"qwen2.5-vl-72b-instruct"},prices:{input_mtok:.25,output_mtok:.75}},{id:"qwen2.5-vl-72b-instruct:free",name:"Qwen2.5 VL 72B Instruct (free)",match:{equals:"qwen2.5-vl-72b-instruct:free"},prices:{}},{id:"qwen3-14b",name:"Qwen3 14B",match:{equals:"qwen3-14b"},prices:{input_mtok:.06,output_mtok:.24}},{id:"qwen3-14b:free",name:"Qwen3 14B (free)",match:{equals:"qwen3-14b:free"},prices:{}},{id:"qwen3-235b-a22b",name:"Qwen3 235B A22B",match:{equals:"qwen3-235b-a22b"},prices:{input_mtok:.13,output_mtok:.6}},{id:"qwen3-235b-a22b:free",name:"Qwen3 235B A22B (free)",match:{equals:"qwen3-235b-a22b:free"},prices:{}},{id:"qwen3-30b-a3b",name:"Qwen3 30B A3B",match:{equals:"qwen3-30b-a3b"},prices:{input_mtok:.08,output_mtok:.29}},{id:"qwen3-30b-a3b:free",name:"Qwen3 30B A3B (free)",match:{equals:"qwen3-30b-a3b:free"},prices:{}},{id:"qwen3-32b",name:"Qwen3 32B",match:{equals:"qwen3-32b"},prices:{input_mtok:.1,output_mtok:.3}},{id:"qwen3-32b:free",name:"Qwen3 32B (free)",match:{equals:"qwen3-32b:free"},prices:{}},{id:"qwen3-8b",name:"Qwen3 8B",match:{equals:"qwen3-8b"},prices:{input_mtok:.035,output_mtok:.138}},{id:"qwen3-8b:free",name:"Qwen3 8B (free)",match:{equals:"qwen3-8b:free"},prices:{}},{id:"qwerky-72b:free",name:"Qwerky 72B (free)",match:{equals:"qwerky-72b:free"},prices:{}},{id:"qwq-32b",name:"QwQ 32B",match:{equals:"qwq-32b"},prices:{input_mtok:.15,output_mtok:.2}},{id:"qwq-32b-arliai-rpr-v1:free",name:"QwQ 32B RpR v1 (free)",match:{equals:"qwq-32b-arliai-rpr-v1:free"},prices:{}},{id:"qwq-32b-preview",name:"QwQ 32B Preview",match:{equals:"qwq-32b-preview"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwq-32b:free",name:"QwQ 32B (free)",match:{equals:"qwq-32b:free"},prices:{}},{id:"r1-1776",name:"R1 1776",match:{equals:"r1-1776"},prices:{input_mtok:2,output_mtok:8}},{id:"raifle/sorcererlm-8x22b",match:{equals:"raifle/sorcererlm-8x22b"},prices:{input_mtok:4.5,output_mtok:4.5}},{id:"reka-flash-3:free",name:"Flash 3 (free)",match:{equals:"reka-flash-3:free"},prices:{}},{id:"rekaai/reka-flash-3:free",match:{equals:"rekaai/reka-flash-3:free"},prices:{}},{id:"remm-slerp-l2-13b",name:"ReMM SLERP 13B",match:{equals:"remm-slerp-l2-13b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"rocinante-12b",name:"Rocinante 12B",match:{equals:"rocinante-12b"},prices:{input_mtok:.25,output_mtok:.5}},{id:"sao10k/fimbulvetr-11b-v2",match:{equals:"sao10k/fimbulvetr-11b-v2"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"sao10k/l3-euryale-70b",match:{equals:"sao10k/l3-euryale-70b"},prices:{input_mtok:1.48,output_mtok:1.48}},{id:"sao10k/l3-lunaris-8b",match:{equals:"sao10k/l3-lunaris-8b"},prices:{input_mtok:.02,output_mtok:.05}},{id:"sao10k/l3.1-euryale-70b",match:{equals:"sao10k/l3.1-euryale-70b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"sao10k/l3.3-euryale-70b",match:{equals:"sao10k/l3.3-euryale-70b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"sarvam-m:free",name:"Sarvam-M (free)",match:{equals:"sarvam-m:free"},prices:{}},{id:"scb10x/llama3.1-typhoon2-70b-instruct",match:{equals:"scb10x/llama3.1-typhoon2-70b-instruct"},prices:{input_mtok:.88,output_mtok:.88}},{id:"scb10x/llama3.1-typhoon2-8b-instruct",match:{equals:"scb10x/llama3.1-typhoon2-8b-instruct"},prices:{input_mtok:.18,output_mtok:.18}},{id:"shisa-ai/shisa-v2-llama3.3-70b:free",match:{equals:"shisa-ai/shisa-v2-llama3.3-70b:free"},prices:{}},{id:"shisa-v2-llama3.3-70b:free",name:"Shisa V2 Llama 3.3 70B (free)",match:{equals:"shisa-v2-llama3.3-70b:free"},prices:{}},{id:"skyfall-36b-v2",name:"Skyfall 36B V2",match:{equals:"skyfall-36b-v2"},prices:{input_mtok:.5,output_mtok:.8}},{id:"sonar",name:"Sonar",match:{equals:"sonar"},prices:{input_mtok:1,output_mtok:1}},{id:"sonar-deep-research",name:"Sonar Deep Research",match:{equals:"sonar-deep-research"},prices:{input_mtok:2,output_mtok:8}},{id:"sonar-pro",name:"Sonar Pro",match:{equals:"sonar-pro"},prices:{input_mtok:3,output_mtok:15}},{id:"sonar-reasoning",name:"Sonar Reasoning",match:{equals:"sonar-reasoning"},prices:{input_mtok:1,output_mtok:5}},{id:"sonar-reasoning-pro",name:"Sonar Reasoning Pro",match:{equals:"sonar-reasoning-pro"},prices:{input_mtok:2,output_mtok:8}},{id:"sophosympatheia/midnight-rose-70b",match:{equals:"sophosympatheia/midnight-rose-70b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"sophosympatheia/rogue-rose-103b-v0.2:free",match:{equals:"sophosympatheia/rogue-rose-103b-v0.2:free"},prices:{}},{id:"sorcererlm-8x22b",name:"SorcererLM 8x22B",match:{equals:"sorcererlm-8x22b"},prices:{input_mtok:4.5,output_mtok:4.5}},{id:"spotlight",name:"Spotlight",match:{equals:"spotlight"},prices:{input_mtok:.18,output_mtok:.18}},{id:"steelskull/l3.3-electra-r1-70b",match:{equals:"steelskull/l3.3-electra-r1-70b"},prices:{input_mtok:.7,output_mtok:.95}},{id:"thedrummer/anubis-pro-105b-v1",match:{equals:"thedrummer/anubis-pro-105b-v1"},prices:{input_mtok:.8,output_mtok:1}},{id:"thedrummer/rocinante-12b",match:{equals:"thedrummer/rocinante-12b"},prices:{input_mtok:.25,output_mtok:.5}},{id:"thedrummer/skyfall-36b-v2",match:{equals:"thedrummer/skyfall-36b-v2"},prices:{input_mtok:.5,output_mtok:.8}},{id:"thedrummer/unslopnemo-12b",match:{equals:"thedrummer/unslopnemo-12b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"thudm/glm-4-32b:free",match:{equals:"thudm/glm-4-32b:free"},prices:{}},{id:"thudm/glm-z1-32b:free",match:{equals:"thudm/glm-z1-32b:free"},prices:{}},{id:"toppy-m-7b",name:"Toppy M 7B",match:{equals:"toppy-m-7b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"undi95/remm-slerp-l2-13b",match:{equals:"undi95/remm-slerp-l2-13b"},prices:{input_mtok:.5625,output_mtok:1.125}},{id:"undi95/toppy-m-7b",match:{equals:"undi95/toppy-m-7b"},prices:{input_mtok:.07,output_mtok:.07}},{id:"unslopnemo-12b",name:"UnslopNemo 12B",match:{equals:"unslopnemo-12b"},prices:{input_mtok:.45,output_mtok:.45}},{id:"valkyrie-49b-v1",name:"Valkyrie 49B V1",match:{equals:"valkyrie-49b-v1"},prices:{input_mtok:.5,output_mtok:.8}},{id:"virtuoso-large",name:"Virtuoso Large",match:{equals:"virtuoso-large"},prices:{input_mtok:.75,output_mtok:1.2}},{id:"virtuoso-medium-v2",name:"Virtuoso Medium V2",match:{equals:"virtuoso-medium-v2"},prices:{input_mtok:.5,output_mtok:.8}},{id:"weaver",name:"Weaver (alpha)",match:{equals:"weaver"},prices:{input_mtok:1.5,output_mtok:1.5}},{id:"wizardlm-2-8x22b",name:"WizardLM-2 8x22B",match:{equals:"wizardlm-2-8x22b"},prices:{input_mtok:.48,output_mtok:.48}},{id:"x-ai/grok-2-1212",match:{equals:"x-ai/grok-2-1212"},prices:{input_mtok:2,output_mtok:10}},{id:"x-ai/grok-2-vision-1212",match:{equals:"x-ai/grok-2-vision-1212"},prices:{input_mtok:2,output_mtok:10}},{id:"x-ai/grok-3-beta",match:{equals:"x-ai/grok-3-beta"},prices:{input_mtok:3,output_mtok:15}},{id:"x-ai/grok-3-mini-beta",match:{equals:"x-ai/grok-3-mini-beta"},prices:{input_mtok:.3,output_mtok:.5}},{id:"x-ai/grok-beta",match:{equals:"x-ai/grok-beta"},prices:{input_mtok:5,output_mtok:15}},{id:"x-ai/grok-vision-beta",match:{equals:"x-ai/grok-vision-beta"},prices:{input_mtok:5,output_mtok:15}},{id:"xwin-lm/xwin-lm-70b",match:{equals:"xwin-lm/xwin-lm-70b"},prices:{input_mtok:3.75,output_mtok:3.75}},{id:"yi-large",name:"Yi Large",match:{equals:"yi-large"},prices:{input_mtok:3,output_mtok:3}},{id:"z-ai/glm-4.5",match:{equals:"z-ai/glm-4.5"},context_window:131072,prices:{input_mtok:.35,output_mtok:1.55}},{id:"z-ai/glm-4.6",match:{equals:"z-ai/glm-4.6"},context_window:202752,prices:{input_mtok:.4,output_mtok:1.75}}]},{id:"perplexity",name:"Perplexity",pricing_urls:["https://docs.perplexity.ai/guides/pricing"],api_pattern:"https://api\\.perplexity\\.ai",price_comments:"Prices per request vary based on usage, this is not represented here, instead we just take the highest price shown for `requests_kcount`.",models:[{id:"llama-3.1-sonar-large-128k-online",name:"Llama 3.1 Sonar 70B Online",description:"Llama 3.1 Sonar is Perplexity's latest model family. It surpasses their earlier Sonar models in cost-efficiency, speed, and performance.",match:{equals:"llama-3.1-sonar-large-128k-online"},prices:{input_mtok:1,output_mtok:1}},{id:"llama-3.1-sonar-small-128k-online",name:"Llama 3.1 Sonar 8B Online",description:"Llama 3.1 Sonar is Perplexity's latest model family. It surpasses their earlier Sonar models in cost-efficiency, speed, and performance.",match:{equals:"llama-3.1-sonar-small-128k-online"},prices:{input_mtok:.2,output_mtok:.2}},{id:"r1-1776",name:"R1 1776",description:"R1 1776 is a version of DeepSeek-R1 that has been post-trained to remove censorship constraints related to topics restricted by the Chinese government. The model retains its original reasoning capabilities while providing direct responses to a wider range of queries. R1 1776 is an offline chat model that does not use the perplexity search subsystem.",match:{equals:"r1-1776"},prices:{input_mtok:2,output_mtok:8}},{id:"sonar",name:"Sonar",description:"Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize sources. It is designed for companies seeking to integrate lightweight question-and-answer features optimized for speed.",match:{equals:"sonar"},prices:{input_mtok:1,output_mtok:1,requests_kcount:12}},{id:"sonar-deep-research",name:"Sonar Deep Research",description:"Sonar Deep Research is a research-focused model designed for multi-step retrieval, synthesis, and reasoning across complex topics. It autonomously searches, reads, and evaluates sources, refining its approach as it gathers information. This enables comprehensive report generation across domains like finance, technology, health, and current events.",match:{equals:"sonar-deep-research"},prices:{input_mtok:2,output_mtok:8}},{id:"sonar-pro",name:"Sonar Pro",description:"Note: Sonar Pro pricing includes Perplexity search pricing. See details here",match:{equals:"sonar-pro"},prices:{input_mtok:3,output_mtok:15,requests_kcount:14}},{id:"sonar-reasoning",name:"Sonar Reasoning",description:"Sonar Reasoning is a reasoning model provided by Perplexity based on DeepSeek R1.",match:{equals:"sonar-reasoning"},prices:{input_mtok:1,output_mtok:5,requests_kcount:12}},{id:"sonar-reasoning-pro",name:"Sonar Reasoning Pro",description:"Sonar Pro pricing includes Perplexity search pricing.",match:{equals:"sonar-reasoning-pro"},prices:{input_mtok:2,output_mtok:8,requests_kcount:14}}]},{id:"together",name:"Together AI",pricing_urls:["https://www.together.ai/pricing"],api_pattern:"https://api\\.together\\.xyz",provider_match:{or:[{equals:"together-ai"},{equals:"together_ai"}]},models:[{id:"Austism/chronos-hermes-13b",match:{equals:"Austism/chronos-hermes-13b"},prices:{input_mtok:.3,output_mtok:.3}},{id:"Gryphe/MythoMax-L2-13b",match:{equals:"Gryphe/MythoMax-L2-13b"},prices:{input_mtok:.3,output_mtok:.3}},{id:"Nexusflow/NexusRaven-V2-13B",match:{equals:"Nexusflow/NexusRaven-V2-13B"},prices:{input_mtok:.3,output_mtok:.3}},{id:"NousResearch/Nous-Capybara-7B-V1p9",match:{equals:"NousResearch/Nous-Capybara-7B-V1p9"},prices:{input_mtok:.2,output_mtok:.2}},{id:"NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",match:{equals:"NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO"},prices:{input_mtok:.9,output_mtok:.9}},{id:"NousResearch/Nous-Hermes-2-Mixtral-8x7B-SFT",match:{equals:"NousResearch/Nous-Hermes-2-Mixtral-8x7B-SFT"},prices:{input_mtok:.9,output_mtok:.9}},{id:"NousResearch/Nous-Hermes-2-Yi-34B",match:{equals:"NousResearch/Nous-Hermes-2-Yi-34B"},prices:{input_mtok:.8,output_mtok:.8}},{id:"NousResearch/Nous-Hermes-Llama2-13b",match:{equals:"NousResearch/Nous-Hermes-Llama2-13b"},prices:{input_mtok:.225,output_mtok:.225}},{id:"NousResearch/Nous-Hermes-llama-2-7b",match:{equals:"NousResearch/Nous-Hermes-llama-2-7b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"Open-Orca/Mistral-7B-OpenOrca",match:{equals:"Open-Orca/Mistral-7B-OpenOrca"},prices:{input_mtok:.2,output_mtok:.2}},{id:"Qwen/Qwen1.5-0.5B",match:{or:[{equals:"Qwen/Qwen1.5-0.5B"},{equals:"Qwen/Qwen1.5-0.5B-Chat"}]},prices:{input_mtok:.1,output_mtok:.1}},{id:"Qwen/Qwen1.5-1.8B",match:{or:[{equals:"Qwen/Qwen1.5-1.8B"},{equals:"Qwen/Qwen1.5-1.8B-Chat"}]},prices:{input_mtok:.1,output_mtok:.1}},{id:"Qwen/Qwen1.5-14B",match:{or:[{equals:"Qwen/Qwen1.5-14B"},{equals:"Qwen/Qwen1.5-14B-Chat"}]},prices:{input_mtok:.3,output_mtok:.3}},{id:"Qwen/Qwen1.5-4B",match:{or:[{equals:"Qwen/Qwen1.5-4B"},{equals:"Qwen/Qwen1.5-4B-Chat"}]},prices:{input_mtok:.1,output_mtok:.1}},{id:"Qwen/Qwen1.5-72B",match:{equals:"Qwen/Qwen1.5-72B"},prices:{input_mtok:.9,output_mtok:.9}},{id:"Qwen/Qwen1.5-7B",match:{or:[{equals:"Qwen/Qwen1.5-7B"},{equals:"Qwen/Qwen1.5-7B-Chat"}]},prices:{input_mtok:.2,output_mtok:.2}},{id:"Undi95/ReMM-SLERP-L2-13B",match:{equals:"Undi95/ReMM-SLERP-L2-13B"},prices:{input_mtok:.3,output_mtok:.3}},{id:"Undi95/Toppy-M-7B",match:{equals:"Undi95/Toppy-M-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"WizardLM/WizardLM-13B-V1.2",match:{equals:"WizardLM/WizardLM-13B-V1.2"},prices:{input_mtok:.3,output_mtok:.3}},{id:"allenai/OLMo-7B",match:{or:[{equals:"allenai/OLMo-7B"},{equals:"allenai/OLMo-7B-Instruct"},{equals:"allenai/OLMo-7B-Twin-2T"}]},prices:{input_mtok:.2,output_mtok:.2}},{id:"codellama/CodeLlama-13b-Instruct-hf",match:{equals:"codellama/CodeLlama-13b-Instruct-hf"},prices:{input_mtok:.225,output_mtok:.225}},{id:"codellama/CodeLlama-34b-Instruct-hf",match:{equals:"codellama/CodeLlama-34b-Instruct-hf"},prices:{input_mtok:.776,output_mtok:.776}},{id:"codellama/CodeLlama-70b-Instruct-hf",match:{equals:"codellama/CodeLlama-70b-Instruct-hf"},prices:{input_mtok:.9,output_mtok:.9}},{id:"codellama/CodeLlama-7b-Instruct-hf",match:{equals:"codellama/CodeLlama-7b-Instruct-hf"},prices:{input_mtok:.2,output_mtok:.2}},{id:"deepseek-ai/deepseek-coder-33b-instruct",match:{equals:"deepseek-ai/deepseek-coder-33b-instruct"},prices:{input_mtok:.8,output_mtok:.8}},{id:"garage-bAInd/Platypus2-70B-instruct",match:{equals:"garage-bAInd/Platypus2-70B-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"google/gemma-2b",match:{or:[{equals:"google/gemma-2b"},{equals:"google/gemma-2b-it"}]},prices:{input_mtok:.1,output_mtok:.1}},{id:"google/gemma-7b",match:{or:[{equals:"google/gemma-7b"},{equals:"google/gemma-7b-it"}]},prices:{input_mtok:.2,output_mtok:.2}},{id:"lmsys/vicuna-13b-v1.5",match:{equals:"lmsys/vicuna-13b-v1.5"},prices:{input_mtok:.3,output_mtok:.3}},{id:"lmsys/vicuna-7b-v1.5",match:{equals:"lmsys/vicuna-7b-v1.5"},prices:{input_mtok:.2,output_mtok:.2}},{id:"meta-llama/Llama-2-13b-chat-hf",match:{equals:"meta-llama/Llama-2-13b-chat-hf"},prices:{input_mtok:.225,output_mtok:.225}},{id:"meta-llama/Llama-2-70b-chat-hf",match:{equals:"meta-llama/Llama-2-70b-chat-hf"},prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/Llama-2-7b-chat-hf",match:{equals:"meta-llama/Llama-2-7b-chat-hf"},prices:{input_mtok:.2,output_mtok:.2}},{id:"meta-llama/Llama-3-70b-chat-hf",match:{equals:"meta-llama/Llama-3-70b-chat-hf"},prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/Llama-3-8b-chat-hf",match:{equals:"meta-llama/Llama-3-8b-chat-hf"},prices:{input_mtok:.2,output_mtok:.2}},{id:"meta-llama/Llama-3.3-70B-Instruct-Turbo",match:{equals:"meta-llama/Llama-3.3-70B-Instruct-Turbo"},prices:{input_mtok:.88,output_mtok:.88}},{id:"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",match:{equals:"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8"},prices:{input_mtok:.27,output_mtok:.85}},{id:"meta-llama/Llama-4-Scout-17B-16E-Instruct",match:{equals:"meta-llama/Llama-4-Scout-17B-16E-Instruct"},prices:{input_mtok:.18,output_mtok:.59}},{id:"meta-llama/Meta-Llama-3-70B-Instruct-Lite",match:{equals:"meta-llama/Meta-Llama-3-70B-Instruct-Lite"},prices:{input_mtok:.54,output_mtok:.54}},{id:"meta-llama/Meta-Llama-3-70B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3-70B-Instruct-Turbo"},prices:{input_mtok:.88,output_mtok:.88}},{id:"meta-llama/Meta-Llama-3-8B-Instruct-Lite",match:{equals:"meta-llama/Meta-Llama-3-8B-Instruct-Lite"},prices:{input_mtok:.1,output_mtok:.1}},{id:"meta-llama/Meta-Llama-3-8B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3-8B-Instruct-Turbo"},prices:{input_mtok:.18,output_mtok:.18}},{id:"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo"},prices:{input_mtok:3.5,output_mtok:3.5}},{id:"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo"},prices:{input_mtok:.88,output_mtok:.88}},{id:"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo"},prices:{input_mtok:.18,output_mtok:.18}},{id:"meta-llama/Meta-Llama-3.3-70B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3.3-70B-Instruct-Turbo"},prices:{input_mtok:.88,output_mtok:.88}},{id:"microsoft/WizardLM-2-8x22B",match:{equals:"microsoft/WizardLM-2-8x22B"},prices:{input_mtok:1.2,output_mtok:1.2}},{id:"microsoft/phi-2",match:{equals:"microsoft/phi-2"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistralai/Mistral-7B-Instruct-v0.1",match:{equals:"mistralai/Mistral-7B-Instruct-v0.1"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/Mistral-7B-Instruct-v0.2",match:{equals:"mistralai/Mistral-7B-Instruct-v0.2"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/Mistral-7B-v0.1",match:{equals:"mistralai/Mistral-7B-v0.1"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/Mixtral-8x22B-Instruct-v0.1",match:{equals:"mistralai/Mixtral-8x22B-Instruct-v0.1"},prices:{input_mtok:2.4,output_mtok:2.4}},{id:"mistralai/Mixtral-8x7B-Instruct-v0.1",match:{equals:"mistralai/Mixtral-8x7B-Instruct-v0.1"},prices:{input_mtok:.9,output_mtok:.9}},{id:"mistralai/Mixtral-8x7B-v0.1",match:{equals:"mistralai/Mixtral-8x7B-v0.1"},prices:{input_mtok:.9,output_mtok:.9}},{id:"openchat/openchat-3.5-1210",match:{equals:"openchat/openchat-3.5-1210"},prices:{input_mtok:.2,output_mtok:.2}},{id:"snorkelai/Snorkel-Mistral-PairRM-DPO",match:{equals:"snorkelai/Snorkel-Mistral-PairRM-DPO"},prices:{input_mtok:.2,output_mtok:.2}},{id:"teknium/OpenHermes-2-Mistral-7B",match:{equals:"teknium/OpenHermes-2-Mistral-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"teknium/OpenHermes-2p5-Mistral-7B",match:{equals:"teknium/OpenHermes-2p5-Mistral-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/GPT-JT-Moderation-6B",match:{equals:"togethercomputer/GPT-JT-Moderation-6B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/Llama-2-7B-32K-Instruct",match:{equals:"togethercomputer/Llama-2-7B-32K-Instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/RedPajama-INCITE-7B-Base",match:{equals:"togethercomputer/RedPajama-INCITE-7B-Base"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/RedPajama-INCITE-7B-Chat",match:{equals:"togethercomputer/RedPajama-INCITE-7B-Chat"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/RedPajama-INCITE-7B-Instruct",match:{equals:"togethercomputer/RedPajama-INCITE-7B-Instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/RedPajama-INCITE-Base-3B-v1",match:{equals:"togethercomputer/RedPajama-INCITE-Base-3B-v1"},prices:{input_mtok:.1,output_mtok:.1}},{id:"togethercomputer/RedPajama-INCITE-Chat-3B-v1",match:{equals:"togethercomputer/RedPajama-INCITE-Chat-3B-v1"},prices:{input_mtok:.1,output_mtok:.1}},{id:"togethercomputer/RedPajama-INCITE-Instruct-3B-v1",match:{equals:"togethercomputer/RedPajama-INCITE-Instruct-3B-v1"},prices:{input_mtok:.1,output_mtok:.1}},{id:"togethercomputer/StripedHyena-Hessian-7B",match:{equals:"togethercomputer/StripedHyena-Hessian-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/StripedHyena-Nous-7B",match:{equals:"togethercomputer/StripedHyena-Nous-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/alpaca-7b",match:{equals:"togethercomputer/alpaca-7b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"upstage/SOLAR-10.7B-Instruct-v1.0",match:{equals:"upstage/SOLAR-10.7B-Instruct-v1.0"},prices:{input_mtok:.3,output_mtok:.3}},{id:"zero-one-ai/Yi-34B",match:{equals:"zero-one-ai/Yi-34B"},prices:{input_mtok:.8,output_mtok:.8}},{id:"zero-one-ai/Yi-6B",match:{equals:"zero-one-ai/Yi-6B"},prices:{input_mtok:.2,output_mtok:.2}}]},{id:"x-ai",name:"X AI",pricing_urls:["https://docs.x.ai/docs/models"],api_pattern:"https://api\\.x\\.ai",model_match:{contains:"grok"},provider_match:{equals:"xai"},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"grok-2-1212",name:"Grok 2 1212",description:"(deprecated) Grok 2 1212 introduces significant enhancements to accuracy, instruction adherence, and multilingual support, making it a powerful and flexible choice for developers seeking a highly steerable, intelligent model.",match:{or:[{equals:"grok-2-1212"},{equals:"grok-2"},{equals:"grok-2-latest"}]},context_window:32768,prices:{input_mtok:2,output_mtok:10}},{id:"grok-2-vision-1212",name:"Grok 2 Vision 1212",description:"Our multimodal model that processes documents, diagrams, charts, screenshots, and photographs.",match:{or:[{equals:"grok-2-vision-1212"},{equals:"grok-2-vision"},{equals:"grok-2-vision-latest"}]},context_window:32768,prices:{input_mtok:2,output_mtok:10}},{id:"grok-3",name:"Grok 3",description:"Flagship model that excels at enterprise use cases like data extraction, coding, and text summarization. Possesses deep domain knowledge in finance, healthcare, law, and science.",match:{or:[{equals:"grok-3"},{equals:"grok-3-latest"},{equals:"grok-3-beta"}]},context_window:131072,prices:{input_mtok:3,cache_read_mtok:.75,output_mtok:15}},{id:"grok-3-fast",name:"Grok 3 Fast",description:"Excels at enterprise use cases like data extraction, coding, and text summarization. Possesses deep domain knowledge in finance, healthcare, law, and science.",match:{or:[{equals:"grok-3-fast"},{equals:"grok-3-fast-latest"},{equals:"grok-3-fast-beta"}]},context_window:131072,prices:{input_mtok:5,cache_read_mtok:1.25,output_mtok:25}},{id:"grok-3-mini",name:"Grok 3 Mini",description:"A lightweight model that thinks before responding. Fast, smart, and great for logic-based tasks that do not require deep domain knowledge. The raw thinking traces are accessible.",match:{or:[{equals:"grok-3-mini"},{equals:"grok-3-mini-beta"},{equals:"grok-3-mini-latest"}]},context_window:131072,prices:{input_mtok:.3,cache_read_mtok:.075,output_mtok:.5}},{id:"grok-3-mini-fast",name:"Grok 3 Mini Fast",description:"A lightweight model that thinks before responding. Fast, smart, and great for logic-based tasks that do not require deep domain knowledge. The raw thinking traces are accessible.",match:{or:[{equals:"grok-3-mini-fast"},{equals:"grok-3-mini-fast-beta"},{equals:"grok-3-mini-fast-latest"}]},context_window:131072,prices:{input_mtok:.6,cache_read_mtok:.15,output_mtok:4}},{id:"grok-4-0709",name:"Grok 4",description:"A flagship model, offering unparalleled performance in natural language, math and reasoning - the perfect jack of all trades.",match:{or:[{equals:"grok-4-0709"},{equals:"grok-4"},{equals:"grok-4-latest"}]},context_window:256e3,prices:{input_mtok:3,cache_read_mtok:.75,output_mtok:15}}]}];function I(t,e){if(e<=0)return 0;let a=0;const i=[...t.tiers].sort((m,s)=>m.start-s.start),o=i[0]?.start??e,r=Math.min(e,o);a+=r*t.base/1e6;for(let m=0;m<i.length;m++){const s=i[m],n=i[m+1]?.start??1/0,u=Math.max(0,Math.min(e,n)-s.start);u>0&&(a+=u*s.price/1e6)}return a}function c(t,e,a){return t===void 0||e===void 0?0:typeof t=="number"?t*e/1e6:I(t,e)}function L(t,e){let a=0,i=0;const o=t.cache_read_tokens??0,r=t.cache_write_tokens??0,m=t.cache_audio_read_tokens??0,s=t.output_audio_tokens??0;let n=t.input_audio_tokens??0;if(n-=m,n<0)throw new Error("cache_audio_read_tokens cannot be greater than input_audio_tokens");let u=t.input_tokens??0;if(u-=o,u-=r,u-=n,u<0)throw new Error("Uncached text input tokens cannot be negative");let p=o;if(p-=m,p<0)throw new Error("cache_audio_read_tokens cannot be greater than cache_read_tokens");a+=c(e.input_mtok,u),a+=c(e.cache_read_mtok,p),a+=c(e.cache_write_mtok,r),a+=c(e.input_audio_mtok,n),a+=c(e.cache_audio_read_mtok,m);let _=t.output_tokens??0;if(_-=s,_<0)throw new Error("output_audio_tokens cannot be greater than output_tokens");i+=c(e.output_mtok,_),i+=c(e.output_audio_mtok,t.output_audio_tokens);let w=a+i;return e.requests_kcount!==void 0&&(w+=e.requests_kcount/1e3),{input_price:a,output_price:i,total_price:w}}function P(t,e){if(!Array.isArray(t.prices))return t.prices;for(let a=t.prices.length-1;a>=0;a--){const i=t.prices[a],o=i.constraint;if(o===void 0)return i.prices;if(o.type==="start_date"){if(e>=new Date(o.start_date))return i.prices}else{const r=e.toISOString().slice(11,19),m=o.start_time,s=o.end_time;if(s<m){if(r>=m||r<s)return i.prices}else if(r>=m&&r<s)return i.prices}}return t.prices[0].prices}function h(t,e){return"or"in t?t.or.some(a=>h(a,e)):"and"in t?t.and.every(a=>h(a,e)):"equals"in t?e===t.equals:"starts_with"in t?e.startsWith(t.starts_with):"ends_with"in t?e.endsWith(t.ends_with):"contains"in t?e.includes(t.contains):"regex"in t?new RegExp(t.regex).test(e):!1}function T(t,e){const a=e.toLowerCase().trim(),i=t.find(o=>o.id===a);return i||t.find(o=>o.provider_match&&h(o.provider_match,a))}function B(t,{modelId:e,providerApiUrl:a,providerId:i}){if(i)return T(t,i);if(a)return t.find(o=>new RegExp(o.api_pattern).test(a));if(e)return t.find(o=>o.model_match&&h(o.model_match,e))}function G(t,e){return t.find(a=>h(a.match,e))}const y="https://raw.githubusercontent.com/pydantic/genai-prices/main/prices/data.json";let g=x,b=Promise.resolve(x),f=null;function S(t){t!==null&&("then"in t?(b=t,t.then(e=>{e!==null&&(g=e)})):(b=Promise.resolve(t),g=t))}function C(t){f=t}function A(t){t({onCalc:C,remoteDataUrl:y,setProviderData:S})}function R(){return b}function z(t,e,a){f?.();const i=e.toLowerCase().trim(),o=a?.provider??B(g,{modelId:i,providerApiUrl:a?.providerApiUrl,providerId:a?.providerId});if(!o)return null;const r=G(o.models,i);if(!r)return null;const m=a?.timestamp??new Date,s=P(r,m),n=L(t,s);return{auto_update_timestamp:void 0,model:r,model_price:s,provider:o,...n}}function Q(t){return f?.(),B(g,t)}function N(t,e,a){if(a=a??"default",!t.extractors)throw new Error("No extraction logic defined for this provider");const i=t.extractors.find(n=>n.api_flavor===a);if(!i){const n=t.extractors.map(u=>u.api_flavor).join(", ");throw new Error(`Unknown apiFlavor '${a}', allowed values: ${n}`)}if(!k.guard(e))throw new Error(`Expected response data to be a mapping object, got ${l(e)}`);const o=q(i.model_path,e,D,!1,[]),r=M(i.root),m=q(r,e,k,!0,[]),s={};for(const n of i.mappings){const u=q(n.path,m,E,n.required,r);if(u!==null){const p=s[n.dest]??0;s[n.dest]=p+u}}if(!Object.keys(s).length)throw new Error(`No usage information found at ${JSON.stringify(i.root)}`);return{model:o,usage:s}}function q(t,e,a,i,o){const[r,...m]=M(t).reverse();if(typeof r!="string")throw new Error(`Expected last step of path to be a string, got ${l(r)}`);m.reverse();let s=e;const n=[];for(const p of m){if(n.push(p),typeof p=="object")if(Array.isArray(s))s=O(p,s);else{if(i)throw new Error(`Expected \`${d(o,n)}\` value to be a mapping, got ${l(s)}`);return null}else if(k.guard(s))s=s[p];else{if(i)throw new Error(`Expected \`${d(o,n)}\` value to be a mapping, got ${l(s)}`);return null}if(typeof s>"u")if(i){const _=typeof p=="object"?"Unable to find item":"Missing value";throw new Error(`${_} at \`${d(o,n)}\``)}else return null}if(!k.guard(s)){if(i)throw new Error(`Expected \`${d(o,n)}\` value to be a mapping, got ${l(s)}`);return null}const u=s[r];if(typeof u>"u"){if(i)throw n.push(r),new Error(`Missing value at \`${d(o,n)}\``);return null}if(a.guard(u))return u;if(i)throw n.push(r),new Error(`Expected \`${d(o,n)}\` value to be a ${a.name}, got ${l(u)}`);return null}function O(t,e){for(const a of e)if(k.guard(a)){const i=a[t.field];if(typeof i=="string"&&h(t.match,i))return a}}function M(t){return Array.isArray(t)?[...t]:[t]}function l(t){return t===null?"null":Array.isArray(t)?"array":typeof t=="object"?"mapping":typeof t}const k={guard:t=>l(t)==="mapping",name:"mapping"},D={guard:t=>typeof t=="string",name:"string"},E={guard:t=>typeof t=="number",name:"number"},d=(t,e)=>[...t.map(v),...e.map(v)].join("."),v=t=>typeof t=="string"?t:JSON.stringify(t);exports.REMOTE_DATA_JSON_URL=y;exports.calcPrice=z;exports.extractUsage=N;exports.findProvider=Q;exports.updatePrices=A;exports.waitForUpdate=R;
|
|
10
|
+
- fluency in English, French, Italian, German, and Spanish`,match:{equals:"mixtral-8x22b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"mixtral-8x7b",name:"Mixtral 8x7B",match:{or:[{starts_with:"mixtral-8x7b"},{equals:"open-mixtral-8x7b"}]},prices:{input_mtok:.7,output_mtok:.7}},{id:"pixtral-12b",name:"Pixtral 12B",description:"The first multi-modal, text+image-to-text model from Mistral AI. Its weights were launched via torrent: https://x.com/mistralai/status/1833758285167722836.",match:{or:[{equals:"pixtral-12b"},{equals:"pixtral-12b-latest"}]},prices:{input_mtok:.15,output_mtok:.15}},{id:"pixtral-large",name:"Pixtral Large 2411",description:"Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of Mistral Large 2. The model is able to understand documents, charts and natural images.",match:{or:[{equals:"pixtral-large-latest"},{equals:"pixtral-large-2411"}]},prices:{input_mtok:2,output_mtok:6}}]},{id:"novita",name:"Novita",pricing_urls:["https://novita.ai/pricing"],api_pattern:"https://api\\.novita\\.ai",models:[{id:"Sao10K/L3-8B-Stheno-v3.2",match:{equals:"Sao10K/L3-8B-Stheno-v3.2"},prices:{input_mtok:.05,output_mtok:.05}},{id:"cognitivecomputations/dolphin-mixtral-8x22b",match:{equals:"cognitivecomputations/dolphin-mixtral-8x22b"},prices:{input_mtok:.9,output_mtok:.9}},{id:"deepseek/deepseek-r1",match:{equals:"deepseek/deepseek-r1"},prices:{input_mtok:4,output_mtok:4}},{id:"deepseek/deepseek-r1-distill-llama-70b",match:{equals:"deepseek/deepseek-r1-distill-llama-70b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"deepseek/deepseek-r1-distill-llama-8b",match:{equals:"deepseek/deepseek-r1-distill-llama-8b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"deepseek/deepseek-r1-distill-qwen-14b",match:{equals:"deepseek/deepseek-r1-distill-qwen-14b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"deepseek/deepseek-r1-distill-qwen-32b",match:{equals:"deepseek/deepseek-r1-distill-qwen-32b"},prices:{input_mtok:.3,output_mtok:.3}},{id:"deepseek/deepseek_v3",match:{equals:"deepseek/deepseek_v3"},prices:{input_mtok:.89,output_mtok:.89}},{id:"google/gemma-2-9b-it",match:{equals:"google/gemma-2-9b-it"},prices:{input_mtok:.08,output_mtok:.08}},{id:"gryphe/mythomax-l2-13b",match:{equals:"gryphe/mythomax-l2-13b"},prices:{input_mtok:.09,output_mtok:.09}},{id:"jondurbin/airoboros-l2-70b",match:{equals:"jondurbin/airoboros-l2-70b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"meta-llama/llama-3-70b-instruct",match:{equals:"meta-llama/llama-3-70b-instruct"},prices:{input_mtok:.51,output_mtok:.74}},{id:"meta-llama/llama-3-8b-instruct",match:{equals:"meta-llama/llama-3-8b-instruct"},prices:{input_mtok:.04,output_mtok:.04}},{id:"meta-llama/llama-3.1-70b-instruct",match:{equals:"meta-llama/llama-3.1-70b-instruct"},prices:{input_mtok:.34,output_mtok:.39}},{id:"meta-llama/llama-3.1-8b-instruct",match:{or:[{equals:"meta-llama/llama-3.1-8b-instruct"},{equals:"meta-llama/llama-3.1-8b-instruct-max"}]},prices:{input_mtok:.05,output_mtok:.05}},{id:"meta-llama/llama-3.1-8b-instruct-bf16",match:{equals:"meta-llama/llama-3.1-8b-instruct-bf16"},prices:{input_mtok:.06,output_mtok:.06}},{id:"meta-llama/llama-3.2-11b-vision-instruct",match:{equals:"meta-llama/llama-3.2-11b-vision-instruct"},prices:{input_mtok:.06,output_mtok:.06}},{id:"meta-llama/llama-3.2-1b-instruct",match:{equals:"meta-llama/llama-3.2-1b-instruct"},prices:{input_mtok:.02,output_mtok:.02}},{id:"meta-llama/llama-3.2-3b-instruct",match:{equals:"meta-llama/llama-3.2-3b-instruct"},prices:{input_mtok:.03,output_mtok:.05}},{id:"meta-llama/llama-3.3-70b-instruct",match:{equals:"meta-llama/llama-3.3-70b-instruct"},prices:{input_mtok:.39,output_mtok:.39}},{id:"microsoft/wizardlm-2-8x22b",match:{equals:"microsoft/wizardlm-2-8x22b"},prices:{input_mtok:.62,output_mtok:.62}},{id:"mistralai/mistral-7b-instruct",match:{equals:"mistralai/mistral-7b-instruct"},prices:{input_mtok:.059,output_mtok:.059}},{id:"mistralai/mistral-nemo",match:{equals:"mistralai/mistral-nemo"},prices:{input_mtok:.17,output_mtok:.17}},{id:"nousresearch/hermes-2-pro-llama-3-8b",match:{equals:"nousresearch/hermes-2-pro-llama-3-8b"},prices:{input_mtok:.14,output_mtok:.14}},{id:"nousresearch/nous-hermes-llama2-13b",match:{equals:"nousresearch/nous-hermes-llama2-13b"},prices:{input_mtok:.17,output_mtok:.17}},{id:"openchat/openchat-7b",match:{equals:"openchat/openchat-7b"},prices:{input_mtok:.06,output_mtok:.06}},{id:"qwen/qwen-2-7b-instruct",match:{equals:"qwen/qwen-2-7b-instruct"},prices:{input_mtok:.054,output_mtok:.054}},{id:"qwen/qwen-2-vl-72b-instruct",match:{equals:"qwen/qwen-2-vl-72b-instruct"},prices:{input_mtok:.45,output_mtok:.45}},{id:"qwen/qwen-2.5-72b-instruct",match:{equals:"qwen/qwen-2.5-72b-instruct"},prices:{input_mtok:.38,output_mtok:.4}},{id:"sao10k/l3-70b-euryale-v2.1",match:{equals:"sao10k/l3-70b-euryale-v2.1"},prices:{input_mtok:1.48,output_mtok:1.48}},{id:"sao10k/l3-8b-lunaris",match:{equals:"sao10k/l3-8b-lunaris"},prices:{input_mtok:.05,output_mtok:.05}},{id:"sao10k/l31-70b-euryale-v2.2",match:{equals:"sao10k/l31-70b-euryale-v2.2"},prices:{input_mtok:1.48,output_mtok:1.48}},{id:"sophosympatheia/midnight-rose-70b",match:{equals:"sophosympatheia/midnight-rose-70b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"teknium/openhermes-2.5-mistral-7b",match:{equals:"teknium/openhermes-2.5-mistral-7b"},prices:{input_mtok:.17,output_mtok:.17}}]},{id:"openai",name:"OpenAI",pricing_urls:["https://platform.openai.com/docs/pricing","https://openai.com/api/pricing/","https://platform.openai.com/docs/models","https://help.openai.com/en/articles/7127956-how-much-does-gpt-4-cost"],api_pattern:"https://api\\.openai\\.com",model_match:{or:[{starts_with:"gpt-"},{regex:"^o[134]"}]},provider_match:{contains:"openai"},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["prompt_tokens_details","audio_tokens"],dest:"input_audio_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]},{api_flavor:"responses",root:"usage",model_path:"model",mappings:[{path:"input_tokens",dest:"input_tokens",required:!0},{path:["input_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:"output_tokens",dest:"output_tokens",required:!0}]},{api_flavor:"embeddings",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0}]}],models:[{id:"ada",match:{or:[{equals:"ada"},{equals:"text-ada-001"}]},prices:{input_mtok:.4,output_mtok:.4}},{id:"babbage",match:{equals:"babbage"},prices:{input_mtok:.5,output_mtok:.5}},{id:"chatgpt-4o-latest",name:"ChatGPT-4o",description:"OpenAI ChatGPT 4o is continually updated by OpenAI to point to the current version of GPT-4o used by ChatGPT. It therefore differs slightly from the API version of GPT-4o in that it has additional RLHF. It is intended for research and evaluation.",match:{equals:"chatgpt-4o-latest"},prices:{input_mtok:5,output_mtok:15}},{id:"codex-mini",name:"Codex Mini",description:"codex-mini-latest is a fine-tuned version of o4-mini specifically for use in Codex CLI. For direct use in the API, we recommend starting with gpt-4.1.",match:{or:[{equals:"codex-mini"},{equals:"codex-mini-latest"}]},prices:{input_mtok:1.5,cache_read_mtok:.375,output_mtok:6}},{id:"computer-use",name:"Computer use",match:{starts_with:"computer-use"},prices:{input_mtok:3,output_mtok:12}},{id:"curie",match:{or:[{equals:"curie"},{equals:"text-curie-001"}]},prices:{input_mtok:2,output_mtok:2}},{id:"davinci",match:{or:[{equals:"davinci"},{equals:"text-davinci-001"}]},prices:{input_mtok:20,output_mtok:20}},{id:"ft:gpt-3.5-turbo-",description:"GPT-3.5 Turbo fine tuned.",match:{starts_with:"ft:gpt-3.5-turbo"},prices:{input_mtok:3,output_mtok:6}},{id:"ft:gpt-4o",description:"GPT-4o fine tuned.",match:{starts_with:"ft:gpt-4o-2024-"},prices:{input_mtok:3.75,output_mtok:15}},{id:"ft:gpt-4o-mini",description:"GPT-4o Mini fine tuned.",match:{starts_with:"ft:gpt-4o-mini-2024-"},prices:{input_mtok:.3,output_mtok:1.2}},{id:"gpt-3.5-0301",match:{or:[{equals:"gpt-3.5-turbo-0301"},{equals:"gpt-3.5-0301"}]},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-3.5-turbo",name:"gpt 3.5 turbo",description:"GPT-3.5 Turbo offers a balance between cost and performance.",match:{or:[{equals:"gpt-3.5-turbo"},{equals:"gpt-35-turbo"},{equals:"gpt-3.5-turbo-0125"}]},context_window:16385,prices:{input_mtok:.5,output_mtok:1.5}},{id:"gpt-3.5-turbo-0613",match:{equals:"gpt-3.5-turbo-0613"},context_window:16385,prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-3.5-turbo-1106",match:{equals:"gpt-3.5-turbo-1106"},context_window:16385,prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo-16k",name:"GPT-3.5 Turbo 16k",description:"This model offers four times the context length of gpt-3.5-turbo, allowing it to support approximately 20 pages of text in a single request at a higher cost. Training data: up to Sep 2021.",match:{or:[{equals:"gpt-3.5-turbo-16k"},{equals:"gpt-3.5-turbo-16k-0613"},{equals:"gpt-35-turbo-16k-0613"},{equals:"gpt-35-turbo-16k"}]},context_window:16385,prices:{input_mtok:3,output_mtok:4}},{id:"gpt-3.5-turbo-instruct",name:"gpt 3.5 turbo instruct",description:"GPT-3.5 Turbo offers a balance between cost and performance.",match:{or:[{starts_with:"gpt-3.5-turbo-instruct"},{equals:"gpt-3.5-turbo-instruct-0914"}]},context_window:16385,prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-4",name:"gpt 4",description:"GPT-4 is the latest and most advanced model in the GPT series, demonstrating sophisticated capabilities in complex reasoning, theory of mind, and narrative understanding.",match:{or:[{equals:"gpt-4"},{equals:"gpt-4-0314"},{equals:"gpt-4-0613"},{starts_with:"ft:gpt-4-0"}]},context_window:8192,prices:{input_mtok:30,output_mtok:60}},{id:"gpt-4-32k",name:"gpt 4",description:"GPT-4 is the latest and most advanced model in the GPT series, demonstrating sophisticated capabilities in complex reasoning, theory of mind, and narrative understanding.",match:{or:[{equals:"gpt-4-32k"},{equals:"gpt-4-32k-0314"},{equals:"gpt-4-32k-0613"}]},context_window:32e3,price_comments:"see https://help.openai.com/en/articles/7127956-how-much-does-gpt-4-cost",prices:{input_mtok:60,output_mtok:120}},{id:"gpt-4-turbo",name:"gpt 4 turbo",description:"GPT-4 Turbo offers a balance between cost and performance.",match:{or:[{equals:"gpt-4-turbo"},{equals:"gpt-4-turbo-2024-04-09"},{equals:"gpt-4-turbo-0125-preview"},{equals:"gpt-4-0125-preview"},{equals:"gpt-4-1106-preview"},{equals:"gpt-4-turbo-preview"}]},context_window:128e3,prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-vision-preview",name:"gpt 4 vision",description:"GPT-4 Vision is a model that offers a balance between cost and performance.",match:{or:[{equals:"gpt-4-vision-preview"},{equals:"gpt-4-1106-vision-preview"}]},context_window:128e3,prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4.1",name:"gpt 4.1",description:"GPT-4.1 is OpenAI's latest flagship model, offering major improvements in coding, instruction following, and long context understanding with up to 1 million tokens of context.",match:{or:[{equals:"gpt-4.1"},{equals:"gpt-4.1-2025-04-14"}]},context_window:1e6,prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"gpt-4.1-mini",name:"gpt 4.1 mini",description:"GPT-4.1 Mini is a significant leap in small model performance, matching or exceeding GPT-4o in many benchmarks while reducing latency by nearly half and cost by 83%.",match:{or:[{equals:"gpt-4.1-mini"},{equals:"gpt-4.1-mini-2025-04-14"}]},context_window:1e6,prices:{input_mtok:.4,cache_read_mtok:.1,output_mtok:1.6}},{id:"gpt-4.1-nano",name:"gpt 4.1 nano",description:"GPT-4.1 Nano is OpenAI's fastest and cheapest model, delivering exceptional performance for its size with a 1 million token context window, ideal for classification and autocompletion tasks.",match:{or:[{equals:"gpt-4.1-nano"},{equals:"gpt-4.1-nano-2025-04-14"}]},context_window:1e6,prices:{input_mtok:.1,cache_read_mtok:.025,output_mtok:.4}},{id:"gpt-4.5-preview",name:"GPT-4.5 (Preview)",description:"GPT-4.5 (Preview) is a research preview of OpenAI's latest language model, designed to advance capabilities in reasoning, creativity, and multi-turn conversation. It builds on previous iterations with improvements in world knowledge, contextual coherence, and the ability to follow user intent more effectively.",match:{starts_with:"gpt-4.5-preview"},prices:{input_mtok:75,cache_read_mtok:37.5,output_mtok:150}},{id:"gpt-4o",name:"gpt 4o",description:"GPT-4 Optimized (GPT-4o) is designed for high performance in reasoning, creativity, and technical tasks while maintaining consistent output quality.",match:{or:[{equals:"gpt-4o"},{equals:"gpt-4o-2024-05-13"},{equals:"gpt-4o-2024-08-06"},{equals:"gpt-4o-2024-11-20"}]},context_window:128e3,prices:{input_mtok:2.5,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-4o-audio-preview",name:"gpt 4o audio preview",description:"Audio model for gpt-4o",match:{starts_with:"gpt-4o-audio-preview"},context_window:128e3,prices:{output_mtok:10,input_audio_mtok:2.5}},{id:"gpt-4o-mini",name:"gpt 4o mini",description:"GPT-4o Mini is a cost-optimized variant of GPT-4o, designed for high-efficiency processing while maintaining strong performance. It excels in rapid inference and resource-efficient operations, making it ideal for production deployments requiring a balance of cost and capability.",match:{or:[{equals:"gpt-4o-mini"},{equals:"gpt-4o-mini-2024-07-18"},{equals:"gpt-4o-mini-search-preview"},{equals:"gpt-4o-mini-search-preview-2025-03-11"}]},context_window:128e3,prices:{input_mtok:.15,cache_read_mtok:.075,output_mtok:.6}},{id:"gpt-4o-mini-2024-07-18.ft-",description:"GPT-4o Mini fine tuned.",match:{starts_with:"gpt-4o-mini-2024-07-18.ft-"},prices:{input_mtok:.3,output_mtok:1.2}},{id:"gpt-4o-mini-audio-preview",name:"gpt 4o mini audio preview",description:"Audio model for gpt-4o mini",match:{starts_with:"gpt-4o-mini-audio"},prices:{output_mtok:.6,input_audio_mtok:.15}},{id:"gpt-4o-mini-realtime-preview",match:{starts_with:"gpt-4o-mini-realtime"},prices:{input_mtok:.6,cache_read_mtok:.3,output_mtok:2.4,input_audio_mtok:10,cache_audio_read_mtok:.3,output_audio_mtok:20}},{id:"gpt-4o-mini-transcribe",match:{equals:"gpt-4o-mini-transcribe"},prices:{input_mtok:1.25,output_mtok:5,input_audio_mtok:3}},{id:"gpt-4o-mini-tts",match:{equals:"gpt-4o-mini-tts"},prices:{input_mtok:.6,output_audio_mtok:12}},{id:"gpt-4o-realtime-preview",match:{starts_with:"gpt-4o-realtime"},prices:{input_mtok:5,cache_read_mtok:2.5,output_mtok:20,input_audio_mtok:40,cache_audio_read_mtok:2.5,output_audio_mtok:80}},{id:"gpt-4o-search-preview",name:"GPT-4o Search Preview",description:"GPT-4o Search Previewis a specialized model for web search in Chat Completions. It is trained to understand and execute web search queries.",match:{or:[{equals:"gpt-4o-search-preview"},{equals:"gpt-4o-search-preview-2025-03-11"}]},prices:{input_mtok:2.5,output_mtok:10}},{id:"gpt-4o-transcribe",match:{or:[{equals:"gpt-4o-transcribe"},{equals:"gpt-4o-transcribe-diarize"}]},prices:{input_mtok:2.5,output_mtok:10,input_audio_mtok:6}},{id:"gpt-4o:extended",name:"GPT-4o (extended)",description:`GPT-4o ("o" for "omni") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of GPT-4 Turbo while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.`,match:{equals:"gpt-4o:extended"},prices:{input_mtok:6,output_mtok:18}},{id:"gpt-5",name:"GPT-5",description:"GPT-5 is OpenAI's flagship model for coding, reasoning, and agentic tasks across domains.",match:{or:[{equals:"gpt-5"},{equals:"gpt-5-2025-08-07"},{equals:"gpt-5-chat"},{equals:"gpt-5-chat-latest"},{equals:"gpt-5-codex"}]},context_window:4e5,prices:{input_mtok:1.25,cache_read_mtok:.125,output_mtok:10}},{id:"gpt-5-image",match:{equals:"gpt-5-image"},price_comments:"Seen on OpenRouter before OpenAI",prices:{input_mtok:10,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-5-image-mini",match:{equals:"gpt-5-image-mini"},price_comments:"Seen on OpenRouter before OpenAI",prices:{input_mtok:2.5,cache_read_mtok:.25,output_mtok:2}},{id:"gpt-5-mini",name:"GPT-5 mini",description:"GPT-5 mini is a faster, more cost-efficient version of GPT-5. It's great for well-defined tasks and precise prompts.",match:{or:[{equals:"gpt-5-mini"},{equals:"gpt-5-mini-2025-08-07"}]},context_window:4e5,prices:{input_mtok:.25,cache_read_mtok:.025,output_mtok:2}},{id:"gpt-5-nano",name:"GPT-5 nano",description:"GPT-5 Nano is OpenAI's fastest, cheapest version of GPT-5. It's great for summarization and classification tasks.",match:{or:[{equals:"gpt-5-nano"},{starts_with:"gpt-5-nano-"}]},context_window:4e5,prices:{input_mtok:.05,cache_read_mtok:.005,output_mtok:.4}},{id:"gpt-5-pro",match:{or:[{equals:"gpt-5-pro"},{equals:"gpt-5-pro-2025-10-06"}]},context_window:4e5,prices:{input_mtok:15,output_mtok:120}},{id:"gpt-5.1",name:"GPT-5.1",description:"The best model for coding and agentic tasks across industries",match:{or:[{equals:"gpt-5.1"},{equals:"gpt-5.1-2025-11-13"},{equals:"gpt-5.1-codex"},{equals:"gpt-5.1-chat-latest"}]},context_window:4e5,prices:{input_mtok:1.25,cache_read_mtok:.125,output_mtok:10}},{id:"gpt-5.1-codex-mini",name:"GPT-5.1 Codex Mini",match:{or:[{equals:"gpt-5.1-codex-mini"},{equals:"gpt-5.1-mini"}]},context_window:4e5,prices:{input_mtok:.25,cache_read_mtok:.025,output_mtok:2}},{id:"gpt-realtime",match:{or:[{equals:"gpt-realtime"},{equals:"gpt-realtime-2025-08-28"}]},price_comments:"Missing image token prices which we don't support yet",prices:{input_mtok:4,cache_read_mtok:.4,output_mtok:16,input_audio_mtok:32,cache_audio_read_mtok:.4,output_audio_mtok:64}},{id:"gpt-realtime-mini",match:{equals:"gpt-realtime-mini"},price_comments:"Missing image token prices which we don't support yet",prices:{input_mtok:.6,cache_read_mtok:.06,output_mtok:2.4,input_audio_mtok:10,cache_audio_read_mtok:.3,output_audio_mtok:20}},{id:"moderation",description:"All OpenAI moderation models and endpoints are free of charge",match:{contains:"moderation"},prices:{}},{id:"o1",name:"o1",description:"O1 is a model that offers a balance between cost and performance.",match:{or:[{equals:"o1"},{equals:"o1-2024-12-17"},{equals:"o1-preview"},{equals:"o1-preview-2024-09-12"}]},context_window:128e3,prices:{input_mtok:15,cache_read_mtok:7.5,output_mtok:60}},{id:"o1-mini",name:"o1 mini",description:"O1 Mini is a model that offers a balance between cost and performance.",match:{or:[{equals:"o1-mini"},{equals:"o1-mini-2024-09-12"}]},context_window:128e3,prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o1-pro",name:"o1-pro",description:"The o1 series of models are trained with reinforcement learning to think before they answer and perform complex reasoning. The o1-pro model uses more compute to think harder and provide consistently better answers.",match:{or:[{equals:"o1-pro"},{equals:"o1-pro-2025-03-19"}]},prices:{input_mtok:150,output_mtok:600}},{id:"o3",name:"o3",description:"o3 is a well-rounded and powerful model across domains. It sets a new standard for math, science, coding, and visual reasoning tasks. It also excels at technical writing and instruction-following. Use it to think through multi-step problems that involve analysis across text, code, and images. Note that BYOK is required for this model. Set up here: https://openrouter.ai/settings/integrations",match:{or:[{equals:"o3"},{equals:"o3-2025-04-16"}]},prices:[{prices:{input_mtok:10,cache_read_mtok:.5,output_mtok:40}},{constraint:{start_date:"2025-06-10",type:"start_date"},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}}]},{id:"o3-deep-research",match:{or:[{equals:"o3-deep-research"},{equals:"o3-deep-research-2025-06-26"}]},prices:{input_mtok:10,cache_read_mtok:2.5,output_mtok:40}},{id:"o3-mini",name:"o3 Mini",description:"OpenAI o3-mini is a cost-efficient language model optimized for STEM reasoning tasks, particularly excelling in science, mathematics, and coding.",match:{or:[{equals:"o3-mini"},{equals:"o3-mini-2025-01-31"},{equals:"o3-mini-high"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o3-pro",name:"o3 Pro",description:"The o-series of models are trained with reinforcement learning to think before they answer and perform complex reasoning. The o3-pro model uses more compute to think harder and provide consistently better answers.",match:{or:[{equals:"o3-pro"},{equals:"o3-pro-2025-06-10"}]},prices:{input_mtok:20,output_mtok:80}},{id:"o4-mini",name:"o4 Mini High",description:"OpenAI o4-mini-high is the same model as o4-mini with reasoning_effort set to high.",match:{or:[{equals:"o4-mini-2025-04-16"},{equals:"o4-mini-high"},{equals:"o4-mini"}]},prices:{input_mtok:1.1,cache_read_mtok:.275,output_mtok:4.4}},{id:"o4-mini-deep-research",match:{or:[{equals:"o4-mini-deep-research"},{equals:"o4-mini-deep-research-2025-06-26"}]},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"text-davinci-002",match:{equals:"text-davinci-002"},prices:{input_mtok:20,output_mtok:20}},{id:"text-davinci-003",match:{equals:"text-davinci-003"},prices:{input_mtok:20,output_mtok:20}},{id:"text-embedding-3-large",name:"text embedding 3",description:"Text Embedding 3 is a model that offers a balance between cost and performance.",match:{equals:"text-embedding-3-large"},context_window:3072,prices:{input_mtok:.13}},{id:"text-embedding-3-small",name:"text embedding 3",description:"Text Embedding 3 is a model that offers a balance between cost and performance.",match:{equals:"text-embedding-3-small"},context_window:3072,prices:{input_mtok:.02}},{id:"text-embedding-ada-002",name:"text embedding ada",description:"Text Embedding Ada is a model that offers a balance between cost and performance.",match:{or:[{equals:"text-embedding-ada"},{equals:"text-embedding-ada-002"},{equals:"text-embedding-ada-002-v2"}]},context_window:1536,prices:{input_mtok:.1}}]},{id:"openrouter",name:"OpenRouter",pricing_urls:["https://openrouter.ai/models"],api_pattern:"https://(api\\.)?openrouter\\.ai",models:[{id:"01-ai/yi-large",match:{equals:"01-ai/yi-large"},prices:{input_mtok:3,output_mtok:3}},{id:"aetherwiing/mn-starcannon-12b",match:{equals:"aetherwiing/mn-starcannon-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"agentica-org/deepcoder-14b-preview:free",match:{equals:"agentica-org/deepcoder-14b-preview:free"},prices:{}},{id:"ai21/jamba-1-5-large",match:{equals:"ai21/jamba-1-5-large"},prices:{input_mtok:2,output_mtok:8}},{id:"ai21/jamba-1-5-mini",match:{equals:"ai21/jamba-1-5-mini"},prices:{input_mtok:.2,output_mtok:.4}},{id:"ai21/jamba-1.6-large",match:{equals:"ai21/jamba-1.6-large"},prices:{input_mtok:2,output_mtok:8}},{id:"ai21/jamba-1.6-mini",match:{equals:"ai21/jamba-1.6-mini"},prices:{input_mtok:.2,output_mtok:.4}},{id:"ai21/jamba-instruct",match:{equals:"ai21/jamba-instruct"},prices:{input_mtok:.5,output_mtok:.7}},{id:"aion-1.0",name:"Aion-1.0",match:{equals:"aion-1.0"},prices:{input_mtok:4,output_mtok:8}},{id:"aion-1.0-mini",name:"Aion-1.0-Mini",match:{equals:"aion-1.0-mini"},prices:{input_mtok:.7,output_mtok:1.4}},{id:"aion-labs/aion-1.0",match:{equals:"aion-labs/aion-1.0"},prices:{input_mtok:4,output_mtok:8}},{id:"aion-labs/aion-1.0-mini",match:{equals:"aion-labs/aion-1.0-mini"},prices:{input_mtok:.7,output_mtok:1.4}},{id:"aion-labs/aion-rp-llama-3.1-8b",match:{equals:"aion-labs/aion-rp-llama-3.1-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"aion-rp-llama-3.1-8b",name:"Aion-RP 1.0 (8B)",match:{equals:"aion-rp-llama-3.1-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"alfredpros/codellama-7b-instruct-solidity",match:{equals:"alfredpros/codellama-7b-instruct-solidity"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"all-hands/openhands-lm-32b-v0.1",match:{equals:"all-hands/openhands-lm-32b-v0.1"},prices:{input_mtok:2.6,output_mtok:3.4}},{id:"allenai/molmo-7b-d:free",match:{equals:"allenai/molmo-7b-d:free"},prices:{}},{id:"alpindale/goliath-120b",match:{equals:"alpindale/goliath-120b"},prices:{input_mtok:6.5625,output_mtok:9.375}},{id:"alpindale/magnum-72b",match:{equals:"alpindale/magnum-72b"},prices:{input_mtok:1.5,output_mtok:2.25}},{id:"amazon/nova-lite-v1",match:{equals:"amazon/nova-lite-v1"},prices:{input_mtok:.06,output_mtok:.24}},{id:"amazon/nova-micro-v1",match:{equals:"amazon/nova-micro-v1"},prices:{input_mtok:.035,output_mtok:.14}},{id:"amazon/nova-pro-v1",match:{equals:"amazon/nova-pro-v1"},prices:{input_mtok:.8,output_mtok:3.2}},{id:"anthracite-org/magnum-v2-72b",match:{equals:"anthracite-org/magnum-v2-72b"},prices:{input_mtok:3,output_mtok:3}},{id:"anthracite-org/magnum-v4-72b",match:{equals:"anthracite-org/magnum-v4-72b"},prices:{input_mtok:1.5,output_mtok:2.25}},{id:"anthropic/claude-2",match:{or:[{equals:"anthropic/claude-2"},{equals:"anthropic/claude-2.0"},{equals:"anthropic/claude-2.0:beta"},{equals:"anthropic/claude-2.1"},{equals:"anthropic/claude-2.1:beta"},{equals:"anthropic/claude-2:beta"}]},prices:{input_mtok:8,output_mtok:24}},{id:"anthropic/claude-3-haiku",match:{or:[{equals:"anthropic/claude-3-haiku"},{equals:"anthropic/claude-3-haiku:beta"}]},prices:{input_mtok:.25,output_mtok:1.25}},{id:"anthropic/claude-3-opus",match:{or:[{equals:"anthropic/claude-3-opus"},{equals:"anthropic/claude-3-opus:beta"}]},prices:{input_mtok:15,output_mtok:75}},{id:"anthropic/claude-3-sonnet",match:{or:[{equals:"anthropic/claude-3-sonnet"},{equals:"anthropic/claude-3-sonnet:beta"}]},prices:{input_mtok:3,output_mtok:15}},{id:"anthropic/claude-3.5-haiku",match:{or:[{equals:"anthropic/claude-3.5-haiku"},{equals:"anthropic/claude-3.5-haiku-20241022"},{equals:"anthropic/claude-3.5-haiku-20241022:beta"},{equals:"anthropic/claude-3.5-haiku:beta"}]},prices:{input_mtok:.8,output_mtok:4}},{id:"anthropic/claude-3.5-sonnet",match:{or:[{equals:"anthropic/claude-3.5-sonnet"},{equals:"anthropic/claude-3.5-sonnet-20240620"},{equals:"anthropic/claude-3.5-sonnet-20240620:beta"},{equals:"anthropic/claude-3.5-sonnet:beta"}]},prices:{input_mtok:3,output_mtok:15}},{id:"anthropic/claude-3.7-sonnet",match:{or:[{equals:"anthropic/claude-3.7-sonnet"},{equals:"anthropic/claude-3.7-sonnet:beta"},{equals:"anthropic/claude-3.7-sonnet:thinking"}]},prices:{input_mtok:3,output_mtok:15}},{id:"anubis-pro-105b-v1",name:"Anubis Pro 105B V1",match:{equals:"anubis-pro-105b-v1"},prices:{input_mtok:.8,output_mtok:1}},{id:"arcee-blitz",name:"Arcee Blitz",match:{equals:"arcee-blitz"},prices:{input_mtok:.45,output_mtok:.75}},{id:"arliai/qwq-32b-arliai-rpr-v1:free",match:{equals:"arliai/qwq-32b-arliai-rpr-v1:free"},prices:{}},{id:"bytedance-research/ui-tars-72b:free",match:{equals:"bytedance-research/ui-tars-72b:free"},prices:{}},{id:"caller-large",name:"Caller Large",match:{equals:"caller-large"},prices:{input_mtok:.55,output_mtok:.85}},{id:"chatgpt-4o-latest",name:"ChatGPT-4o",match:{equals:"chatgpt-4o-latest"},prices:{input_mtok:5,output_mtok:15}},{id:"claude-2",name:"Claude v2",match:{or:[{equals:"claude-2"},{equals:"claude-2.0"},{equals:"claude-2.0:beta"},{equals:"claude-2.1"},{equals:"claude-2.1:beta"},{equals:"claude-2:beta"}]},prices:{input_mtok:8,output_mtok:24}},{id:"claude-3-haiku",name:"Claude 3 Haiku",match:{or:[{equals:"claude-3-haiku"},{equals:"claude-3-haiku:beta"}]},prices:{input_mtok:.25,cache_write_mtok:.3,cache_read_mtok:.03,output_mtok:1.25}},{id:"claude-3-opus",name:"Claude 3 Opus",match:{or:[{equals:"claude-3-opus"},{equals:"claude-3-opus:beta"}]},prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-3-sonnet",name:"Claude 3 Sonnet",match:{or:[{equals:"claude-3-sonnet"},{equals:"claude-3-sonnet:beta"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3.5-haiku",name:"Claude 3.5 Haiku",match:{or:[{equals:"claude-3.5-haiku"},{equals:"claude-3.5-haiku-20241022"},{equals:"claude-3.5-haiku-20241022:beta"},{equals:"claude-3.5-haiku:beta"}]},prices:{input_mtok:.8,cache_write_mtok:1,cache_read_mtok:.08,output_mtok:4}},{id:"claude-3.5-sonnet",name:"Claude 3.5 Sonnet",match:{or:[{equals:"claude-3.5-sonnet"},{equals:"claude-3.5-sonnet-20240620"},{equals:"claude-3.5-sonnet-20240620:beta"},{equals:"claude-3.5-sonnet:beta"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-3.7-sonnet",name:"Claude 3.7 Sonnet",match:{or:[{equals:"claude-3.7-sonnet"},{equals:"claude-3.7-sonnet:beta"},{equals:"claude-3.7-sonnet:thinking"}]},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"claude-opus-4",name:"Claude Opus 4",match:{equals:"claude-opus-4"},prices:{input_mtok:15,cache_write_mtok:18.75,cache_read_mtok:1.5,output_mtok:75}},{id:"claude-sonnet-4",name:"Claude Sonnet 4",match:{equals:"claude-sonnet-4"},prices:{input_mtok:3,cache_write_mtok:3.75,cache_read_mtok:.3,output_mtok:15}},{id:"codellama-7b-instruct-solidity",name:"CodeLLaMa 7B Instruct Solidity",match:{equals:"codellama-7b-instruct-solidity"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"coder-large",name:"Coder Large",match:{equals:"coder-large"},prices:{input_mtok:.5,output_mtok:.8}},{id:"codestral-2501",name:"Codestral 2501",match:{equals:"codestral-2501"},prices:{input_mtok:.3,output_mtok:.9}},{id:"codex-mini",name:"Codex Mini",match:{equals:"codex-mini"},prices:{input_mtok:1.5,cache_read_mtok:.375,output_mtok:6}},{id:"cognitivecomputations/dolphin-mixtral-8x22b",match:{equals:"cognitivecomputations/dolphin-mixtral-8x22b"},prices:{input_mtok:.9,output_mtok:.9}},{id:"cognitivecomputations/dolphin-mixtral-8x7b",match:{equals:"cognitivecomputations/dolphin-mixtral-8x7b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"cognitivecomputations/dolphin3.0-mistral-24b:free",match:{equals:"cognitivecomputations/dolphin3.0-mistral-24b:free"},prices:{}},{id:"cognitivecomputations/dolphin3.0-r1-mistral-24b:free",match:{equals:"cognitivecomputations/dolphin3.0-r1-mistral-24b:free"},prices:{}},{id:"cohere/command",match:{equals:"cohere/command"},prices:{input_mtok:1,output_mtok:2}},{id:"cohere/command-a",match:{equals:"cohere/command-a"},prices:{input_mtok:2.5,output_mtok:10}},{id:"cohere/command-r",match:{or:[{equals:"cohere/command-r"},{equals:"cohere/command-r-03-2024"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"cohere/command-r-08-2024",match:{equals:"cohere/command-r-08-2024"},prices:{input_mtok:.15,output_mtok:.6}},{id:"cohere/command-r-plus",match:{or:[{equals:"cohere/command-r-plus"},{equals:"cohere/command-r-plus-04-2024"}]},prices:{input_mtok:3,output_mtok:15}},{id:"cohere/command-r-plus-08-2024",match:{equals:"cohere/command-r-plus-08-2024"},prices:{input_mtok:2.5,output_mtok:10}},{id:"cohere/command-r7b-12-2024",match:{equals:"cohere/command-r7b-12-2024"},prices:{input_mtok:.0375,output_mtok:.15}},{id:"command",name:"Command",match:{equals:"command"},prices:{input_mtok:1,output_mtok:2}},{id:"command-a",name:"Command A",match:{equals:"command-a"},prices:{input_mtok:2.5,output_mtok:10}},{id:"command-r",name:"Command R",match:{or:[{equals:"command-r"},{equals:"command-r-03-2024"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"command-r-08-2024",name:"Command R (08-2024)",match:{equals:"command-r-08-2024"},prices:{input_mtok:.15,output_mtok:.6}},{id:"command-r-plus",name:"Command R+",match:{or:[{equals:"command-r-plus"},{equals:"command-r-plus-04-2024"}]},prices:{input_mtok:3,output_mtok:15}},{id:"command-r-plus-08-2024",name:"Command R+ (08-2024)",match:{equals:"command-r-plus-08-2024"},prices:{input_mtok:2.5,output_mtok:10}},{id:"command-r7b-12-2024",name:"Command R7B (12-2024)",match:{equals:"command-r7b-12-2024"},prices:{input_mtok:.0375,output_mtok:.15}},{id:"deepcoder-14b-preview:free",name:"Deepcoder 14B Preview (free)",match:{equals:"deepcoder-14b-preview:free"},prices:{}},{id:"deephermes-3-llama-3-8b-preview:free",name:"DeepHermes 3 Llama 3 8B Preview (free)",match:{equals:"deephermes-3-llama-3-8b-preview:free"},prices:{}},{id:"deepseek-chat",name:"DeepSeek V3",match:{equals:"deepseek-chat"},prices:{input_mtok:.38,output_mtok:.89}},{id:"deepseek-chat-v3-0324",name:"DeepSeek V3 0324",match:{equals:"deepseek-chat-v3-0324"},prices:{input_mtok:.3,output_mtok:.88}},{id:"deepseek-chat-v3-0324:free",name:"DeepSeek V3 0324 (free)",match:{equals:"deepseek-chat-v3-0324:free"},prices:{}},{id:"deepseek-chat:free",name:"DeepSeek V3 (free)",match:{equals:"deepseek-chat:free"},prices:{}},{id:"deepseek-prover-v2",name:"DeepSeek Prover V2",match:{equals:"deepseek-prover-v2"},prices:{input_mtok:.5,output_mtok:2.18}},{id:"deepseek-r1",name:"R1",match:{equals:"deepseek-r1"},prices:{input_mtok:.45,output_mtok:2.15}},{id:"deepseek-r1-0528",name:"R1 0528",match:{equals:"deepseek-r1-0528"},prices:{input_mtok:.5,output_mtok:2.15}},{id:"deepseek-r1-0528-qwen3-8b",name:"Deepseek R1 0528 Qwen3 8B",match:{equals:"deepseek-r1-0528-qwen3-8b"},prices:{input_mtok:.05,output_mtok:.1}},{id:"deepseek-r1-0528-qwen3-8b:free",name:"Deepseek R1 0528 Qwen3 8B (free)",match:{equals:"deepseek-r1-0528-qwen3-8b:free"},prices:{}},{id:"deepseek-r1-0528:free",name:"R1 0528 (free)",match:{equals:"deepseek-r1-0528:free"},prices:{}},{id:"deepseek-r1-distill-llama-70b",name:"R1 Distill Llama 70B",match:{equals:"deepseek-r1-distill-llama-70b"},prices:{input_mtok:.1,output_mtok:.4}},{id:"deepseek-r1-distill-llama-70b:free",name:"R1 Distill Llama 70B (free)",match:{equals:"deepseek-r1-distill-llama-70b:free"},prices:{}},{id:"deepseek-r1-distill-llama-8b",name:"R1 Distill Llama 8B",match:{equals:"deepseek-r1-distill-llama-8b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"deepseek-r1-distill-qwen-1.5b",name:"R1 Distill Qwen 1.5B",match:{equals:"deepseek-r1-distill-qwen-1.5b"},prices:{input_mtok:.18,output_mtok:.18}},{id:"deepseek-r1-distill-qwen-14b",name:"R1 Distill Qwen 14B",match:{equals:"deepseek-r1-distill-qwen-14b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"deepseek-r1-distill-qwen-14b:free",name:"R1 Distill Qwen 14B (free)",match:{equals:"deepseek-r1-distill-qwen-14b:free"},prices:{}},{id:"deepseek-r1-distill-qwen-32b",name:"R1 Distill Qwen 32B",match:{equals:"deepseek-r1-distill-qwen-32b"},prices:{input_mtok:.12,output_mtok:.18}},{id:"deepseek-r1-distill-qwen-32b:free",name:"R1 Distill Qwen 32B (free)",match:{equals:"deepseek-r1-distill-qwen-32b:free"},prices:{}},{id:"deepseek-r1-distill-qwen-7b",name:"R1 Distill Qwen 7B",match:{equals:"deepseek-r1-distill-qwen-7b"},prices:{input_mtok:.1,output_mtok:.2}},{id:"deepseek-r1:free",name:"R1 (free)",match:{equals:"deepseek-r1:free"},prices:{}},{id:"deepseek-r1t-chimera:free",name:"DeepSeek R1T Chimera (free)",match:{equals:"deepseek-r1t-chimera:free"},prices:{}},{id:"deepseek-v3-base:free",name:"DeepSeek V3 Base (free)",match:{equals:"deepseek-v3-base:free"},prices:{}},{id:"deepseek-v3.1-terminus",name:"DeepSeek V3.1 Terminus",match:{equals:"deepseek-v3.1-terminus"},context_window:163840,prices:{input_mtok:.23,output_mtok:.9}},{id:"deepseek/deepseek-chat",match:{equals:"deepseek/deepseek-chat"},prices:{input_mtok:.38,output_mtok:.89}},{id:"deepseek/deepseek-chat-v3-0324",match:{equals:"deepseek/deepseek-chat-v3-0324"},prices:{input_mtok:.27,output_mtok:1.1}},{id:"deepseek/deepseek-chat-v3-0324:free",match:{equals:"deepseek/deepseek-chat-v3-0324:free"},prices:{}},{id:"deepseek/deepseek-chat-v3.1",name:"DeepSeek Chat V3.1",match:{equals:"deepseek/deepseek-chat-v3.1"},context_window:163840,prices:{input_mtok:.2,output_mtok:.8}},{id:"deepseek/deepseek-chat:free",match:{equals:"deepseek/deepseek-chat:free"},prices:{}},{id:"deepseek/deepseek-r1",match:{equals:"deepseek/deepseek-r1"},prices:{input_mtok:.5,output_mtok:3}},{id:"deepseek/deepseek-r1-distill-llama-70b",match:{equals:"deepseek/deepseek-r1-distill-llama-70b"},prices:{input_mtok:.1,output_mtok:.4}},{id:"deepseek/deepseek-r1-distill-llama-70b:free",match:{equals:"deepseek/deepseek-r1-distill-llama-70b:free"},prices:{}},{id:"deepseek/deepseek-r1-distill-llama-8b",match:{equals:"deepseek/deepseek-r1-distill-llama-8b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"deepseek/deepseek-r1-distill-qwen-1.5b",match:{equals:"deepseek/deepseek-r1-distill-qwen-1.5b"},prices:{input_mtok:.18,output_mtok:.18}},{id:"deepseek/deepseek-r1-distill-qwen-14b",match:{equals:"deepseek/deepseek-r1-distill-qwen-14b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"deepseek/deepseek-r1-distill-qwen-14b:free",match:{equals:"deepseek/deepseek-r1-distill-qwen-14b:free"},prices:{}},{id:"deepseek/deepseek-r1-distill-qwen-32b",match:{equals:"deepseek/deepseek-r1-distill-qwen-32b"},prices:{input_mtok:.12,output_mtok:.18}},{id:"deepseek/deepseek-r1-distill-qwen-32b:free",match:{equals:"deepseek/deepseek-r1-distill-qwen-32b:free"},prices:{}},{id:"deepseek/deepseek-r1-zero:free",match:{equals:"deepseek/deepseek-r1-zero:free"},prices:{}},{id:"deepseek/deepseek-r1:free",match:{equals:"deepseek/deepseek-r1:free"},prices:{}},{id:"deepseek/deepseek-v3-base:free",match:{equals:"deepseek/deepseek-v3-base:free"},prices:{}},{id:"deepseek/deepseek-v3.2-exp",name:"DeepSeek V3.2 Experimental",match:{equals:"deepseek/deepseek-v3.2-exp"},prices:{input_mtok:.27,output_mtok:.4}},{id:"devstral-small",name:"Devstral Small",match:{equals:"devstral-small"},prices:{input_mtok:.06,output_mtok:.12}},{id:"devstral-small:free",name:"Devstral Small (free)",match:{equals:"devstral-small:free"},prices:{}},{id:"dobby-mini-unhinged-plus-llama-3.1-8b",name:"Dobby Mini Plus Llama 3.1 8B",match:{equals:"dobby-mini-unhinged-plus-llama-3.1-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"dolphin-mixtral-8x22b",name:"Dolphin 2.9.2 Mixtral 8x22B 🐬",match:{equals:"dolphin-mixtral-8x22b"},prices:{input_mtok:.9,output_mtok:.9}},{id:"dolphin3.0-mistral-24b:free",name:"Dolphin3.0 Mistral 24B (free)",match:{equals:"dolphin3.0-mistral-24b:free"},prices:{}},{id:"dolphin3.0-r1-mistral-24b:free",name:"Dolphin3.0 R1 Mistral 24B (free)",match:{equals:"dolphin3.0-r1-mistral-24b:free"},prices:{}},{id:"eleutherai/llemma_7b",match:{equals:"eleutherai/llemma_7b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"eva-llama-3.33-70b",name:"EVA Llama 3.33 70B",match:{equals:"eva-llama-3.33-70b"},prices:{input_mtok:4,output_mtok:6}},{id:"eva-qwen-2.5-32b",name:"EVA Qwen2.5 32B",match:{equals:"eva-qwen-2.5-32b"},prices:{input_mtok:2.6,output_mtok:3.4}},{id:"eva-qwen-2.5-72b",name:"EVA Qwen2.5 72B",match:{equals:"eva-qwen-2.5-72b"},prices:{input_mtok:4,output_mtok:6}},{id:"eva-unit-01/eva-llama-3.33-70b",match:{equals:"eva-unit-01/eva-llama-3.33-70b"},prices:{input_mtok:4,output_mtok:6}},{id:"eva-unit-01/eva-qwen-2.5-32b",match:{equals:"eva-unit-01/eva-qwen-2.5-32b"},prices:{input_mtok:2.6,output_mtok:3.4}},{id:"eva-unit-01/eva-qwen-2.5-72b",match:{equals:"eva-unit-01/eva-qwen-2.5-72b"},prices:{input_mtok:.9,output_mtok:1.2}},{id:"featherless/qwerky-72b:free",match:{equals:"featherless/qwerky-72b:free"},prices:{}},{id:"fimbulvetr-11b-v2",name:"Fimbulvetr 11B v2",match:{equals:"fimbulvetr-11b-v2"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"gemini-2.0-flash-001",name:"Gemini 2.0 Flash",match:{equals:"gemini-2.0-flash-001"},prices:{input_mtok:.1,cache_write_mtok:.1833,cache_read_mtok:.025,output_mtok:.4}},{id:"gemini-2.0-flash-exp:free",name:"Gemini 2.0 Flash Experimental (free)",match:{equals:"gemini-2.0-flash-exp:free"},prices:{}},{id:"gemini-2.0-flash-lite-001",name:"Gemini 2.0 Flash Lite",match:{equals:"gemini-2.0-flash-lite-001"},prices:{input_mtok:.075,output_mtok:.3}},{id:"gemini-2.5-flash",name:"Gemini 2.5 Flash",match:{or:[{equals:"gemini-2.5-flash"},{equals:"google/gemini-2.5-flash"}]},prices:{input_mtok:.3,cache_write_mtok:.3833,cache_read_mtok:.075,output_mtok:2.5}},{id:"gemini-2.5-flash-lite-preview-06-17",name:"Gemini 2.5 Flash Lite Preview 06-17",match:{equals:"gemini-2.5-flash-lite-preview-06-17"},prices:{input_mtok:.1,output_mtok:.4}},{id:"gemini-2.5-flash-preview",name:"Gemini 2.5 Flash Preview 04-17",match:{or:[{equals:"gemini-2.5-flash-preview"},{equals:"gemini-2.5-flash-preview-05-20"}]},prices:{input_mtok:.15,cache_write_mtok:.2333,cache_read_mtok:.0375,output_mtok:.6}},{id:"gemini-2.5-flash-preview-05-20:thinking",name:"Gemini 2.5 Flash Preview 05-20 (thinking)",match:{equals:"gemini-2.5-flash-preview-05-20:thinking"},prices:{input_mtok:.15,cache_write_mtok:.2333,cache_read_mtok:.0375,output_mtok:3.5}},{id:"gemini-2.5-flash-preview:thinking",name:"Gemini 2.5 Flash Preview 04-17 (thinking)",match:{equals:"gemini-2.5-flash-preview:thinking"},prices:{input_mtok:.15,cache_write_mtok:.2333,cache_read_mtok:.0375,output_mtok:3.5}},{id:"gemini-2.5-pro",name:"Gemini 2.5 Pro",match:{or:[{equals:"gemini-2.5-pro"},{equals:"gemini-2.5-pro-preview"},{equals:"gemini-2.5-pro-preview-05-06"},{equals:"google/gemini-2.5-pro"},{equals:"google/gemini-2.5-pro-preview"},{equals:"google/gemini-2.5-pro-preview-05-06"}]},prices:{input_mtok:1.25,cache_write_mtok:1.625,cache_read_mtok:.31,output_mtok:10}},{id:"gemini-2.5-pro-exp-03-25",name:"Gemini 2.5 Pro Experimental",match:{equals:"gemini-2.5-pro-exp-03-25"},prices:{}},{id:"gemini-flash-1.5",name:"Gemini 1.5 Flash",match:{equals:"gemini-flash-1.5"},prices:{input_mtok:.075,cache_write_mtok:.1583,cache_read_mtok:.01875,output_mtok:.3}},{id:"gemini-flash-1.5-8b",name:"Gemini 1.5 Flash 8B",match:{equals:"gemini-flash-1.5-8b"},prices:{input_mtok:.0375,cache_write_mtok:.0583,cache_read_mtok:.01,output_mtok:.15}},{id:"gemini-pro-1.5",name:"Gemini 1.5 Pro",match:{equals:"gemini-pro-1.5"},prices:{input_mtok:1.25,output_mtok:5}},{id:"gemma-2-27b-it",name:"Gemma 2 27B",match:{equals:"gemma-2-27b-it"},prices:{input_mtok:.8,output_mtok:.8}},{id:"gemma-2-9b-it",name:"Gemma 2 9B",match:{equals:"gemma-2-9b-it"},prices:{input_mtok:.2,output_mtok:.2}},{id:"gemma-2-9b-it:free",name:"Gemma 2 9B (free)",match:{equals:"gemma-2-9b-it:free"},prices:{}},{id:"gemma-3-12b-it",name:"Gemma 3 12B",match:{equals:"gemma-3-12b-it"},prices:{input_mtok:.05,output_mtok:.1}},{id:"gemma-3-12b-it:free",name:"Gemma 3 12B (free)",match:{equals:"gemma-3-12b-it:free"},prices:{}},{id:"gemma-3-27b-it",name:"Gemma 3 27B",match:{equals:"gemma-3-27b-it"},prices:{input_mtok:.1,output_mtok:.2}},{id:"gemma-3-27b-it:free",name:"Gemma 3 27B (free)",match:{equals:"gemma-3-27b-it:free"},prices:{}},{id:"gemma-3-4b-it",name:"Gemma 3 4B",match:{equals:"gemma-3-4b-it"},prices:{input_mtok:.02,output_mtok:.04}},{id:"gemma-3-4b-it:free",name:"Gemma 3 4B (free)",match:{equals:"gemma-3-4b-it:free"},prices:{}},{id:"gemma-3n-e4b-it:free",name:"Gemma 3n 4B (free)",match:{equals:"gemma-3n-e4b-it:free"},prices:{}},{id:"glm-4-32b",name:"GLM 4 32B",match:{equals:"glm-4-32b"},prices:{input_mtok:.24,output_mtok:.24}},{id:"glm-4-32b:free",name:"GLM 4 32B (free)",match:{equals:"glm-4-32b:free"},prices:{}},{id:"glm-z1-32b",name:"GLM Z1 32B",match:{equals:"glm-z1-32b"},prices:{input_mtok:.24,output_mtok:.24}},{id:"glm-z1-32b:free",name:"GLM Z1 32B (free)",match:{equals:"glm-z1-32b:free"},prices:{}},{id:"glm-z1-rumination-32b",name:"GLM Z1 Rumination 32B",match:{equals:"glm-z1-rumination-32b"},prices:{input_mtok:.24,output_mtok:.24}},{id:"goliath-120b",name:"Goliath 120B",match:{equals:"goliath-120b"},prices:{input_mtok:10,output_mtok:12.5}},{id:"google/gemini-2.0-flash-001",match:{equals:"google/gemini-2.0-flash-001"},prices:{input_mtok:.1,output_mtok:.4}},{id:"google/gemini-2.0-flash-exp:free",match:{equals:"google/gemini-2.0-flash-exp:free"},prices:{}},{id:"google/gemini-2.0-flash-lite-001",match:{equals:"google/gemini-2.0-flash-lite-001"},prices:{input_mtok:.075,output_mtok:.3}},{id:"google/gemini-2.0-flash-thinking-exp-1219:free",match:{equals:"google/gemini-2.0-flash-thinking-exp-1219:free"},prices:{}},{id:"google/gemini-2.0-flash-thinking-exp:free",match:{equals:"google/gemini-2.0-flash-thinking-exp:free"},prices:{}},{id:"google/gemini-2.5-flash-image",name:"Gemini 2.5 Flash Image (Nano Banana)",match:{or:[{equals:"google/gemini-2.5-flash-image"},{equals:"google/gemini-2.5-flash-image-preview"}]},prices:{input_mtok:.3,output_mtok:2.5}},{id:"google/gemini-2.5-flash-lite",name:"Gemini 2.5 Flash Lite",match:{equals:"google/gemini-2.5-flash-lite"},prices:{input_mtok:.1,cache_write_mtok:.183,cache_read_mtok:.025,output_mtok:.4}},{id:"google/gemini-2.5-flash-lite-preview-09-2025",name:"Gemini 2.5 Flash Lite Preview 09-2025",match:{equals:"google/gemini-2.5-flash-lite-preview-09-2025"},prices:{input_mtok:.1,output_mtok:.4}},{id:"google/gemini-2.5-flash-preview",match:{equals:"google/gemini-2.5-flash-preview"},prices:{input_mtok:.15,output_mtok:.6}},{id:"google/gemini-2.5-flash-preview-09-2025",name:"Gemini 2.5 Flash Preview 09-2025",match:{equals:"google/gemini-2.5-flash-preview-09-2025"},prices:{input_mtok:.3,cache_write_mtok:.383,cache_read_mtok:.075,output_mtok:2.5}},{id:"google/gemini-2.5-flash-preview:thinking",match:{equals:"google/gemini-2.5-flash-preview:thinking"},prices:{input_mtok:.15,output_mtok:3.5}},{id:"google/gemini-2.5-pro-exp-03-25:free",match:{equals:"google/gemini-2.5-pro-exp-03-25:free"},prices:{}},{id:"google/gemini-2.5-pro-preview-03-25",match:{equals:"google/gemini-2.5-pro-preview-03-25"},prices:{input_mtok:1.25,output_mtok:10}},{id:"google/gemini-flash-1.5",match:{equals:"google/gemini-flash-1.5"},prices:{input_mtok:.075,output_mtok:.3}},{id:"google/gemini-flash-1.5-8b",match:{equals:"google/gemini-flash-1.5-8b"},prices:{input_mtok:.0375,output_mtok:.15}},{id:"google/gemini-flash-1.5-8b-exp",match:{equals:"google/gemini-flash-1.5-8b-exp"},prices:{}},{id:"google/gemini-pro",match:{or:[{equals:"google/gemini-pro"},{equals:"google/gemini-pro-vision"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"google/gemini-pro-1.5",match:{equals:"google/gemini-pro-1.5"},prices:{input_mtok:1.25,output_mtok:5}},{id:"google/gemma-2-27b-it",match:{equals:"google/gemma-2-27b-it"},prices:{input_mtok:.8,output_mtok:.8}},{id:"google/gemma-2-9b-it",match:{equals:"google/gemma-2-9b-it"},prices:{input_mtok:.07,output_mtok:.07}},{id:"google/gemma-2-9b-it:free",match:{equals:"google/gemma-2-9b-it:free"},prices:{}},{id:"google/gemma-3-12b-it",match:{equals:"google/gemma-3-12b-it"},prices:{input_mtok:.05,output_mtok:.1}},{id:"google/gemma-3-12b-it:free",match:{equals:"google/gemma-3-12b-it:free"},prices:{}},{id:"google/gemma-3-1b-it:free",match:{equals:"google/gemma-3-1b-it:free"},prices:{}},{id:"google/gemma-3-27b-it",match:{equals:"google/gemma-3-27b-it"},prices:{input_mtok:.1,output_mtok:.2}},{id:"google/gemma-3-27b-it:free",match:{equals:"google/gemma-3-27b-it:free"},prices:{}},{id:"google/gemma-3-4b-it",match:{equals:"google/gemma-3-4b-it"},prices:{input_mtok:.02,output_mtok:.04}},{id:"google/gemma-3-4b-it:free",match:{equals:"google/gemma-3-4b-it:free"},prices:{}},{id:"google/learnlm-1.5-pro-experimental:free",match:{equals:"google/learnlm-1.5-pro-experimental:free"},prices:{}},{id:"google/palm-2-chat-bison",match:{or:[{equals:"google/palm-2-chat-bison"},{equals:"google/palm-2-chat-bison-32k"}]},prices:{input_mtok:1,output_mtok:2}},{id:"google/palm-2-codechat-bison",match:{or:[{equals:"google/palm-2-codechat-bison"},{equals:"google/palm-2-codechat-bison-32k"}]},prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo",name:"GPT-3.5 Turbo",match:{or:[{equals:"gpt-3.5-turbo"},{equals:"gpt-3.5-turbo-0125"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"gpt-3.5-turbo-0613",name:"GPT-3.5 Turbo (older v0613)",match:{equals:"gpt-3.5-turbo-0613"},prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo-1106",name:"GPT-3.5 Turbo 16k (older v1106)",match:{equals:"gpt-3.5-turbo-1106"},prices:{input_mtok:1,output_mtok:2}},{id:"gpt-3.5-turbo-16k",name:"GPT-3.5 Turbo 16k",match:{equals:"gpt-3.5-turbo-16k"},prices:{input_mtok:3,output_mtok:4}},{id:"gpt-3.5-turbo-instruct",name:"GPT-3.5 Turbo Instruct",match:{equals:"gpt-3.5-turbo-instruct"},prices:{input_mtok:1.5,output_mtok:2}},{id:"gpt-4",name:"GPT-4",match:{or:[{equals:"gpt-4"},{equals:"gpt-4-0314"}]},prices:{input_mtok:30,output_mtok:60}},{id:"gpt-4-1106-preview",name:"GPT-4 Turbo (older v1106)",match:{equals:"gpt-4-1106-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4-turbo",name:"GPT-4 Turbo",match:{or:[{equals:"gpt-4-turbo"},{equals:"gpt-4-turbo-preview"}]},prices:{input_mtok:10,output_mtok:30}},{id:"gpt-4.1",name:"GPT-4.1",match:{equals:"gpt-4.1"},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"gpt-4.1-mini",name:"GPT-4.1 Mini",match:{equals:"gpt-4.1-mini"},prices:{input_mtok:.4,cache_read_mtok:.1,output_mtok:1.6}},{id:"gpt-4.1-nano",name:"GPT-4.1 Nano",match:{equals:"gpt-4.1-nano"},prices:{input_mtok:.1,cache_read_mtok:.025,output_mtok:.4}},{id:"gpt-4.5-preview",name:"GPT-4.5 (Preview)",match:{equals:"gpt-4.5-preview"},prices:{input_mtok:75,cache_read_mtok:37.5,output_mtok:150}},{id:"gpt-4o",name:"GPT-4o",match:{or:[{equals:"gpt-4o"},{equals:"gpt-4o-2024-08-06"},{equals:"gpt-4o-2024-11-20"}]},prices:{input_mtok:2.5,cache_read_mtok:1.25,output_mtok:10}},{id:"gpt-4o-2024-05-13",name:"GPT-4o (2024-05-13)",match:{equals:"gpt-4o-2024-05-13"},prices:{input_mtok:5,output_mtok:15}},{id:"gpt-4o-mini",name:"GPT-4o-mini",match:{or:[{equals:"gpt-4o-mini"},{equals:"gpt-4o-mini-2024-07-18"}]},prices:{input_mtok:.15,cache_read_mtok:.075,output_mtok:.6}},{id:"gpt-4o-mini-search-preview",name:"GPT-4o-mini Search Preview",match:{equals:"gpt-4o-mini-search-preview"},prices:{input_mtok:.15,output_mtok:.6}},{id:"gpt-4o-search-preview",name:"GPT-4o Search Preview",match:{equals:"gpt-4o-search-preview"},prices:{input_mtok:2.5,output_mtok:10}},{id:"gpt-4o:extended",name:"GPT-4o (extended)",match:{equals:"gpt-4o:extended"},prices:{input_mtok:6,output_mtok:18}},{id:"grok-2-1212",name:"Grok 2 1212",match:{equals:"grok-2-1212"},prices:{input_mtok:2,output_mtok:10}},{id:"grok-2-vision-1212",name:"Grok 2 Vision 1212",match:{equals:"grok-2-vision-1212"},prices:{input_mtok:2,output_mtok:10}},{id:"grok-3",name:"Grok 3",match:{or:[{equals:"grok-3"},{equals:"grok-3-beta"}]},prices:{input_mtok:3,cache_read_mtok:.75,output_mtok:15}},{id:"grok-3-mini",name:"Grok 3 Mini",match:{or:[{equals:"grok-3-mini"},{equals:"grok-3-mini-beta"}]},prices:{input_mtok:.3,cache_read_mtok:.075,output_mtok:.5}},{id:"grok-beta",name:"Grok Beta",match:{equals:"grok-beta"},prices:{input_mtok:5,output_mtok:15}},{id:"grok-vision-beta",name:"Grok Vision Beta",match:{equals:"grok-vision-beta"},prices:{input_mtok:5,output_mtok:15}},{id:"gryphe/mythomax-l2-13b",match:{equals:"gryphe/mythomax-l2-13b"},prices:{input_mtok:.065,output_mtok:.065}},{id:"hermes-2-pro-llama-3-8b",name:"Hermes 2 Pro - Llama-3 8B",match:{equals:"hermes-2-pro-llama-3-8b"},prices:{input_mtok:.025,output_mtok:.04}},{id:"hermes-3-llama-3.1-405b",name:"Hermes 3 405B Instruct",match:{equals:"hermes-3-llama-3.1-405b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"hermes-3-llama-3.1-70b",name:"Hermes 3 70B Instruct",match:{equals:"hermes-3-llama-3.1-70b"},prices:{input_mtok:.12,output_mtok:.3}},{id:"huggingfaceh4/zephyr-7b-beta:free",match:{equals:"huggingfaceh4/zephyr-7b-beta:free"},prices:{}},{id:"infermatic/mn-inferor-12b",match:{equals:"infermatic/mn-inferor-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"inflection-3-pi",name:"Inflection 3 Pi",match:{equals:"inflection-3-pi"},prices:{input_mtok:2.5,output_mtok:10}},{id:"inflection-3-productivity",name:"Inflection 3 Productivity",match:{equals:"inflection-3-productivity"},prices:{input_mtok:2.5,output_mtok:10}},{id:"inflection/inflection-3-pi",match:{equals:"inflection/inflection-3-pi"},prices:{input_mtok:2.5,output_mtok:10}},{id:"inflection/inflection-3-productivity",match:{equals:"inflection/inflection-3-productivity"},prices:{input_mtok:2.5,output_mtok:10}},{id:"internvl3-14b:free",name:"InternVL3 14B (free)",match:{equals:"internvl3-14b:free"},prices:{}},{id:"internvl3-2b:free",name:"InternVL3 2B (free)",match:{equals:"internvl3-2b:free"},prices:{}},{id:"jamba-1.6-large",name:"Jamba 1.6 Large",match:{equals:"jamba-1.6-large"},prices:{input_mtok:2,output_mtok:8}},{id:"jamba-1.6-mini",name:"Jamba Mini 1.6",match:{equals:"jamba-1.6-mini"},prices:{input_mtok:.2,output_mtok:.4}},{id:"jondurbin/airoboros-l2-70b",match:{equals:"jondurbin/airoboros-l2-70b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"kimi-dev-72b:free",name:"Kimi Dev 72b (free)",match:{equals:"kimi-dev-72b:free"},prices:{}},{id:"kimi-vl-a3b-thinking:free",name:"Kimi VL A3B Thinking (free)",match:{equals:"kimi-vl-a3b-thinking:free"},prices:{}},{id:"l3-euryale-70b",name:"Llama 3 Euryale 70B v2.1",match:{equals:"l3-euryale-70b"},prices:{input_mtok:1.48,output_mtok:1.48}},{id:"l3-lunaris-8b",name:"Llama 3 8B Lunaris",match:{equals:"l3-lunaris-8b"},prices:{input_mtok:.02,output_mtok:.05}},{id:"l3.1-euryale-70b",name:"Llama 3.1 Euryale 70B v2.2",match:{equals:"l3.1-euryale-70b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"l3.3-euryale-70b",name:"Llama 3.3 Euryale 70B",match:{equals:"l3.3-euryale-70b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"latitudegames/wayfarer-large-70b-llama-3.3",match:{equals:"latitudegames/wayfarer-large-70b-llama-3.3"},prices:{input_mtok:.8,output_mtok:.9}},{id:"lfm-3b",name:"LFM 3B",match:{equals:"lfm-3b"},prices:{input_mtok:.02,output_mtok:.02}},{id:"lfm-40b",name:"LFM 40B MoE",match:{equals:"lfm-40b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"lfm-7b",name:"LFM 7B",match:{equals:"lfm-7b"},prices:{input_mtok:.01,output_mtok:.01}},{id:"liquid/lfm-3b",match:{equals:"liquid/lfm-3b"},prices:{input_mtok:.02,output_mtok:.02}},{id:"liquid/lfm-40b",match:{equals:"liquid/lfm-40b"},prices:{input_mtok:.15,output_mtok:.15}},{id:"liquid/lfm-7b",match:{equals:"liquid/lfm-7b"},prices:{input_mtok:.01,output_mtok:.01}},{id:"llama-3-70b-instruct",name:"Llama 3 70B Instruct",match:{equals:"llama-3-70b-instruct"},prices:{input_mtok:.3,output_mtok:.4}},{id:"llama-3-8b-instruct",name:"Llama 3 8B Instruct",match:{equals:"llama-3-8b-instruct"},prices:{input_mtok:.03,output_mtok:.06}},{id:"llama-3-lumimaid-70b",name:"Llama 3 Lumimaid 70B",match:{equals:"llama-3-lumimaid-70b"},prices:{input_mtok:4,output_mtok:6}},{id:"llama-3-lumimaid-8b",name:"Llama 3 Lumimaid 8B",match:{equals:"llama-3-lumimaid-8b"},prices:{input_mtok:.2,output_mtok:1.25}},{id:"llama-3.1-405b",name:"Llama 3.1 405B (base)",match:{equals:"llama-3.1-405b"},prices:{input_mtok:2,output_mtok:2}},{id:"llama-3.1-405b-instruct",name:"Llama 3.1 405B Instruct",match:{equals:"llama-3.1-405b-instruct"},prices:{input_mtok:.8,output_mtok:.8}},{id:"llama-3.1-70b-instruct",name:"Llama 3.1 70B Instruct",match:{equals:"llama-3.1-70b-instruct"},prices:{input_mtok:.1,output_mtok:.28}},{id:"llama-3.1-8b-instruct",name:"Llama 3.1 8B Instruct",match:{equals:"llama-3.1-8b-instruct"},prices:{input_mtok:.016,output_mtok:.029}},{id:"llama-3.1-8b-instruct:free",name:"Llama 3.1 8B Instruct (free)",match:{equals:"llama-3.1-8b-instruct:free"},prices:{}},{id:"llama-3.1-lumimaid-70b",name:"Lumimaid v0.2 70B",match:{equals:"llama-3.1-lumimaid-70b"},prices:{input_mtok:2.5,output_mtok:3}},{id:"llama-3.1-lumimaid-8b",name:"Lumimaid v0.2 8B",match:{equals:"llama-3.1-lumimaid-8b"},prices:{input_mtok:.2,output_mtok:1.25}},{id:"llama-3.1-nemotron-70b-instruct",name:"Llama 3.1 Nemotron 70B Instruct",match:{equals:"llama-3.1-nemotron-70b-instruct"},prices:{input_mtok:.12,output_mtok:.3}},{id:"llama-3.1-nemotron-ultra-253b-v1",name:"Llama 3.1 Nemotron Ultra 253B v1",match:{equals:"llama-3.1-nemotron-ultra-253b-v1"},prices:{input_mtok:.6,output_mtok:1.8}},{id:"llama-3.1-nemotron-ultra-253b-v1:free",name:"Llama 3.1 Nemotron Ultra 253B v1 (free)",match:{equals:"llama-3.1-nemotron-ultra-253b-v1:free"},prices:{}},{id:"llama-3.1-sonar-large-128k-online",name:"Llama 3.1 Sonar 70B Online",match:{equals:"llama-3.1-sonar-large-128k-online"},prices:{input_mtok:1,output_mtok:1}},{id:"llama-3.1-sonar-small-128k-online",name:"Llama 3.1 Sonar 8B Online",match:{equals:"llama-3.1-sonar-small-128k-online"},prices:{input_mtok:.2,output_mtok:.2}},{id:"llama-3.2-11b-vision-instruct",name:"Llama 3.2 11B Vision Instruct",match:{equals:"llama-3.2-11b-vision-instruct"},prices:{input_mtok:.049,output_mtok:.049}},{id:"llama-3.2-11b-vision-instruct:free",name:"Llama 3.2 11B Vision Instruct (free)",match:{equals:"llama-3.2-11b-vision-instruct:free"},prices:{}},{id:"llama-3.2-1b-instruct",name:"Llama 3.2 1B Instruct",match:{equals:"llama-3.2-1b-instruct"},prices:{input_mtok:.005,output_mtok:.01}},{id:"llama-3.2-1b-instruct:free",name:"Llama 3.2 1B Instruct (free)",match:{equals:"llama-3.2-1b-instruct:free"},prices:{}},{id:"llama-3.2-3b-instruct",name:"Llama 3.2 3B Instruct",match:{equals:"llama-3.2-3b-instruct"},prices:{input_mtok:.01,output_mtok:.02}},{id:"llama-3.2-3b-instruct:free",name:"Llama 3.2 3B Instruct (free)",match:{equals:"llama-3.2-3b-instruct:free"},prices:{}},{id:"llama-3.2-90b-vision-instruct",name:"Llama 3.2 90B Vision Instruct",match:{equals:"llama-3.2-90b-vision-instruct"},prices:{input_mtok:1.2,output_mtok:1.2}},{id:"llama-3.3-70b-instruct",name:"Llama 3.3 70B Instruct",match:{equals:"llama-3.3-70b-instruct"},prices:{input_mtok:.05,output_mtok:.24}},{id:"llama-3.3-70b-instruct:free",name:"Llama 3.3 70B Instruct (free)",match:{equals:"llama-3.3-70b-instruct:free"},prices:{}},{id:"llama-3.3-8b-instruct:free",name:"Llama 3.3 8B Instruct (free)",match:{equals:"llama-3.3-8b-instruct:free"},prices:{}},{id:"llama-3.3-nemotron-super-49b-v1",name:"Llama 3.3 Nemotron Super 49B v1",match:{equals:"llama-3.3-nemotron-super-49b-v1"},prices:{input_mtok:.13,output_mtok:.4}},{id:"llama-3.3-nemotron-super-49b-v1:free",name:"Llama 3.3 Nemotron Super 49B v1 (free)",match:{equals:"llama-3.3-nemotron-super-49b-v1:free"},prices:{}},{id:"llama-4-maverick",name:"Llama 4 Maverick",match:{equals:"llama-4-maverick"},prices:{input_mtok:.15,output_mtok:.6}},{id:"llama-4-maverick:free",name:"Llama 4 Maverick (free)",match:{equals:"llama-4-maverick:free"},prices:{}},{id:"llama-4-scout",name:"Llama 4 Scout",match:{equals:"llama-4-scout"},prices:{input_mtok:.08,output_mtok:.3}},{id:"llama-4-scout:free",name:"Llama 4 Scout (free)",match:{equals:"llama-4-scout:free"},prices:{}},{id:"llama-guard-2-8b",name:"LlamaGuard 2 8B",match:{equals:"llama-guard-2-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"llama-guard-3-8b",name:"Llama Guard 3 8B",match:{equals:"llama-guard-3-8b"},prices:{input_mtok:.02,output_mtok:.06}},{id:"llama-guard-4-12b",name:"Llama Guard 4 12B",match:{equals:"llama-guard-4-12b"},prices:{input_mtok:.05,output_mtok:.05}},{id:"llama3.1-typhoon2-70b-instruct",name:"Typhoon2 70B Instruct",match:{equals:"llama3.1-typhoon2-70b-instruct"},prices:{input_mtok:.88,output_mtok:.88}},{id:"llemma_7b",name:"Llemma 7b",match:{equals:"llemma_7b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"maestro-reasoning",name:"Maestro Reasoning",match:{equals:"maestro-reasoning"},prices:{input_mtok:.9,output_mtok:3.3}},{id:"magistral-medium-2506",name:"Magistral Medium 2506",match:{or:[{equals:"magistral-medium-2506"},{equals:"magistral-medium-2506:thinking"}]},prices:{input_mtok:2,output_mtok:5}},{id:"magistral-small-2506",name:"Magistral Small 2506",match:{equals:"magistral-small-2506"},prices:{input_mtok:.5,output_mtok:1.5}},{id:"magnum-72b",name:"Magnum 72B",match:{equals:"magnum-72b"},prices:{input_mtok:4,output_mtok:6}},{id:"magnum-v2-72b",name:"Magnum v2 72B",match:{equals:"magnum-v2-72b"},prices:{input_mtok:3,output_mtok:3}},{id:"magnum-v4-72b",name:"Magnum v4 72B",match:{equals:"magnum-v4-72b"},prices:{input_mtok:2.5,output_mtok:3}},{id:"mai-ds-r1:free",name:"MAI DS R1 (free)",match:{equals:"mai-ds-r1:free"},prices:{}},{id:"mancer/weaver",match:{equals:"mancer/weaver"},prices:{input_mtok:1.125,output_mtok:1.125}},{id:"mercury-coder-small-beta",name:"Mercury Coder Small Beta",match:{equals:"mercury-coder-small-beta"},prices:{input_mtok:.25,output_mtok:1}},{id:"meta-llama/llama-2-13b-chat",match:{equals:"meta-llama/llama-2-13b-chat"},prices:{input_mtok:.22,output_mtok:.22}},{id:"meta-llama/llama-2-70b-chat",match:{equals:"meta-llama/llama-2-70b-chat"},prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/llama-3-70b-instruct",match:{equals:"meta-llama/llama-3-70b-instruct"},prices:{input_mtok:.3,output_mtok:.4}},{id:"meta-llama/llama-3-8b-instruct",match:{equals:"meta-llama/llama-3-8b-instruct"},prices:{input_mtok:.03,output_mtok:.06}},{id:"meta-llama/llama-3.1-405b",match:{equals:"meta-llama/llama-3.1-405b"},prices:{input_mtok:2,output_mtok:2}},{id:"meta-llama/llama-3.1-405b-instruct",match:{equals:"meta-llama/llama-3.1-405b-instruct"},prices:{input_mtok:.8,output_mtok:.8}},{id:"meta-llama/llama-3.1-405b:free",match:{equals:"meta-llama/llama-3.1-405b:free"},prices:{}},{id:"meta-llama/llama-3.1-70b-instruct",match:{equals:"meta-llama/llama-3.1-70b-instruct"},prices:{input_mtok:.119,output_mtok:.39}},{id:"meta-llama/llama-3.1-8b-instruct",match:{equals:"meta-llama/llama-3.1-8b-instruct"},prices:{input_mtok:.02,output_mtok:.03}},{id:"meta-llama/llama-3.1-8b-instruct:free",match:{equals:"meta-llama/llama-3.1-8b-instruct:free"},prices:{}},{id:"meta-llama/llama-3.2-11b-vision-instruct",match:{equals:"meta-llama/llama-3.2-11b-vision-instruct"},prices:{input_mtok:.049,output_mtok:.049}},{id:"meta-llama/llama-3.2-11b-vision-instruct:free",match:{equals:"meta-llama/llama-3.2-11b-vision-instruct:free"},prices:{}},{id:"meta-llama/llama-3.2-1b-instruct",match:{equals:"meta-llama/llama-3.2-1b-instruct"},prices:{input_mtok:.01,output_mtok:.01}},{id:"meta-llama/llama-3.2-1b-instruct:free",match:{equals:"meta-llama/llama-3.2-1b-instruct:free"},prices:{}},{id:"meta-llama/llama-3.2-3b-instruct",match:{equals:"meta-llama/llama-3.2-3b-instruct"},prices:{input_mtok:.015,output_mtok:.025}},{id:"meta-llama/llama-3.2-3b-instruct:free",match:{equals:"meta-llama/llama-3.2-3b-instruct:free"},prices:{}},{id:"meta-llama/llama-3.2-90b-vision-instruct",match:{equals:"meta-llama/llama-3.2-90b-vision-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/llama-3.3-70b-instruct",match:{equals:"meta-llama/llama-3.3-70b-instruct"},prices:{input_mtok:.1,output_mtok:.25}},{id:"meta-llama/llama-3.3-70b-instruct:free",match:{equals:"meta-llama/llama-3.3-70b-instruct:free"},prices:{}},{id:"meta-llama/llama-4-maverick",match:{equals:"meta-llama/llama-4-maverick"},prices:{input_mtok:.17,output_mtok:.85}},{id:"meta-llama/llama-4-maverick:free",match:{equals:"meta-llama/llama-4-maverick:free"},prices:{}},{id:"meta-llama/llama-4-scout",match:{equals:"meta-llama/llama-4-scout"},prices:{input_mtok:.08,output_mtok:.3}},{id:"meta-llama/llama-4-scout:free",match:{equals:"meta-llama/llama-4-scout:free"},prices:{}},{id:"meta-llama/llama-guard-2-8b",match:{equals:"meta-llama/llama-guard-2-8b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"meta-llama/llama-guard-3-8b",match:{equals:"meta-llama/llama-guard-3-8b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"microsoft/phi-3-medium-128k-instruct",match:{equals:"microsoft/phi-3-medium-128k-instruct"},prices:{input_mtok:1,output_mtok:1}},{id:"microsoft/phi-3-mini-128k-instruct",match:{equals:"microsoft/phi-3-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"microsoft/phi-3.5-mini-128k-instruct",match:{equals:"microsoft/phi-3.5-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"microsoft/phi-4",match:{equals:"microsoft/phi-4"},prices:{input_mtok:.07,output_mtok:.14}},{id:"microsoft/phi-4-multimodal-instruct",match:{equals:"microsoft/phi-4-multimodal-instruct"},prices:{input_mtok:.05,output_mtok:.1}},{id:"microsoft/wizardlm-2-7b",match:{equals:"microsoft/wizardlm-2-7b"},prices:{input_mtok:.07,output_mtok:.07}},{id:"microsoft/wizardlm-2-8x22b",match:{equals:"microsoft/wizardlm-2-8x22b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"midnight-rose-70b",name:"Midnight Rose 70B",match:{equals:"midnight-rose-70b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"minimax-01",name:"MiniMax-01",match:{equals:"minimax-01"},prices:{input_mtok:.2,output_mtok:1.1}},{id:"minimax-m1",name:"MiniMax M1",match:{equals:"minimax-m1"},prices:{input_mtok:.3,output_mtok:1.65}},{id:"minimax-m1:extended",name:"MiniMax M1 (extended)",match:{equals:"minimax-m1:extended"},prices:{input_mtok:.55,output_mtok:2.2}},{id:"minimax/minimax-01",match:{equals:"minimax/minimax-01"},prices:{input_mtok:.2,output_mtok:1.1}},{id:"ministral-3b",name:"Ministral 3B",match:{equals:"ministral-3b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"ministral-8b",name:"Ministral 8B",match:{equals:"ministral-8b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistral-7b-instruct",name:"Mistral 7B Instruct",match:{or:[{equals:"mistral-7b-instruct"},{equals:"mistral-7b-instruct-v0.3"}]},prices:{input_mtok:.028,output_mtok:.054}},{id:"mistral-7b-instruct-v0.1",name:"Mistral 7B Instruct v0.1",match:{equals:"mistral-7b-instruct-v0.1"},prices:{input_mtok:.11,output_mtok:.19}},{id:"mistral-7b-instruct-v0.2",name:"Mistral 7B Instruct v0.2",match:{equals:"mistral-7b-instruct-v0.2"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistral-7b-instruct:free",name:"Mistral 7B Instruct (free)",match:{equals:"mistral-7b-instruct:free"},prices:{}},{id:"mistral-large",name:"Mistral Large",match:{or:[{equals:"mistral-large"},{equals:"mistral-large-2407"},{equals:"mistral-large-2411"}]},prices:{input_mtok:2,output_mtok:6}},{id:"mistral-medium",name:"Mistral Medium",match:{equals:"mistral-medium"},prices:{input_mtok:2.75,output_mtok:8.1}},{id:"mistral-medium-3",name:"Mistral Medium 3",match:{equals:"mistral-medium-3"},prices:{input_mtok:.4,output_mtok:2}},{id:"mistral-nemo",name:"Mistral Nemo",match:{equals:"mistral-nemo"},prices:{input_mtok:.01,output_mtok:.019}},{id:"mistral-nemo:free",name:"Mistral Nemo (free)",match:{equals:"mistral-nemo:free"},prices:{}},{id:"mistral-saba",name:"Saba",match:{equals:"mistral-saba"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistral-small",name:"Mistral Small",match:{equals:"mistral-small"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistral-small-24b-instruct-2501",name:"Mistral Small 3",match:{equals:"mistral-small-24b-instruct-2501"},prices:{input_mtok:.05,output_mtok:.09}},{id:"mistral-small-24b-instruct-2501:free",name:"Mistral Small 3 (free)",match:{equals:"mistral-small-24b-instruct-2501:free"},prices:{}},{id:"mistral-small-3.1-24b-instruct",name:"Mistral Small 3.1 24B",match:{equals:"mistral-small-3.1-24b-instruct"},prices:{input_mtok:.05,output_mtok:.15}},{id:"mistral-small-3.1-24b-instruct:free",name:"Mistral Small 3.1 24B (free)",match:{equals:"mistral-small-3.1-24b-instruct:free"},prices:{}},{id:"mistral-small-3.2-24b-instruct:free",name:"Mistral Small 3.2 24B (free)",match:{equals:"mistral-small-3.2-24b-instruct:free"},prices:{}},{id:"mistral-tiny",name:"Mistral Tiny",match:{equals:"mistral-tiny"},prices:{input_mtok:.25,output_mtok:.25}},{id:"mistral/ministral-8b",match:{equals:"mistral/ministral-8b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistralai/codestral-2501",match:{equals:"mistralai/codestral-2501"},prices:{input_mtok:.3,output_mtok:.9}},{id:"mistralai/codestral-mamba",match:{equals:"mistralai/codestral-mamba"},prices:{input_mtok:.25,output_mtok:.25}},{id:"mistralai/ministral-3b",match:{equals:"mistralai/ministral-3b"},prices:{input_mtok:.04,output_mtok:.04}},{id:"mistralai/ministral-8b",match:{equals:"mistralai/ministral-8b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistralai/mistral-7b-instruct",match:{or:[{equals:"mistralai/mistral-7b-instruct"},{equals:"mistralai/mistral-7b-instruct-v0.3"}]},prices:{input_mtok:.029,output_mtok:.059}},{id:"mistralai/mistral-7b-instruct-v0.1",match:{equals:"mistralai/mistral-7b-instruct-v0.1"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/mistral-7b-instruct-v0.2",match:{equals:"mistralai/mistral-7b-instruct-v0.2"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/mistral-7b-instruct:free",match:{equals:"mistralai/mistral-7b-instruct:free"},prices:{}},{id:"mistralai/mistral-large",match:{or:[{equals:"mistralai/mistral-large"},{equals:"mistralai/mistral-large-2407"},{equals:"mistralai/mistral-large-2411"}]},prices:{input_mtok:2,output_mtok:6}},{id:"mistralai/mistral-medium",match:{equals:"mistralai/mistral-medium"},prices:{input_mtok:2.75,output_mtok:8.1}},{id:"mistralai/mistral-nemo",match:{equals:"mistralai/mistral-nemo"},prices:{input_mtok:.035,output_mtok:.08}},{id:"mistralai/mistral-nemo:free",match:{equals:"mistralai/mistral-nemo:free"},prices:{}},{id:"mistralai/mistral-saba",match:{equals:"mistralai/mistral-saba"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistralai/mistral-small",match:{equals:"mistralai/mistral-small"},prices:{input_mtok:.2,output_mtok:.6}},{id:"mistralai/mistral-small-24b-instruct-2501",match:{equals:"mistralai/mistral-small-24b-instruct-2501"},prices:{input_mtok:.07,output_mtok:.14}},{id:"mistralai/mistral-small-24b-instruct-2501:free",match:{equals:"mistralai/mistral-small-24b-instruct-2501:free"},prices:{}},{id:"mistralai/mistral-small-3.1-24b-instruct",match:{equals:"mistralai/mistral-small-3.1-24b-instruct"},prices:{input_mtok:.1,output_mtok:.3}},{id:"mistralai/mistral-small-3.1-24b-instruct:free",match:{equals:"mistralai/mistral-small-3.1-24b-instruct:free"},prices:{}},{id:"mistralai/mistral-tiny",match:{equals:"mistralai/mistral-tiny"},prices:{input_mtok:.25,output_mtok:.25}},{id:"mistralai/mixtral-8x22b-instruct",match:{equals:"mistralai/mixtral-8x22b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"mistralai/mixtral-8x7b-instruct",match:{equals:"mistralai/mixtral-8x7b-instruct"},prices:{input_mtok:.24,output_mtok:.24}},{id:"mistralai/pixtral-12b",match:{equals:"mistralai/pixtral-12b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistralai/pixtral-large-2411",match:{equals:"mistralai/pixtral-large-2411"},prices:{input_mtok:2,output_mtok:6}},{id:"mixtral-8x22b-instruct",name:"Mixtral 8x22B Instruct",match:{equals:"mixtral-8x22b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"mixtral-8x7b-instruct",name:"Mixtral 8x7B Instruct",match:{equals:"mixtral-8x7b-instruct"},prices:{input_mtok:.08,output_mtok:.24}},{id:"mn-celeste-12b",name:"Mistral Nemo 12B Celeste",match:{equals:"mn-celeste-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"mn-inferor-12b",name:"Mistral Nemo Inferor 12B",match:{equals:"mn-inferor-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"mn-starcannon-12b",name:"Starcannon 12B",match:{equals:"mn-starcannon-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"moonshotai/kimi-vl-a3b-thinking:free",match:{equals:"moonshotai/kimi-vl-a3b-thinking:free"},prices:{}},{id:"moonshotai/moonlight-16b-a3b-instruct:free",match:{equals:"moonshotai/moonlight-16b-a3b-instruct:free"},prices:{}},{id:"mythalion-13b",name:"Mythalion 13B",match:{equals:"mythalion-13b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"mythomax-l2-13b",name:"MythoMax 13B",match:{equals:"mythomax-l2-13b"},prices:{input_mtok:.065,output_mtok:.065}},{id:"neversleep/llama-3-lumimaid-70b",match:{equals:"neversleep/llama-3-lumimaid-70b"},prices:{input_mtok:3.375,output_mtok:4.5}},{id:"neversleep/llama-3-lumimaid-8b",match:{or:[{equals:"neversleep/llama-3-lumimaid-8b"},{equals:"neversleep/llama-3-lumimaid-8b:extended"}]},prices:{input_mtok:.09375,output_mtok:.75}},{id:"neversleep/llama-3.1-lumimaid-70b",match:{equals:"neversleep/llama-3.1-lumimaid-70b"},prices:{input_mtok:1.5,output_mtok:2.25}},{id:"neversleep/llama-3.1-lumimaid-8b",match:{equals:"neversleep/llama-3.1-lumimaid-8b"},prices:{input_mtok:.09375,output_mtok:.75}},{id:"neversleep/noromaid-20b",match:{equals:"neversleep/noromaid-20b"},prices:{input_mtok:.75,output_mtok:1.5}},{id:"noromaid-20b",name:"Noromaid 20B",match:{equals:"noromaid-20b"},prices:{input_mtok:1.25,output_mtok:2}},{id:"nothingiisreal/mn-celeste-12b",match:{equals:"nothingiisreal/mn-celeste-12b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"nous-hermes-2-mixtral-8x7b-dpo",name:"Hermes 2 Mixtral 8x7B DPO",match:{equals:"nous-hermes-2-mixtral-8x7b-dpo"},prices:{input_mtok:.6,output_mtok:.6}},{id:"nousresearch/deephermes-3-llama-3-8b-preview:free",match:{equals:"nousresearch/deephermes-3-llama-3-8b-preview:free"},prices:{}},{id:"nousresearch/hermes-2-pro-llama-3-8b",match:{equals:"nousresearch/hermes-2-pro-llama-3-8b"},prices:{input_mtok:.025,output_mtok:.04}},{id:"nousresearch/hermes-3-llama-3.1-405b",match:{equals:"nousresearch/hermes-3-llama-3.1-405b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"nousresearch/hermes-3-llama-3.1-70b",match:{equals:"nousresearch/hermes-3-llama-3.1-70b"},prices:{input_mtok:.12,output_mtok:.3}},{id:"nousresearch/nous-hermes-2-mixtral-8x7b-dpo",match:{equals:"nousresearch/nous-hermes-2-mixtral-8x7b-dpo"},prices:{input_mtok:.6,output_mtok:.6}},{id:"nousresearch/nous-hermes-llama2-13b",match:{equals:"nousresearch/nous-hermes-llama2-13b"},prices:{input_mtok:.18,output_mtok:.18}},{id:"nova-lite-v1",name:"Nova Lite 1.0",match:{equals:"nova-lite-v1"},prices:{input_mtok:.06,output_mtok:.24}},{id:"nova-micro-v1",name:"Nova Micro 1.0",match:{equals:"nova-micro-v1"},prices:{input_mtok:.035,output_mtok:.14}},{id:"nova-pro-v1",name:"Nova Pro 1.0",match:{equals:"nova-pro-v1"},prices:{input_mtok:.8,output_mtok:3.2}},{id:"nvidia/llama-3.1-nemotron-70b-instruct",match:{equals:"nvidia/llama-3.1-nemotron-70b-instruct"},prices:{input_mtok:.12,output_mtok:.3}},{id:"nvidia/llama-3.1-nemotron-70b-instruct:free",match:{equals:"nvidia/llama-3.1-nemotron-70b-instruct:free"},prices:{}},{id:"nvidia/llama-3.1-nemotron-nano-8b-v1:free",match:{equals:"nvidia/llama-3.1-nemotron-nano-8b-v1:free"},prices:{}},{id:"nvidia/llama-3.1-nemotron-ultra-253b-v1:free",match:{equals:"nvidia/llama-3.1-nemotron-ultra-253b-v1:free"},prices:{}},{id:"nvidia/llama-3.3-nemotron-super-49b-v1:free",match:{equals:"nvidia/llama-3.3-nemotron-super-49b-v1:free"},prices:{}},{id:"o1",name:"o1",match:{or:[{equals:"o1"},{equals:"o1-preview"},{equals:"o1-preview-2024-09-12"}]},prices:{input_mtok:15,cache_read_mtok:7.5,output_mtok:60}},{id:"o1-mini",name:"o1-mini",match:{or:[{equals:"o1-mini"},{equals:"o1-mini-2024-09-12"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o1-pro",name:"o1-pro",match:{equals:"o1-pro"},prices:{input_mtok:150,output_mtok:600}},{id:"o3",name:"o3",match:{equals:"o3"},prices:{input_mtok:2,cache_read_mtok:.5,output_mtok:8}},{id:"o3-mini",name:"o3 Mini",match:{or:[{equals:"o3-mini"},{equals:"o3-mini-high"}]},prices:{input_mtok:1.1,cache_read_mtok:.55,output_mtok:4.4}},{id:"o3-pro",name:"o3 Pro",match:{equals:"o3-pro"},prices:{input_mtok:20,output_mtok:80}},{id:"o4-mini",name:"o4 Mini",match:{or:[{equals:"o4-mini"},{equals:"o4-mini-high"}]},prices:{input_mtok:1.1,cache_read_mtok:.275,output_mtok:4.4}},{id:"open-r1/olympiccoder-32b:free",match:{equals:"open-r1/olympiccoder-32b:free"},prices:{}},{id:"open-r1/olympiccoder-7b:free",match:{equals:"open-r1/olympiccoder-7b:free"},prices:{}},{id:"openai/chatgpt-4o-latest",match:{equals:"openai/chatgpt-4o-latest"},prices:{input_mtok:5,output_mtok:15}},{id:"openai/gpt-3.5-turbo",match:{or:[{equals:"openai/gpt-3.5-turbo"},{equals:"openai/gpt-3.5-turbo-0125"}]},prices:{input_mtok:.5,output_mtok:1.5}},{id:"openai/gpt-3.5-turbo-0613",match:{equals:"openai/gpt-3.5-turbo-0613"},prices:{input_mtok:1,output_mtok:2}},{id:"openai/gpt-3.5-turbo-1106",match:{equals:"openai/gpt-3.5-turbo-1106"},prices:{input_mtok:1,output_mtok:2}},{id:"openai/gpt-3.5-turbo-16k",match:{equals:"openai/gpt-3.5-turbo-16k"},prices:{input_mtok:3,output_mtok:4}},{id:"openai/gpt-3.5-turbo-instruct",match:{equals:"openai/gpt-3.5-turbo-instruct"},prices:{input_mtok:1.5,output_mtok:2}},{id:"openai/gpt-4",match:{or:[{equals:"openai/gpt-4"},{equals:"openai/gpt-4-0314"}]},prices:{input_mtok:30,output_mtok:60}},{id:"openai/gpt-4-1106-preview",match:{equals:"openai/gpt-4-1106-preview"},prices:{input_mtok:10,output_mtok:30}},{id:"openai/gpt-4-32k",match:{or:[{equals:"openai/gpt-4-32k"},{equals:"openai/gpt-4-32k-0314"}]},prices:{input_mtok:60,output_mtok:120}},{id:"openai/gpt-4-turbo",match:{or:[{equals:"openai/gpt-4-turbo"},{equals:"openai/gpt-4-turbo-preview"}]},prices:{input_mtok:10,output_mtok:30}},{id:"openai/gpt-4.1",match:{equals:"openai/gpt-4.1"},prices:{input_mtok:2,output_mtok:8}},{id:"openai/gpt-4.1-mini",match:{equals:"openai/gpt-4.1-mini"},prices:{input_mtok:.4,output_mtok:1.6}},{id:"openai/gpt-4.1-nano",match:{equals:"openai/gpt-4.1-nano"},prices:{input_mtok:.1,output_mtok:.4}},{id:"openai/gpt-4.5-preview",match:{equals:"openai/gpt-4.5-preview"},prices:{input_mtok:75,output_mtok:150}},{id:"openai/gpt-4o",match:{or:[{equals:"openai/gpt-4o"},{equals:"openai/gpt-4o-2024-08-06"},{equals:"openai/gpt-4o-2024-11-20"},{equals:"openai/gpt-4o-search-preview"}]},prices:{input_mtok:2.5,output_mtok:10}},{id:"openai/gpt-4o-2024-05-13",match:{equals:"openai/gpt-4o-2024-05-13"},prices:{input_mtok:5,output_mtok:15}},{id:"openai/gpt-4o-mini",match:{or:[{equals:"openai/gpt-4o-mini"},{equals:"openai/gpt-4o-mini-2024-07-18"},{equals:"openai/gpt-4o-mini-search-preview"}]},prices:{input_mtok:.15,output_mtok:.6}},{id:"openai/gpt-4o:extended",match:{equals:"openai/gpt-4o:extended"},prices:{input_mtok:6,output_mtok:18}},{id:"openai/o1",match:{or:[{equals:"openai/o1"},{equals:"openai/o1-preview"},{equals:"openai/o1-preview-2024-09-12"}]},prices:{input_mtok:15,output_mtok:60}},{id:"openai/o1-mini",match:{or:[{equals:"openai/o1-mini"},{equals:"openai/o1-mini-2024-09-12"}]},prices:{input_mtok:1.1,output_mtok:4.4}},{id:"openai/o1-pro",match:{equals:"openai/o1-pro"},prices:{input_mtok:150,output_mtok:600}},{id:"openai/o3",match:{equals:"openai/o3"},prices:{input_mtok:10,output_mtok:40}},{id:"openai/o3-mini",match:{or:[{equals:"openai/o3-mini"},{equals:"openai/o3-mini-high"}]},prices:{input_mtok:1.1,output_mtok:4.4}},{id:"openai/o4-mini",match:{or:[{equals:"openai/o4-mini"},{equals:"openai/o4-mini-high"}]},prices:{input_mtok:1.1,output_mtok:4.4}},{id:"openchat/openchat-7b",match:{equals:"openchat/openchat-7b"},prices:{input_mtok:.07,output_mtok:.07}},{id:"openhands-lm-32b-v0.1",name:"OpenHands LM 32B V0.1",match:{equals:"openhands-lm-32b-v0.1"},prices:{input_mtok:2.6,output_mtok:3.4}},{id:"perplexity/llama-3.1-sonar-large-128k-online",match:{equals:"perplexity/llama-3.1-sonar-large-128k-online"},prices:{input_mtok:1,output_mtok:1}},{id:"perplexity/llama-3.1-sonar-small-128k-online",match:{equals:"perplexity/llama-3.1-sonar-small-128k-online"},prices:{input_mtok:.2,output_mtok:.2}},{id:"perplexity/r1-1776",match:{equals:"perplexity/r1-1776"},prices:{input_mtok:2,output_mtok:8}},{id:"perplexity/sonar",match:{equals:"perplexity/sonar"},prices:{input_mtok:1,output_mtok:1}},{id:"perplexity/sonar-deep-research",match:{equals:"perplexity/sonar-deep-research"},prices:{input_mtok:2,output_mtok:8}},{id:"perplexity/sonar-pro",match:{equals:"perplexity/sonar-pro"},prices:{input_mtok:3,output_mtok:15}},{id:"perplexity/sonar-reasoning",match:{equals:"perplexity/sonar-reasoning"},prices:{input_mtok:1,output_mtok:5}},{id:"perplexity/sonar-reasoning-pro",match:{equals:"perplexity/sonar-reasoning-pro"},prices:{input_mtok:2,output_mtok:8}},{id:"phi-3-medium-128k-instruct",name:"Phi-3 Medium 128K Instruct",match:{equals:"phi-3-medium-128k-instruct"},prices:{input_mtok:1,output_mtok:1}},{id:"phi-3-mini-128k-instruct",name:"Phi-3 Mini 128K Instruct",match:{equals:"phi-3-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"phi-3.5-mini-128k-instruct",name:"Phi-3.5 Mini 128K Instruct",match:{equals:"phi-3.5-mini-128k-instruct"},prices:{input_mtok:.1,output_mtok:.1}},{id:"phi-4",name:"Phi 4",match:{equals:"phi-4"},prices:{input_mtok:.07,output_mtok:.14}},{id:"phi-4-multimodal-instruct",name:"Phi 4 Multimodal Instruct",match:{equals:"phi-4-multimodal-instruct"},prices:{input_mtok:.05,output_mtok:.1}},{id:"phi-4-reasoning-plus",name:"Phi 4 Reasoning Plus",match:{equals:"phi-4-reasoning-plus"},prices:{input_mtok:.07,output_mtok:.35}},{id:"phi-4-reasoning-plus:free",name:"Phi 4 Reasoning Plus (free)",match:{equals:"phi-4-reasoning-plus:free"},prices:{}},{id:"phi-4-reasoning:free",name:"Phi 4 Reasoning (free)",match:{equals:"phi-4-reasoning:free"},prices:{}},{id:"pixtral-12b",name:"Pixtral 12B",match:{equals:"pixtral-12b"},prices:{input_mtok:.1,output_mtok:.1}},{id:"pixtral-large-2411",name:"Pixtral Large 2411",match:{equals:"pixtral-large-2411"},prices:{input_mtok:2,output_mtok:6}},{id:"pygmalionai/mythalion-13b",match:{equals:"pygmalionai/mythalion-13b"},prices:{input_mtok:.5625,output_mtok:1.125}},{id:"qwen-2-72b-instruct",name:"Qwen 2 72B Instruct",match:{equals:"qwen-2-72b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"qwen-2.5-72b-instruct",name:"Qwen2.5 72B Instruct",match:{equals:"qwen-2.5-72b-instruct"},prices:{input_mtok:.12,output_mtok:.39}},{id:"qwen-2.5-72b-instruct:free",name:"Qwen2.5 72B Instruct (free)",match:{equals:"qwen-2.5-72b-instruct:free"},prices:{}},{id:"qwen-2.5-7b-instruct",name:"Qwen2.5 7B Instruct",match:{equals:"qwen-2.5-7b-instruct"},prices:{input_mtok:.04,output_mtok:.1}},{id:"qwen-2.5-coder-32b-instruct",name:"Qwen2.5 Coder 32B Instruct",match:{equals:"qwen-2.5-coder-32b-instruct"},prices:{input_mtok:.06,output_mtok:.15}},{id:"qwen-2.5-coder-32b-instruct:free",name:"Qwen2.5 Coder 32B Instruct (free)",match:{equals:"qwen-2.5-coder-32b-instruct:free"},prices:{}},{id:"qwen-2.5-vl-7b-instruct",name:"Qwen2.5-VL 7B Instruct",match:{equals:"qwen-2.5-vl-7b-instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwen-max",name:"Qwen-Max",match:{equals:"qwen-max"},prices:{input_mtok:1.6,cache_read_mtok:.64,output_mtok:6.4}},{id:"qwen-plus",name:"Qwen-Plus",match:{equals:"qwen-plus"},prices:{input_mtok:.4,cache_read_mtok:.16,output_mtok:1.2}},{id:"qwen-turbo",name:"Qwen-Turbo",match:{equals:"qwen-turbo"},prices:{input_mtok:.05,cache_read_mtok:.02,output_mtok:.2}},{id:"qwen-vl-max",name:"Qwen VL Max",match:{equals:"qwen-vl-max"},prices:{input_mtok:.8,output_mtok:3.2}},{id:"qwen-vl-plus",name:"Qwen VL Plus",match:{equals:"qwen-vl-plus"},prices:{input_mtok:.21,output_mtok:.63}},{id:"qwen/qwen-2-72b-instruct",match:{equals:"qwen/qwen-2-72b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"qwen/qwen-2.5-72b-instruct",match:{equals:"qwen/qwen-2.5-72b-instruct"},prices:{input_mtok:.12,output_mtok:.39}},{id:"qwen/qwen-2.5-72b-instruct:free",match:{equals:"qwen/qwen-2.5-72b-instruct:free"},prices:{}},{id:"qwen/qwen-2.5-7b-instruct",match:{equals:"qwen/qwen-2.5-7b-instruct"},prices:{input_mtok:.05,output_mtok:.1}},{id:"qwen/qwen-2.5-7b-instruct:free",match:{equals:"qwen/qwen-2.5-7b-instruct:free"},prices:{}},{id:"qwen/qwen-2.5-coder-32b-instruct",match:{equals:"qwen/qwen-2.5-coder-32b-instruct"},prices:{input_mtok:.07,output_mtok:.15}},{id:"qwen/qwen-2.5-coder-32b-instruct:free",match:{equals:"qwen/qwen-2.5-coder-32b-instruct:free"},prices:{}},{id:"qwen/qwen-2.5-vl-72b-instruct",match:{equals:"qwen/qwen-2.5-vl-72b-instruct"},prices:{input_mtok:.6,output_mtok:.6}},{id:"qwen/qwen-2.5-vl-7b-instruct",match:{equals:"qwen/qwen-2.5-vl-7b-instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwen/qwen-2.5-vl-7b-instruct:free",match:{equals:"qwen/qwen-2.5-vl-7b-instruct:free"},prices:{}},{id:"qwen/qwen-max",match:{equals:"qwen/qwen-max"},prices:{input_mtok:1.6,output_mtok:6.4}},{id:"qwen/qwen-plus",match:{equals:"qwen/qwen-plus"},prices:{input_mtok:.4,output_mtok:1.2}},{id:"qwen/qwen-turbo",match:{equals:"qwen/qwen-turbo"},prices:{input_mtok:.05,output_mtok:.2}},{id:"qwen/qwen-vl-max",match:{equals:"qwen/qwen-vl-max"},prices:{input_mtok:.8,output_mtok:3.2}},{id:"qwen/qwen-vl-plus",match:{equals:"qwen/qwen-vl-plus"},prices:{input_mtok:.21,output_mtok:.63}},{id:"qwen/qwen2.5-coder-7b-instruct",match:{equals:"qwen/qwen2.5-coder-7b-instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwen/qwen2.5-vl-32b-instruct",match:{equals:"qwen/qwen2.5-vl-32b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"qwen/qwen2.5-vl-32b-instruct:free",match:{equals:"qwen/qwen2.5-vl-32b-instruct:free"},prices:{}},{id:"qwen/qwen2.5-vl-3b-instruct:free",match:{equals:"qwen/qwen2.5-vl-3b-instruct:free"},prices:{}},{id:"qwen/qwen2.5-vl-72b-instruct",match:{equals:"qwen/qwen2.5-vl-72b-instruct"},prices:{input_mtok:.7,output_mtok:.7}},{id:"qwen/qwen2.5-vl-72b-instruct:free",match:{equals:"qwen/qwen2.5-vl-72b-instruct:free"},prices:{}},{id:"qwen/qwq-32b",match:{equals:"qwen/qwq-32b"},prices:{input_mtok:.15,output_mtok:.2}},{id:"qwen/qwq-32b-preview",match:{equals:"qwen/qwq-32b-preview"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwen/qwq-32b-preview:free",match:{equals:"qwen/qwq-32b-preview:free"},prices:{}},{id:"qwen/qwq-32b:free",match:{equals:"qwen/qwq-32b:free"},prices:{}},{id:"qwen2.5-vl-32b-instruct",name:"Qwen2.5 VL 32B Instruct",match:{equals:"qwen2.5-vl-32b-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"qwen2.5-vl-32b-instruct:free",name:"Qwen2.5 VL 32B Instruct (free)",match:{equals:"qwen2.5-vl-32b-instruct:free"},prices:{}},{id:"qwen2.5-vl-72b-instruct",name:"Qwen2.5 VL 72B Instruct",match:{equals:"qwen2.5-vl-72b-instruct"},prices:{input_mtok:.25,output_mtok:.75}},{id:"qwen2.5-vl-72b-instruct:free",name:"Qwen2.5 VL 72B Instruct (free)",match:{equals:"qwen2.5-vl-72b-instruct:free"},prices:{}},{id:"qwen3-14b",name:"Qwen3 14B",match:{equals:"qwen3-14b"},prices:{input_mtok:.06,output_mtok:.24}},{id:"qwen3-14b:free",name:"Qwen3 14B (free)",match:{equals:"qwen3-14b:free"},prices:{}},{id:"qwen3-235b-a22b",name:"Qwen3 235B A22B",match:{equals:"qwen3-235b-a22b"},prices:{input_mtok:.13,output_mtok:.6}},{id:"qwen3-235b-a22b:free",name:"Qwen3 235B A22B (free)",match:{equals:"qwen3-235b-a22b:free"},prices:{}},{id:"qwen3-30b-a3b",name:"Qwen3 30B A3B",match:{equals:"qwen3-30b-a3b"},prices:{input_mtok:.08,output_mtok:.29}},{id:"qwen3-30b-a3b:free",name:"Qwen3 30B A3B (free)",match:{equals:"qwen3-30b-a3b:free"},prices:{}},{id:"qwen3-32b",name:"Qwen3 32B",match:{equals:"qwen3-32b"},prices:{input_mtok:.1,output_mtok:.3}},{id:"qwen3-32b:free",name:"Qwen3 32B (free)",match:{equals:"qwen3-32b:free"},prices:{}},{id:"qwen3-8b",name:"Qwen3 8B",match:{equals:"qwen3-8b"},prices:{input_mtok:.035,output_mtok:.138}},{id:"qwen3-8b:free",name:"Qwen3 8B (free)",match:{equals:"qwen3-8b:free"},prices:{}},{id:"qwerky-72b:free",name:"Qwerky 72B (free)",match:{equals:"qwerky-72b:free"},prices:{}},{id:"qwq-32b",name:"QwQ 32B",match:{equals:"qwq-32b"},prices:{input_mtok:.15,output_mtok:.2}},{id:"qwq-32b-arliai-rpr-v1:free",name:"QwQ 32B RpR v1 (free)",match:{equals:"qwq-32b-arliai-rpr-v1:free"},prices:{}},{id:"qwq-32b-preview",name:"QwQ 32B Preview",match:{equals:"qwq-32b-preview"},prices:{input_mtok:.2,output_mtok:.2}},{id:"qwq-32b:free",name:"QwQ 32B (free)",match:{equals:"qwq-32b:free"},prices:{}},{id:"r1-1776",name:"R1 1776",match:{equals:"r1-1776"},prices:{input_mtok:2,output_mtok:8}},{id:"raifle/sorcererlm-8x22b",match:{equals:"raifle/sorcererlm-8x22b"},prices:{input_mtok:4.5,output_mtok:4.5}},{id:"reka-flash-3:free",name:"Flash 3 (free)",match:{equals:"reka-flash-3:free"},prices:{}},{id:"rekaai/reka-flash-3:free",match:{equals:"rekaai/reka-flash-3:free"},prices:{}},{id:"remm-slerp-l2-13b",name:"ReMM SLERP 13B",match:{equals:"remm-slerp-l2-13b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"rocinante-12b",name:"Rocinante 12B",match:{equals:"rocinante-12b"},prices:{input_mtok:.25,output_mtok:.5}},{id:"sao10k/fimbulvetr-11b-v2",match:{equals:"sao10k/fimbulvetr-11b-v2"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"sao10k/l3-euryale-70b",match:{equals:"sao10k/l3-euryale-70b"},prices:{input_mtok:1.48,output_mtok:1.48}},{id:"sao10k/l3-lunaris-8b",match:{equals:"sao10k/l3-lunaris-8b"},prices:{input_mtok:.02,output_mtok:.05}},{id:"sao10k/l3.1-euryale-70b",match:{equals:"sao10k/l3.1-euryale-70b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"sao10k/l3.3-euryale-70b",match:{equals:"sao10k/l3.3-euryale-70b"},prices:{input_mtok:.7,output_mtok:.8}},{id:"sarvam-m:free",name:"Sarvam-M (free)",match:{equals:"sarvam-m:free"},prices:{}},{id:"scb10x/llama3.1-typhoon2-70b-instruct",match:{equals:"scb10x/llama3.1-typhoon2-70b-instruct"},prices:{input_mtok:.88,output_mtok:.88}},{id:"scb10x/llama3.1-typhoon2-8b-instruct",match:{equals:"scb10x/llama3.1-typhoon2-8b-instruct"},prices:{input_mtok:.18,output_mtok:.18}},{id:"shisa-ai/shisa-v2-llama3.3-70b:free",match:{equals:"shisa-ai/shisa-v2-llama3.3-70b:free"},prices:{}},{id:"shisa-v2-llama3.3-70b:free",name:"Shisa V2 Llama 3.3 70B (free)",match:{equals:"shisa-v2-llama3.3-70b:free"},prices:{}},{id:"skyfall-36b-v2",name:"Skyfall 36B V2",match:{equals:"skyfall-36b-v2"},prices:{input_mtok:.5,output_mtok:.8}},{id:"sonar",name:"Sonar",match:{equals:"sonar"},prices:{input_mtok:1,output_mtok:1}},{id:"sonar-deep-research",name:"Sonar Deep Research",match:{equals:"sonar-deep-research"},prices:{input_mtok:2,output_mtok:8}},{id:"sonar-pro",name:"Sonar Pro",match:{equals:"sonar-pro"},prices:{input_mtok:3,output_mtok:15}},{id:"sonar-reasoning",name:"Sonar Reasoning",match:{equals:"sonar-reasoning"},prices:{input_mtok:1,output_mtok:5}},{id:"sonar-reasoning-pro",name:"Sonar Reasoning Pro",match:{equals:"sonar-reasoning-pro"},prices:{input_mtok:2,output_mtok:8}},{id:"sophosympatheia/midnight-rose-70b",match:{equals:"sophosympatheia/midnight-rose-70b"},prices:{input_mtok:.8,output_mtok:.8}},{id:"sophosympatheia/rogue-rose-103b-v0.2:free",match:{equals:"sophosympatheia/rogue-rose-103b-v0.2:free"},prices:{}},{id:"sorcererlm-8x22b",name:"SorcererLM 8x22B",match:{equals:"sorcererlm-8x22b"},prices:{input_mtok:4.5,output_mtok:4.5}},{id:"spotlight",name:"Spotlight",match:{equals:"spotlight"},prices:{input_mtok:.18,output_mtok:.18}},{id:"steelskull/l3.3-electra-r1-70b",match:{equals:"steelskull/l3.3-electra-r1-70b"},prices:{input_mtok:.7,output_mtok:.95}},{id:"thedrummer/anubis-pro-105b-v1",match:{equals:"thedrummer/anubis-pro-105b-v1"},prices:{input_mtok:.8,output_mtok:1}},{id:"thedrummer/rocinante-12b",match:{equals:"thedrummer/rocinante-12b"},prices:{input_mtok:.25,output_mtok:.5}},{id:"thedrummer/skyfall-36b-v2",match:{equals:"thedrummer/skyfall-36b-v2"},prices:{input_mtok:.5,output_mtok:.8}},{id:"thedrummer/unslopnemo-12b",match:{equals:"thedrummer/unslopnemo-12b"},prices:{input_mtok:.5,output_mtok:.5}},{id:"thudm/glm-4-32b:free",match:{equals:"thudm/glm-4-32b:free"},prices:{}},{id:"thudm/glm-z1-32b:free",match:{equals:"thudm/glm-z1-32b:free"},prices:{}},{id:"toppy-m-7b",name:"Toppy M 7B",match:{equals:"toppy-m-7b"},prices:{input_mtok:.8,output_mtok:1.2}},{id:"undi95/remm-slerp-l2-13b",match:{equals:"undi95/remm-slerp-l2-13b"},prices:{input_mtok:.5625,output_mtok:1.125}},{id:"undi95/toppy-m-7b",match:{equals:"undi95/toppy-m-7b"},prices:{input_mtok:.07,output_mtok:.07}},{id:"unslopnemo-12b",name:"UnslopNemo 12B",match:{equals:"unslopnemo-12b"},prices:{input_mtok:.45,output_mtok:.45}},{id:"valkyrie-49b-v1",name:"Valkyrie 49B V1",match:{equals:"valkyrie-49b-v1"},prices:{input_mtok:.5,output_mtok:.8}},{id:"virtuoso-large",name:"Virtuoso Large",match:{equals:"virtuoso-large"},prices:{input_mtok:.75,output_mtok:1.2}},{id:"virtuoso-medium-v2",name:"Virtuoso Medium V2",match:{equals:"virtuoso-medium-v2"},prices:{input_mtok:.5,output_mtok:.8}},{id:"weaver",name:"Weaver (alpha)",match:{equals:"weaver"},prices:{input_mtok:1.5,output_mtok:1.5}},{id:"wizardlm-2-8x22b",name:"WizardLM-2 8x22B",match:{equals:"wizardlm-2-8x22b"},prices:{input_mtok:.48,output_mtok:.48}},{id:"x-ai/grok-2-1212",match:{equals:"x-ai/grok-2-1212"},prices:{input_mtok:2,output_mtok:10}},{id:"x-ai/grok-2-vision-1212",match:{equals:"x-ai/grok-2-vision-1212"},prices:{input_mtok:2,output_mtok:10}},{id:"x-ai/grok-3-beta",match:{equals:"x-ai/grok-3-beta"},prices:{input_mtok:3,output_mtok:15}},{id:"x-ai/grok-3-mini-beta",match:{equals:"x-ai/grok-3-mini-beta"},prices:{input_mtok:.3,output_mtok:.5}},{id:"x-ai/grok-beta",match:{equals:"x-ai/grok-beta"},prices:{input_mtok:5,output_mtok:15}},{id:"x-ai/grok-vision-beta",match:{equals:"x-ai/grok-vision-beta"},prices:{input_mtok:5,output_mtok:15}},{id:"xwin-lm/xwin-lm-70b",match:{equals:"xwin-lm/xwin-lm-70b"},prices:{input_mtok:3.75,output_mtok:3.75}},{id:"yi-large",name:"Yi Large",match:{equals:"yi-large"},prices:{input_mtok:3,output_mtok:3}},{id:"z-ai/glm-4.5",match:{equals:"z-ai/glm-4.5"},context_window:131072,prices:{input_mtok:.35,output_mtok:1.55}},{id:"z-ai/glm-4.6",match:{equals:"z-ai/glm-4.6"},context_window:202752,prices:{input_mtok:.4,output_mtok:1.75}}]},{id:"perplexity",name:"Perplexity",pricing_urls:["https://docs.perplexity.ai/guides/pricing"],api_pattern:"https://api\\.perplexity\\.ai",price_comments:"Prices per request vary based on usage, this is not represented here, instead we just take the highest price shown for `requests_kcount`.",models:[{id:"llama-3.1-sonar-large-128k-online",name:"Llama 3.1 Sonar 70B Online",description:"Llama 3.1 Sonar is Perplexity's latest model family. It surpasses their earlier Sonar models in cost-efficiency, speed, and performance.",match:{equals:"llama-3.1-sonar-large-128k-online"},prices:{input_mtok:1,output_mtok:1}},{id:"llama-3.1-sonar-small-128k-online",name:"Llama 3.1 Sonar 8B Online",description:"Llama 3.1 Sonar is Perplexity's latest model family. It surpasses their earlier Sonar models in cost-efficiency, speed, and performance.",match:{equals:"llama-3.1-sonar-small-128k-online"},prices:{input_mtok:.2,output_mtok:.2}},{id:"r1-1776",name:"R1 1776",description:"R1 1776 is a version of DeepSeek-R1 that has been post-trained to remove censorship constraints related to topics restricted by the Chinese government. The model retains its original reasoning capabilities while providing direct responses to a wider range of queries. R1 1776 is an offline chat model that does not use the perplexity search subsystem.",match:{equals:"r1-1776"},prices:{input_mtok:2,output_mtok:8}},{id:"sonar",name:"Sonar",description:"Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize sources. It is designed for companies seeking to integrate lightweight question-and-answer features optimized for speed.",match:{equals:"sonar"},prices:{input_mtok:1,output_mtok:1,requests_kcount:12}},{id:"sonar-deep-research",name:"Sonar Deep Research",description:"Sonar Deep Research is a research-focused model designed for multi-step retrieval, synthesis, and reasoning across complex topics. It autonomously searches, reads, and evaluates sources, refining its approach as it gathers information. This enables comprehensive report generation across domains like finance, technology, health, and current events.",match:{equals:"sonar-deep-research"},prices:{input_mtok:2,output_mtok:8}},{id:"sonar-pro",name:"Sonar Pro",description:"Note: Sonar Pro pricing includes Perplexity search pricing. See details here",match:{equals:"sonar-pro"},prices:{input_mtok:3,output_mtok:15,requests_kcount:14}},{id:"sonar-reasoning",name:"Sonar Reasoning",description:"Sonar Reasoning is a reasoning model provided by Perplexity based on DeepSeek R1.",match:{equals:"sonar-reasoning"},prices:{input_mtok:1,output_mtok:5,requests_kcount:12}},{id:"sonar-reasoning-pro",name:"Sonar Reasoning Pro",description:"Sonar Pro pricing includes Perplexity search pricing.",match:{equals:"sonar-reasoning-pro"},prices:{input_mtok:2,output_mtok:8,requests_kcount:14}}]},{id:"together",name:"Together AI",pricing_urls:["https://www.together.ai/pricing"],api_pattern:"https://api\\.together\\.xyz",provider_match:{or:[{equals:"together-ai"},{equals:"together_ai"}]},models:[{id:"Austism/chronos-hermes-13b",match:{equals:"Austism/chronos-hermes-13b"},prices:{input_mtok:.3,output_mtok:.3}},{id:"Gryphe/MythoMax-L2-13b",match:{equals:"Gryphe/MythoMax-L2-13b"},prices:{input_mtok:.3,output_mtok:.3}},{id:"Nexusflow/NexusRaven-V2-13B",match:{equals:"Nexusflow/NexusRaven-V2-13B"},prices:{input_mtok:.3,output_mtok:.3}},{id:"NousResearch/Nous-Capybara-7B-V1p9",match:{equals:"NousResearch/Nous-Capybara-7B-V1p9"},prices:{input_mtok:.2,output_mtok:.2}},{id:"NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",match:{equals:"NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO"},prices:{input_mtok:.9,output_mtok:.9}},{id:"NousResearch/Nous-Hermes-2-Mixtral-8x7B-SFT",match:{equals:"NousResearch/Nous-Hermes-2-Mixtral-8x7B-SFT"},prices:{input_mtok:.9,output_mtok:.9}},{id:"NousResearch/Nous-Hermes-2-Yi-34B",match:{equals:"NousResearch/Nous-Hermes-2-Yi-34B"},prices:{input_mtok:.8,output_mtok:.8}},{id:"NousResearch/Nous-Hermes-Llama2-13b",match:{equals:"NousResearch/Nous-Hermes-Llama2-13b"},prices:{input_mtok:.225,output_mtok:.225}},{id:"NousResearch/Nous-Hermes-llama-2-7b",match:{equals:"NousResearch/Nous-Hermes-llama-2-7b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"Open-Orca/Mistral-7B-OpenOrca",match:{equals:"Open-Orca/Mistral-7B-OpenOrca"},prices:{input_mtok:.2,output_mtok:.2}},{id:"Qwen/Qwen1.5-0.5B",match:{or:[{equals:"Qwen/Qwen1.5-0.5B"},{equals:"Qwen/Qwen1.5-0.5B-Chat"}]},prices:{input_mtok:.1,output_mtok:.1}},{id:"Qwen/Qwen1.5-1.8B",match:{or:[{equals:"Qwen/Qwen1.5-1.8B"},{equals:"Qwen/Qwen1.5-1.8B-Chat"}]},prices:{input_mtok:.1,output_mtok:.1}},{id:"Qwen/Qwen1.5-14B",match:{or:[{equals:"Qwen/Qwen1.5-14B"},{equals:"Qwen/Qwen1.5-14B-Chat"}]},prices:{input_mtok:.3,output_mtok:.3}},{id:"Qwen/Qwen1.5-4B",match:{or:[{equals:"Qwen/Qwen1.5-4B"},{equals:"Qwen/Qwen1.5-4B-Chat"}]},prices:{input_mtok:.1,output_mtok:.1}},{id:"Qwen/Qwen1.5-72B",match:{equals:"Qwen/Qwen1.5-72B"},prices:{input_mtok:.9,output_mtok:.9}},{id:"Qwen/Qwen1.5-7B",match:{or:[{equals:"Qwen/Qwen1.5-7B"},{equals:"Qwen/Qwen1.5-7B-Chat"}]},prices:{input_mtok:.2,output_mtok:.2}},{id:"Undi95/ReMM-SLERP-L2-13B",match:{equals:"Undi95/ReMM-SLERP-L2-13B"},prices:{input_mtok:.3,output_mtok:.3}},{id:"Undi95/Toppy-M-7B",match:{equals:"Undi95/Toppy-M-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"WizardLM/WizardLM-13B-V1.2",match:{equals:"WizardLM/WizardLM-13B-V1.2"},prices:{input_mtok:.3,output_mtok:.3}},{id:"allenai/OLMo-7B",match:{or:[{equals:"allenai/OLMo-7B"},{equals:"allenai/OLMo-7B-Instruct"},{equals:"allenai/OLMo-7B-Twin-2T"}]},prices:{input_mtok:.2,output_mtok:.2}},{id:"codellama/CodeLlama-13b-Instruct-hf",match:{equals:"codellama/CodeLlama-13b-Instruct-hf"},prices:{input_mtok:.225,output_mtok:.225}},{id:"codellama/CodeLlama-34b-Instruct-hf",match:{equals:"codellama/CodeLlama-34b-Instruct-hf"},prices:{input_mtok:.776,output_mtok:.776}},{id:"codellama/CodeLlama-70b-Instruct-hf",match:{equals:"codellama/CodeLlama-70b-Instruct-hf"},prices:{input_mtok:.9,output_mtok:.9}},{id:"codellama/CodeLlama-7b-Instruct-hf",match:{equals:"codellama/CodeLlama-7b-Instruct-hf"},prices:{input_mtok:.2,output_mtok:.2}},{id:"deepseek-ai/deepseek-coder-33b-instruct",match:{equals:"deepseek-ai/deepseek-coder-33b-instruct"},prices:{input_mtok:.8,output_mtok:.8}},{id:"garage-bAInd/Platypus2-70B-instruct",match:{equals:"garage-bAInd/Platypus2-70B-instruct"},prices:{input_mtok:.9,output_mtok:.9}},{id:"google/gemma-2b",match:{or:[{equals:"google/gemma-2b"},{equals:"google/gemma-2b-it"}]},prices:{input_mtok:.1,output_mtok:.1}},{id:"google/gemma-7b",match:{or:[{equals:"google/gemma-7b"},{equals:"google/gemma-7b-it"}]},prices:{input_mtok:.2,output_mtok:.2}},{id:"lmsys/vicuna-13b-v1.5",match:{equals:"lmsys/vicuna-13b-v1.5"},prices:{input_mtok:.3,output_mtok:.3}},{id:"lmsys/vicuna-7b-v1.5",match:{equals:"lmsys/vicuna-7b-v1.5"},prices:{input_mtok:.2,output_mtok:.2}},{id:"meta-llama/Llama-2-13b-chat-hf",match:{equals:"meta-llama/Llama-2-13b-chat-hf"},prices:{input_mtok:.225,output_mtok:.225}},{id:"meta-llama/Llama-2-70b-chat-hf",match:{equals:"meta-llama/Llama-2-70b-chat-hf"},prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/Llama-2-7b-chat-hf",match:{equals:"meta-llama/Llama-2-7b-chat-hf"},prices:{input_mtok:.2,output_mtok:.2}},{id:"meta-llama/Llama-3-70b-chat-hf",match:{equals:"meta-llama/Llama-3-70b-chat-hf"},prices:{input_mtok:.9,output_mtok:.9}},{id:"meta-llama/Llama-3-8b-chat-hf",match:{equals:"meta-llama/Llama-3-8b-chat-hf"},prices:{input_mtok:.2,output_mtok:.2}},{id:"meta-llama/Llama-3.3-70B-Instruct-Turbo",match:{equals:"meta-llama/Llama-3.3-70B-Instruct-Turbo"},prices:{input_mtok:.88,output_mtok:.88}},{id:"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",match:{equals:"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8"},prices:{input_mtok:.27,output_mtok:.85}},{id:"meta-llama/Llama-4-Scout-17B-16E-Instruct",match:{equals:"meta-llama/Llama-4-Scout-17B-16E-Instruct"},prices:{input_mtok:.18,output_mtok:.59}},{id:"meta-llama/Meta-Llama-3-70B-Instruct-Lite",match:{equals:"meta-llama/Meta-Llama-3-70B-Instruct-Lite"},prices:{input_mtok:.54,output_mtok:.54}},{id:"meta-llama/Meta-Llama-3-70B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3-70B-Instruct-Turbo"},prices:{input_mtok:.88,output_mtok:.88}},{id:"meta-llama/Meta-Llama-3-8B-Instruct-Lite",match:{equals:"meta-llama/Meta-Llama-3-8B-Instruct-Lite"},prices:{input_mtok:.1,output_mtok:.1}},{id:"meta-llama/Meta-Llama-3-8B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3-8B-Instruct-Turbo"},prices:{input_mtok:.18,output_mtok:.18}},{id:"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo"},prices:{input_mtok:3.5,output_mtok:3.5}},{id:"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo"},prices:{input_mtok:.88,output_mtok:.88}},{id:"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo"},prices:{input_mtok:.18,output_mtok:.18}},{id:"meta-llama/Meta-Llama-3.3-70B-Instruct-Turbo",match:{equals:"meta-llama/Meta-Llama-3.3-70B-Instruct-Turbo"},prices:{input_mtok:.88,output_mtok:.88}},{id:"microsoft/WizardLM-2-8x22B",match:{equals:"microsoft/WizardLM-2-8x22B"},prices:{input_mtok:1.2,output_mtok:1.2}},{id:"microsoft/phi-2",match:{equals:"microsoft/phi-2"},prices:{input_mtok:.1,output_mtok:.1}},{id:"mistralai/Mistral-7B-Instruct-v0.1",match:{equals:"mistralai/Mistral-7B-Instruct-v0.1"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/Mistral-7B-Instruct-v0.2",match:{equals:"mistralai/Mistral-7B-Instruct-v0.2"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/Mistral-7B-v0.1",match:{equals:"mistralai/Mistral-7B-v0.1"},prices:{input_mtok:.2,output_mtok:.2}},{id:"mistralai/Mixtral-8x22B-Instruct-v0.1",match:{equals:"mistralai/Mixtral-8x22B-Instruct-v0.1"},prices:{input_mtok:2.4,output_mtok:2.4}},{id:"mistralai/Mixtral-8x7B-Instruct-v0.1",match:{equals:"mistralai/Mixtral-8x7B-Instruct-v0.1"},prices:{input_mtok:.9,output_mtok:.9}},{id:"mistralai/Mixtral-8x7B-v0.1",match:{equals:"mistralai/Mixtral-8x7B-v0.1"},prices:{input_mtok:.9,output_mtok:.9}},{id:"openchat/openchat-3.5-1210",match:{equals:"openchat/openchat-3.5-1210"},prices:{input_mtok:.2,output_mtok:.2}},{id:"snorkelai/Snorkel-Mistral-PairRM-DPO",match:{equals:"snorkelai/Snorkel-Mistral-PairRM-DPO"},prices:{input_mtok:.2,output_mtok:.2}},{id:"teknium/OpenHermes-2-Mistral-7B",match:{equals:"teknium/OpenHermes-2-Mistral-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"teknium/OpenHermes-2p5-Mistral-7B",match:{equals:"teknium/OpenHermes-2p5-Mistral-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/GPT-JT-Moderation-6B",match:{equals:"togethercomputer/GPT-JT-Moderation-6B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/Llama-2-7B-32K-Instruct",match:{equals:"togethercomputer/Llama-2-7B-32K-Instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/RedPajama-INCITE-7B-Base",match:{equals:"togethercomputer/RedPajama-INCITE-7B-Base"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/RedPajama-INCITE-7B-Chat",match:{equals:"togethercomputer/RedPajama-INCITE-7B-Chat"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/RedPajama-INCITE-7B-Instruct",match:{equals:"togethercomputer/RedPajama-INCITE-7B-Instruct"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/RedPajama-INCITE-Base-3B-v1",match:{equals:"togethercomputer/RedPajama-INCITE-Base-3B-v1"},prices:{input_mtok:.1,output_mtok:.1}},{id:"togethercomputer/RedPajama-INCITE-Chat-3B-v1",match:{equals:"togethercomputer/RedPajama-INCITE-Chat-3B-v1"},prices:{input_mtok:.1,output_mtok:.1}},{id:"togethercomputer/RedPajama-INCITE-Instruct-3B-v1",match:{equals:"togethercomputer/RedPajama-INCITE-Instruct-3B-v1"},prices:{input_mtok:.1,output_mtok:.1}},{id:"togethercomputer/StripedHyena-Hessian-7B",match:{equals:"togethercomputer/StripedHyena-Hessian-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/StripedHyena-Nous-7B",match:{equals:"togethercomputer/StripedHyena-Nous-7B"},prices:{input_mtok:.2,output_mtok:.2}},{id:"togethercomputer/alpaca-7b",match:{equals:"togethercomputer/alpaca-7b"},prices:{input_mtok:.2,output_mtok:.2}},{id:"upstage/SOLAR-10.7B-Instruct-v1.0",match:{equals:"upstage/SOLAR-10.7B-Instruct-v1.0"},prices:{input_mtok:.3,output_mtok:.3}},{id:"zero-one-ai/Yi-34B",match:{equals:"zero-one-ai/Yi-34B"},prices:{input_mtok:.8,output_mtok:.8}},{id:"zero-one-ai/Yi-6B",match:{equals:"zero-one-ai/Yi-6B"},prices:{input_mtok:.2,output_mtok:.2}}]},{id:"x-ai",name:"X AI",pricing_urls:["https://docs.x.ai/docs/models"],api_pattern:"https://api\\.x\\.ai",model_match:{contains:"grok"},provider_match:{equals:"xai"},extractors:[{api_flavor:"chat",root:"usage",model_path:"model",mappings:[{path:"prompt_tokens",dest:"input_tokens",required:!0},{path:["prompt_tokens_details","cached_tokens"],dest:"cache_read_tokens",required:!1},{path:["completion_tokens_details","audio_tokens"],dest:"output_audio_tokens",required:!1},{path:"completion_tokens",dest:"output_tokens",required:!0}]}],models:[{id:"grok-2-1212",name:"Grok 2 1212",description:"(deprecated) Grok 2 1212 introduces significant enhancements to accuracy, instruction adherence, and multilingual support, making it a powerful and flexible choice for developers seeking a highly steerable, intelligent model.",match:{or:[{equals:"grok-2-1212"},{equals:"grok-2"},{equals:"grok-2-latest"}]},context_window:32768,prices:{input_mtok:2,output_mtok:10}},{id:"grok-2-vision-1212",name:"Grok 2 Vision 1212",description:"Our multimodal model that processes documents, diagrams, charts, screenshots, and photographs.",match:{or:[{equals:"grok-2-vision-1212"},{equals:"grok-2-vision"},{equals:"grok-2-vision-latest"}]},context_window:32768,prices:{input_mtok:2,output_mtok:10}},{id:"grok-3",name:"Grok 3",description:"Flagship model that excels at enterprise use cases like data extraction, coding, and text summarization. Possesses deep domain knowledge in finance, healthcare, law, and science.",match:{or:[{equals:"grok-3"},{equals:"grok-3-latest"},{equals:"grok-3-beta"}]},context_window:131072,prices:{input_mtok:3,cache_read_mtok:.75,output_mtok:15}},{id:"grok-3-fast",name:"Grok 3 Fast",description:"Excels at enterprise use cases like data extraction, coding, and text summarization. Possesses deep domain knowledge in finance, healthcare, law, and science.",match:{or:[{equals:"grok-3-fast"},{equals:"grok-3-fast-latest"},{equals:"grok-3-fast-beta"}]},context_window:131072,prices:{input_mtok:5,cache_read_mtok:1.25,output_mtok:25}},{id:"grok-3-mini",name:"Grok 3 Mini",description:"A lightweight model that thinks before responding. Fast, smart, and great for logic-based tasks that do not require deep domain knowledge. The raw thinking traces are accessible.",match:{or:[{equals:"grok-3-mini"},{equals:"grok-3-mini-beta"},{equals:"grok-3-mini-latest"}]},context_window:131072,prices:{input_mtok:.3,cache_read_mtok:.075,output_mtok:.5}},{id:"grok-3-mini-fast",name:"Grok 3 Mini Fast",description:"A lightweight model that thinks before responding. Fast, smart, and great for logic-based tasks that do not require deep domain knowledge. The raw thinking traces are accessible.",match:{or:[{equals:"grok-3-mini-fast"},{equals:"grok-3-mini-fast-beta"},{equals:"grok-3-mini-fast-latest"}]},context_window:131072,prices:{input_mtok:.6,cache_read_mtok:.15,output_mtok:4}},{id:"grok-4-0709",name:"Grok 4",description:"A flagship model, offering unparalleled performance in natural language, math and reasoning - the perfect jack of all trades.",match:{or:[{equals:"grok-4-0709"},{equals:"grok-4"},{equals:"grok-4-latest"}]},context_window:256e3,prices:{input_mtok:3,cache_read_mtok:.75,output_mtok:15}}]}];function M(t,e){if(e<=0)return 0;let a=0;const i=[...t.tiers].sort((r,n)=>r.start-n.start),o=i[0]?.start??e,m=Math.min(e,o);a+=m*t.base/1e6;for(let r=0;r<i.length;r++){const n=i[r],s=i[r+1]?.start??1/0,u=Math.max(0,Math.min(e,s)-n.start);u>0&&(a+=u*n.price/1e6)}return a}function c(t,e,a){return t===void 0||e===void 0?0:typeof t=="number"?t*e/1e6:M(t,e)}function Q(t,e){let a=0,i=0;const o=t.cache_read_tokens??0,m=t.cache_write_tokens??0,r=t.cache_audio_read_tokens??0,n=t.output_audio_tokens??0;let s=t.input_audio_tokens??0;if(s-=r,s<0)throw new Error("cache_audio_read_tokens cannot be greater than input_audio_tokens");let u=t.input_tokens??0;if(u-=o,u-=m,u-=s,u<0)throw new Error("Uncached text input tokens cannot be negative");let p=o;if(p-=r,p<0)throw new Error("cache_audio_read_tokens cannot be greater than cache_read_tokens");a+=c(e.input_mtok,u),a+=c(e.cache_read_mtok,p),a+=c(e.cache_write_mtok,m),a+=c(e.input_audio_mtok,s),a+=c(e.cache_audio_read_mtok,r);let k=t.output_tokens??0;if(k-=n,k<0)throw new Error("output_audio_tokens cannot be greater than output_tokens");i+=c(e.output_mtok,k),i+=c(e.output_audio_mtok,t.output_audio_tokens);let f=a+i;return e.requests_kcount!==void 0&&(f+=e.requests_kcount/1e3),{input_price:a,output_price:i,total_price:f}}function y(t,e){if(!Array.isArray(t.prices))return t.prices;for(let a=t.prices.length-1;a>=0;a--){const i=t.prices[a],o=i.constraint;if(o===void 0)return i.prices;if(o.type==="start_date"){if(e>=new Date(o.start_date))return i.prices}else{const m=e.toISOString().slice(11,19),r=o.start_time,n=o.end_time;if(n<r){if(m>=r||m<n)return i.prices}else if(m>=r&&m<n)return i.prices}}return t.prices[0].prices}function _(t,e){return"or"in t?t.or.some(a=>_(a,e)):"and"in t?t.and.every(a=>_(a,e)):"equals"in t?e===t.equals:"starts_with"in t?e.startsWith(t.starts_with):"ends_with"in t?e.endsWith(t.ends_with):"contains"in t?e.includes(t.contains):"regex"in t?new RegExp(t.regex).test(e):!1}function S(t,e){const a=e.toLowerCase().trim(),i=t.find(o=>o.id===a);return i||t.find(o=>o.provider_match&&_(o.provider_match,a))}function x(t,{modelId:e,providerApiUrl:a,providerId:i}){if(i)return S(t,i);if(a)return t.find(o=>new RegExp(o.api_pattern).test(a));if(e)return t.find(o=>o.model_match&&_(o.model_match,e))}function P(t,e){return t.find(a=>_(a.match,e))}const I="https://raw.githubusercontent.com/pydantic/genai-prices/main/prices/data.json";let g=B,q=Promise.resolve(B),b=null;function T(t){t!==null&&("then"in t?(q=t,t.then(e=>{e!==null&&(g=e)})):(q=Promise.resolve(t),g=t))}function A(t){b=t}function G(t){t({onCalc:A,remoteDataUrl:I,setProviderData:T})}function D(){return q}function R(t,e,a){b?.();const i=e.toLowerCase().trim(),o=a?.provider??x(g,{modelId:i,providerApiUrl:a?.providerApiUrl,providerId:a?.providerId});if(!o)return null;const m=P(o.models,i);if(!m)return null;const r=a?.timestamp??new Date,n=y(m,r),s=Q(t,n);return{auto_update_timestamp:void 0,model:m,model_price:n,provider:o,...s}}function C(t){return b?.(),x(g,t)}function E(t,e,a){if(a=a??"default",!t.extractors)throw new Error("No extraction logic defined for this provider");const i=t.extractors.find(s=>s.api_flavor===a);if(!i){const s=t.extractors.map(u=>u.api_flavor).join(", ");throw new Error(`Unknown apiFlavor '${a}', allowed values: ${s}`)}if(!h.guard(e))throw new Error(`Expected response data to be a mapping object, got ${l(e)}`);const o=w(i.model_path,e,N,!1,[]),m=L(i.root),r=w(m,e,h,!0,[]),n={};for(const s of i.mappings){const u=w(s.path,r,V,s.required,m);if(u!==null){const p=n[s.dest]??0;n[s.dest]=p+u}}if(!Object.keys(n).length)throw new Error(`No usage information found at ${JSON.stringify(i.root)}`);return{model:o,usage:n}}function w(t,e,a,i,o){const[m,...r]=L(t).reverse();if(typeof m!="string")throw new Error(`Expected last step of path to be a string, got ${l(m)}`);r.reverse();let n=e;const s=[];for(const p of r){if(s.push(p),typeof p=="object")if(Array.isArray(n))n=z(p,n);else{if(i)throw new Error(`Expected \`${d(o,s)}\` value to be a mapping, got ${l(n)}`);return null}else if(h.guard(n))n=n[p];else{if(i)throw new Error(`Expected \`${d(o,s)}\` value to be a mapping, got ${l(n)}`);return null}if(typeof n>"u")if(i){const k=typeof p=="object"?"Unable to find item":"Missing value";throw new Error(`${k} at \`${d(o,s)}\``)}else return null}if(!h.guard(n)){if(i)throw new Error(`Expected \`${d(o,s)}\` value to be a mapping, got ${l(n)}`);return null}const u=n[m];if(typeof u>"u"){if(i)throw s.push(m),new Error(`Missing value at \`${d(o,s)}\``);return null}if(a.guard(u))return u;if(i)throw s.push(m),new Error(`Expected \`${d(o,s)}\` value to be a ${a.name}, got ${l(u)}`);return null}function z(t,e){for(const a of e)if(h.guard(a)){const i=a[t.field];if(typeof i=="string"&&_(t.match,i))return a}}function L(t){return Array.isArray(t)?[...t]:[t]}function l(t){return t===null?"null":Array.isArray(t)?"array":typeof t=="object"?"mapping":typeof t}const h={guard:t=>l(t)==="mapping",name:"mapping"},N={guard:t=>typeof t=="string",name:"string"},V={guard:t=>typeof t=="number",name:"number"},d=(t,e)=>[...t.map(v),...e.map(v)].join("."),v=t=>typeof t=="string"?t:JSON.stringify(t);exports.REMOTE_DATA_JSON_URL=I;exports.calcPrice=R;exports.extractUsage=E;exports.findProvider=C;exports.updatePrices=G;exports.waitForUpdate=D;
|