npm - @lobehub/chat - Versions diffs - 1.68.7 → 1.68.8 - Mend

@lobehub/chat 1.68.7 → 1.68.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

package/CHANGELOG.md +25 -0
package/changelog/v1.json +9 -0
package/package.json +1 -1
package/src/database/server/models/aiModel.ts +1 -0
package/src/libs/agent-runtime/openrouter/__snapshots__/index.test.ts.snap +898 -48
package/src/libs/agent-runtime/openrouter/index.ts +24 -8
package/src/libs/agent-runtime/openrouter/type.ts +11 -0
package/src/types/llm.ts +1 -1

package/src/libs/agent-runtime/openrouter/__snapshots__/index.test.ts.snap CHANGED Viewed

@@ -14,7 +14,12 @@ _These are free, rate-limited endpoints for [Reflection 70B](/models/mattshumer/
     "functionCall": false,
     "id": "mattshumer/reflection-70b:free",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-09-06",
     "vision": false,
   },
   {
@@ -27,7 +32,12 @@ The model was trained on synthetic data.",
     "functionCall": false,
     "id": "mattshumer/reflection-70b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.35,
+      "output": 0.4,
+    },
     "reasoning": false,
+    "releasedAt": "2024-09-06",
     "vision": false,
   },
   {
@@ -39,10 +49,15 @@ Read the launch post [here](https://txt.cohere.com/command-r/).
 Use of this model is subject to Cohere's [Acceptable Use Policy](https://docs.cohere.com/docs/c4ai-acceptable-use-policy).",
     "displayName": "Cohere: Command R (03-2024)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "cohere/command-r-03-2024",
     "maxTokens": 4000,
+    "pricing": {
+      "input": 0.5,
+      "output": 1.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-31",
     "vision": false,
   },
   {
@@ -54,10 +69,15 @@ It offers multilingual support for ten key languages to facilitate global busine
 Use of this model is subject to Cohere's [Acceptable Use Policy](https://docs.cohere.com/docs/c4ai-acceptable-use-policy).",
     "displayName": "Cohere: Command R+ (04-2024)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "cohere/command-r-plus-04-2024",
     "maxTokens": 4000,
+    "pricing": {
+      "input": 3,
+      "output": 15,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-31",
     "vision": false,
   },
   {
@@ -69,10 +89,15 @@ Read the launch post [here](https://docs.cohere.com/changelog/command-gets-refre
 Use of this model is subject to Cohere's [Acceptable Use Policy](https://docs.cohere.com/docs/c4ai-acceptable-use-policy).",
     "displayName": "Cohere: Command R+ (08-2024)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "cohere/command-r-plus-08-2024",
     "maxTokens": 4000,
+    "pricing": {
+      "input": 2.5,
+      "output": 10,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-30",
     "vision": false,
   },
   {
@@ -84,10 +109,15 @@ Read the launch post [here](https://docs.cohere.com/changelog/command-gets-refre
 Use of this model is subject to Cohere's [Acceptable Use Policy](https://docs.cohere.com/docs/c4ai-acceptable-use-policy).",
     "displayName": "Cohere: Command R (08-2024)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "cohere/command-r-08-2024",
     "maxTokens": 4000,
+    "pricing": {
+      "input": 0.15,
+      "output": 0.6,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-30",
     "vision": false,
   },
   {
@@ -104,7 +134,12 @@ Note: This model is experimental and not suited for production use-cases. It may
     "functionCall": false,
     "id": "google/gemini-flash-8b-1.5-exp",
     "maxTokens": 32768,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-28",
     "vision": true,
   },
   {
@@ -121,7 +156,12 @@ Note: This model is experimental and not suited for production use-cases. It may
     "functionCall": false,
     "id": "google/gemini-flash-1.5-exp",
     "maxTokens": 32768,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-28",
     "vision": true,
   },
   {
@@ -132,7 +172,12 @@ Note: This model is experimental and not suited for production use-cases. It may
     "functionCall": false,
     "id": "sao10k/l3.1-euryale-70b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1.5,
+      "output": 1.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-28",
     "vision": false,
   },
   {
@@ -146,10 +191,15 @@ Built on a novel SSM-Transformer architecture, it outperforms larger models like
 Read their [announcement](https://www.ai21.com/blog/announcing-jamba-model-family) to learn more.",
     "displayName": "AI21: Jamba 1.5 Large",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "ai21/jamba-1-5-large",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 2,
+      "output": 8,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-23",
     "vision": false,
   },
   {
@@ -163,10 +213,15 @@ This model uses less computer memory and works faster with longer texts than pre
 Read their [announcement](https://www.ai21.com/blog/announcing-jamba-model-family) to learn more.",
     "displayName": "AI21: Jamba 1.5 Mini",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "ai21/jamba-1-5-mini",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.2,
+      "output": 0.4,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-23",
     "vision": false,
   },
   {
@@ -176,10 +231,15 @@ Read their [announcement](https://www.ai21.com/blog/announcing-jamba-model-famil
 The models underwent a rigorous enhancement process, incorporating both supervised fine-tuning, proximal policy optimization, and direct preference optimization to ensure precise instruction adherence and robust safety measures. When assessed against benchmarks that test common sense, language understanding, math, code, long context and logical reasoning, Phi-3.5 models showcased robust and state-of-the-art performance among models with less than 13 billion parameters.",
     "displayName": "Phi-3.5 Mini 128K Instruct",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "microsoft/phi-3.5-mini-128k-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.1,
+      "output": 0.1,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-21",
     "vision": false,
   },
   {
@@ -194,7 +254,12 @@ The Hermes 3 series builds and expands on the Hermes 2 set of capabilities, incl
     "functionCall": true,
     "id": "nousresearch/hermes-3-llama-3.1-70b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.4,
+      "output": 0.4,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-18",
     "vision": false,
   },
   {
@@ -211,7 +276,12 @@ Hermes 3 is competitive, if not superior, to Llama-3.1 Instruct models at genera
     "functionCall": true,
     "id": "nousresearch/hermes-3-llama-3.1-405b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-16",
     "vision": false,
   },
   {
@@ -230,7 +300,12 @@ _These are extended-context endpoints for [Hermes 3 405B Instruct](/models/nousr
     "functionCall": true,
     "id": "nousresearch/hermes-3-llama-3.1-405b:extended",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-16",
     "vision": false,
   },
   {
@@ -241,7 +316,12 @@ _These are extended-context endpoints for [Hermes 3 405B Instruct](/models/nousr
     "functionCall": false,
     "id": "perplexity/llama-3.1-sonar-huge-128k-online",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 5,
+      "output": 5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-14",
     "vision": false,
   },
   {
@@ -254,8 +334,13 @@ Note: This model is experimental and not suited for production use-cases. It may
     "functionCall": false,
     "id": "openai/chatgpt-4o-latest",
     "maxTokens": 16384,
+    "pricing": {
+      "input": 5,
+      "output": 15,
+    },
     "reasoning": false,
-    "vision": false,
+    "releasedAt": "2024-08-14",
+    "vision": true,
   },
   {
     "contextWindowTokens": 8192,
@@ -269,7 +354,12 @@ For best results, use with Llama 3 Instruct context template, temperature 1.4, a
     "functionCall": false,
     "id": "sao10k/l3-lunaris-8b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 2,
+      "output": 2,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-13",
     "vision": false,
   },
   {
@@ -282,7 +372,12 @@ Although more similar to Magnum overall, the model remains very creative, with a
     "functionCall": false,
     "id": "aetherwiing/mn-starcannon-12b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 2,
+      "output": 2,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-13",
     "vision": false,
   },
   {
@@ -294,11 +389,16 @@ GPT-4o ("o" for "omni") is OpenAI's latest AI model, supporting both text and im
 For benchmarking against other models, it was briefly called ["im-also-a-good-gpt2-chatbot"](https://twitter.com/LiamFedus/status/1790064963966370209)",
     "displayName": "OpenAI: GPT-4o (2024-08-06)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-4o-2024-08-06",
     "maxTokens": 16384,
+    "pricing": {
+      "input": 2.5,
+      "output": 10,
+    },
     "reasoning": false,
-    "vision": false,
+    "releasedAt": "2024-08-06",
+    "vision": true,
   },
   {
     "contextWindowTokens": 131072,
@@ -312,7 +412,12 @@ To read more about the model release, [click here](https://ai.meta.com/blog/meta
     "functionCall": false,
     "id": "meta-llama/llama-3.1-405b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 2,
+      "output": 2,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-02",
     "vision": false,
   },
   {
@@ -327,7 +432,12 @@ Check out the model's [HuggingFace page](https://huggingface.co/nothingiisreal/M
     "functionCall": false,
     "id": "nothingiisreal/mn-celeste-12b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1.5,
+      "output": 1.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-02",
     "vision": false,
   },
   {
@@ -344,7 +454,12 @@ Note: This model is experimental and not suited for production use-cases. It may
     "functionCall": false,
     "id": "google/gemini-pro-1.5-exp",
     "maxTokens": 32768,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-01",
     "vision": true,
   },
   {
@@ -357,7 +472,12 @@ This is the online version of the [offline chat model](/models/perplexity/llama-
     "functionCall": false,
     "id": "perplexity/llama-3.1-sonar-large-128k-online",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1,
+      "output": 1,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-01",
     "vision": false,
   },
   {
@@ -370,7 +490,12 @@ This is a normal offline LLM, but the [online version](/models/perplexity/llama-
     "functionCall": false,
     "id": "perplexity/llama-3.1-sonar-large-128k-chat",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1,
+      "output": 1,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-01",
     "vision": false,
   },
   {
@@ -383,7 +508,12 @@ This is the online version of the [offline chat model](/models/perplexity/llama-
     "functionCall": false,
     "id": "perplexity/llama-3.1-sonar-small-128k-online",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.2,
+      "output": 0.2,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-01",
     "vision": false,
   },
   {
@@ -396,7 +526,12 @@ This is a normal offline LLM, but the [online version](/models/perplexity/llama-
     "functionCall": false,
     "id": "perplexity/llama-3.1-sonar-small-128k-chat",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.2,
+      "output": 0.2,
+    },
     "reasoning": false,
+    "releasedAt": "2024-08-01",
     "vision": false,
   },
   {
@@ -408,10 +543,15 @@ It has demonstrated strong performance compared to leading closed-source models
 To read more about the model release, [click here](https://ai.meta.com/blog/meta-llama-3/). Usage of this model is subject to [Meta's Acceptable Use Policy](https://llama.meta.com/llama3/use-policy/).",
     "displayName": "Meta: Llama 3.1 70B Instruct",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "meta-llama/llama-3.1-70b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.3,
+      "output": 0.3,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-23",
     "vision": false,
   },
   {
@@ -428,7 +568,12 @@ _These are free, rate-limited endpoints for [Llama 3.1 8B Instruct](/models/meta
     "functionCall": false,
     "id": "meta-llama/llama-3.1-8b-instruct:free",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-23",
     "vision": false,
   },
   {
@@ -440,10 +585,15 @@ It has demonstrated strong performance compared to leading closed-source models
 To read more about the model release, [click here](https://ai.meta.com/blog/meta-llama-3/). Usage of this model is subject to [Meta's Acceptable Use Policy](https://llama.meta.com/llama3/use-policy/).",
     "displayName": "Meta: Llama 3.1 8B Instruct",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "meta-llama/llama-3.1-8b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-23",
     "vision": false,
   },
   {
@@ -457,10 +607,15 @@ It has demonstrated strong performance compared to leading closed-source models
 To read more about the model release, [click here](https://ai.meta.com/blog/meta-llama-3/). Usage of this model is subject to [Meta's Acceptable Use Policy](https://llama.meta.com/llama3/use-policy/).",
     "displayName": "Meta: Llama 3.1 405B Instruct",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "meta-llama/llama-3.1-405b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1.79,
+      "output": 1.79,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-23",
     "vision": false,
   },
   {
@@ -475,7 +630,12 @@ Usage of this model is subject to [Meta's Acceptable Use Policy](https://llama.m
     "functionCall": true,
     "id": "cognitivecomputations/dolphin-llama-3-70b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.35,
+      "output": 0.4,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-19",
     "vision": false,
   },
   {
@@ -489,10 +649,15 @@ Usage of this model is subject to [Meta's Acceptable Use Policy](https://llama.m
 - Available under the Apache 2.0 license for free use, modification, and distribution",
     "displayName": "Mistral: Codestral Mamba",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "mistralai/codestral-mamba",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.25,
+      "output": 0.25,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-19",
     "vision": false,
   },
   {
@@ -507,7 +672,12 @@ It supports function calling and is released under the Apache 2.0 license.",
     "functionCall": true,
     "id": "mistralai/mistral-nemo",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.13,
+      "output": 0.13,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-19",
     "vision": false,
   },
   {
@@ -521,11 +691,16 @@ GPT-4o mini achieves an 82% score on MMLU and presently ranks higher than GPT-4
 Check out the [launch announcement](https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/) to learn more.",
     "displayName": "OpenAI: GPT-4o-mini (2024-07-18)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-4o-mini-2024-07-18",
     "maxTokens": 16384,
+    "pricing": {
+      "input": 0.15,
+      "output": 0.6,
+    },
     "reasoning": false,
-    "vision": false,
+    "releasedAt": "2024-07-18",
+    "vision": true,
   },
   {
     "contextWindowTokens": 128000,
@@ -541,7 +716,12 @@ Check out the [launch announcement](https://openai.com/index/gpt-4o-mini-advanci
     "functionCall": true,
     "id": "openai/gpt-4o-mini",
     "maxTokens": 16384,
+    "pricing": {
+      "input": 0.15,
+      "output": 0.6,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-18",
     "vision": true,
   },
   {
@@ -560,7 +740,12 @@ _These are free, rate-limited endpoints for [Qwen 2 7B Instruct](/models/qwen/qw
     "functionCall": false,
     "id": "qwen/qwen-2-7b-instruct:free",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-16",
     "vision": false,
   },
   {
@@ -577,7 +762,12 @@ Usage of this model is subject to [Tongyi Qianwen LICENSE AGREEMENT](https://hug
     "functionCall": false,
     "id": "qwen/qwen-2-7b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-16",
     "vision": false,
   },
   {
@@ -592,7 +782,12 @@ See the [launch announcement](https://blog.google/technology/developers/google-g
     "functionCall": false,
     "id": "google/gemma-2-27b-it",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.27,
+      "output": 0.27,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-13",
     "vision": false,
   },
   {
@@ -605,7 +800,12 @@ The model is based on [Qwen2 72B](https://openrouter.ai/models/qwen/qwen-2-72b-i
     "functionCall": false,
     "id": "alpindale/magnum-72b",
     "maxTokens": 1024,
+    "pricing": {
+      "input": 3.75,
+      "output": 4.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-11",
     "vision": false,
   },
   {
@@ -618,7 +818,12 @@ Hermes-2 Θ (theta) was specifically designed with a few capabilities in mind: e
     "functionCall": false,
     "id": "nousresearch/hermes-2-theta-llama-3-8b",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 0.1875,
+      "output": 1.125,
+    },
     "reasoning": false,
+    "releasedAt": "2024-07-11",
     "vision": false,
   },
   {
@@ -635,7 +840,12 @@ _These are free, rate-limited endpoints for [Gemma 2 9B](/models/google/gemma-2-
     "functionCall": false,
     "id": "google/gemma-2-9b-it:free",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-28",
     "vision": false,
   },
   {
@@ -650,7 +860,12 @@ See the [launch announcement](https://blog.google/technology/developers/google-g
     "functionCall": false,
     "id": "google/gemma-2-9b-it",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.06,
+      "output": 0.06,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-28",
     "vision": false,
   },
   {
@@ -666,7 +881,12 @@ Compared to older Stheno version, this model is trained on:
     "functionCall": false,
     "id": "sao10k/l3-stheno-8b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.25,
+      "output": 1.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-27",
     "vision": false,
   },
   {
@@ -684,7 +904,12 @@ Jamba has a knowledge cutoff of February 2024.",
     "functionCall": false,
     "id": "ai21/jamba-instruct",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.5,
+      "output": 0.7,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-25",
     "vision": false,
   },
   {
@@ -702,7 +927,12 @@ Jamba has a knowledge cutoff of February 2024.",
     "functionCall": true,
     "id": "anthropic/claude-3.5-sonnet",
     "maxTokens": 8192,
+    "pricing": {
+      "input": 3,
+      "output": 15,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-20",
     "vision": true,
   },
   {
@@ -722,7 +952,12 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
     "functionCall": true,
     "id": "anthropic/claude-3.5-sonnet:beta",
     "maxTokens": 8192,
+    "pricing": {
+      "input": 3,
+      "output": 15,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-20",
     "vision": true,
   },
   {
@@ -739,7 +974,12 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
     "functionCall": false,
     "id": "sao10k/l3-euryale-70b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.35,
+      "output": 0.4,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-18",
     "vision": false,
   },
   {
@@ -754,7 +994,12 @@ For 128k context length, try [Phi-3 Medium 128K](/models/microsoft/phi-3-medium-
     "functionCall": false,
     "id": "microsoft/phi-3-medium-4k-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.14,
+      "output": 0.14,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-15",
     "vision": false,
   },
   {
@@ -771,7 +1016,12 @@ The model is uncensored and is stripped of alignment and bias. It requires an ex
     "functionCall": false,
     "id": "cognitivecomputations/dolphin-mixtral-8x22b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.9,
+      "output": 0.9,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-08",
     "vision": false,
   },
   {
@@ -788,7 +1038,12 @@ Usage of this model is subject to [Tongyi Qianwen LICENSE AGREEMENT](https://hug
     "functionCall": false,
     "id": "qwen/qwen-2-72b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.35,
+      "output": 0.4,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-07",
     "vision": false,
   },
   {
@@ -806,7 +1061,12 @@ It outperforms many similarly sized models including [Llama 3 8B Instruct](/mode
     "functionCall": false,
     "id": "openchat/openchat-8b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2024-06-01",
     "vision": false,
   },
   {
@@ -817,7 +1077,12 @@ It outperforms many similarly sized models including [Llama 3 8B Instruct](/mode
     "functionCall": false,
     "id": "nousresearch/hermes-2-pro-llama-3-8b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.14,
+      "output": 0.14,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-27",
     "vision": false,
   },
   {
@@ -836,7 +1101,12 @@ NOTE: Support for function calling depends on the provider.",
     "functionCall": true,
     "id": "mistralai/mistral-7b-instruct-v0.3",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-27",
     "vision": false,
   },
   {
@@ -851,7 +1121,12 @@ _These are free, rate-limited endpoints for [Mistral 7B Instruct](/models/mistra
     "functionCall": false,
     "id": "mistralai/mistral-7b-instruct:free",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-27",
     "vision": false,
   },
   {
@@ -861,10 +1136,15 @@ _These are free, rate-limited endpoints for [Mistral 7B Instruct](/models/mistra
 *Mistral 7B Instruct has multiple version variants, and this is intended to be the latest version.*",
     "displayName": "Mistral: Mistral 7B Instruct",
     "enabled": true,
-    "functionCall": false,
+    "functionCall": true,
     "id": "mistralai/mistral-7b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-27",
     "vision": false,
   },
   {
@@ -879,7 +1159,12 @@ _These are higher-throughput endpoints for [Mistral 7B Instruct](/models/mistral
     "functionCall": false,
     "id": "mistralai/mistral-7b-instruct:nitro",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.07,
+      "output": 0.07,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-27",
     "vision": false,
   },
   {
@@ -891,10 +1176,15 @@ At time of release, Phi-3 Medium demonstrated state-of-the-art performance among
 _These are free, rate-limited endpoints for [Phi-3 Mini 128K Instruct](/models/microsoft/phi-3-mini-128k-instruct). Outputs may be cached. Read about rate limits [here](/docs/limits)._",
     "displayName": "Phi-3 Mini 128K Instruct (free)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "microsoft/phi-3-mini-128k-instruct:free",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-26",
     "vision": false,
   },
   {
@@ -904,10 +1194,15 @@ _These are free, rate-limited endpoints for [Phi-3 Mini 128K Instruct](/models/m
 At time of release, Phi-3 Medium demonstrated state-of-the-art performance among lightweight models. This model is static, trained on an offline dataset with an October 2023 cutoff date.",
     "displayName": "Phi-3 Mini 128K Instruct",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "microsoft/phi-3-mini-128k-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.1,
+      "output": 0.1,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-26",
     "vision": false,
   },
   {
@@ -921,10 +1216,15 @@ For 4k context length, try [Phi-3 Medium 4K](/models/microsoft/phi-3-medium-4k-i
 _These are free, rate-limited endpoints for [Phi-3 Medium 128K Instruct](/models/microsoft/phi-3-medium-128k-instruct). Outputs may be cached. Read about rate limits [here](/docs/limits)._",
     "displayName": "Phi-3 Medium 128K Instruct (free)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "microsoft/phi-3-medium-128k-instruct:free",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-24",
     "vision": false,
   },
   {
@@ -936,10 +1236,15 @@ At time of release, Phi-3 Medium demonstrated state-of-the-art performance among
 For 4k context length, try [Phi-3 Medium 4K](/models/microsoft/phi-3-medium-4k-instruct).",
     "displayName": "Phi-3 Medium 128K Instruct",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "microsoft/phi-3-medium-128k-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1,
+      "output": 1,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-24",
     "vision": false,
   },
   {
@@ -954,7 +1259,12 @@ Usage of this model is subject to [Meta's Acceptable Use Policy](https://llama.m
     "functionCall": false,
     "id": "neversleep/llama-3-lumimaid-70b",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 3.375,
+      "output": 4.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-16",
     "vision": false,
   },
   {
@@ -971,7 +1281,12 @@ Usage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.d
     "functionCall": true,
     "id": "google/gemini-flash-1.5",
     "maxTokens": 32768,
+    "pricing": {
+      "input": 0.0375,
+      "output": 0.15,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-14",
     "vision": true,
   },
   {
@@ -984,7 +1299,12 @@ The original V1 model was trained from scratch on 2T tokens, with a composition
     "functionCall": false,
     "id": "deepseek/deepseek-coder",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.14,
+      "output": 0.28,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-14",
     "vision": false,
   },
   {
@@ -999,7 +1319,12 @@ DeepSeek-V2 achieves remarkable performance on both standard benchmarks and open
     "functionCall": true,
     "id": "deepseek/deepseek-chat",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.14,
+      "output": 0.28,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-14",
     "vision": false,
   },
   {
@@ -1012,7 +1337,12 @@ This is the online version of the [offline chat model](/models/perplexity/llama-
     "functionCall": false,
     "id": "perplexity/llama-3-sonar-large-32k-online",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1,
+      "output": 1,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-14",
     "vision": false,
   },
   {
@@ -1025,7 +1355,12 @@ This is a normal offline LLM, but the [online version](/models/perplexity/llama-
     "functionCall": false,
     "id": "perplexity/llama-3-sonar-large-32k-chat",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1,
+      "output": 1,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-14",
     "vision": false,
   },
   {
@@ -1038,7 +1373,12 @@ This is the online version of the [offline chat model](/models/perplexity/llama-
     "functionCall": false,
     "id": "perplexity/llama-3-sonar-small-32k-online",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.2,
+      "output": 0.2,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-14",
     "vision": false,
   },
   {
@@ -1051,7 +1391,12 @@ This is a normal offline LLM, but the [online version](/models/perplexity/llama-
     "functionCall": false,
     "id": "perplexity/llama-3-sonar-small-32k-chat",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.2,
+      "output": 0.2,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-14",
     "vision": false,
   },
   {
@@ -1070,7 +1415,12 @@ To read more about the model release, [click here](https://ai.meta.com/blog/meta
     "functionCall": false,
     "id": "meta-llama/llama-guard-2-8b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.18,
+      "output": 0.18,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-13",
     "vision": false,
   },
   {
@@ -1080,11 +1430,16 @@ To read more about the model release, [click here](https://ai.meta.com/blog/meta
 For benchmarking against other models, it was briefly called ["im-also-a-good-gpt2-chatbot"](https://twitter.com/LiamFedus/status/1790064963966370209)",
     "displayName": "OpenAI: GPT-4o (2024-05-13)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-4o-2024-05-13",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 5,
+      "output": 15,
+    },
     "reasoning": false,
-    "vision": false,
+    "releasedAt": "2024-05-13",
+    "vision": true,
   },
   {
     "contextWindowTokens": 128000,
@@ -1096,7 +1451,12 @@ For benchmarking against other models, it was briefly called ["im-also-a-good-gp
     "functionCall": true,
     "id": "openai/gpt-4o",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 5,
+      "output": 15,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-13",
     "vision": true,
   },
   {
@@ -1106,10 +1466,15 @@ For benchmarking against other models, it was briefly called ["im-also-a-good-gp
 _These are extended-context endpoints for [GPT-4o](/models/openai/gpt-4o). They may have higher prices._",
     "displayName": "OpenAI: GPT-4o (extended)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-4o:extended",
     "maxTokens": 64000,
+    "pricing": {
+      "input": 6,
+      "output": 18,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-13",
     "vision": false,
   },
   {
@@ -1128,7 +1493,12 @@ Usage of this model is subject to [Tongyi Qianwen LICENSE AGREEMENT](https://hug
     "functionCall": false,
     "id": "qwen/qwen-72b-chat",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.81,
+      "output": 0.81,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-09",
     "vision": false,
   },
   {
@@ -1147,7 +1517,12 @@ Usage of this model is subject to [Tongyi Qianwen LICENSE AGREEMENT](https://hug
     "functionCall": false,
     "id": "qwen/qwen-110b-chat",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1.62,
+      "output": 1.62,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-09",
     "vision": false,
   },
   {
@@ -1162,7 +1537,12 @@ Usage of this model is subject to [Meta's Acceptable Use Policy](https://llama.m
     "functionCall": false,
     "id": "neversleep/llama-3-lumimaid-8b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.1875,
+      "output": 1.125,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-04",
     "vision": false,
   },
   {
@@ -1179,7 +1559,12 @@ _These are extended-context endpoints for [Llama 3 Lumimaid 8B](/models/neversle
     "functionCall": false,
     "id": "neversleep/llama-3-lumimaid-8b:extended",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 0.1875,
+      "output": 1.125,
+    },
     "reasoning": false,
+    "releasedAt": "2024-05-04",
     "vision": false,
   },
   {
@@ -1192,7 +1577,12 @@ If you submit a raw prompt, you can use Alpaca or Vicuna formats.",
     "functionCall": false,
     "id": "sao10k/fimbulvetr-11b-v2",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 0.375,
+      "output": 1.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-21",
     "vision": false,
   },
   {
@@ -1204,10 +1594,15 @@ It has demonstrated strong performance compared to leading closed-source models
 To read more about the model release, [click here](https://ai.meta.com/blog/meta-llama-3/). Usage of this model is subject to [Meta's Acceptable Use Policy](https://llama.meta.com/llama3/use-policy/).",
     "displayName": "Meta: Llama 3 70B Instruct",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "meta-llama/llama-3-70b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.35,
+      "output": 0.4,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-18",
     "vision": false,
   },
   {
@@ -1224,7 +1619,12 @@ _These are higher-throughput endpoints for [Llama 3 70B Instruct](/models/meta-l
     "functionCall": false,
     "id": "meta-llama/llama-3-70b-instruct:nitro",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.792,
+      "output": 0.792,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-18",
     "vision": false,
   },
   {
@@ -1241,7 +1641,12 @@ _These are free, rate-limited endpoints for [Llama 3 8B Instruct](/models/meta-l
     "functionCall": false,
     "id": "meta-llama/llama-3-8b-instruct:free",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-18",
     "vision": false,
   },
   {
@@ -1253,10 +1658,15 @@ It has demonstrated strong performance compared to leading closed-source models
 To read more about the model release, [click here](https://ai.meta.com/blog/meta-llama-3/). Usage of this model is subject to [Meta's Acceptable Use Policy](https://llama.meta.com/llama3/use-policy/).",
     "displayName": "Meta: Llama 3 8B Instruct",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "meta-llama/llama-3-8b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-18",
     "vision": false,
   },
   {
@@ -1273,7 +1683,12 @@ _These are higher-throughput endpoints for [Llama 3 8B Instruct](/models/meta-ll
     "functionCall": false,
     "id": "meta-llama/llama-3-8b-instruct:nitro",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.162,
+      "output": 0.162,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-18",
     "vision": false,
   },
   {
@@ -1290,7 +1705,12 @@ _These are extended-context endpoints for [Llama 3 8B Instruct](/models/meta-lla
     "functionCall": false,
     "id": "meta-llama/llama-3-8b-instruct:extended",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 0.1875,
+      "output": 1.125,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-18",
     "vision": false,
   },
   {
@@ -1307,7 +1727,12 @@ See benchmarks on the launch announcement [here](https://mistral.ai/news/mixtral
     "functionCall": false,
     "id": "mistralai/mixtral-8x22b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.65,
+      "output": 0.65,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-17",
     "vision": false,
   },
   {
@@ -1324,7 +1749,12 @@ To read more about the model release, [click here](https://wizardlm.github.io/Wi
     "functionCall": false,
     "id": "microsoft/wizardlm-2-7b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-16",
     "vision": false,
   },
   {
@@ -1341,7 +1771,12 @@ To read more about the model release, [click here](https://wizardlm.github.io/Wi
     "functionCall": false,
     "id": "microsoft/wizardlm-2-8x22b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.5,
+      "output": 0.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-16",
     "vision": false,
   },
   {
@@ -1367,7 +1802,12 @@ Usage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.d
     "functionCall": true,
     "id": "google/gemini-pro-1.5",
     "maxTokens": 32768,
+    "pricing": {
+      "input": 2.5,
+      "output": 7.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-09",
     "vision": true,
   },
   {
@@ -1380,7 +1820,12 @@ Training data: up to December 2023.",
     "functionCall": true,
     "id": "openai/gpt-4-turbo",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 10,
+      "output": 30,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-09",
     "vision": true,
   },
   {
@@ -1392,10 +1837,15 @@ It offers multilingual support for ten key languages to facilitate global busine
 Use of this model is subject to Cohere's [Acceptable Use Policy](https://docs.cohere.com/docs/c4ai-acceptable-use-policy).",
     "displayName": "Cohere: Command R+",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "cohere/command-r-plus",
     "maxTokens": 4000,
+    "pricing": {
+      "input": 3,
+      "output": 15,
+    },
     "reasoning": false,
+    "releasedAt": "2024-04-04",
     "vision": false,
   },
   {
@@ -1412,7 +1862,12 @@ See the launch announcement and benchmark results [here](https://www.databricks.
     "functionCall": false,
     "id": "databricks/dbrx-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 1.08,
+      "output": 1.08,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-29",
     "vision": false,
   },
   {
@@ -1425,7 +1880,12 @@ Descending from earlier versions of Midnight Rose and [Wizard Tulu Dolphin 70B](
     "functionCall": false,
     "id": "sophosympatheia/midnight-rose-70b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.8,
+      "output": 0.8,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-22",
     "vision": false,
   },
   {
@@ -1437,10 +1897,15 @@ Read the launch post [here](https://txt.cohere.com/command-r/).
 Use of this model is subject to Cohere's [Acceptable Use Policy](https://docs.cohere.com/docs/c4ai-acceptable-use-policy).",
     "displayName": "Cohere: Command R",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "cohere/command-r",
     "maxTokens": 4000,
+    "pricing": {
+      "input": 0.5,
+      "output": 1.5,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-14",
     "vision": false,
   },
   {
@@ -1453,7 +1918,12 @@ Use of this model is subject to Cohere's [Acceptable Use Policy](https://docs.co
     "functionCall": false,
     "id": "cohere/command",
     "maxTokens": 4000,
+    "pricing": {
+      "input": 1,
+      "output": 2,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-14",
     "vision": false,
   },
   {
@@ -1469,7 +1939,12 @@ See the launch announcement and benchmark results [here](https://www.anthropic.c
     "functionCall": true,
     "id": "anthropic/claude-3-haiku",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.25,
+      "output": 1.25,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-13",
     "vision": true,
   },
   {
@@ -1484,10 +1959,15 @@ See the launch announcement and benchmark results [here](https://www.anthropic.c
 _This is a faster endpoint, made available in collaboration with Anthropic, that is self-moderated: response moderation happens on the provider's side instead of OpenRouter's. For requests that pass moderation, it's identical to the [Standard](/models/anthropic/claude-3-haiku) variant._",
     "displayName": "Anthropic: Claude 3 Haiku (self-moderated)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "anthropic/claude-3-haiku:beta",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.25,
+      "output": 1.25,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-13",
     "vision": true,
   },
   {
@@ -1499,10 +1979,15 @@ See the launch announcement and benchmark results [here](https://www.anthropic.c
 #multimodal",
     "displayName": "Anthropic: Claude 3 Sonnet",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "anthropic/claude-3-sonnet",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 3,
+      "output": 15,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-05",
     "vision": true,
   },
   {
@@ -1516,10 +2001,15 @@ See the launch announcement and benchmark results [here](https://www.anthropic.c
 _This is a faster endpoint, made available in collaboration with Anthropic, that is self-moderated: response moderation happens on the provider's side instead of OpenRouter's. For requests that pass moderation, it's identical to the [Standard](/models/anthropic/claude-3-sonnet) variant._",
     "displayName": "Anthropic: Claude 3 Sonnet (self-moderated)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "anthropic/claude-3-sonnet:beta",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 3,
+      "output": 15,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-05",
     "vision": true,
   },
   {
@@ -1534,7 +2024,12 @@ See the launch announcement and benchmark results [here](https://www.anthropic.c
     "functionCall": true,
     "id": "anthropic/claude-3-opus",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 15,
+      "output": 75,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-05",
     "vision": true,
   },
   {
@@ -1548,10 +2043,15 @@ See the launch announcement and benchmark results [here](https://www.anthropic.c
 _This is a faster endpoint, made available in collaboration with Anthropic, that is self-moderated: response moderation happens on the provider's side instead of OpenRouter's. For requests that pass moderation, it's identical to the [Standard](/models/anthropic/claude-3-opus) variant._",
     "displayName": "Anthropic: Claude 3 Opus (self-moderated)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "anthropic/claude-3-opus:beta",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 15,
+      "output": 75,
+    },
     "reasoning": false,
+    "releasedAt": "2024-03-05",
     "vision": true,
   },
   {
@@ -1561,10 +2061,15 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
 It is fluent in English, French, Spanish, German, and Italian, with high grammatical accuracy, and its long context window allows precise information recall from large documents.",
     "displayName": "Mistral Large",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "mistralai/mistral-large",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 3,
+      "output": 9,
+    },
     "reasoning": false,
+    "releasedAt": "2024-02-26",
     "vision": false,
   },
   {
@@ -1577,7 +2082,12 @@ It is fluent in English, French, Spanish, German, and Italian, with high grammat
     "functionCall": true,
     "id": "openai/gpt-4-turbo-preview",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 10,
+      "output": 30,
+    },
     "reasoning": false,
+    "releasedAt": "2024-01-25",
     "vision": false,
   },
   {
@@ -1587,10 +2097,15 @@ It is fluent in English, French, Spanish, German, and Italian, with high grammat
 Training data up to Sep 2021.",
     "displayName": "OpenAI: GPT-3.5 Turbo (older v0613)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-3.5-turbo-0613",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 1,
+      "output": 2,
+    },
     "reasoning": false,
+    "releasedAt": "2024-01-25",
     "vision": false,
   },
   {
@@ -1605,7 +2120,12 @@ The model was trained on over 1,000,000 entries of primarily [GPT-4](/models/ope
     "functionCall": false,
     "id": "nousresearch/nous-hermes-2-mixtral-8x7b-dpo",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.45,
+      "output": 0.45,
+    },
     "reasoning": false,
+    "releasedAt": "2024-01-16",
     "vision": false,
   },
   {
@@ -1613,10 +2133,15 @@ The model was trained on over 1,000,000 entries of primarily [GPT-4](/models/ope
     "description": "This is Mistral AI's closed-source, medium-sided model. It's powered by a closed-source prototype and excels at reasoning, code, JSON, chat, and more. In benchmarks, it compares with many of the flagship models of other companies.",
     "displayName": "Mistral Medium",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "mistralai/mistral-medium",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 2.7,
+      "output": 8.1,
+    },
     "reasoning": false,
+    "releasedAt": "2024-01-10",
     "vision": false,
   },
   {
@@ -1625,10 +2150,15 @@ The model was trained on over 1,000,000 entries of primarily [GPT-4](/models/ope
 #moe",
     "displayName": "Mistral Small",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "mistralai/mistral-small",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 2,
+      "output": 6,
+    },
     "reasoning": false,
+    "releasedAt": "2024-01-10",
     "vision": false,
   },
   {
@@ -1636,10 +2166,15 @@ The model was trained on over 1,000,000 entries of primarily [GPT-4](/models/ope
     "description": "This model is currently powered by Mistral-7B-v0.2, and incorporates a "better" fine-tuning than [Mistral 7B](/models/mistralai/mistral-7b-instruct-v0.1), inspired by community work. It's best used for large batch processing tasks where cost is a significant factor but reasoning capabilities are not crucial.",
     "displayName": "Mistral Tiny",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "mistralai/mistral-tiny",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.25,
+      "output": 0.25,
+    },
     "reasoning": false,
+    "releasedAt": "2024-01-10",
     "vision": false,
   },
   {
@@ -1650,7 +2185,12 @@ The model was trained on over 1,000,000 entries of primarily [GPT-4](/models/ope
     "functionCall": false,
     "id": "austism/chronos-hermes-13b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.13,
+      "output": 0.13,
+    },
     "reasoning": false,
+    "releasedAt": "2024-01-05",
     "vision": false,
   },
   {
@@ -1663,7 +2203,12 @@ Nous-Hermes 2 on Yi 34B outperforms all Nous-Hermes & Open-Hermes models of the
     "functionCall": false,
     "id": "nousresearch/nous-hermes-yi-34b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.72,
+      "output": 0.72,
+    },
     "reasoning": false,
+    "releasedAt": "2024-01-02",
     "vision": false,
   },
   {
@@ -1680,7 +2225,12 @@ An improved version of [Mistral 7B Instruct](/modelsmistralai/mistral-7b-instruc
     "functionCall": false,
     "id": "mistralai/mistral-7b-instruct-v0.2",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-28",
     "vision": false,
   },
   {
@@ -1695,7 +2245,12 @@ The model is uncensored and is stripped of alignment and bias. It requires an ex
     "functionCall": false,
     "id": "cognitivecomputations/dolphin-mixtral-8x7b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.5,
+      "output": 0.5,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-21",
     "vision": false,
   },
   {
@@ -1709,10 +2264,15 @@ Usage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.d
 #multimodal",
     "displayName": "Google: Gemini Pro Vision 1.0",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "google/gemini-pro-vision",
     "maxTokens": 8192,
+    "pricing": {
+      "input": 0.125,
+      "output": 0.375,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-13",
     "vision": true,
   },
   {
@@ -1724,10 +2284,15 @@ See the benchmarks and prompting guidelines from [Deepmind](https://deepmind.goo
 Usage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.dev/terms).",
     "displayName": "Google: Gemini Pro 1.0",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "google/gemini-pro",
     "maxTokens": 32768,
+    "pricing": {
+      "input": 0.125,
+      "output": 0.375,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-13",
     "vision": false,
   },
   {
@@ -1737,10 +2302,15 @@ Usage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.d
 Instruct model fine-tuned by Mistral. #moe",
     "displayName": "Mixtral 8x7B Instruct",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "mistralai/mixtral-8x7b-instruct",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.24,
+      "output": 0.24,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-10",
     "vision": false,
   },
   {
@@ -1755,7 +2325,12 @@ _These are higher-throughput endpoints for [Mixtral 8x7B Instruct](/models/mistr
     "functionCall": false,
     "id": "mistralai/mixtral-8x7b-instruct:nitro",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.54,
+      "output": 0.54,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-10",
     "vision": false,
   },
   {
@@ -1768,7 +2343,12 @@ _These are higher-throughput endpoints for [Mixtral 8x7B Instruct](/models/mistr
     "functionCall": false,
     "id": "mistralai/mixtral-8x7b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.54,
+      "output": 0.54,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-10",
     "vision": false,
   },
   {
@@ -1781,7 +2361,12 @@ StripedHyena uses a new architecture that competes with traditional Transformers
     "functionCall": false,
     "id": "togethercomputer/stripedhyena-nous-7b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.18,
+      "output": 0.18,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-09",
     "vision": false,
   },
   {
@@ -1798,7 +2383,12 @@ _These are free, rate-limited endpoints for [MythoMist 7B](/models/gryphe/mythom
     "functionCall": false,
     "id": "gryphe/mythomist-7b:free",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-07",
     "vision": false,
   },
   {
@@ -1813,7 +2403,12 @@ It combines [Neural Chat 7B](/models/intel/neural-chat-7b), Airoboros 7b, [Toppy
     "functionCall": false,
     "id": "gryphe/mythomist-7b",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 0.375,
+      "output": 0.375,
+    },
     "reasoning": false,
+    "releasedAt": "2023-12-07",
     "vision": false,
   },
   {
@@ -1831,7 +2426,12 @@ _These are free, rate-limited endpoints for [OpenChat 3.5 7B](/models/openchat/o
     "functionCall": false,
     "id": "openchat/openchat-7b:free",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-28",
     "vision": false,
   },
   {
@@ -1847,7 +2447,12 @@ _These are free, rate-limited endpoints for [OpenChat 3.5 7B](/models/openchat/o
     "functionCall": false,
     "id": "openchat/openchat-7b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-28",
     "vision": false,
   },
   {
@@ -1860,7 +2465,12 @@ _These are free, rate-limited endpoints for [OpenChat 3.5 7B](/models/openchat/o
     "functionCall": false,
     "id": "neversleep/noromaid-20b",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 1.5,
+      "output": 2.25,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-26",
     "vision": false,
   },
   {
@@ -1871,7 +2481,12 @@ _These are free, rate-limited endpoints for [OpenChat 3.5 7B](/models/openchat/o
     "functionCall": false,
     "id": "anthropic/claude-instant-1.1",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 0.8,
+      "output": 2.4,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-22",
     "vision": false,
   },
   {
@@ -1882,7 +2497,12 @@ _These are free, rate-limited endpoints for [OpenChat 3.5 7B](/models/openchat/o
     "functionCall": false,
     "id": "anthropic/claude-2.1",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 8,
+      "output": 24,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-22",
     "vision": false,
   },
   {
@@ -1895,7 +2515,12 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
     "functionCall": false,
     "id": "anthropic/claude-2.1:beta",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 8,
+      "output": 24,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-22",
     "vision": false,
   },
   {
@@ -1906,7 +2531,12 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
     "functionCall": false,
     "id": "anthropic/claude-2",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 8,
+      "output": 24,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-22",
     "vision": false,
   },
   {
@@ -1919,7 +2549,12 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
     "functionCall": false,
     "id": "anthropic/claude-2:beta",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 8,
+      "output": 24,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-22",
     "vision": false,
   },
   {
@@ -1931,7 +2566,12 @@ Potentially the most interesting finding from training on a good ratio (est. of
     "functionCall": false,
     "id": "teknium/openhermes-2.5-mistral-7b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.17,
+      "output": 0.17,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-20",
     "vision": false,
   },
   {
@@ -1946,7 +2586,12 @@ Potentially the most interesting finding from training on a good ratio (est. of
     "functionCall": false,
     "id": "openai/gpt-4-vision-preview",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 10,
+      "output": 30,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-13",
     "vision": true,
   },
   {
@@ -1960,7 +2605,12 @@ A multi-model merge of several LLaMA2 70B finetunes for roleplaying and creative
     "functionCall": false,
     "id": "lizpreciatior/lzlv-70b-fp16-hf",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.35,
+      "output": 0.4,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-12",
     "vision": false,
   },
   {
@@ -1977,7 +2627,12 @@ Credits to
     "functionCall": false,
     "id": "alpindale/goliath-120b",
     "maxTokens": 400,
+    "pricing": {
+      "input": 9.375,
+      "output": 9.375,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-10",
     "vision": false,
   },
   {
@@ -1998,7 +2653,12 @@ _These are free, rate-limited endpoints for [Toppy M 7B](/models/undi95/toppy-m-
     "functionCall": false,
     "id": "undi95/toppy-m-7b:free",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-10",
     "vision": false,
   },
   {
@@ -2017,7 +2677,12 @@ List of merged models:
     "functionCall": false,
     "id": "undi95/toppy-m-7b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.07,
+      "output": 0.07,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-10",
     "vision": false,
   },
   {
@@ -2038,7 +2703,12 @@ _These are higher-throughput endpoints for [Toppy M 7B](/models/undi95/toppy-m-7
     "functionCall": false,
     "id": "undi95/toppy-m-7b:nitro",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.07,
+      "output": 0.07,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-10",
     "vision": false,
   },
   {
@@ -2051,7 +2721,12 @@ A major redesign of this router is coming soon. Stay tuned on [Discord](https://
     "functionCall": false,
     "id": "openrouter/auto",
     "maxTokens": undefined,
+    "pricing": {
+      "input": undefined,
+      "output": undefined,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-08",
     "vision": false,
   },
   {
@@ -2064,8 +2739,13 @@ Training data: up to April 2023.",
     "functionCall": true,
     "id": "openai/gpt-4-1106-preview",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 10,
+      "output": 30,
+    },
     "reasoning": false,
-    "vision": true,
+    "releasedAt": "2023-11-06",
+    "vision": false,
   },
   {
     "contextWindowTokens": 16385,
@@ -2075,7 +2755,12 @@ Training data: up to April 2023.",
     "functionCall": true,
     "id": "openai/gpt-3.5-turbo-1106",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 1,
+      "output": 2,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-06",
     "vision": false,
   },
   {
@@ -2086,7 +2771,12 @@ Training data: up to April 2023.",
     "functionCall": false,
     "id": "google/palm-2-codechat-bison-32k",
     "maxTokens": 32768,
+    "pricing": {
+      "input": 0.25,
+      "output": 0.5,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-03",
     "vision": false,
   },
   {
@@ -2097,7 +2787,12 @@ Training data: up to April 2023.",
     "functionCall": false,
     "id": "google/palm-2-chat-bison-32k",
     "maxTokens": 32768,
+    "pricing": {
+      "input": 0.25,
+      "output": 0.5,
+    },
     "reasoning": false,
+    "releasedAt": "2023-11-03",
     "vision": false,
   },
   {
@@ -2110,7 +2805,12 @@ Currently based on [jondurbin/airoboros-l2-70b](https://huggingface.co/jondurbin
     "functionCall": false,
     "id": "jondurbin/airoboros-l2-70b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.5,
+      "output": 0.5,
+    },
     "reasoning": false,
+    "releasedAt": "2023-10-29",
     "vision": false,
   },
   {
@@ -2121,7 +2821,12 @@ Currently based on [jondurbin/airoboros-l2-70b](https://huggingface.co/jondurbin
     "functionCall": false,
     "id": "xwin-lm/xwin-lm-70b",
     "maxTokens": 400,
+    "pricing": {
+      "input": 3.75,
+      "output": 3.75,
+    },
     "reasoning": false,
+    "releasedAt": "2023-10-15",
     "vision": false,
   },
   {
@@ -2132,7 +2837,12 @@ Currently based on [jondurbin/airoboros-l2-70b](https://huggingface.co/jondurbin
     "functionCall": true,
     "id": "mistralai/mistral-7b-instruct-v0.1",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.055,
+      "output": 0.055,
+    },
     "reasoning": false,
+    "releasedAt": "2023-09-28",
     "vision": false,
   },
   {
@@ -2143,7 +2853,12 @@ Currently based on [jondurbin/airoboros-l2-70b](https://huggingface.co/jondurbin
     "functionCall": false,
     "id": "openai/gpt-3.5-turbo-instruct",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 1.5,
+      "output": 2,
+    },
     "reasoning": false,
+    "releasedAt": "2023-09-28",
     "vision": false,
   },
   {
@@ -2154,7 +2869,12 @@ Currently based on [jondurbin/airoboros-l2-70b](https://huggingface.co/jondurbin
     "functionCall": false,
     "id": "pygmalionai/mythalion-13b",
     "maxTokens": 400,
+    "pricing": {
+      "input": 1.125,
+      "output": 1.125,
+    },
     "reasoning": false,
+    "releasedAt": "2023-09-02",
     "vision": false,
   },
   {
@@ -2162,10 +2882,15 @@ Currently based on [jondurbin/airoboros-l2-70b](https://huggingface.co/jondurbin
     "description": "GPT-4-32k is an extended version of GPT-4, with the same capabilities but quadrupled context length, allowing for processing up to 40 pages of text in a single pass. This is particularly beneficial for handling longer content like interacting with PDFs without an external vector database. Training data: up to Sep 2021.",
     "displayName": "OpenAI: GPT-4 32k (older v0314)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-4-32k-0314",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 60,
+      "output": 120,
+    },
     "reasoning": false,
+    "releasedAt": "2023-08-28",
     "vision": false,
   },
   {
@@ -2173,10 +2898,15 @@ Currently based on [jondurbin/airoboros-l2-70b](https://huggingface.co/jondurbin
     "description": "GPT-4-32k is an extended version of GPT-4, with the same capabilities but quadrupled context length, allowing for processing up to 40 pages of text in a single pass. This is particularly beneficial for handling longer content like interacting with PDFs without an external vector database. Training data: up to Sep 2021.",
     "displayName": "OpenAI: GPT-4 32k",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-4-32k",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 60,
+      "output": 120,
+    },
     "reasoning": false,
+    "releasedAt": "2023-08-28",
     "vision": false,
   },
   {
@@ -2184,10 +2914,15 @@ Currently based on [jondurbin/airoboros-l2-70b](https://huggingface.co/jondurbin
     "description": "This model offers four times the context length of gpt-3.5-turbo, allowing it to support approximately 20 pages of text in a single request at a higher cost. Training data: up to Sep 2021.",
     "displayName": "OpenAI: GPT-3.5 Turbo 16k",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-3.5-turbo-16k",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 3,
+      "output": 4,
+    },
     "reasoning": false,
+    "releasedAt": "2023-08-28",
     "vision": false,
   },
   {
@@ -2198,7 +2933,12 @@ Currently based on [jondurbin/airoboros-l2-70b](https://huggingface.co/jondurbin
     "functionCall": false,
     "id": "nousresearch/nous-hermes-llama2-13b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.17,
+      "output": 0.17,
+    },
     "reasoning": false,
+    "releasedAt": "2023-08-20",
     "vision": false,
   },
   {
@@ -2211,7 +2951,12 @@ _These are free, rate-limited endpoints for [Zephyr 7B](/models/huggingfaceh4/ze
     "functionCall": false,
     "id": "huggingfaceh4/zephyr-7b-beta:free",
     "maxTokens": 2048,
+    "pricing": {
+      "input": 0,
+      "output": 0,
+    },
     "reasoning": false,
+    "releasedAt": "2023-08-02",
     "vision": false,
   },
   {
@@ -2222,7 +2967,12 @@ _These are free, rate-limited endpoints for [Zephyr 7B](/models/huggingfaceh4/ze
     "functionCall": false,
     "id": "mancer/weaver",
     "maxTokens": 1000,
+    "pricing": {
+      "input": 1.875,
+      "output": 2.25,
+    },
     "reasoning": false,
+    "releasedAt": "2023-08-02",
     "vision": false,
   },
   {
@@ -2233,7 +2983,12 @@ _These are free, rate-limited endpoints for [Zephyr 7B](/models/huggingfaceh4/ze
     "functionCall": false,
     "id": "anthropic/claude-instant-1.0",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.8,
+      "output": 2.4,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-28",
     "vision": false,
   },
   {
@@ -2244,7 +2999,12 @@ _These are free, rate-limited endpoints for [Zephyr 7B](/models/huggingfaceh4/ze
     "functionCall": false,
     "id": "anthropic/claude-1.2",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 8,
+      "output": 24,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-28",
     "vision": false,
   },
   {
@@ -2255,7 +3015,12 @@ _These are free, rate-limited endpoints for [Zephyr 7B](/models/huggingfaceh4/ze
     "functionCall": false,
     "id": "anthropic/claude-1",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 8,
+      "output": 24,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-28",
     "vision": false,
   },
   {
@@ -2266,7 +3031,12 @@ _These are free, rate-limited endpoints for [Zephyr 7B](/models/huggingfaceh4/ze
     "functionCall": false,
     "id": "anthropic/claude-instant-1",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.8,
+      "output": 2.4,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-28",
     "vision": false,
   },
   {
@@ -2279,7 +3049,12 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
     "functionCall": false,
     "id": "anthropic/claude-instant-1:beta",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.8,
+      "output": 2.4,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-28",
     "vision": false,
   },
   {
@@ -2290,7 +3065,12 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
     "functionCall": false,
     "id": "anthropic/claude-2.0",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 8,
+      "output": 24,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-28",
     "vision": false,
   },
   {
@@ -2303,7 +3083,12 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
     "functionCall": false,
     "id": "anthropic/claude-2.0:beta",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 8,
+      "output": 24,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-28",
     "vision": false,
   },
   {
@@ -2314,7 +3099,12 @@ _This is a faster endpoint, made available in collaboration with Anthropic, that
     "functionCall": false,
     "id": "undi95/remm-slerp-l2-13b",
     "maxTokens": 400,
+    "pricing": {
+      "input": 1.125,
+      "output": 1.125,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-22",
     "vision": false,
   },
   {
@@ -2327,7 +3117,12 @@ _These are extended-context endpoints for [ReMM SLERP 13B](/models/undi95/remm-s
     "functionCall": false,
     "id": "undi95/remm-slerp-l2-13b:extended",
     "maxTokens": 400,
+    "pricing": {
+      "input": 1.125,
+      "output": 1.125,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-22",
     "vision": false,
   },
   {
@@ -2338,7 +3133,12 @@ _These are extended-context endpoints for [ReMM SLERP 13B](/models/undi95/remm-s
     "functionCall": false,
     "id": "google/palm-2-codechat-bison",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.25,
+      "output": 0.5,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-20",
     "vision": false,
   },
   {
@@ -2349,7 +3149,12 @@ _These are extended-context endpoints for [ReMM SLERP 13B](/models/undi95/remm-s
     "functionCall": false,
     "id": "google/palm-2-chat-bison",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.25,
+      "output": 0.5,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-20",
     "vision": false,
   },
   {
@@ -2360,7 +3165,12 @@ _These are extended-context endpoints for [ReMM SLERP 13B](/models/undi95/remm-s
     "functionCall": false,
     "id": "gryphe/mythomax-l2-13b",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.1,
+      "output": 0.1,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-02",
     "vision": false,
   },
   {
@@ -2373,7 +3183,12 @@ _These are higher-throughput endpoints for [MythoMax 13B](/models/gryphe/mythoma
     "functionCall": false,
     "id": "gryphe/mythomax-l2-13b:nitro",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.2,
+      "output": 0.2,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-02",
     "vision": false,
   },
   {
@@ -2386,7 +3201,12 @@ _These are extended-context endpoints for [MythoMax 13B](/models/gryphe/mythomax
     "functionCall": false,
     "id": "gryphe/mythomax-l2-13b:extended",
     "maxTokens": 400,
+    "pricing": {
+      "input": 1.125,
+      "output": 1.125,
+    },
     "reasoning": false,
+    "releasedAt": "2023-07-02",
     "vision": false,
   },
   {
@@ -2397,7 +3217,12 @@ _These are extended-context endpoints for [MythoMax 13B](/models/gryphe/mythomax
     "functionCall": false,
     "id": "meta-llama/llama-2-13b-chat",
     "maxTokens": undefined,
+    "pricing": {
+      "input": 0.27,
+      "output": 0.27,
+    },
     "reasoning": false,
+    "releasedAt": "2023-06-20",
     "vision": false,
   },
   {
@@ -2405,10 +3230,15 @@ _These are extended-context endpoints for [MythoMax 13B](/models/gryphe/mythomax
     "description": "GPT-4-0314 is the first version of GPT-4 released, with a context length of 8,192 tokens, and was supported until June 14. Training data: up to Sep 2021.",
     "displayName": "OpenAI: GPT-4 (older v0314)",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-4-0314",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 30,
+      "output": 60,
+    },
     "reasoning": false,
+    "releasedAt": "2023-05-28",
     "vision": false,
   },
   {
@@ -2416,11 +3246,16 @@ _These are extended-context endpoints for [MythoMax 13B](/models/gryphe/mythomax
     "description": "OpenAI's flagship model, GPT-4 is a large-scale multimodal language model capable of solving difficult problems with greater accuracy than previous models due to its broader general knowledge and advanced reasoning capabilities. Training data: up to Sep 2021.",
     "displayName": "OpenAI: GPT-4",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-4",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 30,
+      "output": 60,
+    },
     "reasoning": false,
-    "vision": true,
+    "releasedAt": "2023-05-28",
+    "vision": false,
   },
   {
     "contextWindowTokens": 4095,
@@ -2432,7 +3267,12 @@ Training data up to Sep 2021.",
     "functionCall": false,
     "id": "openai/gpt-3.5-turbo-0301",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 1,
+      "output": 2,
+    },
     "reasoning": false,
+    "releasedAt": "2023-05-28",
     "vision": false,
   },
   {
@@ -2445,7 +3285,12 @@ This version has a higher accuracy at responding in requested formats and a fix
     "functionCall": true,
     "id": "openai/gpt-3.5-turbo-0125",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.5,
+      "output": 1.5,
+    },
     "reasoning": false,
+    "releasedAt": "2023-05-28",
     "vision": false,
   },
   {
@@ -2455,10 +3300,15 @@ This version has a higher accuracy at responding in requested formats and a fix
 Training data up to Sep 2021.",
     "displayName": "OpenAI: GPT-3.5 Turbo",
     "enabled": false,
-    "functionCall": false,
+    "functionCall": true,
     "id": "openai/gpt-3.5-turbo",
     "maxTokens": 4096,
+    "pricing": {
+      "input": 0.5,
+      "output": 1.5,
+    },
     "reasoning": false,
+    "releasedAt": "2023-05-28",
     "vision": false,
   },
 ]