mirascope 1.18.3__py3-none-any.whl → 1.18.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (88)
  1. mirascope/__init__.py +20 -2
  2. mirascope/beta/openai/__init__.py +1 -1
  3. mirascope/beta/openai/realtime/__init__.py +1 -1
  4. mirascope/beta/openai/realtime/tool.py +1 -1
  5. mirascope/beta/rag/__init__.py +2 -2
  6. mirascope/beta/rag/base/__init__.py +2 -2
  7. mirascope/beta/rag/weaviate/__init__.py +1 -1
  8. mirascope/core/__init__.py +26 -8
  9. mirascope/core/anthropic/__init__.py +3 -3
  10. mirascope/core/anthropic/_utils/_calculate_cost.py +114 -47
  11. mirascope/core/anthropic/call_response.py +9 -1
  12. mirascope/core/anthropic/call_response_chunk.py +7 -0
  13. mirascope/core/anthropic/stream.py +3 -1
  14. mirascope/core/azure/__init__.py +2 -2
  15. mirascope/core/azure/_utils/_calculate_cost.py +4 -1
  16. mirascope/core/azure/call_response.py +9 -1
  17. mirascope/core/azure/call_response_chunk.py +5 -0
  18. mirascope/core/azure/stream.py +3 -1
  19. mirascope/core/base/__init__.py +11 -9
  20. mirascope/core/base/_utils/__init__.py +10 -10
  21. mirascope/core/base/_utils/_get_common_usage.py +8 -4
  22. mirascope/core/base/_utils/_get_create_fn_or_async_create_fn.py +2 -2
  23. mirascope/core/base/_utils/_protocols.py +9 -8
  24. mirascope/core/base/call_response.py +22 -20
  25. mirascope/core/base/call_response_chunk.py +12 -1
  26. mirascope/core/base/stream.py +24 -21
  27. mirascope/core/base/tool.py +7 -5
  28. mirascope/core/base/types.py +22 -5
  29. mirascope/core/bedrock/__init__.py +3 -3
  30. mirascope/core/bedrock/_utils/_calculate_cost.py +4 -1
  31. mirascope/core/bedrock/call_response.py +8 -1
  32. mirascope/core/bedrock/call_response_chunk.py +5 -0
  33. mirascope/core/bedrock/stream.py +3 -1
  34. mirascope/core/cohere/__init__.py +2 -2
  35. mirascope/core/cohere/_utils/_calculate_cost.py +4 -3
  36. mirascope/core/cohere/call_response.py +9 -1
  37. mirascope/core/cohere/call_response_chunk.py +5 -0
  38. mirascope/core/cohere/stream.py +3 -1
  39. mirascope/core/gemini/__init__.py +2 -2
  40. mirascope/core/gemini/_utils/_calculate_cost.py +4 -1
  41. mirascope/core/gemini/_utils/_convert_message_params.py +1 -1
  42. mirascope/core/gemini/call_response.py +9 -1
  43. mirascope/core/gemini/call_response_chunk.py +5 -0
  44. mirascope/core/gemini/stream.py +3 -1
  45. mirascope/core/google/__init__.py +2 -2
  46. mirascope/core/google/_utils/_calculate_cost.py +141 -14
  47. mirascope/core/google/_utils/_convert_message_params.py +23 -51
  48. mirascope/core/google/_utils/_message_param_converter.py +34 -33
  49. mirascope/core/google/_utils/_validate_media_type.py +34 -0
  50. mirascope/core/google/call_response.py +26 -4
  51. mirascope/core/google/call_response_chunk.py +17 -9
  52. mirascope/core/google/stream.py +20 -2
  53. mirascope/core/groq/__init__.py +2 -2
  54. mirascope/core/groq/_utils/_calculate_cost.py +12 -11
  55. mirascope/core/groq/call_response.py +9 -1
  56. mirascope/core/groq/call_response_chunk.py +5 -0
  57. mirascope/core/groq/stream.py +3 -1
  58. mirascope/core/litellm/__init__.py +1 -1
  59. mirascope/core/litellm/_utils/_setup_call.py +7 -3
  60. mirascope/core/mistral/__init__.py +2 -2
  61. mirascope/core/mistral/_utils/_calculate_cost.py +10 -9
  62. mirascope/core/mistral/call_response.py +9 -1
  63. mirascope/core/mistral/call_response_chunk.py +5 -0
  64. mirascope/core/mistral/stream.py +3 -1
  65. mirascope/core/openai/__init__.py +2 -2
  66. mirascope/core/openai/_utils/_calculate_cost.py +78 -37
  67. mirascope/core/openai/call_params.py +13 -0
  68. mirascope/core/openai/call_response.py +14 -1
  69. mirascope/core/openai/call_response_chunk.py +12 -0
  70. mirascope/core/openai/stream.py +6 -4
  71. mirascope/core/vertex/__init__.py +1 -1
  72. mirascope/core/vertex/_utils/_calculate_cost.py +1 -0
  73. mirascope/core/vertex/_utils/_convert_message_params.py +1 -1
  74. mirascope/core/vertex/call_response.py +9 -1
  75. mirascope/core/vertex/call_response_chunk.py +5 -0
  76. mirascope/core/vertex/stream.py +3 -1
  77. mirascope/integrations/_middleware_factory.py +6 -6
  78. mirascope/integrations/logfire/_utils.py +1 -1
  79. mirascope/llm/__init__.py +1 -1
  80. mirascope/llm/_protocols.py +5 -5
  81. mirascope/llm/call_response.py +16 -7
  82. mirascope/llm/stream.py +43 -31
  83. mirascope/retries/__init__.py +1 -1
  84. mirascope/tools/__init__.py +2 -2
  85. {mirascope-1.18.3.dist-info → mirascope-1.18.4.dist-info}/METADATA +1 -1
  86. {mirascope-1.18.3.dist-info → mirascope-1.18.4.dist-info}/RECORD +88 -87
  87. {mirascope-1.18.3.dist-info → mirascope-1.18.4.dist-info}/WHEEL +0 -0
  88. {mirascope-1.18.3.dist-info → mirascope-1.18.4.dist-info}/licenses/LICENSE +0 -0
mirascope/core/openai/_utils/_calculate_cost.py CHANGED
@@ -3,6 +3,7 @@
 
 def calculate_cost(
     input_tokens: int | float | None,
+    cached_tokens: int | float | None,
     output_tokens: int | float | None,
     model: str = "gpt-3.5-turbo-16k",
 ) -> float | None:
@@ -10,196 +11,236 @@ def calculate_cost(
 
     https://openai.com/pricing
 
-    Model                                    Input                Output
-    gpt-4o                                   $2.50 / 1M tokens    $10.00 / 1M tokens
-    gpt-4o-2024-11-20                        $2.50 / 1M tokens    $10.00 / 1M tokens
-    gpt-4o-2024-08-06                        $2.50 / 1M tokens    $10.00 / 1M tokens
-    gpt-4o-2024-05-13                        $5.00 / 1M tokens    $15.00 / 1M tokens
-    gpt-4o-audio-preview                     $2.50 / 1M tokens    $10.00 / 1M tokens
-    gpt-4o-audio-preview-2024-12-17          $2.50 / 1M tokens    $10.00 / 1M tokens
-    gpt-4o-audio-preview-2024-10-01          $2.50 / 1M tokens    $10.00 / 1M tokens
-    gpt-4o-realtime-preview                  $5.00 / 1M tokens    $20.00 / 1M tokens
-    gpt-4o-realtime-preview-2024-12-17       $5.00 / 1M tokens    $20.00 / 1M tokens
-    gpt-4o-realtime-preview-2024-10-01       $5.00 / 1M tokens    $20.00 / 1M tokens
-    gpt-4o-mini                              $0.15 / 1M tokens    $0.60 / 1M tokens
-    gpt-4o-mini-2024-07-18                   $0.15 / 1M tokens    $0.60 / 1M tokens
-    gpt-4o-mini-audio-preview                $0.15 / 1M tokens    $0.60 / 1M tokens
-    gpt-4o-mini-audio-preview-2024-12-17     $0.15 / 1M tokens    $0.60 / 1M tokens
-    gpt-4o-mini-realtime-preview             $0.60 / 1M tokens    $2.40 / 1M tokens
-    gpt-4o-mini-realtime-preview-2024-12-17  $0.60 / 1M tokens    $2.40 / 1M tokens
-    o1                                       $15.00 / 1M tokens   $60.00 / 1M tokens
-    o1-2024-12-17                            $15.00 / 1M tokens   $60.00 / 1M tokens
-    o1-preview-2024-09-12                    $15.00 / 1M tokens   $60.00 / 1M tokens
-    o3-mini                                  $1.10 / 1M tokens    $4.40 / 1M tokens
-    o3-mini-2025-01-31                       $1.10 / 1M tokens    $4.40 / 1M tokens
-    o1-mini                                  $1.10 / 1M tokens    $4.40 / 1M tokens
-    o1-mini-2024-09-12                       $1.10 / 1M tokens    $4.40 / 1M tokens
-    gpt-4-turbo                              $10.00 / 1M tokens   $30.00 / 1M tokens
-    gpt-4-turbo-2024-04-09                   $10.00 / 1M tokens   $30.00 / 1M tokens
-    gpt-3.5-turbo-0125                       $0.50 / 1M tokens    $1.50 / 1M tokens
-    gpt-3.5-turbo-1106                       $1.00 / 1M tokens    $2.00 / 1M tokens
-    gpt-4-1106-preview                       $10.00 / 1M tokens   $30.00 / 1M tokens
-    gpt-4                                    $30.00 / 1M tokens   $60.00 / 1M tokens
-    text-embedding-3-small                   $0.02 / 1M tokens
-    text-embedding-3-large                   $0.13 / 1M tokens
-    text-embedding-ada-0002                  $0.10 / 1M tokens
+    Model                                    Input                Cached               Output
+    gpt-4o                                   $2.50 / 1M tokens    $1.25 / 1M tokens    $10.00 / 1M tokens
+    gpt-4o-2024-11-20                        $2.50 / 1M tokens    $1.25 / 1M tokens    $10.00 / 1M tokens
+    gpt-4o-2024-08-06                        $2.50 / 1M tokens    $1.25 / 1M tokens    $10.00 / 1M tokens
+    gpt-4o-2024-05-13                        $5.00 / 1M tokens    $2.50 / 1M tokens    $15.00 / 1M tokens
+    gpt-4o-audio-preview                     $2.50 / 1M tokens    $1.25 / 1M tokens    $10.00 / 1M tokens
+    gpt-4o-audio-preview-2024-12-17          $2.50 / 1M tokens    $1.25 / 1M tokens    $10.00 / 1M tokens
+    gpt-4o-audio-preview-2024-10-01          $2.50 / 1M tokens    $1.25 / 1M tokens    $10.00 / 1M tokens
+    gpt-4o-realtime-preview                  $5.00 / 1M tokens    $2.50 / 1M tokens    $20.00 / 1M tokens
+    gpt-4o-realtime-preview-2024-12-17       $5.00 / 1M tokens    $2.50 / 1M tokens    $20.00 / 1M tokens
+    gpt-4o-realtime-preview-2024-10-01       $5.00 / 1M tokens    $2.50 / 1M tokens    $20.00 / 1M tokens
+    gpt-4o-mini                              $0.15 / 1M tokens    $0.08 / 1M tokens    $0.60 / 1M tokens
+    gpt-4o-mini-2024-07-18                   $0.15 / 1M tokens    $0.08 / 1M tokens    $0.60 / 1M tokens
+    gpt-4o-mini-audio-preview                $0.15 / 1M tokens    $0.08 / 1M tokens    $0.60 / 1M tokens
+    gpt-4o-mini-audio-preview-2024-12-17     $0.15 / 1M tokens    $0.08 / 1M tokens    $0.60 / 1M tokens
+    gpt-4o-mini-realtime-preview             $0.60 / 1M tokens    $0.30 / 1M tokens    $2.40 / 1M tokens
+    gpt-4o-mini-realtime-preview-2024-12-17  $0.60 / 1M tokens    $0.30 / 1M tokens    $2.40 / 1M tokens
+    o1                                       $15.00 / 1M tokens   $7.50 / 1M tokens    $60.00 / 1M tokens
+    o1-2024-12-17                            $15.00 / 1M tokens   $7.50 / 1M tokens    $60.00 / 1M tokens
+    o1-preview-2024-09-12                    $15.00 / 1M tokens   $7.50 / 1M tokens    $60.00 / 1M tokens
+    o3-mini                                  $1.10 / 1M tokens    $0.55 / 1M tokens    $4.40 / 1M tokens
+    o3-mini-2025-01-31                       $1.10 / 1M tokens    $0.55 / 1M tokens    $4.40 / 1M tokens
+    o1-mini                                  $1.10 / 1M tokens    $0.55 / 1M tokens    $4.40 / 1M tokens
+    o1-mini-2024-09-12                       $1.10 / 1M tokens    $0.55 / 1M tokens    $4.40 / 1M tokens
+    gpt-4-turbo                              $10.00 / 1M tokens                        $30.00 / 1M tokens
+    gpt-4-turbo-2024-04-09                   $10.00 / 1M tokens                        $30.00 / 1M tokens
+    gpt-3.5-turbo-0125                       $0.50 / 1M tokens                         $1.50 / 1M tokens
+    gpt-3.5-turbo-1106                       $1.00 / 1M tokens                         $2.00 / 1M tokens
+    gpt-4-1106-preview                       $10.00 / 1M tokens                        $30.00 / 1M tokens
+    gpt-4                                    $30.00 / 1M tokens                        $60.00 / 1M tokens
+    text-embedding-3-small                   $0.02 / 1M tokens
+    text-embedding-3-large                   $0.13 / 1M tokens
+    text-embedding-ada-0002                  $0.10 / 1M tokens
     """
     pricing = {
         "gpt-4o": {
             "prompt": 0.000_002_5,
+            "cached": 0.000_001_25,
             "completion": 0.000_01,
         },
         "gpt-4o-2024-11-20": {
             "prompt": 0.000_002_5,
+            "cached": 0.000_001_25,
             "completion": 0.000_01,
         },
         "gpt-4o-2024-08-06": {
             "prompt": 0.000_002_5,
+            "cached": 0.000_001_25,
             "completion": 0.000_01,
         },
         "gpt-4o-2024-05-13": {
             "prompt": 0.000_005,
+            "cached": 0.000_002_5,
             "completion": 0.000_015,
         },
         "gpt-4o-audio-preview": {
             "prompt": 0.000_002_5,
+            "cached": 0.000_001_25,
             "completion": 0.000_01,
         },
         "gpt-4o-audio-preview-2024-12-17": {
             "prompt": 0.000_002_5,
+            "cached": 0.000_001_25,
             "completion": 0.000_01,
         },
         "gpt-4o-audio-preview-2024-10-01": {
             "prompt": 0.000_002_5,
+            "cached": 0.000_001_25,
             "completion": 0.000_01,
         },
         "gpt-4o-realtime-preview": {
             "prompt": 0.000_005,
+            "cached": 0.000_002_5,
             "completion": 0.000_02,
         },
         "gpt-4o-realtime-preview-2024-12-17": {
             "prompt": 0.000_005,
+            "cached": 0.000_002_5,
             "completion": 0.000_02,
         },
         "gpt-4o-realtime-preview-2024-10-01": {
             "prompt": 0.000_005,
+            "cached": 0.000_002_5,
             "completion": 0.000_02,
         },
         "gpt-4o-mini": {
             "prompt": 0.000_000_15,
+            "cached": 0.000_000_08,
             "completion": 0.000_000_6,
         },
         "gpt-4o-mini-2024-07-18": {
             "prompt": 0.000_000_15,
+            "cached": 0.000_000_08,
             "completion": 0.000_000_6,
         },
         "gpt-4o-mini-audio-preview": {
             "prompt": 0.000_000_15,
+            "cached": 0.000_000_08,
             "completion": 0.000_000_6,
         },
         "gpt-4o-mini-audio-preview-2024-12-17": {
             "prompt": 0.000_000_15,
+            "cached": 0.000_000_08,
             "completion": 0.000_000_6,
         },
         "gpt-4o-mini-realtime-preview": {
             "prompt": 0.000_000_6,
+            "cached": 0.000_000_3,
             "completion": 0.000_002_4,
         },
         "gpt-4o-mini-realtime-preview-2024-12-17": {
             "prompt": 0.000_000_6,
+            "cached": 0.000_000_3,
             "completion": 0.000_002_4,
         },
         "o1": {
             "prompt": 0.000_015,
+            "cached": 0.000_007_5,
             "completion": 0.000_06,
         },
         "o1-2024-12-17": {
             "prompt": 0.000_015,
+            "cached": 0.000_007_5,
             "completion": 0.000_06,
         },
         "o1-preview-2024-09-12": {
             "prompt": 0.000_015,
+            "cached": 0.000_007_5,
             "completion": 0.000_06,
         },
         "o3-mini": {
             "prompt": 0.000_001_1,
+            "cached": 0.000_000_55,
             "completion": 0.000_004_4,
         },
         "o3-mini-2025-01-31": {
             "prompt": 0.000_001_1,
+            "cached": 0.000_000_55,
             "completion": 0.000_004_4,
         },
         "o1-mini": {
             "prompt": 0.000_001_1,
+            "cached": 0.000_000_55,
             "completion": 0.000_004_4,
         },
         "o1-mini-2024-09-12": {
             "prompt": 0.000_001_1,
+            "cached": 0.000_000_55,
             "completion": 0.000_004_4,
         },
         "gpt-4-turbo": {
             "prompt": 0.000_01,
+            "cached": 0,
             "completion": 0.000_03,
         },
         "gpt-4-turbo-2024-04-09": {
             "prompt": 0.000_01,
+            "cached": 0,
             "completion": 0.000_03,
         },
         "gpt-3.5-turbo-0125": {
             "prompt": 0.000_000_5,
+            "cached": 0,
             "completion": 0.000_001_5,
         },
         "gpt-3.5-turbo-1106": {
             "prompt": 0.000_001,
+            "cached": 0,
             "completion": 0.000_002,
         },
         "gpt-4-1106-preview": {
             "prompt": 0.000_01,
+            "cached": 0,
             "completion": 0.000_03,
         },
         "gpt-4": {
             "prompt": 0.000_003,
+            "cached": 0,
             "completion": 0.000_006,
         },
         "gpt-3.5-turbo-4k": {
             "prompt": 0.000_015,
+            "cached": 0,
             "completion": 0.000_02,
         },
         "gpt-3.5-turbo-16k": {
             "prompt": 0.000_003,
+            "cached": 0,
             "completion": 0.000_004,
         },
         "gpt-4-8k": {
             "prompt": 0.000_003,
+            "cached": 0,
             "completion": 0.000_006,
         },
         "gpt-4-32k": {
             "prompt": 0.000_006,
+            "cached": 0,
             "completion": 0.000_012,
         },
         "text-embedding-3-small": {
             "prompt": 0.000_000_02,
-            "completion": 0.000_000_02,
+            "cached": 0,
+            "completion": 0,
         },
         "text-embedding-ada-002": {
             "prompt": 0.000_000_1,
-            "completion": 0.000_000_1,
+            "cached": 0,
+            "completion": 0,
         },
         "text-embedding-3-large": {
             "prompt": 0.000_000_13,
-            "completion": 0.000_000_13,
+            "cached": 0,
+            "completion": 0,
         },
     }
     if input_tokens is None or output_tokens is None:
         return None
 
+    if cached_tokens is None:
+        cached_tokens = 0
+
     try:
         model_pricing = pricing[model]
     except KeyError:
         return None
 
     prompt_cost = input_tokens * model_pricing["prompt"]
+    cached_cost = cached_tokens * model_pricing["cached"]
     completion_cost = output_tokens * model_pricing["completion"]
-    total_cost = prompt_cost + completion_cost
+    total_cost = prompt_cost + cached_cost + completion_cost
 
     return total_cost
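
Note: with this change, `calculate_cost` prices cached prompt tokens separately at the model's cached rate (half the input rate for most chat models, 0 where no cached price is listed). A minimal sketch of the new arithmetic using the gpt-4o rates from the table above; the token counts are made up for illustration:

# Cost math mirroring the updated function, with gpt-4o per-token rates.
input_tokens, cached_tokens, output_tokens = 10_000, 4_000, 500

prompt_cost = input_tokens * 0.000_002_5      # $0.0250 ($2.50 / 1M)
cached_cost = cached_tokens * 0.000_001_25    # $0.0050 ($1.25 / 1M)
completion_cost = output_tokens * 0.000_01    # $0.0050 ($10.00 / 1M)
total_cost = prompt_cost + cached_cost + completion_cost
print(f"${total_cost:.4f}")  # $0.0350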
mirascope/core/openai/call_params.py CHANGED
@@ -18,6 +18,9 @@ if TYPE_CHECKING:
         ChatCompletionAudioParam,
         ChatCompletionModality,  # pyright: ignore [reportAttributeAccessIssue]
     )
+    from openai.types.chat.chat_completion_reasoning_effort import (  # pyright: ignore [reportMissingImports]
+        ChatCompletionReasoningEffort,  # pyright: ignore [reportAttributeAccessIssue]
+    )
 else:
     try:
         from openai.types.chat.chat_completion_audio_param import (  # pyright: ignore [reportMissingImports]
@@ -30,6 +33,14 @@ else:
 
         class ChatCompletionModality: ...
 
+    try:
+        from openai.types.chat.chat_completion_reasoning_effort import (  # pyright: ignore [reportMissingImports]
+            ChatCompletionReasoningEffort,
+        )
+    except ImportError:
+
+        class ChatCompletionReasoningEffort: ...
+
 
 class OpenAICallParams(BaseCallParams):
     """The parameters to use when calling the OpenAI API.
@@ -46,6 +57,7 @@ class OpenAICallParams(BaseCallParams):
     n: ...
     parallel_tool_calls: ...
     presence_penalty: ...
+    reasoning_effort: ...
     response_format: ...
     seed: ...
     stop: ...
@@ -67,6 +79,7 @@ class OpenAICallParams(BaseCallParams):
     n: NotRequired[int | None]
     parallel_tool_calls: NotRequired[bool]
     presence_penalty: NotRequired[float | None]
+    reasoning_effort: NotRequired[ChatCompletionReasoningEffort | None]
     response_format: NotRequired[ResponseFormat]
     seed: NotRequired[int | None]
     stop: NotRequired[str | list[str] | None]
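
The new `reasoning_effort` key is optional (`NotRequired`), so it is passed like any other OpenAI call parameter. A minimal sketch, assuming the standard `@openai.call` decorator; the model, prompt, and "high" value are illustrative:

from mirascope.core import openai

# reasoning_effort applies to reasoning models such as the o1/o3 family.
@openai.call("o3-mini", call_params={"reasoning_effort": "high"})
def solve(problem: str) -> str:
    return f"Solve step by step: {problem}"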
mirascope/core/openai/call_response.py CHANGED
@@ -118,6 +118,17 @@ class OpenAICallResponse(
         """Returns the number of input tokens."""
         return self.usage.prompt_tokens if self.usage else None
 
+    @computed_field
+    @property
+    def cached_tokens(self) -> int | None:
+        """Returns the number of cached tokens."""
+        return (
+            details.cached_tokens
+            if self.usage
+            and (details := getattr(self.usage, "prompt_tokens_details", None))
+            else None
+        )
+
     @computed_field
     @property
     def output_tokens(self) -> int | None:
@@ -128,7 +139,9 @@ class OpenAICallResponse(
     @property
     def cost(self) -> float | None:
         """Returns the cost of the call."""
-        return calculate_cost(self.input_tokens, self.output_tokens, self.model)
+        return calculate_cost(
+            self.input_tokens, self.cached_tokens, self.output_tokens, self.model
+        )
 
     @computed_field
     @cached_property
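
`cached_tokens` reads `usage.prompt_tokens_details.cached_tokens` when the API reports it, and `cost` now passes it through to `calculate_cost`. A minimal sketch of inspecting these fields on a response; the model and prompt are illustrative:

from mirascope.core import openai

@openai.call("gpt-4o-mini")
def recommend_book(genre: str) -> str:
    return f"Recommend a {genre} book"

response = recommend_book("fantasy")
# cached_tokens is None unless the provider reports prompt_tokens_details.
print(response.input_tokens, response.cached_tokens, response.output_tokens)
print(response.cost)  # now includes the cached-token component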
mirascope/core/openai/call_response_chunk.py CHANGED
@@ -79,6 +79,18 @@ class OpenAICallResponseChunk(BaseCallResponseChunk[ChatCompletionChunk, FinishReason]):
             return self.chunk.usage
         return None
 
+    @computed_field
+    @property
+    def cached_tokens(self) -> int | None:
+        """Returns the number of cached tokens."""
+        return (
+            details.cached_tokens
+            if hasattr(self.chunk, "usage")
+            and self.usage
+            and (details := getattr(self.usage, "prompt_tokens_details", None))
+            else None
+        )
+
     @property
     def input_tokens(self) -> int | None:
         """Returns the number of input tokens."""
mirascope/core/openai/stream.py CHANGED
@@ -87,9 +87,9 @@ class OpenAIStream(
     ) -> AsyncGenerator[tuple[OpenAICallResponseChunk, OpenAITool | None], None]:
         aiter = super().__aiter__()
 
-        async def generator() -> (
-            AsyncGenerator[tuple[OpenAICallResponseChunk, OpenAITool | None], None]
-        ):
+        async def generator() -> AsyncGenerator[
+            tuple[OpenAICallResponseChunk, OpenAITool | None], None
+        ]:
             async for chunk, tool in aiter:
                 if (
                     (choices := chunk.chunk.choices)
@@ -104,7 +104,9 @@ class OpenAIStream(
     @property
     def cost(self) -> float | None:
         """Returns the cost of the call."""
-        return calculate_cost(self.input_tokens, self.output_tokens, self.model)
+        return calculate_cost(
+            self.input_tokens, self.cached_tokens, self.output_tokens, self.model
+        )
 
     def _construct_message_param(
         self,
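
Streams get the same cost treatment, with `cached_tokens` taken from the final usage chunk once the stream is consumed. A minimal sketch, assuming the usual streaming decorator; the model and prompt are illustrative:

from mirascope.core import openai

@openai.call("gpt-4o-mini", stream=True)
def recommend_book(genre: str) -> str:
    return f"Recommend a {genre} book"

stream = recommend_book("fantasy")
for chunk, _ in stream:  # (chunk, tool) pairs
    print(chunk.content, end="", flush=True)
# cost is available only after the stream has been exhausted.
print(stream.cost)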
mirascope/core/vertex/__init__.py CHANGED
@@ -33,7 +33,6 @@ warnings.warn(
 )
 
 __all__ = [
-    "call",
     "VertexCallParams",
     "VertexCallResponse",
     "VertexCallResponseChunk",
@@ -41,5 +40,6 @@ __all__ = [
     "VertexMessageParam",
     "VertexStream",
     "VertexTool",
+    "call",
     "vertex_call",
 ]
mirascope/core/vertex/_utils/_calculate_cost.py CHANGED
@@ -3,6 +3,7 @@
 
 def calculate_cost(
     input_chars: int | float | None,
+    cached_chars: int | float | None,
     output_chars: int | float | None,
     model: str = "gemini-1.5-pro",
     context_length: int = 0,
mirascope/core/vertex/_utils/_convert_message_params.py CHANGED
@@ -106,7 +106,7 @@ def convert_message_params(
             elif part.type == "audio_url":
                 # Should download the audio to determine the media type
                 audio = _load_media(part.url)
-                audio_type = get_audio_type(audio)
+                audio_type = f"audio/{get_audio_type(audio)}"
                 if audio_type not in [
                     "audio/wav",
                     "audio/mp3",
mirascope/core/vertex/call_response.py CHANGED
@@ -112,6 +112,12 @@ class VertexCallResponse(
         """Returns the number of input tokens."""
         return self.usage.prompt_token_count
 
+    @computed_field
+    @property
+    def cached_tokens(self) -> int:
+        """Returns the number of cached tokens."""
+        return 0
+
     @computed_field
     @property
     def output_tokens(self) -> int:
@@ -122,7 +128,9 @@ class VertexCallResponse(
     @property
     def cost(self) -> float | None:
         """Returns the cost of the call."""
-        return calculate_cost(self.input_tokens, self.output_tokens, self.model)
+        return calculate_cost(
+            self.input_tokens, self.cached_tokens, self.output_tokens, self.model
+        )
 
     @computed_field
     @cached_property
mirascope/core/vertex/call_response_chunk.py CHANGED
@@ -76,6 +76,11 @@ class VertexCallResponseChunk(
         """Returns the number of input tokens."""
         return None
 
+    @property
+    def cached_tokens(self) -> None:
+        """Returns the number of cached tokens."""
+        return None
+
     @property
     def output_tokens(self) -> None:
         """Returns the number of output tokens."""
mirascope/core/vertex/stream.py CHANGED
@@ -64,7 +64,9 @@ class VertexStream(
     @property
     def cost(self) -> float | None:
         """Returns the cost of the call."""
-        return calculate_cost(self.input_tokens, self.output_tokens, self.model)
+        return calculate_cost(
+            self.input_tokens, self.cached_tokens, self.output_tokens, self.model
+        )
 
     def _construct_message_param(
         self,
mirascope/integrations/_middleware_factory.py CHANGED
@@ -175,9 +175,9 @@ def middleware_factory(
         def new_stream_aiter(
             self: Any,  # noqa: ANN401
         ) -> AsyncGenerator[tuple[Any, Any | None], Any]:  # noqa: ANN401
-            async def generator() -> (
-                AsyncGenerator[tuple[Any, Any | None], Any]
-            ):
+            async def generator() -> AsyncGenerator[
+                tuple[Any, Any | None], Any
+            ]:
                 try:
                     async for chunk, tool in original_aiter():
                         yield chunk, tool
@@ -226,9 +226,9 @@ def middleware_factory(
         def new_aiter(
             self: Any,  # noqa: ANN401
         ) -> AsyncGenerator[tuple[Any, Any | None], Any]:  # noqa: ANN401
-            async def generator() -> (
-                AsyncGenerator[tuple[Any, Any | None], Any]
-            ):
+            async def generator() -> AsyncGenerator[
+                tuple[Any, Any | None], Any
+            ]:
                 try:
                     async for chunk in original_aiter():
                         yield chunk
mirascope/integrations/logfire/_utils.py CHANGED
@@ -23,7 +23,7 @@ def custom_context_manager(
 ) -> Generator[logfire.LogfireSpan, Any, None]:
     metadata: Metadata = _utils.get_metadata(fn, None)
     tags = metadata.get("tags", [])
-    with logfire.with_settings(custom_scope_suffix="mirascope", tags=list(tags)).span(
+    with logfire.with_settings(custom_scope_suffix="mirascope", tags=list(tags)).span(  # pyright: ignore[reportGeneralTypeIssues]
         fn.__name__
     ) as logfire_span:
         yield logfire_span
mirascope/llm/__init__.py CHANGED
@@ -3,4 +3,4 @@ from .call_response import CallResponse
 from .llm_call import call
 from .llm_override import override
 
-__all__ = ["call", "override", "CallResponse", "Provider"]
+__all__ = ["CallResponse", "Provider", "call", "override"]
mirascope/llm/_protocols.py CHANGED
@@ -90,7 +90,7 @@ class _CallDecorator(
     ],
 ):
     @overload
-    def __call__(
+    def __call__(  # pyright: ignore[reportOverlappingOverload]
         self,
         provider: Provider,
         model: str,
@@ -110,7 +110,7 @@
     ]: ...
 
     @overload
-    def __call__(
+    def __call__(  # pyright: ignore[reportOverlappingOverload]
         self,
         provider: Provider,
         model: str,
@@ -140,7 +140,7 @@
     ) -> SyncLLMFunctionDecorator[_BaseDynamicConfigT, _BaseCallResponseT]: ...
 
     @overload
-    def __call__(
+    def __call__(  # pyright: ignore[reportOverlappingOverload]
         self,
         provider: Provider,
         model: str,
@@ -288,7 +288,7 @@
     ) -> NoReturn: ...
 
     @overload
-    def __call__(
+    def __call__(  # pyright: ignore[reportOverlappingOverload]
         self,
         provider: Provider,
         model: str,
@@ -382,7 +382,7 @@
     ) -> SyncLLMFunctionDecorator[_BaseDynamicConfigT, _ParsedOutputT]: ...
 
     @overload
-    def __call__(
+    def __call__(  # pyright: ignore[reportOverlappingOverload]
         self,
         provider: Provider,
         model: str,
mirascope/llm/call_response.py CHANGED
@@ -13,6 +13,7 @@ from mirascope.core.base import (
     BaseCallResponse,
     BaseMessageParam,
     BaseTool,
+    Usage,
     transform_tool_outputs,
 )
 from mirascope.core.base.message_param import ToolResultPart
@@ -22,14 +23,11 @@ from mirascope.llm.tool import Tool
 
 _ResponseT = TypeVar("_ResponseT")
 
-_ToolMessageParamT = TypeVar("_ToolMessageParamT")
-_BaseToolT = TypeVar("_BaseToolT", bound=BaseTool)
-
 
 class CallResponse(
     BaseCallResponse[
         _ResponseT,
-        _BaseToolT,
+        Tool,
         Any,
         BaseDynamicConfig[Any, Any, Any],
         BaseMessageParam,
@@ -44,11 +42,11 @@
     We rely on _response having `common_` methods or properties for normalization.
     """
 
-    _response: BaseCallResponse[_ResponseT, _BaseToolT, Any, Any, Any, Any, Any]
+    _response: BaseCallResponse[_ResponseT, Tool, Any, Any, Any, Any, Any]
 
     def __init__(
         self,
-        response: BaseCallResponse[_ResponseT, _BaseToolT, Any, Any, Any, Any, Any],
+        response: BaseCallResponse[_ResponseT, Tool, Any, Any, Any, Any, Any],
     ) -> None:
         super().__init__(
             **{
@@ -65,7 +63,13 @@
     def __getattribute__(self, name: str) -> Any:  # noqa: ANN401
         special_names = {
             "_response",
+            "finish_reasons",
+            "usage",
+            "message_param",
             "user_message_param",
+            "tools",
+            "tool",
+            "tool_message_params",
             "__dict__",
             "__class__",
             "model_fields",
@@ -97,6 +101,11 @@
     def finish_reasons(self) -> list[FinishReason] | None:  # pyright: ignore [reportIncompatibleMethodOverride]
         return self._response.common_finish_reasons
 
+    @property
+    def usage(self) -> Usage | None:
+        """Returns the usage of the chat completion."""
+        return self._response.common_usage
+
     @computed_field
     @cached_property
     def message_param(self) -> BaseMessageParam:
@@ -116,7 +125,7 @@
     @classmethod
     @transform_tool_outputs
     def tool_message_params(
-        cls, tools_and_outputs: list[tuple[BaseTool, str]]
+        cls, tools_and_outputs: list[tuple[Tool, str]]
     ) -> list[BaseMessageParam]:
         """Returns the tool message parameters for tool call results.
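
The expanded `special_names` set controls which attributes resolve on the provider-agnostic wrapper itself instead of being forwarded to the wrapped provider response. A simplified model of that delegation pattern follows; only the names in `special_names` and the `_response` attribute come from the diff, the rest is an illustrative reduction:

class DelegatingResponse:
    """Toy version of CallResponse's __getattribute__ delegation."""

    _SPECIAL = {
        "_response", "finish_reasons", "usage", "message_param",
        "user_message_param", "tools", "tool", "tool_message_params",
    }

    def __init__(self, response: object) -> None:
        object.__setattr__(self, "_response", response)

    def __getattribute__(self, name: str) -> object:
        # Special names (and dunders) resolve on the wrapper class itself.
        if name.startswith("__") or name in DelegatingResponse._SPECIAL:
            return object.__getattribute__(self, name)
        # Everything else is forwarded to the wrapped provider response.
        return getattr(object.__getattribute__(self, "_response"), name)

    @property
    def usage(self) -> object:
        # Mirrors the new property: normalize via the provider's common_usage.
        return getattr(object.__getattribute__(self, "_response"), "common_usage", None)

class FakeResponse:
    content = "hello"
    common_usage = {"input_tokens": 3, "output_tokens": 1}

r = DelegatingResponse(FakeResponse())
print(r.content)  # forwarded to the provider response: "hello"
print(r.usage)    # resolved on the wrapper via common_usage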