payi 0.1.0a107__py3-none-any.whl → 0.1.0a137__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- payi/__init__.py +3 -1
- payi/_base_client.py +12 -12
- payi/_client.py +8 -8
- payi/_compat.py +48 -48
- payi/_models.py +87 -59
- payi/_qs.py +7 -7
- payi/_streaming.py +4 -6
- payi/_types.py +53 -12
- payi/_utils/__init__.py +9 -2
- payi/_utils/_compat.py +45 -0
- payi/_utils/_datetime_parse.py +136 -0
- payi/_utils/_sync.py +3 -31
- payi/_utils/_transform.py +13 -3
- payi/_utils/_typing.py +6 -1
- payi/_utils/_utils.py +5 -6
- payi/_version.py +1 -1
- payi/lib/AnthropicInstrumentor.py +83 -57
- payi/lib/BedrockInstrumentor.py +292 -57
- payi/lib/GoogleGenAiInstrumentor.py +18 -31
- payi/lib/OpenAIInstrumentor.py +56 -72
- payi/lib/ProviderRequest.py +216 -0
- payi/lib/StreamWrappers.py +379 -0
- payi/lib/VertexInstrumentor.py +18 -37
- payi/lib/VertexRequest.py +16 -2
- payi/lib/data/cohere_embed_english_v3.json +30706 -0
- payi/lib/helpers.py +62 -5
- payi/lib/instrument.py +433 -659
- payi/resources/categories/__init__.py +0 -14
- payi/resources/categories/categories.py +25 -53
- payi/resources/categories/resources.py +27 -23
- payi/resources/ingest.py +126 -132
- payi/resources/limits/__init__.py +14 -14
- payi/resources/limits/limits.py +58 -58
- payi/resources/limits/properties.py +171 -0
- payi/resources/requests/request_id/properties.py +8 -8
- payi/resources/requests/request_id/result.py +3 -3
- payi/resources/requests/response_id/properties.py +8 -8
- payi/resources/requests/response_id/result.py +3 -3
- payi/resources/use_cases/definitions/definitions.py +27 -27
- payi/resources/use_cases/definitions/kpis.py +23 -23
- payi/resources/use_cases/definitions/limit_config.py +14 -14
- payi/resources/use_cases/definitions/version.py +3 -3
- payi/resources/use_cases/kpis.py +15 -15
- payi/resources/use_cases/properties.py +6 -6
- payi/resources/use_cases/use_cases.py +7 -7
- payi/types/__init__.py +2 -0
- payi/types/bulk_ingest_response.py +3 -20
- payi/types/categories/__init__.py +0 -1
- payi/types/categories/resource_list_params.py +5 -1
- payi/types/category_list_resources_params.py +5 -1
- payi/types/category_resource_response.py +31 -1
- payi/types/ingest_event_param.py +7 -6
- payi/types/ingest_units_params.py +5 -4
- payi/types/limit_create_params.py +3 -3
- payi/types/limit_list_response.py +1 -3
- payi/types/limit_response.py +1 -3
- payi/types/limits/__init__.py +2 -9
- payi/types/limits/{tag_remove_params.py → property_update_params.py} +4 -5
- payi/types/limits/{tag_delete_response.py → property_update_response.py} +3 -3
- payi/types/requests/request_id/property_update_params.py +2 -2
- payi/types/requests/response_id/property_update_params.py +2 -2
- payi/types/shared/__init__.py +2 -0
- payi/types/shared/api_error.py +18 -0
- payi/types/shared/pay_i_common_models_budget_management_create_limit_base.py +3 -3
- payi/types/shared/properties_request.py +11 -0
- payi/types/shared/xproxy_result.py +2 -0
- payi/types/shared_params/pay_i_common_models_budget_management_create_limit_base.py +3 -3
- payi/types/use_cases/definitions/limit_config_create_params.py +3 -3
- payi/types/use_cases/property_update_params.py +2 -2
- {payi-0.1.0a107.dist-info → payi-0.1.0a137.dist-info}/METADATA +6 -6
- {payi-0.1.0a107.dist-info → payi-0.1.0a137.dist-info}/RECORD +73 -75
- payi/resources/categories/fixed_cost_resources.py +0 -196
- payi/resources/limits/tags.py +0 -507
- payi/types/categories/fixed_cost_resource_create_params.py +0 -21
- payi/types/limits/limit_tags.py +0 -16
- payi/types/limits/tag_create_params.py +0 -13
- payi/types/limits/tag_create_response.py +0 -10
- payi/types/limits/tag_list_response.py +0 -10
- payi/types/limits/tag_remove_response.py +0 -10
- payi/types/limits/tag_update_params.py +0 -13
- payi/types/limits/tag_update_response.py +0 -10
- {payi-0.1.0a107.dist-info → payi-0.1.0a137.dist-info}/WHEEL +0 -0
- {payi-0.1.0a107.dist-info → payi-0.1.0a137.dist-info}/licenses/LICENSE +0 -0
payi/_utils/_datetime_parse.py
ADDED
@@ -0,0 +1,136 @@
+"""
+This file contains code from https://github.com/pydantic/pydantic/blob/main/pydantic/v1/datetime_parse.py
+without the Pydantic v1 specific errors.
+"""
+
+from __future__ import annotations
+
+import re
+from typing import Dict, Union, Optional
+from datetime import date, datetime, timezone, timedelta
+
+from .._types import StrBytesIntFloat
+
+date_expr = r"(?P<year>\d{4})-(?P<month>\d{1,2})-(?P<day>\d{1,2})"
+time_expr = (
+    r"(?P<hour>\d{1,2}):(?P<minute>\d{1,2})"
+    r"(?::(?P<second>\d{1,2})(?:\.(?P<microsecond>\d{1,6})\d{0,6})?)?"
+    r"(?P<tzinfo>Z|[+-]\d{2}(?::?\d{2})?)?$"
+)
+
+date_re = re.compile(f"{date_expr}$")
+datetime_re = re.compile(f"{date_expr}[T ]{time_expr}")
+
+
+EPOCH = datetime(1970, 1, 1)
+# if greater than this, the number is in ms, if less than or equal it's in seconds
+# (in seconds this is 11th October 2603, in ms it's 20th August 1970)
+MS_WATERSHED = int(2e10)
+# slightly more than datetime.max in ns - (datetime.max - EPOCH).total_seconds() * 1e9
+MAX_NUMBER = int(3e20)
+
+
+def _get_numeric(value: StrBytesIntFloat, native_expected_type: str) -> Union[None, int, float]:
+    if isinstance(value, (int, float)):
+        return value
+    try:
+        return float(value)
+    except ValueError:
+        return None
+    except TypeError:
+        raise TypeError(f"invalid type; expected {native_expected_type}, string, bytes, int or float") from None
+
+
+def _from_unix_seconds(seconds: Union[int, float]) -> datetime:
+    if seconds > MAX_NUMBER:
+        return datetime.max
+    elif seconds < -MAX_NUMBER:
+        return datetime.min
+
+    while abs(seconds) > MS_WATERSHED:
+        seconds /= 1000
+    dt = EPOCH + timedelta(seconds=seconds)
+    return dt.replace(tzinfo=timezone.utc)
+
+
+def _parse_timezone(value: Optional[str]) -> Union[None, int, timezone]:
+    if value == "Z":
+        return timezone.utc
+    elif value is not None:
+        offset_mins = int(value[-2:]) if len(value) > 3 else 0
+        offset = 60 * int(value[1:3]) + offset_mins
+        if value[0] == "-":
+            offset = -offset
+        return timezone(timedelta(minutes=offset))
+    else:
+        return None
+
+
+def parse_datetime(value: Union[datetime, StrBytesIntFloat]) -> datetime:
+    """
+    Parse a datetime/int/float/string and return a datetime.datetime.
+
+    This function supports time zone offsets. When the input contains one,
+    the output uses a timezone with a fixed offset from UTC.
+
+    Raise ValueError if the input is well formatted but not a valid datetime.
+    Raise ValueError if the input isn't well formatted.
+    """
+    if isinstance(value, datetime):
+        return value
+
+    number = _get_numeric(value, "datetime")
+    if number is not None:
+        return _from_unix_seconds(number)
+
+    if isinstance(value, bytes):
+        value = value.decode()
+
+    assert not isinstance(value, (float, int))
+
+    match = datetime_re.match(value)
+    if match is None:
+        raise ValueError("invalid datetime format")
+
+    kw = match.groupdict()
+    if kw["microsecond"]:
+        kw["microsecond"] = kw["microsecond"].ljust(6, "0")
+
+    tzinfo = _parse_timezone(kw.pop("tzinfo"))
+    kw_: Dict[str, Union[None, int, timezone]] = {k: int(v) for k, v in kw.items() if v is not None}
+    kw_["tzinfo"] = tzinfo
+
+    return datetime(**kw_)  # type: ignore
+
+
+def parse_date(value: Union[date, StrBytesIntFloat]) -> date:
+    """
+    Parse a date/int/float/string and return a datetime.date.
+
+    Raise ValueError if the input is well formatted but not a valid date.
+    Raise ValueError if the input isn't well formatted.
+    """
+    if isinstance(value, date):
+        if isinstance(value, datetime):
+            return value.date()
+        else:
+            return value
+
+    number = _get_numeric(value, "date")
+    if number is not None:
+        return _from_unix_seconds(number).date()
+
+    if isinstance(value, bytes):
+        value = value.decode()
+
+    assert not isinstance(value, (float, int))
+    match = date_re.match(value)
+    if match is None:
+        raise ValueError("invalid date format")
+
+    kw = {k: int(v) for k, v in match.groupdict().items()}
+
+    try:
+        return date(**kw)
+    except ValueError:
+        raise ValueError("invalid date format") from None
payi/_utils/_sync.py
CHANGED
@@ -1,10 +1,8 @@
 from __future__ import annotations
 
-import sys
 import asyncio
 import functools
-import contextvars
-from typing import Any, TypeVar, Callable, Awaitable
+from typing import TypeVar, Callable, Awaitable
 from typing_extensions import ParamSpec
 
 import anyio
@@ -15,34 +13,11 @@ T_Retval = TypeVar("T_Retval")
 T_ParamSpec = ParamSpec("T_ParamSpec")
 
 
-if sys.version_info >= (3, 9):
-    _asyncio_to_thread = asyncio.to_thread
-else:
-    # backport of https://docs.python.org/3/library/asyncio-task.html#asyncio.to_thread
-    # for Python 3.8 support
-    async def _asyncio_to_thread(
-        func: Callable[T_ParamSpec, T_Retval], /, *args: T_ParamSpec.args, **kwargs: T_ParamSpec.kwargs
-    ) -> Any:
-        """Asynchronously run function *func* in a separate thread.
-
-        Any *args and **kwargs supplied for this function are directly passed
-        to *func*. Also, the current :class:`contextvars.Context` is propagated,
-        allowing context variables from the main thread to be accessed in the
-        separate thread.
-
-        Returns a coroutine that can be awaited to get the eventual result of *func*.
-        """
-        loop = asyncio.events.get_running_loop()
-        ctx = contextvars.copy_context()
-        func_call = functools.partial(ctx.run, func, *args, **kwargs)
-        return await loop.run_in_executor(None, func_call)
-
-
 async def to_thread(
     func: Callable[T_ParamSpec, T_Retval], /, *args: T_ParamSpec.args, **kwargs: T_ParamSpec.kwargs
 ) -> T_Retval:
     if sniffio.current_async_library() == "asyncio":
-        return await _asyncio_to_thread(func, *args, **kwargs)
+        return await asyncio.to_thread(func, *args, **kwargs)
 
     return await anyio.to_thread.run_sync(
         functools.partial(func, *args, **kwargs),
@@ -53,10 +28,7 @@ async def to_thread(
 def asyncify(function: Callable[T_ParamSpec, T_Retval]) -> Callable[T_ParamSpec, Awaitable[T_Retval]]:
     """
     Take a blocking function and create an async one that receives the same
-    positional and keyword arguments. For python version 3.9 and above, it uses
-    asyncio.to_thread to run the function in a separate thread. For python version
-    3.8, it uses locally defined copy of the asyncio.to_thread function which was
-    introduced in python 3.9.
+    positional and keyword arguments.
 
     Usage:
 
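With the Python 3.8 backport removed, to_thread defers straight to asyncio.to_thread under asyncio and to anyio elsewhere. A minimal usage sketch for asyncify (assuming it is re-exported from payi._utils; the function itself lives in this module):

import asyncio
import time

from payi._utils import asyncify  # assumed re-export, for illustration only

def blocking_lookup(key: str) -> str:
    time.sleep(0.1)  # stand-in for blocking I/O
    return key.upper()

async def main() -> None:
    # the wrapped call runs in a worker thread, keeping the event loop free
    result = await asyncify(blocking_lookup)("payi")
    print(result)  # PAYI

asyncio.run(main())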
payi/_utils/_transform.py
CHANGED
@@ -16,18 +16,20 @@ from ._utils import (
     lru_cache,
     is_mapping,
     is_iterable,
+    is_sequence,
 )
 from .._files import is_base64_file_input
+from ._compat import get_origin, is_typeddict
 from ._typing import (
     is_list_type,
     is_union_type,
     extract_type_arg,
     is_iterable_type,
     is_required_type,
+    is_sequence_type,
     is_annotated_type,
     strip_annotated_type,
 )
-from .._compat import get_origin, model_dump, is_typeddict
 
 _T = TypeVar("_T")
 
@@ -167,6 +169,8 @@ def _transform_recursive(
 
     Defaults to the same value as the `annotation` argument.
     """
+    from .._compat import model_dump
+
     if inner_type is None:
         inner_type = annotation
 
@@ -184,6 +188,8 @@ def _transform_recursive(
         (is_list_type(stripped_type) and is_list(data))
         # Iterable[T]
         or (is_iterable_type(stripped_type) and is_iterable(data) and not isinstance(data, str))
+        # Sequence[T]
+        or (is_sequence_type(stripped_type) and is_sequence(data) and not isinstance(data, str))
     ):
         # dicts are technically iterable, but it is an iterable on the keys of the dict and is not usually
         # intended as an iterable, so we don't transform it.
@@ -262,7 +268,7 @@ def _transform_typeddict(
     annotations = get_type_hints(expected_type, include_extras=True)
     for key, value in data.items():
         if not is_given(value):
-            # we don't need to include `NotGiven` values here as they'll
+            # we don't need to include omitted values here as they'll
            # be stripped out before the request is sent anyway
            continue
 
@@ -329,6 +335,8 @@ async def _async_transform_recursive(
 
     Defaults to the same value as the `annotation` argument.
     """
+    from .._compat import model_dump
+
     if inner_type is None:
         inner_type = annotation
 
@@ -346,6 +354,8 @@ async def _async_transform_recursive(
         (is_list_type(stripped_type) and is_list(data))
         # Iterable[T]
         or (is_iterable_type(stripped_type) and is_iterable(data) and not isinstance(data, str))
+        # Sequence[T]
+        or (is_sequence_type(stripped_type) and is_sequence(data) and not isinstance(data, str))
     ):
         # dicts are technically iterable, but it is an iterable on the keys of the dict and is not usually
         # intended as an iterable, so we don't transform it.
@@ -424,7 +434,7 @@ async def _async_transform_typeddict(
     annotations = get_type_hints(expected_type, include_extras=True)
     for key, value in data.items():
         if not is_given(value):
-            # we don't need to include `NotGiven` values here as they'll
+            # we don't need to include omitted values here as they'll
            # be stripped out before the request is sent anyway
            continue
 
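Both the new Sequence[T] branch and the existing Iterable[T] branch exclude str for the same reason: strings satisfy the abstract Sequence and Iterable interfaces and would otherwise be transformed character by character. A self-contained check:

import collections.abc

print(isinstance("abc", collections.abc.Sequence))                  # True - str is a Sequence
print(isinstance([1, 2, 3], collections.abc.Sequence))              # True
print(isinstance((i for i in range(3)), collections.abc.Sequence))  # False - generators are only Iterable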
payi/_utils/_typing.py
CHANGED
@@ -15,7 +15,7 @@ from typing_extensions import (
 
 from ._utils import lru_cache
 from .._types import InheritsGeneric
-from .._compat import is_union as _is_union
+from ._compat import is_union as _is_union
 
 
 def is_annotated_type(typ: type) -> bool:
@@ -26,6 +26,11 @@ def is_list_type(typ: type) -> bool:
     return (get_origin(typ) or typ) == list
 
 
+def is_sequence_type(typ: type) -> bool:
+    origin = get_origin(typ) or typ
+    return origin == typing_extensions.Sequence or origin == typing.Sequence or origin == _c_abc.Sequence
+
+
 def is_iterable_type(typ: type) -> bool:
     """If the given type is `typing.Iterable[T]`"""
     origin = get_origin(typ) or typ
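The helper recognizes all three spellings of Sequence; get_origin normalizes a parameterized typing.Sequence[T] to collections.abc.Sequence on current Pythons. A standalone recreation (the real helper is private to payi._utils._typing):

import typing
import collections.abc as _c_abc
from typing import get_origin

import typing_extensions

def is_sequence_type(typ: type) -> bool:
    origin = get_origin(typ) or typ
    return origin == typing_extensions.Sequence or origin == typing.Sequence or origin == _c_abc.Sequence

print(is_sequence_type(typing.Sequence[int]))  # True - origin normalizes to collections.abc.Sequence
print(is_sequence_type(_c_abc.Sequence))       # True - bare abstract class
print(is_sequence_type(list))                  # False - handled by is_list_type instead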
payi/_utils/_utils.py
CHANGED
@@ -21,8 +21,7 @@ from typing_extensions import TypeGuard
 
 import sniffio
 
-from .._types import NotGiven, FileTypes, NotGivenOr, HeadersLike
-from .._compat import parse_date as parse_date, parse_datetime as parse_datetime
+from .._types import Omit, NotGiven, FileTypes, HeadersLike
 
 _T = TypeVar("_T")
 _TupleT = TypeVar("_TupleT", bound=Tuple[object, ...])
@@ -64,7 +63,7 @@ def _extract_items(
     try:
         key = path[index]
     except IndexError:
-        if isinstance(obj, NotGiven):
+        if not is_given(obj):
            # no value was provided - we can safely ignore
            return []
 
@@ -127,14 +126,14 @@ def _extract_items(
     return []
 
 
-def is_given(obj: NotGivenOr[_T]) -> TypeGuard[_T]:
-    return not isinstance(obj, NotGiven)
+def is_given(obj: _T | NotGiven | Omit) -> TypeGuard[_T]:
+    return not isinstance(obj, NotGiven) and not isinstance(obj, Omit)
 
 
 # Type safe methods for narrowing types with TypeVars.
 # The default narrowing for isinstance(obj, dict) is dict[unknown, unknown],
 # however this cause Pyright to rightfully report errors. As we know we don't
-# care about the contained types we can safely use `object` in it's place.
+# care about the contained types we can safely use `object` in its place.
 #
 # There are two separate functions defined, `is_*` and `is_*_t` for different use cases.
 # `is_*` is for when you're dealing with an unknown input
payi/_version.py
CHANGED

payi/lib/AnthropicInstrumentor.py
CHANGED
@@ -1,3 +1,5 @@
+from __future__ import annotations
+
 import json
 from typing import Any, Union, Optional, Sequence
 from typing_extensions import override
@@ -8,8 +10,9 @@ from wrapt import wrap_function_wrapper # type: ignore
 from payi.lib.helpers import PayiCategories
 from payi.types.ingest_units_params import Units
 
-from .instrument import
+from .instrument import _IsStreaming, _PayiInstrumentor
 from .version_helper import get_version_helper
+from .ProviderRequest import _ChunkResult, _StreamingType, _ProviderRequest
 
 
 class AnthropicInstrumentor:
@@ -30,37 +33,26 @@
 
     @staticmethod
     def instrument(instrumentor: _PayiInstrumentor) -> None:
-
-
-
-
-
-
-
-            )
-
-
-
-
-
-
-
-
-
-
-
-
-            wrap_function_wrapper(
-                "anthropic.resources.messages",
-                "AsyncMessages.stream",
-                astream_messages_wrapper(instrumentor),
-            )
-
-        except Exception as e:
-            instrumentor._logger.debug(f"Error instrumenting anthropic: {e}")
-            return
-
+        AnthropicInstrumentor._module_version = get_version_helper(AnthropicInstrumentor._module_name)
+
+        wrappers = [
+            ("anthropic._base_client", "AsyncAPIClient._process_response", _ProviderRequest.aprocess_response_wrapper),
+            ("anthropic._base_client", "SyncAPIClient._process_response", _ProviderRequest.process_response_wrapper),
+            ("anthropic.resources.messages", "Messages.create", messages_wrapper(instrumentor)),
+            ("anthropic.resources.messages", "Messages.stream", stream_messages_wrapper(instrumentor)),
+            ("anthropic.resources.beta.messages", "Messages.create", messages_wrapper(instrumentor)),
+            ("anthropic.resources.beta.messages", "Messages.stream", stream_messages_wrapper(instrumentor)),
+            ("anthropic.resources.messages", "AsyncMessages.create", amessages_wrapper(instrumentor)),
+            ("anthropic.resources.messages", "AsyncMessages.stream", astream_messages_wrapper(instrumentor)),
+            ("anthropic.resources.beta.messages", "AsyncMessages.create", amessages_wrapper(instrumentor)),
+            ("anthropic.resources.beta.messages", "AsyncMessages.stream", astream_messages_wrapper(instrumentor)),
+        ]
+
+        for module, method, wrapper in wrappers:
+            try:
+                wrap_function_wrapper(module, method, wrapper)
+            except Exception as e:
+                instrumentor._logger.debug(f"Error wrapping {module}.{method}: {e}")
 
 @_PayiInstrumentor.payi_wrapper
 def messages_wrapper(
@@ -171,15 +163,26 @@ class _AnthropicProviderRequest(_ProviderRequest):
 
         return None
 
+    def _update_resource_name(self, model: str) -> str:
+        return ("anthropic." if self._is_vertex else "") + model
+
     @override
-    def process_request(self, instance: Any, extra_headers: 'dict[str, str]',
-        self._ingest["resource"] =
+    def process_request(self, instance: Any, extra_headers: 'dict[str, str]', args: Sequence[Any], kwargs: Any) -> bool:
+        self._ingest["resource"] = self._update_resource_name(kwargs.get("model", ""))
+
+        if self._price_as.resource_scope:
+            self._ingest["resource_scope"] = self._price_as.resource_scope
+
+        # override defaults
+        if self._price_as.category:
+            self._ingest["category"] = self._price_as.category
+        if self._price_as.resource:
+            self._ingest["resource"] = self._update_resource_name(self._price_as.resource)
 
         self._instrumentor._logger.debug(f"Processing anthropic request: model {self._ingest['resource']}, category {self._category}")
 
         messages = kwargs.get("messages")
         if messages:
-
             anthropic_has_image_and_get_texts(self, messages)
 
         return True
@@ -220,23 +223,52 @@ class _AnthropicProviderRequest(_ProviderRequest):
 
         return True
 
-def
-
-    input = usage['input_tokens']
-    output = usage['output_tokens']
+def anthropic_process_compute_input_cost(request: _ProviderRequest, usage: 'dict[str, Any]') -> int:
+    input = usage.get('input_tokens', 0)
     units: dict[str, Units] = request._ingest["units"]
 
     cache_creation_input_tokens = usage.get("cache_creation_input_tokens", 0)
-
-
+    cache_read_input_tokens = usage.get("cache_read_input_tokens", 0)
+
+    total_input_tokens = input + cache_creation_input_tokens + cache_read_input_tokens
+
+    request._is_large_context = total_input_tokens >= 200000
+    large_context = "_large_context" if request._is_large_context else ""
+
+    cache_creation: dict[str, int] = usage.get("cache_creation", {})
+    ephemeral_5m_input_tokens: Optional[int] = None
+    ephemeral_1h_input_tokens: Optional[int] = None
+    textCacheWriteAdded = False
+
+    if cache_creation:
+        ephemeral_5m_input_tokens = cache_creation.get("ephemeral_5m_input_tokens", 0)
+        if ephemeral_5m_input_tokens > 0:
+            textCacheWriteAdded = True
+            units["text_cache_write"+large_context] = Units(input=ephemeral_5m_input_tokens, output=0)
+
+        ephemeral_1h_input_tokens = cache_creation.get("ephemeral_1h_input_tokens", 0)
+        if ephemeral_1h_input_tokens > 0:
+            textCacheWriteAdded = True
+            units["text_cache_write_1h"+large_context] = Units(input=ephemeral_1h_input_tokens, output=0)
+
+    if textCacheWriteAdded is False and cache_creation_input_tokens > 0:
+        units["text_cache_write"+large_context] = Units(input=cache_creation_input_tokens, output=0)
 
     cache_read_input_tokens = usage.get("cache_read_input_tokens", 0)
     if cache_read_input_tokens > 0:
-        units["text_cache_read"] = Units(input=cache_read_input_tokens, output=0)
+        units["text_cache_read"+large_context] = Units(input=cache_read_input_tokens, output=0)
+
+    return request.update_for_vision(input)
 
-
+def anthropic_process_synchronous_response(request: _ProviderRequest, response: 'dict[str, Any]', log_prompt_and_response: bool, assign_id: bool) -> Any:
+    usage = response.get('usage', {})
+    units: dict[str, Units] = request._ingest["units"]
 
-
+    input_tokens = anthropic_process_compute_input_cost(request, usage)
+    output = usage.get('output_tokens', 0)
+
+    large_context = "_large_context" if request._is_large_context else ""
+    units["text"+large_context] = Units(input=input_tokens, output=output)
 
     content = response.get('content', [])
     if content:
@@ -274,34 +306,28 @@ def anthropic_process_chunk(request: _ProviderRequest, chunk: 'dict[str, Any]',
     if model and 'resource' in request._ingest:
         request._instrumentor._logger.debug(f"Anthropic streaming, reported model: {model}, instrumented model {request._ingest['resource']}")
 
-        usage = message
+        usage = message.get('usage', {})
         units = request._ingest["units"]
 
-        input =
-
-        units["text"] = Units(input=input, output=0)
-
-        text_cache_write: int = usage.get("cache_creation_input_tokens", 0)
-        if text_cache_write > 0:
-            units["text_cache_write"] = Units(input=text_cache_write, output=0)
+        input = anthropic_process_compute_input_cost(request, usage)
 
-        text_cache_read: int = usage.get("cache_read_input_tokens", 0)
-        if text_cache_read > 0:
-            units["text_cache_read"] = Units(input=text_cache_read, output=0)
+        large_context = "_large_context" if request._is_large_context else ""
+        units["text"+large_context] = Units(input=input, output=0)
 
         request._instrumentor._logger.debug(f"Anthropic streaming captured {input} input tokens, ")
 
     elif type == "message_delta":
         usage = chunk.get('usage', {})
         ingest = True
+        large_context = "_large_context" if request._is_large_context else ""
 
         # Web search will return an updated input tokens value at the end of streaming
        input_tokens = usage.get('input_tokens', None)
        if input_tokens is not None:
            request._instrumentor._logger.debug(f"Anthropic streaming finished, updated input tokens: {input_tokens}")
-            request._ingest["units"]["text"]["input"] = input_tokens
+            request._ingest["units"]["text"+large_context]["input"] = input_tokens
 
-        request._ingest["units"]["text"]["output"] = usage.get('output_tokens', 0)
+        request._ingest["units"]["text"+large_context]["output"] = usage.get('output_tokens', 0)
 
         request._instrumentor._logger.debug(f"Anthropic streaming finished: output tokens {usage.get('output_tokens', 0)} ")
 
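The diff's cache accounting can be summarized: 5-minute and 1-hour ephemeral cache writes land in separate unit buckets, the flat cache_creation_input_tokens field is used only when no per-TTL breakdown is present, and once total input (prompt + cache writes + cache reads) reaches 200,000 tokens every bucket name gains a "_large_context" suffix. A worked sketch with plain dicts standing in for Units:

usage = {
    "input_tokens": 150_000,
    "cache_creation_input_tokens": 40_000,
    "cache_read_input_tokens": 30_000,
    "cache_creation": {"ephemeral_5m_input_tokens": 25_000, "ephemeral_1h_input_tokens": 15_000},
}

total = usage["input_tokens"] + usage["cache_creation_input_tokens"] + usage["cache_read_input_tokens"]
suffix = "_large_context" if total >= 200_000 else ""  # 220,000 >= 200,000 here

units = {}
cc = usage.get("cache_creation", {})
wrote_cache = False
if cc.get("ephemeral_5m_input_tokens", 0) > 0:
    wrote_cache = True
    units["text_cache_write" + suffix] = {"input": cc["ephemeral_5m_input_tokens"], "output": 0}
if cc.get("ephemeral_1h_input_tokens", 0) > 0:
    wrote_cache = True
    units["text_cache_write_1h" + suffix] = {"input": cc["ephemeral_1h_input_tokens"], "output": 0}
if not wrote_cache and usage["cache_creation_input_tokens"] > 0:
    units["text_cache_write" + suffix] = {"input": usage["cache_creation_input_tokens"], "output": 0}
if usage["cache_read_input_tokens"] > 0:
    units["text_cache_read" + suffix] = {"input": usage["cache_read_input_tokens"], "output": 0}

print(sorted(units))
# ['text_cache_read_large_context', 'text_cache_write_1h_large_context', 'text_cache_write_large_context']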