payi 0.1.0a107__py3-none-any.whl → 0.1.0a137__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- payi/__init__.py +3 -1
- payi/_base_client.py +12 -12
- payi/_client.py +8 -8
- payi/_compat.py +48 -48
- payi/_models.py +87 -59
- payi/_qs.py +7 -7
- payi/_streaming.py +4 -6
- payi/_types.py +53 -12
- payi/_utils/__init__.py +9 -2
- payi/_utils/_compat.py +45 -0
- payi/_utils/_datetime_parse.py +136 -0
- payi/_utils/_sync.py +3 -31
- payi/_utils/_transform.py +13 -3
- payi/_utils/_typing.py +6 -1
- payi/_utils/_utils.py +5 -6
- payi/_version.py +1 -1
- payi/lib/AnthropicInstrumentor.py +83 -57
- payi/lib/BedrockInstrumentor.py +292 -57
- payi/lib/GoogleGenAiInstrumentor.py +18 -31
- payi/lib/OpenAIInstrumentor.py +56 -72
- payi/lib/ProviderRequest.py +216 -0
- payi/lib/StreamWrappers.py +379 -0
- payi/lib/VertexInstrumentor.py +18 -37
- payi/lib/VertexRequest.py +16 -2
- payi/lib/data/cohere_embed_english_v3.json +30706 -0
- payi/lib/helpers.py +62 -5
- payi/lib/instrument.py +433 -659
- payi/resources/categories/__init__.py +0 -14
- payi/resources/categories/categories.py +25 -53
- payi/resources/categories/resources.py +27 -23
- payi/resources/ingest.py +126 -132
- payi/resources/limits/__init__.py +14 -14
- payi/resources/limits/limits.py +58 -58
- payi/resources/limits/properties.py +171 -0
- payi/resources/requests/request_id/properties.py +8 -8
- payi/resources/requests/request_id/result.py +3 -3
- payi/resources/requests/response_id/properties.py +8 -8
- payi/resources/requests/response_id/result.py +3 -3
- payi/resources/use_cases/definitions/definitions.py +27 -27
- payi/resources/use_cases/definitions/kpis.py +23 -23
- payi/resources/use_cases/definitions/limit_config.py +14 -14
- payi/resources/use_cases/definitions/version.py +3 -3
- payi/resources/use_cases/kpis.py +15 -15
- payi/resources/use_cases/properties.py +6 -6
- payi/resources/use_cases/use_cases.py +7 -7
- payi/types/__init__.py +2 -0
- payi/types/bulk_ingest_response.py +3 -20
- payi/types/categories/__init__.py +0 -1
- payi/types/categories/resource_list_params.py +5 -1
- payi/types/category_list_resources_params.py +5 -1
- payi/types/category_resource_response.py +31 -1
- payi/types/ingest_event_param.py +7 -6
- payi/types/ingest_units_params.py +5 -4
- payi/types/limit_create_params.py +3 -3
- payi/types/limit_list_response.py +1 -3
- payi/types/limit_response.py +1 -3
- payi/types/limits/__init__.py +2 -9
- payi/types/limits/{tag_remove_params.py → property_update_params.py} +4 -5
- payi/types/limits/{tag_delete_response.py → property_update_response.py} +3 -3
- payi/types/requests/request_id/property_update_params.py +2 -2
- payi/types/requests/response_id/property_update_params.py +2 -2
- payi/types/shared/__init__.py +2 -0
- payi/types/shared/api_error.py +18 -0
- payi/types/shared/pay_i_common_models_budget_management_create_limit_base.py +3 -3
- payi/types/shared/properties_request.py +11 -0
- payi/types/shared/xproxy_result.py +2 -0
- payi/types/shared_params/pay_i_common_models_budget_management_create_limit_base.py +3 -3
- payi/types/use_cases/definitions/limit_config_create_params.py +3 -3
- payi/types/use_cases/property_update_params.py +2 -2
- {payi-0.1.0a107.dist-info → payi-0.1.0a137.dist-info}/METADATA +6 -6
- {payi-0.1.0a107.dist-info → payi-0.1.0a137.dist-info}/RECORD +73 -75
- payi/resources/categories/fixed_cost_resources.py +0 -196
- payi/resources/limits/tags.py +0 -507
- payi/types/categories/fixed_cost_resource_create_params.py +0 -21
- payi/types/limits/limit_tags.py +0 -16
- payi/types/limits/tag_create_params.py +0 -13
- payi/types/limits/tag_create_response.py +0 -10
- payi/types/limits/tag_list_response.py +0 -10
- payi/types/limits/tag_remove_response.py +0 -10
- payi/types/limits/tag_update_params.py +0 -13
- payi/types/limits/tag_update_response.py +0 -10
- {payi-0.1.0a107.dist-info → payi-0.1.0a137.dist-info}/WHEEL +0 -0
- {payi-0.1.0a107.dist-info → payi-0.1.0a137.dist-info}/licenses/LICENSE +0 -0
payi/lib/StreamWrappers.py
ADDED

@@ -0,0 +1,379 @@
+from __future__ import annotations
+
+from typing import TYPE_CHECKING, Any, Union, Optional
+
+from wrapt import ObjectProxy  # type: ignore
+
+from payi.lib.helpers import _compact_json
+from payi.lib.Stopwatch import Stopwatch
+from payi.types.shared.xproxy_error import XproxyError
+from payi.types.shared.xproxy_result import XproxyResult
+
+from .ProviderRequest import _ChunkResult, _ProviderRequest
+
+if TYPE_CHECKING:
+    from .instrument import _PayiInstrumentor
+
+__all__ = [
+    "_StreamIteratorWrapper",
+    "_StreamManagerWrapper",
+    "_GeneratorWrapper",
+]
+
+class _StreamIteratorWrapper(ObjectProxy):  # type: ignore
+    def __init__(
+        self,
+        response: Any,
+        instance: Any,
+        instrumentor: '_PayiInstrumentor',
+        stopwatch: Stopwatch,
+        request: _ProviderRequest,
+    ) -> None:
+
+        instrumentor._logger.debug(f"StreamIteratorWrapper: instance {instance}, category {request._category}")
+
+        request.process_initial_stream_response(response)
+
+        bedrock_from_stream: bool = False
+        if request.is_aws_client:
+            stream = response.get("stream", None)
+
+            if stream:
+                response = stream
+                bedrock_from_stream = True
+            else:
+                response = response.get("body")
+                bedrock_from_stream = False
+
+        super().__init__(response)  # type: ignore
+
+        self._response = response
+        self._instance = instance
+
+        self._instrumentor = instrumentor
+        self._stopwatch: Stopwatch = stopwatch
+        self._responses: list[str] = []
+
+        self._request: _ProviderRequest = request
+
+        self._first_token: bool = True
+        self._bedrock_from_stream: bool = bedrock_from_stream
+        self._ingested: bool = False
+        self._iter_started: bool = False
+
+    def __enter__(self) -> Any:
+        self._instrumentor._logger.debug(f"StreamIteratorWrapper: __enter__")
+        return self
+
+    def __exit__(self, exc_type: Any, exc_val: Any, exc_tb: Any) -> None:
+        self._instrumentor._logger.debug(f"StreamIteratorWrapper: __exit__")
+        self.__wrapped__.__exit__(exc_type, exc_val, exc_tb)  # type: ignore
+
+    async def __aenter__(self) -> Any:
+        self._instrumentor._logger.debug(f"StreamIteratorWrapper: __aenter__")
+        return self
+
+    async def __aexit__(self, exc_type: Any, exc_val: Any, exc_tb: Any) -> None:
+        self._instrumentor._logger.debug(f"StreamIteratorWrapper: __aexit__")
+        await self.__wrapped__.__aexit__(exc_type, exc_val, exc_tb)  # type: ignore
+
+    def __iter__(self) -> Any:
+        self._iter_started = True
+        if self._request.is_aws_client:
+            # MUST reside in a separate function so that the yield statement (e.g. the generator) doesn't implicitly return its own iterator and override self
+            self._instrumentor._logger.debug(f"StreamIteratorWrapper: bedrock __iter__")
+            return self._iter_bedrock()
+
+        self._instrumentor._logger.debug(f"StreamIteratorWrapper: __iter__")
+        return self
+
+    def _iter_bedrock(self) -> Any:
+        # botocore EventStream doesn't have a __next__ method so iterate over the wrapped object in place
+        for event in self.__wrapped__:  # type: ignore
+            result: Optional[_ChunkResult] = None
+
+            if (self._bedrock_from_stream):
+                result = self._evaluate_chunk(event)
+            else:
+                chunk = event.get('chunk')  # type: ignore
+                if chunk:
+                    decode = chunk.get('bytes').decode()  # type: ignore
+                    result = self._evaluate_chunk(decode)
+
+            if result and result.ingest:
+                from .BedrockInstrumentor import BedrockInstrumentor
+
+                xproxy_result = self._stop_iteration()
+
+                # the xproxy_result is not json serializable by default so adding the object is opt in by the client
+                if BedrockInstrumentor._add_streaming_xproxy_result:
+                    self._request.assign_xproxy_result(event, xproxy_result)
+            yield event
+
+        self._instrumentor._logger.debug(f"StreamIteratorWrapper: bedrock iter finished")
+
+        self._stop_iteration()
+
+    def __aiter__(self) -> Any:
+        self._iter_started = True
+        self._instrumentor._logger.debug(f"StreamIteratorWrapper: __aiter__")
+        return self
+
+    def __next__(self) -> object:
+        try:
+            chunk: object = self.__wrapped__.__next__()  # type: ignore
+
+            if self._ingested:
+                self._instrumentor._logger.debug(f"StreamIteratorWrapper: __next__ already ingested, not processing chunk {chunk}")
+                return chunk  # type: ignore
+
+            result = self._evaluate_chunk(chunk)
+
+            if result.ingest:
+                xproxy_result = self._stop_iteration()
+                self._request.assign_xproxy_result(chunk, xproxy_result)
+
+            if result.send_chunk_to_caller:
+                return chunk  # type: ignore
+            else:
+                return self.__next__()
+        except Exception as e:
+            if isinstance(e, StopIteration):
+                self._stop_iteration()
+            else:
+                self._instrumentor._logger.debug(f"StreamIteratorWrapper: __next__ exception {e}")
+            raise e
+
+    async def __anext__(self) -> object:
+        try:
+            chunk: object = await self.__wrapped__.__anext__()  # type: ignore
+
+            if self._ingested:
+                self._instrumentor._logger.debug(f"StreamIteratorWrapper: __anext__ already ingested, not processing chunk {chunk}")
+                return chunk  # type: ignore
+
+            result = self._evaluate_chunk(chunk)
+
+            if result.ingest:
+                xproxy_result = await self._astop_iteration()
+                self._request.assign_xproxy_result(chunk, xproxy_result)
+
+            if result.send_chunk_to_caller:
+                return chunk  # type: ignore
+            else:
+                return await self.__anext__()
+
+        except Exception as e:
+            if isinstance(e, StopAsyncIteration):
+                await self._astop_iteration()
+            else:
+                self._instrumentor._logger.debug(f"StreamIteratorWrapper: __anext__ exception {e}")
+            raise e
+
+    def _evaluate_chunk(self, chunk: Any) -> _ChunkResult:
+        if self._first_token:
+            self._request._ingest["time_to_first_token_ms"] = self._stopwatch.elapsed_ms_int()
+            self._first_token = False
+
+        if self._instrumentor._log_prompt_and_response:
+            self._responses.append(self.chunk_to_json(chunk))
+
+        return self._request.process_chunk(chunk)
+
+    def _process_stop_iteration(self) -> None:
+        self._instrumentor._logger.debug(f"StreamIteratorWrapper: process stop iteration")
+
+        self._stopwatch.stop()
+        self._request._ingest["end_to_end_latency_ms"] = self._stopwatch.elapsed_ms_int()
+        self._request._ingest["http_status_code"] = 200
+
+        if self._instrumentor._log_prompt_and_response:
+            self._request._ingest["provider_response_json"] = self._responses
+
+    async def _astop_iteration(self) -> Optional[Union[XproxyResult, XproxyError]]:
+        if self._ingested:
+            self._instrumentor._logger.debug(f"StreamIteratorWrapper: astop iteration already ingested, skipping")
+            return None
+
+        self._process_stop_iteration()
+        xproxy_result = await self._instrumentor._aingest_units(self._request)
+        self._ingested = True
+
+        return xproxy_result
+
+    def _stop_iteration(self) -> Optional[Union[XproxyResult, XproxyError]]:
+        if self._ingested:
+            self._instrumentor._logger.debug(f"StreamIteratorWrapper: stop iteration already ingested, skipping")
+            return None
+
+        self._process_stop_iteration()
+        xproxy_result = self._instrumentor._ingest_units(self._request)
+        self._ingested = True
+
+        return xproxy_result
+
+    @staticmethod
+    def chunk_to_json(chunk: Any) -> str:
+        if hasattr(chunk, "to_json"):
+            return str(chunk.to_json())
+        elif isinstance(chunk, bytes):
+            return chunk.decode()
+        elif isinstance(chunk, str):
+            return chunk
+        else:
+            # assume dict
+            return _compact_json(chunk)
+
+class _StreamManagerWrapper(ObjectProxy):  # type: ignore
+    def __init__(
+        self,
+        stream_manager: Any,  # type: ignore
+        instance: Any,
+        instrumentor: _PayiInstrumentor,
+        stopwatch: Stopwatch,
+        request: _ProviderRequest,
+    ) -> None:
+        instrumentor._logger.debug(f"StreamManagerWrapper: instance {instance}, category {request._category}")
+
+        super().__init__(stream_manager)  # type: ignore
+
+        self._stream_manager = stream_manager
+        self._instance = instance
+        self._instrumentor = instrumentor
+        self._stopwatch: Stopwatch = stopwatch
+        self._responses: list[str] = []
+        self._request: _ProviderRequest = request
+        self._first_token: bool = True
+
+    def __enter__(self) -> _StreamIteratorWrapper:
+        self._instrumentor._logger.debug(f"_StreamManagerWrapper: __enter__")
+
+        return _StreamIteratorWrapper(
+            response=self.__wrapped__.__enter__(),  # type: ignore
+            instance=self._instance,
+            instrumentor=self._instrumentor,
+            stopwatch=self._stopwatch,
+            request=self._request,
+        )
+
+class _GeneratorWrapper:  # type: ignore
+    def __init__(
+        self,
+        generator: Any,
+        instance: Any,
+        instrumentor: _PayiInstrumentor,
+        stopwatch: Stopwatch,
+        request: _ProviderRequest,
+    ) -> None:
+        instrumentor._logger.debug(f"GeneratorWrapper: instance {instance}, category {request._category}")
+
+        super().__init__()  # type: ignore
+
+        self._generator = generator
+        self._instance = instance
+        self._instrumentor = instrumentor
+        self._stopwatch: Stopwatch = stopwatch
+        self._log_prompt_and_response: bool = instrumentor._log_prompt_and_response
+        self._responses: list[str] = []
+        self._request: _ProviderRequest = request
+        self._first_token: bool = True
+        self._ingested: bool = False
+        self._iter_started: bool = False
+
+    def __iter__(self) -> Any:
+        self._iter_started = True
+        self._instrumentor._logger.debug(f"GeneratorWrapper: __iter__")
+        return self
+
+    def __aiter__(self) -> Any:
+        self._instrumentor._logger.debug(f"GeneratorWrapper: __aiter__")
+        return self
+
+    def _process_chunk(self, chunk: Any) -> _ChunkResult:
+        if self._first_token:
+            self._request._ingest["time_to_first_token_ms"] = self._stopwatch.elapsed_ms_int()
+            self._first_token = False
+
+        if self._log_prompt_and_response:
+            dict = self._chunk_to_dict(chunk)
+            self._responses.append(_compact_json(dict))
+
+        return self._request.process_chunk(chunk)
+
+    def __next__(self) -> Any:
+        try:
+            chunk = next(self._generator)
+            result = self._process_chunk(chunk)
+
+            if result.ingest:
+                xproxy_result = self._stop_iteration()
+                self._request.assign_xproxy_result(chunk, xproxy_result)
+
+            # ignore result.send_chunk_to_caller:
+            return chunk
+
+        except Exception as e:
+            if isinstance(e, StopIteration):
+                self._stop_iteration()
+            else:
+                self._instrumentor._logger.debug(f"GeneratorWrapper: __next__ exception {e}")
+            raise e
+
+    async def __anext__(self) -> Any:
+        try:
+            chunk = await anext(self._generator)  # type: ignore
+            result = self._process_chunk(chunk)
+
+            if result.ingest:
+                xproxy_result = await self._astop_iteration()
+                self._request.assign_xproxy_result(chunk, xproxy_result)
+
+            # ignore result.send_chunk_to_caller:
+            return chunk  # type: ignore
+
+        except Exception as e:
+            if isinstance(e, StopAsyncIteration):
+                await self._astop_iteration()
+            else:
+                self._instrumentor._logger.debug(f"GeneratorWrapper: __anext__ exception {e}")
+            raise e
+
+    @staticmethod
+    def _chunk_to_dict(chunk: Any) -> 'dict[str, object]':
+        if hasattr(chunk, "to_dict"):
+            return chunk.to_dict()  # type: ignore
+        elif hasattr(chunk, "to_json_dict"):
+            return chunk.to_json_dict()  # type: ignore
+        else:
+            return {}
+
+    def _stop_iteration(self) -> Optional[Union[XproxyResult, XproxyError]]:
+        if self._ingested:
+            self._instrumentor._logger.debug(f"GeneratorWrapper: stop iteration already ingested, skipping")
+            return None
+
+        self._process_stop_iteration()
+        xproxy_result = self._instrumentor._ingest_units(self._request)
+        self._ingested = True
+        return xproxy_result
+
+    async def _astop_iteration(self) -> Optional[Union[XproxyResult, XproxyError]]:
+        if self._ingested:
+            self._instrumentor._logger.debug(f"GeneratorWrapper: astop iteration already ingested, skipping")
+            return None
+
+        self._process_stop_iteration()
+        xproxy_result = await self._instrumentor._aingest_units(self._request)
+        self._ingested = True
+        return xproxy_result
+
+    def _process_stop_iteration(self) -> None:
+        self._instrumentor._logger.debug(f"GeneratorWrapper: stop iteration")
+
+        self._stopwatch.stop()
+        self._request._ingest["end_to_end_latency_ms"] = self._stopwatch.elapsed_ms_int()
+        self._request._ingest["http_status_code"] = 200
+
+        if self._log_prompt_and_response:
+            self._request._ingest["provider_response_json"] = self._responses
+
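Both wrappers subclass wrapt's `ObjectProxy`, so the instrumented stream keeps the provider SDK's full surface (context manager, iterator, attributes) while `__next__`/`__anext__` intercept every chunk and `_stop_iteration` ingests usage exactly once when the stream ends. The Bedrock branch lives in a separate `_iter_bedrock` generator because a `yield` inside `__iter__` would turn `__iter__` itself into a generator function and bypass the proxy. Below is a minimal standalone sketch of the same interception pattern; `CountingStream` is hypothetical and not part of the package:

```python
from wrapt import ObjectProxy  # pip install wrapt

class CountingStream(ObjectProxy):  # simplified analogue of _StreamIteratorWrapper
    def __init__(self, wrapped):
        super().__init__(wrapped)
        # wrapt stores attributes prefixed with _self_ on the proxy itself;
        # all other attribute access is delegated to the wrapped object
        self._self_count = 0

    def __iter__(self):
        return self

    def __next__(self):
        try:
            chunk = self.__wrapped__.__next__()
            self._self_count += 1  # per-chunk bookkeeping happens here
            return chunk
        except StopIteration:
            # end of stream: the real wrapper stops its stopwatch and ingests
            # units here, guarded by an _ingested flag so it runs only once
            print(f"stream finished after {self._self_count} chunks")
            raise

for piece in CountingStream(iter(["a", "b", "c"])):
    print(piece)
```

Because the proxy forwards everything it does not override, caller code that checks types or reads SDK-specific attributes on the stream continues to work unchanged.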
payi/lib/VertexInstrumentor.py
CHANGED

@@ -1,11 +1,14 @@
+from __future__ import annotations
+
 from typing import Any, List, Union, Optional, Sequence
 from typing_extensions import override
 
 from wrapt import wrap_function_wrapper  # type: ignore
 
-from .instrument import
+from .instrument import _IsStreaming, _PayiInstrumentor
 from .VertexRequest import _VertexRequest
 from .version_helper import get_version_helper
+from .ProviderRequest import _ChunkResult
 
 
 class VertexInstrumentor:
@@ -14,42 +17,20 @@ class VertexInstrumentor:
 
     @staticmethod
    def instrument(instrumentor: _PayiInstrumentor) -> None:
-
-        try:
-            wrap_function_wrapper(
-                "vertexai.generative_models",
-                "GenerativeModel.generate_content",
-                generate_wrapper(instrumentor),
-            )
-
-            wrap_function_wrapper(
-                "vertexai.generative_models",
-                "GenerativeModel.generate_content_async",
-                agenerate_wrapper(instrumentor),
-            )
-
-
-        except Exception as e:
-            instrumentor._logger.debug(f"Error instrumenting vertex: {e}")
-            return
-
-        # separate instrumetning preview functionality from released in case it fails
-        try:
-            wrap_function_wrapper(
-                "vertexai.preview.generative_models",
-                "GenerativeModel.generate_content",
-                generate_wrapper(instrumentor),
-            )
-
-            wrap_function_wrapper(
-                "vertexai.preview.generative_models",
-                "GenerativeModel.generate_content_async",
-                agenerate_wrapper(instrumentor),
-            )
-
-        except Exception as e:
-            instrumentor._logger.debug(f"Error instrumenting vertex: {e}")
-            return
+        VertexInstrumentor._module_version = get_version_helper(VertexInstrumentor._module_name)
+
+        wrappers = [
+            ("vertexai.generative_models", "GenerativeModel.generate_content", generate_wrapper(instrumentor)),
+            ("vertexai.generative_models", "GenerativeModel.generate_content_async", agenerate_wrapper(instrumentor)),
+            ("vertexai.preview.generative_models", "GenerativeModel.generate_content", generate_wrapper(instrumentor)),
+            ("vertexai.preview.generative_models", "GenerativeModel.generate_content_async", agenerate_wrapper(instrumentor)),
+        ]
+
+        for module, method, wrapper in wrappers:
+            try:
+                wrap_function_wrapper(module, method, wrapper)
+            except Exception as e:
+                instrumentor._logger.debug(f"Error wrapping {module}.{method}: {e}")
 
 @_PayiInstrumentor.payi_wrapper
 def generate_wrapper(
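The rewritten `instrument` collapses two hand-written try blocks into a table of wrap targets, so a failure on any one target (for example, an SDK version without the preview module) is logged and skipped instead of aborting the remaining instrumentation. A sketch of the same table-driven pattern against stand-in targets follows; the `json` entries are placeholders for illustration, not what the instrumentor actually wraps:

```python
import logging
from wrapt import wrap_function_wrapper  # pip install wrapt

logger = logging.getLogger(__name__)

def passthrough_wrapper(wrapped, instance, args, kwargs):
    # wrapt wrapper signature: receives the original callable and its call
    return wrapped(*args, **kwargs)

# one (module, attribute path, wrapper) row per wrap target
targets = [
    ("json", "dumps", passthrough_wrapper),
    ("json", "no_such_function", passthrough_wrapper),  # hypothetical: raises
]

for module, method, wrapper in targets:
    try:
        wrap_function_wrapper(module, method, wrapper)
    except Exception as e:
        # a single bad row is logged; the remaining rows still get wrapped
        logger.debug("Error wrapping %s.%s: %s", module, method, e)
```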
payi/lib/VertexRequest.py
CHANGED

@@ -1,3 +1,5 @@
+from __future__ import annotations
+
 import json
 import math
 from typing import Any, Optional
@@ -6,7 +8,8 @@ from typing_extensions import override
 from payi.lib.helpers import PayiCategories
 from payi.types.ingest_units_params import Units
 
-from .instrument import
+from .instrument import _PayiInstrumentor
+from .ProviderRequest import _ChunkResult, _StreamingType, _ProviderRequest
 
 
 class _VertexRequest(_ProviderRequest):  # type: ignore
@@ -44,6 +47,11 @@ class _VertexRequest(_ProviderRequest):  # type: ignore
         if id:
             self._ingest["provider_response_id"] = id
 
+        if "provider_response_headers" not in self._ingest:
+            response_headers = response_dict.get('sdk_http_response', {}).get('headers', {})
+            if response_headers:
+                self.add_response_headers(response_headers)
+
         if "resource" not in self._ingest:
             model: Optional[str] = self._get_model_name(response_dict)  # type: ignore[unreachable]
             if model:
@@ -111,6 +119,10 @@ class _VertexRequest(_ProviderRequest):  # type: ignore
         response_dict: 'dict[str, Any]',
         log_prompt_and_response: bool) -> Any:
 
+        response_headers = response_dict.get('sdk_http_response', {}).get('headers', {})
+        if response_headers:
+            self.add_response_headers(response_headers)
+
         id: Optional[str] = response_dict.get("response_id", None)
         if id:
             self._ingest["provider_response_id"] = id
@@ -148,7 +160,7 @@ class _VertexRequest(_ProviderRequest):  # type: ignore
             return model.startswith("gemini-1.")
 
         def is_large_context_token_model(model: str, input_tokens: int) -> bool:
-            return model.startswith("gemini-2.5-pro") and input_tokens >
+            return model.startswith("gemini-2.5-pro") and input_tokens > 200000
 
         def add_units(request: _ProviderRequest, key: str, input: Optional[int] = None, output: Optional[int] = None) -> None:
             if key not in request._ingest["units"]:
@@ -172,6 +184,7 @@ class _VertexRequest(_ProviderRequest):  # type: ignore
 
         if is_character_billing_model(model):
            if input > 128000:
+                self._is_large_context = True
                large_context = "_large_context"
 
            # gemini 1.0 and 1.5 units are reported in characters, per second, per image, etc...
@@ -222,6 +235,7 @@ class _VertexRequest(_ProviderRequest):  # type: ignore
        thinking_token_count = usage.get("thoughts_token_count", 0)
 
        if is_large_context_token_model(model, input):
+            self._is_large_context = True
            large_context = "_large_context"
 
        cache_details: dict[str, int] = {}