PyPI - payi - Versions diffs - 0.1.0a40__py3-none-any.whl → 0.1.0a42__py3-none-any.whl - Mend

payi 0.1.0a40__py3-none-any.whl → 0.1.0a42__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of payi might be problematic. Click here for more details.

Files changed (18) hide show

payi/_constants.py +1 -1
payi/_models.py +1 -1
payi/_version.py +1 -1
payi/lib/AnthropicInstrumentor.py +42 -13
payi/lib/BedrockInstrumentor.py +282 -0
payi/lib/Instruments.py +1 -0
payi/lib/OpenAIInstrumentor.py +37 -8
payi/lib/Stopwatch.py +1 -1
payi/lib/instrument.py +505 -155
payi/resources/ingest.py +78 -0
payi/types/__init__.py +3 -0
payi/types/bulk_ingest_response.py +51 -0
payi/types/ingest_bulk_params.py +14 -0
payi/types/ingest_event_param.py +60 -0
{payi-0.1.0a40.dist-info → payi-0.1.0a42.dist-info}/METADATA +1 -1
{payi-0.1.0a40.dist-info → payi-0.1.0a42.dist-info}/RECORD +18 -14
{payi-0.1.0a40.dist-info → payi-0.1.0a42.dist-info}/WHEEL +0 -0
{payi-0.1.0a40.dist-info → payi-0.1.0a42.dist-info}/licenses/LICENSE +0 -0

payi/lib/instrument.py CHANGED Viewed

@@ -1,21 +1,28 @@
 import json
 import uuid
-import asyncio
 import inspect
 import logging
 import traceback
+from enum import Enum
 from typing import Any, Set, Union, Callable, Optional
 from wrapt import ObjectProxy  # type: ignore
 from payi import Payi, AsyncPayi
 from payi.types import IngestUnitsParams
+from payi.types.ingest_response import IngestResponse
 from payi.types.ingest_units_params import Units
+from payi.types.pay_i_common_models_api_router_header_info_param import PayICommonModelsAPIRouterHeaderInfoParam
 from .Stopwatch import Stopwatch
 from .Instruments import Instruments
+class IsStreaming(Enum):
+    false = 0
+    true = 1
+    kwargs = 2
 class PayiInstrumentor:
     estimated_prompt_tokens: str = "estimated_prompt_tokens"
@@ -44,12 +51,15 @@ class PayiInstrumentor:
     def _instrument_all(self) -> None:
         self._instrument_openai()
         self._instrument_anthropic()
+        self._instrument_aws_bedrock()
     def _instrument_specific(self, instruments: Set[Instruments]) -> None:
         if Instruments.OPENAI in instruments:
             self._instrument_openai()
         if Instruments.ANTHROPIC in instruments:
             self._instrument_anthropic()
+        if Instruments.AWS_BEDROCK in instruments:
+            self._instrument_aws_bedrock()
     def _instrument_openai(self) -> None:
         from .OpenAIInstrumentor import OpenAiInstrumentor
@@ -69,79 +79,101 @@ class PayiInstrumentor:
         except Exception as e:
             logging.error(f"Error instrumenting Anthropic: {e}")
-    def _ingest_units(self, ingest_units: IngestUnitsParams) -> None:
-        # return early if there are no units to ingest and on a successul ingest request
+    def _instrument_aws_bedrock(self) -> None:
+        from .BedrockInstrumentor import BedrockInstrumentor
+        try:
+            BedrockInstrumentor.instrument(self)
+        except Exception as e:
+            logging.error(f"Error instrumenting AWS bedrock: {e}")
+    def _process_ingest_units(self, ingest_units: IngestUnitsParams, log_data: 'dict[str, str]') -> bool:
         if int(ingest_units.get("http_status_code") or 0) < 400:
             units = ingest_units.get("units", {})
             if not units or all(unit.get("input", 0) == 0 and unit.get("output", 0) == 0 for unit in units.values()):
                 logging.error(
                     'No units to ingest.  For OpenAI streaming calls, make sure you pass stream_options={"include_usage": True}'
                 )
-                return
+                return False
+        if self._log_prompt_and_response and self._prompt_and_response_logger:
+            response_json = ingest_units.pop("provider_response_json", None)
+            request_json = ingest_units.pop("provider_request_json", None)
+            stack_trace = ingest_units.get("properties", {}).pop("system.stack_trace", None)  # type: ignore
+            if response_json is not None:
+                # response_json is a list of strings, convert a single json string
+                log_data["provider_response_json"] = json.dumps(response_json)
+            if request_json is not None:
+                log_data["provider_request_json"] = request_json
+            if stack_trace is not None:
+                log_data["stack_trace"] = stack_trace
+        return True
+    def _process_ingest_units_response(self, ingest_response: IngestResponse) -> None:
+        if ingest_response.xproxy_result.limits:
+            for limit_id, state in ingest_response.xproxy_result.limits.items():
+                removeBlockedId: bool = False
+                if state.state == "blocked":
+                    self._blocked_limits.add(limit_id)
+                elif state.state == "exceeded":
+                    self._exceeded_limits.add(limit_id)
+                    removeBlockedId = True
+                elif state.state == "ok":
+                    removeBlockedId = True
+                # opportunistically remove blocked limits
+                if removeBlockedId:
+                    self._blocked_limits.discard(limit_id)
+    async def _aingest_units(self, ingest_units: IngestUnitsParams) -> None:
+        # return early if there are no units to ingest and on a successul ingest request
+        log_data: 'dict[str,str]' = {}
+        if not self._process_ingest_units(ingest_units, log_data):
+            return
         try:
             if isinstance(self._payi, AsyncPayi):
-                loop = asyncio.new_event_loop()
-                asyncio.set_event_loop(loop)
-                try:
-                    ingest_result = loop.run_until_complete(self._payi.ingest.units(**ingest_units))
-                finally:
-                    loop.close()
-            elif isinstance(self._payi, Payi):
-                ingest_result = self._payi.ingest.units(**ingest_units)
+                ingest_response= await self._payi.ingest.units(**ingest_units)
+                self._process_ingest_units_response(ingest_response)
+                if self._log_prompt_and_response and self._prompt_and_response_logger:
+                    request_id = ingest_response.xproxy_result.request_id
+                    self._prompt_and_response_logger(request_id, log_data)  # type: ignore
             else:
                 logging.error("No payi instance to ingest units")
                 return
+        except Exception as e:
+            logging.error(f"Error Pay-i ingesting result: {e}")
-            if ingest_result.xproxy_result.limits:
-                for limit_id, state in ingest_result.xproxy_result.limits.items():
-                    removeBlockedId: bool = False
-                    if state.state == "blocked":
-                        self._blocked_limits.add(limit_id)
-                    elif state.state == "exceeded":
-                        self._exceeded_limits.add(limit_id)
-                        removeBlockedId = True
-                    elif state.state == "ok":
-                        removeBlockedId = True
-                    # opportunistically remove blocked limits
-                    if removeBlockedId:
-                        self._blocked_limits.discard(limit_id)
-            if self._log_prompt_and_response and self._prompt_and_response_logger:
-                request_id = ingest_result.xproxy_result.request_id
-                log_data = {}
-                response_json = ingest_units.pop("provider_response_json", None)
-                request_json = ingest_units.pop("provider_request_json", None)
-                stack_trace = ingest_units.get("properties", {}).pop("system.stack_trace", None)  # type: ignore
+    def _ingest_units(self, ingest_units: IngestUnitsParams) -> None:
+        # return early if there are no units to ingest and on a successul ingest request
+        log_data: 'dict[str,str]' = {}
+        if not self._process_ingest_units(ingest_units, log_data):
+            return
-                if response_json is not None:
-                    # response_json is a list of strings, convert a single json string
-                    log_data["provider_response_json"] = json.dumps(response_json)
-                if request_json is not None:
-                    log_data["provider_request_json"] = request_json
-                if stack_trace is not None:
-                    log_data["stack_trace"] = stack_trace
+        try:
+            if isinstance(self._payi, Payi):
+                ingest_response = self._payi.ingest.units(**ingest_units)
-                self._prompt_and_response_logger(request_id, log_data)  # type: ignore
+                self._process_ingest_units_response(ingest_response)
+                if self._log_prompt_and_response and self._prompt_and_response_logger:
+                    request_id = ingest_response.xproxy_result.request_id
+                    self._prompt_and_response_logger(request_id, log_data)  # type: ignore
+            else:
+                logging.error("No payi instance to ingest units")
+                return
         except Exception as e:
             logging.error(f"Error Pay-i ingesting result: {e}")
-    def _call_func(
-        self,
-        func: Any,
-        proxy: bool,
-        limit_ids: Optional["list[str]"],
-        request_tags: Optional["list[str]"],
-        experience_name: Optional[str],
-        experience_id: Optional[str],
-        user_id: Optional[str],
-        *args: Any,
-        **kwargs: Any,
-    ) -> Any:
+    def _setup_call_func(
+        self
+        ) -> 'tuple[dict[str, Any], Optional[str], Optional[str]]':
         if len(self._context_stack) > 0:
             # copy current context into the upcoming context
             context = self._context_stack[-1].copy()
@@ -152,36 +184,100 @@ class PayiInstrumentor:
             context = {}
             previous_experience_name = None
             previous_experience_id = None
+        return (context, previous_experience_name, previous_experience_id)
-        with self:
-            context["proxy"] = proxy
-            # Handle experience name and ID logic
-            if not experience_name:
-                # If no experience_name specified, use previous values
-                context["experience_name"] = previous_experience_name
-                context["experience_id"] = previous_experience_id
+    def _init_context(
+        self,
+        context: "dict[str, Any]",
+        previous_experience_name: Optional[str],
+        previous_experience_id: Optional[str],
+        proxy: bool,
+        limit_ids: Optional["list[str]"],
+        request_tags: Optional["list[str]"],
+        experience_name: Optional[str],
+        experience_id: Optional[str],
+        user_id: Optional[str],
+        ) -> None:
+        context["proxy"] = proxy
+        # Handle experience name and ID logic
+        if not experience_name:
+            # If no experience_name specified, use previous values
+            context["experience_name"] = previous_experience_name
+            context["experience_id"] = previous_experience_id
+        else:
+            # If experience_name is specified
+            if experience_name == previous_experience_name:
+                # Same experience name, use previous ID unless new one specified
+                context["experience_name"] = experience_name
+                context["experience_id"] = experience_id if experience_id else previous_experience_id
             else:
-                # If experience_name is specified
-                if experience_name == previous_experience_name:
-                    # Same experience name, use previous ID unless new one specified
-                    context["experience_name"] = experience_name
-                    context["experience_id"] = experience_id if experience_id else previous_experience_id
-                else:
-                    # Different experience name, use specified ID or generate one
-                    context["experience_name"] = experience_name
-                    context["experience_id"] = experience_id if experience_id else str(uuid.uuid4())
+                # Different experience name, use specified ID or generate one
+                context["experience_name"] = experience_name
+                context["experience_id"] = experience_id if experience_id else str(uuid.uuid4())
+        # set any values explicitly passed by the caller, otherwise use what is already in the context
+        if limit_ids:
+            context["limit_ids"] = limit_ids
+        if request_tags:
+            context["request_tags"] = request_tags
+        if user_id:
+            context["user_id"] = user_id
+        self.set_context(context)
+    async def _acall_func(
+        self,
+        func: Any,
+        proxy: bool,
+        limit_ids: Optional["list[str]"],
+        request_tags: Optional["list[str]"],
+        experience_name: Optional[str],
+        experience_id: Optional[str],
+        user_id: Optional[str],
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        context, previous_experience_name, previous_experience_id = self._setup_call_func()
-            # set any values explicitly passed by the caller, otherwise use what is already in the context
-            if limit_ids:
-                context["limit_ids"] = limit_ids
-            if request_tags:
-                context["request_tags"] = request_tags
-            if user_id:
-                context["user_id"] = user_id
+        with self:
+            self._init_context(
+                context,
+                previous_experience_name,
+                previous_experience_id,
+                proxy,
+                limit_ids,
+                request_tags,
+                experience_name,
+                experience_id,
+                user_id)
+            return await func(*args, **kwargs)
-            self.set_context(context)
+    def _call_func(
+        self,
+        func: Any,
+        proxy: bool,
+        limit_ids: Optional["list[str]"],
+        request_tags: Optional["list[str]"],
+        experience_name: Optional[str],
+        experience_id: Optional[str],
+        user_id: Optional[str],
+        *args: Any,
+        **kwargs: Any,
+    ) -> Any:
+        context, previous_experience_name, previous_experience_id = self._setup_call_func()
+        with self:
+            self._init_context(
+                context,
+                previous_experience_name,
+                previous_experience_id,
+                proxy,
+                limit_ids,
+                request_tags,
+                experience_name,
+                experience_id,
+                user_id)
             return func(*args, **kwargs)
     def __enter__(self) -> Any:
@@ -203,22 +299,68 @@ class PayiInstrumentor:
         # Return the current top of the stack
         return self._context_stack[-1] if self._context_stack else None
-    def chat_wrapper(
+    def _prepare_ingest(
+        self,
+        ingest: IngestUnitsParams,
+        ingest_extra_headers: "dict[str, str]", # do not coflict potential kwargs["extra_headers"]
+        **kwargs: Any,
+    ) -> None:
+        limit_ids = ingest_extra_headers.pop("xProxy-Limit-IDs", None)
+        request_tags = ingest_extra_headers.pop("xProxy-Request-Tags", None)
+        experience_name = ingest_extra_headers.pop("xProxy-Experience-Name", None)
+        experience_id = ingest_extra_headers.pop("xProxy-Experience-ID", None)
+        user_id = ingest_extra_headers.pop("xProxy-User-ID", None)
+        if limit_ids:
+            ingest["limit_ids"] = limit_ids.split(",")
+        if request_tags:
+            ingest["request_tags"] = request_tags.split(",")
+        if experience_name:
+            ingest["experience_name"] = experience_name
+        if experience_id:
+            ingest["experience_id"] = experience_id
+        if user_id:
+            ingest["user_id"] = user_id
+        if len(ingest_extra_headers) > 0:
+            ingest["provider_request_headers"] = [PayICommonModelsAPIRouterHeaderInfoParam(name=k, value=v) for k, v in ingest_extra_headers.items()]
+        provider_prompt = {}
+        for k, v in kwargs.items():
+            if k == "messages":
+                provider_prompt[k] = [m.model_dump() if hasattr(m, "model_dump") else m for m in v]
+            elif k in ["extra_headers", "extra_query"]:
+                pass
+            else:
+                provider_prompt[k] = v
+        if self._log_prompt_and_response:
+            ingest["provider_request_json"] = json.dumps(provider_prompt)
+    async def achat_wrapper(
         self,
         category: str,
-        process_chunk: Callable[[Any, IngestUnitsParams], None],
-        process_request: Optional[Callable[[IngestUnitsParams, Any], None]],
-        process_synchronous_response: Optional[Callable[[Any, IngestUnitsParams, bool], None]],
+        process_chunk: Optional[Callable[[Any, IngestUnitsParams], None]],
+        process_request: Optional[Callable[[IngestUnitsParams, Any, Any], None]],
+        process_synchronous_response: Any,
+        is_streaming: IsStreaming,
         wrapped: Any,
         instance: Any,
         args: Any,
-        kwargs: 'dict[str, Any]',
+        kwargs: Any,
     ) -> Any:
         context = self.get_context()
+        is_bedrock:bool = category == "system.aws.bedrock"
         if not context:
-            # should not happen
-            return wrapped(*args, **kwargs)
+            if is_bedrock:
+                # boto3 doesn't allow extra_headers
+                kwargs.pop("extra_headers", None)
+            # wrapped function invoked outside of decorator scope
+            return await wrapped(*args, **kwargs)
         # after _udpate_headers, all metadata to add to ingest is in extra_headers, keyed by the xproxy-xxx header name
         extra_headers = kwargs.get("extra_headers", {})
@@ -228,13 +370,16 @@ class PayiInstrumentor:
             if "extra_headers" not in kwargs:
                 kwargs["extra_headers"] = extra_headers
-            return wrapped(*args, **kwargs)
+            return await wrapped(*args, **kwargs)
-        ingest: IngestUnitsParams = {"category": category, "resource": kwargs.get("model"), "units": {}} # type: ignore
+        ingest: IngestUnitsParams = {"category": category, "units": {}} # type: ignore
+        if is_bedrock:
+            # boto3 doesn't allow extra_headers
+            kwargs.pop("extra_headers", None)
+            ingest["resource"] = kwargs.get("modelId", "")
+        else:
+            ingest["resource"] = kwargs.get("model", "")
-        # blocked_limit = next((limit for limit in (context.get('limit_ids') or []) if limit in self._blocked_limits), None)
-        # if blocked_limit:
-        #      raise Exception(f"Limit {blocked_limit} is blocked")
         current_frame = inspect.currentframe()
         # f_back excludes the current frame, strip() cleans up whitespace and newlines
         stack = [frame.strip() for frame in traceback.format_stack(current_frame.f_back)]  # type: ignore
@@ -242,46 +387,135 @@ class PayiInstrumentor:
         ingest['properties'] = { 'system.stack_trace': json.dumps(stack) }
         if process_request:
-            process_request(ingest, kwargs)
+            process_request(ingest, (), instance)
         sw = Stopwatch()
-        stream = kwargs.get("stream", False)
+        stream: bool = False
+        if is_streaming == IsStreaming.kwargs:
+            stream = kwargs.get("stream", False)
+        elif is_streaming == IsStreaming.true:
+            stream = True
+        else:
+            stream = False
         try:
-            limit_ids = extra_headers.pop("xProxy-Limit-IDs", None)
-            request_tags = extra_headers.pop("xProxy-Request-Tags", None)
-            experience_name = extra_headers.pop("xProxy-Experience-Name", None)
-            experience_id = extra_headers.pop("xProxy-Experience-ID", None)
-            user_id = extra_headers.pop("xProxy-User-ID", None)
-            if limit_ids:
-                ingest["limit_ids"] = limit_ids.split(",")
-            if request_tags:
-                ingest["request_tags"] = request_tags.split(",")
-            if experience_name:
-                ingest["experience_name"] = experience_name
-            if experience_id:
-                ingest["experience_id"] = experience_id
-            if user_id:
-                ingest["user_id"] = user_id
-            if len(extra_headers) > 0:
-                ingest["provider_request_headers"] = {k: [v] for k, v in extra_headers.items()}  # type: ignore
-            provider_prompt = {}
-            for k, v in kwargs.items():
-                if k == "messages":
-                    provider_prompt[k] = [m.model_dump() if hasattr(m, "model_dump") else m for m in v]
-                elif k in ["extra_headers", "extra_query"]:
-                    pass
+            self._prepare_ingest(ingest, extra_headers, **kwargs)
+            sw.start()
+            response = await wrapped(*args, **kwargs)
+        except Exception as e:  # pylint: disable=broad-except
+            sw.stop()
+            duration = sw.elapsed_ms_int()
+            # TODO ingest error
+            raise e
+        if stream:
+            stream_result = ChatStreamWrapper(
+                response=response,
+                instance=instance,
+                instrumentor=self,
+                log_prompt_and_response=self._log_prompt_and_response,
+                ingest=ingest,
+                stopwatch=sw,
+                process_chunk=process_chunk,
+                is_bedrock=is_bedrock,
+            )
+            if is_bedrock:
+                if "body" in response:
+                    response["body"] = stream_result
                 else:
-                    provider_prompt[k] = v
+                    response["stream"] = stream_result
+                return response
+            return stream_result
+        sw.stop()
+        duration = sw.elapsed_ms_int()
+        ingest["end_to_end_latency_ms"] = duration
+        ingest["http_status_code"] = 200
+        if process_synchronous_response:
+            return_result: Any = process_synchronous_response(
+                response=response,
+                ingest=ingest,
+                log_prompt_and_response=self._log_prompt_and_response,
+                instrumentor=self)
+            if return_result:
+                return return_result
+        await self._aingest_units(ingest)
+        return response
+    def chat_wrapper(
+        self,
+        category: str,
+        process_chunk: Optional[Callable[[Any, IngestUnitsParams], None]],
+        process_request: Optional[Callable[[IngestUnitsParams, Any, Any], None]],
+        process_synchronous_response: Any,
+        is_streaming: IsStreaming,
+        wrapped: Any,
+        instance: Any,
+        args: Any,
+        kwargs: Any,
+    ) -> Any:
+        context = self.get_context()
+        is_bedrock:bool = category == "system.aws.bedrock"
+        if not context:
+            if is_bedrock:
+                # boto3 doesn't allow extra_headers
+                kwargs.pop("extra_headers", None)
+            # wrapped function invoked outside of decorator scope
+            return wrapped(*args, **kwargs)
+        # after _udpate_headers, all metadata to add to ingest is in extra_headers, keyed by the xproxy-xxx header name
+        extra_headers = kwargs.get("extra_headers", {})
+        self._update_headers(context, extra_headers)
+        if context.get("proxy", True):
+            if "extra_headers" not in kwargs:
+                kwargs["extra_headers"] = extra_headers
+            return wrapped(*args, **kwargs)
+        ingest: IngestUnitsParams = {"category": category, "units": {}} # type: ignore
+        if is_bedrock:
+            # boto3 doesn't allow extra_headers
+            kwargs.pop("extra_headers", None)
+            ingest["resource"] = kwargs.get("modelId", "")
+        else:
+            ingest["resource"] = kwargs.get("model", "")
+        current_frame = inspect.currentframe()
+        # f_back excludes the current frame, strip() cleans up whitespace and newlines
+        stack = [frame.strip() for frame in traceback.format_stack(current_frame.f_back)]  # type: ignore
-            if self._log_prompt_and_response:
-                ingest["provider_request_json"] = json.dumps(provider_prompt)
+        ingest['properties'] = { 'system.stack_trace': json.dumps(stack) }
+        if process_request:
+            process_request(ingest, (), kwargs)
+        sw = Stopwatch()
+        stream: bool = False
+        if is_streaming == IsStreaming.kwargs:
+            stream = kwargs.get("stream", False)
+        elif is_streaming == IsStreaming.true:
+            stream = True
+        else:
+            stream = False
+        try:
+            self._prepare_ingest(ingest, extra_headers, **kwargs)
             sw.start()
-            response = wrapped(*args, **kwargs.copy())
+            response = wrapped(*args, **kwargs)
         except Exception as e:  # pylint: disable=broad-except
             sw.stop()
@@ -292,7 +526,7 @@ class PayiInstrumentor:
             raise e
         if stream:
-            return ChatStreamWrapper(
+            stream_result = ChatStreamWrapper(
                 response=response,
                 instance=instance,
                 instrumentor=self,
@@ -300,15 +534,31 @@ class PayiInstrumentor:
                 ingest=ingest,
                 stopwatch=sw,
                 process_chunk=process_chunk,
+                is_bedrock=is_bedrock,
             )
+            if is_bedrock:
+                if "body" in response:
+                    response["body"] = stream_result
+                else:
+                    response["stream"] = stream_result
+                return response
+            return stream_result
         sw.stop()
         duration = sw.elapsed_ms_int()
         ingest["end_to_end_latency_ms"] = duration
         ingest["http_status_code"] = 200
         if process_synchronous_response:
-            process_synchronous_response(response, ingest, self._log_prompt_and_response)
+            return_result: Any = process_synchronous_response(
+                response=response,
+                ingest=ingest,
+                log_prompt_and_response=self._log_prompt_and_response,
+                instrumentor=self)
+            if return_result:
+                return return_result
         self._ingest_units(ingest)
@@ -379,14 +629,29 @@ class PayiInstrumentor:
                     o,
                     wrapped,
                     instance,
-                    args,
-                    kwargs,
+                    *args,
+                    **kwargs,
                 )
             return wrapper
         return _payi_wrapper
+    @staticmethod
+    def payi_awrapper(func: Any) -> Any:
+        def _payi_awrapper(o: Any) -> Any:
+            async def wrapper(wrapped: Any, instance: Any, args: Any, kwargs: Any) -> Any:
+                return await func(
+                    o,
+                    wrapped,
+                    instance,
+                    *args,
+                    **kwargs,
+                )
+            return wrapper
+        return _payi_awrapper
 class ChatStreamWrapper(ObjectProxy):  # type: ignore
     def __init__(
@@ -398,7 +663,19 @@ class ChatStreamWrapper(ObjectProxy):  # type: ignore
         stopwatch: Stopwatch,
         process_chunk: Optional[Callable[[Any, IngestUnitsParams], None]] = None,
         log_prompt_and_response: bool = True,
+        is_bedrock: bool = False,
     ) -> None:
+        bedrock_from_stream: bool = False
+        if is_bedrock:
+            stream = response.get("stream", None)
+            if stream:
+                response = stream
+                bedrock_from_stream = True
+            else:
+                response = response.get("body")
+                bedrock_from_stream = False
         super().__init__(response)  # type: ignore
         self._response = response
@@ -413,6 +690,8 @@ class ChatStreamWrapper(ObjectProxy):  # type: ignore
         self._process_chunk: Optional[Callable[[Any, IngestUnitsParams], None]] = process_chunk
         self._first_token: bool = True
+        self._is_bedrock: bool = is_bedrock
+        self._bedrock_from_stream: bool = bedrock_from_stream
     def __enter__(self) -> Any:
         return self
@@ -426,9 +705,26 @@ class ChatStreamWrapper(ObjectProxy):  # type: ignore
     async def __aexit__(self, exc_type: Any, exc_val: Any, exc_tb: Any) -> None:
         await self.__wrapped__.__aexit__(exc_type, exc_val, exc_tb)  # type: ignore
-    def __iter__(self) -> Any:
+    def __iter__(self) -> Any:
+        if self._is_bedrock:
+            # MUST be reside in a separate function so that the yield statement doesn't implicitly return its own iterator and overriding self
+            return self._iter_bedrock()
         return self
+    def _iter_bedrock(self) -> Any:
+        # botocore EventStream doesn't have a __next__ method so iterate over the wrapped object in place
+        for event in self.__wrapped__: # type: ignore
+            if (self._bedrock_from_stream):
+                self._evaluate_chunk(event)
+            else:
+                chunk = event.get('chunk') # type: ignore
+                if chunk:
+                    decode = chunk.get('bytes').decode() # type: ignore
+                    self._evaluate_chunk(decode)
+            yield event
+        self._stop_iteration()
     def __aiter__(self) -> Any:
         return self
@@ -448,7 +744,7 @@ class ChatStreamWrapper(ObjectProxy):  # type: ignore
             chunk: Any = await self.__wrapped__.__anext__()  # type: ignore
         except Exception as e:
             if isinstance(e, StopAsyncIteration):
-                self._stop_iteration()
+                await self._astop_iteration()
             raise e
         else:
             self._evaluate_chunk(chunk)
@@ -460,12 +756,12 @@ class ChatStreamWrapper(ObjectProxy):  # type: ignore
             self._first_token = False
         if self._log_prompt_and_response:
-            self._responses.append(chunk.to_json())
+            self._responses.append(self.chunk_to_json(chunk))
         if self._process_chunk:
             self._process_chunk(chunk, self._ingest)
-    def _stop_iteration(self) -> None:
+    def _process_stop_iteration(self) -> None:
         self._stopwatch.stop()
         self._ingest["end_to_end_latency_ms"] = self._stopwatch.elapsed_ms_int()
         self._ingest["http_status_code"] = 200
@@ -473,13 +769,29 @@ class ChatStreamWrapper(ObjectProxy):  # type: ignore
         if self._log_prompt_and_response:
             self._ingest["provider_response_json"] = self._responses
+    async def _astop_iteration(self) -> None:
+        self._process_stop_iteration()
+        await self._instrumentor._aingest_units(self._ingest)
+    def _stop_iteration(self) -> None:
+        self._process_stop_iteration()
         self._instrumentor._ingest_units(self._ingest)
+    @staticmethod
+    def chunk_to_json(chunk: Any) -> str:
+        if hasattr(chunk, "to_json"):
+            return str(chunk.to_json())
+        elif isinstance(chunk, bytes):
+            return chunk.decode()
+        elif isinstance(chunk, str):
+            return chunk
+        else:
+            # assume dict
+            return json.dumps(chunk)
 global _instrumentor
 _instrumentor: PayiInstrumentor
 def payi_instrument(
     payi: Optional[Union[Payi, AsyncPayi]] = None,
     instruments: Optional[Set[Instruments]] = None,
@@ -494,7 +806,6 @@ def payi_instrument(
         prompt_and_response_logger=prompt_and_response_logger,
     )
 def ingest(
     limit_ids: Optional["list[str]"] = None,
     request_tags: Optional["list[str]"] = None,
@@ -503,24 +814,38 @@ def ingest(
     user_id: Optional[str] = None,
 ) -> Any:
     def _ingest(func: Any) -> Any:
-        def _ingest_wrapper(*args: Any, **kwargs: Any) -> Any:
-            return _instrumentor._call_func(
-                func,
-                False,  # false -> ingest
-                limit_ids,
-                request_tags,
-                experience_name,
-                experience_id,
-                user_id,
-                *args,
-                **kwargs,
-            )
-        return _ingest_wrapper
+        import asyncio
+        if asyncio.iscoroutinefunction(func):
+            async def awrapper(*args: Any, **kwargs: Any) -> Any:
+                # Call the instrumentor's _call_func for async functions
+                return await _instrumentor._acall_func(
+                    func,
+                    False,
+                    limit_ids,
+                    request_tags,
+                    experience_name,
+                    experience_id,
+                    user_id,
+                    *args,
+                    *kwargs,
+                )
+            return awrapper
+        else:
+            def wrapper(*args: Any, **kwargs: Any) -> Any:
+                return _instrumentor._call_func(
+                    func,
+                    False,
+                    limit_ids,
+                    request_tags,
+                    experience_name,
+                    experience_id,
+                    user_id,
+                    *args,
+                    **kwargs,
+                )
+            return wrapper
     return _ingest
 def proxy(
     limit_ids: Optional["list[str]"] = None,
     request_tags: Optional["list[str]"] = None,
@@ -529,11 +854,36 @@ def proxy(
     user_id: Optional[str] = None,
 ) -> Any:
     def _proxy(func: Any) -> Any:
-        def _proxy_wrapper(*args: Any, **kwargs: Any) -> Any:
-            return _instrumentor._call_func(
-                func, True, limit_ids, request_tags, experience_name, experience_id, user_id, *args, **kwargs
-            )
+        import asyncio
+        if asyncio.iscoroutinefunction(func):
+            async def _proxy_awrapper(*args: Any, **kwargs: Any) -> Any:
+                return await _instrumentor._call_func(
+                    func,
+                    True,
+                    limit_ids,
+                    request_tags,
+                    experience_name,
+                    experience_id,
+                    user_id,
+                    *args,
+                    **kwargs
+                )
+            return _proxy_awrapper
+        else:
+            def _proxy_wrapper(*args: Any, **kwargs: Any) -> Any:
+                return _instrumentor._call_func(
+                    func,
+                    True,
+                    limit_ids,
+                    request_tags,
+                    experience_name,
+                    experience_id,
+                    user_id,
+                    *args,
+                    **kwargs
+                )
-        return _proxy_wrapper
+            return _proxy_wrapper
     return _proxy

payi 0.1.0a40__py3-none-any.whl → 0.1.0a42__py3-none-any.whl

Potentially problematic release.

payi 0.1.0a40__py3-none-any.whl → 0.1.0a42__py3-none-any.whl