deepeval 3.5.9 (py3-none-any.whl) → 3.6.1 (py3-none-any.whl)

This diff shows the changes between two publicly released versions of the package, as they appear in the public registry they were published to. It is provided for informational purposes only.
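At a glance: 3.5.9 shipped a DeepEval `Runner` subclass of the OpenAI Agents SDK runner (plus a patched `AgentRunner._get_model`) that wrapped `run`, `run_sync`, and `run_streamed` in an `Observer` span and accepted extra tracing kwargs (`metrics`, `metric_collection`, `name`, `tags`, `metadata`, `thread_id`, `user_id`). In 3.6.1 the entire module body is commented out. Below is a minimal usage sketch of the removed wrapper; the export path `deepeval.openai_agents` and the agent setup are assumptions, not confirmed by this diff.

```python
# Minimal usage sketch of the 3.5.9 wrapper removed in this diff.
# Assumptions (not shown in the diff): the class is exported from
# deepeval.openai_agents, and a plain Agent from the OpenAI Agents SDK is used.
import asyncio

from agents import Agent
from deepeval.openai_agents import Runner  # assumed export path

async def main():
    agent = Agent(name="assistant", instructions="Answer briefly.")
    # The extra keyword arguments below are the DeepEval-specific parameters
    # visible in the removed Runner.run signature.
    result = await Runner.run(
        agent,
        "What does this package do?",
        metric_collection="my-collection",
        name="demo-trace",
        thread_id="thread-1",
        user_id="user-1",
    )
    print(result.final_output)

asyncio.run(main())
```

After this change the import above would presumably fail or resolve differently; the diff alone does not show what, if anything, replaces the wrapper in 3.6.1.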
@@ -1,335 +1,348 @@
1
- from __future__ import annotations
2
-
3
- from dataclasses import replace
4
- from typing import List, Any, Union, Optional
5
-
6
- try:
7
- from agents import (
8
- RunConfig,
9
- RunResult,
10
- RunResultStreaming,
11
- Runner as AgentsRunner,
12
- )
13
- from agents.agent import Agent
14
- from agents.models.interface import ModelProvider
15
- from agents.items import TResponseInputItem
16
- from agents.lifecycle import RunHooks
17
- from agents.memory import Session
18
- from agents.run import DEFAULT_MAX_TURNS
19
- from agents.run import AgentRunner
20
- from agents.run_context import TContext
21
- from agents.models.interface import Model
22
-
23
- agents_available = True
24
- except:
25
- agents_available = False
26
-
27
-
28
- def is_agents_available():
29
- if not agents_available:
30
- raise ImportError(
31
- "agents is required for this integration. Install it via your package manager"
32
- )
33
-
34
-
35
- from deepeval.tracing.tracing import Observer
36
- from deepeval.tracing.context import current_span_context, current_trace_context
37
-
38
- # Import observed provider/model helpers from our agent module
39
- from deepeval.metrics import BaseMetric
40
- from deepeval.openai_agents.agent import _ObservedModel
41
-
42
- _PATCHED_DEFAULT_GET_MODEL = False
43
-
44
-
45
- def _patch_default_agent_runner_get_model():
46
- global _PATCHED_DEFAULT_GET_MODEL
47
- if _PATCHED_DEFAULT_GET_MODEL:
48
- return
49
-
50
- original_get_model = AgentRunner._get_model
51
-
52
- @classmethod
53
- def patched_get_model(
54
- cls, agent: Agent[Any], run_config: RunConfig
55
- ) -> Model:
56
- model = original_get_model(agent, run_config)
57
-
58
- # Extract attributes from agent if it's a DeepEvalAgent
59
- llm_metrics = getattr(agent, "llm_metrics", None)
60
- llm_metric_collection = getattr(agent, "llm_metric_collection", None)
61
- confident_prompt = getattr(agent, "confident_prompt", None)
62
- model = _ObservedModel(
63
- inner=model,
64
- llm_metric_collection=llm_metric_collection,
65
- llm_metrics=llm_metrics,
66
- confident_prompt=confident_prompt,
67
- )
68
-
69
- return model
70
-
71
- # Replace the method
72
- AgentRunner._get_model = patched_get_model
73
- _PATCHED_DEFAULT_GET_MODEL = True
74
-
75
-
76
- if agents_available:
77
- _patch_default_agent_runner_get_model()
78
-
79
-
80
- class Runner(AgentsRunner):
81
-
82
- @classmethod
83
- async def run(
84
- cls,
85
- starting_agent: Agent[TContext],
86
- input: Union[str, list[TResponseInputItem]],
87
- *,
88
- context: Optional[TContext] = None,
89
- max_turns: int = DEFAULT_MAX_TURNS,
90
- hooks: Optional[RunHooks[TContext]] = None,
91
- run_config: Optional[RunConfig] = None,
92
- previous_response_id: Optional[str] = None,
93
- conversation_id: Optional[str] = None,
94
- session: Optional[Session] = None,
95
- metrics: Optional[List[BaseMetric]] = None,
96
- metric_collection: Optional[str] = None,
97
- name: Optional[str] = None,
98
- tags: Optional[List[str]] = None,
99
- metadata: Optional[dict] = None,
100
- thread_id: Optional[str] = None,
101
- user_id: Optional[str] = None,
102
- **kwargs, # backwards compatibility
103
- ) -> RunResult:
104
- is_agents_available()
105
- # _patch_default_agent_runner_get_model()
106
-
107
- with Observer(
108
- span_type="custom",
109
- metric_collection=metric_collection,
110
- metrics=metrics,
111
- func_name="run",
112
- function_kwargs={"input": input}, # also set below
113
- ) as observer:
114
- update_trace_attributes(
115
- name=name,
116
- tags=tags,
117
- metadata=metadata,
118
- thread_id=thread_id,
119
- user_id=user_id,
120
- metric_collection=metric_collection,
121
- metrics=metrics,
122
- )
123
- current_span = current_span_context.get()
124
- current_trace = current_trace_context.get()
125
- if not current_trace.input:
126
- current_trace.input = input
127
- if current_span:
128
- current_span.input = input
129
- res = await super().run(
130
- starting_agent,
131
- input,
132
- context=context,
133
- max_turns=max_turns,
134
- hooks=hooks,
135
- run_config=run_config,
136
- previous_response_id=previous_response_id,
137
- conversation_id=conversation_id,
138
- session=session,
139
- **kwargs, # backwards compatibility
140
- )
141
- current_trace_thread_id = current_trace_context.get().thread_id
142
- _output = None
143
- if current_trace_thread_id:
144
- _output = res.final_output
145
- else:
146
- _output = str(res)
147
- observer.result = _output
148
- update_trace_attributes(output=_output)
149
- return res
150
-
151
- @classmethod
152
- def run_sync(
153
- cls,
154
- starting_agent: Agent[TContext],
155
- input: Union[str, list[TResponseInputItem]],
156
- *,
157
- context: Optional[TContext] = None,
158
- max_turns: int = DEFAULT_MAX_TURNS,
159
- hooks: Optional[RunHooks[TContext]] = None,
160
- run_config: Optional[RunConfig] = None,
161
- previous_response_id: Optional[str] = None,
162
- conversation_id: Optional[str] = None,
163
- session: Optional[Session] = None,
164
- metrics: Optional[List[BaseMetric]] = None,
165
- metric_collection: Optional[str] = None,
166
- name: Optional[str] = None,
167
- tags: Optional[List[str]] = None,
168
- metadata: Optional[dict] = None,
169
- thread_id: Optional[str] = None,
170
- user_id: Optional[str] = None,
171
- **kwargs,
172
- ) -> RunResult:
173
- is_agents_available()
174
-
175
- with Observer(
176
- span_type="custom",
177
- metric_collection=metric_collection,
178
- metrics=metrics,
179
- func_name="run_sync",
180
- function_kwargs={"input": input}, # also set below
181
- ) as observer:
182
- update_trace_attributes(
183
- name=name,
184
- tags=tags,
185
- metadata=metadata,
186
- thread_id=thread_id,
187
- user_id=user_id,
188
- metric_collection=metric_collection,
189
- metrics=metrics,
190
- )
191
-
192
- current_span = current_span_context.get()
193
- current_trace = current_trace_context.get()
194
- if not current_trace.input:
195
- current_trace.input = input
196
- if current_span:
197
- current_span.input = input
198
- res = super().run_sync(
199
- starting_agent,
200
- input,
201
- context=context,
202
- max_turns=max_turns,
203
- hooks=hooks,
204
- run_config=run_config,
205
- previous_response_id=previous_response_id,
206
- conversation_id=conversation_id,
207
- session=session,
208
- **kwargs, # backwards compatibility
209
- )
210
- current_trace_thread_id = current_trace_context.get().thread_id
211
- _output = None
212
- if current_trace_thread_id:
213
- _output = res.final_output
214
- else:
215
- _output = str(res)
216
- update_trace_attributes(output=_output)
217
- observer.result = _output
218
-
219
- return res
220
-
221
- @classmethod
222
- def run_streamed(
223
- cls,
224
- starting_agent: Agent[TContext],
225
- input: Union[str, list[TResponseInputItem]],
226
- *,
227
- context: Optional[TContext] = None,
228
- max_turns: int = DEFAULT_MAX_TURNS,
229
- hooks: Optional[RunHooks[TContext]] = None,
230
- run_config: Optional[RunConfig] = None,
231
- previous_response_id: Optional[str] = None,
232
- conversation_id: Optional[str] = None,
233
- session: Optional[Session] = None,
234
- metrics: Optional[List[BaseMetric]] = None,
235
- metric_collection: Optional[str] = None,
236
- name: Optional[str] = None,
237
- tags: Optional[List[str]] = None,
238
- metadata: Optional[dict] = None,
239
- thread_id: Optional[str] = None,
240
- user_id: Optional[str] = None,
241
- **kwargs, # backwards compatibility
242
- ) -> RunResultStreaming:
243
- is_agents_available()
244
- # Manually enter observer; we'll exit when streaming finishes
245
- observer = Observer(
246
- span_type="custom",
247
- metric_collection=metric_collection,
248
- metrics=metrics,
249
- func_name="run_streamed",
250
- function_kwargs={"input": input},
251
- )
252
- observer.__enter__()
253
-
254
- update_trace_attributes(
255
- name=name,
256
- tags=tags,
257
- metadata=metadata,
258
- thread_id=thread_id,
259
- user_id=user_id,
260
- metric_collection=metric_collection,
261
- metrics=metrics,
262
- )
263
- current_trace = current_trace_context.get()
264
- if not current_trace.input:
265
- current_trace.input = input
266
-
267
- current_span = current_span_context.get()
268
- if current_span:
269
- current_span.input = input
270
-
271
- res = super().run_streamed(
272
- starting_agent,
273
- input,
274
- context=context,
275
- max_turns=max_turns,
276
- hooks=hooks,
277
- run_config=run_config,
278
- previous_response_id=previous_response_id,
279
- conversation_id=conversation_id,
280
- session=session,
281
- **kwargs, # backwards compatibility
282
- )
283
-
284
- # Runtime-patch stream_events so the observer closes only after streaming completes
285
- orig_stream_events = res.stream_events
286
-
287
- async def _patched_stream_events(self: RunResultStreaming):
288
- try:
289
- async for event in orig_stream_events():
290
- yield event
291
- observer.result = self.final_output
292
- update_trace_attributes(output=self.final_output)
293
- except Exception as e:
294
- observer.__exit__(type(e), e, e.__traceback__)
295
- raise
296
- finally:
297
- observer.__exit__(None, None, None)
298
-
299
- from types import MethodType as _MethodType
300
-
301
- res.stream_events = _MethodType(_patched_stream_events, res)
302
-
303
- return res
304
-
305
-
306
- def update_trace_attributes(
307
- input: Any = None,
308
- output: Any = None,
309
- name: str = None,
310
- tags: List[str] = None,
311
- metadata: dict = None,
312
- thread_id: str = None,
313
- user_id: str = None,
314
- metric_collection: str = None,
315
- metrics: List[BaseMetric] = None,
316
- ):
317
- current_trace = current_trace_context.get()
318
- if input:
319
- current_trace.input = input
320
- if output:
321
- current_trace.output = output
322
- if name:
323
- current_trace.name = name
324
- if tags:
325
- current_trace.tags = tags
326
- if metadata:
327
- current_trace.metadata = metadata
328
- if thread_id:
329
- current_trace.thread_id = thread_id
330
- if user_id:
331
- current_trace.user_id = user_id
332
- if metric_collection:
333
- current_trace.metric_collection = metric_collection
334
- if metrics:
335
- current_trace.metrics = metrics
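Everything above is deleted in 3.6.1; the block that follows re-adds the same module with every line commented out, plus a few extra commented imports and a rewritten `_get_model` patch. The core technique on both sides is the same: re-bind the `AgentRunner._get_model` classmethod so the resolved model is wrapped in an observing proxy, guarded by a module-level flag so the patch is idempotent. A self-contained sketch of that pattern, using stand-in names rather than the real SDK or DeepEval classes:

```python
# Sketch of the classmethod monkey-patching pattern used in this module.
# _FakeRunner stands in for agents.run.AgentRunner; the ("observed", ...)
# tuple stands in for _ObservedModel(inner=model, ...). Illustrative only.

class _FakeRunner:
    @classmethod
    def _get_model(cls, agent, run_config):
        return f"model-for-{agent}"

_PATCHED = False

def patch_get_model():
    global _PATCHED
    if _PATCHED:  # idempotent, like the diff's _PATCHED_DEFAULT_GET_MODEL flag
        return
    original = _FakeRunner._get_model.__func__  # unwrap the classmethod

    def patched(cls, agent, run_config):
        model = original(cls, agent, run_config)
        return ("observed", model)  # wrap the resolved model in a proxy

    _FakeRunner._get_model = classmethod(patched)
    _PATCHED = True

patch_get_model()
print(_FakeRunner._get_model("agent-a", None))  # ('observed', 'model-for-agent-a')
```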
1
+ # from __future__ import annotations
2
+
3
+ # from dataclasses import replace
4
+ # from typing import List, Any, Union, Optional
5
+
6
+ # try:
7
+ # from agents import (
8
+ # RunConfig,
9
+ # RunResult,
10
+ # RunResultStreaming,
11
+ # Runner as AgentsRunner,
12
+ # )
13
+ # from agents.agent import Agent
14
+ # from agents.models.interface import ModelProvider
15
+ # from agents.items import TResponseInputItem
16
+ # from agents.lifecycle import RunHooks
17
+ # from agents.memory import Session
18
+ # from agents.run import DEFAULT_MAX_TURNS
19
+ # from agents.run import AgentRunner
20
+ # from agents.run_context import TContext
21
+ # from agents.models.interface import Model
22
+ # from agents.run import SingleStepResult
23
+
24
+ # agents_available = True
25
+ # except:
26
+ # agents_available = False
27
+
28
+
29
+ # def is_agents_available():
30
+ # if not agents_available:
31
+ # raise ImportError(
32
+ # "agents is required for this integration. Install it via your package manager"
33
+ # )
34
+
35
+
36
+ # from deepeval.tracing.tracing import Observer
37
+ # from deepeval.tracing.context import current_span_context, current_trace_context
38
+ # from deepeval.tracing.utils import make_json_serializable
39
+ # from deepeval.tracing.types import AgentSpan
40
+
41
+ # # Import observed provider/model helpers from our agent module
42
+ # from deepeval.metrics import BaseMetric
43
+ # from deepeval.openai_agents.agent import _ObservedModel
44
+
45
+ # _PATCHED_DEFAULT_GET_MODEL = False
46
+ # _PATCHED_DEFAULT_RUN_SINGLE_TURN = False
47
+
48
+ # def patch_default_agent_runner_get_model():
49
+ # global _PATCHED_DEFAULT_GET_MODEL
50
+ # if _PATCHED_DEFAULT_GET_MODEL:
51
+ # return
52
+
53
+ # original_get_model_cm = AgentRunner._get_model
54
+ # try:
55
+ # original_get_model = original_get_model_cm.__func__
56
+ # except AttributeError:
57
+ # original_get_model = original_get_model_cm # fallback (non-classmethod edge case)
58
+
59
+ # def patched_get_model(cls, *args, **kwargs) -> Model:
60
+ # model = original_get_model(cls, *args, **kwargs)
61
+
62
+ # agent = kwargs.get("agent") if "agent" in kwargs else (args[0] if args else None)
63
+ # if agent is None:
64
+ # return model
65
+
66
+ # if isinstance(model, _ObservedModel):
67
+ # return model
68
+
69
+ # llm_metrics = getattr(agent, "llm_metrics", None)
70
+ # llm_metric_collection = getattr(agent, "llm_metric_collection", None)
71
+ # confident_prompt = getattr(agent, "confident_prompt", None)
72
+ # return _ObservedModel(
73
+ # inner=model,
74
+ # llm_metric_collection=llm_metric_collection,
75
+ # llm_metrics=llm_metrics,
76
+ # confident_prompt=confident_prompt,
77
+ # )
78
+
79
+ # # Preserve basic metadata and mark as patched
80
+ # patched_get_model.__name__ = original_get_model.__name__
81
+ # patched_get_model.__doc__ = original_get_model.__doc__
82
+
83
+ # AgentRunner._get_model = classmethod(patched_get_model)
84
+ # _PATCHED_DEFAULT_GET_MODEL = True
85
+
86
+
87
+ # # if agents_available:
88
+ # # patch_default_agent_run_single_turn()
89
+ # # patch_single_turn_streamed()
90
+ # # patch_default_agent_runner_get_model()
91
+
92
+
93
+ # class Runner(AgentsRunner):
94
+
95
+ # @classmethod
96
+ # async def run(
97
+ # cls,
98
+ # starting_agent: Agent[TContext],
99
+ # input: Union[str, list[TResponseInputItem]],
100
+ # *,
101
+ # context: Optional[TContext] = None,
102
+ # max_turns: int = DEFAULT_MAX_TURNS,
103
+ # hooks: Optional[RunHooks[TContext]] = None,
104
+ # run_config: Optional[RunConfig] = None,
105
+ # previous_response_id: Optional[str] = None,
106
+ # conversation_id: Optional[str] = None,
107
+ # session: Optional[Session] = None,
108
+ # metrics: Optional[List[BaseMetric]] = None,
109
+ # metric_collection: Optional[str] = None,
110
+ # name: Optional[str] = None,
111
+ # tags: Optional[List[str]] = None,
112
+ # metadata: Optional[dict] = None,
113
+ # thread_id: Optional[str] = None,
114
+ # user_id: Optional[str] = None,
115
+ # **kwargs, # backwards compatibility
116
+ # ) -> RunResult:
117
+ # is_agents_available()
118
+ # # _patch_default_agent_runner_get_model()
119
+
120
+ # with Observer(
121
+ # span_type="custom",
122
+ # metric_collection=metric_collection,
123
+ # metrics=metrics,
124
+ # func_name="run",
125
+ # function_kwargs={"input": input}, # also set below
126
+ # ) as observer:
127
+ # update_trace_attributes(
128
+ # name=name,
129
+ # tags=tags,
130
+ # metadata=metadata,
131
+ # thread_id=thread_id,
132
+ # user_id=user_id,
133
+ # metric_collection=metric_collection,
134
+ # metrics=metrics,
135
+ # )
136
+ # current_span = current_span_context.get()
137
+ # current_trace = current_trace_context.get()
138
+ # if not current_trace.input:
139
+ # current_trace.input = input
140
+ # if current_span:
141
+ # current_span.input = input
142
+ # res = await super().run(
143
+ # starting_agent,
144
+ # input,
145
+ # context=context,
146
+ # max_turns=max_turns,
147
+ # hooks=hooks,
148
+ # run_config=run_config,
149
+ # previous_response_id=previous_response_id,
150
+ # conversation_id=conversation_id,
151
+ # session=session,
152
+ # **kwargs, # backwards compatibility
153
+ # )
154
+ # current_trace_thread_id = current_trace_context.get().thread_id
155
+ # _output = None
156
+ # if current_trace_thread_id:
157
+ # _output = res.final_output
158
+ # else:
159
+ # _output = str(res)
160
+ # observer.result = _output
161
+ # update_trace_attributes(output=_output)
162
+ # return res
163
+
164
+ # @classmethod
165
+ # def run_sync(
166
+ # cls,
167
+ # starting_agent: Agent[TContext],
168
+ # input: Union[str, list[TResponseInputItem]],
169
+ # *,
170
+ # context: Optional[TContext] = None,
171
+ # max_turns: int = DEFAULT_MAX_TURNS,
172
+ # hooks: Optional[RunHooks[TContext]] = None,
173
+ # run_config: Optional[RunConfig] = None,
174
+ # previous_response_id: Optional[str] = None,
175
+ # conversation_id: Optional[str] = None,
176
+ # session: Optional[Session] = None,
177
+ # metrics: Optional[List[BaseMetric]] = None,
178
+ # metric_collection: Optional[str] = None,
179
+ # name: Optional[str] = None,
180
+ # tags: Optional[List[str]] = None,
181
+ # metadata: Optional[dict] = None,
182
+ # thread_id: Optional[str] = None,
183
+ # user_id: Optional[str] = None,
184
+ # **kwargs,
185
+ # ) -> RunResult:
186
+ # is_agents_available()
187
+
188
+ # with Observer(
189
+ # span_type="custom",
190
+ # metric_collection=metric_collection,
191
+ # metrics=metrics,
192
+ # func_name="run_sync",
193
+ # function_kwargs={"input": input}, # also set below
194
+ # ) as observer:
195
+ # update_trace_attributes(
196
+ # name=name,
197
+ # tags=tags,
198
+ # metadata=metadata,
199
+ # thread_id=thread_id,
200
+ # user_id=user_id,
201
+ # metric_collection=metric_collection,
202
+ # metrics=metrics,
203
+ # )
204
+
205
+ # current_span = current_span_context.get()
206
+ # current_trace = current_trace_context.get()
207
+ # if not current_trace.input:
208
+ # current_trace.input = input
209
+ # if current_span:
210
+ # current_span.input = input
211
+ # res = super().run_sync(
212
+ # starting_agent,
213
+ # input,
214
+ # context=context,
215
+ # max_turns=max_turns,
216
+ # hooks=hooks,
217
+ # run_config=run_config,
218
+ # previous_response_id=previous_response_id,
219
+ # conversation_id=conversation_id,
220
+ # session=session,
221
+ # **kwargs, # backwards compatibility
222
+ # )
223
+ # current_trace_thread_id = current_trace_context.get().thread_id
224
+ # _output = None
225
+ # if current_trace_thread_id:
226
+ # _output = res.final_output
227
+ # else:
228
+ # _output = str(res)
229
+ # update_trace_attributes(output=_output)
230
+ # observer.result = _output
231
+
232
+ # return res
233
+
234
+ # @classmethod
235
+ # def run_streamed(
236
+ # cls,
237
+ # starting_agent: Agent[TContext],
238
+ # input: Union[str, list[TResponseInputItem]],
239
+ # *,
240
+ # context: Optional[TContext] = None,
241
+ # max_turns: int = DEFAULT_MAX_TURNS,
242
+ # hooks: Optional[RunHooks[TContext]] = None,
243
+ # run_config: Optional[RunConfig] = None,
244
+ # previous_response_id: Optional[str] = None,
245
+ # conversation_id: Optional[str] = None,
246
+ # session: Optional[Session] = None,
247
+ # metrics: Optional[List[BaseMetric]] = None,
248
+ # metric_collection: Optional[str] = None,
249
+ # name: Optional[str] = None,
250
+ # tags: Optional[List[str]] = None,
251
+ # metadata: Optional[dict] = None,
252
+ # thread_id: Optional[str] = None,
253
+ # user_id: Optional[str] = None,
254
+ # **kwargs, # backwards compatibility
255
+ # ) -> RunResultStreaming:
256
+ # is_agents_available()
257
+ # # Manually enter observer; we'll exit when streaming finishes
258
+ # observer = Observer(
259
+ # span_type="custom",
260
+ # metric_collection=metric_collection,
261
+ # metrics=metrics,
262
+ # func_name="run_streamed",
263
+ # function_kwargs={"input": input},
264
+ # )
265
+ # observer.__enter__()
266
+
267
+ # update_trace_attributes(
268
+ # name=name,
269
+ # tags=tags,
270
+ # metadata=metadata,
271
+ # thread_id=thread_id,
272
+ # user_id=user_id,
273
+ # metric_collection=metric_collection,
274
+ # metrics=metrics,
275
+ # )
276
+ # current_trace = current_trace_context.get()
277
+ # if not current_trace.input:
278
+ # current_trace.input = input
279
+
280
+ # current_span = current_span_context.get()
281
+ # if current_span:
282
+ # current_span.input = input
283
+
284
+ # res = super().run_streamed(
285
+ # starting_agent,
286
+ # input,
287
+ # context=context,
288
+ # max_turns=max_turns,
289
+ # hooks=hooks,
290
+ # run_config=run_config,
291
+ # previous_response_id=previous_response_id,
292
+ # conversation_id=conversation_id,
293
+ # session=session,
294
+ # **kwargs, # backwards compatibility
295
+ # )
296
+
297
+ # # Runtime-patch stream_events so the observer closes only after streaming completes
298
+ # orig_stream_events = res.stream_events
299
+
300
+ # async def _patched_stream_events(self: RunResultStreaming):
301
+ # try:
302
+ # async for event in orig_stream_events():
303
+ # yield event
304
+ # observer.result = self.final_output
305
+ # update_trace_attributes(output=self.final_output)
306
+ # except Exception as e:
307
+ # observer.__exit__(type(e), e, e.__traceback__)
308
+ # raise
309
+ # finally:
310
+ # observer.__exit__(None, None, None)
311
+
312
+ # from types import MethodType as _MethodType
313
+
314
+ # res.stream_events = _MethodType(_patched_stream_events, res)
315
+
316
+ # return res
317
+
318
+
319
+ # def update_trace_attributes(
320
+ # input: Any = None,
321
+ # output: Any = None,
322
+ # name: str = None,
323
+ # tags: List[str] = None,
324
+ # metadata: dict = None,
325
+ # thread_id: str = None,
326
+ # user_id: str = None,
327
+ # metric_collection: str = None,
328
+ # metrics: List[BaseMetric] = None,
329
+ # ):
330
+ # current_trace = current_trace_context.get()
331
+ # if input:
332
+ # current_trace.input = input
333
+ # if output:
334
+ # current_trace.output = output
335
+ # if name:
336
+ # current_trace.name = name
337
+ # if tags:
338
+ # current_trace.tags = tags
339
+ # if metadata:
340
+ # current_trace.metadata = metadata
341
+ # if thread_id:
342
+ # current_trace.thread_id = thread_id
343
+ # if user_id:
344
+ # current_trace.user_id = user_id
345
+ # if metric_collection:
346
+ # current_trace.metric_collection = metric_collection
347
+ # if metrics:
348
+ # current_trace.metrics = metrics
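For reference, the other notable technique in this module (present in both the removed and the commented-out code) is how `run_streamed` keeps its observer open until streaming finishes: it re-binds the result's `stream_events` async generator with `types.MethodType` and closes the observer only after the stream is consumed. A self-contained sketch with stand-in classes follows; none of these names come from deepeval or the Agents SDK.

```python
# Sketch of the stream_events re-binding used by run_streamed above: the
# original async generator is wrapped so the span/observer is closed only
# after the stream is fully consumed (or on error). Names are illustrative.
import asyncio
from types import MethodType

class _FakeStreamResult:          # stands in for RunResultStreaming
    final_output = "done"

    async def stream_events(self):
        for event in ("a", "b", "c"):
            yield event

class _FakeObserver:              # stands in for deepeval's Observer
    def __enter__(self):
        print("span opened")
        return self

    def __exit__(self, exc_type, exc, tb):
        print("span closed")

def wrap(result, observer):
    orig = result.stream_events   # keep the original bound generator

    async def patched(self):
        try:
            async for event in orig():
                yield event
            observer.result = self.final_output  # record output once done
        finally:
            observer.__exit__(None, None, None)

    result.stream_events = MethodType(patched, result)
    return result

async def main():
    obs = _FakeObserver()
    obs.__enter__()
    res = wrap(_FakeStreamResult(), obs)
    async for ev in res.stream_events():
        print("event:", ev)

asyncio.run(main())
```

Note that the sketch closes the observer exactly once, in `finally`; the code in the diff also calls `observer.__exit__` in the `except` branch before re-raising, so on an error it closes the observer a second time.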