deepeval 3.7.6__py3-none-any.whl → 3.7.8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- deepeval/_version.py +1 -1
- deepeval/cli/main.py +2022 -759
- deepeval/cli/utils.py +208 -36
- deepeval/config/dotenv_handler.py +19 -0
- deepeval/config/settings.py +658 -262
- deepeval/config/utils.py +9 -1
- deepeval/dataset/test_run_tracer.py +4 -6
- deepeval/evaluate/execute.py +153 -94
- deepeval/integrations/pydantic_ai/instrumentator.py +4 -2
- deepeval/integrations/pydantic_ai/otel.py +5 -1
- deepeval/key_handler.py +121 -51
- deepeval/metrics/base_metric.py +9 -3
- deepeval/metrics/g_eval/g_eval.py +6 -1
- deepeval/metrics/indicator.py +8 -4
- deepeval/metrics/mcp/mcp_task_completion.py +15 -16
- deepeval/metrics/mcp/multi_turn_mcp_use_metric.py +15 -15
- deepeval/metrics/mcp/schema.py +4 -0
- deepeval/metrics/mcp/template.py +8 -1
- deepeval/metrics/prompt_alignment/prompt_alignment.py +6 -3
- deepeval/metrics/tool_use/schema.py +4 -0
- deepeval/metrics/tool_use/template.py +16 -2
- deepeval/metrics/tool_use/tool_use.py +30 -28
- deepeval/metrics/topic_adherence/schema.py +4 -0
- deepeval/metrics/topic_adherence/template.py +8 -1
- deepeval/metrics/topic_adherence/topic_adherence.py +15 -14
- deepeval/metrics/turn_contextual_precision/template.py +8 -1
- deepeval/metrics/turn_contextual_precision/turn_contextual_precision.py +44 -86
- deepeval/metrics/turn_contextual_recall/template.py +8 -1
- deepeval/metrics/turn_contextual_recall/turn_contextual_recall.py +44 -82
- deepeval/metrics/turn_contextual_relevancy/template.py +8 -1
- deepeval/metrics/turn_contextual_relevancy/turn_contextual_relevancy.py +48 -92
- deepeval/metrics/turn_faithfulness/template.py +8 -1
- deepeval/metrics/turn_faithfulness/turn_faithfulness.py +76 -130
- deepeval/metrics/utils.py +16 -1
- deepeval/models/__init__.py +2 -0
- deepeval/models/llms/__init__.py +2 -0
- deepeval/models/llms/amazon_bedrock_model.py +5 -4
- deepeval/models/llms/anthropic_model.py +4 -3
- deepeval/models/llms/azure_model.py +4 -3
- deepeval/models/llms/deepseek_model.py +5 -8
- deepeval/models/llms/grok_model.py +5 -8
- deepeval/models/llms/kimi_model.py +5 -8
- deepeval/models/llms/litellm_model.py +2 -0
- deepeval/models/llms/local_model.py +1 -1
- deepeval/models/llms/openai_model.py +4 -3
- deepeval/models/retry_policy.py +10 -5
- deepeval/models/utils.py +1 -5
- deepeval/simulator/conversation_simulator.py +6 -2
- deepeval/simulator/template.py +3 -1
- deepeval/synthesizer/synthesizer.py +19 -17
- deepeval/test_run/test_run.py +6 -1
- deepeval/utils.py +26 -0
- {deepeval-3.7.6.dist-info → deepeval-3.7.8.dist-info}/METADATA +3 -3
- {deepeval-3.7.6.dist-info → deepeval-3.7.8.dist-info}/RECORD +57 -56
- {deepeval-3.7.6.dist-info → deepeval-3.7.8.dist-info}/LICENSE.md +0 -0
- {deepeval-3.7.6.dist-info → deepeval-3.7.8.dist-info}/WHEEL +0 -0
- {deepeval-3.7.6.dist-info → deepeval-3.7.8.dist-info}/entry_points.txt +0 -0
deepeval/config/utils.py
CHANGED
@@ -1,7 +1,8 @@
 import json
 import os
 import re
-
+from dotenv import dotenv_values
+from pathlib import Path
 from typing import Any, Iterable, List, Optional


@@ -142,3 +143,10 @@ def dedupe_preserve_order(items: Iterable[str]) -> List[str]:
 def constrain_between(value: float, lo: float, hi: float) -> float:
     """Return value constrained to the inclusive range [lo, hi]."""
     return min(max(value, lo), hi)
+
+
+def read_dotenv_file(path: Path) -> dict[str, str]:
+    if not path.exists():
+        return {}
+    values = dotenv_values(path)
+    return {key: value for key, value in values.items() if value is not None}
deepeval/dataset/test_run_tracer.py
CHANGED

@@ -5,6 +5,7 @@ from opentelemetry.trace import Tracer as OTelTracer
 from opentelemetry.sdk.trace import SpanProcessor
 from opentelemetry.sdk.trace import TracerProvider
 from opentelemetry.sdk.trace.export import BatchSpanProcessor
+from deepeval.config.settings import get_settings

 try:
     from opentelemetry.exporter.otlp.proto.http.trace_exporter import (
@@ -26,11 +27,8 @@ def is_opentelemetry_available():

 from deepeval.confident.api import get_confident_api_key

-
-
-    if os.getenv("OTEL_EXPORTER_OTLP_ENDPOINT")
-    else "https://otel.confident-ai.com"
-)
+settings = get_settings()
+OTLP_ENDPOINT = str(settings.CONFIDENT_OTEL_URL)
 # OTLP_ENDPOINT = "http://127.0.0.1:4318"

 # Module-level globals to be imported and used by other code
@@ -67,7 +65,7 @@ def init_global_test_run_tracer(api_key: Optional[str] = None):

     provider = TracerProvider()
     exporter = OTLPSpanExporter(
-        endpoint=f"{OTLP_ENDPOINT}
+        endpoint=f"{OTLP_ENDPOINT}v1/traces",
         headers={"x-confident-api-key": api_key},
     )
     provider.add_span_processor(RunIdSpanProcessor())
deepeval/evaluate/execute.py
CHANGED
@@ -51,6 +51,10 @@ from deepeval.utils import (
     shorten,
     len_medium,
     format_error_text,
+    are_timeouts_disabled,
+    get_per_task_timeout_seconds,
+    get_gather_timeout_seconds,
+    get_gather_timeout,
 )
 from deepeval.telemetry import capture_evaluation_run
 from deepeval.metrics import (
@@ -109,6 +113,57 @@ from deepeval.test_run.hyperparameters import (
 logger = logging.getLogger(__name__)


+def _timeout_msg(action: str, seconds: float) -> str:
+    if are_timeouts_disabled():
+        return (
+            f"Timeout occurred while {action} "
+            "(DeepEval timeouts are disabled; this likely came from the model/provider SDK or network layer). "
+            "Set DEEPEVAL_LOG_STACK_TRACES=1 for full traceback."
+        )
+    return (
+        f"Timed out after {seconds:.2f}s while {action}. "
+        "Increase DEEPEVAL_PER_TASK_TIMEOUT_SECONDS_OVERRIDE or set "
+        "DEEPEVAL_LOG_STACK_TRACES=1 for full traceback."
+    )
+
+
+def _log_gather_timeout(
+    logger,
+    *,
+    exc: Optional[BaseException] = None,
+    pending: Optional[int] = None,
+) -> None:
+    settings = get_settings()
+    if are_timeouts_disabled():
+        logger.warning(
+            "A task raised %s while waiting for gathered results; DeepEval gather/per-task timeouts are disabled%s. "
+            "This likely came from the model/provider SDK or network layer.",
+            type(exc).__name__ if exc else "TimeoutError",
+            f" (pending={pending})" if pending is not None else "",
+            exc_info=settings.DEEPEVAL_LOG_STACK_TRACES,
+        )
+    else:
+        if pending is not None:
+            logger.warning(
+                "Gather TIMEOUT after %.1fs; pending=%d tasks. "
+                "Some metrics may be marked as timed out. "
+                "To give tasks more time, consider increasing "
+                "DEEPEVAL_PER_TASK_TIMEOUT_SECONDS_OVERRIDE or "
+                "DEEPEVAL_TASK_GATHER_BUFFER_SECONDS_OVERRIDE.",
+                get_gather_timeout_seconds(),
+                pending,
+            )
+
+        else:
+            logger.warning(
+                "gather TIMEOUT after %.1fs. Some metrics may be marked as timed out. "
+                "To give tasks more time, consider increasing "
+                "DEEPEVAL_PER_TASK_TIMEOUT_SECONDS_OVERRIDE or "
+                "DEEPEVAL_TASK_GATHER_BUFFER_SECONDS_OVERRIDE.",
+                get_gather_timeout_seconds(),
+            )
+
+
 def _skip_metrics_for_error(
     span: Optional[BaseSpan] = None,
     trace: Optional[Trace] = None,
@@ -217,18 +272,6 @@ async def _snapshot_tasks():
     return {t for t in asyncio.all_tasks() if t is not cur}


-def _per_task_timeout() -> float:
-    return get_settings().DEEPEVAL_PER_TASK_TIMEOUT_SECONDS
-
-
-def _gather_timeout() -> float:
-    s = get_settings()
-    return (
-        s.DEEPEVAL_PER_TASK_TIMEOUT_SECONDS
-        + s.DEEPEVAL_TASK_GATHER_BUFFER_SECONDS
-    )
-
-
 def filter_duplicate_results(
     main_result: TestResult, results: List[TestResult]
 ) -> List[TestResult]:
@@ -250,6 +293,10 @@ async def _await_with_outer_deadline(obj, *args, timeout: float, **kwargs):
            coro = obj
        else:
            coro = obj(*args, **kwargs)
+
+        if get_settings().DEEPEVAL_DISABLE_TIMEOUTS:
+            return await coro
+
        return await asyncio.wait_for(coro, timeout=timeout)
    finally:
        reset_outer_deadline(token)
@@ -350,7 +397,7 @@ def execute_test_cases(
        index_of = {id(m): i for i, m in enumerate(metrics_for_case)}
        current_index = -1
        start_time = time.perf_counter()
-        deadline_timeout =
+        deadline_timeout = get_per_task_timeout_seconds()
        deadline_token = set_outer_deadline(deadline_timeout)
        new_cached_test_case: CachedTestCase = None
        try:
@@ -435,25 +482,20 @@ def execute_test_cases(

            run_sync_with_timeout(_run_case, deadline_timeout)
        except (asyncio.TimeoutError, TimeoutError):
-
-
-
-
-            )
-            for i, m in enumerate(metrics_for_case):
-                if getattr(m, "skipped", False):
+
+            msg = _timeout_msg("evaluating metric", deadline_timeout)
+            for i, metric in enumerate(metrics_for_case):
+                if metric.skipped:
                    continue
                # already finished or errored? leave it
-                if
-                    m, "error", None
-                ):
+                if metric.success is not None or metric.error is not None:
                    continue
                if i == current_index:
-
-
+                    metric.success = False
+                    metric.error = msg
                elif i > current_index:
-
-
+                    metric.success = False
+                    metric.error = "Skipped due to case timeout."

            if not error_config.ignore_errors:
                raise
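A toy version of the bookkeeping above: on a case timeout, the metric that was in flight (`current_index`) gets the timeout message, anything after it is marked as skipped, and metrics that already finished or errored are left untouched. The `MetricStub` class and metric names are purely illustrative:

```python
# Illustrative only; real deepeval metrics expose skipped/success/error attributes.
from dataclasses import dataclass
from typing import Optional


@dataclass
class MetricStub:
    name: str
    skipped: bool = False
    success: Optional[bool] = None
    error: Optional[str] = None


metrics = [
    MetricStub("answer_relevancy", success=True),  # already finished
    MetricStub("faithfulness"),                    # was running when the deadline hit
    MetricStub("toxicity"),                        # never started
]
current_index = 1
msg = "Timed out after 240.00s while evaluating metric."

for i, metric in enumerate(metrics):
    if metric.skipped or metric.success is not None or metric.error is not None:
        continue
    if i == current_index:
        metric.success, metric.error = False, msg
    elif i > current_index:
        metric.success, metric.error = False, "Skipped due to case timeout."

print([(m.name, m.success, m.error) for m in metrics])
```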
@@ -478,12 +520,12 @@ def execute_test_cases(
            )

            # Attach MetricData for *all* metrics (finished or synthesized)
-            for i,
-                if
+            for i, metric in enumerate(metrics_for_case):
+                if metric.skipped:
                    continue
                if not emitted[i]:
                    api_test_case.update_metric_data(
-                        create_metric_data(
+                        create_metric_data(metric)
                    )

            elapsed = time.perf_counter() - start_time
@@ -536,9 +578,8 @@ async def a_execute_test_cases(

    async def execute_with_semaphore(func: Callable, *args, **kwargs):
        async with semaphore:
-            timeout = _per_task_timeout()
            return await _await_with_outer_deadline(
-                func, *args, timeout=
+                func, *args, timeout=get_per_task_timeout_seconds(), **kwargs
            )

    global_test_run_cache_manager.disable_write_cache = (
@@ -636,17 +677,16 @@ async def a_execute_test_cases(
        try:
            await asyncio.wait_for(
                asyncio.gather(*tasks),
-                timeout=
+                timeout=get_gather_timeout(),
            )
-        except (asyncio.TimeoutError, TimeoutError):
+        except (asyncio.TimeoutError, TimeoutError) as e:
            for t in tasks:
                if not t.done():
                    t.cancel()
            await asyncio.gather(*tasks, return_exceptions=True)
-
-
-
-            )
+
+            _log_gather_timeout(logger, exc=e)
+
            if not error_config.ignore_errors:
                raise

@@ -706,7 +746,7 @@ async def a_execute_test_cases(
        try:
            await asyncio.wait_for(
                asyncio.gather(*tasks),
-                timeout=
+                timeout=get_gather_timeout(),
            )
        except (asyncio.TimeoutError, TimeoutError):
            # Cancel any still-pending tasks and drain them
@@ -775,11 +815,18 @@ async def _a_execute_llm_test_cases(
                progress=progress,
            )
    except asyncio.CancelledError:
-
-
-
-
-
+        if get_settings().DEEPEVAL_DISABLE_TIMEOUTS:
+            msg = (
+                "Cancelled while evaluating metric. "
+                "(DeepEval timeouts are disabled; this cancellation likely came from upstream orchestration or manual cancellation). "
+                "Set DEEPEVAL_LOG_STACK_TRACES=1 for full traceback."
+            )
+        else:
+            msg = (
+                "Timed out/cancelled while evaluating metric. "
+                "Increase DEEPEVAL_PER_TASK_TIMEOUT_SECONDS_OVERRIDE or set "
+                "DEEPEVAL_LOG_STACK_TRACES=1 for full traceback."
+            )
        for m in metrics:
            if getattr(m, "skipped", False):
                continue
@@ -885,11 +932,18 @@ async def _a_execute_conversational_test_cases(
            )

    except asyncio.CancelledError:
-
-
-
-
-
+        if get_settings().DEEPEVAL_DISABLE_TIMEOUTS:
+            msg = (
+                "Cancelled while evaluating metric. "
+                "(DeepEval timeouts are disabled; this cancellation likely came from upstream orchestration or manual cancellation). "
+                "Set DEEPEVAL_LOG_STACK_TRACES=1 for full traceback."
+            )
+        else:
+            msg = (
+                "Timed out/cancelled while evaluating metric. "
+                "Increase DEEPEVAL_PER_TASK_TIMEOUT_SECONDS_OVERRIDE or set "
+                "DEEPEVAL_LOG_STACK_TRACES=1 for full traceback."
+            )
        for m in metrics:
            if getattr(m, "skipped", False):
                continue
@@ -999,7 +1053,7 @@ def execute_agentic_test_cases(
                loop.run_until_complete(
                    _await_with_outer_deadline(
                        coro,
-                        timeout=
+                        timeout=get_per_task_timeout_seconds(),
                    )
                )
            else:
@@ -1326,17 +1380,13 @@ def execute_agentic_test_cases(

        # run the golden with a timeout
        start_time = time.perf_counter()
-        deadline =
+        deadline = get_per_task_timeout_seconds()

        try:
            run_sync_with_timeout(_run_golden, deadline)
        except (asyncio.TimeoutError, TimeoutError):
            # mark any not yet finished trace level and span level metrics as timed out.
-            msg = (
-                f"Timed out after {deadline:.2f}s while executing agentic test case. "
-                "Increase DEEPEVAL_PER_TASK_TIMEOUT_SECONDS_OVERRIDE or set "
-                "DEEPEVAL_LOG_STACK_TRACES=1 for full traceback."
-            )
+            msg = _timeout_msg("executing agentic test case", deadline)

            if current_trace is not None:
                # Trace-level metrics
@@ -1517,9 +1567,8 @@ async def a_execute_agentic_test_cases(

    async def execute_with_semaphore(func: Callable, *args, **kwargs):
        async with semaphore:
-            timeout = _per_task_timeout()
            return await _await_with_outer_deadline(
-                func, *args, timeout=
+                func, *args, timeout=get_per_task_timeout_seconds(), **kwargs
            )

    test_run_manager = global_test_run_manager
@@ -1570,7 +1619,7 @@ async def a_execute_agentic_test_cases(
        try:
            await asyncio.wait_for(
                asyncio.gather(*tasks),
-                timeout=
+                timeout=get_gather_timeout(),
            )
        except (asyncio.TimeoutError, TimeoutError):
            # Cancel any still-pending tasks and drain them
@@ -1651,7 +1700,7 @@ async def _a_execute_agentic_test_case(
                await _await_with_outer_deadline(
                    observed_callback,
                    golden.input,
-                    timeout=
+                    timeout=get_per_task_timeout_seconds(),
                )
            else:
                observed_callback(golden.input)
@@ -1745,7 +1794,7 @@ async def _a_execute_agentic_test_case(
        try:
            await asyncio.wait_for(
                asyncio.gather(*child_tasks),
-                timeout=
+                timeout=get_gather_timeout(),
            )
        except (asyncio.TimeoutError, TimeoutError):
            for t in child_tasks:
@@ -1768,11 +1817,18 @@ async def _a_execute_agentic_test_case(
            )
    except asyncio.CancelledError:
        # mark any unfinished metrics as cancelled
-
-
-
-
-
+        if get_settings().DEEPEVAL_DISABLE_TIMEOUTS:
+            cancel_msg = (
+                "Cancelled while evaluating agentic test case. "
+                "(DeepEval timeouts are disabled; this cancellation likely came from upstream orchestration or manual cancellation). "
+                "Set DEEPEVAL_LOG_STACK_TRACES=1 for full traceback."
+            )
+        else:
+            cancel_msg = (
+                "Timed out/cancelled while evaluating agentic test case. "
+                "Increase DEEPEVAL_PER_TASK_TIMEOUT_SECONDS_OVERRIDE or set "
+                "DEEPEVAL_LOG_STACK_TRACES=1 for full traceback."
+            )

        if trace_metrics:
            for m in trace_metrics:
@@ -2464,8 +2520,9 @@ def a_execute_agentic_test_cases_from_loop(

    async def execute_callback_with_semaphore(coroutine: Awaitable):
        async with semaphore:
-
-
+            return await _await_with_outer_deadline(
+                coroutine, timeout=get_per_task_timeout_seconds()
+            )

    def evaluate_test_cases(
        progress: Optional[Progress] = None,
@@ -2687,15 +2744,18 @@ def a_execute_agentic_test_cases_from_loop(
        loop.run_until_complete(
            asyncio.wait_for(
                asyncio.gather(*created_tasks, return_exceptions=True),
-                timeout=
+                timeout=get_gather_timeout(),
            )
        )

-    except (asyncio.TimeoutError, TimeoutError):
+    except (asyncio.TimeoutError, TimeoutError) as e:
        import traceback

+        settings = get_settings()
        pending = [t for t in created_tasks if not t.done()]

+        _log_gather_timeout(logger, exc=e, pending=len(pending))
+
        # Log the elapsed time for each task that was pending
        for t in pending:
            meta = task_meta.get(t, {})
@@ -2703,26 +2763,27 @@ def a_execute_agentic_test_cases_from_loop(
            elapsed_time = time.perf_counter() - start_time

            # Determine if it was a per task or gather timeout based on task's elapsed time
-            if
-                timeout_type =
+            if not settings.DEEPEVAL_DISABLE_TIMEOUTS:
+                timeout_type = (
+                    "per-task"
+                    if elapsed_time >= get_per_task_timeout_seconds()
+                    else "gather"
+                )
+                logger.info(
+                    " - PENDING %s elapsed_time=%.2fs timeout_type=%s meta=%s",
+                    t.get_name(),
+                    elapsed_time,
+                    timeout_type,
+                    meta,
+                )
            else:
-
-
-
-
-
-
-                f"DEEPEVAL_PER_TASK_TIMEOUT_SECONDS for longer task completion time or "
-                f"DEEPEVAL_TASK_GATHER_BUFFER_SECONDS to allow more time for gathering results."
-                )
+                logger.info(
+                    " - PENDING %s elapsed_time=%.2fs meta=%s",
+                    t.get_name(),
+                    elapsed_time,
+                    meta,
+                )

-            # Log pending tasks and their stack traces
-            logger.info(
-                " - PENDING %s elapsed_time=%.2fs meta=%s",
-                t.get_name(),
-                elapsed_time,
-                meta,
-            )
            if loop.get_debug() and get_settings().DEEPEVAL_DEBUG_ASYNC:
                frames = t.get_stack(limit=6)
                if frames:
@@ -2904,9 +2965,8 @@ async def _a_evaluate_traces(

    async def execute_evals_with_semaphore(func: Callable, *args, **kwargs):
        async with semaphore:
-            timeout = _per_task_timeout()
            return await _await_with_outer_deadline(
-                func, *args, timeout=
+                func, *args, timeout=get_per_task_timeout_seconds(), **kwargs
            )

    eval_tasks = []
@@ -2954,7 +3014,7 @@ async def _a_evaluate_traces(
        try:
            await asyncio.wait_for(
                asyncio.gather(*eval_tasks),
-                timeout=
+                timeout=get_gather_timeout(),
            )
        except (asyncio.TimeoutError, TimeoutError):
            for t in eval_tasks:
@@ -2984,9 +3044,8 @@ async def _evaluate_test_case_pairs(

    async def execute_with_semaphore(func: Callable, *args, **kwargs):
        async with semaphore:
-            timeout = _per_task_timeout()
            return await _await_with_outer_deadline(
-                func, *args, timeout=
+                func, *args, timeout=get_per_task_timeout_seconds(), **kwargs
            )

    tasks = []
@@ -3024,7 +3083,7 @@ async def _evaluate_test_case_pairs(
        try:
            await asyncio.wait_for(
                asyncio.gather(*tasks),
-                timeout=
+                timeout=get_gather_timeout(),
            )
        except (asyncio.TimeoutError, TimeoutError):
            # Cancel any still-pending tasks and drain them
deepeval/integrations/pydantic_ai/instrumentator.py
CHANGED

@@ -27,6 +27,7 @@ from deepeval.tracing.types import (
 )

 logger = logging.getLogger(__name__)
+settings = get_settings()

 try:
     # Optional dependencies
@@ -48,7 +49,7 @@ except ImportError as e:
     dependency_installed = False

     # Preserve previous behavior: only log when verbose mode is enabled.
-    if
+    if settings.DEEPEVAL_VERBOSE_MODE:
         if isinstance(e, ModuleNotFoundError):
             logger.warning(
                 "Optional tracing dependency not installed: %s",
@@ -104,7 +105,8 @@ else:
     ReadableSpan = _ReadableSpan

 # OTLP_ENDPOINT = "http://127.0.0.1:4318/v1/traces"
-OTLP_ENDPOINT = "https://otel.confident-ai.com/v1/traces"
+# OTLP_ENDPOINT = "https://otel.confident-ai.com/v1/traces"
+OTLP_ENDPOINT = str(settings.CONFIDENT_OTEL_URL) + "v1/traces"
 init_clock_bridge()  # initialize clock bridge for perf_counter() to epoch_nanos conversion

deepeval/integrations/pydantic_ai/otel.py
CHANGED

@@ -1,6 +1,7 @@
 import warnings
 from typing import Optional
 from deepeval.telemetry import capture_tracing_integration
+from deepeval.config.settings import get_settings

 try:
     from opentelemetry import trace
@@ -23,7 +24,10 @@ def is_opentelemetry_available():
     return True


-
+settings = get_settings()
+# OTLP_ENDPOINT = "https://otel.confident-ai.com/v1/traces"
+
+OTLP_ENDPOINT = str(settings.CONFIDENT_OTEL_URL) + "v1/traces"


 def instrument_pydantic_ai(api_key: Optional[str] = None):