deepeval 3.6.1__py3-none-any.whl → 3.6.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- deepeval/_version.py +1 -1
- deepeval/confident/api.py +1 -0
- deepeval/evaluate/execute.py +11 -2
- deepeval/metrics/g_eval/g_eval.py +3 -2
- deepeval/metrics/hallucination/hallucination.py +1 -1
- deepeval/metrics/tool_correctness/tool_correctness.py +2 -2
- deepeval/models/llms/amazon_bedrock_model.py +3 -31
- deepeval/models/llms/openai_model.py +0 -1
- deepeval/models/llms/utils.py +22 -0
- deepeval/prompt/api.py +2 -0
- deepeval/prompt/prompt.py +281 -121
- deepeval/test_case/llm_test_case.py +3 -0
- deepeval/tracing/otel/utils.py +71 -55
- deepeval/tracing/tracing.py +7 -1
- deepeval/tracing/utils.py +3 -6
- {deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/METADATA +2 -2
- {deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/RECORD +20 -20
- {deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/LICENSE.md +0 -0
- {deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/WHEEL +0 -0
- {deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/entry_points.txt +0 -0
deepeval/_version.py
CHANGED

@@ -1 +1 @@
-__version__: str = "3.6.1"
+__version__: str = "3.6.3"

deepeval/confident/api.py
CHANGED

@@ -90,6 +90,7 @@ class Endpoints(Enum):
     TRACES_ENDPOINT = "/v1/traces"
     ANNOTATIONS_ENDPOINT = "/v1/annotations"
     PROMPTS_VERSION_ID_ENDPOINT = "/v1/prompts/:alias/versions/:versionId"
+    PROMPTS_LABEL_ENDPOINT = "/v1/prompts/:alias/labels/:label"
     PROMPTS_ENDPOINT = "/v1/prompts"
     PROMPTS_VERSIONS_ENDPOINT = "/v1/prompts/:alias/versions"
     SIMULATE_ENDPOINT = "/v1/simulate"

deepeval/evaluate/execute.py
CHANGED

@@ -836,7 +836,13 @@ def execute_agentic_test_cases(
         ):
             if asyncio.iscoroutinefunction(observed_callback):
                 loop = get_or_create_event_loop()
-                loop.run_until_complete(observed_callback(golden.input))
+                coro = observed_callback(golden.input)
+                loop.run_until_complete(
+                    asyncio.wait_for(
+                        coro,
+                        timeout=settings.DEEPEVAL_PER_TASK_TIMEOUT_SECONDS,
+                    )
+                )
             else:
                 observed_callback(golden.input)
             current_trace: Trace = current_trace_context.get()

@@ -1190,7 +1196,10 @@ async def _a_execute_agentic_test_case(
             _pbar_callback_id=pbar_tags_id,
         ):
             if asyncio.iscoroutinefunction(observed_callback):
-                await observed_callback(golden.input)
+                await asyncio.wait_for(
+                    observed_callback(golden.input),
+                    timeout=settings.DEEPEVAL_PER_TASK_TIMEOUT_SECONDS,
+                )
             else:
                 observed_callback(golden.input)
             current_trace: Trace = current_trace_context.get()

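Both hunks wrap the observed callback in `asyncio.wait_for` so a hanging agent callback is cancelled after a per-task timeout instead of blocking the whole run. A minimal sketch of the pattern outside deepeval; the 300-second value is an assumption standing in for `settings.DEEPEVAL_PER_TASK_TIMEOUT_SECONDS`:

```python
import asyncio

PER_TASK_TIMEOUT_SECONDS = 300  # assumed stand-in for settings.DEEPEVAL_PER_TASK_TIMEOUT_SECONDS


async def observed_callback(user_input: str) -> str:
    # stand-in for a user's traced agent callback
    await asyncio.sleep(0.1)
    return f"answered: {user_input}"


def run_callback_with_timeout(user_input: str) -> str:
    loop = asyncio.new_event_loop()
    try:
        # raises asyncio.TimeoutError (and cancels the task) if the callback overruns
        return loop.run_until_complete(
            asyncio.wait_for(
                observed_callback(user_input),
                timeout=PER_TASK_TIMEOUT_SECONDS,
            )
        )
    finally:
        loop.close()


print(run_callback_with_timeout("How do refunds work?"))
```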
deepeval/metrics/g_eval/g_eval.py
CHANGED

@@ -97,7 +97,8 @@ class GEval(BaseMetric):
                 test_case, _additional_context=_additional_context
             )
             self.score = (
-                float(g_score)
+                (float(g_score) - self.score_range[0])
+                / self.score_range_span
                 if not self.strict_mode
                 else int(g_score)
             )

@@ -140,7 +141,7 @@ class GEval(BaseMetric):
                 test_case, _additional_context=_additional_context
             )
             self.score = (
-                float(g_score) / self.score_range_span
+                (float(g_score) - self.score_range[0]) / self.score_range_span
                 if not self.strict_mode
                 else int(g_score)
             )

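The updated expression subtracts the lower bound of `score_range` before dividing by the span, so rubrics whose scale does not start at zero still normalize into [0, 1]. A small worked example with an assumed 1-to-5 range (illustrative values, not deepeval defaults):

```python
# Assumed rubric range for illustration
score_range = (1, 5)
score_range_span = score_range[1] - score_range[0]  # 4

g_score = 4.0
old_normalized = g_score / score_range_span                     # 1.0, over-counts because the floor is 1
new_normalized = (g_score - score_range[0]) / score_range_span  # 0.75

print(old_normalized, new_normalized)
```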
deepeval/metrics/hallucination/hallucination.py
CHANGED

@@ -30,7 +30,7 @@ class HallucinationMetric(BaseMetric):
         threshold: float = 0.5,
         model: Optional[Union[str, DeepEvalBaseLLM]] = None,
         include_reason: bool = True,
-        async_mode: bool =
+        async_mode: bool = True,
         strict_mode: bool = False,
         verbose_mode: bool = False,
         evaluation_template: Type[

deepeval/metrics/tool_correctness/tool_correctness.py
CHANGED

@@ -1,4 +1,4 @@
-from typing import List,
+from typing import List, Dict
 
 from deepeval.metrics.indicator import metric_progress_indicator
 from deepeval.metrics.utils import (

@@ -299,7 +299,7 @@ class ToolCorrectnessMetric(BaseMetric):
     def is_successful(self) -> bool:
         try:
             self.success = self.score >= self.threshold
-        except:
+        except (AttributeError, TypeError):
            self.success = False
         return self.success
 

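Replacing the bare `except:` with `except (AttributeError, TypeError)` keeps `is_successful` from masking unrelated errors while still covering the two cases the comparison can realistically raise: `score` never set, or `score` left as `None`. A small standalone sketch of those two paths (the class here is hypothetical, not deepeval's):

```python
class FakeMetric:
    threshold = 0.5

    def is_successful(self) -> bool:
        try:
            # AttributeError if score was never set, TypeError if it is None
            self.success = self.score >= self.threshold
        except (AttributeError, TypeError):
            self.success = False
        return self.success


m = FakeMetric()
print(m.is_successful())  # False: no score attribute yet

m.score = None
print(m.is_successful())  # False: None >= float raises TypeError

m.score = 0.9
print(m.is_successful())  # True
```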
deepeval/models/llms/amazon_bedrock_model.py
CHANGED

@@ -9,7 +9,7 @@ from deepeval.models.retry_policy import (
     sdk_retries_for,
 )
 from deepeval.models import DeepEvalBaseLLM
-from deepeval.models.llms.utils import trim_and_load_json
+from deepeval.models.llms.utils import trim_and_load_json, safe_asyncio_run
 from deepeval.constants import ProviderSlug as PS
 
 # check aiobotocore availability

@@ -40,7 +40,6 @@ class AmazonBedrockModel(DeepEvalBaseLLM):
         region_name: str,
         aws_access_key_id: Optional[str] = None,
         aws_secret_access_key: Optional[str] = None,
-        temperature: float = 0,
         input_token_cost: float = 0,
         output_token_cost: float = 0,
         generation_kwargs: Optional[Dict] = None,

@@ -53,13 +52,9 @@ class AmazonBedrockModel(DeepEvalBaseLLM):
         self.region_name = region_name
         self.aws_access_key_id = aws_access_key_id
         self.aws_secret_access_key = aws_secret_access_key
-        self.temperature = temperature
         self.input_token_cost = input_token_cost
         self.output_token_cost = output_token_cost
 
-        if self.temperature < 0:
-            raise ValueError("Temperature must be >= 0.")
-
         # prepare aiobotocore session, config, and async exit stack
         self._session = get_session()
         self._exit_stack = AsyncExitStack()

@@ -75,7 +70,7 @@ class AmazonBedrockModel(DeepEvalBaseLLM):
     def generate(
         self, prompt: str, schema: Optional[BaseModel] = None
     ) -> Tuple[Union[str, Dict], float]:
-        return
+        return safe_asyncio_run(self.a_generate(prompt, schema))
 
     @retry_bedrock
     async def a_generate(

@@ -142,34 +137,11 @@ class AmazonBedrockModel(DeepEvalBaseLLM):
     ###############################################
 
     def get_converse_request_body(self, prompt: str) -> dict:
-        # Inline parameter translation with defaults
-        param_mapping = {
-            "max_tokens": "maxTokens",
-            "top_p": "topP",
-            "top_k": "topK",
-            "stop_sequences": "stopSequences",
-        }
-
-        # Start with defaults for required parameters
-        translated_kwargs = {
-            "maxTokens": self.generation_kwargs.get("max_tokens", 1000),
-            "topP": self.generation_kwargs.get("top_p", 0),
-        }
-
-        # Add any other parameters from generation_kwargs
-        for key, value in self.generation_kwargs.items():
-            if key not in [
-                "max_tokens",
-                "top_p",
-            ]:  # Skip already handled defaults
-                aws_key = param_mapping.get(key, key)
-                translated_kwargs[aws_key] = value
 
         return {
             "messages": [{"role": "user", "content": [{"text": prompt}]}],
             "inferenceConfig": {
-
-                **translated_kwargs,
+                **self.generation_kwargs,
             },
         }
 

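With the parameter-translation block deleted, `generation_kwargs` is now spread into `inferenceConfig` verbatim, so callers are expected to supply Bedrock's camelCase keys themselves, and there is no longer an implicit `maxTokens`/`topP` default or a `temperature` argument. A rough sketch of what the simplified request body amounts to; the kwargs values are illustrative:

```python
# Illustrative values only; pass whatever the Bedrock Converse API accepts, already camelCased
generation_kwargs = {"maxTokens": 1024, "topP": 0.9, "stopSequences": ["###"]}


def get_converse_request_body(prompt: str) -> dict:
    return {
        "messages": [{"role": "user", "content": [{"text": prompt}]}],
        "inferenceConfig": {
            **generation_kwargs,  # forwarded as-is, no snake_case -> camelCase mapping
        },
    }


print(get_converse_request_body("Summarize this support ticket."))
```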
deepeval/models/llms/utils.py
CHANGED

@@ -1,6 +1,7 @@
 from typing import Dict
 import re
 import json
+import asyncio
 
 
 def trim_and_load_json(

@@ -20,3 +21,24 @@ def trim_and_load_json(
         raise ValueError(error_str)
     except Exception as e:
         raise Exception(f"An unexpected error occurred: {str(e)}")
+
+
+def safe_asyncio_run(coro):
+    """
+    Run an async coroutine safely.
+    Falls back to run_until_complete if already in a running event loop.
+    """
+    try:
+        return asyncio.run(coro)
+    except RuntimeError:
+        try:
+            loop = asyncio.get_event_loop()
+            if loop.is_running():
+                future = asyncio.ensure_future(coro)
+                return loop.run_until_complete(future)
+            else:
+                return loop.run_until_complete(coro)
+        except Exception as inner_e:
+            raise
+    except Exception as e:
+        raise

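A minimal usage sketch of the new helper when called from plain synchronous code; the coroutine below is a stand-in, not part of deepeval. This is the same path `AmazonBedrockModel.generate` now takes when it delegates to `a_generate`.

```python
import asyncio

from deepeval.models.llms.utils import safe_asyncio_run  # assumes deepeval >= 3.6.3


async def fetch_completion(prompt: str) -> str:
    # placeholder for an async model call such as AmazonBedrockModel.a_generate
    await asyncio.sleep(0.05)
    return f"completion for: {prompt}"


# No event loop is running here, so safe_asyncio_run takes the plain asyncio.run path
print(safe_asyncio_run(fetch_completion("hello")))
```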
deepeval/prompt/api.py
CHANGED

@@ -45,6 +45,8 @@ class PromptVersionsHttpResponse(BaseModel):
 
 class PromptHttpResponse(BaseModel):
     id: str
+    version: str
+    label: Optional[str] = None
     text: Optional[str] = None
     messages: Optional[List[PromptMessage]] = None
     interpolation_type: PromptInterpolationType = Field(

deepeval/prompt/prompt.py
CHANGED

@@ -1,5 +1,5 @@
 from enum import Enum
-from typing import Optional, List, Dict
+from typing import Literal, Optional, List, Dict
 from rich.progress import Progress, SpinnerColumn, TextColumn, BarColumn
 from rich.console import Console
 import time

@@ -7,6 +7,7 @@ import json
 import os
 from pydantic import BaseModel
 import asyncio
+import portalocker
 
 from deepeval.prompt.api import (
     PromptHttpResponse,

@@ -25,6 +26,8 @@ from deepeval.utils import (
 )
 
 CACHE_FILE_NAME = f"{HIDDEN_DIR}/.deepeval-prompt-cache.json"
+VERSION_CACHE_KEY = "version"
+LABEL_CACHE_KEY = "label"
 
 
 class CustomEncoder(json.JSONEncoder):

@@ -39,6 +42,7 @@ class CustomEncoder(json.JSONEncoder):
 class CachedPrompt(BaseModel):
     alias: str
     version: str
+    label: Optional[str] = None
     template: Optional[str]
     messages_template: Optional[List[PromptMessage]]
     prompt_version_id: str

@@ -50,6 +54,7 @@ class CachedPrompt(BaseModel):
 
 
 class Prompt:
+    label: Optional[str] = None
     _prompt_version_id: Optional[str] = None
     _type: Optional[PromptType] = None
     _interpolation_type: Optional[PromptInterpolationType] = None

@@ -73,8 +78,8 @@ class Prompt:
         self._text_template = template
         self._messages_template = messages_template
         self._version = None
-        self._polling_tasks: Dict[str, asyncio.Task] = {}
-        self._refresh_map: Dict[str, int] = {}
+        self._polling_tasks: Dict[str, Dict[str, asyncio.Task]] = {}
+        self._refresh_map: Dict[str, Dict[str, int]] = {}
         if template:
             self._type = PromptType.TEXT
         elif messages_template:

@@ -138,87 +143,173 @@ class Prompt:
         return versions.text_versions or versions.messages_versions or []
 
     def _read_from_cache(
-        self,
+        self,
+        alias: str,
+        version: Optional[str] = None,
+        label: Optional[str] = None,
     ) -> Optional[CachedPrompt]:
         if not os.path.exists(CACHE_FILE_NAME):
-
+            return None
 
         try:
-
+            # Use shared lock for reading to allow concurrent reads
+            with portalocker.Lock(
+                CACHE_FILE_NAME,
+                mode="r",
+                flags=portalocker.LOCK_SH | portalocker.LOCK_NB,
+            ) as f:
                 cache_data = json.load(f)
 
             if alias in cache_data:
                 if version:
-                    if
-
-
-
-
+                    if (
+                        VERSION_CACHE_KEY in cache_data[alias]
+                        and version in cache_data[alias][VERSION_CACHE_KEY]
+                    ):
+                        return CachedPrompt(
+                            **cache_data[alias][VERSION_CACHE_KEY][version]
                         )
-
-
-
-
-
-
-
-
-
-
+                elif label:
+                    if (
+                        LABEL_CACHE_KEY in cache_data[alias]
+                        and label in cache_data[alias][LABEL_CACHE_KEY]
+                    ):
+                        return CachedPrompt(
+                            **cache_data[alias][LABEL_CACHE_KEY][label]
+                        )
+            return None
+        except (portalocker.exceptions.LockException, Exception):
+            # If cache is locked, corrupted or unreadable, return None and let it fetch from API
+            return None
 
     def _write_to_cache(
         self,
-
+        cache_key: Literal[VERSION_CACHE_KEY, LABEL_CACHE_KEY],
+        version: str,
+        label: Optional[str] = None,
         text_template: Optional[str] = None,
         messages_template: Optional[List[PromptMessage]] = None,
         prompt_version_id: Optional[str] = None,
         type: Optional[PromptType] = None,
         interpolation_type: Optional[PromptInterpolationType] = None,
     ):
-        if not self.alias
+        if not self.alias:
             return
 
-        cache_data = {}
-        if os.path.exists(CACHE_FILE_NAME):
-            try:
-                with open(CACHE_FILE_NAME, "r") as f:
-                    cache_data = json.load(f)
-            except Exception:
-                cache_data = {}
-
-        # Ensure the cache structure is initialized properly
-        if self.alias not in cache_data:
-            cache_data[self.alias] = {}
-
-        # Cache the prompt
-        cache_data[self.alias][version] = {
-            "alias": self.alias,
-            "version": version,
-            "template": text_template,
-            "messages_template": messages_template,
-            "prompt_version_id": prompt_version_id,
-            "type": type,
-            "interpolation_type": interpolation_type,
-        }
-
         # Ensure directory exists
         os.makedirs(HIDDEN_DIR, exist_ok=True)
 
-
-
-
+        try:
+            # Use r+ mode if file exists, w mode if it doesn't
+            mode = "r+" if os.path.exists(CACHE_FILE_NAME) else "w"
+
+            with portalocker.Lock(
+                CACHE_FILE_NAME,
+                mode=mode,
+                flags=portalocker.LOCK_EX,
+            ) as f:
+                # Read existing cache data if file exists and has content
+                cache_data = {}
+                if mode == "r+":
+                    try:
+                        f.seek(0)
+                        content = f.read()
+                        if content:
+                            cache_data = json.loads(content)
+                    except (json.JSONDecodeError, Exception):
+                        cache_data = {}
+
+                # Ensure the cache structure is initialized properly
+                if self.alias not in cache_data:
+                    cache_data[self.alias] = {}
+
+                if cache_key not in cache_data[self.alias]:
+                    cache_data[self.alias][cache_key] = {}
+
+                # Cache the prompt
+                cached_entry = {
+                    "alias": self.alias,
+                    "version": version,
+                    "label": label,
+                    "template": text_template,
+                    "messages_template": messages_template,
+                    "prompt_version_id": prompt_version_id,
+                    "type": type,
+                    "interpolation_type": interpolation_type,
+                }
+
+                if cache_key == VERSION_CACHE_KEY:
+                    cache_data[self.alias][cache_key][version] = cached_entry
+                else:
+                    cache_data[self.alias][cache_key][label] = cached_entry
+
+                # Write back to cache file
+                f.seek(0)
+                f.truncate()
+                json.dump(cache_data, f, cls=CustomEncoder)
+        except portalocker.exceptions.LockException:
+            # If we can't acquire the lock, silently skip caching
+            pass
+        except Exception:
+            # If any other error occurs during caching, silently skip
+            pass
+
+    def _load_from_cache_with_progress(
+        self,
+        progress: Progress,
+        task_id: int,
+        start_time: float,
+        version: Optional[str] = None,
+        label: Optional[str] = None,
+    ):
+        """
+        Load prompt from cache and update progress bar.
+        Raises if unable to load from cache.
+        """
+        cached_prompt = self._read_from_cache(
+            self.alias, version=version, label=label
+        )
+        if not cached_prompt:
+            raise ValueError("Unable to fetch prompt and load from cache")
+
+        self.version = cached_prompt.version
+        self.label = cached_prompt.label
+        self._text_template = cached_prompt.template
+        self._messages_template = cached_prompt.messages_template
+        self._prompt_version_id = cached_prompt.prompt_version_id
+        self._type = PromptType(cached_prompt.type)
+        self._interpolation_type = PromptInterpolationType(
+            cached_prompt.interpolation_type
+        )
+
+        end_time = time.perf_counter()
+        time_taken = format(end_time - start_time, ".2f")
+        progress.update(
+            task_id,
+            description=f"{progress.tasks[task_id].description}[rgb(25,227,160)]Loaded from cache! ({time_taken}s)",
+        )
 
     def pull(
         self,
         version: Optional[str] = None,
+        label: Optional[str] = None,
         fallback_to_cache: bool = True,
         write_to_cache: bool = True,
         default_to_cache: bool = True,
         refresh: Optional[int] = 60,
     ):
+        should_write_on_first_fetch = False
         if refresh:
             default_to_cache = True
-
+            # Check if we need to bootstrap the cache
+            cached_prompt = self._read_from_cache(
+                self.alias, version=version, label=label
+            )
+            if cached_prompt is None:
+                # No cache exists, so we should write after fetching to bootstrap
+                should_write_on_first_fetch = True
+                write_to_cache = False  # Polling will handle subsequent writes
 
         if self.alias is None:
             raise TypeError(
                 "Unable to pull prompt from Confident AI when no alias is provided."

@@ -227,15 +318,20 @@ class Prompt:
         # Manage background prompt polling
         loop = get_or_create_general_event_loop()
         if loop.is_running():
-            loop.create_task(self.create_polling_task(version, refresh))
+            loop.create_task(self.create_polling_task(version, label, refresh))
         else:
-            loop.run_until_complete(
+            loop.run_until_complete(
+                self.create_polling_task(version, label, refresh)
+            )
 
         if default_to_cache:
             try:
-                cached_prompt = self._read_from_cache(
+                cached_prompt = self._read_from_cache(
+                    self.alias, version=version, label=label
+                )
                 if cached_prompt:
                     self.version = cached_prompt.version
+                    self.label = cached_prompt.label
                     self._text_template = cached_prompt.template
                     self._messages_template = cached_prompt.messages_template
                     self._prompt_version_id = cached_prompt.prompt_version_id

@@ -254,58 +350,60 @@ class Prompt:
             TextColumn("[progress.description]{task.description}"),
             transient=False,
         ) as progress:
+            HINT_TEXT = (
+                f"version='{version or 'latest'}'"
+                if not label
+                else f"label='{label}'"
+            )
             task_id = progress.add_task(
-                f"Pulling [rgb(106,0,255)]'{self.alias}' (
+                f"Pulling [rgb(106,0,255)]'{self.alias}' ({HINT_TEXT})[/rgb(106,0,255)] from Confident AI...",
                 total=100,
             )
+
             start_time = time.perf_counter()
             try:
-
-
-
-
-
-
-
+                if label:
+                    data, _ = api.send_request(
+                        method=HttpMethods.GET,
+                        endpoint=Endpoints.PROMPTS_LABEL_ENDPOINT,
+                        url_params={
+                            "alias": self.alias,
+                            "label": label,
+                        },
+                    )
+                else:
+                    data, _ = api.send_request(
+                        method=HttpMethods.GET,
+                        endpoint=Endpoints.PROMPTS_VERSION_ID_ENDPOINT,
+                        url_params={
+                            "alias": self.alias,
+                            "versionId": version or "latest",
+                        },
+                    )
+
                 response = PromptHttpResponse(
                     id=data["id"],
+                    version=data.get("version", None),
+                    label=data.get("label", None),
                     text=data.get("text", None),
                     messages=data.get("messages", None),
                     type=data["type"],
                     interpolation_type=data["interpolationType"],
                 )
-            except:
-
-
-
-
-
-
-
-
-
-
-
-
-
-                )
-                self._type = PromptType(cached_prompt.type)
-                self._interpolation_type = PromptInterpolationType(
-                    cached_prompt.interpolation_type
-                )
-
-                end_time = time.perf_counter()
-                time_taken = format(end_time - start_time, ".2f")
-                progress.update(
-                    task_id,
-                    description=f"{progress.tasks[task_id].description}[rgb(25,227,160)]Loaded from cache! ({time_taken}s)",
-                )
-                return
-            except:
-                raise
-
-            self.version = version or "latest"
+            except Exception:
+                if fallback_to_cache:
+                    self._load_from_cache_with_progress(
+                        progress,
+                        task_id,
+                        start_time,
+                        version=version,
+                        label=label,
+                    )
+                    return
+                raise
+
+            self.version = response.version
+            self.label = response.label
             self._text_template = response.text
             self._messages_template = response.messages
             self._prompt_version_id = response.id

@@ -318,9 +416,12 @@ class Prompt:
                 task_id,
                 description=f"{progress.tasks[task_id].description}[rgb(25,227,160)]Done! ({time_taken}s)",
             )
-            if
+            # Write to cache if explicitly requested OR if we need to bootstrap cache for refresh mode
+            if write_to_cache or should_write_on_first_fetch:
                 self._write_to_cache(
-
+                    cache_key=LABEL_CACHE_KEY if label else VERSION_CACHE_KEY,
+                    version=response.version,
+                    label=response.label,
                     text_template=response.text,
                     messages_template=response.messages,
                     prompt_version_id=response.id,

@@ -380,55 +481,114 @@ class Prompt:
     async def create_polling_task(
         self,
         version: Optional[str],
+        label: Optional[str],
         refresh: Optional[int] = 60,
+        default_to_cache: bool = True,
     ):
-        if version is None:
+        if version is None and label is None:
            return
 
         # If polling task doesn't exist, start it
-
+        CACHE_KEY = LABEL_CACHE_KEY if label else VERSION_CACHE_KEY
+        cache_value = label if label else version
+
+        # Initialize nested dicts if they don't exist
+        if CACHE_KEY not in self._polling_tasks:
+            self._polling_tasks[CACHE_KEY] = {}
+        if CACHE_KEY not in self._refresh_map:
+            self._refresh_map[CACHE_KEY] = {}
+
+        polling_task: Optional[asyncio.Task] = self._polling_tasks[
+            CACHE_KEY
+        ].get(cache_value)
+
         if refresh:
-            self._refresh_map[
+            self._refresh_map[CACHE_KEY][cache_value] = refresh
             if not polling_task:
-                self._polling_tasks[
-
+                self._polling_tasks[CACHE_KEY][cache_value] = (
+                    asyncio.create_task(
+                        self.poll(version, label, default_to_cache)
+                    )
                 )
 
         # If invalid `refresh`, stop the task
         else:
             if polling_task:
                 polling_task.cancel()
-                self._polling_tasks
-
+                if cache_value in self._polling_tasks[CACHE_KEY]:
+                    self._polling_tasks[CACHE_KEY].pop(cache_value)
+                if cache_value in self._refresh_map[CACHE_KEY]:
+                    self._refresh_map[CACHE_KEY].pop(cache_value)
 
-    async def poll(
-
+    async def poll(
+        self,
+        version: Optional[str] = None,
+        label: Optional[str] = None,
+        default_to_cache: bool = True,
+    ):
         while True:
-
-
-
-            endpoint=Endpoints.PROMPTS_VERSION_ID_ENDPOINT,
-            url_params={
-                "alias": self.alias,
-                "versionId": version or "latest",
-            },
+            if default_to_cache:
+                cached_prompt = self._read_from_cache(
+                    self.alias, version=version, label=label
                 )
+                if cached_prompt:
+                    self.version = cached_prompt.version
+                    self.label = cached_prompt.label
+                    self._text_template = cached_prompt.template
+                    self._messages_template = cached_prompt.messages_template
+                    self._prompt_version_id = cached_prompt.prompt_version_id
+                    self._type = PromptType(cached_prompt.type)
+                    self._interpolation_type = PromptInterpolationType(
+                        cached_prompt.interpolation_type
+                    )
+                    return
+
+            api = Api()
+            try:
+                if label:
+                    data, _ = api.send_request(
+                        method=HttpMethods.GET,
+                        endpoint=Endpoints.PROMPTS_LABEL_ENDPOINT,
+                        url_params={
+                            "alias": self.alias,
+                            "label": label,
+                        },
+                    )
+                else:
+                    data, _ = api.send_request(
+                        method=HttpMethods.GET,
+                        endpoint=Endpoints.PROMPTS_VERSION_ID_ENDPOINT,
+                        url_params={
+                            "alias": self.alias,
+                            "versionId": version or "latest",
+                        },
+                    )
+
                 response = PromptHttpResponse(
                     id=data["id"],
+                    version=data.get("version", None),
+                    label=data.get("label", None),
                    text=data.get("text", None),
                     messages=data.get("messages", None),
                     type=data["type"],
                     interpolation_type=data["interpolationType"],
                 )
-
-
-
-
-
-
-
-
+                if default_to_cache:
+                    self._write_to_cache(
+                        cache_key=(
+                            LABEL_CACHE_KEY if label else VERSION_CACHE_KEY
+                        ),
+                        version=response.version,
+                        label=response.label,
+                        text_template=response.text,
+                        messages_template=response.messages,
+                        prompt_version_id=response.id,
+                        type=response.type,
+                        interpolation_type=response.interpolation_type,
+                    )
             except Exception as e:
                 pass
 
-
+            CACHE_KEY = LABEL_CACHE_KEY if label else VERSION_CACHE_KEY
+            cache_value = label if label else version
+            await asyncio.sleep(self._refresh_map[CACHE_KEY][cache_value])

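Taken together, these changes let a prompt be pulled by label as well as by version, with the label-keyed entry cached under its own key (and optionally kept fresh by the background polling task) alongside version-keyed entries. A hedged usage sketch; the alias and label strings are made up and the constructor call assumes the usual `Prompt(alias=...)` form:

```python
from deepeval.prompt import Prompt  # assumes deepeval >= 3.6.3

prompt = Prompt(alias="support-bot")  # hypothetical alias

# Pull by label instead of version; hits /v1/prompts/:alias/labels/:label
prompt.pull(label="production")  # hypothetical label
print(prompt.version, prompt.label)

# Pulling by version still works and is cached under the "version" key
prompt.pull(version="latest")
```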
deepeval/test_case/llm_test_case.py
CHANGED

@@ -1,4 +1,5 @@
 from pydantic import (
+    ConfigDict,
     Field,
     BaseModel,
     model_validator,

@@ -151,6 +152,8 @@ class ToolCall(BaseModel):
 
 
 class LLMTestCase(BaseModel):
+    model_config = ConfigDict(extra="ignore")
+
     input: str
     actual_output: Optional[str] = Field(
         default=None,

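Setting `extra="ignore"` on the model config makes `LLMTestCase` drop unknown keyword arguments instead of rejecting them (as `extra="forbid"` would). A small illustration; `some_future_field` is an invented key:

```python
from deepeval.test_case import LLMTestCase  # assumes deepeval >= 3.6.3

tc = LLMTestCase(
    input="What is the refund window?",
    actual_output="30 days.",
    some_future_field="dropped silently",  # invented extra key: ignored, no ValidationError
)
print(tc.input, tc.actual_output)
```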
deepeval/tracing/otel/utils.py
CHANGED

@@ -1,11 +1,16 @@
+import json
+
 from typing import List, Optional, Tuple, Any
-from deepeval.tracing.types import Trace, LLMTestCase, ToolCall
-from deepeval.tracing import trace_manager, BaseSpan
 from opentelemetry.sdk.trace.export import ReadableSpan
-import json
 
+from deepeval.evaluate.utils import create_api_test_case
+from deepeval.test_run.api import LLMApiTestCase
+from deepeval.test_run.test_run import global_test_run_manager
+from deepeval.tracing.types import Trace, LLMTestCase, ToolCall
+from deepeval.tracing import trace_manager, BaseSpan
 from deepeval.tracing.utils import make_json_serializable
 
+
 GEN_AI_OPERATION_NAMES = ["chat", "generate_content", "task_completion"]
 
 

@@ -107,12 +112,12 @@ check_llm_input_from_gen_ai_attributes(
         input = json.loads(span.attributes.get("gen_ai.input.messages"))
         input = _flatten_input(input)
 
-    except Exception
+    except Exception:
         pass
     try:
         output = json.loads(span.attributes.get("gen_ai.output.messages"))
         output = _flatten_input(output)
-    except Exception
+    except Exception:
         pass
 
     if input is None and output is None:

@@ -126,7 +131,7 @@ check_llm_input_from_gen_ai_attributes(
             and last_event.get("event.name") == "gen_ai.choice"
         ):
             output = last_event
-    except Exception
+    except Exception:
         pass
 
     return input, output

@@ -181,7 +186,7 @@ def _flatten_input(input: list) -> list:
                 }
             )
             return result
-    except Exception
+    except Exception:
         return input
 
     return input

@@ -192,7 +197,7 @@ def check_tool_name_from_gen_ai_attributes(span: ReadableSpan) -> Optional[str]:
         gen_ai_tool_name = span.attributes.get("gen_ai.tool.name")
         if gen_ai_tool_name:
             return gen_ai_tool_name
-    except Exception
+    except Exception:
         pass
 
     return None

@@ -205,7 +210,7 @@ def check_tool_input_parameters_from_gen_ai_attributes(
         tool_arguments = span.attributes.get("tool_arguments")
         if tool_arguments:
             return json.loads(tool_arguments)
-    except Exception
+    except Exception:
         pass
 
     return None

@@ -224,7 +229,7 @@ def check_span_type_from_gen_ai_attributes(span: ReadableSpan):
 
         elif gen_ai_tool_name:
             return "tool"
-    except Exception
+    except Exception:
         pass
 
     return "base"

@@ -235,7 +240,7 @@ def check_model_from_gen_ai_attributes(span: ReadableSpan):
         gen_ai_request_model_name = span.attributes.get("gen_ai.request.model")
         if gen_ai_request_model_name:
             return gen_ai_request_model_name
-    except Exception
+    except Exception:
         pass
 
     return None

@@ -286,7 +291,7 @@ def prepare_trace_llm_test_case(span: ReadableSpan) -> Optional[LLMTestCase]:
                 tools_called.append(
                     ToolCall.model_validate_json(tool_call_json_str)
                 )
-    except Exception
+    except Exception:
         pass
 
     _expected_tools = span.attributes.get(

@@ -299,7 +304,7 @@ def prepare_trace_llm_test_case(span: ReadableSpan) -> Optional[LLMTestCase]:
                 expected_tools.append(
                     ToolCall.model_validate_json(tool_call_json_str)
                 )
-    except Exception
+    except Exception:
         pass
 
     test_case.tools_called = tools_called

@@ -328,12 +333,6 @@ def parse_list_of_strings(context: List[str]) -> List[str]:
     return parsed_context
 
 
-from deepeval.evaluate.utils import create_api_test_case
-from deepeval.test_run.api import LLMApiTestCase
-from deepeval.test_run.test_run import global_test_run_manager
-from typing import Optional
-
-
 def post_test_run(traces: List[Trace], test_run_id: Optional[str]):
     # Accept single trace or list of traces
     if isinstance(traces, Trace):

@@ -384,53 +383,70 @@ def post_test_run(traces: List[Trace], test_run_id: Optional[str]):
     # return test_run_manager.post_test_run(test_run) TODO: add after test run with metric collection is implemented
 
 
+def _normalize_pydantic_ai_messages(span: ReadableSpan) -> Optional[list]:
+    try:
+        raw = span.attributes.get("pydantic_ai.all_messages")
+        if not raw:
+            return None
+
+        messages = raw
+        if isinstance(messages, str):
+            messages = json.loads(messages)
+        elif isinstance(messages, tuple):
+            messages = list(messages)
+
+        if isinstance(messages, list):
+            normalized = []
+            for m in messages:
+                if isinstance(m, str):
+                    try:
+                        m = json.loads(m)
+                    except Exception:
+                        pass
+                normalized.append(m)
+            return normalized
+    except Exception:
+        pass
+
+    return None
+
+
 def check_pydantic_ai_agent_input_output(
     span: ReadableSpan,
 ) -> Tuple[Optional[Any], Optional[Any]]:
     input_val: Optional[Any] = None
     output_val: Optional[Any] = None
 
+    # Get normalized messages once
+    normalized = _normalize_pydantic_ai_messages(span)
+
     # Input (pydantic_ai.all_messages) - slice up to and including the first 'user' message
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-    first_user_idx = None
-    for i, m in enumerate(normalized):
-        role = None
-        if isinstance(m, dict):
-            role = m.get("role") or m.get("author")
-        if role == "user":
-            first_user_idx = i
-            break
-
-    input_val = (
-        normalized
-        if first_user_idx is None
-        else normalized[: first_user_idx + 1]
-    )
-    except Exception:
-        pass
+    if normalized:
+        try:
+            first_user_idx = None
+            for i, m in enumerate(normalized):
+                role = None
+                if isinstance(m, dict):
+                    role = m.get("role") or m.get("author")
+                if role == "user":
+                    first_user_idx = i
+                    break
+
+            input_val = (
+                normalized
+                if first_user_idx is None
+                else normalized[: first_user_idx + 1]
+            )
+        except Exception:
+            pass
 
     # Output (agent final_result)
     try:
         if span.attributes.get("confident.span.type") == "agent":
             output_val = span.attributes.get("final_result")
+            if not output_val and normalized:
+                # Extract the last message if no final_result is available
+                output_val = normalized[-1]
     except Exception:
         pass
 

@@ -442,7 +458,7 @@ check_pydantic_ai_agent_input_output(
 def check_tool_output(span: ReadableSpan):
     try:
         return span.attributes.get("tool_response")
-    except Exception
+    except Exception:
         pass
     return None
 

deepeval/tracing/tracing.py
CHANGED

@@ -208,7 +208,13 @@ class TraceManager:
         else:
             # print(f"Ending trace: {trace.root_spans}")
             self.environment = Environment.TESTING
-
+            if (
+                trace.root_spans
+                and len(trace.root_spans) > 0
+                and trace.root_spans[0].children
+                and len(trace.root_spans[0].children) > 0
+            ):
+                trace.root_spans = [trace.root_spans[0].children[0]]
             for root_span in trace.root_spans:
                 root_span.parent_uuid = None
 

deepeval/tracing/utils.py
CHANGED

@@ -1,15 +1,12 @@
 import os
-import time
 import inspect
 import json
 import sys
-import difflib
 from datetime import datetime, timezone
 from enum import Enum
 from time import perf_counter
-import time
 from collections import deque
-from typing import Any, Dict, Optional
+from typing import Any, Dict, Optional
 
 from deepeval.constants import CONFIDENT_TRACING_ENABLED
 

@@ -189,8 +186,8 @@ def perf_counter_to_datetime(perf_counter_value: float) -> datetime:
 def replace_self_with_class_name(obj):
     try:
         return f"<{obj.__class__.__name__}>"
-    except:
-        return
+    except Exception:
+        return "<self>"
 
 
 def get_deepeval_trace_mode() -> Optional[str]:

{deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/METADATA
CHANGED

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: deepeval
-Version: 3.6.1
+Version: 3.6.3
 Summary: The LLM Evaluation Framework
 Home-page: https://github.com/confident-ai/deepeval
 License: Apache-2.0

@@ -359,7 +359,7 @@ for golden in dataset.goldens:
 
 @pytest.mark.parametrize(
     "test_case",
-    dataset,
+    dataset.test_cases,
 )
 def test_customer_chatbot(test_case: LLMTestCase):
     answer_relevancy_metric = AnswerRelevancyMetric(threshold=0.5)

{deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/RECORD
CHANGED

@@ -1,5 +1,5 @@
 deepeval/__init__.py,sha256=6fsb813LD_jNhqR-xZnSdE5E-KsBbC3tc4oIg5ZMgTw,2115
-deepeval/_version.py,sha256=
+deepeval/_version.py,sha256=1BsEnmEpD1mtVjCYoXBeguVgrKPAi3TRpS_a7ndu4XU,27
 deepeval/annotation/__init__.py,sha256=ZFhUVNNuH_YgQSZJ-m5E9iUb9TkAkEV33a6ouMDZ8EI,111
 deepeval/annotation/annotation.py,sha256=3j3-syeJepAcEj3u3e4T_BeRDzNr7yXGDIoNQGMKpwQ,2298
 deepeval/annotation/api.py,sha256=EYN33ACVzVxsFleRYm60KB4Exvff3rPJKt1VBuuX970,2147

@@ -138,7 +138,7 @@ deepeval/cli/test.py,sha256=kSIFMRTAfVzBJ4OitwvT829-ylV7UzPMP57P2DePS-Q,5482
 deepeval/cli/types.py,sha256=_7KdthstHNc-JKCWrfpDQCf_j8h9PMxh0qJCHmVXJr0,310
 deepeval/cli/utils.py,sha256=F4-yuONzk4ojDoSLjI9RYERB7HOD412iZ2lNlSCq4wk,5601
 deepeval/confident/__init__.py,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
-deepeval/confident/api.py,sha256=
+deepeval/confident/api.py,sha256=2ZhrQOtfxcnQSyY6OxrjY17y1yn-NB7pfIiJa20B1Pk,8519
 deepeval/confident/types.py,sha256=-slFhDof_1maMgpLxqDRZv6kz6ZVY2hP_0uj_aveJKU,533
 deepeval/config/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 deepeval/config/settings.py,sha256=gRRi6nXEUKse13xAShU9MA18zo14vpIgl_R0xJ_0vnM,21314

@@ -159,7 +159,7 @@ deepeval/evaluate/api.py,sha256=rkblH0ZFAAdyuF0Ymh7JE1pIJPR9yFuPrn9SQaCEQp4,435
 deepeval/evaluate/compare.py,sha256=tdSJY4E7YJ_zO3dzvpwngZHLiUI2YQcTWJOLI83htsQ,9855
 deepeval/evaluate/configs.py,sha256=QfWjaWNxLsgEe8-5j4PIs5WcSyEckiWt0qdpXSpl57M,928
 deepeval/evaluate/evaluate.py,sha256=NPAJ2iJqJI_RurXKUIC0tft_ozYMIKwZf5iPfmnNhQc,10412
-deepeval/evaluate/execute.py,sha256=
+deepeval/evaluate/execute.py,sha256=XS0XtDGKC1ZOo09lthillfi5aDI5TWFbJ-Y7yICNvGo,89056
 deepeval/evaluate/types.py,sha256=IGZ3Xsj0UecPI3JNeTpJaK1gDvlepokfCmHwtItIW9M,831
 deepeval/evaluate/utils.py,sha256=kkliSGzuICeUsXDtlMMPfN95dUKlqarNhfciSffd4gI,23143
 deepeval/integrations/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0

@@ -240,12 +240,12 @@ deepeval/metrics/faithfulness/faithfulness.py,sha256=bYVhHI7Tr7xH0x-7F2LijxRuCCE
 deepeval/metrics/faithfulness/schema.py,sha256=2dU9dwwmqpGJcWvY2webERWIfH_tn02xgLghHkAY_eM,437
 deepeval/metrics/faithfulness/template.py,sha256=RuZ0LFm4BjZ8lhVrKPgU3ecHszwkF0fe5-BxAkaP5AA,5839
 deepeval/metrics/g_eval/__init__.py,sha256=HAhsQFVq9LIpZXPN00Jc_WrMXrh47NIT86VnUpWM4_4,102
-deepeval/metrics/g_eval/g_eval.py,sha256=
+deepeval/metrics/g_eval/g_eval.py,sha256=CaW7VHPW-SyXt18IE1rSatgagY238s3It-j6SLRI4H4,14395
 deepeval/metrics/g_eval/schema.py,sha256=V629txuDrr_2IEKEsgJVYYZb_pkdfcltQV9ZjvxK5co,287
 deepeval/metrics/g_eval/template.py,sha256=mHj4-mr_HQwbCjpHg7lM_6UesoSatL3g8UGGQAOdT0U,4509
 deepeval/metrics/g_eval/utils.py,sha256=uUT86jRXVYvLDzcnZvvfWssDyGoBHb66nWcJSg4i1u4,8784
 deepeval/metrics/hallucination/__init__.py,sha256=rCVlHi2UGzDKmZKi0esFLafmshVBx2WZ0jiIb-KqcYQ,44
-deepeval/metrics/hallucination/hallucination.py,sha256=
+deepeval/metrics/hallucination/hallucination.py,sha256=8JN5pj5YWRtl7rgbbFQF6EVBCGm1NV9vaX3_5tScNs4,9548
 deepeval/metrics/hallucination/schema.py,sha256=V8xbrBLMwJfre-lPuDc7rMEdhHf_1hfgoW1jE_ULvAY,286
 deepeval/metrics/hallucination/template.py,sha256=hiss1soxSBFqzOt0KmHZdZUzoQsmXnslDyb8HsjALPs,2620
 deepeval/metrics/indicator.py,sha256=oewo_n5Qet9Zfzo2QQs-EQ8w92siuyDCAmoTZW45ndc,10244

@@ -348,7 +348,7 @@ deepeval/metrics/task_completion/schema.py,sha256=JfnZkbCh7skWvrESy65GEo6Rvo0FDJ
 deepeval/metrics/task_completion/task_completion.py,sha256=RKFkXCVOhO70I8A16zv5BCaV3QVKldNxawJ0T93U_Zc,8978
 deepeval/metrics/task_completion/template.py,sha256=4xjTBcGrPQxInbf8iwJOZyok9SQex1aCkbxKmfkXoA4,10437
 deepeval/metrics/tool_correctness/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-deepeval/metrics/tool_correctness/tool_correctness.py,sha256=
+deepeval/metrics/tool_correctness/tool_correctness.py,sha256=j5wB9mJp7BLbn3bTZd6LlIeub1kXxXGaDVWrzyvBFo4,12111
 deepeval/metrics/toxicity/__init__.py,sha256=1lgt8BKxfBDd7bfSLu_5kMzmsr9b2_ahPK9oq5zLkMk,39
 deepeval/metrics/toxicity/schema.py,sha256=7uUdzXqTvIIz5nfahlllo_fzVRXg7UeMeXn7Hl32pKY,459
 deepeval/metrics/toxicity/template.py,sha256=zl4y4Tg9gXkxKJ8aXVwj0cJ94pvfYuP7MTeV3dvB5yQ,5045

@@ -370,7 +370,7 @@ deepeval/models/embedding_models/ollama_embedding_model.py,sha256=w3etdIdWvYfVIE
 deepeval/models/embedding_models/openai_embedding_model.py,sha256=Z1--e3CnNNmwryqmUMxBCaTURjtgKWHqADuUeCqFlSc,3545
 deepeval/models/hallucination_model.py,sha256=ABi978VKLE_jNHbDzM96kJ08EsZ5ZlvOlJHA_ptSkfQ,1003
 deepeval/models/llms/__init__.py,sha256=qmvv7wnmTDvys2uUTwQRo-_3DlFV3fGLiewPeQYRsAI,670
-deepeval/models/llms/amazon_bedrock_model.py,sha256=
+deepeval/models/llms/amazon_bedrock_model.py,sha256=3yiUUGU_d_YK7Usq8v5iqG3yHa5VnqeDOoCLG_p8rtc,5185
 deepeval/models/llms/anthropic_model.py,sha256=5gYRNkYUD7Zl3U0SibBG2YGCQsD6DdTsaBhqdaJlKIw,6072
 deepeval/models/llms/azure_model.py,sha256=dqINcfoJNqdd9zh5iTPwQ_ToGMOF7iH6YUB-UWRSOlc,10730
 deepeval/models/llms/deepseek_model.py,sha256=EqBJkKa7rXppCmlnIt_D-Z_r9fbsOUsOAVvN2jWA-Hk,6404

@@ -380,8 +380,8 @@ deepeval/models/llms/kimi_model.py,sha256=ldTefdSVitZYJJQ-_ZsP87iiT5iZ4QCVdfi-Yz
 deepeval/models/llms/litellm_model.py,sha256=iu4-_JCpd9LdEa-eCWseD2iLTA-r7OSgYGWQ0IxB4eA,11527
 deepeval/models/llms/local_model.py,sha256=hEyKVA6pkQm9dICUKsMNgjVI3w6gnyMdmBt_EylkWDk,4473
 deepeval/models/llms/ollama_model.py,sha256=xPO4d4jMY-cQAyHAcMuFvWS8JMWwCUbKP9CMi838Nuc,3307
-deepeval/models/llms/openai_model.py,sha256=
-deepeval/models/llms/utils.py,sha256=
+deepeval/models/llms/openai_model.py,sha256=mUvQ8a9FVk4lrdZyS_QRZTK4imufyaCNjZFPeqbc0AM,17167
+deepeval/models/llms/utils.py,sha256=gFM_8eIvdSwN_D4Yqp-j7PkfoiRn_bgu7tlCHol3A6c,1324
 deepeval/models/mlllms/__init__.py,sha256=19nN6kUB5XI0nUWUQX0aD9GBUMM8WWGvsDgKjuT4EF4,144
 deepeval/models/mlllms/gemini_model.py,sha256=7tHIWD4w_fBz3L7jkKWygn1QpBPk9nl2Kw-yb0Jc3PI,10167
 deepeval/models/mlllms/ollama_model.py,sha256=_YtYtw8oIMVVI-CFsDicsdeEJUPhw_9ArPxB_1olsJA,4798

@@ -404,8 +404,8 @@ deepeval/plugins/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,
 deepeval/plugins/plugin.py,sha256=_dwsdx4Dg9DbXxK3f7zJY4QWTJQWc7QE1HmIg2Zjjag,1515
 deepeval/progress_context.py,sha256=ZSKpxrE9sdgt9G3REKnVeXAv7GJXHHVGgLynpG1Pudw,3557
 deepeval/prompt/__init__.py,sha256=M99QTWdxOfiNeySGCSqN873Q80PPxqRvjLq4_Mw-X1w,49
-deepeval/prompt/api.py,sha256=
-deepeval/prompt/prompt.py,sha256=
+deepeval/prompt/api.py,sha256=665mLKiq8irXWV8kM9P_qFJipdCYZUNQFwW8AkA3itM,1777
+deepeval/prompt/prompt.py,sha256=w2BmKtSzXxobjSlBQqUjdAB0Zwe6IYaLjLg7KQvVDXE,21999
 deepeval/prompt/utils.py,sha256=Ermw9P-1-T5wQ5uYuj5yWgdj7pVB_JLw8D37Qvmh9ok,1938
 deepeval/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 deepeval/red_teaming/README.md,sha256=BY5rAdpp3-sMMToEKwq0Nsd9ivkGDzPE16DeDb8GY7U,154

@@ -434,7 +434,7 @@ deepeval/telemetry.py,sha256=JPZw1VBJ5dGiS8k-dzWs5OhMbNlr65QgVretTy33WCg,21704
 deepeval/test_case/__init__.py,sha256=hLkHxGH0-FFhx4MlJwIbzNHL4pgyLGquh8l0qD-z_cQ,731
 deepeval/test_case/arena_test_case.py,sha256=PcfDxadlc4yW4AEDdvN32AeUpx2Sms1jvnbX31Xu65o,957
 deepeval/test_case/conversational_test_case.py,sha256=lF0V1yCGCInQetggm2wbXx-MkuMRs2ScwqIXCSwb1Fs,7534
-deepeval/test_case/llm_test_case.py,sha256=
+deepeval/test_case/llm_test_case.py,sha256=L-dCvJ4pMPPavZTyN9ZKN30h351DWI_TunmXfHPIjig,12180
 deepeval/test_case/mcp.py,sha256=Z625NLvz0E_UJpbyfyuAi_4nsqKH6DByBf0rfKd70xU,1879
 deepeval/test_case/mllm_test_case.py,sha256=8a0YoE72geX_fLI6yk_cObSxCPddwW-DOb-5OPE1-W8,5414
 deepeval/test_case/utils.py,sha256=5lT7QmhItsQHt44-qQfspuktilcrEyvl2cS0cgUJxds,809

@@ -454,15 +454,15 @@ deepeval/tracing/offline_evals/thread.py,sha256=bcSGFcZJKnszArOLIlWvnCyt0zSmsd7X
 deepeval/tracing/offline_evals/trace.py,sha256=vTflaTKysKRiYvKA-Nx6PUJ3J6NrRLXiIdWieVcm90E,1868
 deepeval/tracing/otel/__init__.py,sha256=HQsaF5yLPwyW5qg8AOV81_nG_7pFHnatOTHi9Wx3HEk,88
 deepeval/tracing/otel/exporter.py,sha256=wPO1ITKpjueLOSNLO6nD2QL9LAd8Xcu6en8hRkB61Wo,28891
-deepeval/tracing/otel/utils.py,sha256=
+deepeval/tracing/otel/utils.py,sha256=yAXyPvTjax2HdLcvbVv9pyOVW4S7elIp3RLGuBTr_8o,15113
 deepeval/tracing/patchers.py,sha256=DAPNkhrDtoeyJIVeQDUMhTz-xGcXu00eqjQZmov8FiU,3096
 deepeval/tracing/perf_epoch_bridge.py,sha256=iyAPddB6Op7NpMtPHJ29lDm53Btz9yLaN6xSCfTRQm4,1825
-deepeval/tracing/tracing.py,sha256=
+deepeval/tracing/tracing.py,sha256=xZEyuxdGY259nQaDkGp_qO7Avriv8hrf4L15ZfeMNV8,42728
 deepeval/tracing/types.py,sha256=l_utWKerNlE5H3mOKpeUJLsvpP3cMyjH7HRANNgTmSQ,5306
-deepeval/tracing/utils.py,sha256=
+deepeval/tracing/utils.py,sha256=SLnks8apGlrV6uVnvFVl2mWYABEkvXbPXnQvq3KaU_o,7943
 deepeval/utils.py,sha256=-_o3W892u7naX4Y7a8if4mP0Rtkgtapg6Krr1ZBpj0o,17197
-deepeval-3.6.
-deepeval-3.6.
-deepeval-3.6.
-deepeval-3.6.
-deepeval-3.6.
+deepeval-3.6.3.dist-info/LICENSE.md,sha256=0ATkuLv6QgsJTBODUHC5Rak_PArA6gv2t7inJzNTP38,11352
+deepeval-3.6.3.dist-info/METADATA,sha256=BoRZ6BEBPwkypse9Xzw8gRlsezwSrDKsT5RO9C3thQc,18754
+deepeval-3.6.3.dist-info/WHEEL,sha256=d2fvjOD7sXsVzChCqf0Ty0JbHKBaLYwDbGQDwQTnJ50,88
+deepeval-3.6.3.dist-info/entry_points.txt,sha256=fVr8UphXTfJe9I2rObmUtfU3gkSrYeM0pLy-NbJYg10,94
+deepeval-3.6.3.dist-info/RECORD,,

{deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/LICENSE.md
File without changes

{deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/WHEEL
File without changes

{deepeval-3.6.1.dist-info → deepeval-3.6.3.dist-info}/entry_points.txt
File without changes