PyPI - judgeval - Versions diffs - 0.0.42__tar.gz → 0.0.44__tar.gz - Mend

judgeval 0.0.42__tar.gz → 0.0.44__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (179) hide show

{judgeval-0.0.42 → judgeval-0.0.44}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: judgeval
-Version: 0.0.42
+Version: 0.0.44
 Summary: Judgeval Package
 Project-URL: Homepage, https://github.com/JudgmentLabs/judgeval
 Project-URL: Issues, https://github.com/JudgmentLabs/judgeval/issues

{judgeval-0.0.42 → judgeval-0.0.44}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "judgeval"
-version = "0.0.42"
+version = "0.0.44"
 authors = [
     { name="Andrew Li", email="andrew@judgmentlabs.ai" },
     { name="Alex Shan", email="alex@judgmentlabs.ai" },

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/common/tracer.py RENAMED Viewed

@@ -1557,7 +1557,6 @@ class _DeepTracer:
 #         current_trace.record_output({"log": message})
 class Tracer:
-    _instance = None
     # Tracer.current_trace class variable is currently used in wrap()
     # TODO: Keep track of cross-context state for current trace and current span ID solely through class variables instead of instance variables?
@@ -1567,11 +1566,6 @@ class Tracer:
     trace_across_async_contexts: bool = False # BY default, we don't trace across async contexts
-    def __new__(cls, *args, **kwargs):
-        if cls._instance is None:
-            cls._instance = super(Tracer, cls).__new__(cls)
-        return cls._instance
     def __init__(
         self,
         api_key: str = os.getenv("JUDGMENT_API_KEY"),
@@ -1595,66 +1589,56 @@ class Tracer:
         span_flush_interval: float = 1.0,  # Time in seconds between automatic flushes
         span_num_workers: int = 10  # Number of worker threads for span processing
         ):
-        if not hasattr(self, 'initialized'):
-            if not api_key:
-                raise ValueError("Tracer must be configured with a Judgment API key")
-            result, response = validate_api_key(api_key)
-            if not result:
-                raise JudgmentAPIError(f"Issue with passed in Judgment API key: {response}")
-            if not organization_id:
-                raise ValueError("Tracer must be configured with an Organization ID")
-            if use_s3 and not s3_bucket_name:
-                raise ValueError("S3 bucket name must be provided when use_s3 is True")
-            self.api_key: str = api_key
-            self.project_name: str = project_name or str(uuid.uuid4())
-            self.organization_id: str = organization_id
-            self.rules: List[Rule] = rules or []  # Store rules at tracer level
-            self.traces: List[Trace] = []
-            self.initialized: bool = True
-            self.enable_monitoring: bool = enable_monitoring
-            self.enable_evaluations: bool = enable_evaluations
-            self.class_identifiers: Dict[str, str] = {}  # Dictionary to store class identifiers
-            self.span_id_to_previous_span_id: Dict[str, str] = {}
-            self.trace_id_to_previous_trace: Dict[str, TraceClient] = {}
-            self.current_span_id: Optional[str] = None
-            self.current_trace: Optional[TraceClient] = None
-            self.trace_across_async_contexts: bool = trace_across_async_contexts
-            Tracer.trace_across_async_contexts = trace_across_async_contexts
-            # Initialize S3 storage if enabled
-            self.use_s3 = use_s3
-            if use_s3:
-                from judgeval.common.s3_storage import S3Storage
-                self.s3_storage = S3Storage(
-                    bucket_name=s3_bucket_name,
-                    aws_access_key_id=s3_aws_access_key_id,
-                    aws_secret_access_key=s3_aws_secret_access_key,
-                    region_name=s3_region_name
-                )
-            self.offline_mode: bool = offline_mode
-            self.deep_tracing: bool = deep_tracing  # NEW: Store deep tracing setting
-            # Initialize background span service
-            self.enable_background_spans: bool = enable_background_spans
-            self.background_span_service: Optional[BackgroundSpanService] = None
-            if enable_background_spans and not offline_mode:
-                self.background_span_service = BackgroundSpanService(
-                    judgment_api_key=api_key,
-                    organization_id=organization_id,
-                    batch_size=span_batch_size,
-                    flush_interval=span_flush_interval,
-                    num_workers=span_num_workers
-                )
-        elif hasattr(self, 'project_name') and self.project_name != project_name:
-            warnings.warn(
-                f"Attempting to initialize Tracer with project_name='{project_name}' but it was already initialized with "
-                f"project_name='{self.project_name}'. Due to the singleton pattern, the original project_name will be used. "
-                "To use a different project name, ensure the first Tracer initialization uses the desired project name.",
-                RuntimeWarning
+        if not api_key:
+            raise ValueError("Tracer must be configured with a Judgment API key")
+        result, response = validate_api_key(api_key)
+        if not result:
+            raise JudgmentAPIError(f"Issue with passed in Judgment API key: {response}")
+        if not organization_id:
+            raise ValueError("Tracer must be configured with an Organization ID")
+        if use_s3 and not s3_bucket_name:
+            raise ValueError("S3 bucket name must be provided when use_s3 is True")
+        self.api_key: str = api_key
+        self.project_name: str = project_name or str(uuid.uuid4())
+        self.organization_id: str = organization_id
+        self.rules: List[Rule] = rules or []  # Store rules at tracer level
+        self.traces: List[Trace] = []
+        self.enable_monitoring: bool = enable_monitoring
+        self.enable_evaluations: bool = enable_evaluations
+        self.class_identifiers: Dict[str, str] = {}  # Dictionary to store class identifiers
+        self.span_id_to_previous_span_id: Dict[str, str] = {}
+        self.trace_id_to_previous_trace: Dict[str, TraceClient] = {}
+        self.current_span_id: Optional[str] = None
+        self.current_trace: Optional[TraceClient] = None
+        self.trace_across_async_contexts: bool = trace_across_async_contexts
+        Tracer.trace_across_async_contexts = trace_across_async_contexts
+        # Initialize S3 storage if enabled
+        self.use_s3 = use_s3
+        if use_s3:
+            from judgeval.common.s3_storage import S3Storage
+            self.s3_storage = S3Storage(
+                bucket_name=s3_bucket_name,
+                aws_access_key_id=s3_aws_access_key_id,
+                aws_secret_access_key=s3_aws_secret_access_key,
+                region_name=s3_region_name
+            )
+        self.offline_mode: bool = offline_mode
+        self.deep_tracing: bool = deep_tracing  # NEW: Store deep tracing setting
+        # Initialize background span service
+        self.enable_background_spans: bool = enable_background_spans
+        self.background_span_service: Optional[BackgroundSpanService] = None
+        if enable_background_spans and not offline_mode:
+            self.background_span_service = BackgroundSpanService(
+                judgment_api_key=api_key,
+                organization_id=organization_id,
+                batch_size=span_batch_size,
+                flush_interval=span_flush_interval,
+                num_workers=span_num_workers
             )
     def set_current_span(self, span_id: str):
@@ -2237,7 +2221,7 @@ def wrap(client: Any, trace_across_async_contexts: bool = Tracer.trace_across_as
     Supports OpenAI, Together, Anthropic, and Google GenAI clients.
     Patches both '.create' and Anthropic's '.stream' methods using a wrapper class.
     """
-    span_name, original_create, original_responses_create, original_stream = _get_client_config(client)
+    span_name, original_create, original_responses_create, original_stream, original_beta_parse = _get_client_config(client)
     def _get_current_trace():
         if trace_across_async_contexts:
@@ -2307,6 +2291,22 @@ def wrap(client: Any, trace_across_async_contexts: bool = Tracer.trace_across_as
                 _capture_exception_for_trace(span, sys.exc_info())
                 raise e
+    async def traced_beta_parse_async(*args, **kwargs):
+        current_trace = _get_current_trace()
+        if not current_trace:
+            return await original_beta_parse(*args, **kwargs)
+        with current_trace.span(span_name, span_type="llm") as span:
+            is_streaming = _record_input_and_check_streaming(span, kwargs)
+            try:
+                response_or_iterator = await original_beta_parse(*args, **kwargs)
+                return _format_and_record_output(span, response_or_iterator, is_streaming, True, False)
+            except Exception as e:
+                _capture_exception_for_trace(span, sys.exc_info())
+                raise e
     # Async responses for OpenAI clients
     async def traced_response_create_async(*args, **kwargs):
         current_trace = _get_current_trace()
@@ -2354,6 +2354,21 @@ def wrap(client: Any, trace_across_async_contexts: bool = Tracer.trace_across_as
             except Exception as e:
                 _capture_exception_for_trace(span, sys.exc_info())
                 raise e
+    def traced_beta_parse_sync(*args, **kwargs):
+        current_trace = _get_current_trace()
+        if not current_trace:
+            return original_beta_parse(*args, **kwargs)
+        with current_trace.span(span_name, span_type="llm") as span:
+            is_streaming = _record_input_and_check_streaming(span, kwargs)
+            try:
+                response_or_iterator = original_beta_parse(*args, **kwargs)
+                return _format_and_record_output(span, response_or_iterator, is_streaming, False, False)
+            except Exception as e:
+                _capture_exception_for_trace(span, sys.exc_info())
+                raise e
     def traced_response_create_sync(*args, **kwargs):
         current_trace = _get_current_trace()
@@ -2392,7 +2407,7 @@ def wrap(client: Any, trace_across_async_contexts: bool = Tracer.trace_across_as
         if hasattr(client, "responses") and hasattr(client.responses, "create"):
             client.responses.create = traced_response_create_async
         if hasattr(client, "beta") and hasattr(client.beta, "chat") and hasattr(client.beta.chat, "completions") and hasattr(client.beta.chat.completions, "parse"):
-            client.beta.chat.completions.parse = traced_create_async
+            client.beta.chat.completions.parse = traced_beta_parse_async
     elif isinstance(client, AsyncAnthropic):
         client.messages.create = traced_create_async
         if original_stream:
@@ -2404,7 +2419,7 @@ def wrap(client: Any, trace_across_async_contexts: bool = Tracer.trace_across_as
         if hasattr(client, "responses") and hasattr(client.responses, "create"):
             client.responses.create = traced_response_create_sync
         if hasattr(client, "beta") and hasattr(client.beta, "chat") and hasattr(client.beta.chat, "completions") and hasattr(client.beta.chat.completions, "parse"):
-            client.beta.chat.completions.parse = traced_create_sync
+            client.beta.chat.completions.parse = traced_beta_parse_sync
     elif isinstance(client, Anthropic):
         client.messages.create = traced_create_sync
         if original_stream:
@@ -2423,23 +2438,24 @@ def _get_client_config(client: ApiClient) -> tuple[str, callable, Optional[calla
         client: An instance of OpenAI, Together, or Anthropic client
     Returns:
-        tuple: (span_name, create_method, stream_method)
+        tuple: (span_name, create_method, responses_method, stream_method, beta_parse_method)
             - span_name: String identifier for tracing
             - create_method: Reference to the client's creation method
             - responses_method: Reference to the client's responses method (if applicable)
             - stream_method: Reference to the client's stream method (if applicable)
+            - beta_parse_method: Reference to the client's beta parse method (if applicable)
     Raises:
         ValueError: If client type is not supported
     """
     if isinstance(client, (OpenAI, AsyncOpenAI)):
-        return "OPENAI_API_CALL", client.chat.completions.create, client.responses.create, None
+        return "OPENAI_API_CALL", client.chat.completions.create, client.responses.create, None, client.beta.chat.completions.parse
     elif isinstance(client, (Together, AsyncTogether)):
-        return "TOGETHER_API_CALL", client.chat.completions.create, None, None
+        return "TOGETHER_API_CALL", client.chat.completions.create, None, None, None
     elif isinstance(client, (Anthropic, AsyncAnthropic)):
-        return "ANTHROPIC_API_CALL", client.messages.create, None, client.messages.stream
+        return "ANTHROPIC_API_CALL", client.messages.create, None, client.messages.stream, None
     elif isinstance(client, (genai.Client, genai.client.AsyncClient)):
-        return "GOOGLE_API_CALL", client.models.generate_content, None, None
+        return "GOOGLE_API_CALL", client.models.generate_content, None, None, None
     raise ValueError(f"Unsupported client type: {type(client)}")
 def _format_input_data(client: ApiClient, **kwargs) -> dict:
@@ -2449,10 +2465,13 @@ def _format_input_data(client: ApiClient, **kwargs) -> dict:
     to ensure consistent tracing across different APIs.
     """
     if isinstance(client, (OpenAI, Together, AsyncOpenAI, AsyncTogether)):
-        return {
+        input_data = {
             "model": kwargs.get("model"),
             "messages": kwargs.get("messages"),
         }
+        if kwargs.get("response_format"):
+            input_data["response_format"] = kwargs.get("response_format")
+        return input_data
     elif isinstance(client, (genai.Client, genai.client.AsyncClient)):
         return {
             "model": kwargs.get("model"),
@@ -2522,7 +2541,10 @@ def _format_output_data(client: ApiClient, response: Any) -> dict:
         model_name = response.model
         prompt_tokens = response.usage.prompt_tokens
         completion_tokens = response.usage.completion_tokens
-        message_content = response.choices[0].message.content
+        if hasattr(response.choices[0].message, "parsed") and response.choices[0].message.parsed:
+            message_content = response.choices[0].message.parsed
+        else:
+            message_content = response.choices[0].message.content
     elif isinstance(client, (genai.Client, genai.client.AsyncClient)):
         model_name = response.model_version
         prompt_tokens = response.usage_metadata.prompt_token_count

{judgeval-0.0.42 → judgeval-0.0.44}/.github/pull_request_template.md RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/.github/workflows/blocked-pr.yaml RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/.github/workflows/ci.yaml RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/.github/workflows/merge-branch-check.yaml RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/.github/workflows/release.yaml RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/.github/workflows/validate-branch.yaml RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/.gitignore RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/LICENSE.md RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/README.md RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/Screenshot 2025-05-17 at 8.14.27 PM.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/dataset_clustering_screenshot.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/dataset_clustering_screenshot_dm.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/datasets_preview_screenshot.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/experiments_dashboard_screenshot.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/experiments_page.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/experiments_pagev2.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/logo-dark.svg RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/logo-light.svg RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/monitoring_screenshot.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/new_darkmode.svg RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/new_lightmode.svg RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/trace_demo.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/assets/trace_screenshot.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/README.md RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/alerts/notifications.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/alerts/platform_notifications.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/alerts/rules.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/api_reference/judgment_client.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/api_reference/trace.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/changelog/2025-04-21.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/clustering/clustering.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/compliance/certifications.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/development.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/essentials/code.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/essentials/images.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/essentials/markdown.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/essentials/navigation.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/essentials/reusable-snippets.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/essentials/settings.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/data_datasets.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/data_examples.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/data_sequences.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/experiment_comparisons.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/introduction.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/judges.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/agent/derailment.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/classifier_scorer.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/custom_scorers.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/answer_correctness.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/answer_relevancy.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/comparison.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/contextual_precision.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/contextual_recall.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/contextual_relevancy.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/execution_order.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/faithfulness.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/groundedness.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/json_correctness.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/default/summarization.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/scorers/introduction.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/evaluation/unit_testing.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/favicon.svg RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/getting_started.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/annotation_queue_ui.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/basic_trace_example.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/checks-passed.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/cluster.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/cluster_button.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/create_aggressive_scorer.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/create_scorer.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/dashboard_annotation_queue_button.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/evaluation_diagram.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/experiment-comparison-page-2.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/experiment-page-comparison.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/experiment-popout-comparison.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/experiments-page-comparison-2.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/experiments-page-comparison.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/export-dataset.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/hero-dark.svg RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/hero-light.svg RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/notifications_page.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/online_eval_fault.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/reports_modal.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/synth_data_button.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/synth_data_window.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/images/trace_ss.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/integration/langgraph.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/introduction.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/judgment_cli/installation.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/judgment_cli/self-hosting.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/judgment_cli/supabase-org-id.png RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/logo/dark.svg RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/logo/light.svg RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/mint.json RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/monitoring/annotations.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/monitoring/introduction.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/monitoring/production_insights.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/monitoring/tracing.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/monitoring/tracing_s3.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/notebooks/create_dataset.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/notebooks/create_scorer.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/notebooks/demo.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/notebooks/prompt_scorer.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/notebooks/quickstart.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/optimization/osiris_agent.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/quickstart.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/self_hosting/get_started.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/snippets/snippet-intro.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/docs/synthetic_data/synthetic_data.mdx RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/pytest.ini RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/.coveragerc RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/clients.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/common/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/common/exceptions.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/common/logger.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/common/s3_storage.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/common/utils.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/constants.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/custom_example.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/datasets/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/datasets/dataset.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/datasets/eval_dataset_client.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/example.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/result.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/scorer_data.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/tool.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/trace.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/data/trace_run.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/evaluation_run.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/integrations/langgraph.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/judges/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/judges/base_judge.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/judges/litellm_judge.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/judges/mixture_of_judges.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/judges/together_judge.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/judges/utils.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/judgment_client.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/rules.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/run_evaluation.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/api_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/exceptions.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/answer_correctness.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/answer_relevancy.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/classifier_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/comparison.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/contextual_precision.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/contextual_recall.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/contextual_relevancy.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/derailment_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/execution_order.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/faithfulness.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/groundedness.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/hallucination.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/instruction_adherence.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/json_correctness.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/summarization.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/tool_dependency.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/api_scorers/tool_order.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/classifiers/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/classifiers/text2sql/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/judgeval_scorers/classifiers/text2sql/text2sql_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/prompt_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/score.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/scorers/utils.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/tracer/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/utils/alerts.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/utils/data_utils.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/src/judgeval/version_check.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/update_version.py RENAMED Viewed

File without changes

{judgeval-0.0.42 → judgeval-0.0.44}/uv.lock RENAMED Viewed

File without changes

judgeval 0.0.42__tar.gz → 0.0.44__tar.gz

judgeval 0.0.42__tar.gz → 0.0.44__tar.gz