PyPI - judgeval - Versions diffs - 0.0.13__tar.gz → 0.0.14__tar.gz - Mend

judgeval 0.0.13.tar.gz → 0.0.14.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (162)

{judgeval-0.0.13 → judgeval-0.0.14}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: judgeval
-Version: 0.0.13
+Version: 0.0.14
 Summary: Judgeval Package
 Project-URL: Homepage, https://github.com/JudgmentLabs/judgeval
 Project-URL: Issues, https://github.com/JudgmentLabs/judgeval/issues

{judgeval-0.0.13 → judgeval-0.0.14}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "judgeval"
-version = "0.0.13"
+version = "0.0.14"
 authors = [
     { name="Andrew Li", email="andrew@judgmentlabs.ai" },
     { name="Alex Shan", email="alex@judgmentlabs.ai" },

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/openai_travel_agent/agent.py RENAMED Viewed

@@ -50,7 +50,7 @@ async def get_flights(destination):
     judgment.get_current_trace().async_evaluate(
         scorers=[AnswerRelevancyScorer(threshold=0.5)],
         input=prompt,
-        actual_output=flights_search,
+        actual_output=flights_search["results"],
         model="gpt-4",
     )
     return flights_search
@@ -63,7 +63,7 @@ async def get_weather(destination, start_date, end_date):
     judgment.get_current_trace().async_evaluate(
         scorers=[AnswerRelevancyScorer(threshold=0.5)],
         input=prompt,
-        actual_output=weather_search,
+        actual_output=weather_search["results"],
         model="gpt-4",
     )
     return weather_search

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/common/tracer.py RENAMED Viewed

@@ -188,8 +188,9 @@ class TraceManagerClient:
     - Saving a trace
     - Deleting a trace
     """
-    def __init__(self, judgment_api_key: str):
+    def __init__(self, judgment_api_key: str, organization_id: str):
         self.judgment_api_key = judgment_api_key
+        self.organization_id = organization_id
     def fetch_trace(self, trace_id: str):
         """
@@ -199,11 +200,11 @@ class TraceManagerClient:
             JUDGMENT_TRACES_FETCH_API_URL,
             json={
                 "trace_id": trace_id,
-                # "judgment_api_key": self.judgment_api_key,
             },
             headers={
                 "Content-Type": "application/json",
-                "Authorization": f"Bearer {self.judgment_api_key}"
+                "Authorization": f"Bearer {self.judgment_api_key}",
+                "X-Organization-Id": self.organization_id
             }
         )
@@ -226,7 +227,8 @@ class TraceManagerClient:
             json=trace_data,
             headers={
                 "Content-Type": "application/json",
-                "Authorization": f"Bearer {self.judgment_api_key}"
+                "Authorization": f"Bearer {self.judgment_api_key}",
+                "X-Organization-Id": self.organization_id
             }
         )
@@ -245,12 +247,12 @@ class TraceManagerClient:
         response = requests.delete(
             JUDGMENT_TRACES_DELETE_API_URL,
             json={
-                "judgment_api_key": self.judgment_api_key,
                 "trace_ids": [trace_id],
             },
             headers={
                 "Content-Type": "application/json",
-                "Authorization": f"Bearer {self.judgment_api_key}"
+                "Authorization": f"Bearer {self.judgment_api_key}",
+                "X-Organization-Id": self.organization_id
             }
         )
@@ -266,12 +268,12 @@ class TraceManagerClient:
         response = requests.delete(
             JUDGMENT_TRACES_DELETE_API_URL,
             json={
-                # "judgment_api_key": self.judgment_api_key,
                 "trace_ids": trace_ids,
             },
             headers={
                 "Content-Type": "application/json",
-                "Authorization": f"Bearer {self.judgment_api_key}"
+                "Authorization": f"Bearer {self.judgment_api_key}",
+                "X-Organization-Id": self.organization_id
             }
         )
@@ -294,7 +296,7 @@ class TraceClient:
         self.span_type = None
         self._current_span: Optional[TraceEntry] = None
         self.overwrite = overwrite
-        self.trace_manager_client = TraceManagerClient(tracer.api_key)  # Manages DB operations for trace data
+        self.trace_manager_client = TraceManagerClient(tracer.api_key, tracer.organization_id)  # Manages DB operations for trace data
     @contextmanager
     def span(self, name: str, span_type: SpanType = "span"):
@@ -371,6 +373,7 @@ class TraceClient:
             raise ValueError(f"Failed to load scorers: {str(e)}")
         eval_run = EvaluationRun(
+            organization_id=self.tracer.organization_id,
             log_results=log_results,
             project_name=self.project_name,
             eval_name=f"{self.name.capitalize()}-"
@@ -546,7 +549,6 @@ class TraceClient:
         # Create trace document
         trace_data = {
             "trace_id": self.trace_id,
-            "api_key": self.tracer.api_key,
             "name": self.name,
             "project_name": self.project_name,
             "created_at": datetime.fromtimestamp(self.start_time).isoformat(),
@@ -568,6 +570,8 @@ class TraceClient:
             channel = connection.channel()
             channel.queue_declare(queue=RABBITMQ_QUEUE, durable=True)
+            trace_data["judgment_api_key"] = self.tracer.api_key
+            trace_data["organization_id"] = self.tracer.organization_id
             channel.basic_publish(
                 exchange='',
@@ -580,25 +584,6 @@ class TraceClient:
         self.trace_manager_client.save_trace(trace_data, empty_save)
-        # Save trace data by making POST request to API
-        response = requests.post(
-            JUDGMENT_TRACES_SAVE_API_URL,
-            json=trace_data,
-            headers={
-                "Content-Type": "application/json",
-                "Authorization": f"Bearer {self.tracer.api_key}"  # Bearer token format
-            }
-        )
-        if response.status_code == HTTPStatus.BAD_REQUEST:
-            raise ValueError(f"Failed to save trace data: Check your Trace name for conflicts, set overwrite=True to overwrite existing traces: {response.text}")
-        elif response.status_code != HTTPStatus.OK:
-            raise ValueError(f"Failed to save trace data: {response.text}")
-        if not empty_save and "ui_results_url" in response.json():
-            rprint(f"\n🔍 You can view your trace data here: [rgb(106,0,255)]{response.json()['ui_results_url']}[/]\n")
         return self.trace_id, trace_data
     def delete(self):
@@ -612,14 +597,18 @@ class Tracer:
             cls._instance = super(Tracer, cls).__new__(cls)
         return cls._instance
-    def __init__(self, api_key: str = os.getenv("JUDGMENT_API_KEY"), project_name: str = "default_project"):
+    def __init__(self, api_key: str = os.getenv("JUDGMENT_API_KEY"), project_name: str = "default_project", organization_id: str = os.getenv("ORGANIZATION_ID")):
         if not hasattr(self, 'initialized'):
             if not api_key:
                 raise ValueError("Tracer must be configured with a Judgment API key")
+            if not organization_id:
+                raise ValueError("Tracer must be configured with an Organization ID")
             self.api_key: str = api_key
             self.project_name: str = project_name
             self.client: JudgmentClient = JudgmentClient(judgment_api_key=api_key)
+            self.organization_id: str = organization_id
             self.depth: int = 0
             self._current_trace: Optional[str] = None
             self.initialized: bool = True

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/datasets/dataset.py RENAMED Viewed

@@ -17,9 +17,10 @@ class EvalDataset:
     _alias: Union[str, None] = field(default=None)
     _id: Union[str, None] = field(default=None)
     judgment_api_key: str = field(default="")
+    organization_id: str = field(default="")
     def __init__(self,
                  judgment_api_key: str = os.getenv("JUDGMENT_API_KEY"),
+                 organization_id: str = os.getenv("ORGANIZATION_ID"),
                  ground_truths: List[GroundTruthExample] = [],
                  examples: List[Example] = [],
                  ):
@@ -31,7 +32,7 @@ class EvalDataset:
         self._alias = None
         self._id = None
         self.judgment_api_key = judgment_api_key
+        self.organization_id = organization_id
     def add_from_json(self, file_path: str) -> None:
         debug(f"Loading dataset from JSON file: {file_path}")

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/datasets/eval_dataset_client.py RENAMED Viewed

@@ -19,8 +19,9 @@ from judgeval.data.datasets.ground_truth import GroundTruthExample
 class EvalDatasetClient:
-    def __init__(self, judgment_api_key: str):
+    def __init__(self, judgment_api_key: str, organization_id: str):
         self.judgment_api_key = judgment_api_key
+        self.organization_id = organization_id
     def create_dataset(self) -> EvalDataset:
         return EvalDataset(judgment_api_key=self.judgment_api_key)
@@ -58,7 +59,6 @@ class EvalDatasetClient:
                     "ground_truths": [g.to_dict() for g in dataset.ground_truths],
                     "examples": [e.to_dict() for e in dataset.examples],
                     "overwrite": overwrite,
-                    # "judgment_api_key": dataset.judgment_api_key
                 }
             try:
                 response = requests.post(
@@ -66,7 +66,8 @@ class EvalDatasetClient:
                     json=content,
                     headers={
                         "Content-Type": "application/json",
-                        "Authorization": f"Bearer {self.judgment_api_key}"
+                        "Authorization": f"Bearer {self.judgment_api_key}",
+                        "X-Organization-Id": self.organization_id
                     }
                 )
                 if response.status_code == 500:
@@ -121,7 +122,6 @@ class EvalDatasetClient:
                 )
                 request_body = {
                     "alias": alias,
-                    # "judgment_api_key": self.judgment_api_key
                 }
                 try:
@@ -130,7 +130,8 @@ class EvalDatasetClient:
                         json=request_body,
                         headers={
                             "Content-Type": "application/json",
-                            "Authorization": f"Bearer {self.judgment_api_key}"
+                            "Authorization": f"Bearer {self.judgment_api_key}",
+                            "X-Organization-Id": self.organization_id
                         }
                     )
                     response.raise_for_status()
@@ -179,7 +180,6 @@ class EvalDatasetClient:
                     total=100,
                 )
                 request_body = {
-                    # "judgment_api_key": self.judgment_api_key
                 }
                 try:
@@ -188,7 +188,8 @@ class EvalDatasetClient:
                         json=request_body,
                         headers={
                             "Content-Type": "application/json",
-                            "Authorization": f"Bearer {self.judgment_api_key}"
+                            "Authorization": f"Bearer {self.judgment_api_key}",
+                            "X-Organization-Id": self.organization_id
                         }
                     )
                     response.raise_for_status()
@@ -238,7 +239,12 @@ class EvalDatasetClient:
             try:
                 response = requests.post(
                     JUDGMENT_DATASETS_EDIT_API_URL,
-                    json=content
+                    json=content,
+                    headers={
+                        "Content-Type": "application/json",
+                        "Authorization": f"Bearer {self.judgment_api_key}",
+                        "X-Organization-Id": self.organization_id
+                    }
                 )
                 response.raise_for_status()
             except requests.exceptions.RequestException as e:
@@ -266,7 +272,8 @@ class EvalDatasetClient:
                     json={"alias": alias},
                     headers={
                         "Content-Type": "application/json",
-                        "Authorization": f"Bearer {self.judgment_api_key}"
+                        "Authorization": f"Bearer {self.judgment_api_key}",
+                        "X-Organization-Id": self.organization_id
                     },
                     stream=True
                 )

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/example.py RENAMED Viewed

@@ -5,7 +5,7 @@ Classes for representing examples in a dataset.
 from typing import TypeVar, Optional, Any, Dict, List
 from uuid import uuid4
-from pydantic import BaseModel, Field
+from pydantic import BaseModel, Field, field_validator
 from enum import Enum
 from datetime import datetime
 import time
@@ -40,6 +40,13 @@ class Example(BaseModel):
     timestamp: Optional[str] = None
     trace_id: Optional[str] = None
+    @field_validator('input', 'actual_output', mode='before')
+    def convert_to_str(cls, value):
+        try:
+            return str(value)
+        except Exception:
+            return repr(value)
     def __init__(self, **data):
         if 'example_id' not in data:
             data['example_id'] = str(uuid4())

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/evaluation_run.py RENAMED Viewed

@@ -24,6 +24,7 @@ class EvaluationRun(BaseModel):
     # The user will specify whether they want log_results when they call run_eval
     log_results: bool = False  # NOTE: log_results has to be set first because it is used to validate project_name and eval_name
+    organization_id: Optional[str] = None
     project_name: Optional[str] = None
     eval_name: Optional[str] = None
     examples: List[Example]

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/judgment_client.py RENAMED Viewed

@@ -34,9 +34,10 @@ class EvalRunRequestBody(BaseModel):
 class JudgmentClient:
-    def __init__(self, judgment_api_key: str = os.getenv("JUDGMENT_API_KEY")):
+    def __init__(self, judgment_api_key: str = os.getenv("JUDGMENT_API_KEY"), organization_id: str = os.getenv("ORGANIZATION_ID")):
         self.judgment_api_key = judgment_api_key
-        self.eval_dataset_client = EvalDatasetClient(judgment_api_key)
+        self.organization_id = organization_id
+        self.eval_dataset_client = EvalDatasetClient(judgment_api_key, organization_id)
         # Verify API key is valid
         result, response = self._validate_api_key()
@@ -78,7 +79,8 @@ class JudgmentClient:
                 model=model,
                 aggregator=aggregator,
                 metadata=metadata,
-                judgment_api_key=self.judgment_api_key
+                judgment_api_key=self.judgment_api_key,
+                organization_id=self.organization_id
             )
             return run_eval(eval, override)
         except ValueError as e:
@@ -115,7 +117,8 @@ class JudgmentClient:
                 model=model,
                 aggregator=aggregator,
                 metadata=metadata,
-                judgment_api_key=self.judgment_api_key
+                judgment_api_key=self.judgment_api_key,
+                organization_id=self.organization_id
             )
             return run_eval(evaluation_run)
         except ValueError as e:
@@ -189,7 +192,8 @@ class JudgmentClient:
         eval_run = requests.post(JUDGMENT_EVAL_FETCH_API_URL,
                                  headers={
                                     "Content-Type": "application/json",
-                                    "Authorization": f"Bearer {self.judgment_api_key}"
+                                    "Authorization": f"Bearer {self.judgment_api_key}",
+                                    "X-Organization-Id": self.organization_id
                                  },
                                  json=eval_run_request_body.model_dump())
         if eval_run.status_code != requests.codes.ok:
@@ -222,7 +226,8 @@ class JudgmentClient:
                         json=eval_run_request_body.model_dump(),
                         headers={
                             "Content-Type": "application/json",
-                            "Authorization": f"Bearer {self.judgment_api_key}"
+                            "Authorization": f"Bearer {self.judgment_api_key}",
+                            "X-Organization-Id": self.organization_id
                         })
         if response.status_code != requests.codes.ok:
             raise ValueError(f"Error deleting eval results: {response.json()}")
@@ -241,11 +246,12 @@ class JudgmentClient:
         response = requests.delete(JUDGMENT_EVAL_DELETE_PROJECT_API_URL,
                         json={
                             "project_name": project_name,
-                            "judgment_api_key": self.judgment_api_key
+                            "judgment_api_key": self.judgment_api_key,
                         },
                         headers={
                             "Content-Type": "application/json",
-                            "Authorization": f"Bearer {self.judgment_api_key}"
+                            "Authorization": f"Bearer {self.judgment_api_key}",
+                            "X-Organization-Id": self.organization_id
                         })
         if response.status_code != requests.codes.ok:
             raise ValueError(f"Error deleting eval results: {response.json()}")
@@ -283,7 +289,6 @@ class JudgmentClient:
         """
         request_body = {
             "slug": slug,
-            # "judgment_api_key": self.judgment_api_key
         }
         response = requests.post(
@@ -291,7 +296,8 @@ class JudgmentClient:
             json=request_body,
             headers={
                 "Content-Type": "application/json",
-                "Authorization": f"Bearer {self.judgment_api_key}"
+                "Authorization": f"Bearer {self.judgment_api_key}",
+                "X-Organization-Id": self.organization_id
             }
         )
@@ -325,7 +331,6 @@ class JudgmentClient:
             "name": scorer.name,
             "conversation": scorer.conversation,
             "options": scorer.options,
-            # "judgment_api_key": self.judgment_api_key,
             "slug": slug
         }
@@ -334,7 +339,8 @@ class JudgmentClient:
             json=request_body,
             headers={
                 "Content-Type": "application/json",
-                "Authorization": f"Bearer {self.judgment_api_key}"
+                "Authorization": f"Bearer {self.judgment_api_key}",
+                "X-Organization-Id": self.organization_id
             }
         )

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/run_evaluation.py RENAMED Viewed

@@ -50,7 +50,8 @@ def execute_api_eval(evaluation_run: EvaluationRun) -> List[Dict]:
         response = requests.post(
             JUDGMENT_EVAL_API_URL, headers={
             "Content-Type": "application/json",
-            "Authorization": f"Bearer {evaluation_run.judgment_api_key}"
+            "Authorization": f"Bearer {evaluation_run.judgment_api_key}",
+            "X-Organization-Id": evaluation_run.organization_id
         },
         json=payload)
         response_data = response.json()
@@ -140,7 +141,7 @@ def check_missing_scorer_data(results: List[ScoringResult]) -> List[ScoringResul
     return results
-def check_eval_run_name_exists(eval_name: str, project_name: str, judgment_api_key: str) -> None:
+def check_eval_run_name_exists(eval_name: str, project_name: str, judgment_api_key: str, organization_id: str) -> None:
     """
     Checks if an evaluation run name already exists for a given project.
@@ -158,7 +159,8 @@ def check_eval_run_name_exists(eval_name: str, project_name: str, judgment_api_k
             f"{ROOT_API}/eval-run-name-exists/",
             headers={
                 "Content-Type": "application/json",
-                "Authorization": f"Bearer {judgment_api_key}"
+                "Authorization": f"Bearer {judgment_api_key}",
+                "X-Organization-Id": organization_id
             },
             json={
                 "eval_name": eval_name,
@@ -199,11 +201,11 @@ def log_evaluation_results(merged_results: List[ScoringResult], evaluation_run:
             JUDGMENT_EVAL_LOG_API_URL,
             headers={
                 "Content-Type": "application/json",
-                "Authorization": f"Bearer {evaluation_run.judgment_api_key}"
+                "Authorization": f"Bearer {evaluation_run.judgment_api_key}",
+                "X-Organization-Id": evaluation_run.organization_id
             },
             json={
                 "results": [result.to_dict() for result in merged_results],
-                "judgment_api_key": evaluation_run.judgment_api_key,
                 "project_name": evaluation_run.project_name,
                 "eval_name": evaluation_run.eval_name,
             }
@@ -254,7 +256,8 @@ def run_eval(evaluation_run: EvaluationRun, override: bool = False) -> List[Scor
         check_eval_run_name_exists(
             evaluation_run.eval_name,
             evaluation_run.project_name,
-            evaluation_run.judgment_api_key
+            evaluation_run.judgment_api_key,
+            evaluation_run.organization_id
         )
     # Set example IDs if not already set
@@ -312,6 +315,7 @@ def run_eval(evaluation_run: EvaluationRun, override: bool = False) -> List[Scor
                 aggregator=evaluation_run.aggregator,
                 metadata=evaluation_run.metadata,
                 judgment_api_key=evaluation_run.judgment_api_key,
+                organization_id=evaluation_run.organization_id,
                 log_results=evaluation_run.log_results
             )
             debug("Sending request to Judgment API")

{judgeval-0.0.13 → judgeval-0.0.14}/.github/workflows/ci.yaml RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/.gitignore RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/LICENSE.md RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/Pipfile RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/Pipfile.lock RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/README.md RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/README.md RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/api_reference/judgment_client.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/api_reference/trace.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/development.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/essentials/code.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/essentials/images.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/essentials/markdown.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/essentials/navigation.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/essentials/reusable-snippets.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/essentials/settings.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/data_datasets.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/data_examples.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/introduction.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/judges.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/answer_correctness.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/answer_relevancy.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/classifier_scorer.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/contextual_precision.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/contextual_recall.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/contextual_relevancy.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/custom_scorers.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/faithfulness.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/hallucination.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/introduction.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/json_correctness.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/summarization.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/scorers/tool_correctness.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/evaluation/unit_testing.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/favicon.svg RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/getting_started.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/images/basic_trace_example.png RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/images/checks-passed.png RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/images/create_aggressive_scorer.png RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/images/create_scorer.png RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/images/evaluation_diagram.png RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/images/hero-dark.svg RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/images/hero-light.svg RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/images/trace_screenshot.png RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/introduction.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/judgment/introduction.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/logo/dark.svg RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/logo/light.svg RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/mint.json RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/monitoring/introduction.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/monitoring/production_insights.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/monitoring/tracing.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/notebooks/create_dataset.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/notebooks/create_scorer.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/notebooks/demo.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/notebooks/prompt_scorer.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/notebooks/quickstart.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/quickstart.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/docs/snippets/snippet-intro.mdx RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/pytest.ini RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/ci_testing/ci_testing.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/ci_testing/travel_response.txt RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/custom_scorers/competitor_mentions.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/custom_scorers/text2sql.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/langchain_basic_rag/basic_agentic_rag.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/langchain_basic_rag/tesla_q3.pdf RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/langchain_sales/example_product_price_id_mapping.json RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/langchain_sales/sales_agent_with_context.ipynb RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/langchain_sales/sample_product_catalog.txt RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/new_bot/basic_bot.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/openai_travel_agent/populate_db.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/cookbooks/openai_travel_agent/tools.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/customer_use/cstone/basic_test.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/customer_use/cstone/cstone_data.csv RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/customer_use/cstone/data.csv RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/customer_use/cstone/faithfulness_testing.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/customer_use/cstone/galen_data.csv RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/customer_use/cstone/playground.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/demo/customer_use/cstone/results.csv RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/clients.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/common/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/common/exceptions.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/common/logger.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/common/utils.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/constants.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/api_example.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/datasets/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/datasets/ground_truth.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/datasets/utils.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/result.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/data/scorer_data.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/judges/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/judges/base_judge.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/judges/litellm_judge.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/judges/mixture_of_judges.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/judges/together_judge.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/judges/utils.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/api_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/base_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/exceptions.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/answer_correctness.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/answer_relevancy.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/contextual_precision.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/contextual_recall.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/contextual_relevancy.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/faithfulness.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/hallucination.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/json_correctness.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/summarization.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/api_scorers/tool_correctness.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/classifiers/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/classifiers/text2sql/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/classifiers/text2sql/text2sql_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/answer_correctness_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/prompts.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/answer_relevancy_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/prompts.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/contextual_precision_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/prompts.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/contextual_recall_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/prompts.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/contextual_relevancy_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/prompts.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/faithfulness_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/prompts.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/hallucination/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/hallucination/hallucination_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/hallucination/prompts.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/json_correctness/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/json_correctness/json_correctness_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/summarization/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/summarization/prompts.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/summarization/summarization_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/tool_correctness/__init__.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/judgeval_scorers/local_implementations/tool_correctness/tool_correctness_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/prompt_scorer.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/score.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/scorers/utils.py RENAMED Viewed

File without changes

{judgeval-0.0.13 → judgeval-0.0.14}/src/judgeval/tracer/__init__.py RENAMED Viewed

File without changes

judgeval 0.0.13__tar.gz → 0.0.14__tar.gz

judgeval 0.0.13.tar.gz → 0.0.14.tar.gz