PyPI - arize - Versions diffs - 8.0.0a22__py3-none-any.whl → 8.0.0b0__py3-none-any.whl - Mend

arize 8.0.0a22__py3-none-any.whl → 8.0.0b0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (171) hide show

arize/__init__.py +28 -19
arize/_exporter/client.py +56 -37
arize/_exporter/parsers/tracing_data_parser.py +41 -30
arize/_exporter/validation.py +3 -3
arize/_flight/client.py +207 -76
arize/_generated/api_client/__init__.py +30 -6
arize/_generated/api_client/api/__init__.py +1 -0
arize/_generated/api_client/api/datasets_api.py +864 -190
arize/_generated/api_client/api/experiments_api.py +167 -131
arize/_generated/api_client/api/projects_api.py +1197 -0
arize/_generated/api_client/api_client.py +2 -2
arize/_generated/api_client/configuration.py +42 -34
arize/_generated/api_client/exceptions.py +2 -2
arize/_generated/api_client/models/__init__.py +15 -4
arize/_generated/api_client/models/dataset.py +10 -10
arize/_generated/api_client/models/dataset_example.py +111 -0
arize/_generated/api_client/models/dataset_example_update.py +100 -0
arize/_generated/api_client/models/dataset_version.py +13 -13
arize/_generated/api_client/models/datasets_create_request.py +16 -8
arize/_generated/api_client/models/datasets_examples_insert_request.py +100 -0
arize/_generated/api_client/models/datasets_examples_list200_response.py +106 -0
arize/_generated/api_client/models/datasets_examples_update_request.py +102 -0
arize/_generated/api_client/models/datasets_list200_response.py +10 -4
arize/_generated/api_client/models/experiment.py +14 -16
arize/_generated/api_client/models/experiment_run.py +108 -0
arize/_generated/api_client/models/experiment_run_create.py +102 -0
arize/_generated/api_client/models/experiments_create_request.py +16 -10
arize/_generated/api_client/models/experiments_list200_response.py +10 -4
arize/_generated/api_client/models/experiments_runs_list200_response.py +19 -5
arize/_generated/api_client/models/{error.py → pagination_metadata.py} +13 -11
arize/_generated/api_client/models/primitive_value.py +172 -0
arize/_generated/api_client/models/problem.py +100 -0
arize/_generated/api_client/models/project.py +99 -0
arize/_generated/api_client/models/{datasets_list_examples200_response.py → projects_create_request.py} +13 -11
arize/_generated/api_client/models/projects_list200_response.py +106 -0
arize/_generated/api_client/rest.py +2 -2
arize/_generated/api_client/test/test_dataset.py +4 -2
arize/_generated/api_client/test/test_dataset_example.py +56 -0
arize/_generated/api_client/test/test_dataset_example_update.py +52 -0
arize/_generated/api_client/test/test_dataset_version.py +7 -2
arize/_generated/api_client/test/test_datasets_api.py +27 -13
arize/_generated/api_client/test/test_datasets_create_request.py +8 -4
arize/_generated/api_client/test/{test_datasets_list_examples200_response.py → test_datasets_examples_insert_request.py} +19 -15
arize/_generated/api_client/test/test_datasets_examples_list200_response.py +66 -0
arize/_generated/api_client/test/test_datasets_examples_update_request.py +61 -0
arize/_generated/api_client/test/test_datasets_list200_response.py +9 -3
arize/_generated/api_client/test/test_experiment.py +2 -4
arize/_generated/api_client/test/test_experiment_run.py +56 -0
arize/_generated/api_client/test/test_experiment_run_create.py +54 -0
arize/_generated/api_client/test/test_experiments_api.py +6 -6
arize/_generated/api_client/test/test_experiments_create_request.py +9 -6
arize/_generated/api_client/test/test_experiments_list200_response.py +9 -5
arize/_generated/api_client/test/test_experiments_runs_list200_response.py +15 -5
arize/_generated/api_client/test/test_pagination_metadata.py +53 -0
arize/_generated/api_client/test/{test_error.py → test_primitive_value.py} +13 -14
arize/_generated/api_client/test/test_problem.py +57 -0
arize/_generated/api_client/test/test_project.py +58 -0
arize/_generated/api_client/test/test_projects_api.py +59 -0
arize/_generated/api_client/test/test_projects_create_request.py +54 -0
arize/_generated/api_client/test/test_projects_list200_response.py +70 -0
arize/_generated/api_client_README.md +43 -29
arize/_generated/protocol/flight/flight_pb2.py +400 -0
arize/_lazy.py +27 -19
arize/client.py +181 -58
arize/config.py +324 -116
arize/constants/__init__.py +1 -0
arize/constants/config.py +11 -4
arize/constants/ml.py +6 -4
arize/constants/openinference.py +2 -0
arize/constants/pyarrow.py +2 -0
arize/constants/spans.py +3 -1
arize/datasets/__init__.py +1 -0
arize/datasets/client.py +304 -84
arize/datasets/errors.py +32 -2
arize/datasets/validation.py +18 -8
arize/embeddings/__init__.py +2 -0
arize/embeddings/auto_generator.py +23 -19
arize/embeddings/base_generators.py +89 -36
arize/embeddings/constants.py +2 -0
arize/embeddings/cv_generators.py +26 -4
arize/embeddings/errors.py +27 -5
arize/embeddings/nlp_generators.py +43 -18
arize/embeddings/tabular_generators.py +46 -31
arize/embeddings/usecases.py +12 -2
arize/exceptions/__init__.py +1 -0
arize/exceptions/auth.py +11 -1
arize/exceptions/base.py +29 -4
arize/exceptions/models.py +21 -2
arize/exceptions/parameters.py +31 -0
arize/exceptions/spaces.py +12 -1
arize/exceptions/types.py +86 -7
arize/exceptions/values.py +220 -20
arize/experiments/__init__.py +13 -0
arize/experiments/client.py +394 -285
arize/experiments/evaluators/__init__.py +1 -0
arize/experiments/evaluators/base.py +74 -41
arize/experiments/evaluators/exceptions.py +6 -3
arize/experiments/evaluators/executors.py +121 -73
arize/experiments/evaluators/rate_limiters.py +106 -57
arize/experiments/evaluators/types.py +34 -7
arize/experiments/evaluators/utils.py +65 -27
arize/experiments/functions.py +103 -101
arize/experiments/tracing.py +52 -44
arize/experiments/types.py +56 -31
arize/logging.py +54 -22
arize/ml/__init__.py +1 -0
arize/ml/batch_validation/__init__.py +1 -0
arize/{models → ml}/batch_validation/errors.py +545 -67
arize/{models → ml}/batch_validation/validator.py +344 -303
arize/ml/bounded_executor.py +47 -0
arize/{models → ml}/casting.py +118 -108
arize/{models → ml}/client.py +339 -118
arize/{models → ml}/proto.py +97 -42
arize/{models → ml}/stream_validation.py +43 -15
arize/ml/surrogate_explainer/__init__.py +1 -0
arize/{models → ml}/surrogate_explainer/mimic.py +25 -10
arize/{types.py → ml/types.py} +355 -354
arize/pre_releases.py +44 -0
arize/projects/__init__.py +1 -0
arize/projects/client.py +134 -0
arize/regions.py +40 -0
arize/spans/__init__.py +1 -0
arize/spans/client.py +204 -175
arize/spans/columns.py +13 -0
arize/spans/conversion.py +60 -37
arize/spans/validation/__init__.py +1 -0
arize/spans/validation/annotations/__init__.py +1 -0
arize/spans/validation/annotations/annotations_validation.py +6 -4
arize/spans/validation/annotations/dataframe_form_validation.py +13 -11
arize/spans/validation/annotations/value_validation.py +35 -11
arize/spans/validation/common/__init__.py +1 -0
arize/spans/validation/common/argument_validation.py +33 -8
arize/spans/validation/common/dataframe_form_validation.py +35 -9
arize/spans/validation/common/errors.py +211 -11
arize/spans/validation/common/value_validation.py +81 -14
arize/spans/validation/evals/__init__.py +1 -0
arize/spans/validation/evals/dataframe_form_validation.py +28 -8
arize/spans/validation/evals/evals_validation.py +34 -4
arize/spans/validation/evals/value_validation.py +26 -3
arize/spans/validation/metadata/__init__.py +1 -1
arize/spans/validation/metadata/argument_validation.py +14 -5
arize/spans/validation/metadata/dataframe_form_validation.py +26 -10
arize/spans/validation/metadata/value_validation.py +24 -10
arize/spans/validation/spans/__init__.py +1 -0
arize/spans/validation/spans/dataframe_form_validation.py +35 -14
arize/spans/validation/spans/spans_validation.py +35 -4
arize/spans/validation/spans/value_validation.py +78 -8
arize/utils/__init__.py +1 -0
arize/utils/arrow.py +31 -15
arize/utils/cache.py +34 -6
arize/utils/dataframe.py +20 -3
arize/utils/online_tasks/__init__.py +2 -0
arize/utils/online_tasks/dataframe_preprocessor.py +58 -47
arize/utils/openinference_conversion.py +44 -5
arize/utils/proto.py +10 -0
arize/utils/size.py +5 -3
arize/utils/types.py +105 -0
arize/version.py +3 -1
{arize-8.0.0a22.dist-info → arize-8.0.0b0.dist-info}/METADATA +13 -6
arize-8.0.0b0.dist-info/RECORD +175 -0
{arize-8.0.0a22.dist-info → arize-8.0.0b0.dist-info}/WHEEL +1 -1
arize-8.0.0b0.dist-info/licenses/LICENSE +176 -0
arize-8.0.0b0.dist-info/licenses/NOTICE +13 -0
arize/_generated/protocol/flight/export_pb2.py +0 -61
arize/_generated/protocol/flight/ingest_pb2.py +0 -365
arize/models/__init__.py +0 -0
arize/models/batch_validation/__init__.py +0 -0
arize/models/bounded_executor.py +0 -34
arize/models/surrogate_explainer/__init__.py +0 -0
arize-8.0.0a22.dist-info/RECORD +0 -146
arize-8.0.0a22.dist-info/licenses/LICENSE.md +0 -12

arize/experiments/evaluators/__init__.py CHANGED Viewed

	@@ -0,0 +1 @@
1	+ """Evaluator implementations for experiment evaluation in the Arize SDK."""

arize/experiments/evaluators/base.py CHANGED Viewed

@@ -1,10 +1,13 @@
+"""Base evaluator classes for experiment evaluation."""
 from __future__ import annotations
 import functools
 import inspect
 from abc import ABC
+from collections.abc import Awaitable, Callable, Mapping, Sequence
 from types import MappingProxyType
-from typing import Any, Awaitable, Callable, Mapping, Sequence
+from typing import TYPE_CHECKING
 from arize.experiments.evaluators.types import (
     AnnotatorKind,
@@ -14,17 +17,19 @@ from arize.experiments.evaluators.types import (
     EvaluatorOutput,
     JSONSerializable,
 )
-from arize.experiments.types import (
-    ExampleInput,
-    ExampleMetadata,
-    ExampleOutput,
-    TaskOutput,
-)
+if TYPE_CHECKING:
+    from arize.experiments.types import (
+        ExampleInput,
+        ExampleMetadata,
+        ExampleOutput,
+        TaskOutput,
+    )
 class Evaluator(ABC):
-    """
-    A helper super class to guide the implementation of an `Evaluator` object.
+    """A helper super class to guide the implementation of an `Evaluator` object.
     Subclasses must implement either the `evaluate` or `async_evaluate` method.
     Implementing both methods is recommended, but not required.
@@ -36,17 +41,20 @@ class Evaluator(ABC):
     @functools.cached_property
     def name(self) -> EvaluatorName:
+        """Return the name of this evaluator."""
         if hasattr(self, "_name"):
             return self._name
         return self.__class__.__name__
     @functools.cached_property
     def kind(self) -> EvaluatorKind:
+        """Return the kind of this evaluator (CODE or LLM)."""
         if hasattr(self, "_kind"):
             return self._kind
         return AnnotatorKind.CODE.value
-    def __new__(cls, *args: Any, **kwargs: Any) -> Evaluator:
+    def __new__(cls, *args: object, **kwargs: object) -> Evaluator:
+        """Create a new evaluator instance, preventing direct instantiation of abstract class."""
         if cls is Evaluator:
             raise TypeError(
                 f"{cls.__name__} is an abstract class and should not be instantiated."
@@ -62,20 +70,23 @@ class Evaluator(ABC):
         experiment_output: TaskOutput | None = None,
         dataset_output: ExampleOutput = MappingProxyType({}),
         metadata: ExampleMetadata = MappingProxyType({}),
-        **kwargs: Any,
+        **kwargs: object,
     ) -> EvaluationResult:
-        """
-        Evaluate the given inputs and produce an evaluation result.
+        """Evaluate the given inputs and produce an evaluation result.
         This method should be implemented by subclasses to perform the actual
         evaluation logic. It is recommended to implement both this synchronous
         method and the asynchronous `async_evaluate` method, but it is not required.
         Args:
-            output (Optional[TaskOutput]): The output produced by the task.
-            expected (Optional[ExampleOutput]): The expected output for comparison.
             dataset_row (Optional[Mapping[str, JSONSerializable]]): A row from the dataset.
-            metadata (ExampleMetadata): Metadata associated with the example.
             input (ExampleInput): The input provided for evaluation.
+            output (Optional[TaskOutput]): The output produced by the task.
+            experiment_output (Optional[TaskOutput]): The experiment output for comparison.
+            dataset_output (ExampleOutput): The expected output from the dataset.
+            metadata (ExampleMetadata): Metadata associated with the example.
             **kwargs (Any): Additional keyword arguments.
         Raises:
             NotImplementedError: If the method is not implemented by the subclass.
         """
@@ -92,22 +103,26 @@ class Evaluator(ABC):
         experiment_output: TaskOutput | None = None,
         dataset_output: ExampleOutput = MappingProxyType({}),
         metadata: ExampleMetadata = MappingProxyType({}),
-        **kwargs: Any,
+        **kwargs: object,
     ) -> EvaluationResult:
-        """
-        Asynchronously evaluate the given inputs and produce an evaluation result.
+        """Asynchronously evaluate the given inputs and produce an evaluation result.
         This method should be implemented by subclasses to perform the actual
         evaluation logic. It is recommended to implement both this asynchronous
         method and the synchronous `evaluate` method, but it is not required.
         Args:
-            output (Optional[TaskOutput]): The output produced by the task.
-            expected (Optional[ExampleOutput]): The expected output for comparison.
             dataset_row (Optional[Mapping[str, JSONSerializable]]): A row from the dataset.
-            metadata (ExampleMetadata): Metadata associated with the example.
             input (ExampleInput): The input provided for evaluation.
+            output (Optional[TaskOutput]): The output produced by the task.
+            experiment_output (Optional[TaskOutput]): The experiment output for comparison.
+            dataset_output (ExampleOutput): The expected output from the dataset.
+            metadata (ExampleMetadata): Metadata associated with the example.
             **kwargs (Any): Additional keyword arguments.
         Returns:
             EvaluationResult: The result of the evaluation.
         Raises:
             NotImplementedError: If the method is not implemented by the subclass.
         """
@@ -124,8 +139,14 @@ class Evaluator(ABC):
         )
     def __init_subclass__(
-        cls, is_abstract: bool = False, **kwargs: Any
+        cls, is_abstract: bool = False, **kwargs: object
     ) -> None:
+        """Validate subclass implementation when inherited.
+        Args:
+            is_abstract: Whether the subclass is abstract and should skip validation.
+            **kwargs: Additional keyword arguments for parent class.
+        """
         super().__init_subclass__(**kwargs)
         if is_abstract:
             return
@@ -136,9 +157,10 @@ class Evaluator(ABC):
             if evaluate := super_cls.__dict__.get(Evaluator.evaluate.__name__):
                 if isinstance(evaluate, classmethod):
                     evaluate = evaluate.__func__
-                assert callable(evaluate), (
-                    "`evaluate()` method should be callable"
-                )
+                if not callable(evaluate):
+                    raise TypeError(
+                        f"`evaluate()` method should be callable, got {type(evaluate)}"
+                    )
                 # need to remove the first param, i.e. `self`
                 _validate_sig(functools.partial(evaluate, None), "evaluate")
                 return
@@ -147,9 +169,10 @@ class Evaluator(ABC):
             ):
                 if isinstance(async_evaluate, classmethod):
                     async_evaluate = async_evaluate.__func__
-                assert callable(async_evaluate), (
-                    "`async_evaluate()` method should be callable"
-                )
+                if not callable(async_evaluate):
+                    raise TypeError(
+                        f"`async_evaluate()` method should be callable, got {type(async_evaluate)}"
+                    )
                 # need to remove the first param, i.e. `self`
                 _validate_sig(
                     functools.partial(async_evaluate, None), "async_evaluate"
@@ -162,7 +185,7 @@ class Evaluator(ABC):
         )
-def _validate_sig(fn: Callable[..., Any], fn_name: str) -> None:
+def _validate_sig(fn: Callable[..., object], fn_name: str) -> None:
     sig = inspect.signature(fn)
     validate_evaluator_signature(sig)
     for param in sig.parameters.values():
@@ -175,6 +198,14 @@ def _validate_sig(fn: Callable[..., Any], fn_name: str) -> None:
 def validate_evaluator_signature(sig: inspect.Signature) -> None:
+    """Validate that a function signature is compatible for use as an evaluator.
+    Args:
+        sig: The function signature to validate.
+    Raises:
+        ValueError: If the signature is invalid for use as an evaluator.
+    """
     # Check that the wrapped function has a valid signature for use as an evaluator
     # If it does not, raise an error to exit early before running evaluations
     params = sig.parameters
@@ -199,23 +230,24 @@ def validate_evaluator_signature(sig: inspect.Signature) -> None:
             ):
                 continue
             raise ValueError(
-                f"Invalid parameter names in evaluation function: {', '.join(not_found)}. "
+                f"Invalid parameter names in evaluation function: {not_found}. "
                 "Parameters names for multi-argument functions must be "
                 f"any of: {', '.join(valid_named_params)}."
             )
 class CodeEvaluator(Evaluator, ABC, is_abstract=True):
-    """
-    A convenience super class for defining code evaluators. There are functionally
-    no differences between this class and the `Evaluator` class, except that this
-    class has a default `_kind` attribute for AnnotatorKind.CODE.
+    """A convenience super class for defining code evaluators.
+    There are functionally no differences between this class and the `Evaluator` class,
+    except that this class has a default `_kind` attribute for AnnotatorKind.CODE.
     This class is intended to be subclassed, and should not be instantiated directly.
     """
     _kind = str(AnnotatorKind.CODE)
-    def __new__(cls, *args: Any, **kwargs: Any) -> CodeEvaluator:
+    def __new__(cls, *args: object, **kwargs: object) -> CodeEvaluator:
+        """Create a new code evaluator instance, preventing direct instantiation of abstract class."""
         if cls is CodeEvaluator:
             raise TypeError(
                 f"{cls.__name__} is an abstract class and should not be instantiated."
@@ -224,16 +256,17 @@ class CodeEvaluator(Evaluator, ABC, is_abstract=True):
 class LLMEvaluator(Evaluator, ABC, is_abstract=True):
-    """
-    A convenience super class for defining LLM evaluators. There are functionally
-    no differences between this class and the `Evaluator` class, except that this
-    class has a default `_kind` attribute for AnnotatorKind.LLM.
+    """A convenience super class for defining LLM evaluators.
+    There are functionally no differences between this class and the `Evaluator` class,
+    except that this class has a default `_kind` attribute for AnnotatorKind.LLM.
     This class is intended to be subclassed, and should not be instantiated directly.
     """
     _kind = str(AnnotatorKind.LLM)
-    def __new__(cls, *args: Any, **kwargs: Any) -> LLMEvaluator:
+    def __new__(cls, *args: object, **kwargs: object) -> LLMEvaluator:
+        """Create a new LLM evaluator instance, preventing direct instantiation of abstract class."""
         if cls is LLMEvaluator:
             raise TypeError(
                 f"{cls.__name__} is an abstract class and should not be instantiated."

arize/experiments/evaluators/exceptions.py CHANGED Viewed

@@ -1,10 +1,13 @@
+"""Evaluator-specific exception classes."""
 class ArizeException(Exception):
-    pass
+    """Base exception for Arize experiment evaluator errors."""
 class ArizeContextLimitExceeded(ArizeException):
-    pass
+    """Raised when context limit is exceeded during evaluation."""
 class ArizeTemplateMappingError(ArizeException):
-    pass
+    """Raised when template mapping fails during evaluation."""

arize 8.0.0a22__py3-none-any.whl → 8.0.0b0__py3-none-any.whl

arize 8.0.0a22__py3-none-any.whl → 8.0.0b0__py3-none-any.whl