dataeval 0.81.0__py3-none-any.whl → 0.82.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (86)
  1. dataeval/__init__.py +1 -1
  2. dataeval/config.py +68 -11
  3. dataeval/detectors/drift/__init__.py +2 -2
  4. dataeval/detectors/drift/_base.py +8 -64
  5. dataeval/detectors/drift/_mmd.py +12 -38
  6. dataeval/detectors/drift/_torch.py +7 -7
  7. dataeval/detectors/drift/_uncertainty.py +6 -5
  8. dataeval/detectors/drift/updates.py +20 -3
  9. dataeval/detectors/linters/__init__.py +3 -2
  10. dataeval/detectors/linters/duplicates.py +14 -46
  11. dataeval/detectors/linters/outliers.py +25 -159
  12. dataeval/detectors/ood/__init__.py +1 -1
  13. dataeval/detectors/ood/ae.py +6 -5
  14. dataeval/detectors/ood/base.py +2 -2
  15. dataeval/detectors/ood/metadata_ood_mi.py +4 -6
  16. dataeval/detectors/ood/mixin.py +3 -4
  17. dataeval/detectors/ood/vae.py +3 -2
  18. dataeval/metadata/__init__.py +2 -1
  19. dataeval/metadata/_distance.py +134 -0
  20. dataeval/metadata/_ood.py +30 -49
  21. dataeval/metadata/_utils.py +44 -0
  22. dataeval/metrics/bias/__init__.py +5 -4
  23. dataeval/metrics/bias/_balance.py +17 -149
  24. dataeval/metrics/bias/_coverage.py +4 -106
  25. dataeval/metrics/bias/_diversity.py +12 -107
  26. dataeval/metrics/bias/_parity.py +7 -71
  27. dataeval/metrics/estimators/__init__.py +5 -4
  28. dataeval/metrics/estimators/_ber.py +2 -20
  29. dataeval/metrics/estimators/_clusterer.py +1 -61
  30. dataeval/metrics/estimators/_divergence.py +2 -19
  31. dataeval/metrics/estimators/_uap.py +2 -16
  32. dataeval/metrics/stats/__init__.py +15 -12
  33. dataeval/metrics/stats/_base.py +41 -128
  34. dataeval/metrics/stats/_boxratiostats.py +13 -13
  35. dataeval/metrics/stats/_dimensionstats.py +17 -58
  36. dataeval/metrics/stats/_hashstats.py +19 -35
  37. dataeval/metrics/stats/_imagestats.py +94 -0
  38. dataeval/metrics/stats/_labelstats.py +42 -121
  39. dataeval/metrics/stats/_pixelstats.py +19 -51
  40. dataeval/metrics/stats/_visualstats.py +19 -51
  41. dataeval/outputs/__init__.py +57 -0
  42. dataeval/outputs/_base.py +182 -0
  43. dataeval/outputs/_bias.py +381 -0
  44. dataeval/outputs/_drift.py +83 -0
  45. dataeval/outputs/_estimators.py +114 -0
  46. dataeval/outputs/_linters.py +186 -0
  47. dataeval/outputs/_metadata.py +54 -0
  48. dataeval/{detectors/ood/output.py → outputs/_ood.py} +22 -22
  49. dataeval/outputs/_stats.py +393 -0
  50. dataeval/outputs/_utils.py +44 -0
  51. dataeval/outputs/_workflows.py +364 -0
  52. dataeval/typing.py +187 -7
  53. dataeval/utils/_method.py +1 -5
  54. dataeval/utils/_plot.py +2 -2
  55. dataeval/utils/data/__init__.py +5 -1
  56. dataeval/utils/data/_dataset.py +217 -0
  57. dataeval/utils/data/_embeddings.py +12 -14
  58. dataeval/utils/data/_images.py +30 -27
  59. dataeval/utils/data/_metadata.py +28 -11
  60. dataeval/utils/data/_selection.py +25 -22
  61. dataeval/utils/data/_split.py +5 -29
  62. dataeval/utils/data/_targets.py +14 -2
  63. dataeval/utils/data/datasets/_base.py +5 -5
  64. dataeval/utils/data/datasets/_cifar10.py +1 -1
  65. dataeval/utils/data/datasets/_milco.py +1 -1
  66. dataeval/utils/data/datasets/_mnist.py +1 -1
  67. dataeval/utils/data/datasets/_ships.py +1 -1
  68. dataeval/utils/data/{_types.py → datasets/_types.py} +10 -16
  69. dataeval/utils/data/datasets/_voc.py +1 -1
  70. dataeval/utils/data/selections/_classfilter.py +4 -5
  71. dataeval/utils/data/selections/_indices.py +2 -2
  72. dataeval/utils/data/selections/_limit.py +2 -2
  73. dataeval/utils/data/selections/_reverse.py +2 -2
  74. dataeval/utils/data/selections/_shuffle.py +2 -2
  75. dataeval/utils/torch/_internal.py +5 -5
  76. dataeval/utils/torch/trainer.py +8 -8
  77. dataeval/workflows/__init__.py +2 -1
  78. dataeval/workflows/sufficiency.py +6 -342
  79. {dataeval-0.81.0.dist-info → dataeval-0.82.1.dist-info}/METADATA +2 -2
  80. dataeval-0.82.1.dist-info/RECORD +105 -0
  81. dataeval/_output.py +0 -137
  82. dataeval/detectors/ood/metadata_ks_compare.py +0 -129
  83. dataeval/metrics/stats/_datasetstats.py +0 -198
  84. dataeval-0.81.0.dist-info/RECORD +0 -94
  85. {dataeval-0.81.0.dist-info → dataeval-0.82.1.dist-info}/LICENSE.txt +0 -0
  86. {dataeval-0.81.0.dist-info → dataeval-0.82.1.dist-info}/WHEEL +0 -0
dataeval/outputs/_utils.py ADDED
@@ -0,0 +1,44 @@
+ from __future__ import annotations
+
+ __all__ = []
+
+ from dataclasses import dataclass
+
+ import numpy as np
+ from numpy.typing import NDArray
+
+ from dataeval.outputs._base import Output
+
+
+ @dataclass(frozen=True)
+ class TrainValSplit:
+     """
+     Dataclass containing train and validation indices.
+
+     Attributes
+     ----------
+     train: NDArray[np.intp]
+         Indices for the training set
+     val: NDArray[np.intp]
+         Indices for the validation set
+     """
+
+     train: NDArray[np.intp]
+     val: NDArray[np.intp]
+
+
+ @dataclass(frozen=True)
+ class SplitDatasetOutput(Output):
+     """
+     Output class containing test indices and a list of TrainValSplits.
+
+     Attributes
+     ----------
+     test: NDArray[np.intp]
+         Indices for the test set
+     folds: list[TrainValSplit]
+         List of train and validation split indices
+     """
+
+     test: NDArray[np.intp]
+     folds: list[TrainValSplit]
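The two dataclasses above are plain containers, so they can be constructed directly. A minimal usage sketch with made-up index values (real instances would normally come from `split_dataset` in `dataeval.utils.data`; import paths are taken from this diff):

import numpy as np

from dataeval.outputs._utils import SplitDatasetOutput, TrainValSplit

# Hand-built example showing the shape of the data these classes carry.
split = SplitDatasetOutput(
    test=np.array([8, 9], dtype=np.intp),
    folds=[
        TrainValSplit(train=np.array([0, 1, 2, 3], dtype=np.intp),
                      val=np.array([4, 5], dtype=np.intp)),
        TrainValSplit(train=np.array([2, 3, 4, 5], dtype=np.intp),
                      val=np.array([0, 1], dtype=np.intp)),
    ],
)

for i, fold in enumerate(split.folds):
    print(f"fold {i}: {len(fold.train)} train / {len(fold.val)} val samples")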
dataeval/outputs/_workflows.py ADDED
@@ -0,0 +1,364 @@
+ from __future__ import annotations
+
+ __all__ = []
+
+ import contextlib
+ import warnings
+ from dataclasses import dataclass
+ from typing import Any, Iterable, Mapping, Sequence, cast
+
+ import numpy as np
+ from numpy.typing import NDArray
+
+ with contextlib.suppress(ImportError):
+     from matplotlib.figure import Figure
+
+ from scipy.optimize import basinhopping
+
+ from dataeval.outputs._base import Output, set_metadata
+ from dataeval.typing import ArrayLike
+ from dataeval.utils._array import as_numpy
+
+
+ def f_out(n_i: NDArray[Any], x: NDArray[Any]) -> NDArray[Any]:
+     """
+     Calculates the line of best fit based on its free parameters
+
+     Parameters
+     ----------
+     n_i : NDArray
+         Array of sample sizes
+     x : NDArray
+         Array of inverse power curve coefficients
+
+     Returns
+     -------
+     NDArray
+         Data points for the line of best fit
+     """
+     return x[0] * n_i ** (-x[1]) + x[2]
+
+
+ def project_steps(params: NDArray[Any], projection: NDArray[Any]) -> NDArray[Any]:
+     """Projects the measures for each value of X
+
+     Parameters
+     ----------
+     params : NDArray
+         Inverse power curve coefficients used to calculate projection
+     projection : NDArray
+         Steps to extrapolate
+
+     Returns
+     -------
+     NDArray
+         Extrapolated measure values at each projection step
+
+     """
+     return 1 - f_out(projection, params)
+
+
+ def plot_measure(
+     name: str,
+     steps: NDArray[Any],
+     measure: NDArray[Any],
+     params: NDArray[Any],
+     projection: NDArray[Any],
+ ) -> Figure:
+     import matplotlib.pyplot
+
+     fig = matplotlib.pyplot.figure()
+     fig = cast(Figure, fig)
+     fig.tight_layout()
+
+     ax = fig.add_subplot(111)
+
+     ax.set_title(f"{name} Sufficiency")
+     ax.set_ylabel(f"{name}")
+     ax.set_xlabel("Steps")
+
+     # Plot measure over each step
+     ax.scatter(steps, measure, label=f"Model Results ({name})", s=15, c="black")
+
+     # Plot extrapolation
+     ax.plot(
+         projection,
+         project_steps(params, projection),
+         linestyle="dashed",
+         label=f"Potential Model Results ({name})",
+     )
+
+     ax.legend()
+     return fig
+
+
+ def f_inv_out(y_i: NDArray[Any], x: NDArray[Any]) -> NDArray[np.uint64]:
+     """
+     Inverse function for f_out()
+
+     Parameters
+     ----------
+     y_i : NDArray
+         Data points for the line of best fit
+     x : NDArray
+         Array of inverse power curve coefficients
+
+     Returns
+     -------
+     NDArray
+         Array of sample sizes
+     """
+     n_i = ((y_i - x[2]) / x[0]) ** (-1 / x[1])
+     return np.asarray(n_i, dtype=np.uint64)
+
+
+ def inv_project_steps(params: NDArray[Any], targets: NDArray[Any]) -> NDArray[np.uint64]:
+     """Inverse function for project_steps()
+
+     Parameters
+     ----------
+     params : NDArray
+         Inverse power curve coefficients used to calculate projection
+     targets : NDArray
+         Desired measure values
+
+     Returns
+     -------
+     NDArray
+         Array of sample sizes, or 0 if overflow
+     """
+     steps = f_inv_out(1 - np.array(targets), params)
+     steps[np.isnan(steps)] = 0
+     return np.ceil(steps)
+
+
+ def calc_params(p_i: NDArray[Any], n_i: NDArray[Any], niter: int) -> NDArray[Any]:
+     """
+     Retrieves the inverse power curve coefficients for the line of best fit.
+     Global minimization is done via basin hopping. More info on this algorithm
+     can be found here: https://arxiv.org/abs/cond-mat/9803344 .
+
+     Parameters
+     ----------
+     p_i : NDArray
+         Array of corresponding losses
+     n_i : NDArray
+         Array of sample sizes
+     niter : int
+         Number of iterations to perform in the basin-hopping
+         numerical process to curve-fit p_i
+
+     Returns
+     -------
+     NDArray
+         Array of parameters to recreate line of best fit
+     """
+
+     def is_valid(f_new, x_new, f_old, x_old):
+         return f_new != np.nan
+
+     def f(x):
+         try:
+             return np.sum(np.square(p_i - f_out(n_i, x)))
+         except RuntimeWarning:
+             return np.nan
+
+     with warnings.catch_warnings():
+         warnings.filterwarnings("error", category=RuntimeWarning)
+         res = basinhopping(
+             f,
+             np.array([0.5, 0.5, 0.1]),
+             niter=niter,
+             stepsize=1.0,
+             minimizer_kwargs={"method": "Powell"},
+             accept_test=is_valid,
+             niter_success=200,
+         )
+     return res.x
+
+
+ def get_curve_params(measures: dict[str, NDArray[Any]], ranges: NDArray[Any], niter: int) -> dict[str, NDArray[Any]]:
+     """Calculates and aggregates parameters for both single and multi-class metrics"""
+     output = {}
+     for name, measure in measures.items():
+         measure = cast(np.ndarray, measure)
+         if measure.ndim > 1:
+             result = []
+             for value in measure:
+                 result.append(calc_params(1 - value, ranges, niter))
+             output[name] = np.array(result)
+         else:
+             output[name] = calc_params(1 - measure, ranges, niter)
+     return output
+
+
+ @dataclass
+ class SufficiencyOutput(Output):
+     """
+     Output class for :class:`.Sufficiency` workflow.
+
+     Attributes
+     ----------
+     steps : NDArray
+         Array of sample sizes
+     measures : Dict[str, NDArray]
+         Average of values observed for each sample size step for each measure
+     n_iter : int, default 1000
+         Number of iterations to perform in the basin-hopping curve-fit process
+     """
+
+     steps: NDArray[np.uint32]
+     measures: dict[str, NDArray[np.float64]]
+     n_iter: int = 1000
+
+     def __post_init__(self) -> None:
+         c = len(self.steps)
+         for m, v in self.measures.items():
+             c_v = v.shape[1] if v.ndim > 1 else len(v)
+             if c != c_v:
+                 raise ValueError(f"{m} does not contain the expected number ({c}) of data points.")
+         self._params = None
+
+     @property
+     def params(self) -> dict[str, NDArray[Any]]:
+         if self._params is None:
+             self._params = {}
+         if self.n_iter not in self._params:
+             self._params[self.n_iter] = get_curve_params(self.measures, self.steps, self.n_iter)
+         return self._params[self.n_iter]
+
+     @set_metadata
+     def project(
+         self,
+         projection: int | Iterable[int],
+     ) -> SufficiencyOutput:
+         """
+         Projects the measures for each step.
+
+         Parameters
+         ----------
+         projection : int | Iterable[int]
+             Step or steps to project
+
+         Returns
+         -------
+         SufficiencyOutput
+             Dataclass containing the projected measures per projection
+
+         Raises
+         ------
+         ValueError
+             If the length of data points in the measures do not match
+             If `projection` is not numerical
+         """
+         projection = np.asarray(list(projection) if isinstance(projection, Iterable) else [projection])
+
+         if not np.issubdtype(projection.dtype, np.number):
+             raise ValueError("'projection' must consist of numerical values")
+
+         output = {}
+         for name, measures in self.measures.items():
+             if measures.ndim > 1:
+                 result = []
+                 for i in range(len(measures)):
+                     projected = project_steps(self.params[name][i], projection)
+                     result.append(projected)
+                 output[name] = np.array(result)
+             else:
+                 output[name] = project_steps(self.params[name], projection)
+         proj = SufficiencyOutput(projection, output, self.n_iter)
+         proj._params = self._params
+         return proj
+
+     def plot(self, class_names: Sequence[str] | None = None) -> list[Figure]:
+         """
+         Plotting function for data :term:`sufficiency<Sufficiency>` tasks.
+
+         Parameters
+         ----------
+         class_names : Sequence[str] | None, default None
+             List of class names
+
+         Returns
+         -------
+         list[Figure]
+             List of Figures for each measure
+
+         Raises
+         ------
+         ValueError
+             If the length of data points in the measures do not match
+
+         Notes
+         -----
+         This method requires `matplotlib <https://matplotlib.org/>`_ to be installed.
+         """
+         # Extrapolation parameters
+         last_X = self.steps[-1]
+         geomshape = (0.01 * last_X, last_X * 4, len(self.steps))
+         extrapolated = np.geomspace(*geomshape).astype(np.int64)
+
+         # Stores all plots
+         plots = []
+
+         # Create a plot for each measure on one figure
+         for name, measures in self.measures.items():
+             if measures.ndim > 1:
+                 if class_names is not None and len(measures) != len(class_names):
+                     raise IndexError("Class name count does not align with measures")
+                 for i, measure in enumerate(measures):
+                     class_name = str(i) if class_names is None else class_names[i]
+                     fig = plot_measure(
+                         f"{name}_{class_name}",
+                         self.steps,
+                         measure,
+                         self.params[name][i],
+                         extrapolated,
+                     )
+                     plots.append(fig)
+
+             else:
+                 fig = plot_measure(name, self.steps, measures, self.params[name], extrapolated)
+                 plots.append(fig)
+
+         return plots
+
+     def inv_project(
+         self, targets: Mapping[str, ArrayLike], n_iter: int | None = None
+     ) -> dict[str, NDArray[np.float64]]:
+         """
+         Calculate training samples needed to achieve target model metric values.
+
+         Parameters
+         ----------
+         targets : Mapping[str, ArrayLike]
+             Mapping of target metric scores (from 0.0 to 1.0) that we want
+             to achieve, where the key is the name of the metric.
+         n_iter : int or None, default None
+             Iterations to use when calculating the inverse power curve; if None, defaults to 1000
+
+         Returns
+         -------
+         dict[str, NDArray]
+             List of the number of training samples needed to achieve each
+             corresponding entry in targets
+         """
+
+         projection = {}
+
+         for name, target in targets.items():
+             tarray = as_numpy(target)
+             if name not in self.measures:
+                 continue
+
+             measure = self.measures[name]
+             if measure.ndim > 1:
+                 projection[name] = np.zeros((len(measure), len(tarray)))
+                 for i in range(len(measure)):
+                     projection[name][i] = inv_project_steps(
+                         self.params[name][i], tarray[i] if tarray.ndim == measure.ndim else tarray
+                     )
+             else:
+                 projection[name] = inv_project_steps(self.params[name], tarray)
+
+         return projection
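For orientation: the module fits each metric's loss (1 - measure) to an inverse power curve f(n) = x0 * n^(-x1) + x2, so projected performance at sample size n is 1 - f(n), and inv_project solves the same curve backwards. A minimal sketch of the public API with made-up numbers (import path taken from this diff; the curve fit runs basin hopping, so this takes a few seconds):

import numpy as np

from dataeval.outputs._workflows import SufficiencyOutput

# Made-up averaged results at four training-set sizes.
steps = np.array([100, 200, 400, 800], dtype=np.uint32)
measures = {"accuracy": np.array([0.62, 0.71, 0.78, 0.83])}

suff = SufficiencyOutput(steps, measures)

# Extrapolate accuracy to larger hypothetical training-set sizes.
projected = suff.project([1600, 3200])
print(projected.measures["accuracy"])

# Estimate sample counts needed to reach 90% and 95% accuracy.
needed = suff.inv_project({"accuracy": [0.90, 0.95]})
print(needed["accuracy"])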
dataeval/typing.py CHANGED
@@ -2,9 +2,32 @@
  Common type hints used for interoperability with DataEval.
  """
 
- __all__ = ["Array", "ArrayLike"]
-
- from typing import Any, Iterator, Protocol, Sequence, TypeVar, Union, runtime_checkable
+ __all__ = [
+     "Array",
+     "ArrayLike",
+     "Dataset",
+     "AnnotatedDataset",
+     "DatasetMetadata",
+     "ImageClassificationDatum",
+     "ImageClassificationDataset",
+     "ObjectDetectionTarget",
+     "ObjectDetectionDatum",
+     "ObjectDetectionDataset",
+     "SegmentationTarget",
+     "SegmentationDatum",
+     "SegmentationDataset",
+ ]
+
+
+ import sys
+ from typing import Any, Generic, Iterator, Protocol, Sequence, TypedDict, TypeVar, Union, runtime_checkable
+
+ from typing_extensions import NotRequired, Required
+
+ if sys.version_info >= (3, 10):
+     from typing import TypeAlias
+ else:
+     from typing_extensions import TypeAlias
 
 
  @runtime_checkable
@@ -43,12 +66,169 @@ class Array(Protocol):
      def __len__(self) -> int: ...
 
 
- TArray = TypeVar("TArray", bound=Array)
-
- ArrayLike = Union[Sequence[Any], Array]
+ _T_co = TypeVar("_T_co", covariant=True)
+ _ScalarType = Union[int, float, bool, str]
+ ArrayLike: TypeAlias = Union[Sequence[_ScalarType], Sequence[Sequence[_ScalarType]], Sequence[Array], Array]
  """
  Type alias for array-like objects used for interoperability with DataEval.
 
  This includes native Python sequences, as well as objects that conform to
- the `Array` protocol.
+ the :class:`Array` protocol.
+ """
+
+
+ class DatasetMetadata(TypedDict, total=False):
+     """
+     Dataset level metadata required for all `AnnotatedDataset` classes.
+
+     Attributes
+     ----------
+     id : Required[str]
+         A unique identifier for the dataset
+     index2label : NotRequired[dict[int, str]]
+         A lookup table converting label value to class name
+     """
+
+     id: Required[str]
+     index2label: NotRequired[dict[int, str]]
+
+
+ @runtime_checkable
+ class Dataset(Generic[_T_co], Protocol):
+     """
+     Protocol for a generic `Dataset`.
+
+     Methods
+     -------
+     __getitem__(index: int)
+         Returns datum at specified index.
+     __len__()
+         Returns dataset length.
+     """
+
+     def __getitem__(self, index: int, /) -> _T_co: ...
+     def __len__(self) -> int: ...
+
+
+ @runtime_checkable
+ class AnnotatedDataset(Dataset[_T_co], Generic[_T_co], Protocol):
+     """
+     Protocol for a generic `AnnotatedDataset`.
+
+     Attributes
+     ----------
+     metadata : :class:`.DatasetMetadata` or derivatives.
+
+     Methods
+     -------
+     __getitem__(index: int)
+         Returns datum at specified index.
+     __len__()
+         Returns dataset length.
+
+     Notes
+     -----
+     Inherits from :class:`.Dataset`.
+     """
+
+     @property
+     def metadata(self) -> DatasetMetadata: ...
+
+
+ # ========== IMAGE CLASSIFICATION DATASETS ==========
+
+
+ ImageClassificationDatum: TypeAlias = tuple[Array, Array, dict[str, Any]]
+ """
+ A type definition for an image classification datum tuple.
+
+ - :class:`Array` of shape (C, H, W) - Image data in channel, height, width format.
+ - :class:`Array` of shape (N,) - Class label as one-hot encoded ground-truth or prediction confidences.
+ - dict[str, Any] - Datum level metadata.
+ """
+
+
+ ImageClassificationDataset: TypeAlias = AnnotatedDataset[ImageClassificationDatum]
+ """
+ A type definition for an :class:`AnnotatedDataset` of :class:`ImageClassificationDatum` elements.
+ """
+
+ # ========== OBJECT DETECTION DATASETS ==========
+
+
+ @runtime_checkable
+ class ObjectDetectionTarget(Protocol):
+     """
+     A protocol for targets in an Object Detection dataset.
+
+     Attributes
+     ----------
+     boxes : :class:`ArrayLike` of shape (N, 4)
+     labels : :class:`ArrayLike` of shape (N,)
+     scores : :class:`ArrayLike` of shape (N, M)
+     """
+
+     @property
+     def boxes(self) -> ArrayLike: ...
+
+     @property
+     def labels(self) -> ArrayLike: ...
+
+     @property
+     def scores(self) -> ArrayLike: ...
+
+
+ ObjectDetectionDatum: TypeAlias = tuple[Array, ObjectDetectionTarget, dict[str, Any]]
+ """
+ A type definition for an object detection datum tuple.
+
+ - :class:`Array` of shape (C, H, W) - Image data in channel, height, width format.
+ - :class:`ObjectDetectionTarget` - Object detection target information for the image.
+ - dict[str, Any] - Datum level metadata.
+ """
+
+
+ ObjectDetectionDataset: TypeAlias = AnnotatedDataset[ObjectDetectionDatum]
+ """
+ A type definition for an :class:`AnnotatedDataset` of :class:`ObjectDetectionDatum` elements.
+ """
+
+
+ # ========== SEGMENTATION DATASETS ==========
+
+
+ @runtime_checkable
+ class SegmentationTarget(Protocol):
+     """
+     A protocol for targets in a Segmentation dataset.
+
+     Attributes
+     ----------
+     mask : :class:`ArrayLike`
+     labels : :class:`ArrayLike`
+     scores : :class:`ArrayLike`
+     """
+
+     @property
+     def mask(self) -> ArrayLike: ...
+
+     @property
+     def labels(self) -> ArrayLike: ...
+
+     @property
+     def scores(self) -> ArrayLike: ...
+
+
+ SegmentationDatum: TypeAlias = tuple[Array, SegmentationTarget, dict[str, Any]]
+ """
+ A type definition for a segmentation datum tuple.
+
+ - :class:`Array` of shape (C, H, W) - Image data in channel, height, width format.
+ - :class:`SegmentationTarget` - Segmentation target information for the image.
+ - dict[str, Any] - Datum level metadata.
+ """
+
+ SegmentationDataset: TypeAlias = AnnotatedDataset[SegmentationDatum]
+ """
+ A type definition for an :class:`AnnotatedDataset` of :class:`SegmentationDatum` elements.
  """
dataeval/utils/_method.py CHANGED
@@ -1,12 +1,8 @@
  from __future__ import annotations
 
- import sys
  from typing import Callable, TypeVar
 
- if sys.version_info >= (3, 10):
-     from typing import ParamSpec
- else:
-     from typing_extensions import ParamSpec
+ from typing_extensions import ParamSpec
 
  P = ParamSpec("P")
  R = TypeVar("R")
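The net effect is that `ParamSpec` now always comes from `typing_extensions` rather than being version-gated. For context, a sketch of the kind of signature-preserving helper `ParamSpec` enables (a hypothetical decorator, not the actual `_method.py` contents):

from typing import Callable, TypeVar

from typing_extensions import ParamSpec

P = ParamSpec("P")
R = TypeVar("R")


def logged(func: Callable[P, R]) -> Callable[P, R]:
    """Wraps func without losing its parameter types for static checkers."""

    def wrapper(*args: P.args, **kwargs: P.kwargs) -> R:
        print(f"calling {func.__name__}")
        return func(*args, **kwargs)

    return wrapper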
dataeval/utils/_plot.py CHANGED
@@ -49,8 +49,8 @@ def heatmap(
      from matplotlib.ticker import FuncFormatter
 
      np_data = to_numpy(data)
-     rows = row_labels if isinstance(row_labels, list) else to_numpy(row_labels)
-     cols = col_labels if isinstance(col_labels, list) else to_numpy(col_labels)
+     rows: list[str] = [str(n) for n in to_numpy(row_labels)]
+     cols: list[str] = [str(n) for n in to_numpy(col_labels)]
 
      fig, ax = plt.subplots(figsize=(10, 10))
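The heatmap change normalizes row and column labels to lists of strings instead of passing list inputs through untouched. An illustration of the new behavior, using numpy directly in place of the module's `to_numpy` helper:

import numpy as np

row_labels = ["a", "b", "c"]   # previously passed through unchanged
col_labels = np.arange(3)      # previously left as a numpy array

rows: list[str] = [str(n) for n in np.asarray(row_labels)]
cols: list[str] = [str(n) for n in np.asarray(col_labels)]

assert rows == ["a", "b", "c"]
assert cols == ["0", "1", "2"]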
dataeval/utils/data/__init__.py CHANGED
@@ -10,13 +10,17 @@ __all__ = [
      "SplitDatasetOutput",
      "Targets",
      "split_dataset",
+     "to_image_classification_dataset",
+     "to_object_detection_dataset",
  ]
 
+ from dataeval.outputs._utils import SplitDatasetOutput
+ from dataeval.utils.data._dataset import to_image_classification_dataset, to_object_detection_dataset
  from dataeval.utils.data._embeddings import Embeddings
  from dataeval.utils.data._images import Images
  from dataeval.utils.data._metadata import Metadata
  from dataeval.utils.data._selection import Select
- from dataeval.utils.data._split import SplitDatasetOutput, split_dataset
+ from dataeval.utils.data._split import split_dataset
  from dataeval.utils.data._targets import Targets
 
  from . import collate, datasets
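This re-export keeps the public import path stable even though `SplitDatasetOutput` moved out of `dataeval.utils.data._split`. A quick check grounded in the imports above:

# Both paths resolve to the same class after this change.
from dataeval.outputs._utils import SplitDatasetOutput as moved
from dataeval.utils.data import SplitDatasetOutput as public

assert moved is public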