PyPI - dataeval - Versions diffs - 0.76.1__py3-none-any.whl → 0.82.0__py3-none-any.whl - Mend

dataeval-0.76.1-py3-none-any.whl → dataeval-0.82.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (113) hide show

dataeval/__init__.py +3 -3
dataeval/config.py +77 -0
dataeval/detectors/__init__.py +1 -1
dataeval/detectors/drift/__init__.py +6 -6
dataeval/detectors/drift/{base.py → _base.py} +40 -85
dataeval/detectors/drift/{cvm.py → _cvm.py} +21 -28
dataeval/detectors/drift/{ks.py → _ks.py} +20 -26
dataeval/detectors/drift/{mmd.py → _mmd.py} +31 -43
dataeval/detectors/drift/{torch.py → _torch.py} +2 -1
dataeval/detectors/drift/{uncertainty.py → _uncertainty.py} +24 -7
dataeval/detectors/drift/updates.py +20 -3
dataeval/detectors/linters/__init__.py +3 -5
dataeval/detectors/linters/duplicates.py +13 -36
dataeval/detectors/linters/outliers.py +23 -148
dataeval/detectors/ood/__init__.py +1 -1
dataeval/detectors/ood/ae.py +30 -9
dataeval/detectors/ood/base.py +5 -4
dataeval/detectors/ood/mixin.py +21 -7
dataeval/detectors/ood/vae.py +73 -0
dataeval/metadata/__init__.py +6 -0
dataeval/metadata/_distance.py +167 -0
dataeval/metadata/_ood.py +217 -0
dataeval/metadata/_utils.py +44 -0
dataeval/metrics/__init__.py +1 -1
dataeval/metrics/bias/__init__.py +6 -4
dataeval/metrics/bias/{balance.py → _balance.py} +15 -101
dataeval/metrics/bias/_coverage.py +98 -0
dataeval/metrics/bias/{diversity.py → _diversity.py} +18 -111
dataeval/metrics/bias/{parity.py → _parity.py} +39 -77
dataeval/metrics/estimators/__init__.py +15 -4
dataeval/metrics/estimators/{ber.py → _ber.py} +42 -29
dataeval/metrics/estimators/_clusterer.py +44 -0
dataeval/metrics/estimators/{divergence.py → _divergence.py} +18 -30
dataeval/metrics/estimators/{uap.py → _uap.py} +4 -18
dataeval/metrics/stats/__init__.py +16 -13
dataeval/metrics/stats/{base.py → _base.py} +82 -133
dataeval/metrics/stats/{boxratiostats.py → _boxratiostats.py} +15 -18
dataeval/metrics/stats/_dimensionstats.py +75 -0
dataeval/metrics/stats/{hashstats.py → _hashstats.py} +21 -37
dataeval/metrics/stats/_imagestats.py +94 -0
dataeval/metrics/stats/_labelstats.py +131 -0
dataeval/metrics/stats/{pixelstats.py → _pixelstats.py} +19 -50
dataeval/metrics/stats/{visualstats.py → _visualstats.py} +23 -54
dataeval/outputs/__init__.py +53 -0
dataeval/{output.py → outputs/_base.py} +55 -25
dataeval/outputs/_bias.py +381 -0
dataeval/outputs/_drift.py +83 -0
dataeval/outputs/_estimators.py +114 -0
dataeval/outputs/_linters.py +184 -0
dataeval/{detectors/ood/output.py → outputs/_ood.py} +22 -22
dataeval/outputs/_stats.py +387 -0
dataeval/outputs/_utils.py +44 -0
dataeval/outputs/_workflows.py +364 -0
dataeval/typing.py +234 -0
dataeval/utils/__init__.py +2 -2
dataeval/utils/_array.py +169 -0
dataeval/utils/_bin.py +199 -0
dataeval/utils/_clusterer.py +144 -0
dataeval/utils/_fast_mst.py +189 -0
dataeval/utils/{image.py → _image.py} +6 -4
dataeval/utils/_method.py +14 -0
dataeval/utils/{shared.py → _mst.py} +3 -65
dataeval/utils/{plot.py → _plot.py} +6 -6
dataeval/utils/data/__init__.py +26 -0
dataeval/utils/data/_dataset.py +217 -0
dataeval/utils/data/_embeddings.py +104 -0
dataeval/utils/data/_images.py +68 -0
dataeval/utils/data/_metadata.py +360 -0
dataeval/utils/data/_selection.py +126 -0
dataeval/utils/{dataset/split.py → data/_split.py} +12 -38
dataeval/utils/data/_targets.py +85 -0
dataeval/utils/data/collate.py +103 -0
dataeval/utils/data/datasets/__init__.py +17 -0
dataeval/utils/data/datasets/_base.py +254 -0
dataeval/utils/data/datasets/_cifar10.py +134 -0
dataeval/utils/data/datasets/_fileio.py +168 -0
dataeval/utils/data/datasets/_milco.py +153 -0
dataeval/utils/data/datasets/_mixin.py +56 -0
dataeval/utils/data/datasets/_mnist.py +183 -0
dataeval/utils/data/datasets/_ships.py +123 -0
dataeval/utils/data/datasets/_types.py +52 -0
dataeval/utils/data/datasets/_voc.py +352 -0
dataeval/utils/data/selections/__init__.py +15 -0
dataeval/utils/data/selections/_classfilter.py +57 -0
dataeval/utils/data/selections/_indices.py +26 -0
dataeval/utils/data/selections/_limit.py +26 -0
dataeval/utils/data/selections/_reverse.py +18 -0
dataeval/utils/data/selections/_shuffle.py +29 -0
dataeval/utils/metadata.py +51 -376
dataeval/utils/torch/{gmm.py → _gmm.py} +4 -2
dataeval/utils/torch/{internal.py → _internal.py} +21 -51
dataeval/utils/torch/models.py +43 -2
dataeval/workflows/__init__.py +2 -1
dataeval/workflows/sufficiency.py +11 -346
{dataeval-0.76.1.dist-info → dataeval-0.82.0.dist-info}/METADATA +5 -2
dataeval-0.82.0.dist-info/RECORD +104 -0
dataeval/detectors/linters/clusterer.py +0 -512
dataeval/detectors/linters/merged_stats.py +0 -49
dataeval/detectors/ood/metadata_ks_compare.py +0 -129
dataeval/detectors/ood/metadata_least_likely.py +0 -119
dataeval/interop.py +0 -69
dataeval/metrics/bias/coverage.py +0 -194
dataeval/metrics/stats/datasetstats.py +0 -202
dataeval/metrics/stats/dimensionstats.py +0 -115
dataeval/metrics/stats/labelstats.py +0 -210
dataeval/utils/dataset/__init__.py +0 -7
dataeval/utils/dataset/datasets.py +0 -412
dataeval/utils/dataset/read.py +0 -63
dataeval-0.76.1.dist-info/RECORD +0 -67
/dataeval/{log.py → _log.py} +0 -0
/dataeval/utils/torch/{blocks.py → _blocks.py} +0 -0
{dataeval-0.76.1.dist-info → dataeval-0.82.0.dist-info}/LICENSE.txt +0 -0
{dataeval-0.76.1.dist-info → dataeval-0.82.0.dist-info}/WHEEL +0 -0

dataeval/outputs/_workflows.py ADDED Viewed

@@ -0,0 +1,364 @@
+from __future__ import annotations
+__all__ = []
+import contextlib
+import warnings
+from dataclasses import dataclass
+from typing import Any, Iterable, Mapping, Sequence, cast
+import numpy as np
+from numpy.typing import NDArray
+with contextlib.suppress(ImportError):
+    from matplotlib.figure import Figure
+from scipy.optimize import basinhopping
+from dataeval.outputs._base import Output, set_metadata
+from dataeval.typing import ArrayLike
+from dataeval.utils._array import as_numpy
+def f_out(n_i: NDArray[Any], x: NDArray[Any]) -> NDArray[Any]:
+    """
+    Calculates the line of best fit based on its free parameters
+    Parameters
+    ----------
+    n_i : NDArray
+        Array of sample sizes
+    x : NDArray
+        Array of inverse power curve coefficients
+    Returns
+    -------
+    NDArray
+        Data points for the line of best fit
+    """
+    return x[0] * n_i ** (-x[1]) + x[2]
+def project_steps(params: NDArray[Any], projection: NDArray[Any]) -> NDArray[Any]:
+    """Projects the measures for each value of X
+    Parameters
+    ----------
+    params : NDArray
+        Inverse power curve coefficients used to calculate projection
+    projection : NDArray
+        Steps to extrapolate
+    Returns
+    -------
+    NDArray
+        Extrapolated measure values at each projection step
+    """
+    return 1 - f_out(projection, params)
+def plot_measure(
+    name: str,
+    steps: NDArray[Any],
+    measure: NDArray[Any],
+    params: NDArray[Any],
+    projection: NDArray[Any],
+) -> Figure:
+    import matplotlib.pyplot
+    fig = matplotlib.pyplot.figure()
+    fig = cast(Figure, fig)
+    fig.tight_layout()
+    ax = fig.add_subplot(111)
+    ax.set_title(f"{name} Sufficiency")
+    ax.set_ylabel(f"{name}")
+    ax.set_xlabel("Steps")
+    # Plot measure over each step
+    ax.scatter(steps, measure, label=f"Model Results ({name})", s=15, c="black")
+    # Plot extrapolation
+    ax.plot(
+        projection,
+        project_steps(params, projection),
+        linestyle="dashed",
+        label=f"Potential Model Results ({name})",
+    )
+    ax.legend()
+    return fig
+def f_inv_out(y_i: NDArray[Any], x: NDArray[Any]) -> NDArray[np.uint64]:
+    """
+    Inverse function for f_out()
+    Parameters
+    ----------
+    y_i : NDArray
+        Data points for the line of best fit
+    x : NDArray
+        Array of inverse power curve coefficients
+    Returns
+    -------
+    NDArray
+        Array of sample sizes
+    """
+    n_i = ((y_i - x[2]) / x[0]) ** (-1 / x[1])
+    return np.asarray(n_i, dtype=np.uint64)
+def inv_project_steps(params: NDArray[Any], targets: NDArray[Any]) -> NDArray[np.uint64]:
+    """Inverse function for project_steps()
+    Parameters
+    ----------
+    params : NDArray
+        Inverse power curve coefficients used to calculate projection
+    targets : NDArray
+        Desired measure values
+    Returns
+    -------
+    NDArray
+        Array of sample sizes, or 0 if overflow
+    """
+    steps = f_inv_out(1 - np.array(targets), params)
+    steps[np.isnan(steps)] = 0
+    return np.ceil(steps)
+def calc_params(p_i: NDArray[Any], n_i: NDArray[Any], niter: int) -> NDArray[Any]:
+    """
+    Retrieves the inverse power curve coefficients for the line of best fit.
+    Global minimization is done via basin hopping. More info on this algorithm
+    can be found here: https://arxiv.org/abs/cond-mat/9803344 .
+    Parameters
+    ----------
+    p_i : NDArray
+        Array of corresponding losses
+    n_i : NDArray
+        Array of sample sizes
+    niter : int
+        Number of iterations to perform in the basin-hopping
+        numerical process to curve-fit p_i
+    Returns
+    -------
+    NDArray
+        Array of parameters to recreate line of best fit
+    """
+    def is_valid(f_new, x_new, f_old, x_old):
+        return f_new != np.nan
+    def f(x):
+        try:
+            return np.sum(np.square(p_i - f_out(n_i, x)))
+        except RuntimeWarning:
+            return np.nan
+    with warnings.catch_warnings():
+        warnings.filterwarnings("error", category=RuntimeWarning)
+        res = basinhopping(
+            f,
+            np.array([0.5, 0.5, 0.1]),
+            niter=niter,
+            stepsize=1.0,
+            minimizer_kwargs={"method": "Powell"},
+            accept_test=is_valid,
+            niter_success=200,
+        )
+    return res.x
+def get_curve_params(measures: dict[str, NDArray[Any]], ranges: NDArray[Any], niter: int) -> dict[str, NDArray[Any]]:
+    """Calculates and aggregates parameters for both single and multi-class metrics"""
+    output = {}
+    for name, measure in measures.items():
+        measure = cast(np.ndarray, measure)
+        if measure.ndim > 1:
+            result = []
+            for value in measure:
+                result.append(calc_params(1 - value, ranges, niter))
+            output[name] = np.array(result)
+        else:
+            output[name] = calc_params(1 - measure, ranges, niter)
+    return output
+@dataclass
+class SufficiencyOutput(Output):
+    """
+    Output class for :class:`.Sufficiency` workflow.
+    Attributes
+    ----------
+    steps : NDArray
+        Array of sample sizes
+    measures : Dict[str, NDArray]
+        Average of values observed for each sample size step for each measure
+    n_iter : int, default 1000
+        Number of iterations to perform in the basin-hopping curve-fit process
+    """
+    steps: NDArray[np.uint32]
+    measures: dict[str, NDArray[np.float64]]
+    n_iter: int = 1000
+    def __post_init__(self) -> None:
+        c = len(self.steps)
+        for m, v in self.measures.items():
+            c_v = v.shape[1] if v.ndim > 1 else len(v)
+            if c != c_v:
+                raise ValueError(f"{m} does not contain the expected number ({c}) of data points.")
+        self._params = None
+    @property
+    def params(self) -> dict[str, NDArray[Any]]:
+        if self._params is None:
+            self._params = {}
+        if self.n_iter not in self._params:
+            self._params[self.n_iter] = get_curve_params(self.measures, self.steps, self.n_iter)
+        return self._params[self.n_iter]
+    @set_metadata
+    def project(
+        self,
+        projection: int | Iterable[int],
+    ) -> SufficiencyOutput:
+        """
+        Projects the measures for each step.
+        Parameters
+        ----------
+        projection : int | Iterable[int]
+            Step or steps to project
+        Returns
+        -------
+        SufficiencyOutput
+            Dataclass containing the projected measures per projection
+        Raises
+        ------
+        ValueError
+            If the length of data points in the measures do not match
+            If `projection` is not numerical
+        """
+        projection = np.asarray(list(projection) if isinstance(projection, Iterable) else [projection])
+        if not np.issubdtype(projection.dtype, np.number):
+            raise ValueError("'projection' must consist of numerical values")
+        output = {}
+        for name, measures in self.measures.items():
+            if measures.ndim > 1:
+                result = []
+                for i in range(len(measures)):
+                    projected = project_steps(self.params[name][i], projection)
+                    result.append(projected)
+                output[name] = np.array(result)
+            else:
+                output[name] = project_steps(self.params[name], projection)
+        proj = SufficiencyOutput(projection, output, self.n_iter)
+        proj._params = self._params
+        return proj
+    def plot(self, class_names: Sequence[str] | None = None) -> list[Figure]:
+        """
+        Plotting function for data :term:`sufficience<Sufficiency>` tasks.
+        Parameters
+        ----------
+        class_names : Sequence[str] | None, default None
+            List of class names
+        Returns
+        -------
+        list[Figure]
+            List of Figures for each measure
+        Raises
+        ------
+        ValueError
+            If the length of data points in the measures do not match
+        Notes
+        -----
+        This method requires `matplotlib <https://matplotlib.org/>`_ to be installed.
+        """
+        # Extrapolation parameters
+        last_X = self.steps[-1]
+        geomshape = (0.01 * last_X, last_X * 4, len(self.steps))
+        extrapolated = np.geomspace(*geomshape).astype(np.int64)
+        # Stores all plots
+        plots = []
+        # Create a plot for each measure on one figure
+        for name, measures in self.measures.items():
+            if measures.ndim > 1:
+                if class_names is not None and len(measures) != len(class_names):
+                    raise IndexError("Class name count does not align with measures")
+                for i, measure in enumerate(measures):
+                    class_name = str(i) if class_names is None else class_names[i]
+                    fig = plot_measure(
+                        f"{name}_{class_name}",
+                        self.steps,
+                        measure,
+                        self.params[name][i],
+                        extrapolated,
+                    )
+                    plots.append(fig)
+            else:
+                fig = plot_measure(name, self.steps, measures, self.params[name], extrapolated)
+                plots.append(fig)
+        return plots
+    def inv_project(
+        self, targets: Mapping[str, ArrayLike], n_iter: int | None = None
+    ) -> dict[str, NDArray[np.float64]]:
+        """
+        Calculate training samples needed to achieve target model metric values.
+        Parameters
+        ----------
+        targets : Mapping[str, ArrayLike]
+            Mapping of target metric scores (from 0.0 to 1.0) that we want
+            to achieve, where the key is the name of the metric.
+        n_iter : int or None, default None
+            Iteration to use when calculating the inverse power curve, if None defaults to 1000
+        Returns
+        -------
+        dict[str, NDArray]
+            List of the number of training samples needed to achieve each
+            corresponding entry in targets
+        """
+        projection = {}
+        for name, target in targets.items():
+            tarray = as_numpy(target)
+            if name not in self.measures:
+                continue
+            measure = self.measures[name]
+            if measure.ndim > 1:
+                projection[name] = np.zeros((len(measure), len(tarray)))
+                for i in range(len(measure)):
+                    projection[name][i] = inv_project_steps(
+                        self.params[name][i], tarray[i] if tarray.ndim == measure.ndim else tarray
+                    )
+            else:
+                projection[name] = inv_project_steps(self.params[name], tarray)
+        return projection

dataeval/typing.py ADDED Viewed

@@ -0,0 +1,234 @@
+"""
+Common type hints used for interoperability with DataEval.
+"""
+__all__ = [
+    "Array",
+    "ArrayLike",
+    "Dataset",
+    "AnnotatedDataset",
+    "DatasetMetadata",
+    "ImageClassificationDatum",
+    "ImageClassificationDataset",
+    "ObjectDetectionTarget",
+    "ObjectDetectionDatum",
+    "ObjectDetectionDataset",
+    "SegmentationTarget",
+    "SegmentationDatum",
+    "SegmentationDataset",
+]
+import sys
+from typing import Any, Generic, Iterator, Protocol, Sequence, TypedDict, TypeVar, Union, runtime_checkable
+from typing_extensions import NotRequired, Required
+if sys.version_info >= (3, 10):
+    from typing import TypeAlias
+else:
+    from typing_extensions import TypeAlias
+@runtime_checkable
+class Array(Protocol):
+    """
+    Protocol for array objects providing interoperability with DataEval.
+    Supports common array representations with popular libraries like
+    PyTorch, TensorFlow and JAX, as well as NumPy arrays.
+    Any object exposing the members declared on this class satisfies the
+    protocol; inheriting from it is not required.
+    Example
+    -------
+    >>> import numpy as np
+    >>> import torch
+    >>> from dataeval.typing import Array
+    Create array objects
+    >>> ndarray = np.random.random((10, 10))
+    >>> tensor = torch.tensor([1, 2, 3])
+    Check type at runtime
+    >>> isinstance(ndarray, Array)
+    True
+    >>> isinstance(tensor, Array)
+    True
+    """
+    # Because the protocol is @runtime_checkable, isinstance() only verifies that
+    # these members exist; it does not validate their signatures or return types.
+    @property
+    def shape(self) -> tuple[int, ...]: ...
+    def __array__(self) -> Any: ...
+    def __getitem__(self, key: Any, /) -> Any: ...
+    def __iter__(self) -> Iterator[Any]: ...
+    def __len__(self) -> int: ...
+# Covariant type variable for the datum type returned by the dataset protocols
+_T_co = TypeVar("_T_co", covariant=True)
+# Scalar element types accepted inside native Python sequences
+_ScalarType = Union[int, float, bool, str]
+# Accepts flat or singly nested sequences of scalars, sequences of Array objects, or a single Array
+ArrayLike: TypeAlias = Union[Sequence[_ScalarType], Sequence[Sequence[_ScalarType]], Sequence[Array], Array]
+"""
+Type alias for array-like objects used for interoperability with DataEval.
+This includes native Python sequences, as well as objects that conform to
+the :class:`Array` protocol.
+"""
+class DatasetMetadata(TypedDict, total=False):
+    """
+    Dataset level metadata required for all `AnnotatedDataset` classes.
+    Attributes
+    ----------
+    id : Required[str]
+        A unique identifier for the dataset
+    index2label : NotRequired[dict[int, str]]
+        A lookup table converting label value to class name
+    """
+    # total=False makes keys optional by default; each key's status is then
+    # stated explicitly with Required / NotRequired.
+    id: Required[str]
+    index2label: NotRequired[dict[int, str]]
+@runtime_checkable
+class Dataset(Generic[_T_co], Protocol):
+    """
+    Protocol for a generic `Dataset`.
+    Any object supporting indexing and ``len()`` satisfies this protocol; the
+    type parameter is the type of datum returned by indexing.
+    Methods
+    -------
+    __getitem__(index: int)
+        Returns datum at specified index.
+    __len__()
+        Returns dataset length.
+    """
+    # Runtime isinstance() checks only confirm that these methods exist
+    def __getitem__(self, index: int, /) -> _T_co: ...
+    def __len__(self) -> int: ...
+@runtime_checkable
+class AnnotatedDataset(Dataset[_T_co], Generic[_T_co], Protocol):
+    """
+    Protocol for a generic `AnnotatedDataset`.
+    Attributes
+    ----------
+    metadata : :class:`.DatasetMetadata` or derivatives.
+        Dataset level metadata
+    Methods
+    -------
+    __getitem__(index: int)
+        Returns datum at specified index.
+    __len__()
+        Returns dataset length.
+    Notes
+    -----
+    Inherits from :class:`.Dataset`.
+    """
+    # Adds a read-only `metadata` member on top of the indexing and length
+    # requirements inherited from Dataset
+    @property
+    def metadata(self) -> DatasetMetadata: ...
+# ========== IMAGE CLASSIFICATION DATASETS ==========
+# Datum layout: (image, label, datum metadata)
+ImageClassificationDatum: TypeAlias = tuple[Array, Array, dict[str, Any]]
+"""
+A type definition for an image classification datum tuple.
+- :class:`Array` of shape (C, H, W) - Image data in channel, height, width format.
+- :class:`Array` of shape (N,) - Class label as one-hot encoded ground-truth or prediction confidences.
+- dict[str, Any] - Datum level metadata.
+"""
+# Annotated dataset whose indexing returns ImageClassificationDatum tuples
+ImageClassificationDataset: TypeAlias = AnnotatedDataset[ImageClassificationDatum]
+"""
+A type definition for an :class:`AnnotatedDataset` of :class:`ImageClassificationDatum` elements.
+"""
+# ========== OBJECT DETECTION DATASETS ==========
+@runtime_checkable
+class ObjectDetectionTarget(Protocol):
+    """
+    A protocol for targets in an Object Detection dataset.
+    Attributes
+    ----------
+    boxes : :class:`ArrayLike` of shape (N, 4)
+        Four values per box, one row for each of the N entries
+    labels : :class:`ArrayLike` of shape (N,)
+        One label per box
+    scores : :class:`ArrayLike` of shape (N, M)
+        M score values per box
+    """
+    # NOTE(review): the box coordinate format and the meaning of M (presumably the
+    # number of classes) are not specified here - confirm against the consumers.
+    @property
+    def boxes(self) -> ArrayLike: ...
+    @property
+    def labels(self) -> ArrayLike: ...
+    @property
+    def scores(self) -> ArrayLike: ...
+# Datum layout: (image, detection target, datum metadata)
+ObjectDetectionDatum: TypeAlias = tuple[Array, ObjectDetectionTarget, dict[str, Any]]
+"""
+A type definition for an object detection datum tuple.
+- :class:`Array` of shape (C, H, W) - Image data in channel, height, width format.
+- :class:`ObjectDetectionTarget` - Object detection target information for the image.
+- dict[str, Any] - Datum level metadata.
+"""
+# Annotated dataset whose indexing returns ObjectDetectionDatum tuples
+ObjectDetectionDataset: TypeAlias = AnnotatedDataset[ObjectDetectionDatum]
+"""
+A type definition for an :class:`AnnotatedDataset` of :class:`ObjectDetectionDatum` elements.
+"""
+# ========== SEGMENTATION DATASETS ==========
+@runtime_checkable
+class SegmentationTarget(Protocol):
+    """
+    A protocol for targets in a Segmentation dataset.
+    Attributes
+    ----------
+    mask : :class:`ArrayLike`
+    labels : :class:`ArrayLike`
+    scores : :class:`ArrayLike`
+    """
+    # NOTE(review): unlike ObjectDetectionTarget, no shapes are documented for
+    # these members - confirm the expected layout against the consumers.
+    @property
+    def mask(self) -> ArrayLike: ...
+    @property
+    def labels(self) -> ArrayLike: ...
+    @property
+    def scores(self) -> ArrayLike: ...
+SegmentationDatum: TypeAlias = tuple[Array, SegmentationTarget, dict[str, Any]]
+"""
+A type definition for an image classification datum tuple.
+- :class:`Array` of shape (C, H, W) - Image data in channel, height, width format.
+- :class:`SegmentationTarget` - Segmentation target information for the image.
+- dict[str, Any] - Datum level metadata.
+"""
+SegmentationDataset: TypeAlias = AnnotatedDataset[SegmentationDatum]
+"""
+A type definition for an :class:`AnnotatedDataset` of :class:`SegmentationDatum` elements.
+"""

dataeval/utils/__init__.py CHANGED Viewed

@@ -4,6 +4,6 @@ in setting up data and architectures that are guaranteed to work with applicable
 DataEval metrics.
 """
-__all__ = ["dataset", "metadata", "torch"]
+__all__ = ["data", "metadata", "torch"]
-from dataeval.utils import dataset, metadata, torch
+from . import data, metadata, torch

dataeval 0.76.1__py3-none-any.whl → 0.82.0__py3-none-any.whl

dataeval-0.76.1-py3-none-any.whl → dataeval-0.82.0-py3-none-any.whl