PyPI - dataeval - Versions diffs - 0.81.0__py3-none-any.whl → 0.82.1__py3-none-any.whl - Mend

dataeval 0.81.0__py3-none-any.whl → 0.82.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (86) hide show

dataeval/__init__.py +1 -1
dataeval/config.py +68 -11
dataeval/detectors/drift/__init__.py +2 -2
dataeval/detectors/drift/_base.py +8 -64
dataeval/detectors/drift/_mmd.py +12 -38
dataeval/detectors/drift/_torch.py +7 -7
dataeval/detectors/drift/_uncertainty.py +6 -5
dataeval/detectors/drift/updates.py +20 -3
dataeval/detectors/linters/__init__.py +3 -2
dataeval/detectors/linters/duplicates.py +14 -46
dataeval/detectors/linters/outliers.py +25 -159
dataeval/detectors/ood/__init__.py +1 -1
dataeval/detectors/ood/ae.py +6 -5
dataeval/detectors/ood/base.py +2 -2
dataeval/detectors/ood/metadata_ood_mi.py +4 -6
dataeval/detectors/ood/mixin.py +3 -4
dataeval/detectors/ood/vae.py +3 -2
dataeval/metadata/__init__.py +2 -1
dataeval/metadata/_distance.py +134 -0
dataeval/metadata/_ood.py +30 -49
dataeval/metadata/_utils.py +44 -0
dataeval/metrics/bias/__init__.py +5 -4
dataeval/metrics/bias/_balance.py +17 -149
dataeval/metrics/bias/_coverage.py +4 -106
dataeval/metrics/bias/_diversity.py +12 -107
dataeval/metrics/bias/_parity.py +7 -71
dataeval/metrics/estimators/__init__.py +5 -4
dataeval/metrics/estimators/_ber.py +2 -20
dataeval/metrics/estimators/_clusterer.py +1 -61
dataeval/metrics/estimators/_divergence.py +2 -19
dataeval/metrics/estimators/_uap.py +2 -16
dataeval/metrics/stats/__init__.py +15 -12
dataeval/metrics/stats/_base.py +41 -128
dataeval/metrics/stats/_boxratiostats.py +13 -13
dataeval/metrics/stats/_dimensionstats.py +17 -58
dataeval/metrics/stats/_hashstats.py +19 -35
dataeval/metrics/stats/_imagestats.py +94 -0
dataeval/metrics/stats/_labelstats.py +42 -121
dataeval/metrics/stats/_pixelstats.py +19 -51
dataeval/metrics/stats/_visualstats.py +19 -51
dataeval/outputs/__init__.py +57 -0
dataeval/outputs/_base.py +182 -0
dataeval/outputs/_bias.py +381 -0
dataeval/outputs/_drift.py +83 -0
dataeval/outputs/_estimators.py +114 -0
dataeval/outputs/_linters.py +186 -0
dataeval/outputs/_metadata.py +54 -0
dataeval/{detectors/ood/output.py → outputs/_ood.py} +22 -22
dataeval/outputs/_stats.py +393 -0
dataeval/outputs/_utils.py +44 -0
dataeval/outputs/_workflows.py +364 -0
dataeval/typing.py +187 -7
dataeval/utils/_method.py +1 -5
dataeval/utils/_plot.py +2 -2
dataeval/utils/data/__init__.py +5 -1
dataeval/utils/data/_dataset.py +217 -0
dataeval/utils/data/_embeddings.py +12 -14
dataeval/utils/data/_images.py +30 -27
dataeval/utils/data/_metadata.py +28 -11
dataeval/utils/data/_selection.py +25 -22
dataeval/utils/data/_split.py +5 -29
dataeval/utils/data/_targets.py +14 -2
dataeval/utils/data/datasets/_base.py +5 -5
dataeval/utils/data/datasets/_cifar10.py +1 -1
dataeval/utils/data/datasets/_milco.py +1 -1
dataeval/utils/data/datasets/_mnist.py +1 -1
dataeval/utils/data/datasets/_ships.py +1 -1
dataeval/utils/data/{_types.py → datasets/_types.py} +10 -16
dataeval/utils/data/datasets/_voc.py +1 -1
dataeval/utils/data/selections/_classfilter.py +4 -5
dataeval/utils/data/selections/_indices.py +2 -2
dataeval/utils/data/selections/_limit.py +2 -2
dataeval/utils/data/selections/_reverse.py +2 -2
dataeval/utils/data/selections/_shuffle.py +2 -2
dataeval/utils/torch/_internal.py +5 -5
dataeval/utils/torch/trainer.py +8 -8
dataeval/workflows/__init__.py +2 -1
dataeval/workflows/sufficiency.py +6 -342
{dataeval-0.81.0.dist-info → dataeval-0.82.1.dist-info}/METADATA +2 -2
dataeval-0.82.1.dist-info/RECORD +105 -0
dataeval/_output.py +0 -137
dataeval/detectors/ood/metadata_ks_compare.py +0 -129
dataeval/metrics/stats/_datasetstats.py +0 -198
dataeval-0.81.0.dist-info/RECORD +0 -94
{dataeval-0.81.0.dist-info → dataeval-0.82.1.dist-info}/LICENSE.txt +0 -0
{dataeval-0.81.0.dist-info → dataeval-0.82.1.dist-info}/WHEEL +0 -0

dataeval/outputs/_bias.py ADDED Viewed

@@ -0,0 +1,381 @@
+from __future__ import annotations
+__all__ = []
+import contextlib
+from dataclasses import asdict, dataclass
+from typing import Any, Literal, TypeVar, overload
+import numpy as np
+from numpy.typing import NDArray
+with contextlib.suppress(ImportError):
+    import pandas as pd
+    from matplotlib.figure import Figure
+from dataeval.outputs._base import Output
+from dataeval.typing import ArrayLike
+from dataeval.utils._array import to_numpy
+from dataeval.utils._plot import heatmap
+# Constrained type variable: either a scalar np.float64 or an NDArray of np.float64.
+# NOTE(review): no definition visible in this part of the file references TData - confirm it is still needed.
+TData = TypeVar("TData", np.float64, NDArray[np.float64])
+class ToDataFrameMixin:
+    """
+    Mixin that adds a pandas export to outputs exposing ``score`` and ``p_value``.
+    The host class may also expose ``factor_names``; when it does, those names
+    become the row index of the exported frame.
+    """
+    score: Any
+    p_value: Any
+    def to_dataframe(self) -> pd.DataFrame:
+        """
+        Exports the parity output results to a pandas DataFrame.
+        Returns
+        -------
+        pd.DataFrame
+            One row per score with columns ``score`` and ``p-value``, both rounded
+            to 2 decimal places. Rows are indexed by ``factor_names`` when the
+            output defines them, otherwise by the default integer index.
+        Notes
+        -----
+        This method requires `pandas <https://pandas.pydata.org/>`_ to be installed.
+        """
+        import pandas as pd
+        # LabelParityOutput declares no factor_names; fall back to the default index
+        # instead of raising AttributeError.
+        index = getattr(self, "factor_names", None)
+        return pd.DataFrame(
+            index=index,  # type: ignore - list[str] is documented as acceptable index type
+            data={
+                # np.atleast_1d turns scalar results into 1-element columns (pandas
+                # cannot build a frame from scalars alone) and leaves arrays untouched
+                "score": np.atleast_1d(self.score).round(2),
+                "p-value": np.atleast_1d(self.p_value).round(2),
+            },
+        )
+@dataclass(frozen=True)
+class ParityOutput(ToDataFrameMixin, Output):
+    """
+    Output class for :func:`.parity` :term:`bias<Bias>` metrics.
+    Frozen dataclass; ``to_dataframe`` is provided by :class:`ToDataFrameMixin`.
+    Attributes
+    ----------
+    score : NDArray[np.float64]
+        chi-squared score(s) of the test
+    p_value : NDArray[np.float64]
+        p-value(s) of the test
+    factor_names : list[str]
+        Names of each metadata factor
+    insufficient_data : dict[str, dict[int, dict[str, int]]]
+        Dictionary of metadata factors with less than 5 class occurrences per value
+    """
+    score: NDArray[np.float64]
+    p_value: NDArray[np.float64]
+    factor_names: list[str]
+    # Nested mapping; presumably factor name -> factor value -> class name -> count - TODO confirm
+    insufficient_data: dict[str, dict[int, dict[str, int]]]
+@dataclass(frozen=True)
+class LabelParityOutput(ToDataFrameMixin, Output):
+    """
+    Output class for :func:`.label_parity` :term:`bias<Bias>` metrics.
+    Unlike :class:`ParityOutput`, both results are single scalar values.
+    Attributes
+    ----------
+    score : np.float64
+        chi-squared score of the test
+    p_value : np.float64
+        p-value of the test
+    """
+    score: np.float64
+    p_value: np.float64
+@dataclass(frozen=True)
+class CoverageOutput(Output):
+    """
+    Output class for :func:`.coverage` :term:`bias<Bias>` metric.
+    Attributes
+    ----------
+    uncovered_indices : NDArray[np.intp]
+        Array of uncovered indices
+    critical_value_radii : NDArray[np.float64]
+        Array of critical value radii
+    coverage_radius : float
+        Radius for :term:`coverage<Coverage>`
+    """
+    uncovered_indices: NDArray[np.intp]
+    critical_value_radii: NDArray[np.float64]
+    coverage_radius: float
+    def plot(self, images: ArrayLike, top_k: int = 6) -> Figure:
+        """
+        Plot the top k images together for visualization.
+        The first ``top_k`` entries of ``uncovered_indices`` select the images, which
+        are laid out on a grid that is 3 columns wide.
+        Parameters
+        ----------
+        images : ArrayLike
+            Original images (not embeddings) in (N, C, H, W) or (N, H, W) format
+        top_k : int, default 6
+            Maximum number of images to plot (the grid is filled in rows of 3)
+        Returns
+        -------
+        matplotlib.figure.Figure
+            Figure with one axes per grid cell; cells without an image are left blank
+        Raises
+        ------
+        ValueError
+            If the selected images are neither 3- nor 4-dimensional
+        Notes
+        -----
+        This method requires `matplotlib <https://matplotlib.org/>`_ to be installed.
+        """
+        import matplotlib.pyplot as plt
+        # Determine which images to plot
+        highest_uncovered_indices = self.uncovered_indices[:top_k]
+        # Grab the images
+        selected_images = to_numpy(images)[highest_uncovered_indices]
+        ndim = selected_images.ndim
+        if ndim == 4:
+            # Channels-first -> channels-last, the layout imshow expects
+            selected_images = np.moveaxis(selected_images, 1, -1)
+            if selected_images.shape[-1] == 1:
+                # imshow rejects (H, W, 1) data; replicate the single channel to 3,
+                # mirroring how (N, H, W) input is handled below
+                selected_images = np.repeat(selected_images, 3, axis=-1)
+        elif ndim == 3:
+            selected_images = np.repeat(selected_images[:, :, :, np.newaxis], 3, axis=-1)
+        else:
+            raise ValueError(
+                f"Expected a (N,C,H,W) or a (N, H, W) set of images, but got a {ndim}-dimensional set of images."
+            )
+        # Size the grid from the images actually selected: there may be fewer
+        # uncovered indices than top_k, and a grid needs at least one row
+        num_images = len(selected_images)
+        rows = max(1, int(np.ceil(num_images / 3)))
+        # squeeze=False always yields a 2-D axes array, so one loop covers every grid size
+        fig, axs = plt.subplots(rows, 3, figsize=(9, 3 * rows), squeeze=False)
+        for position, ax in enumerate(axs.flat):
+            if position < num_images:
+                ax.imshow(selected_images[position])
+            # Hide ticks and frame on every cell, including the unused ones
+            ax.axis("off")
+        fig.tight_layout()
+        return fig
+@dataclass(frozen=True)
+class BalanceOutput(Output):
+    """
+    Output class for :func:`.balance` :term:`bias<Bias>` metric.
+    Attributes
+    ----------
+    balance : NDArray[np.float64]
+        Estimate of mutual information between metadata factors and class label
+    factors : NDArray[np.float64]
+        Estimate of inter/intra-factor mutual information
+    classwise : NDArray[np.float64]
+        Estimate of mutual information between metadata factors and individual class labels
+    factor_names : list[str]
+        Names of each metadata factor
+    class_names : list[str]
+        List of the class labels present in the dataset
+    """
+    balance: NDArray[np.float64]
+    factors: NDArray[np.float64]
+    classwise: NDArray[np.float64]
+    factor_names: list[str]
+    class_names: list[str]
+    # Typed overloads: "factor_names" yields list[str]; the array attributes yield NDArray[np.float64]
+    @overload
+    def _by_factor_type(
+        self,
+        attr: Literal["factor_names"],
+        factor_type: Literal["discrete", "continuous", "both"],
+    ) -> list[str]: ...
+    @overload
+    def _by_factor_type(
+        self,
+        attr: Literal["balance", "factors", "classwise"],
+        factor_type: Literal["discrete", "continuous", "both"],
+    ) -> NDArray[np.float64]: ...
+    def _by_factor_type(
+        self,
+        attr: Literal["balance", "factors", "classwise", "factor_names"],
+        factor_type: Literal["discrete", "continuous", "both"],
+    ) -> NDArray[np.float64] | list[str]:
+        """
+        Return one attribute restricted to the factors of the requested type.
+        Parameters
+        ----------
+        attr : "balance", "factors", "classwise", or "factor_names"
+            Name of the attribute to return
+        factor_type : "discrete", "continuous", or "both"
+            "both" returns the attribute unfiltered; "discrete" drops factors whose name
+            contains "-continuous"; "continuous" drops factors whose name contains "-discrete"
+        Returns
+        -------
+        NDArray[np.float64] or list[str]
+            The filtered attribute. For "factor_names" the ``-<factor_type>`` marker is
+            removed from each retained name.
+        """
+        # if not filtering by factor_type then just return the requested attribute without mask
+        if factor_type == "both":
+            return getattr(self, attr)
+        # create the mask for the selected factor_type; names carrying neither marker pass both filters
+        mask_lambda = (
+            (lambda x: "-continuous" not in x) if factor_type == "discrete" else (lambda x: "-discrete" not in x)
+        )
+        # return the masked attribute
+        if attr == "factor_names":
+            return [x.replace(f"-{factor_type}", "") for x in self.factor_names if mask_lambda(x)]
+        else:
+            factor_type_mask = np.asarray([mask_lambda(x) for x in self.factor_names])
+            if attr == "factors":
+                # The first mask entry is skipped and the rest is applied to rows, then columns.
+                # Presumably factor_names[0] is the class label, which has no row/column in
+                # `factors` - TODO confirm
+                return self.factors[factor_type_mask[1:]][:, factor_type_mask[1:]]
+            elif attr == "balance":
+                return self.balance[factor_type_mask]
+            elif attr == "classwise":
+                return self.classwise[:, factor_type_mask]
+            # NOTE(review): any other attr value falls through here and returns None implicitly
+    def plot(
+        self,
+        row_labels: list[Any] | NDArray[Any] | None = None,
+        col_labels: list[Any] | NDArray[Any] | None = None,
+        plot_classwise: bool = False,
+        factor_type: Literal["discrete", "continuous", "both"] = "discrete",
+    ) -> Figure:
+        """
+        Plot a heatmap of balance information.
+        Parameters
+        ----------
+        row_labels : ArrayLike or None, default None
+            List/Array containing the labels for rows in the heatmap
+        col_labels : ArrayLike or None, default None
+            List/Array containing the labels for columns in the heatmap
+        plot_classwise : bool, default False
+            Whether to plot per-class balance instead of global balance
+        factor_type : "discrete", "continuous", or "both", default "discrete"
+            Whether to plot discretized values, continuous values, or to include both
+        Returns
+        -------
+        matplotlib.figure.Figure
+        Notes
+        -----
+        This method requires `matplotlib <https://matplotlib.org/>`_ to be installed.
+        """
+        if plot_classwise:
+            # Default labels: classes on the rows, filtered factor names on the columns
+            if row_labels is None:
+                row_labels = self.class_names
+            if col_labels is None:
+                col_labels = self._by_factor_type("factor_names", factor_type)
+            fig = heatmap(
+                self._by_factor_type("classwise", factor_type),
+                row_labels,
+                col_labels,
+                xlabel="Factors",
+                ylabel="Class",
+                cbarlabel="Normalized Mutual Information",
+            )
+        else:
+            # Combine balance and factors results: the balance values (first entry dropped)
+            # become a single row stacked on top of the factors matrix
+            data = np.concatenate(
+                [
+                    self._by_factor_type("balance", factor_type)[np.newaxis, 1:],
+                    self._by_factor_type("factors", factor_type),
+                ],
+                axis=0,
+            )
+            # Mask is True for cells to hide. np.triu zeroes everything below the main diagonal
+            # of the stacked array, so after the +1 shift those cells compare < 1 while kept
+            # cells stay >= 1 (assumes the values are non-negative - TODO confirm)
+            mask = np.triu(data + 1, k=0) < 1
+            # Finalize the data for the plot, last row is last factor x last factor so it gets dropped
+            heat_data = np.where(mask, np.nan, data)[:-1]
+            # Creating label array for heat map axes
+            heat_labels = self._by_factor_type("factor_names", factor_type)
+            # Rows omit the last name and columns omit the first name
+            if row_labels is None:
+                row_labels = heat_labels[:-1]
+            if col_labels is None:
+                col_labels = heat_labels[1:]
+            fig = heatmap(heat_data, row_labels, col_labels, cbarlabel="Normalized Mutual Information")
+        return fig
+@dataclass(frozen=True)
+class DiversityOutput(Output):
+    """
+    Output class for :func:`.diversity` :term:`bias<Bias>` metric.
+    Attributes
+    ----------
+    diversity_index : NDArray[np.double]
+        :term:`Diversity` index for classes and factors
+    classwise : NDArray[np.double]
+        Classwise diversity index [n_class x n_factor]
+    factor_names : list[str]
+        Names of each metadata factor
+    class_names : list[str]
+        Class labels for each value in the dataset
+    """
+    diversity_index: NDArray[np.double]
+    classwise: NDArray[np.double]
+    factor_names: list[str]
+    class_names: list[str]
+    def plot(
+        self,
+        row_labels: ArrayLike | None = None,
+        col_labels: ArrayLike | None = None,
+        plot_classwise: bool = False,
+    ) -> Figure:
+        """
+        Plot diversity information.
+        The overall diversity index is drawn as a bar chart; the classwise
+        diversity index is drawn as a heatmap.
+        Parameters
+        ----------
+        row_labels : ArrayLike or None, default None
+            Labels for the heatmap rows; only used when ``plot_classwise`` is True
+        col_labels : ArrayLike or None, default None
+            Labels for the heatmap columns; only used when ``plot_classwise`` is True
+        plot_classwise : bool, default False
+            Whether to plot per-class diversity instead of the overall diversity index
+        Returns
+        -------
+        matplotlib.figure.Figure
+        Notes
+        -----
+        This method requires `matplotlib <https://matplotlib.org/>`_ to be installed.
+        """
+        if not plot_classwise:
+            import matplotlib.pyplot as plt
+            figure, axes = plt.subplots(figsize=(8, 8))
+            # One bar per diversity_index entry: "class" first, then each factor
+            bar_labels = np.concatenate((["class"], self.factor_names))
+            axes.bar(bar_labels, self.diversity_index)
+            axes.set_xlabel("Factors")
+            plt.setp(axes.get_xticklabels(), rotation=45, ha="right", rotation_mode="anchor")
+            figure.tight_layout()
+            return figure
+        # Classwise heatmap: default to classes on the rows and factors on the columns
+        return heatmap(
+            self.classwise,
+            self.class_names if row_labels is None else row_labels,
+            self.factor_names if col_labels is None else col_labels,
+            xlabel="Factors",
+            ylabel="Class",
+            cbarlabel=f"Normalized {asdict(self.meta())['arguments']['method'].title()} Index",
+        )

dataeval/outputs/_drift.py ADDED Viewed

@@ -0,0 +1,83 @@
+from __future__ import annotations
+__all__ = []
+from dataclasses import dataclass
+import numpy as np
+from numpy.typing import NDArray
+from dataeval.outputs._base import Output
+@dataclass(frozen=True)
+class DriftBaseOutput(Output):
+    """
+    Base output class for Drift Detector classes
+    Holds the four fields shared by :class:`DriftMMDOutput` and :class:`DriftOutput`;
+    the exact meaning of each value is documented on those subclasses.
+    Attributes
+    ----------
+    drifted : bool
+        Drift prediction
+    threshold : float
+        Threshold used for the drift prediction
+    p_val : float
+        P-value of the test
+    distance : float
+        Distance between the reference and test set
+    """
+    drifted: bool
+    threshold: float
+    p_val: float
+    distance: float
+@dataclass(frozen=True)
+class DriftMMDOutput(DriftBaseOutput):
+    """
+    Output class for :class:`.DriftMMD` :term:`drift<Drift>` detector.
+    Attributes
+    ----------
+    drifted : bool
+        Drift prediction for the images
+    threshold : float
+        :term:`P-Value` used for significance of the permutation test
+    p_val : float
+        P-value obtained from the permutation test
+    distance : float
+        MMD^2 between the reference and test set
+    distance_threshold : float
+        MMD^2 threshold above which drift is flagged
+    """
+    # The four fields below are inherited from DriftBaseOutput; they are listed
+    # (commented out) only as a reminder of the full field order.
+    # drifted: bool
+    # threshold: float
+    # p_val: float
+    # distance: float
+    distance_threshold: float
+@dataclass(frozen=True)
+class DriftOutput(DriftBaseOutput):
+    """
+    Output class for :class:`.DriftCVM`, :class:`.DriftKS`, and :class:`.DriftUncertainty` drift detectors.
+    Attributes
+    ----------
+    drifted : bool
+        :term:`Drift` prediction for the images
+    threshold : float
+        Threshold after multivariate correction if needed
+    p_val : float
+        Instance-level p-value
+    distance : float
+        Instance-level distance
+    feature_drift : NDArray[np.bool_]
+        Feature-level array of images detected to have drifted
+    feature_threshold : float
+        Feature-level threshold to determine drift
+    p_vals : NDArray[np.float32]
+        Feature-level p-values
+    distances : NDArray[np.float32]
+        Feature-level distances
+    """
+    # The four fields below are inherited from DriftBaseOutput; they are listed
+    # (commented out) only as a reminder of the full field order.
+    # drifted: bool
+    # threshold: float
+    # p_val: float
+    # distance: float
+    feature_drift: NDArray[np.bool_]
+    feature_threshold: float
+    p_vals: NDArray[np.float32]
+    distances: NDArray[np.float32]

dataeval/outputs/_estimators.py ADDED Viewed

@@ -0,0 +1,114 @@
+from __future__ import annotations
+__all__ = []
+from dataclasses import dataclass
+import numpy as np
+from numpy.typing import NDArray
+from dataeval.outputs._base import Output
+@dataclass(frozen=True)
+class BEROutput(Output):
+    """
+    Output class for :func:`.ber` estimator metric.
+    Attributes
+    ----------
+    ber : float
+        The upper bound of the :term:`Bayes error rate<Bayes Error Rate (BER)>`
+    ber_lower : float
+        The lower bound of the Bayes error rate
+    """
+    # Upper-bound estimate
+    ber: float
+    # Lower-bound estimate
+    ber_lower: float
+@dataclass(frozen=True)
+class ClustererOutput(Output):
+    """
+    Output class for :func:`.clusterer`.
+    Attributes
+    ----------
+    clusters : NDArray[np.int_]
+        Assigned clusters
+    mst : NDArray[np.double]
+        The minimum spanning tree of the data
+    linkage_tree : NDArray[np.double]
+        The linkage array of the data
+    condensed_tree : NDArray[np.double]
+        The condensed tree of the data
+    membership_strengths : NDArray[np.double]
+        The strength of the data point belonging to the assigned cluster
+    """
+    clusters: NDArray[np.int_]
+    mst: NDArray[np.double]
+    linkage_tree: NDArray[np.double]
+    condensed_tree: NDArray[np.double]
+    membership_strengths: NDArray[np.double]
+    def find_outliers(self) -> NDArray[np.int_]:
+        """
+        Retrieves the outliers, i.e. the samples whose assigned cluster is -1
+        Returns
+        -------
+        NDArray[int]
+            A numpy array of the outlier indices
+        """
+        unassigned = self.clusters == -1
+        return np.nonzero(unassigned)[0]
+    def find_duplicates(self) -> tuple[list[list[int]], list[list[int]]]:
+        """
+        Finds exact and near duplicate data from the minimum spanning tree and cluster assignments
+        Returns
+        -------
+        Tuple[List[List[int]], List[List[int]]]
+            The exact :term:`duplicates<Duplicates>` and near duplicates as lists of related indices
+        """
+        # Imported lazily so the numba compiled helpers load only when needed
+        from dataeval.utils._clusterer import compare_links_to_cluster_std, sorted_union_find
+        def _as_int_lists(groups: Any) -> list[list[int]]:
+            # Cast every member to a plain Python int
+            return [[int(member) for member in group] for group in groups]
+        exact_links, near_links = compare_links_to_cluster_std(self.mst, self.clusters)
+        exact_groups = sorted_union_find(exact_links)
+        near_groups = sorted_union_find(near_links)
+        return _as_int_lists(exact_groups), _as_int_lists(near_groups)
+@dataclass(frozen=True)
+class DivergenceOutput(Output):
+    """
+    Output class for :func:`.divergence` estimator metric.
+    Attributes
+    ----------
+    divergence : float
+        :term:`Divergence` value calculated between 2 datasets; ranges between 0.0 and 1.0
+    errors : int
+        The number of differing edges between the datasets
+    """
+    divergence: float
+    # Count of differing edges (see the docstring above)
+    errors: int
+@dataclass(frozen=True)
+class UAPOutput(Output):
+    """
+    Output class for :func:`.uap` estimator metric.
+    Attributes
+    ----------
+    uap : float
+        The empirical mean precision estimate
+    """
+    # Single scalar result; the dataclass is frozen, so it cannot be reassigned after creation
+    uap: float

dataeval 0.81.0__py3-none-any.whl → 0.82.1__py3-none-any.whl

dataeval 0.81.0__py3-none-any.whl → 0.82.1__py3-none-any.whl