dataeval 0.72.0__py3-none-any.whl → 0.72.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (90)
  1. dataeval/__init__.py +4 -4
  2. dataeval/detectors/__init__.py +4 -3
  3. dataeval/detectors/drift/__init__.py +10 -11
  4. dataeval/{_internal/detectors → detectors}/drift/base.py +51 -102
  5. dataeval/{_internal/detectors → detectors}/drift/cvm.py +9 -8
  6. dataeval/{_internal/detectors → detectors}/drift/ks.py +11 -10
  7. dataeval/{_internal/detectors → detectors}/drift/mmd.py +33 -34
  8. dataeval/{_internal/detectors → detectors}/drift/torch.py +15 -13
  9. dataeval/{_internal/detectors → detectors}/drift/uncertainty.py +12 -9
  10. dataeval/detectors/drift/updates.py +61 -0
  11. dataeval/detectors/linters/__init__.py +3 -3
  12. dataeval/{_internal/detectors → detectors/linters}/clusterer.py +47 -45
  13. dataeval/{_internal/detectors → detectors/linters}/duplicates.py +20 -10
  14. dataeval/{_internal/detectors → detectors/linters}/merged_stats.py +3 -1
  15. dataeval/{_internal/detectors → detectors/linters}/outliers.py +19 -26
  16. dataeval/detectors/ood/__init__.py +8 -16
  17. dataeval/{_internal/detectors → detectors}/ood/ae.py +9 -9
  18. dataeval/{_internal/detectors → detectors}/ood/aegmm.py +10 -30
  19. dataeval/{_internal/detectors → detectors}/ood/base.py +27 -21
  20. dataeval/{_internal/detectors → detectors}/ood/llr.py +27 -23
  21. dataeval/detectors/ood/metadata_ks_compare.py +99 -0
  22. dataeval/detectors/ood/metadata_least_likely.py +119 -0
  23. dataeval/detectors/ood/metadata_ood_mi.py +92 -0
  24. dataeval/{_internal/detectors → detectors}/ood/vae.py +11 -13
  25. dataeval/{_internal/detectors → detectors}/ood/vaegmm.py +10 -32
  26. dataeval/{_internal/interop.py → interop.py} +12 -7
  27. dataeval/metrics/__init__.py +1 -1
  28. dataeval/metrics/bias/__init__.py +4 -4
  29. dataeval/{_internal/metrics → metrics/bias}/balance.py +70 -4
  30. dataeval/{_internal/metrics → metrics/bias}/coverage.py +10 -8
  31. dataeval/{_internal/metrics → metrics/bias}/diversity.py +54 -20
  32. dataeval/metrics/bias/metadata.py +275 -0
  33. dataeval/{_internal/metrics → metrics/bias}/parity.py +21 -17
  34. dataeval/metrics/estimators/__init__.py +3 -3
  35. dataeval/{_internal/metrics → metrics/estimators}/ber.py +31 -28
  36. dataeval/{_internal/metrics → metrics/estimators}/divergence.py +15 -16
  37. dataeval/{_internal/metrics → metrics/estimators}/uap.py +8 -6
  38. dataeval/metrics/stats/__init__.py +7 -7
  39. dataeval/{_internal/metrics → metrics}/stats/base.py +66 -40
  40. dataeval/{_internal/metrics → metrics}/stats/boxratiostats.py +19 -15
  41. dataeval/{_internal/metrics → metrics}/stats/datasetstats.py +19 -17
  42. dataeval/{_internal/metrics → metrics}/stats/dimensionstats.py +12 -10
  43. dataeval/metrics/stats/hashstats.py +156 -0
  44. dataeval/{_internal/metrics → metrics}/stats/labelstats.py +8 -6
  45. dataeval/{_internal/metrics → metrics}/stats/pixelstats.py +12 -11
  46. dataeval/{_internal/metrics → metrics}/stats/visualstats.py +14 -13
  47. dataeval/{_internal/output.py → output.py} +26 -6
  48. dataeval/utils/__init__.py +8 -4
  49. dataeval/utils/image.py +71 -0
  50. dataeval/utils/shared.py +151 -0
  51. dataeval/utils/split_dataset.py +486 -0
  52. dataeval/utils/tensorflow/__init__.py +9 -7
  53. dataeval/{_internal/models/tensorflow → utils/tensorflow/_internal}/autoencoder.py +64 -68
  54. dataeval/{_internal/models/tensorflow/losses.py → utils/tensorflow/_internal/loss.py} +10 -9
  55. dataeval/{_internal/models/tensorflow → utils/tensorflow/_internal}/pixelcnn.py +18 -22
  56. dataeval/{_internal/models/tensorflow → utils/tensorflow/_internal}/trainer.py +3 -1
  57. dataeval/{_internal/models/tensorflow → utils/tensorflow/_internal}/utils.py +18 -18
  58. dataeval/utils/tensorflow/loss/__init__.py +6 -2
  59. dataeval/utils/torch/__init__.py +7 -3
  60. dataeval/{_internal/models/pytorch → utils/torch}/blocks.py +19 -14
  61. dataeval/{_internal → utils/torch}/datasets.py +49 -43
  62. dataeval/utils/torch/models.py +138 -0
  63. dataeval/{_internal/models/pytorch/autoencoder.py → utils/torch/trainer.py} +12 -141
  64. dataeval/{_internal → utils/torch}/utils.py +3 -1
  65. dataeval/workflows/__init__.py +1 -1
  66. dataeval/{_internal/workflows → workflows}/sufficiency.py +42 -37
  67. {dataeval-0.72.0.dist-info → dataeval-0.72.2.dist-info}/METADATA +7 -5
  68. dataeval-0.72.2.dist-info/RECORD +72 -0
  69. dataeval/_internal/detectors/__init__.py +0 -0
  70. dataeval/_internal/detectors/drift/__init__.py +0 -0
  71. dataeval/_internal/detectors/ood/__init__.py +0 -0
  72. dataeval/_internal/metrics/__init__.py +0 -0
  73. dataeval/_internal/metrics/stats/hashstats.py +0 -75
  74. dataeval/_internal/metrics/utils.py +0 -447
  75. dataeval/_internal/models/__init__.py +0 -0
  76. dataeval/_internal/models/pytorch/__init__.py +0 -0
  77. dataeval/_internal/models/pytorch/utils.py +0 -67
  78. dataeval/_internal/models/tensorflow/__init__.py +0 -0
  79. dataeval/_internal/workflows/__init__.py +0 -0
  80. dataeval/detectors/drift/kernels/__init__.py +0 -10
  81. dataeval/detectors/drift/updates/__init__.py +0 -7
  82. dataeval/utils/tensorflow/models/__init__.py +0 -9
  83. dataeval/utils/tensorflow/recon/__init__.py +0 -3
  84. dataeval/utils/torch/datasets/__init__.py +0 -12
  85. dataeval/utils/torch/models/__init__.py +0 -11
  86. dataeval/utils/torch/trainer/__init__.py +0 -7
  87. dataeval-0.72.0.dist-info/RECORD +0 -80
  88. /dataeval/{_internal/models/tensorflow → utils/tensorflow/_internal}/gmm.py +0 -0
  89. {dataeval-0.72.0.dist-info → dataeval-0.72.2.dist-info}/LICENSE.txt +0 -0
  90. {dataeval-0.72.0.dist-info → dataeval-0.72.2.dist-info}/WHEEL +0 -0
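
The dominant change in this release is a package restructure: implementation modules move out of the private `dataeval._internal` tree into the public namespaces (`dataeval.detectors`, `dataeval.metrics`, `dataeval.utils`, `dataeval.workflows`), with the TensorFlow-specific internals consolidated under `dataeval/utils/tensorflow/_internal/`. For consumers this mostly shows up as new canonical import paths. A before/after sketch (the `divergence` symbols are taken from the `estimators/__init__.py` hunk at the end of this diff; the other moved modules follow the same pattern):

```python
# dataeval 0.72.0: public wrappers re-exported symbols from private modules
from dataeval._internal.metrics.divergence import DivergenceOutput, divergence

# dataeval 0.72.2: the implementation lives in, and is imported from, public modules
from dataeval.metrics.estimators import DivergenceOutput, divergence
```

The selected hunks below show this pattern for the bias metrics and estimators.
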
dataeval/{_internal/metrics → metrics/bias}/diversity.py +54 -20

@@ -1,40 +1,77 @@
  from __future__ import annotations
 
+ __all__ = ["DiversityOutput", "diversity"]
+
  from dataclasses import dataclass
- from typing import Literal, Mapping
+ from typing import Any, Literal, Mapping
 
  import numpy as np
  from numpy.typing import ArrayLike, NDArray
 
- from dataeval._internal.metrics.utils import entropy, get_counts, get_method, get_num_bins, preprocess_metadata
- from dataeval._internal.output import OutputMetadata, set_metadata
+ from dataeval.metrics.bias.metadata import entropy, get_counts, get_num_bins, heatmap, preprocess_metadata
+ from dataeval.output import OutputMetadata, set_metadata
+ from dataeval.utils.shared import get_method
 
 
  @dataclass(frozen=True)
  class DiversityOutput(OutputMetadata):
      """
-     Output class for :func:`diversity` bias metric
+     Output class for :func:`diversity` :term:`bias<Bias>` metric
 
      Attributes
      ----------
      diversity_index : NDArray[np.float64]
-         Diversity index for classes and factors
+         :term:`Diversity` index for classes and factors
      classwise : NDArray[np.float64]
          Classwise diversity index [n_class x n_factor]
+     class_list: NDArray[np.int64]
+         Class labels for each value in the dataset
+     metadata_names: list[str]
+         Names of each metadata factor
      """
 
      diversity_index: NDArray[np.float64]
      classwise: NDArray[np.float64]
 
+     class_list: NDArray[np.int64]
+     metadata_names: list[str]
+
+     method: Literal["shannon", "simpson"]
+
+     def plot(self, row_labels: NDArray[Any] | None = None, col_labels: NDArray[Any] | None = None) -> None:
+         """
+         Plot a heatmap of diversity information
+
+         Parameters
+         ----------
+         row_labels: NDArray | None, default None
+             Array containing the labels for rows in the histogram
+         col_labels: NDArray | None, default None
+             Array containing the labels for columns in the histogram
+         """
+         if row_labels is None:
+             row_labels = np.unique(self.class_list)
+         if col_labels is None:
+             col_labels = np.array(self.metadata_names)
+
+         heatmap(
+             self.classwise,
+             row_labels,
+             col_labels,
+             xlabel="Factors",
+             ylabel="Class",
+             cbarlabel=f"Normalized {self.method.title()} Index",
+         )
+
 
  def diversity_shannon(
-     data: NDArray,
+     data: NDArray[Any],
      names: list[str],
      is_categorical: list[bool],
      subset_mask: NDArray[np.bool_] | None = None,
- ) -> NDArray:
+ ) -> NDArray[np.float64]:
      """
-     Compute diversity for discrete/categorical variables and, through standard
+     Compute :term:`diversity<Diversity>` for discrete/categorical variables and, through standard
      histogram binning, for continuous variables.
 
      We define diversity as a normalized form of the Shannon entropy.

@@ -79,13 +116,13 @@ def diversity_shannon(
 
 
  def diversity_simpson(
-     data: NDArray,
+     data: NDArray[Any],
      names: list[str],
      is_categorical: list[bool],
      subset_mask: NDArray[np.bool_] | None = None,
- ) -> NDArray:
+ ) -> NDArray[np.float64]:
      """
-     Compute diversity for discrete/categorical variables and, through standard
+     Compute :term:`diversity<Diversity>` for discrete/categorical variables and, through standard
      histogram binning, for continuous variables.
 
      We define diversity as the inverse Simpson diversity index linearly rescaled to the unit interval.

@@ -139,16 +176,13 @@ def diversity_simpson(
      return ev_index
 
 
- DIVERSITY_FN_MAP = {"simpson": diversity_simpson, "shannon": diversity_shannon}
-
-
- @set_metadata("dataeval.metrics")
+ @set_metadata()
  def diversity(
      class_labels: ArrayLike, metadata: Mapping[str, ArrayLike], method: Literal["shannon", "simpson"] = "simpson"
  ) -> DiversityOutput:
      """
-     Compute diversity and classwise diversity for discrete/categorical variables and, through standard
-     histogram binning, for continuous variables.
+     Compute :term:`diversity<Diversity>` and classwise diversity for discrete/categorical variables and,
+     through standard histogram binning, for continuous variables.
 
      We define diversity as a normalized form of the inverse Simpson diversity index.
 

@@ -202,12 +236,12 @@ def diversity(
      --------
      numpy.histogram
      """
-     diversity_fn = get_method(DIVERSITY_FN_MAP, method)
+     diversity_fn = get_method({"simpson": diversity_simpson, "shannon": diversity_shannon}, method)
      data, names, is_categorical = preprocess_metadata(class_labels, metadata)
      diversity_index = diversity_fn(data, names, is_categorical, None).astype(np.float64)
 
      class_idx = names.index("class_label")
-     class_lbl = data[:, class_idx]
+     class_lbl = np.array(data[:, class_idx], dtype=int)
 
      u_classes = np.unique(class_lbl)
      num_factors = len(names)

@@ -218,4 +252,4 @@ def diversity(
          diversity[idx, :] = diversity_fn(data, names, is_categorical, subset_mask)
      div_no_class = np.concatenate((diversity[:, :class_idx], diversity[:, (class_idx + 1) :]), axis=1)
 
-     return DiversityOutput(diversity_index, div_no_class)
+     return DiversityOutput(diversity_index, div_no_class, class_lbl, list(metadata.keys()), method)
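
The new `class_list`, `metadata_names`, and `method` fields make `DiversityOutput` self-describing and feed the added `plot()` method. A minimal usage sketch based on the signatures above; the toy labels and metadata are hypothetical, and `diversity` is assumed to be re-exported from `dataeval.metrics.bias` per the `__init__.py` changes listed in this release:

```python
import numpy as np

from dataeval.metrics.bias import diversity

rng = np.random.default_rng(0)
class_labels = rng.integers(0, 2, size=100)            # two classes
metadata = {
    "weather": rng.choice(["rain", "sun"], size=100),  # categorical factor
    "distance": rng.normal(100.0, 25.0, size=100),     # continuous factor
}

result = diversity(class_labels, metadata, method="simpson")
print(result.diversity_index)  # per-factor diversity, including class_label
print(result.classwise)        # [n_class x n_factor] classwise diversity
result.plot()                  # new in 0.72.2: classwise diversity heatmap
```
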
dataeval/metrics/bias/metadata.py +275 -0

@@ -0,0 +1,275 @@
+ from __future__ import annotations
+
+ __all__ = []
+
+ from typing import Any, Mapping
+
+ import numpy as np
+ from numpy.typing import ArrayLike, NDArray
+ from scipy.stats import entropy as sp_entropy
+
+ from dataeval.interop import to_numpy
+
+
+ def get_counts(
+     data: NDArray[np.int_], names: list[str], is_categorical: list[bool], subset_mask: NDArray[np.bool_] | None = None
+ ) -> tuple[dict[str, NDArray[np.int_]], dict[str, NDArray[np.int_]]]:
+     """
+     Initialize dictionary of histogram counts --- treat categorical values
+     as histogram bins.
+
+     Parameters
+     ----------
+     subset_mask: NDArray[np.bool_] | None
+         Boolean mask of samples to bin (e.g. when computing per class). True -> include in histogram counts
+
+     Returns
+     -------
+     counts: Dict
+         Histogram counts per metadata factor in `factors`. Each
+         factor will have a different number of bins. Counts get reused
+         across metrics, so hist_counts are cached but only if computed
+         globally, i.e. without masked samples.
+     """
+
+     hist_counts, hist_bins = {}, {}
+     # np.where needed to satisfy linter
+     mask = np.where(subset_mask if subset_mask is not None else np.ones(data.shape[0], dtype=bool))
+
+     for cdx, fn in enumerate(names):
+         # linter doesn't like double indexing
+         col_data = data[mask, cdx].squeeze()
+         if is_categorical[cdx]:
+             # if discrete, use unique values as bins
+             bins, cnts = np.unique(col_data, return_counts=True)
+         else:
+             bins = hist_bins.get(fn, "auto")
+             cnts, bins = np.histogram(col_data, bins=bins, density=True)
+
+         hist_counts[fn] = cnts
+         hist_bins[fn] = bins
+
+     return hist_counts, hist_bins
+
+
+ def entropy(
+     data: NDArray[Any],
+     names: list[str],
+     is_categorical: list[bool],
+     normalized: bool = False,
+     subset_mask: NDArray[np.bool_] | None = None,
+ ) -> NDArray[np.float64]:
+     """
+     Meant for use with :term:`bias<Bias>` metrics, :term:`balance<Balance>`, :term:`diversity<Diversity>`,
+     Classwise Balance, and Classwise Diversity.
+
+     Compute entropy for discrete/categorical variables and for continuous variables through standard
+     histogram binning.
+
+     Parameters
+     ----------
+     normalized: bool
+         Flag that determines whether or not to normalize entropy by log(num_bins)
+     subset_mask: NDArray[np.bool_] | None
+         Boolean mask of samples to bin (e.g. when computing per class). True -> include in histogram counts
+
+     Note
+     ----
+     For continuous variables, histogram bins are chosen automatically. See
+     numpy.histogram for details.
+
+     Returns
+     -------
+     ent: NDArray[np.float64]
+         Entropy estimate per column of X
+
+     See Also
+     --------
+     numpy.histogram
+     scipy.stats.entropy
+     """
+
+     num_factors = len(names)
+     hist_counts, _ = get_counts(data, names, is_categorical, subset_mask)
+
+     ev_index = np.empty(num_factors)
+     for col, cnts in enumerate(hist_counts.values()):
+         # entropy in nats, normalizes counts
+         ev_index[col] = sp_entropy(cnts)
+         if normalized:
+             if len(cnts) == 1:
+                 # log(0)
+                 ev_index[col] = 0
+             else:
+                 ev_index[col] /= np.log(len(cnts))
+     return ev_index
+
+
+ def get_num_bins(
+     data: NDArray[Any], names: list[str], is_categorical: list[bool], subset_mask: NDArray[np.bool_] | None = None
+ ) -> NDArray[np.float64]:
+     """
+     Number of bins or unique values for each metadata factor, used to
+     normalize entropy/:term:`diversity<Diversity>`.
+
+     Parameters
+     ----------
+     subset_mask: NDArray[np.bool_] | None
+         Boolean mask of samples to bin (e.g. when computing per class). True -> include in histogram counts
+
+     Returns
+     -------
+     NDArray[np.float64]
+     """
+     # likely cached
+     hist_counts, _ = get_counts(data, names, is_categorical, subset_mask)
+     num_bins = np.empty(len(hist_counts))
+     for idx, cnts in enumerate(hist_counts.values()):
+         num_bins[idx] = len(cnts)
+
+     return num_bins
+
+
+ def infer_categorical(arr: NDArray[Any], threshold: float = 0.2) -> NDArray[Any]:
+     """
+     Compute fraction of feature values that are unique --- intended to be used
+     for inferring whether variables are categorical.
+     """
+     if arr.ndim == 1:
+         arr = np.expand_dims(arr, axis=1)
+     num_samples = arr.shape[0]
+     pct_unique = np.empty(arr.shape[1])
+     for col in range(arr.shape[1]):  # type: ignore
+         uvals = np.unique(arr[:, col], axis=0)
+         pct_unique[col] = len(uvals) / num_samples
+     return pct_unique < threshold
+
+
+ def preprocess_metadata(
+     class_labels: ArrayLike, metadata: Mapping[str, ArrayLike], cat_thresh: float = 0.2
+ ) -> tuple[NDArray[Any], list[str], list[bool]]:
+     # convert class_labels and dict of lists to matrix of metadata values
+     preprocessed_metadata = {"class_label": np.asarray(class_labels, dtype=int)}
+
+     # map columns of dict that are not numeric (e.g. string) to numeric values
+     # that mutual information and diversity functions can accommodate. Each
+     # unique string receives a unique integer value.
+     for k, v in metadata.items():
+         # if not numeric
+         v = to_numpy(v)
+         if not np.issubdtype(v.dtype, np.number):
+             _, mapped_vals = np.unique(v, return_inverse=True)
+             preprocessed_metadata[k] = mapped_vals
+         else:
+             preprocessed_metadata[k] = v
+
+     data = np.stack(list(preprocessed_metadata.values()), axis=-1)
+     names = list(preprocessed_metadata.keys())
+     is_categorical = [infer_categorical(preprocessed_metadata[var], cat_thresh)[0] for var in names]
+
+     return data, names, is_categorical
+
+
+ def heatmap(
+     data: NDArray[Any],
+     row_labels: NDArray[Any],
+     col_labels: NDArray[Any],
+     xlabel: str = "",
+     ylabel: str = "",
+     cbarlabel: str = "",
+ ) -> None:
+     """
+     Plots a formatted heatmap
+
+     Parameters
+     ----------
+     data: NDArray
+         Array containing numerical values for factors to plot
+     row_labels: NDArray
+         Array containing the labels for rows in the histogram
+     col_labels: NDArray
+         Array containing the labels for columns in the histogram
+     xlabel: str, default ""
+         X-axis label
+     ylabel: str, default ""
+         Y-axis label
+     cbarlabel: str, default ""
+         Label for the colorbar
+
+     """
+     import matplotlib
+     import matplotlib.pyplot as plt
+
+     fig, ax = plt.subplots(figsize=(10, 10))
+
+     # Plot the heatmap
+     im = ax.imshow(data, vmin=0, vmax=1.0)
+
+     # Create colorbar
+     cbar = fig.colorbar(im, shrink=0.5)
+     cbar.set_ticks([0.0, 0.25, 0.5, 0.75, 1.0])
+     cbar.set_ticklabels(["0.0", "0.25", "0.5", "0.75", "1.0"])
+     cbar.set_label(cbarlabel, loc="center")
+
+     # Show all ticks and label them with the respective list entries.
+     ax.set_xticks(np.arange(data.shape[1]), labels=col_labels)
+     ax.set_yticks(np.arange(data.shape[0]), labels=row_labels)
+
+     ax.tick_params(top=False, bottom=True, labeltop=False, labelbottom=True)
+     # Rotate the tick labels and set their alignment.
+     plt.setp(ax.get_xticklabels(), rotation=45, ha="right", rotation_mode="anchor")
+
+     # Turn spines off and create white grid.
+     ax.spines[:].set_visible(False)
+
+     ax.set_xticks(np.arange(data.shape[1] + 1) - 0.5, minor=True)
+     ax.set_yticks(np.arange(data.shape[0] + 1) - 0.5, minor=True)
+     ax.grid(which="minor", color="w", linestyle="-", linewidth=3)
+     ax.tick_params(which="minor", bottom=False, left=False)
+
+     if xlabel:
+         ax.set_xlabel(xlabel)
+     if ylabel:
+         ax.set_ylabel(ylabel)
+
+     valfmt = matplotlib.ticker.FuncFormatter(format_text)  # type: ignore
+
+     # Normalize the threshold to the images color range.
+     threshold = im.norm(1.0) / 2.0
+
+     # Set default alignment to center, but allow it to be
+     # overwritten by textkw.
+     kw = {"horizontalalignment": "center", "verticalalignment": "center"}
+
+     # Loop over the data and create a `Text` for each "pixel".
+     # Change the text's color depending on the data.
+     textcolors = ("white", "black")
+     texts = []
+     for i in range(data.shape[0]):
+         for j in range(data.shape[1]):
+             kw.update(color=textcolors[int(im.norm(data[i, j]) > threshold)])
+             text = im.axes.text(j, i, valfmt(data[i, j], None), **kw)  # type: ignore
+             texts.append(text)
+
+     fig.tight_layout()
+     plt.show()
+
+
+ # Function to define how the text is displayed in the heatmap
+ def format_text(*args: str) -> str:
+     """
+     Helper function to format text for heatmap()
+
+     Parameters
+     ----------
+     *args: Tuple (str, str)
+         Text to be formatted. Second element is ignored, but is a
+         mandatory pass-through argument as per matplotlib.ticker.FuncFormatter
+
+     Returns
+     -------
+     str
+         Formatted text
+     """
+     x = args[0]
+     return f"{x:.2f}".replace("0.00", "0").replace("0.", ".").replace("nan", "")
dataeval/{_internal/metrics → metrics/bias}/parity.py +21 -17

@@ -1,15 +1,17 @@
  from __future__ import annotations
 
+ __all__ = ["ParityOutput", "parity", "label_parity"]
+
  import warnings
  from dataclasses import dataclass
- from typing import Generic, Mapping, TypeVar
+ from typing import Any, Generic, Mapping, TypeVar
 
  import numpy as np
  from numpy.typing import ArrayLike, NDArray
  from scipy.stats import chi2_contingency, chisquare
 
- from dataeval._internal.interop import to_numpy
- from dataeval._internal.output import OutputMetadata, set_metadata
+ from dataeval.interop import to_numpy
+ from dataeval.output import OutputMetadata, set_metadata
 
  TData = TypeVar("TData", np.float64, NDArray[np.float64])
 

@@ -17,7 +19,7 @@ TData = TypeVar("TData", np.float64, NDArray[np.float64])
  @dataclass(frozen=True)
  class ParityOutput(Generic[TData], OutputMetadata):
      """
-     Output class for :func:`parity` and :func:`label_parity` bias metrics
+     Output class for :func:`parity` and :func:`label_parity` :term:`bias<Bias>` metrics
 
      Attributes
      ----------

@@ -31,7 +33,7 @@ class ParityOutput(Generic[TData], OutputMetadata):
      p_value: TData
 
 
- def digitize_factor_bins(continuous_values: NDArray, bins: int, factor_name: str) -> NDArray:
+ def digitize_factor_bins(continuous_values: NDArray[Any], bins: int, factor_name: str) -> NDArray[np.intp]:
      """
      Digitizes a list of values into a given number of bins.
 

@@ -64,8 +66,8 @@ def digitize_factor_bins(continuous_values: NDArray, bins: int, factor_name: str
 
 
  def format_discretize_factors(
-     data_factors: Mapping[str, NDArray], continuous_factor_bincounts: Mapping[str, int]
- ) -> dict[str, NDArray]:
+     data_factors: Mapping[str, NDArray[Any]], continuous_factor_bincounts: Mapping[str, int]
+ ) -> dict[str, NDArray[Any]]:
      """
      Sets up the internal list of metadata factors.
 

@@ -115,7 +117,7 @@ def format_discretize_factors(
      return metadata_factors
 
 
- def normalize_expected_dist(expected_dist: NDArray, observed_dist: NDArray) -> NDArray:
+ def normalize_expected_dist(expected_dist: NDArray[Any], observed_dist: NDArray[Any]) -> NDArray[Any]:
      """
      Normalize the expected label distribution to match the total number of labels in the observed distribution.
 

@@ -162,7 +164,7 @@ def normalize_expected_dist(expected_dist: NDArray, observed_dist: NDArray) -> N
      return expected_dist
 
 
- def validate_dist(label_dist: NDArray, label_name: str):
+ def validate_dist(label_dist: NDArray[Any], label_name: str) -> None:
      """
      Verifies that the given label distribution has labels and checks if
      any labels have frequencies less than 5.

@@ -191,14 +193,15 @@ def validate_dist(label_dist: NDArray, label_name: str):
          )
 
 
- @set_metadata("dataeval.metrics")
+ @set_metadata()
  def label_parity(
      expected_labels: ArrayLike,
      observed_labels: ArrayLike,
      num_classes: int | None = None,
  ) -> ParityOutput[np.float64]:
      """
-     Calculate the chi-square statistic to assess the parity between expected and observed label distributions.
+     Calculate the chi-square statistic to assess the :term:`parity<Parity>` between expected and
+     observed label distributions.
 
      This function computes the frequency distribution of classes in both expected and observed labels, normalizes
      the expected distribution to match the total number of observed labels, and then calculates the chi-square

@@ -217,7 +220,7 @@ def label_parity(
      Returns
      -------
      ParityOutput[np.float64]
-         chi-squared score and p-value of the test
+         chi-squared score and :term:`P-Value` of the test
 
      Raises
      ------

@@ -231,8 +234,8 @@ def label_parity(
      - Providing ``num_classes`` can be helpful if there are classes with zero instances in one of the distributions.
      - The function first validates the observed distribution and normalizes the expected distribution so that it
        has the same total number of labels as the observed distribution.
-     - It then performs a chi-square test to determine if there is a statistically significant difference between
-       the observed and expected label distributions.
+     - It then performs a :term:`Chi-Square Test of Independence` to determine if there is a statistically significant
+       difference between the observed and expected label distributions.
      - This function acts as an interface to the scipy.stats.chisquare method, which is documented at
        https://docs.scipy.org/doc/scipy/reference/generated/scipy.stats.chisquare.html
 

@@ -278,14 +281,15 @@ def label_parity(
      return ParityOutput(cs, p)
 
 
- @set_metadata("dataeval.metrics")
+ @set_metadata()
  def parity(
      class_labels: ArrayLike,
      data_factors: Mapping[str, ArrayLike],
      continuous_factor_bincounts: Mapping[str, int] | None = None,
  ) -> ParityOutput[NDArray[np.float64]]:
      """
-     Calculate chi-square statistics to assess the relationship between multiple factors and class labels.
+     Calculate chi-square statistics to assess the relationship between multiple factors
+     and class labels.
 
      This function computes the chi-square statistic for each metadata factor to determine if there is
      a significant relationship between the factor values and class labels. The function handles both categorical

@@ -308,7 +312,7 @@ def parity(
      -------
      ParityOutput[NDArray[np.float64]]
          Arrays of length (num_factors) whose (i)th element corresponds to the
-         chi-square score and p-value for the relationship between factor i and
+         chi-square score and :term:`p-value<P-Value>` for the relationship between factor i and
          the class labels in the dataset.
 
      Raises
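
Beyond the glossary-linked docstrings, the functional changes to `parity.py` are the module move, the explicit `__all__`, and the bare `@set_metadata()` decorator; the calling convention is unchanged. A brief sketch with hypothetical label arrays (`ParityOutput.score` is assumed to accompany the `p_value` field shown above, matching the `ParityOutput(cs, p)` constructor call, and `label_parity` is assumed to be re-exported from `dataeval.metrics.bias`):

```python
import numpy as np

from dataeval.metrics.bias import label_parity

rng = np.random.default_rng(0)
expected = rng.integers(0, 3, size=300)  # reference label distribution
observed = rng.integers(0, 3, size=300)  # labels observed in the dataset under test

output = label_parity(expected, observed, num_classes=3)
print(output.score, output.p_value)  # chi-squared statistic and p-value
```
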
dataeval/metrics/estimators/__init__.py +3 -3

@@ -2,8 +2,8 @@
  Estimators calculate performance bounds and the statistical distance between datasets.
  """
 
- from dataeval._internal.metrics.ber import BEROutput, ber
- from dataeval._internal.metrics.divergence import DivergenceOutput, divergence
- from dataeval._internal.metrics.uap import UAPOutput, uap
+ from dataeval.metrics.estimators.ber import BEROutput, ber
+ from dataeval.metrics.estimators.divergence import DivergenceOutput, divergence
+ from dataeval.metrics.estimators.uap import UAPOutput, uap
 
  __all__ = ["ber", "divergence", "uap", "BEROutput", "DivergenceOutput", "UAPOutput"]