PyPI - dataeval - Versions diffs - 0.82.0__py3-none-any.whl → 0.82.1__py3-none-any.whl - Mend

dataeval 0.82.0__py3-none-any.whl → 0.82.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (37) hide show

dataeval/__init__.py +1 -1
dataeval/config.py +68 -11
dataeval/detectors/drift/_mmd.py +9 -9
dataeval/detectors/drift/_torch.py +7 -7
dataeval/detectors/drift/_uncertainty.py +4 -4
dataeval/detectors/linters/duplicates.py +3 -3
dataeval/detectors/linters/outliers.py +3 -3
dataeval/detectors/ood/ae.py +5 -4
dataeval/detectors/ood/base.py +2 -2
dataeval/detectors/ood/metadata_ood_mi.py +4 -6
dataeval/detectors/ood/mixin.py +1 -1
dataeval/detectors/ood/vae.py +2 -1
dataeval/metadata/_distance.py +11 -44
dataeval/metadata/_ood.py +9 -7
dataeval/metrics/bias/_balance.py +7 -3
dataeval/metrics/bias/_diversity.py +3 -0
dataeval/metrics/bias/_parity.py +2 -0
dataeval/metrics/stats/_base.py +3 -3
dataeval/metrics/stats/_boxratiostats.py +1 -1
dataeval/metrics/stats/_imagestats.py +4 -4
dataeval/outputs/__init__.py +4 -0
dataeval/outputs/_base.py +50 -21
dataeval/outputs/_bias.py +1 -1
dataeval/outputs/_linters.py +4 -2
dataeval/outputs/_metadata.py +54 -0
dataeval/outputs/_stats.py +12 -6
dataeval/utils/data/_embeddings.py +8 -9
dataeval/utils/data/_metadata.py +16 -7
dataeval/utils/data/_selection.py +4 -8
dataeval/utils/data/_split.py +3 -2
dataeval/utils/data/selections/_classfilter.py +5 -3
dataeval/utils/torch/_internal.py +5 -5
dataeval/utils/torch/trainer.py +8 -8
{dataeval-0.82.0.dist-info → dataeval-0.82.1.dist-info}/METADATA +1 -1
{dataeval-0.82.0.dist-info → dataeval-0.82.1.dist-info}/RECORD +37 -36
{dataeval-0.82.0.dist-info → dataeval-0.82.1.dist-info}/LICENSE.txt +0 -0
{dataeval-0.82.0.dist-info → dataeval-0.82.1.dist-info}/WHEEL +0 -0

dataeval/__init__.py CHANGED Viewed

@@ -8,7 +8,7 @@ shifts that impact performance of deployed models.
 from __future__ import annotations
 __all__ = ["config", "detectors", "log", "metrics", "typing", "utils", "workflows"]
-__version__ = "0.82.0"
+__version__ = "0.82.1"
 import logging

dataeval/config.py CHANGED Viewed

@@ -4,36 +4,61 @@ Global configuration settings for DataEval.
 from __future__ import annotations
-__all__ = ["get_device", "set_device", "get_max_processes", "set_max_processes"]
+__all__ = ["get_device", "set_device", "get_max_processes", "set_max_processes", "DeviceLike"]
+import sys
+from typing import Union
+if sys.version_info >= (3, 10):
+    from typing import TypeAlias
+else:
+    from typing_extensions import TypeAlias
+import numpy as np
 import torch
-from torch import device
-_device: device | None = None
+_device: torch.device | None = None
 _processes: int | None = None
+_seed: int | None = None
+DeviceLike: TypeAlias = Union[int, str, tuple[str, int], torch.device]
+"""
+Type alias for types that are acceptable for specifying a torch.device.
+See Also
+--------
+`torch.device <https://pytorch.org/docs/stable/tensor_attributes.html#torch.device>`_
+"""
+def _todevice(device: DeviceLike) -> torch.device:
+    return torch.device(*device) if isinstance(device, tuple) else torch.device(device)
-def set_device(device: str | device | int) -> None:
+def set_device(device: DeviceLike) -> None:
     """
     Sets the default device to use when executing against a PyTorch backend.
     Parameters
     ----------
-    device : str or int or `torch.device`
-        The default device to use. See `torch.device <https://pytorch.org/docs/stable/tensor_attributes.html#torch.device>`_
-        documentation for more information.
+    device : DeviceLike
+        The default device to use. See documentation for more information.
+    See Also
+    --------
+    `torch.device <https://pytorch.org/docs/stable/tensor_attributes.html#torch.device>`_
     """
     global _device
-    _device = torch.device(device)
+    _device = _todevice(device)
-def get_device(override: str | device | int | None = None) -> torch.device:
+def get_device(override: DeviceLike | None = None) -> torch.device:
     """
     Returns the PyTorch device to use.
     Parameters
     ----------
-    override : str or int or `torch.device` or None, default None
+    override : DeviceLike or None, default None
         The user specified override if provided, otherwise returns the default device.
     Returns
@@ -44,7 +69,7 @@ def get_device(override: str | device | int | None = None) -> torch.device:
         global _device
         return torch.get_default_device() if _device is None else _device
     else:
-        return torch.device(override)
+        return _todevice(override)
 def set_max_processes(processes: int | None) -> None:
@@ -75,3 +100,35 @@ def get_max_processes() -> int | None:
     """
     global _processes
     return _processes
+def set_seed(seed: int | None, all_generators: bool = False) -> None:
+    """
+    Sets the seed for use by classes that allow for a random state or seed.
+    Parameters
+    ----------
+    seed : int or None
+        The seed to use.
+    all_generators : bool, default False
+        Whether to set the seed for all generators, including NumPy and PyTorch.
+    """
+    global _seed
+    _seed = seed
+    if all_generators:
+        np.random.seed(seed)
+        torch.manual_seed(seed)
+def get_seed() -> int | None:
+    """
+    Returns the seed for random state or seed.
+    Returns
+    -------
+    int or None
+        The seed to use.
+    """
+    global _seed
+    return _seed

dataeval/detectors/drift/_mmd.py CHANGED Viewed

@@ -14,7 +14,7 @@ from typing import Callable
 import torch
-from dataeval.config import get_device
+from dataeval.config import DeviceLike, get_device
 from dataeval.detectors.drift._base import BaseDrift, UpdateStrategy, preprocess_x, update_x_ref
 from dataeval.detectors.drift._torch import GaussianRBF, mmd2_from_kernel_matrix
 from dataeval.outputs import DriftMMDOutput
@@ -31,7 +31,7 @@ class DriftMMD(BaseDrift):
     ----------
     x_ref : ArrayLike
         Data used as reference distribution.
-    p_val : float | None, default 0.05
+    p_val : float or None, default 0.05
         :term:`P-value` used for significance of the statistical test for each feature.
         If the FDR correction method is used, this corresponds to the acceptable
         q-value.
@@ -39,14 +39,14 @@ class DriftMMD(BaseDrift):
         Whether the given reference data ``x_ref`` has been preprocessed yet.
         If ``True``, only the test data ``x`` will be preprocessed at prediction time.
         If ``False``, the reference data will also be preprocessed.
-    update_x_ref : UpdateStrategy | None, default None
+    update_x_ref : UpdateStrategy or None, default None
         Reference data can optionally be updated using an UpdateStrategy class. Update
         using the last n instances seen by the detector with LastSeenUpdateStrategy
         or via reservoir sampling with ReservoirSamplingUpdateStrategy.
-    preprocess_fn : Callable | None, default None
+    preprocess_fn : Callable or None, default None
         Function to preprocess the data before computing the data drift metrics.
         Typically a :term:`dimensionality reduction<Dimensionality Reduction>` technique.
-    sigma : ArrayLike | None, default None
+    sigma : ArrayLike or None, default None
         Optionally set the internal GaussianRBF kernel bandwidth. Can also pass multiple
         bandwidth values as an array. The kernel evaluation is then averaged over
         those bandwidths.
@@ -54,9 +54,9 @@ class DriftMMD(BaseDrift):
         Whether to already configure the kernel bandwidth from the reference data.
     n_permutations : int, default 100
         Number of permutations used in the permutation test.
-    device : str | None, default None
-        Device type used. The default None uses the GPU and falls back on CPU.
-        Can be specified by passing either 'cuda', 'gpu' or 'cpu'.
+    device : DeviceLike or None, default None
+        The hardware device to use if specified, otherwise uses the DataEval
+        default or torch default.
     Example
     -------
@@ -84,7 +84,7 @@ class DriftMMD(BaseDrift):
         sigma: ArrayLike | None = None,
         configure_kernel_from_x_ref: bool = True,
         n_permutations: int = 100,
-        device: str | torch.device | None = None,
+        device: DeviceLike | None = None,
     ) -> None:
         super().__init__(x_ref, p_val, x_ref_preprocessed, update_x_ref, preprocess_fn)

dataeval/detectors/drift/_torch.py CHANGED Viewed

@@ -17,7 +17,7 @@ import torch
 import torch.nn as nn
 from numpy.typing import NDArray
-from dataeval.config import get_device
+from dataeval.config import DeviceLike, get_device
 from dataeval.utils.torch._internal import predict_batch
@@ -59,7 +59,7 @@ def mmd2_from_kernel_matrix(
 def preprocess_drift(
     x: NDArray[Any],
     model: nn.Module,
-    device: str | torch.device | None = None,
+    device: DeviceLike | None = None,
     preprocess_batch_fn: Callable | None = None,
     batch_size: int = int(1e10),
     dtype: type[np.generic] | torch.dtype = np.float32,
@@ -73,15 +73,15 @@ def preprocess_drift(
         Batch of instances.
     model : nn.Module
         Model used for preprocessing.
-    device : torch.device | None, default None
-        Device type used. The default None tries to use the GPU and falls back on CPU.
-        Can be specified by passing either torch.device('cuda') or torch.device('cpu').
-    preprocess_batch_fn : Callable | None, default None
+    device : DeviceLike or None, default None
+        The hardware device to use if specified, otherwise uses the DataEval
+        default or torch default.
+    preprocess_batch_fn : Callable or None, default None
         Optional batch preprocessing function. For example to convert a list of objects
         to a batch which can be processed by the PyTorch model.
     batch_size : int, default 1e10
         Batch size used during prediction.
-    dtype : np.dtype | torch.dtype, default np.float32
+    dtype : np.dtype or torch.dtype, default np.float32
         Model output type, either a :term:`NumPy` or torch dtype, e.g. np.float32 or torch.float32.
     Returns

dataeval/detectors/drift/_uncertainty.py CHANGED Viewed

@@ -85,20 +85,20 @@ class DriftUncertainty:
         Whether the given reference data ``x_ref`` has been preprocessed yet.
         If ``True``, only the test data ``x`` will be preprocessed at prediction time.
         If ``False``, the reference data will also be preprocessed.
-    update_x_ref : UpdateStrategy | None, default None
+    update_x_ref : UpdateStrategy or None, default None
         Reference data can optionally be updated using an UpdateStrategy class. Update
         using the last n instances seen by the detector with LastSeenUpdateStrategy
         or via reservoir sampling with ReservoirSamplingUpdateStrategy.
-    preds_type : "probs" | "logits", default "probs"
+    preds_type : "probs" or "logits", default "probs"
         Type of prediction output by the model. Options are 'probs' (in [0,1]) or
         'logits' (in [-inf,inf]).
     batch_size : int, default 32
         Batch size used to evaluate model. Only relevant when backend has been
         specified for batch prediction.
-    preprocess_batch_fn : Callable | None, default None
+    preprocess_batch_fn : Callable or None, default None
         Optional batch preprocessing function. For example to convert a list of
         objects to a batch which can be processed by the model.
-    device : str | None, default None
+    device : DeviceLike or None, default None
         Device type used. The default None tries to use the GPU and falls back on
         CPU if needed. Can be specified by passing either 'cuda' or 'cpu'.

dataeval/detectors/linters/duplicates.py CHANGED Viewed

@@ -88,13 +88,13 @@ class Duplicates:
         """
         if isinstance(hashes, HashStatsOutput):
-            return DuplicatesOutput(**self._get_duplicates(hashes.dict()))
+            return DuplicatesOutput(**self._get_duplicates(hashes.data()))
         if not isinstance(hashes, Sequence):
             raise TypeError("Invalid stats output type; only use output from hashstats.")
         combined, dataset_steps = combine_stats(hashes)
-        duplicates = self._get_duplicates(combined.dict())
+        duplicates = self._get_duplicates(combined.data())
         # split up results from combined dataset into individual dataset buckets
         for dup_type, dup_list in duplicates.items():
@@ -136,5 +136,5 @@ class Duplicates:
         """  # noqa: E501
         images = Images(data) if isinstance(data, Dataset) else data
         self.stats = hashstats(images)
-        duplicates = self._get_duplicates(self.stats.dict())
+        duplicates = self._get_duplicates(self.stats.data())
         return DuplicatesOutput(**duplicates)

dataeval/detectors/linters/outliers.py CHANGED Viewed

@@ -169,7 +169,7 @@ class Outliers:
         {}
         """  # noqa: E501
         if isinstance(stats, (ImageStatsOutput, DimensionStatsOutput, PixelStatsOutput, VisualStatsOutput)):
-            return OutliersOutput(self._get_outliers(stats.dict()))
+            return OutliersOutput(self._get_outliers(stats.data()))
         if not isinstance(stats, Sequence):
             raise TypeError(
@@ -189,7 +189,7 @@ class Outliers:
         output_list: list[dict[int, dict[str, float]]] = [{} for _ in stats]
         for _, indices in stats_map.items():
             substats, dataset_steps = combine_stats([stats[i] for i in indices])
-            outliers = self._get_outliers(substats.dict())
+            outliers = self._get_outliers(substats.data())
             for idx, issue in outliers.items():
                 k, v = get_dataset_step_from_idx(idx, dataset_steps)
                 output_list[indices[k]][v] = issue
@@ -225,5 +225,5 @@ class Outliers:
         """
         images = Images(data) if isinstance(data, Dataset) else data
         self.stats = imagestats(images)
-        outliers = self._get_outliers(self.stats.dict())
+        outliers = self._get_outliers(self.stats.data())
         return OutliersOutput(outliers)

dataeval/detectors/ood/ae.py CHANGED Viewed

@@ -18,6 +18,7 @@ import numpy as np
 import torch
 from numpy.typing import NDArray
+from dataeval.config import DeviceLike
 from dataeval.detectors.ood.base import OODBase
 from dataeval.outputs import OODScoreOutput
 from dataeval.typing import ArrayLike
@@ -33,9 +34,9 @@ class OOD_AE(OODBase):
     model : torch.nn.Module
         An autoencoder model to use for encoding and reconstruction of images
         for detection of out-of-distribution samples.
-    device : str or torch.Device or None, default None
-        The device to use for the detector. None will default to the global
-        configuration selection if set, otherwise "cuda" then "cpu" by availability.
+    device : DeviceLike or None, default None
+        The hardware device to use if specified, otherwise uses the DataEval
+        default or torch default.
     Example
     -------
@@ -57,7 +58,7 @@ class OOD_AE(OODBase):
     array([ True,  True, False,  True,  True,  True,  True,  True])
     """
-    def __init__(self, model: torch.nn.Module, device: str | torch.device | None = None) -> None:
+    def __init__(self, model: torch.nn.Module, device: DeviceLike | None = None) -> None:
         super().__init__(model, device)
     def fit(

dataeval/detectors/ood/base.py CHANGED Viewed

@@ -14,7 +14,7 @@ from typing import Callable, cast
 import torch
-from dataeval.config import get_device
+from dataeval.config import DeviceLike, get_device
 from dataeval.detectors.ood.mixin import OODBaseMixin, OODFitMixin, OODGMMMixin
 from dataeval.typing import ArrayLike
 from dataeval.utils._array import to_numpy
@@ -23,7 +23,7 @@ from dataeval.utils.torch._internal import trainer
 class OODBase(OODBaseMixin[torch.nn.Module], OODFitMixin[Callable[..., torch.nn.Module], torch.optim.Optimizer]):
-    def __init__(self, model: torch.nn.Module, device: str | torch.device | None = None) -> None:
+    def __init__(self, model: torch.nn.Module, device: DeviceLike | None = None) -> None:
         self.device: torch.device = get_device(device)
         super().__init__(model)

dataeval/detectors/ood/metadata_ood_mi.py CHANGED Viewed

@@ -10,6 +10,8 @@ import numpy as np
 from numpy.typing import NDArray
 from sklearn.feature_selection import mutual_info_classif
+from dataeval.config import get_seed
 # NATS2BITS is the reciprocal of natural log of 2. If you have an information/entropy-type quantity measured in nats,
 #   which is what many library functions return, multiply it by NATS2BITS to get it in bits.
 NATS2BITS = 1.442695
@@ -19,7 +21,6 @@ def get_metadata_ood_mi(
     metadata: dict[str, list[Any] | NDArray[Any]],
     is_ood: NDArray[np.bool_],
     discrete_features: str | bool | NDArray[np.bool_] = False,
-    random_state: int | None = None,
 ) -> dict[str, float]:
     """Computes mutual information between a set of metadata features and an out-of-distribution flag.
@@ -39,9 +40,6 @@ def get_metadata_ood_mi(
         A boolean array, with one value per example, that indicates which examples are OOD.
     discrete_features : str | bool | NDArray[np.bool_]
         Either a boolean array or a single boolean value, indicate which features take on discrete values.
-    random_state : int, optional - default None
-        Determines random number generation for small noise added to continuous variables. Set to a value for
-        reproducible results.
     Returns
     -------
@@ -55,7 +53,7 @@ def get_metadata_ood_mi(
     >>> metadata = {"time": np.linspace(0, 10, 100), "altitude": np.linspace(0, 16, 100) ** 2}
     >>> is_ood = metadata["altitude"] > 100
-    >>> get_metadata_ood_mi(metadata, is_ood, discrete_features=False, random_state=0)
+    >>> get_metadata_ood_mi(metadata, is_ood, discrete_features=False)
     {'time': 0.9359596758173668, 'altitude': 0.9407686591507002}
     """
     numerical_keys = [k for k, v in metadata.items() if all(isinstance(vi, numbers.Number) for vi in v)]
@@ -84,7 +82,7 @@ def get_metadata_ood_mi(
             Xscl,
             is_ood,
             discrete_features=discrete_features,  # type: ignore
-            random_state=random_state,
+            random_state=get_seed(),
         )
         * NATS2BITS
     )

dataeval/detectors/ood/mixin.py CHANGED Viewed

@@ -157,4 +157,4 @@ class OODBaseMixin(Generic[TModel], ABC):
         # compute outlier scores
         score = self.score(X, batch_size=batch_size)
         ood_pred = score.get(ood_type) > self._threshold_score(ood_type)
-        return OODOutput(is_ood=ood_pred, **score.dict())
+        return OODOutput(is_ood=ood_pred, **score.data())

dataeval/detectors/ood/vae.py CHANGED Viewed

@@ -17,6 +17,7 @@ from typing import Callable
 import numpy as np
 import torch
+from dataeval.config import DeviceLike
 from dataeval.detectors.ood.base import OODBase
 from dataeval.outputs import OODScoreOutput
 from dataeval.typing import ArrayLike
@@ -34,7 +35,7 @@ class OOD_VAE(OODBase):
         An Autoencoder model.
     """
-    def __init__(self, model: torch.nn.Module, device: str | torch.device | None = None) -> None:
+    def __init__(self, model: torch.nn.Module, device: DeviceLike | None = None) -> None:
         super().__init__(model, device)
     def fit(

dataeval/metadata/_distance.py CHANGED Viewed

@@ -10,7 +10,8 @@ from scipy.stats import iqr, ks_2samp
 from scipy.stats import wasserstein_distance as emd
 from dataeval.metadata._utils import _compare_keys, _validate_factors_and_data
-from dataeval.outputs._base import MappingOutput
+from dataeval.outputs import MetadataDistanceOutput, MetadataDistanceValues
+from dataeval.outputs._base import set_metadata
 from dataeval.typing import ArrayLike
 from dataeval.utils.data import Metadata
@@ -23,41 +24,6 @@ class KSType(NamedTuple):
     pvalue: float
-class MetadataKSResult(NamedTuple):
-    """
-    Attributes
-    ----------
-    statistic : float
-        the KS statistic
-    location : float
-        The value at which the KS statistic has its maximum, measured in IQR-normalized units relative
-        to the median of the reference distribution.
-    dist : float
-        The Earth Mover's Distance normalized by the interquartile range (IQR) of the reference
-    pvalue : float
-        The p-value from the KS two-sample test
-    """
-    statistic: float
-    location: float
-    dist: float
-    pvalue: float
-class KSOutput(MappingOutput[str, MetadataKSResult]):
-    """
-    Output class for results of ks_2samp featurewise comparisons of new metadata to reference metadata.
-    Attributes
-    ----------
-    key: str
-        Metadata feature names
-    value: :class:`MetadataKSResult`
-        Output per feature name containing the statistic, statistic location, distance, and pvalue.
-    """
 def _calculate_drift(x1: ArrayLike, x2: ArrayLike) -> float:
     """Calculates the shift magnitude between x1 and x2 scaled by x1"""
@@ -74,7 +40,8 @@ def _calculate_drift(x1: ArrayLike, x2: ArrayLike) -> float:
     return distance if xmin == xmax else distance / (xmax - xmin)
-def metadata_distance(metadata1: Metadata, metadata2: Metadata) -> KSOutput:
+@set_metadata
+def metadata_distance(metadata1: Metadata, metadata2: Metadata) -> MetadataDistanceOutput:
     """
     Measures the feature-wise distance between two continuous metadata distributions and
     computes a p-value to evaluate its significance.
@@ -90,8 +57,8 @@ def metadata_distance(metadata1: Metadata, metadata2: Metadata) -> KSOutput:
     Returns
     -------
-    dict[str, KstestResult]
-        A dictionary with keys corresponding to metadata feature names, and values that are KstestResult objects, as
+    MetadataDistanceOutput
+        A mapping with keys corresponding to metadata feature names, and values that are KstestResult objects, as
         defined by scipy.stats.ks_2samp.
     See Also
@@ -110,7 +77,7 @@ def metadata_distance(metadata1: Metadata, metadata2: Metadata) -> KSOutput:
     >>> list(output)
     ['time', 'altitude']
     >>> output["time"]
-    MetadataKSResult(statistic=1.0, location=0.44354838709677413, dist=2.7, pvalue=0.0)
+    MetadataDistanceValues(statistic=1.0, location=0.44354838709677413, dist=2.7, pvalue=0.0)
     """
     _compare_keys(metadata1.continuous_factor_names, metadata2.continuous_factor_names)
@@ -134,7 +101,7 @@ def metadata_distance(metadata1: Metadata, metadata2: Metadata) -> KSOutput:
         )
     # Set default for statistic, location, and magnitude to zero and pvalue to one
-    results: dict[str, MetadataKSResult] = {}
+    results: dict[str, MetadataDistanceValues] = {}
     # Per factor
     for i, fname in enumerate(fnames):
@@ -147,7 +114,7 @@ def metadata_distance(metadata1: Metadata, metadata2: Metadata) -> KSOutput:
         # Default case
         if xmin == xmax:
-            results[fname] = MetadataKSResult(statistic=0.0, location=0.0, dist=0.0, pvalue=1.0)
+            results[fname] = MetadataDistanceValues(statistic=0.0, location=0.0, dist=0.0, pvalue=1.0)
             continue
         ks_result = cast(KSType, ks_2samp(fdata1, fdata2, method="asymp"))
@@ -157,11 +124,11 @@ def metadata_distance(metadata1: Metadata, metadata2: Metadata) -> KSOutput:
         drift = _calculate_drift(fdata1, fdata2)
-        results[fname] = MetadataKSResult(
+        results[fname] = MetadataDistanceValues(
             statistic=ks_result.statistic,
             location=loc,
             dist=drift,
             pvalue=ks_result.pvalue,
         )
-    return KSOutput(results)
+    return MetadataDistanceOutput(results)

dataeval/metadata/_ood.py CHANGED Viewed

@@ -8,7 +8,8 @@ import numpy as np
 from numpy.typing import NDArray
 from dataeval.metadata._utils import _compare_keys, _validate_factors_and_data
-from dataeval.outputs import OODOutput
+from dataeval.outputs import MostDeviatedFactorsOutput, OODOutput
+from dataeval.outputs._base import set_metadata
 from dataeval.utils.data import Metadata
@@ -119,11 +120,12 @@ def _calc_median_deviations(reference: NDArray, test: NDArray) -> NDArray:
     return np.abs(np.where(test_dev >= 0, test_dev / pscale, test_dev / nscale))  # (S_t, F)
+@set_metadata
 def most_deviated_factors(
     metadata_1: Metadata,
     metadata_2: Metadata,
     ood: OODOutput,
-) -> list[tuple[str, float]]:
+) -> MostDeviatedFactorsOutput:
     """
     Determines greatest deviation in metadata features per out of distribution sample in metadata_2.
@@ -159,20 +161,20 @@ def most_deviated_factors(
     >>> is_ood = OODOutput(np.array([True, True, True]), np.array([]), np.array([]))
     >>> most_deviated_factors(metadata1, metadata2, is_ood)
-    [('time', 2.0), ('time', 2.592), ('time', 3.51)]
+    MostDeviatedFactorsOutput([('time', 2.0), ('time', 2.592), ('time', 3.51)])
     If there are no out-of-distribution samples, a list is returned
     >>> is_ood = OODOutput(np.array([False, False, False]), np.array([]), np.array([]))
     >>> most_deviated_factors(metadata1, metadata2, is_ood)
-    []
+    MostDeviatedFactorsOutput([])
     """
     ood_mask: NDArray[np.bool] = ood.is_ood
     # No metadata correlated with out of distribution data
     if not any(ood_mask):
-        return []
+        return MostDeviatedFactorsOutput([])
     # Combines reference and test factor names and data if exists and match exactly
     # shape -> (samples, factors)
@@ -190,7 +192,7 @@ def most_deviated_factors(
             f"At least 3 reference metadata samples are needed, got {len(metadata_ref)}",
             UserWarning,
         )
-        return []
+        return MostDeviatedFactorsOutput([])
     if len(metadata_tst) != len(ood_mask):
         raise ValueError(
@@ -214,4 +216,4 @@ def most_deviated_factors(
     # List of tuples matching the factor name with its deviation
-    return [(factor, dev) for factor, dev in zip(most_ood_factors, deviation)]
+    return MostDeviatedFactorsOutput([(factor, dev) for factor, dev in zip(most_ood_factors, deviation)])

dataeval/metrics/bias/_balance.py CHANGED Viewed

@@ -8,6 +8,7 @@ import numpy as np
 import scipy as sp
 from sklearn.feature_selection import mutual_info_classif, mutual_info_regression
+from dataeval.config import get_seed
 from dataeval.outputs import BalanceOutput
 from dataeval.outputs._base import set_metadata
 from dataeval.utils._bin import get_counts
@@ -91,6 +92,9 @@ def balance(
     sklearn.feature_selection.mutual_info_regression
     sklearn.metrics.mutual_info_score
     """
+    if not metadata.discrete_factor_names and not metadata.continuous_factor_names:
+        raise ValueError("No factors found in provided metadata.")
     num_neighbors = _validate_num_neighbors(num_neighbors)
     num_factors = metadata.total_num_factors
@@ -110,7 +114,7 @@ def balance(
                 data[:, idx],
                 discrete_features=is_discrete,  # type: ignore
                 n_neighbors=num_neighbors,
-                random_state=0,
+                random_state=get_seed(),
             )
         else:
             mi[idx, :] = mutual_info_classif(
@@ -118,7 +122,7 @@ def balance(
                 data[:, idx],
                 discrete_features=is_discrete,  # type: ignore
                 n_neighbors=num_neighbors,
-                random_state=0,
+                random_state=get_seed(),
             )
     # Normalization via entropy
@@ -147,7 +151,7 @@ def balance(
             tgt_bin[:, idx],
             discrete_features=is_discrete,  # type: ignore
             n_neighbors=num_neighbors,
-            random_state=0,
+            random_state=get_seed(),
         )
     # Classwise normalization via entropy

dataeval/metrics/bias/_diversity.py CHANGED Viewed

@@ -158,6 +158,9 @@ def diversity(
     --------
     scipy.stats.entropy
     """
+    if not metadata.discrete_factor_names and not metadata.continuous_factor_names:
+        raise ValueError("No factors found in provided metadata.")
     diversity_fn = get_method(_DIVERSITY_FN_MAP, method)
     discretized_data = np.hstack((metadata.class_labels[:, np.newaxis], metadata.discrete_data))
     cnts = get_counts(discretized_data)

dataeval/metrics/bias/_parity.py CHANGED Viewed

@@ -241,6 +241,8 @@ def parity(metadata: Metadata) -> ParityOutput:
     >>> parity(metadata)
     ParityOutput(score=array([7.357, 5.467, 0.515]), p_value=array([0.289, 0.243, 0.773]), factor_names=['age', 'income', 'gender'], insufficient_data={'age': {3: {'artist': 4}, 4: {'artist': 4, 'teacher': 3}}, 'income': {1: {'artist': 3}}})
     """  # noqa: E501
+    if not metadata.discrete_factor_names and not metadata.continuous_factor_names:
+        raise ValueError("No factors found in provided metadata.")
     chi_scores = np.zeros(metadata.discrete_data.shape[1])
     p_values = np.zeros_like(chi_scores)

dataeval 0.82.0__py3-none-any.whl → 0.82.1__py3-none-any.whl

dataeval 0.82.0__py3-none-any.whl → 0.82.1__py3-none-any.whl