dataeval 0.86.7__py3-none-any.whl → 0.86.8__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- dataeval/__init__.py +10 -3
- dataeval/_version.py +21 -0
- dataeval/config.py +7 -1
- dataeval/detectors/drift/_mvdc.py +2 -9
- dataeval/detectors/drift/_nml/_chunk.py +2 -2
- dataeval/detectors/ood/ae.py +1 -1
- dataeval/detectors/ood/base.py +3 -3
- dataeval/metrics/bias/_completeness.py +3 -3
- dataeval/metrics/bias/_coverage.py +2 -2
- dataeval/metrics/bias/_parity.py +1 -1
- dataeval/metrics/estimators/_ber.py +2 -2
- dataeval/metrics/estimators/_divergence.py +2 -2
- dataeval/outputs/_estimators.py +6 -6
- dataeval/utils/_array.py +20 -9
- dataeval/utils/_clusterer.py +7 -7
- dataeval/utils/torch/_internal.py +3 -3
- dataeval/utils/torch/trainer.py +1 -1
- {dataeval-0.86.7.dist-info → dataeval-0.86.8.dist-info}/METADATA +67 -47
- {dataeval-0.86.7.dist-info → dataeval-0.86.8.dist-info}/RECORD +25 -24
- {dataeval-0.86.7.dist-info → dataeval-0.86.8.dist-info}/WHEEL +1 -1
- {dataeval-0.86.7.dist-info → dataeval-0.86.8.dist-info/licenses}/LICENSE.txt +0 -0
dataeval/__init__.py
CHANGED
@@ -7,12 +7,19 @@ shifts that impact performance of deployed models.
 
 from __future__ import annotations
 
-
-
+try:
+    from ._version import __version__
+except ImportError:
+    __version__ = "unknown"
+
+# Strongly type for pyright
+__version__ = str(__version__)
+
+__all__ = ["__version__", "config", "detectors", "log", "metrics", "typing", "utils", "workflows"]
 
 import logging
 
-from
+from . import config, detectors, metrics, typing, utils, workflows
 
 logging.getLogger(__name__).addHandler(logging.NullHandler())
 
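For context, `dataeval.__version__` is now sourced from the generated `dataeval._version` module, with a string fallback when that module is missing; a minimal sketch of the resulting behavior (illustrative only, not part of the package):

```python
import dataeval

# Resolved from dataeval._version (written by setuptools-scm at build time);
# falls back to "unknown" when that module is absent, e.g. in a raw source tree.
print(dataeval.__version__)  # "0.86.8" for this wheel

# The str() cast in __init__.py guarantees a plain string for type checkers.
assert isinstance(dataeval.__version__, str)
```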
dataeval/_version.py
ADDED
@@ -0,0 +1,21 @@
+# file generated by setuptools-scm
+# don't change, don't track in version control
+
+__all__ = ["__version__", "__version_tuple__", "version", "version_tuple"]
+
+TYPE_CHECKING = False
+if TYPE_CHECKING:
+    from typing import Tuple
+    from typing import Union
+
+    VERSION_TUPLE = Tuple[Union[int, str], ...]
+else:
+    VERSION_TUPLE = object
+
+version: str
+__version__: str
+__version_tuple__: VERSION_TUPLE
+version_tuple: VERSION_TUPLE
+
+__version__ = version = '0.86.8'
+__version_tuple__ = version_tuple = (0, 86, 8)
dataeval/config.py
CHANGED
@@ -77,7 +77,13 @@ def get_device(override: DeviceLike | None = None) -> torch.device:
     """
     if override is None:
         global _device
-        return
+        return (
+            torch.get_default_device()
+            if hasattr(torch, "get_default_device")
+            else torch.device("cpu")
+            if _device is None
+            else _device
+        )
     return _todevice(override)
 
 
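The hunk guards `torch.get_default_device()` behind `hasattr` because that accessor only exists in newer torch releases; a standalone sketch of the feature check (illustrative, outside the package):

```python
import torch

# torch.get_default_device() is only available in newer torch releases,
# so feature-detect it and fall back to the CPU device otherwise.
default = (
    torch.get_default_device()
    if hasattr(torch, "get_default_device")
    else torch.device("cpu")
)
print(default)
```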
dataeval/detectors/drift/_mvdc.py
CHANGED
@@ -1,16 +1,9 @@
 from __future__ import annotations
 
-from typing import TYPE_CHECKING
-
 import numpy as np
 import pandas as pd
 from numpy.typing import ArrayLike
 
-if TYPE_CHECKING:
-    from typing import Self
-else:
-    from typing_extensions import Self
-
 from dataeval.detectors.drift._nml._chunk import CountBasedChunker, SizeBasedChunker
 from dataeval.detectors.drift._nml._domainclassifier import DomainClassifierCalculator
 from dataeval.detectors.drift._nml._thresholds import ConstantThreshold
@@ -52,7 +45,7 @@ class DriftMVDC:
             threshold=ConstantThreshold(lower=self.threshold[0], upper=self.threshold[1]),
         )
 
-    def fit(self, x_ref: ArrayLike) ->
+    def fit(self, x_ref: ArrayLike) -> DriftMVDC:
         """
         Fit the domain classifier on the training dataframe
 
@@ -63,7 +56,7 @@ class DriftMVDC:
 
         Returns
         -------
-
+        DriftMVDC
 
         """
         # for 1D input, assume that is 1 sample: dim[1,n_features]
dataeval/detectors/drift/_nml/_chunk.py
CHANGED
@@ -46,10 +46,10 @@ class Chunk(ABC):
         return self.data.shape[0]
 
     @abstractmethod
-    def __add__(self, other:
+    def __add__(self, other: Any) -> Any: ...
 
     @abstractmethod
-    def __lt__(self, other:
+    def __lt__(self, other: Any) -> bool: ...
 
     @abstractmethod
     def dict(self) -> dict[str, Any]: ...
dataeval/detectors/ood/ae.py
CHANGED
@@ -65,7 +65,7 @@ class OOD_AE(OODBase):
         self,
         x_ref: ArrayLike,
         threshold_perc: float,
-        loss_fn: Callable[..., torch.
+        loss_fn: Callable[..., torch.Tensor] | None = None,
         optimizer: torch.optim.Optimizer | None = None,
         epochs: int = 20,
         batch_size: int = 64,
dataeval/detectors/ood/base.py
CHANGED
@@ -22,7 +22,7 @@ from dataeval.utils.torch._gmm import GaussianMixtureModelParams, gmm_params
 from dataeval.utils.torch._internal import trainer
 
 
-class OODBase(OODBaseMixin[torch.nn.Module], OODFitMixin[Callable[..., torch.
+class OODBase(OODBaseMixin[torch.nn.Module], OODFitMixin[Callable[..., torch.Tensor], torch.optim.Optimizer]):
     def __init__(self, model: torch.nn.Module, device: DeviceLike | None = None) -> None:
         self.device: torch.device = get_device(device)
         super().__init__(model)
@@ -31,7 +31,7 @@ class OODBase(OODBaseMixin[torch.nn.Module], OODFitMixin[Callable[..., torch.nn.
         self,
         x_ref: ArrayLike,
         threshold_perc: float,
-        loss_fn: Callable[..., torch.
+        loss_fn: Callable[..., torch.Tensor] | None,
         optimizer: torch.optim.Optimizer | None,
         epochs: int,
         batch_size: int,
@@ -82,7 +82,7 @@ class OODBaseGMM(OODBase, OODGMMMixin[GaussianMixtureModelParams]):
         self,
         x_ref: ArrayLike,
         threshold_perc: float,
-        loss_fn: Callable[..., torch.
+        loss_fn: Callable[..., torch.Tensor] | None,
         optimizer: torch.optim.Optimizer | None,
         epochs: int,
         batch_size: int,
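For illustration, the updated `loss_fn` annotation accepts any callable returning a `torch.Tensor`, or `None` to keep the detectors' default loss; a hedged sketch of such a callable (the name `mse_loss` is an example, not part of the diff):

```python
import torch

def mse_loss(y: torch.Tensor, y_hat: torch.Tensor) -> torch.Tensor:
    # Any callable returning a torch.Tensor satisfies Callable[..., torch.Tensor];
    # passing loss_fn=None keeps the detector's built-in default.
    return torch.nn.functional.mse_loss(y_hat, y)
```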
dataeval/metrics/bias/_completeness.py
CHANGED
@@ -9,11 +9,11 @@ import numpy as np
 
 from dataeval.config import EPSILON
 from dataeval.outputs import CompletenessOutput
-from dataeval.typing import
+from dataeval.typing import Array
 from dataeval.utils._array import ensure_embeddings
 
 
-def completeness(embeddings:
+def completeness(embeddings: Array, quantiles: int) -> CompletenessOutput:
     """
     Calculate the fraction of boxes in a grid defined by quantiles that
     contain at least one data point.
@@ -21,7 +21,7 @@ def completeness(embeddings: ArrayLike, quantiles: int) -> CompletenessOutput:
 
     Parameters
     ----------
-    embeddings :
+    embeddings : Array
         Embedded dataset (or other low-dimensional data) (nxp)
     quantiles : int
         number of quantile values to use for partitioning each dimension
dataeval/metrics/bias/_coverage.py
CHANGED
@@ -10,13 +10,13 @@ from scipy.spatial.distance import pdist, squareform
 
 from dataeval.outputs import CoverageOutput
 from dataeval.outputs._base import set_metadata
-from dataeval.typing import
+from dataeval.typing import Array
 from dataeval.utils._array import ensure_embeddings, flatten
 
 
 @set_metadata
 def coverage(
-    embeddings:
+    embeddings: Array,
     radius_type: Literal["adaptive", "naive"] = "adaptive",
     num_observations: int = 20,
     percent: float = 0.01,
dataeval/metrics/bias/_parity.py
CHANGED
@@ -271,7 +271,7 @@ def parity(metadata: Metadata) -> ParityOutput:
         # because scipy.stats.chi2_contingency fails when there are rows containing only zeros.
         contingency_matrix = contingency_matrix[np.any(contingency_matrix, axis=1)]
 
-        chi_scores[i], p_values[i] = chi2_contingency(contingency_matrix)[:2]
+        chi_scores[i], p_values[i] = chi2_contingency(contingency_matrix)[:2]  # type: ignore
 
     if insufficient_data:
         warnings.warn(
dataeval/metrics/estimators/_ber.py
CHANGED
@@ -22,7 +22,7 @@ from scipy.stats import mode
 from dataeval.config import EPSILON
 from dataeval.outputs import BEROutput
 from dataeval.outputs._base import set_metadata
-from dataeval.typing import
+from dataeval.typing import Array
 from dataeval.utils._array import as_numpy, ensure_embeddings
 from dataeval.utils._method import get_method
 from dataeval.utils._mst import compute_neighbors, minimum_spanning_tree
@@ -105,7 +105,7 @@ _BER_FN_MAP = {"KNN": ber_knn, "MST": ber_mst}
 
 
 @set_metadata
-def ber(embeddings:
+def ber(embeddings: Array, labels: Array, k: int = 1, method: Literal["KNN", "MST"] = "KNN") -> BEROutput:
     """
     An estimator for Multi-class :term:`Bayes error rate<Bayes Error Rate (BER)>` \
     using FR or KNN test statistic basis.
dataeval/metrics/estimators/_divergence.py
CHANGED
@@ -14,7 +14,7 @@ from numpy.typing import NDArray
 
 from dataeval.outputs import DivergenceOutput
 from dataeval.outputs._base import set_metadata
-from dataeval.typing import
+from dataeval.typing import Array
 from dataeval.utils._array import ensure_embeddings
 from dataeval.utils._method import get_method
 from dataeval.utils._mst import compute_neighbors, minimum_spanning_tree
@@ -65,7 +65,7 @@ _DIVERGENCE_FN_MAP = {"FNN": divergence_fnn, "MST": divergence_mst}
 
 
 @set_metadata
-def divergence(emb_a:
+def divergence(emb_a: Array, emb_b: Array, method: Literal["FNN", "MST"] = "FNN") -> DivergenceOutput:
     """
     Calculates the :term:`divergence` and any errors between the datasets.
 
dataeval/outputs/_estimators.py
CHANGED
@@ -47,11 +47,11 @@ class ClustererOutput(Output):
         The strength of the data point belonging to the assigned cluster
     """
 
-    clusters: NDArray[np.
-    mst: NDArray[np.
-    linkage_tree: NDArray[np.
-    condensed_tree: NDArray[np.
-    membership_strengths: NDArray[np.
+    clusters: NDArray[np.intp]
+    mst: NDArray[np.float32]
+    linkage_tree: NDArray[np.float32]
+    condensed_tree: NDArray[np.float32]
+    membership_strengths: NDArray[np.float32]
 
     def find_outliers(self) -> NDArray[np.int_]:
         """
@@ -77,7 +77,7 @@ class ClustererOutput(Output):
         # Delay load numba compiled functions
         from dataeval.utils._clusterer import compare_links_to_cluster_std, sorted_union_find
 
-        exact_indices, near_indices = compare_links_to_cluster_std(self.mst, self.clusters)
+        exact_indices, near_indices = compare_links_to_cluster_std(self.mst, self.clusters)  # type: ignore
 
         exact_dupes = sorted_union_find(exact_indices)
         near_dupes = sorted_union_find(near_indices)
 
dataeval/utils/_array.py
CHANGED
@@ -19,7 +19,7 @@ _logger = logging.getLogger(__name__)
 
 _MODULE_CACHE = {}
 
-T = TypeVar("T",
+T = TypeVar("T", Array, np.ndarray, torch.Tensor)
 _np_dtype = TypeVar("_np_dtype", bound=np.generic)
 
 
@@ -73,6 +73,19 @@ def to_numpy_iter(iterable: Iterable[ArrayLike]) -> Iterator[NDArray[Any]]:
         yield to_numpy(array)
 
 
+@overload
+def rescale_array(array: NDArray[_np_dtype]) -> NDArray[_np_dtype]: ...
+@overload
+def rescale_array(array: torch.Tensor) -> torch.Tensor: ...
+def rescale_array(array: Array | NDArray[_np_dtype] | torch.Tensor) -> Array | NDArray[_np_dtype] | torch.Tensor:
+    """Rescale an array to the range [0, 1]"""
+    if isinstance(array, (np.ndarray, torch.Tensor)):
+        arr_min = array.min()
+        arr_max = array.max()
+        return (array - arr_min) / (arr_max - arr_min)
+    raise TypeError(f"Unsupported type: {type(array)}")
+
+
 @overload
 def ensure_embeddings(
     embeddings: T,
@@ -137,14 +150,12 @@ def ensure_embeddings(
     if arr.ndim != 2:
         raise ValueError(f"Expected a 2D array, but got a {arr.ndim}D array.")
 
-    if unit_interval:
-
-
-
-
-
-    else:
-        raise ValueError("Embeddings must be unit interval [0, 1].")
+    if unit_interval and (arr.min() < 0 or arr.max() > 1):
+        if unit_interval == "force":
+            warnings.warn("Embeddings are not unit interval [0, 1]. Forcing to unit interval.")
+            arr = rescale_array(arr)
+        else:
+            raise ValueError("Embeddings must be unit interval [0, 1].")
 
     if dtype is None:
         return embeddings
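As a reader aid, the new `rescale_array` helper is a plain min-max rescale, and `ensure_embeddings(..., unit_interval="force")` now warns and applies it instead of raising; a standalone sketch of the arithmetic (illustrative, not the packaged code):

```python
import numpy as np

# Min-max rescale into [0, 1], mirroring what rescale_array does for
# np.ndarray and torch.Tensor inputs (anything else raises TypeError).
x = np.array([2.0, 4.0, 6.0], dtype=np.float32)
scaled = (x - x.min()) / (x.max() - x.min())
print(scaled)  # [0.  0.5 1. ]
```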
dataeval/utils/_clusterer.py
CHANGED
@@ -69,12 +69,12 @@ def compare_links_to_cluster_std(
 @dataclass
 class ClusterData:
     clusters: NDArray[np.intp]
-    mst: NDArray[np.
-    linkage_tree: NDArray[np.
+    mst: NDArray[np.float32]
+    linkage_tree: NDArray[np.float32]
     condensed_tree: CondensedTree
-    membership_strengths: NDArray[np.
+    membership_strengths: NDArray[np.float32]
     k_neighbors: NDArray[np.int32]
-    k_distances: NDArray[np.
+    k_distances: NDArray[np.float32]
 
 
 def cluster(data: ArrayLike) -> ClusterData:
@@ -95,9 +95,9 @@ def cluster(data: ArrayLike) -> ClusterData:
 
     max_neighbors = min(25, num_samples - 1)
     kneighbors, kdistances = calculate_neighbor_distances(x, max_neighbors)
-    unsorted_mst: NDArray[np.
-    mst: NDArray[np.
-    linkage_tree: NDArray[np.
+    unsorted_mst: NDArray[np.float32] = minimum_spanning_tree(x, kneighbors, kdistances)
+    mst: NDArray[np.float32] = unsorted_mst[np.argsort(unsorted_mst.T[2])]
+    linkage_tree: NDArray[np.float32] = mst_to_linkage_tree(mst).astype(np.float32)
     condensed_tree: CondensedTree = condense_tree(linkage_tree, min_cluster_size, None)
 
     cluster_tree = cluster_tree_from_condensed_tree(condensed_tree)
dataeval/utils/torch/_internal.py
CHANGED
@@ -65,7 +65,7 @@ def trainer(
     model: torch.nn.Module,
     x_train: NDArray[Any],
     y_train: NDArray[Any] | None,
-    loss_fn: Callable[..., torch.Tensor
+    loss_fn: Callable[..., torch.Tensor] | None,
     optimizer: torch.optim.Optimizer | None,
     preprocess_fn: Callable[[torch.Tensor], torch.Tensor] | None,
     epochs: int,
@@ -117,7 +117,7 @@ def trainer(
     model = model.to(device)
 
     # iterate over epochs
-    loss = torch.nan
+    loss = torch.scalar_tensor(torch.nan)
     disable_tqdm = not verbose
     for epoch in (pbar := tqdm(range(epochs), disable=disable_tqdm)):
         epoch_loss = loss
@@ -133,7 +133,7 @@ def trainer(
             y_hat = model(x)
             y = x if y is None else y
 
-            loss = loss_fn(y, *y_hat) if isinstance(y_hat, tuple) else loss_fn(y, y_hat)
+            loss = loss_fn(y, *y_hat) if isinstance(y_hat, tuple) else loss_fn(y, y_hat)
 
             optimizer.zero_grad()
             loss.backward()
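The sentinel change above keeps `loss` (and therefore `epoch_loss`) a tensor before the first batch runs; a quick standalone check (illustrative):

```python
import torch

# A 0-dim NaN tensor instead of the Python float torch.nan keeps the
# variable's type stable, so tensor methods can be called on it unconditionally.
loss = torch.scalar_tensor(torch.nan)
print(loss.shape, loss.isnan().item())  # torch.Size([]) True
```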
dataeval/utils/torch/trainer.py
CHANGED
@@ -172,7 +172,7 @@ class AETrainer:
        for batch in dl:
            imgs = get_images_from_batch(batch)
            imgs = imgs.to(self.device)
-            embeddings = encode_func(imgs).to("cpu")
+            embeddings = encode_func(imgs).to("cpu")  # type: ignore
            encodings = torch.vstack((encodings, embeddings)) if len(encodings) else embeddings
 
        return encodings
{dataeval-0.86.7.dist-info → dataeval-0.86.8.dist-info}/METADATA
CHANGED
@@ -1,45 +1,52 @@
-Metadata-Version: 2.
+Metadata-Version: 2.4
 Name: dataeval
-Version: 0.86.
+Version: 0.86.8
 Summary: DataEval provides a simple interface to characterize image data and its impact on model performance across classification and object-detection tasks
-
-
-
-Author-email: andrew.weng@ariacoustics.com
-Maintainer: ARiA
-
-
+Project-URL: Homepage, https://dataeval.ai/
+Project-URL: Repository, https://github.com/aria-ml/dataeval/
+Project-URL: Documentation, https://dataeval.readthedocs.io/
+Author-email: Andrew Weng <andrew.weng@ariacoustics.com>, Bill Peria <bill.peria@ariacoustics.com>, Jon Botts <jonathan.botts@ariacoustics.com>, Jonathan Christian <jonathan.christian@ariacoustics.com>, Justin McMillan <justin.mcmillan@ariacoustics.com>, Ryan Wood <ryan.wood@ariacoustics.com>, Scott Swan <scott.swan@ariacoustics.com>, Shaun Jullens <shaun.jullens@ariacoustics.com>
+Maintainer-email: ARiA <dataeval@ariacoustics.com>
+License-Expression: MIT
+License-File: LICENSE.txt
 Classifier: Development Status :: 4 - Beta
 Classifier: Intended Audience :: Science/Research
 Classifier: License :: OSI Approved :: MIT License
 Classifier: Operating System :: OS Independent
-Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3 :: Only
 Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: 3.12
-Classifier: Programming Language :: Python :: 3 :: Only
 Classifier: Topic :: Scientific/Engineering
+Requires-Python: <3.13,>=3.9
+Requires-Dist: defusedxml>=0.7.1
+Requires-Dist: fast-hdbscan==0.2.0
+Requires-Dist: lightgbm>=4
+Requires-Dist: numba>=0.59.1
+Requires-Dist: numpy>=1.24.2
+Requires-Dist: pandas>=2.0
+Requires-Dist: pillow>=10.3.0
+Requires-Dist: polars>=1.0.0
+Requires-Dist: requests>=2.32.3
+Requires-Dist: scikit-learn>=1.5.0
+Requires-Dist: scipy>=1.10
+Requires-Dist: torch>=2.2.0
+Requires-Dist: torchvision>=0.17.0
+Requires-Dist: tqdm>=4.66
+Requires-Dist: typing-extensions>=4.12; python_version ~= '3.9'
+Requires-Dist: xxhash>=3.3
 Provides-Extra: all
-Requires-Dist:
-
-Requires-Dist:
-Requires-Dist:
-
-Requires-Dist:
-Requires-Dist:
-
-Requires-Dist:
-Requires-Dist:
-Requires-Dist: scikit-learn (>=1.5.0)
-Requires-Dist: scipy (>=1.10)
-Requires-Dist: torch (>=2.2.0)
-Requires-Dist: torchvision (>=0.17.0)
-Requires-Dist: tqdm
-Requires-Dist: typing-extensions (>=4.12) ; python_version >= "3.9" and python_version < "4.0"
-Requires-Dist: xxhash (>=3.3)
-Project-URL: Documentation, https://dataeval.readthedocs.io/
-Project-URL: Repository, https://github.com/aria-ml/dataeval/
+Requires-Dist: matplotlib>=3.7.1; extra == 'all'
+Provides-Extra: cpu
+Requires-Dist: torch>=2.2.0; extra == 'cpu'
+Requires-Dist: torchvision>=0.17.0; extra == 'cpu'
+Provides-Extra: cu118
+Requires-Dist: torch>=2.2.0; extra == 'cu118'
+Requires-Dist: torchvision>=0.17.0; extra == 'cu118'
+Provides-Extra: cu124
+Requires-Dist: torch>=2.2.0; extra == 'cu124'
+Requires-Dist: torchvision>=0.17.0; extra == 'cu124'
 Description-Content-Type: text/markdown
 
 # DataEval
@@ -72,26 +79,28 @@ estimation, bias detection, and dataset linting.
 <!-- end needs -->
 
 <!-- start JATIC interop -->
+
 DataEval is easy to install, supports a wide range of Python versions, and is
 compatible with many of the most popular packages in the scientific and T&E
 communities.
 
 DataEval also has native interoperability between JATIC's suite of tools when
 using MAITE-compliant datasets and models.
+
 <!-- end JATIC interop -->
 
 ## Getting Started
 
 **Python versions:** 3.9 - 3.12
 
-**Supported packages**:
+**Supported packages**: _NumPy_, _Pandas_, _Sci-kit learn_, _MAITE_, _NRTK_
 
 Choose your preferred method of installation below or follow our
 [installation guide](https://dataeval.readthedocs.io/en/v0.74.2/installation.html).
 
-
-
-
+- [Installing with pip](#installing-with-pip)
+- [Installing with conda/mamba](#installing-with-conda)
+- [Installing from GitHub](#installing-from-github)
 
 ### **Installing with pip**
 
@@ -105,7 +114,7 @@ pip install dataeval[all]
 ### **Installing with conda**
 
 DataEval can be installed in a Conda/Mamba environment using the provided
-`environment.yaml` file.
+`environment.yaml` file. As some dependencies are installed from the `pytorch`
 channel, the channel is specified in the below example.
 
 ```bash
@@ -115,12 +124,10 @@ micromamba create -f environment\environment.yaml -c pytorch
 ### **Installing from GitHub**
 
 To install DataEval from source locally on Ubuntu, you will need `git-lfs` to
-download larger, binary source files
-management.
+download larger, binary source files.
 
 ```bash
 sudo apt-get install git-lfs
-pip install poetry
 ```
 
 Pull the source down and change to the DataEval project directory.
@@ -130,26 +137,40 @@ git clone https://github.com/aria-ml/dataeval.git
 cd dataeval
 ```
 
-
+#### **Using Poetry**
+
+Install DataEval with all extras.
 
 ```bash
-poetry install --all
+poetry install --extras=all
 ```
 
-
-environment by prefixing shell commands with `poetry run`, or activate the
-virtual environment directly in the shell.
+Enable Poetry's virtual environment.
 
 ```bash
-poetry
+poetry env activate
+```
+
+#### **Using uv**
+
+Install DataEval with all extras and dependencies for development.
+
+```bash
+uv sync --extra=all
+```
+
+Enable uv's virtual environment.
+
+```bash
+source .venv/bin/activate
 ```
 
 ## Contact Us
 
 If you have any questions, feel free to reach out to the people below:
 
-
-
+- **POC**: Scott Swan @scott.swan
+- **DPOC**: Andrew Weng @aweng
 
 ## Acknowledgement
 
@@ -164,4 +185,3 @@ interpreted as necessarily representing the official policies or endorsements,
 either expressed or implied, of the U.S. Government.
 
 <!-- end acknowledgement -->
-
{dataeval-0.86.7.dist-info → dataeval-0.86.8.dist-info}/RECORD
CHANGED
@@ -1,6 +1,9 @@
-dataeval/__init__.py,sha256=
+dataeval/__init__.py,sha256=dEDltdHOnbk4-XAbQwJLOZtCbRLZsDMnptWRwbF2r54,1773
 dataeval/_log.py,sha256=C7AGkIRzymvYJ0LQXtnShiy3i5Xrp8T58JzIHHguk_Q,365
-dataeval/
+dataeval/_version.py,sha256=IPUOExUy8nF4kYGtCPV5bg6_IYDRLVOKnFJcNllcO1M,513
+dataeval/config.py,sha256=g3Np0Q3J5Rzij6Gsz7tJh7eOxgwNPf6NsFYmAR8Atfs,4219
+dataeval/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+dataeval/typing.py,sha256=W8rqFFkAqE5a5ar3MmB-O5gcMJqvoDKXC8Y0ggBqAKo,7216
 dataeval/data/__init__.py,sha256=wzQ6uUFLNB3VJR0a2QnRBYwEmwXT93q0WpHu7FmFW1E,486
 dataeval/data/_embeddings.py,sha256=PFjpdV9bfusCB4taTIYSzx1hP8nJb_KCkZTN8kMw-Hs,12885
 dataeval/data/_images.py,sha256=Rc_59CuU4zfN7Xm7an1XUx8ZghQg6a56VJWMZD9edRw,2654
@@ -21,21 +24,21 @@ dataeval/detectors/drift/_base.py,sha256=6aNF1LzG3w1sNUrmSBbsvuN5IkQnoRikRacqobY
 dataeval/detectors/drift/_cvm.py,sha256=cS33zWJmFY1fft1XcANcP2jSD5ou7TxvIU2AldhTynM,3004
 dataeval/detectors/drift/_ks.py,sha256=uMc5-NA-lSV1IODrY8uJe87ll3uRJT_oXLJFXy95M1w,3186
 dataeval/detectors/drift/_mmd.py,sha256=uw8axM6dWxTBrCaXwkbldIDcdhe4hmim9yrsbuOwA-0,11523
-dataeval/detectors/drift/_mvdc.py,sha256=
+dataeval/detectors/drift/_mvdc.py,sha256=WMN6aDOWCh1q1MtdRXFIZlFcfnVi4XgBHsS0A6L5UuY,2942
+dataeval/detectors/drift/_uncertainty.py,sha256=BHlykJ-r7TGLJxdPfoazXnoAJ1qVDzbk5HjAMdsnHz8,5847
+dataeval/detectors/drift/updates.py,sha256=L1PnrPlIE1x6ujCc5mCwjcAZwadVTn-Zjb6MnTDvzJQ,2251
 dataeval/detectors/drift/_nml/__init__.py,sha256=MNyKyZlfTjr5uQql2uBBfRkUdsuduie_WJdn09GYmqg,137
 dataeval/detectors/drift/_nml/_base.py,sha256=o34LcCsD9p1A6u8UdQn-dxIVwC2CMr6uCpC0vq16JX0,2663
-dataeval/detectors/drift/_nml/_chunk.py,sha256=
+dataeval/detectors/drift/_nml/_chunk.py,sha256=xF3U-CAobzoKX-20yjWjGVD14IOcAV6rPaIrqCMwGdQ,13564
 dataeval/detectors/drift/_nml/_domainclassifier.py,sha256=n7Ttq5Ej7sAY9Jn2iagaGj4IIWiG8gmA3wwFizlBqes,7292
 dataeval/detectors/drift/_nml/_result.py,sha256=TMK17bnlgSdL0MCRHtQZJO8YoWWe4C2kh_akESrlP1g,3269
 dataeval/detectors/drift/_nml/_thresholds.py,sha256=WGdkLei9w_EvvsRHQzWdDyFVoZHIwM78k_aB3eoh31Q,12060
-dataeval/detectors/drift/_uncertainty.py,sha256=BHlykJ-r7TGLJxdPfoazXnoAJ1qVDzbk5HjAMdsnHz8,5847
-dataeval/detectors/drift/updates.py,sha256=L1PnrPlIE1x6ujCc5mCwjcAZwadVTn-Zjb6MnTDvzJQ,2251
 dataeval/detectors/linters/__init__.py,sha256=xn2zPwUcmsuf-Jd9uw6AVI11C9z1b1Y9fYtuFnXenZ0,404
 dataeval/detectors/linters/duplicates.py,sha256=X5WSEvI_BHkLoXjkaHK6wTnSkx4IjpO_exMRjSlhc70,4963
 dataeval/detectors/linters/outliers.py,sha256=GaM9n8yPgBPzVOL_bxJCj0eCwobEEP4JHKHD9liRdlw,10130
 dataeval/detectors/ood/__init__.py,sha256=juCYBDs7CQEAtMhnEpPqF6uTrOIH9kTBSuQ_GRw6a8o,283
-dataeval/detectors/ood/ae.py,sha256=
-dataeval/detectors/ood/base.py,sha256=
+dataeval/detectors/ood/ae.py,sha256=cJ7nq4iwTvW8uihHCUhGfTlKsAlthJ2tOhgSsB27cOY,2941
+dataeval/detectors/ood/base.py,sha256=hx-TPJnUTZ7KcBkm8SbN1RGhtJyQN0XLajDyNqiZrJo,3042
 dataeval/detectors/ood/mixin.py,sha256=0_o-1HPvgf3-Lf1MSOIfjj5UB8LTLEBGYtJJfyCCzwc,5431
 dataeval/metadata/__init__.py,sha256=XDDmJbOZBNM6pL0r6Nbu6oMRoyAh22IDkPYGndNlkZU,316
 dataeval/metadata/_distance.py,sha256=MbXM9idsooNWnGLaTKg8j4ZqavUeJUjuW7EPW3-UQyg,4234
@@ -44,14 +47,14 @@ dataeval/metadata/_utils.py,sha256=BcGoYVfA4AkAWpInY5txOc3QBpsGf6cnnUAsHOQTJAE,1
 dataeval/metrics/__init__.py,sha256=8VC8q3HuJN3o_WN51Ae2_wXznl3RMXIvA5GYVcy7vr8,225
 dataeval/metrics/bias/__init__.py,sha256=329S1_3WnWqeU4-qVcbe0fMy4lDrj9uKslWHIQf93yg,839
 dataeval/metrics/bias/_balance.py,sha256=fREtoMLUZPOf_ivqNKwij6oPiKMTk02ECO5rWURf3KY,5541
-dataeval/metrics/bias/_completeness.py,sha256=
-dataeval/metrics/bias/_coverage.py,sha256=
+dataeval/metrics/bias/_completeness.py,sha256=2cvOXe7fhtxZGH_4QBuiCafIeamxFBarMiUBuEP7QGI,4596
+dataeval/metrics/bias/_coverage.py,sha256=v2x2hbOf2za9jFcSVSJUAoJ2BJfzzlCzt0mFIGtBL0A,3639
 dataeval/metrics/bias/_diversity.py,sha256=25udDKmel9IjeVT5nM4dOa1apda66QdRxBc922yuUvI,5830
-dataeval/metrics/bias/_parity.py,sha256=
+dataeval/metrics/bias/_parity.py,sha256=MKpqL4aoqEHkRl0vtGvVq9V3KBOtDFTtAo5I2GfIG4A,11443
 dataeval/metrics/estimators/__init__.py,sha256=Pnds8uIyAovt2fKqZjiHCIP_kVoBWlVllekYuK5UmmU,568
-dataeval/metrics/estimators/_ber.py,sha256=
+dataeval/metrics/estimators/_ber.py,sha256=7noeRyOJJYqrJ_jt90nRHtR2t2u5MIvTCmWt0_rd4EU,5370
 dataeval/metrics/estimators/_clusterer.py,sha256=1HrpihGTJ63IkNSOy4Ibw633Gllkm1RxKmoKT5MOgt0,1434
-dataeval/metrics/estimators/_divergence.py,sha256
+dataeval/metrics/estimators/_divergence.py,sha256=t-Z_7Bq4V4FunxKlq7G4ThtgLany8n4iEU0n0afr7F8,3991
 dataeval/metrics/estimators/_uap.py,sha256=BULEBbJ9BQ1IcTeZf0x7iI60QHAWCccBOM97FIu9VXA,1928
 dataeval/metrics/stats/__init__.py,sha256=6tA_9nbbM5ObJ6cds8Y1VBtTQiTOxrpGQSFLu_lWGGA,1098
 dataeval/metrics/stats/_base.py,sha256=R-hxoEPLreZcxYxBfyjbKfdoGMMTPiqJ5g2zSO-1UYM,12541
@@ -66,19 +69,17 @@ dataeval/outputs/__init__.py,sha256=geHB5M3QOiFFaQGV4ZwDTTKpqZPvPePbqG7lzaPhaXQ,
 dataeval/outputs/_base.py,sha256=-Wa0gFcBVLbfWPMZyCql7x4vGsnkLP4pecsQIeUZ2_Y,5904
 dataeval/outputs/_bias.py,sha256=1OZpKncYTryjPLRHb4d6NlhE27uPT57gCob_5jtjKDI,10456
 dataeval/outputs/_drift.py,sha256=hXILED_soY8ppIQZgftQvmumtwDrTnABbYl-flIGEU4,4588
-dataeval/outputs/_estimators.py,sha256=
+dataeval/outputs/_estimators.py,sha256=IQgSbOPHYzzxn1X64XF2XxQhDlWy6jwy6RNyoyvsipE,3111
 dataeval/outputs/_linters.py,sha256=k8lkd8EZ23q0m-HOD-FgqMcLQFy1UH7vws2ucLPyn08,6697
 dataeval/outputs/_metadata.py,sha256=ffZgpX8KWURPHXpOWjbvJ2KRqWQkS2nWuIjKUzoHhMI,1710
 dataeval/outputs/_ood.py,sha256=suLKVXULGtXH0rq9eXHI1d3d2jhGmItJtz4QiQd47A4,1718
 dataeval/outputs/_stats.py,sha256=_ItGjs9YaMHqjivkR1YBcSErD5ICfa_-iV9nq0l8bTM,17451
 dataeval/outputs/_utils.py,sha256=NfhYaGT2PZlhIs8ICKUsPWHZXjhWYDkEJqBDdqMeaOM,929
 dataeval/outputs/_workflows.py,sha256=K786mOgegxVi81diUA-qpbwGEkwa8YA7Fk4ttgjJeaY,10831
-dataeval/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-dataeval/typing.py,sha256=W8rqFFkAqE5a5ar3MmB-O5gcMJqvoDKXC8Y0ggBqAKo,7216
 dataeval/utils/__init__.py,sha256=hRvyUK7b3d6JBEV5u47rFcOHEcmDYqAvZQw_T5pDAWw,264
-dataeval/utils/_array.py,sha256=
+dataeval/utils/_array.py,sha256=bIDbnv15_hNzFn2Uc4WV1qRyFzubQj2nNYsFUDIdwT0,6335
 dataeval/utils/_bin.py,sha256=w3eJ2Szw5eapqQ0cGv731rhNgLFGW0cCz2pXo9I6CuY,7296
-dataeval/utils/_clusterer.py,sha256=
+dataeval/utils/_clusterer.py,sha256=rUvEdyMwp95lffmt6xKMEwsjRXNoBS0n5mAS_HNOnck,5656
 dataeval/utils/_fast_mst.py,sha256=pv42flr1Uf5RBa9qDG0YLDXWH7Mr7a9zpauO1HqZXaY,8061
 dataeval/utils/_image.py,sha256=4uxTIOYZZlRJOfNmdA3ek3no3FrLWCK5un48kStMDt8,3578
 dataeval/utils/_method.py,sha256=9B9JQbgqWJBRhQJb7glajUtWaQzUTIUuvrZ9_bisxsM,394
@@ -102,12 +103,12 @@ dataeval/utils/datasets/_voc.py,sha256=pafY112O80isYkrdy7Quie9SBm_TmYhREuyl8Sxts
 dataeval/utils/torch/__init__.py,sha256=dn5mjCrFp0b1aL_UEURhONU0Ag0cmXoTOBSGagpkTiA,325
 dataeval/utils/torch/_blocks.py,sha256=HVhBTMMD5NA4qheMUgyol1KWiKZDIuc8k5j4RcMKmhk,1466
 dataeval/utils/torch/_gmm.py,sha256=XM68GNEP97EjaB1U49-ZXRb81d0CEFnPS910alrcB3g,3740
-dataeval/utils/torch/_internal.py,sha256=
+dataeval/utils/torch/_internal.py,sha256=9rzlMeM8i3p-ctulh9WDQATMXtlp-Jk2pBX7NGC8l2I,4146
 dataeval/utils/torch/models.py,sha256=1idpXyjrYcCBSsbxxRUOto8xr4MJNjDEqQHiIXVU5Zc,9700
-dataeval/utils/torch/trainer.py,sha256=
+dataeval/utils/torch/trainer.py,sha256=DRyPScGdE4o5Xo3BmD9p2PGOApzi1E-QfsBRNZ5IXW8,5544
 dataeval/workflows/__init__.py,sha256=ou8y0KO-d6W5lgmcyLjKlf-J_ckP3vilW7wHkgiDlZ4,255
 dataeval/workflows/sufficiency.py,sha256=j-R8dg4XE6a66p_oTXG2GNzgg3vGk85CTblxhFXaxog,8513
-dataeval-0.86.
-dataeval-0.86.
-dataeval-0.86.
-dataeval-0.86.
+dataeval-0.86.8.dist-info/METADATA,sha256=rCf58-uzgjsTNZkY3LOBMSi5fhQ2cdAtnrrDI_eYR_I,5925
+dataeval-0.86.8.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+dataeval-0.86.8.dist-info/licenses/LICENSE.txt,sha256=uAooygKWvX6NbU9Ran9oG2msttoG8aeTeHSTe5JeCnY,1061
+dataeval-0.86.8.dist-info/RECORD,,

{dataeval-0.86.7.dist-info → dataeval-0.86.8.dist-info/licenses}/LICENSE.txt
File without changes