dataeval 0.74.1__py3-none-any.whl → 0.75.0__py3-none-any.whl

This diff shows the contents of publicly released package versions as published to a supported registry. It is provided for informational purposes only and reflects the changes between the two versions as they appear in their public registries.
Files changed (68)
  1. dataeval/__init__.py +33 -10
  2. dataeval/detectors/__init__.py +2 -2
  3. dataeval/detectors/drift/__init__.py +14 -12
  4. dataeval/detectors/drift/base.py +1 -1
  5. dataeval/detectors/drift/cvm.py +1 -1
  6. dataeval/detectors/drift/ks.py +1 -1
  7. dataeval/detectors/drift/mmd.py +6 -5
  8. dataeval/detectors/drift/torch.py +12 -12
  9. dataeval/detectors/drift/uncertainty.py +3 -2
  10. dataeval/detectors/linters/__init__.py +4 -4
  11. dataeval/detectors/linters/clusterer.py +2 -7
  12. dataeval/detectors/linters/duplicates.py +6 -10
  13. dataeval/detectors/linters/outliers.py +4 -2
  14. dataeval/detectors/ood/__init__.py +3 -10
  15. dataeval/detectors/ood/{ae_torch.py → ae.py} +6 -4
  16. dataeval/detectors/ood/base.py +64 -161
  17. dataeval/detectors/ood/metadata_ks_compare.py +34 -42
  18. dataeval/detectors/ood/metadata_least_likely.py +3 -3
  19. dataeval/detectors/ood/metadata_ood_mi.py +6 -5
  20. dataeval/detectors/ood/mixin.py +146 -0
  21. dataeval/detectors/ood/output.py +63 -0
  22. dataeval/interop.py +16 -3
  23. dataeval/log.py +18 -0
  24. dataeval/metrics/__init__.py +2 -2
  25. dataeval/metrics/bias/__init__.py +9 -12
  26. dataeval/metrics/bias/balance.py +10 -8
  27. dataeval/metrics/bias/coverage.py +52 -4
  28. dataeval/metrics/bias/diversity.py +42 -14
  29. dataeval/metrics/bias/parity.py +15 -12
  30. dataeval/metrics/estimators/__init__.py +2 -2
  31. dataeval/metrics/estimators/ber.py +3 -1
  32. dataeval/metrics/estimators/divergence.py +1 -1
  33. dataeval/metrics/estimators/uap.py +1 -1
  34. dataeval/metrics/stats/__init__.py +18 -18
  35. dataeval/metrics/stats/base.py +4 -4
  36. dataeval/metrics/stats/boxratiostats.py +8 -9
  37. dataeval/metrics/stats/datasetstats.py +10 -14
  38. dataeval/metrics/stats/dimensionstats.py +4 -4
  39. dataeval/metrics/stats/hashstats.py +12 -8
  40. dataeval/metrics/stats/labelstats.py +5 -5
  41. dataeval/metrics/stats/pixelstats.py +4 -9
  42. dataeval/metrics/stats/visualstats.py +4 -9
  43. dataeval/output.py +1 -1
  44. dataeval/utils/__init__.py +4 -13
  45. dataeval/utils/dataset/__init__.py +7 -0
  46. dataeval/utils/{torch → dataset}/datasets.py +2 -0
  47. dataeval/utils/dataset/read.py +63 -0
  48. dataeval/utils/dataset/split.py +527 -0
  49. dataeval/utils/image.py +2 -2
  50. dataeval/utils/metadata.py +310 -5
  51. dataeval/{metrics/bias/metadata_utils.py → utils/plot.py} +1 -104
  52. dataeval/utils/torch/__init__.py +2 -17
  53. dataeval/utils/torch/gmm.py +29 -6
  54. dataeval/utils/torch/{utils.py → internal.py} +82 -58
  55. dataeval/utils/torch/models.py +10 -8
  56. dataeval/utils/torch/trainer.py +6 -85
  57. dataeval/workflows/__init__.py +2 -5
  58. dataeval/workflows/sufficiency.py +16 -6
  59. dataeval-0.75.0.dist-info/METADATA +136 -0
  60. dataeval-0.75.0.dist-info/RECORD +67 -0
  61. dataeval/detectors/ood/base_torch.py +0 -109
  62. dataeval/metrics/bias/metadata_preprocessing.py +0 -285
  63. dataeval/utils/gmm.py +0 -26
  64. dataeval/utils/split_dataset.py +0 -492
  65. dataeval-0.74.1.dist-info/METADATA +0 -120
  66. dataeval-0.74.1.dist-info/RECORD +0 -65
  67. {dataeval-0.74.1.dist-info → dataeval-0.75.0.dist-info}/LICENSE.txt +0 -0
  68. {dataeval-0.74.1.dist-info → dataeval-0.75.0.dist-info}/WHEEL +0 -0
dataeval/utils/torch/models.py
@@ -1,6 +1,8 @@
+"""Simple PyTorch model architectures used by DataEval."""
+
 from __future__ import annotations
 
-__all__ = ["AriaAutoencoder", "Encoder", "Decoder"]
+__all__ = ["Autoencoder", "Encoder", "Decoder"]
 
 import math
 from typing import Any
@@ -9,7 +11,7 @@ import torch
 import torch.nn as nn
 
 
-class AriaAutoencoder(nn.Module):
+class Autoencoder(nn.Module):
     """
     An autoencoder model with a separate encoder and decoder.
 
@@ -63,7 +65,7 @@ class Encoder(nn.Module):
     """
     A simple encoder to be used in an autoencoder model.
 
-    This is the encoder used by the AriaAutoencoder model.
+    This is the encoder used by the Autoencoder model.
 
     Parameters
     ----------
@@ -104,7 +106,7 @@ class Decoder(nn.Module):
     """
     A simple decoder to be used in an autoencoder model.
 
-    This is the decoder used by the AriaAutoencoder model.
+    This is the decoder used by the Autoencoder model.
 
     Parameters
     ----------
@@ -142,14 +144,14 @@
 
 class AE(nn.Module):
     """
-    An autoencoder model with a separate encoder and decoder. Meant to replace the TensorFlow model called AE, which we
-    used as the core of an autoencoder-based OOD detector, i.e. as an argument to OOD_AE().
+    An autoencoder model with a separate encoder and decoder used as the core of an autoencoder-based
+    OOD detector, i.e. as an argument to OOD_AE().
 
     Parameters
     ----------
     input_shape : tuple[int, int, int]
         Number of input channels, number of rows, number of columns. (Number of examples per batch will be inferred
-        at runtime.)
+        at runtime.)
     """
 
     def __init__(self, input_shape: tuple[int, int, int]) -> None:
@@ -279,7 +281,7 @@ class Decoder_AE(nn.Module):
     """
     A simple decoder to be used in an autoencoder model.
 
-    This is the decoder used by the AriaAutoencoder model.
+    This is the decoder used by the Autoencoder model.
 
     Parameters
     ----------
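For downstream code, the practical effect of this hunk is the rename of `AriaAutoencoder` to `Autoencoder`. A minimal, hypothetical compatibility shim for code that must run against both versions (assuming nothing else about the constructor changed; dataeval does not ship this alias itself):

```
# Hypothetical shim for the AriaAutoencoder -> Autoencoder rename.
try:
    from dataeval.utils.torch.models import Autoencoder  # 0.75.0 and later
except ImportError:
    from dataeval.utils.torch.models import AriaAutoencoder as Autoencoder  # 0.74.1 and earlier
```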
dataeval/utils/torch/trainer.py
@@ -1,15 +1,15 @@
+"""Utility classes for training PyTorch models."""
+
 from __future__ import annotations
 
-from typing import Any, Callable
+__all__ = ["AETrainer"]
+
+from typing import Any
 
 import torch
 import torch.nn as nn
-from numpy.typing import NDArray
 from torch.optim import Adam
-from torch.utils.data import DataLoader, Dataset, TensorDataset
-from tqdm import tqdm
-
-__all__ = ["AETrainer", "trainer"]
+from torch.utils.data import DataLoader, Dataset
 
 
 def get_images_from_batch(batch: Any) -> Any:
@@ -176,82 +176,3 @@ class AETrainer:
         encodings = torch.vstack((encodings, embeddings)) if len(encodings) else embeddings
 
         return encodings
-
-
-def trainer(
-    model: torch.nn.Module,
-    x_train: NDArray[Any],
-    y_train: NDArray[Any] | None,
-    loss_fn: Callable[..., torch.Tensor | torch.nn.Module] | None,
-    optimizer: torch.optim.Optimizer | None,
-    preprocess_fn: Callable[[torch.Tensor], torch.Tensor] | None,
-    epochs: int,
-    batch_size: int,
-    device: torch.device,
-    verbose: bool,
-) -> None:
-    """
-    Train Pytorch model.
-
-    Parameters
-    ----------
-    model
-        Model to train.
-    loss_fn
-        Loss function used for training.
-    x_train
-        Training data.
-    y_train
-        Training labels.
-    optimizer
-        Optimizer used for training.
-    preprocess_fn
-        Preprocessing function applied to each training batch.
-    epochs
-        Number of training epochs.
-    reg_loss_fn
-        Allows an additional regularisation term to be defined as reg_loss_fn(model)
-    batch_size
-        Batch size used for training.
-    buffer_size
-        Maximum number of elements that will be buffered when prefetching.
-    verbose
-        Whether to print training progress.
-    """
-    if optimizer is None:
-        optimizer = torch.optim.Adam(model.parameters(), lr=0.001)
-
-    if y_train is None:
-        dataset = TensorDataset(torch.from_numpy(x_train).to(torch.float32))
-
-    else:
-        dataset = TensorDataset(
-            torch.from_numpy(x_train).to(torch.float32), torch.from_numpy(y_train).to(torch.float32)
-        )
-
-    loader = DataLoader(dataset=dataset)
-
-    model = model.to(device)
-
-    # iterate over epochs
-    loss = torch.nan
-    disable_tqdm = not verbose
-    for epoch in (pbar := tqdm(range(epochs), disable=disable_tqdm)):
-        epoch_loss = loss
-        for step, data in enumerate(loader):
-            if step % 250 == 0:
-                pbar.set_description(f"Epoch: {epoch} ({epoch_loss:.3f}), loss: {loss:.3f}")
-
-            x, y = [d.to(device) for d in data] if len(data) > 1 else (data[0].to(device), None)
-
-            if isinstance(preprocess_fn, Callable):
-                x = preprocess_fn(x)
-
-            y_hat = model(x)
-            y = x if y is None else y
-
-            loss = loss_fn(y, y_hat)  # type: ignore
-
-            optimizer.zero_grad()
-            loss.backward()
-            optimizer.step()
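The standalone `trainer()` helper is gone; `AETrainer` is now the module's only export. Code that called `trainer()` directly needs its own loop. Below is a minimal sketch adapted from the deleted function above (the name `train_autoencoder` is ours, not part of the 0.75.0 API); unlike the removed code, it actually passes `batch_size` through to the `DataLoader`, which `trainer()` accepted but never used:

```
from __future__ import annotations

from typing import Any, Callable

import torch
from numpy.typing import NDArray
from torch.utils.data import DataLoader, TensorDataset


def train_autoencoder(
    model: torch.nn.Module,
    x_train: NDArray[Any],
    loss_fn: Callable[[torch.Tensor, torch.Tensor], torch.Tensor],
    epochs: int = 20,
    batch_size: int = 64,
    device: str | torch.device = "cpu",
) -> None:
    # Reconstruction setup: inputs double as targets, as in the removed code.
    dataset = TensorDataset(torch.from_numpy(x_train).to(torch.float32))
    loader = DataLoader(dataset, batch_size=batch_size, shuffle=True)
    optimizer = torch.optim.Adam(model.parameters(), lr=0.001)
    model = model.to(device).train()
    for _ in range(epochs):
        for (x,) in loader:
            x = x.to(device)
            loss = loss_fn(x, model(x))  # compare input against its reconstruction
            optimizer.zero_grad()
            loss.backward()
            optimizer.step()
```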
dataeval/workflows/__init__.py
@@ -2,9 +2,6 @@
 Workflows perform a sequence of actions to analyze the dataset and make predictions.
 """
 
-from dataeval import _IS_TORCH_AVAILABLE
+__all__ = ["Sufficiency", "SufficiencyOutput"]
 
-if _IS_TORCH_AVAILABLE:
-    from dataeval.workflows.sufficiency import Sufficiency, SufficiencyOutput
-
-    __all__ = ["Sufficiency", "SufficiencyOutput"]
+from dataeval.workflows.sufficiency import Sufficiency, SufficiencyOutput
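With torch an unconditional requirement in 0.75.0 (the new METADATA below lists `Requires-Dist: torch (>=2.2.0)` with no extra), the `_IS_TORCH_AVAILABLE` gate is no longer needed and the workflow import always succeeds:

```
from dataeval.workflows import Sufficiency, SufficiencyOutput
```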
dataeval/workflows/sufficiency.py
@@ -1,16 +1,15 @@
 from __future__ import annotations
 
-__all__ = ["SufficiencyOutput", "Sufficiency"]
+__all__ = []
 
+import contextlib
 import warnings
 from dataclasses import dataclass
 from typing import Any, Callable, Generic, Iterable, Mapping, Sequence, TypeVar, cast
 
-import matplotlib.pyplot as plt
 import numpy as np
 import torch
 import torch.nn as nn
-from matplotlib.figure import Figure
 from numpy.typing import ArrayLike, NDArray
 from scipy.optimize import basinhopping
 from torch.utils.data import Dataset
@@ -18,6 +17,9 @@ from torch.utils.data import Dataset
 from dataeval.interop import as_numpy
 from dataeval.output import Output, set_metadata
 
+with contextlib.suppress(ImportError):
+    from matplotlib.figure import Figure
+
 
 @dataclass(frozen=True)
 class SufficiencyOutput(Output):
@@ -97,7 +99,7 @@ class SufficiencyOutput(Output):
 
     Returns
     -------
-    list[plt.Figure]
+    list[Figure]
         List of Figures for each measure
 
     Raises
@@ -344,7 +346,9 @@ def plot_measure(
     params: NDArray[Any],
     projection: NDArray[Any],
 ) -> Figure:
-    fig = plt.figure()
+    import matplotlib.pyplot
+
+    fig = matplotlib.pyplot.figure()
     fig = cast(Figure, fig)
     fig.tight_layout()
 
@@ -510,7 +514,13 @@ class Sufficiency(Generic[T]):
     Examples
     --------
     >>> suff = Sufficiency(
-    ...     model=model, train_ds=train_ds, test_ds=test_ds, train_fn=train_fn, eval_fn=eval_fn, runs=3, substeps=5
+    ...     model=model,
+    ...     train_ds=train_ds,
+    ...     test_ds=test_ds,
+    ...     train_fn=train_fn,
+    ...     eval_fn=eval_fn,
+    ...     runs=3,
+    ...     substeps=5,
     ... )
     >>> suff.evaluate()
     SufficiencyOutput(steps=array([ 1, 3, 10, 31, 100], dtype=uint32), params={'test': array([ 0., 42., 0.])}, measures={'test': array([1., 1., 1., 1., 1.])})
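matplotlib, by contrast, becomes a true optional dependency here: the `Figure` import is suppressed at module load, and `matplotlib.pyplot` is imported only inside the plotting function. A minimal sketch of that pattern, with a hypothetical function name (`plot_values`):

```
from __future__ import annotations

import contextlib

# Module import succeeds even without matplotlib installed.
with contextlib.suppress(ImportError):
    from matplotlib.figure import Figure  # needed only for the return annotation


def plot_values(values: list[float]) -> Figure:
    # Deferred import: only calling the plotting API raises ImportError.
    import matplotlib.pyplot

    fig = matplotlib.pyplot.figure()
    fig.gca().plot(values)
    return fig
```

Because annotations are lazy under `from __future__ import annotations`, the `Figure` return hint never evaluates at import time, so the module loads cleanly when matplotlib is absent.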
dataeval-0.75.0.dist-info/METADATA (new file)
@@ -0,0 +1,136 @@
+Metadata-Version: 2.1
+Name: dataeval
+Version: 0.75.0
+Summary: DataEval provides a simple interface to characterize image data and its impact on model performance across classification and object-detection tasks
+Home-page: https://dataeval.ai/
+License: MIT
+Author: Andrew Weng
+Author-email: andrew.weng@ariacoustics.com
+Maintainer: ARiA
+Maintainer-email: dataeval@ariacoustics.com
+Requires-Python: >=3.9,<3.13
+Classifier: Development Status :: 4 - Beta
+Classifier: Intended Audience :: Science/Research
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Operating System :: OS Independent
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.9
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3 :: Only
+Classifier: Topic :: Scientific/Engineering
+Provides-Extra: all
+Requires-Dist: matplotlib ; extra == "all"
+Requires-Dist: numpy (>=1.24.3)
+Requires-Dist: pillow (>=10.3.0)
+Requires-Dist: requests
+Requires-Dist: scikit-learn (>=1.5.0)
+Requires-Dist: scipy (>=1.10)
+Requires-Dist: torch (>=2.2.0)
+Requires-Dist: torchvision (>=0.17.0)
+Requires-Dist: tqdm
+Requires-Dist: typing-extensions (>=4.12) ; python_version >= "3.9" and python_version < "4.0"
+Requires-Dist: xxhash (>=3.3)
+Project-URL: Documentation, https://dataeval.readthedocs.io/
+Project-URL: Repository, https://github.com/aria-ml/dataeval/
+Description-Content-Type: text/markdown
+
+# DataEval
+
+To view our extensive collection of tutorials, how-tos, explanation guides, and reference material, please visit our documentation on **[Read the Docs](https://dataeval.readthedocs.io/)**.
+
+## About DataEval
+
+<!-- start tagline -->
+
+DataEval curates datasets to train and test performant, robust, unbiased, and reliable AI models, and monitors for data shifts that impact the performance of deployed models.
+
+<!-- end tagline -->
+
+### Our mission
+
+<!-- start needs -->
+
+DataEval is an effective, powerful, and reliable set of tools for any T&E engineer. Throughout all stages of the machine learning lifecycle, DataEval supports **model development, data analysis, and monitoring** with state-of-the-art algorithms to help you solve difficult problems. With a focus on computer vision tasks, DataEval provides simple but effective metrics for performance estimation, bias detection, and dataset linting.
+
+<!-- end needs -->
+
+<!-- start JATIC interop -->
+DataEval is easy to install, supports a wide range of Python versions, and is compatible with many of the most popular packages in the scientific and T&E communities.
+DataEval also has native interoperability with JATIC's suite of tools when using MAITE-compliant datasets and models.
+<!-- end JATIC interop -->
+
+## Getting Started
+
+**Python versions:** 3.9 - 3.12
+
+**Supported packages**: *NumPy*, *Pandas*, *scikit-learn*, *MAITE*, *NRTK*, *Gradient*
+
+Choose your preferred method of installation below or follow our [installation guide](https://dataeval.readthedocs.io/en/v0.74.2/installation.html).
+
+* [Installing with pip](#installing-with-pip)
+* [Installing with conda/mamba](#installing-with-conda)
+* [Installing from GitHub](#installing-from-github)
+
+### **Installing with pip**
+You can install DataEval directly from pypi.org using the following command. The only optional dependency extra is `all`.
+
+```
+pip install dataeval[all]
+```
+
+### **Installing with conda**
+
+DataEval can be installed in a Conda/Mamba environment using the provided `environment.yaml` file. Because some dependencies
+are installed from the `pytorch` channel, that channel is specified in the example below.
+
+```
+micromamba create -f environment\environment.yaml -c pytorch
+```
+
+### **Installing from GitHub**
+
+To install DataEval from source locally on Ubuntu, you will need `git-lfs` to download larger binary source files and `poetry` for project dependency management.
+
+```
+sudo apt-get install git-lfs
+pip install poetry
+```
+
+Pull the source down and change to the DataEval project directory.
+```
+git clone https://github.com/aria-ml/dataeval.git
+cd dataeval
+```
+
+Install DataEval with optional dependencies for development.
+```
+poetry install --all-extras --with dev
+```
+
+Now that DataEval is installed, you can run commands in the poetry virtual environment by prefixing shell commands with `poetry run`, or activate the virtual environment directly in the shell.
+```
+poetry shell
+```
+
+## Contact Us
+
+If you have any questions, feel free to reach out to the people below:
+
+- **POC**: Scott Swan @scott.swan
+- **DPOC**: Andrew Weng @aweng
+
+## Acknowledgement
+
+<!-- start attribution -->
+
+### Alibi-Detect
+This project uses code from the [Alibi-Detect](https://github.com/SeldonIO/alibi-detect) Python library developed by SeldonIO.\
+Additional documentation from their developers is available on the [Alibi-Detect documentation page](https://docs.seldon.io/projects/alibi-detect/en/stable/).
+
+### CDAO Funding Acknowledgement
+This material is based upon work supported by the Chief Digital and Artificial Intelligence Office under Contract No. W519TC-23-9-2033. The views and conclusions contained herein are those of the author(s) and should not be interpreted as necessarily representing the official policies or endorsements, either expressed or implied, of the U.S. Government.
+
+<!-- end attribution -->
+
dataeval-0.75.0.dist-info/RECORD (new file)
@@ -0,0 +1,67 @@
+dataeval/__init__.py,sha256=yESctPswyAJ01Hr9k4QUoGZp8D0RtvoQ26k4AFE2vs4,1472
+dataeval/detectors/__init__.py,sha256=iifG-Z08mH5B4QhkKtAieDGJBKldKvmCXpDQJD9qVY8,206
+dataeval/detectors/drift/__init__.py,sha256=wO294Oz--l0GuZTAkBpyGwZphbQsot57HoiEX6kjNOc,652
+dataeval/detectors/drift/base.py,sha256=sX46grnr4DV0WMofLTI2a_tDHR4OLZEUCQrMLePouqg,14468
+dataeval/detectors/drift/cvm.py,sha256=TATS6IOE0INO1pkyRkesgrhDawD_kITsRsOOGVRs420,4132
+dataeval/detectors/drift/ks.py,sha256=3Jgh5W7pC1hO1yZPCiXc47snlSdXv5BIG8sCyRRz-Ec,4220
+dataeval/detectors/drift/mmd.py,sha256=lD__AouWlYWCJOD0eNNEhmLTnUPwNTBU6OCgITcpw40,7592
+dataeval/detectors/drift/torch.py,sha256=ykD-Nggys5T9FTGXXbYYOi2WRKwEzEjXhL8ZueVmTxU,7659
+dataeval/detectors/drift/uncertainty.py,sha256=Pdim80_-ainvOX5-7fhH9cvblYI2d-zocEwZO-JfCg4,5345
+dataeval/detectors/drift/updates.py,sha256=UJ0z5hlunRi7twnkLABfdJG3tT2EqX4y9IGx8_USYvo,1780
+dataeval/detectors/linters/__init__.py,sha256=CZV5naeYQYL3sHXO_CXB26AXkyTeKHI-TMaewtEs8Ag,483
+dataeval/detectors/linters/clusterer.py,sha256=1qIQo5NuJkx-phKFWuXkUpUJLcqTt92L8Cpv3AmO3xQ,20929
+dataeval/detectors/linters/duplicates.py,sha256=pcCRN27IuGa6ASkiFG73kYdI8_X0j12INbkD9GOlWPs,5614
+dataeval/detectors/linters/merged_stats.py,sha256=X-bDTwjyR8RuVmzxLaHZmQ5nI3oOWvsqVlitdSncapk,1355
+dataeval/detectors/linters/outliers.py,sha256=Fn6R_7mGOrWlTRCXFrjHvIFNELN6CTosoJgzDr8cVr0,10253
+dataeval/detectors/ood/__init__.py,sha256=hTeR-Aqt6SKWsqFusaKiw_TlnFPe_sV3fQ7NKUTzZrU,292
+dataeval/detectors/ood/ae.py,sha256=SL8oKTERhMwaZTQWwDhQQ6H07UKj8ozXqEWO3TaOAos,2151
+dataeval/detectors/ood/base.py,sha256=6gUkbGE6PbKmA899rXOTOIeT8u_gaD0DNDQV8Wyfk5Y,3421
+dataeval/detectors/ood/metadata_ks_compare.py,sha256=-hEhDNXFC7X8wmFeoigO7A7Qn90vRLroN_nKDwNgjnE,5204
+dataeval/detectors/ood/metadata_least_likely.py,sha256=rb8GOgsrlrEzc6fxccdmyZQ5PC7HtTsTY8U97D-h5OU,5088
+dataeval/detectors/ood/metadata_ood_mi.py,sha256=7_Sdzf7-x1TlrIQvSyOIB98C8_UQhUwmwFQmZ9_q1Uc,4042
+dataeval/detectors/ood/mixin.py,sha256=Ia-rJF6rtGhE8uavijdbzOha3ueFk2CFfA0Ah_mnF40,4976
+dataeval/detectors/ood/output.py,sha256=8UQbtudQ0gSeq_hQV67IE5SfHednaiGUHv9MideETdk,1710
+dataeval/interop.py,sha256=GLziERWQQGwUO4Nb-uHpbLlvBOT2WF2GVilTHmsDq8w,2279
+dataeval/log.py,sha256=Mn5bRWO0cgtAYd5VGYSFiPgu57ta3zoktrtHAZ1m3dU,357
+dataeval/metrics/__init__.py,sha256=p-lRjm0oVHD3cXZeEajTfuGTuQOCCVHbJ8CqAI_GHVY,238
+dataeval/metrics/bias/__init__.py,sha256=knYgCdeHredaHI6KGdjiYM6ViPfDf8NW35xkKiiGlVM,599
+dataeval/metrics/bias/balance.py,sha256=od3gcejOqJDDymy09OWSxzqkBNyh7Vf3aXN9o6IPKHY,9151
+dataeval/metrics/bias/coverage.py,sha256=k8TJAsUWlLgn_-JEtRWIOwhtMRwXmyGzLDndGxNTsAU,5745
+dataeval/metrics/bias/diversity.py,sha256=upj-Gx_4-bBF-4dDaUSuURIbP98Ghk-BSCK5ZJNGMEg,8318
+dataeval/metrics/bias/parity.py,sha256=wVMfzKFqzHkp3SNUJFjRH_Eej9DIg-xAhHkShIAek68,12755
+dataeval/metrics/estimators/__init__.py,sha256=oY_9jX7V-Kg7-4KpvMNB4rUhsk8QTA0DIoM8d2VtVIg,380
+dataeval/metrics/estimators/ber.py,sha256=p3KaY-rnK45CUDaqx-55wWG6yHcDnH6Kkkt9r6FkmZY,5003
+dataeval/metrics/estimators/divergence.py,sha256=QYkOs7In9un0tYHztwZ5kNqiWVNS3Lgmxn1716H8HG4,4243
+dataeval/metrics/estimators/uap.py,sha256=ELa5MixMOJZoW5rUuVLOXynfLMbVjxb-r7VYF5qqXrw,2139
+dataeval/metrics/stats/__init__.py,sha256=Js_mklHJbHwOXJtMFo9NIyePZLwLZL-jruwmcjoLsZc,1086
+dataeval/metrics/stats/base.py,sha256=U0yPaRSHuPGZk3A7hl8ghJCki7iBtW5wM1eZvElu1_w,12038
+dataeval/metrics/stats/boxratiostats.py,sha256=fNzHT_nZX0MYeHkWRdcfEz2mtRC2d1JxpoK3l4EBrQc,6301
+dataeval/metrics/stats/datasetstats.py,sha256=krOm48yjyzYOWKLaWFqHAQPmuhiN4manif7ZXh2Ohhg,5828
+dataeval/metrics/stats/dimensionstats.py,sha256=_mN7wHencHh4UNd9XUflhq0sIa9yLPk3yHqmossDEGk,3985
+dataeval/metrics/stats/hashstats.py,sha256=_zZOwnQDlpMoPyqbOV2v9V_Uqox0c4vX2Khv5u_fAk8,5068
+dataeval/metrics/stats/labelstats.py,sha256=mLH02Xy_uT-qN7HXuXEgs786T2Xr0BMudweBDeEWd5I,4065
+dataeval/metrics/stats/pixelstats.py,sha256=t8abfenA79x87CMqPuKtddglD3l_LA6nXS4K_FlL4-k,4148
+dataeval/metrics/stats/visualstats.py,sha256=UU0oa5BWuIOTDM1H1ZnlhYyu8ruVEnaLPCDOsbm-q1c,4546
+dataeval/output.py,sha256=hR5TJ67f7FgrZO9Du46aw-jvRpMjOimSgJSau4ZNK44,3565
+dataeval/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+dataeval/utils/__init__.py,sha256=fBpXVWzNaXySTuZWsD8Jg9LLHzb23nz_PfdxPD_gc8c,279
+dataeval/utils/dataset/__init__.py,sha256=IvRauQaa0CzJ5nZrfTSjGoaaKelyJcQDe3OPRw0-NXs,332
+dataeval/utils/dataset/datasets.py,sha256=7tSqN3d8UncqmXh4eiEwarXgVxc4sMuIKPTqBCE0pN8,15080
+dataeval/utils/dataset/read.py,sha256=tt-9blXzYLRb4Vgv6DrFj2ikUSvBF0-qTSnvvYec_2U,1523
+dataeval/utils/dataset/split.py,sha256=FpxHxmewjqIj6hikCsamNQTq877qu4HfKnzArOyvmyY,18957
+dataeval/utils/image.py,sha256=AQljELyMFkYsf2AoNOH5dZG8DYE4hPw0MCk85eIXqAw,1926
+dataeval/utils/metadata.py,sha256=mhMhBgb7nAIIljDdecOqiZ1zsYagE6h8DKxE_DFDW-E,22270
+dataeval/utils/plot.py,sha256=jQSiqDArFOlKZaIbv4Viso_ShU3LnZE-Y2qXKuKsa8M,3790
+dataeval/utils/shared.py,sha256=xvF3VLfyheVwJtdtDrneOobkKf7t-JTmf_w91FWXmqo,3616
+dataeval/utils/torch/__init__.py,sha256=dn5mjCrFp0b1aL_UEURhONU0Ag0cmXoTOBSGagpkTiA,325
+dataeval/utils/torch/blocks.py,sha256=HVhBTMMD5NA4qheMUgyol1KWiKZDIuc8k5j4RcMKmhk,1466
+dataeval/utils/torch/gmm.py,sha256=fQ8CBO4Bf6i9N1CZdeJ8VJP25fsPjgMextQkondwgvo,3693
+dataeval/utils/torch/internal.py,sha256=qAzQTwTI9Qy6f01Olw3d1TIJ4HoWGf0gQzgWVcdD2x4,6653
+dataeval/utils/torch/models.py,sha256=Df3B_9x5uu-Y5ZOyhRZYpKJnDvxt0hgMeJLy1E4oxpU,8519
+dataeval/utils/torch/trainer.py,sha256=Qay0LK63RuyoGYiJ5zI2C5BVym309ORvp6shhpcrIU4,5589
+dataeval/workflows/__init__.py,sha256=L9yfBipNFGnYuN2JbMknIHDvziwfa2XAGFnOwifZbls,216
+dataeval/workflows/sufficiency.py,sha256=nL99iDlu2bF_9VGu3ioLFDJBgBBJEdwEXROxXm_0sfY,18673
+dataeval-0.75.0.dist-info/LICENSE.txt,sha256=Kpzcfobf1HlqafF-EX6dQLw9TlJiaJzfgvLQFukyXYw,1060
+dataeval-0.75.0.dist-info/METADATA,sha256=6m2O6vreJR3Lq1_BXEU6DHnK2C5L_q5YAPofIl4kxCw,5410
+dataeval-0.75.0.dist-info/WHEEL,sha256=Nq82e9rUAnEjt98J6MlVmMCZb-t9cYE2Ir1kpBmnWfs,88
+dataeval-0.75.0.dist-info/RECORD,,
@@ -1,109 +0,0 @@
1
- """
2
- Source code derived from Alibi-Detect 0.11.4
3
- https://github.com/SeldonIO/alibi-detect/tree/v0.11.4
4
-
5
- Original code Copyright (c) 2023 Seldon Technologies Ltd
6
- Licensed under Apache Software License (Apache 2.0)
7
- """
8
-
9
- from __future__ import annotations
10
-
11
- from typing import Callable, cast
12
-
13
- import torch
14
- from numpy.typing import ArrayLike
15
-
16
- from dataeval.detectors.drift.torch import get_device
17
- from dataeval.detectors.ood.base import OODBaseMixin, OODFitMixin, OODGMMMixin
18
- from dataeval.interop import to_numpy
19
- from dataeval.utils.torch.gmm import gmm_params
20
- from dataeval.utils.torch.trainer import trainer
21
-
22
-
23
- class OODBase(OODBaseMixin[torch.nn.Module], OODFitMixin[Callable[..., torch.nn.Module], torch.optim.Optimizer]):
24
- def __init__(self, model: torch.nn.Module, device: str | torch.device | None = None) -> None:
25
- self.device: torch.device = get_device(device)
26
- super().__init__(model)
27
-
28
- def fit(
29
- self,
30
- x_ref: ArrayLike,
31
- threshold_perc: float,
32
- loss_fn: Callable[..., torch.nn.Module] | None,
33
- optimizer: torch.optim.Optimizer | None,
34
- epochs: int,
35
- batch_size: int,
36
- verbose: bool,
37
- ) -> None:
38
- """
39
- Train the model and infer the threshold value.
40
-
41
- Parameters
42
- ----------
43
- x_ref : ArrayLike
44
- Training data.
45
- threshold_perc : float, default 100.0
46
- Percentage of reference data that is normal.
47
- loss_fn : Callable | None, default None
48
- Loss function used for training.
49
- optimizer : Optimizer, default keras.optimizers.Adam
50
- Optimizer used for training.
51
- epochs : int, default 20
52
- Number of training epochs.
53
- batch_size : int, default 64
54
- Batch size used for training.
55
- verbose : bool, default True
56
- Whether to print training progress.
57
- """
58
-
59
- # Train the model
60
- trainer(
61
- model=self.model,
62
- x_train=to_numpy(x_ref),
63
- y_train=None,
64
- loss_fn=loss_fn,
65
- optimizer=optimizer,
66
- preprocess_fn=None,
67
- epochs=epochs,
68
- batch_size=batch_size,
69
- device=self.device,
70
- verbose=verbose,
71
- )
72
-
73
- # Infer the threshold values
74
- self._ref_score = self.score(x_ref, batch_size)
75
- self._threshold_perc = threshold_perc
76
-
77
-
78
- class OODBaseGMM(OODBase, OODGMMMixin[torch.Tensor]):
79
- def fit(
80
- self,
81
- x_ref: ArrayLike,
82
- threshold_perc: float,
83
- loss_fn: Callable[..., torch.nn.Module] | None,
84
- optimizer: torch.optim.Optimizer | None,
85
- epochs: int,
86
- batch_size: int,
87
- verbose: bool,
88
- ) -> None:
89
- # Train the model
90
- trainer(
91
- model=self.model,
92
- x_train=to_numpy(x_ref),
93
- y_train=None,
94
- loss_fn=loss_fn,
95
- optimizer=optimizer,
96
- preprocess_fn=None,
97
- epochs=epochs,
98
- batch_size=batch_size,
99
- device=self.device,
100
- verbose=verbose,
101
- )
102
-
103
- # Calculate the GMM parameters
104
- _, z, gamma = cast(tuple[torch.Tensor, torch.Tensor, torch.Tensor], self.model(x_ref))
105
- self._gmm_params = gmm_params(z, gamma)
106
-
107
- # Infer the threshold values
108
- self._ref_score = self.score(x_ref, batch_size)
109
- self._threshold_perc = threshold_perc
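Per the file list above, this logic moves into the reworked `dataeval/detectors/ood/base.py` and the new `mixin.py`. The instructive part of `fit()` is the threshold inference after training: score the reference data and treat `threshold_perc` percent of it as normal. A sketch of that step with illustrative data (not the dataeval API):

```
import numpy as np

# Instance-level OOD scores computed on the reference data x_ref.
ref_scores = np.array([0.11, 0.08, 0.14, 0.09, 0.92, 0.10])
threshold_perc = 95.0  # percentage of reference data assumed normal

# Scores above the 95th percentile of the reference scores flag OOD inputs.
threshold = np.percentile(ref_scores, threshold_perc)
is_ood = ref_scores > threshold
print(is_ood)  # [False False False False  True False]
```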