PyPI - dataeval - Versions diffs - 0.87.0__py3-none-any.whl → 0.88.1__py3-none-any.whl - Mend

dataeval 0.87.0__py3-none-any.whl → 0.88.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (56)

dataeval/_log.py +1 -1
dataeval/_version.py +2 -2
dataeval/data/_embeddings.py +78 -35
dataeval/data/_images.py +41 -8
dataeval/data/_metadata.py +294 -41
dataeval/data/_selection.py +22 -7
dataeval/data/_split.py +2 -1
dataeval/data/selections/_classfilter.py +4 -3
dataeval/data/selections/_indices.py +2 -1
dataeval/data/selections/_shuffle.py +3 -2
dataeval/detectors/drift/_base.py +2 -1
dataeval/detectors/drift/_mmd.py +2 -1
dataeval/detectors/drift/_nml/_base.py +1 -1
dataeval/detectors/drift/_nml/_chunk.py +2 -1
dataeval/detectors/drift/_nml/_result.py +3 -2
dataeval/detectors/drift/_nml/_thresholds.py +6 -5
dataeval/detectors/drift/_uncertainty.py +2 -1
dataeval/detectors/linters/duplicates.py +2 -1
dataeval/detectors/linters/outliers.py +4 -3
dataeval/detectors/ood/ae.py +1 -1
dataeval/detectors/ood/base.py +2 -1
dataeval/detectors/ood/mixin.py +2 -1
dataeval/metadata/_utils.py +1 -1
dataeval/metrics/bias/_balance.py +1 -1
dataeval/metrics/stats/_base.py +3 -29
dataeval/metrics/stats/_boxratiostats.py +2 -1
dataeval/metrics/stats/_dimensionstats.py +2 -1
dataeval/metrics/stats/_hashstats.py +2 -1
dataeval/metrics/stats/_pixelstats.py +2 -1
dataeval/metrics/stats/_visualstats.py +2 -1
dataeval/outputs/_base.py +2 -3
dataeval/outputs/_bias.py +2 -1
dataeval/outputs/_estimators.py +1 -1
dataeval/outputs/_linters.py +3 -3
dataeval/outputs/_stats.py +3 -3
dataeval/outputs/_utils.py +1 -1
dataeval/outputs/_workflows.py +85 -30
dataeval/typing.py +11 -9
dataeval/utils/_array.py +3 -2
dataeval/utils/_bin.py +2 -1
dataeval/utils/_method.py +2 -3
dataeval/utils/_multiprocessing.py +34 -0
dataeval/utils/_plot.py +2 -1
dataeval/utils/data/__init__.py +4 -5
dataeval/utils/data/{metadata.py → _merge.py} +3 -2
dataeval/utils/data/_validate.py +2 -1
dataeval/utils/data/collate.py +2 -1
dataeval/utils/torch/_internal.py +2 -1
dataeval/utils/torch/trainer.py +1 -1
dataeval/workflows/sufficiency.py +12 -9
{dataeval-0.87.0.dist-info → dataeval-0.88.1.dist-info}/METADATA +4 -5
dataeval-0.88.1.dist-info/RECORD +105 -0
dataeval/utils/data/_dataset.py +0 -253
dataeval-0.87.0.dist-info/RECORD +0 -105
{dataeval-0.87.0.dist-info → dataeval-0.88.1.dist-info}/WHEEL +0 -0
{dataeval-0.87.0.dist-info → dataeval-0.88.1.dist-info}/licenses/LICENSE +0 -0

dataeval/detectors/drift/_nml/_base.py CHANGED Viewed

@@ -9,8 +9,8 @@ from __future__ import annotations
 import logging
 from abc import ABC, abstractmethod
+from collections.abc import Sequence
 from logging import Logger
-from typing import Sequence
 import pandas as pd
 from typing_extensions import Self

dataeval/detectors/drift/_nml/_chunk.py CHANGED Viewed

@@ -13,7 +13,8 @@ import copy
 import logging
 import warnings
 from abc import ABC, abstractmethod
-from typing import Any, Generic, Literal, Sequence, TypeVar, cast
+from collections.abc import Sequence
+from typing import Any, Generic, Literal, TypeVar, cast
 import pandas as pd
 from pandas import Index, Period

dataeval/detectors/drift/_nml/_result.py CHANGED Viewed

@@ -11,7 +11,8 @@ from __future__ import annotations
 import copy
 from abc import ABC, abstractmethod
-from typing import NamedTuple, Sequence
+from collections.abc import Sequence
+from typing import NamedTuple
 import pandas as pd
 from typing_extensions import Self
@@ -52,7 +53,7 @@ class AbstractResult(GenericOutput[pd.DataFrame]):
     def filter(self, period: str = "all", metrics: str | Sequence[str] | None = None) -> Self:
         """Returns filtered result metric data."""
-        if metrics and not isinstance(metrics, (str, Sequence)):
+        if metrics and not isinstance(metrics, str | Sequence):
             raise ValueError("metrics value provided is not a valid metric or sequence of metrics")
         if isinstance(metrics, str):
             metrics = [metrics]

dataeval/detectors/drift/_nml/_thresholds.py CHANGED Viewed

@@ -9,7 +9,8 @@ from __future__ import annotations
 import logging
 from abc import ABC, abstractmethod
-from typing import Any, Callable, ClassVar
+from collections.abc import Callable
+from typing import Any, ClassVar
 import numpy as np
@@ -169,10 +170,10 @@ class ConstantThreshold(Threshold, threshold_type="constant"):
     @staticmethod
     def _validate_inputs(lower: float | int | None = None, upper: float | int | None = None) -> None:
-        if lower is not None and not isinstance(lower, (float, int)) or isinstance(lower, bool):
+        if lower is not None and not isinstance(lower, float | int) or isinstance(lower, bool):
             raise ValueError(f"expected type of 'lower' to be 'float', 'int' or None but got '{type(lower).__name__}'")
-        if upper is not None and not isinstance(upper, (float, int)) or isinstance(upper, bool):
+        if upper is not None and not isinstance(upper, float | int) or isinstance(upper, bool):
             raise ValueError(f"expected type of 'upper' to be 'float', 'int' or None but got '{type(upper).__name__}'")
         # explicit None check is required due to special interpretation of the value 0.0 as False
@@ -244,7 +245,7 @@ class StandardDeviationThreshold(Threshold, threshold_type="standard_deviation")
     ) -> None:
         if (
             std_lower_multiplier is not None
-            and not isinstance(std_lower_multiplier, (float, int))
+            and not isinstance(std_lower_multiplier, float | int)
             or isinstance(std_lower_multiplier, bool)
         ):
             raise ValueError(
@@ -257,7 +258,7 @@ class StandardDeviationThreshold(Threshold, threshold_type="standard_deviation")
         if (
             std_upper_multiplier is not None
-            and not isinstance(std_upper_multiplier, (float, int))
+            and not isinstance(std_upper_multiplier, float | int)
             or isinstance(std_upper_multiplier, bool)
         ):
             raise ValueError(

dataeval/detectors/drift/_uncertainty.py CHANGED Viewed

@@ -10,7 +10,8 @@ from __future__ import annotations
 __all__ = []
-from typing import Literal, Sequence, cast
+from collections.abc import Sequence
+from typing import Literal, cast
 import numpy as np
 import torch

dataeval/detectors/linters/duplicates.py CHANGED Viewed

@@ -2,7 +2,8 @@ from __future__ import annotations
 __all__ = []
-from typing import Any, Sequence, overload
+from collections.abc import Sequence
+from typing import Any, overload
 from dataeval.data._images import Images
 from dataeval.metrics.stats import hashstats

dataeval/detectors/linters/outliers.py CHANGED Viewed

@@ -2,7 +2,8 @@ from __future__ import annotations
 __all__ = []
-from typing import Any, Literal, Sequence, overload
+from collections.abc import Sequence
+from typing import Any, Literal, overload
 import numpy as np
 from numpy.typing import NDArray
@@ -201,7 +202,7 @@ class Outliers:
         >>> results.issues[1]
         {}
         """
-        if isinstance(stats, (ImageStatsOutput, DimensionStatsOutput, PixelStatsOutput, VisualStatsOutput)):
+        if isinstance(stats, ImageStatsOutput | DimensionStatsOutput | PixelStatsOutput | VisualStatsOutput):
             return OutliersOutput(self._get_outliers(stats.data()))
         if not isinstance(stats, Sequence):
@@ -212,7 +213,7 @@ class Outliers:
         stats_map: dict[type, list[int]] = {}
         for i, stats_output in enumerate(stats):
             if not isinstance(
-                stats_output, (ImageStatsOutput, DimensionStatsOutput, PixelStatsOutput, VisualStatsOutput)
+                stats_output, ImageStatsOutput | DimensionStatsOutput | PixelStatsOutput | VisualStatsOutput
             ):
                 raise TypeError(
                     "Invalid stats output type; only use output from dimensionstats, pixelstats or visualstats."

dataeval/detectors/ood/ae.py CHANGED Viewed

@@ -12,7 +12,7 @@ from __future__ import annotations
 __all__ = []
-from typing import Callable
+from collections.abc import Callable
 import numpy as np
 import torch

dataeval/detectors/ood/base.py CHANGED Viewed

@@ -11,7 +11,8 @@ from __future__ import annotations
 __all__ = []
 from abc import ABC, abstractmethod
-from typing import Any, Callable, cast
+from collections.abc import Callable
+from typing import Any, cast
 import numpy as np
 import torch

dataeval/detectors/ood/mixin.py CHANGED Viewed

@@ -3,7 +3,8 @@ from __future__ import annotations
 __all__ = []
 from abc import ABC, abstractmethod
-from typing import Callable, Generic, Literal, TypeVar
+from collections.abc import Callable
+from typing import Generic, Literal, TypeVar
 import numpy as np
 from numpy.typing import NDArray

dataeval/metadata/_utils.py CHANGED Viewed

@@ -1,6 +1,6 @@
 __all__ = []
-from typing import Sequence
+from collections.abc import Sequence
 from numpy.typing import NDArray

dataeval/metrics/bias/_balance.py CHANGED Viewed

@@ -16,7 +16,7 @@ from dataeval.utils._bin import get_counts
 def _validate_num_neighbors(num_neighbors: int) -> int:
-    if not isinstance(num_neighbors, (int, float)):
+    if not isinstance(num_neighbors, int | float):
         raise TypeError(
             f"Variable {num_neighbors} is not real-valued numeric type."
             "num_neighbors should be an int, greater than 0 and less than"

dataeval/metrics/stats/_base.py CHANGED Viewed

@@ -6,11 +6,11 @@ import math
 import re
 import warnings
 from collections import ChainMap
+from collections.abc import Callable, Iterable, Iterator, Sequence
 from copy import deepcopy
 from dataclasses import dataclass
 from functools import partial
-from multiprocessing import Pool
-from typing import Any, Callable, Generic, Iterable, Iterator, Sequence, TypeVar
+from typing import Any, Generic, TypeVar
 import numpy as np
 from numpy.typing import NDArray
@@ -21,14 +21,12 @@ from dataeval.outputs._stats import BASE_ATTRS, BaseStatsOutput, SourceIndex
 from dataeval.typing import Array, ArrayLike, Dataset, ObjectDetectionTarget
 from dataeval.utils._array import as_numpy, to_numpy
 from dataeval.utils._image import clip_and_pad, clip_box, is_valid_box, normalize_image_shape, rescale
+from dataeval.utils._multiprocessing import PoolWrapper
 DTYPE_REGEX = re.compile(r"NDArray\[np\.(.*?)\]")
 TStatsOutput = TypeVar("TStatsOutput", bound=BaseStatsOutput, covariant=True)
-_S = TypeVar("_S")
-_T = TypeVar("_T")
 @dataclass
 class BoundingBox:
@@ -67,30 +65,6 @@ class BoundingBox:
         return x0_int, y0_int, x1_int, y1_int
-class PoolWrapper:
-    """
-    Wraps `multiprocessing.Pool` to allow for easy switching between
-    multiprocessing and single-threaded execution.
-    This helps with debugging and profiling, as well as usage with Jupyter notebooks
-    in VS Code, which does not support subprocess debugging.
-    """
-    def __init__(self, processes: int | None) -> None:
-        self.pool = Pool(processes) if processes is None or processes > 1 else None
-    def imap(self, func: Callable[[_S], _T], iterable: Iterable[_S]) -> Iterator[_T]:
-        return map(func, iterable) if self.pool is None else self.pool.imap(func, iterable)
-    def __enter__(self, *args: Any, **kwargs: Any) -> PoolWrapper:
-        return self
-    def __exit__(self, *args: Any) -> None:
-        if self.pool is not None:
-            self.pool.close()
-            self.pool.join()
 class StatsProcessor(Generic[TStatsOutput]):
     output_class: type[TStatsOutput]
     cache_keys: set[str] = set()

dataeval/metrics/stats/_boxratiostats.py CHANGED Viewed

@@ -3,7 +3,8 @@ from __future__ import annotations
 __all__ = []
 import copy
-from typing import Any, Callable, Generic, TypeVar, cast
+from collections.abc import Callable
+from typing import Any, Generic, TypeVar, cast
 import numpy as np
 from numpy.typing import NDArray

dataeval/metrics/stats/_dimensionstats.py CHANGED Viewed

@@ -2,7 +2,8 @@ from __future__ import annotations
 __all__ = []
-from typing import Any, Callable
+from collections.abc import Callable
+from typing import Any
 import numpy as np

dataeval/metrics/stats/_hashstats.py CHANGED Viewed

@@ -4,7 +4,8 @@ import warnings
 __all__ = []
-from typing import Any, Callable
+from collections.abc import Callable
+from typing import Any
 import numpy as np
 import xxhash as xxh

dataeval/metrics/stats/_pixelstats.py CHANGED Viewed

@@ -2,7 +2,8 @@ from __future__ import annotations
 __all__ = []
-from typing import Any, Callable
+from collections.abc import Callable
+from typing import Any
 import numpy as np
 from scipy.stats import entropy, kurtosis, skew

dataeval/metrics/stats/_visualstats.py CHANGED Viewed

@@ -2,7 +2,8 @@ from __future__ import annotations
 __all__ = []
-from typing import Any, Callable
+from collections.abc import Callable
+from typing import Any
 import numpy as np

dataeval/outputs/_base.py CHANGED Viewed

@@ -4,14 +4,13 @@ __all__ = []
 import inspect
 import logging
-from collections.abc import Collection, Mapping, Sequence
+from collections.abc import Callable, Collection, Iterator, Mapping, Sequence
 from dataclasses import dataclass
 from datetime import datetime, timezone
 from functools import partial, wraps
-from typing import Any, Callable, Generic, Iterator, TypeVar, overload
+from typing import Any, Generic, ParamSpec, TypeVar, overload
 import numpy as np
-from typing_extensions import ParamSpec
 from dataeval import __version__

dataeval/outputs/_bias.py CHANGED Viewed

@@ -3,8 +3,9 @@ from __future__ import annotations
 __all__ = []
 import contextlib
+from collections.abc import Mapping, Sequence
 from dataclasses import asdict, dataclass
-from typing import Any, Mapping, Sequence, TypeVar
+from typing import Any, TypeVar
 import numpy as np
 import pandas as pd

dataeval/outputs/_estimators.py CHANGED Viewed

@@ -2,8 +2,8 @@ from __future__ import annotations
 __all__ = []
+from collections.abc import Sequence
 from dataclasses import dataclass
-from typing import Sequence
 import numpy as np
 from numpy.typing import NDArray

dataeval/outputs/_linters.py CHANGED Viewed

@@ -2,11 +2,11 @@ from __future__ import annotations
 __all__ = []
+from collections.abc import Mapping, Sequence
 from dataclasses import dataclass
-from typing import Generic, Mapping, Sequence, TypeVar, Union
+from typing import Generic, TypeAlias, TypeVar
 import pandas as pd
-from typing_extensions import TypeAlias
 from dataeval.outputs._base import Output
 from dataeval.outputs._stats import DimensionStatsOutput, LabelStatsOutput, PixelStatsOutput, VisualStatsOutput
@@ -16,7 +16,7 @@ DatasetDuplicateGroupMap: TypeAlias = Mapping[int, DuplicateGroup]
 TIndexCollection = TypeVar("TIndexCollection", DuplicateGroup, DatasetDuplicateGroupMap)
 IndexIssueMap: TypeAlias = Mapping[int, Mapping[str, float]]
-OutlierStatsOutput: TypeAlias = Union[DimensionStatsOutput, PixelStatsOutput, VisualStatsOutput]
+OutlierStatsOutput: TypeAlias = DimensionStatsOutput | PixelStatsOutput | VisualStatsOutput
 TIndexIssueMap = TypeVar("TIndexIssueMap", IndexIssueMap, Sequence[IndexIssueMap])

dataeval/outputs/_stats.py CHANGED Viewed

@@ -2,13 +2,13 @@ from __future__ import annotations
 __all__ = []
+from collections.abc import Iterable, Mapping, Sequence
 from dataclasses import dataclass
-from typing import TYPE_CHECKING, Any, Iterable, Mapping, NamedTuple, Optional, Sequence, Union
+from typing import TYPE_CHECKING, Any, NamedTuple, TypeAlias
 import numpy as np
 import polars as pl
 from numpy.typing import NDArray
-from typing_extensions import TypeAlias
 from dataeval.outputs._base import Output
 from dataeval.utils._plot import channel_histogram_plot, histogram_plot
@@ -16,7 +16,7 @@ from dataeval.utils._plot import channel_histogram_plot, histogram_plot
 if TYPE_CHECKING:
     from matplotlib.figure import Figure
-OptionalRange: TypeAlias = Optional[Union[int, Iterable[int]]]
+OptionalRange: TypeAlias = int | Iterable[int] | None
 SOURCE_INDEX = "source_index"
 OBJECT_COUNT = "object_count"

dataeval/outputs/_utils.py CHANGED Viewed

@@ -2,8 +2,8 @@ from __future__ import annotations
 __all__ = []
+from collections.abc import Sequence
 from dataclasses import dataclass
-from typing import Sequence
 import numpy as np
 from numpy.typing import NDArray

dataeval/outputs/_workflows.py CHANGED Viewed

@@ -4,8 +4,9 @@ __all__ = []
 import contextlib
 import warnings
-from dataclasses import dataclass
-from typing import Any, Iterable, Mapping, Sequence, cast
+from collections.abc import Iterable, Mapping, MutableMapping, Sequence
+from dataclasses import dataclass, field
+from typing import Any, cast
 import numpy as np
 from numpy.typing import NDArray
@@ -61,9 +62,12 @@ def project_steps(params: NDArray[Any], projection: NDArray[Any]) -> NDArray[Any
 def plot_measure(
     name: str,
     steps: NDArray[Any],
-    measure: NDArray[Any],
+    averaged_measure: NDArray[Any],
+    measures: NDArray[Any] | None,
     params: NDArray[Any],
     projection: NDArray[Any],
+    error_bars: bool,
+    asymptote: bool,
 ) -> Figure:
     import matplotlib.pyplot
@@ -72,23 +76,51 @@ def plot_measure(
     fig.tight_layout()
     ax = fig.add_subplot(111)
     ax.set_title(f"{name} Sufficiency")
     ax.set_ylabel(f"{name}")
     ax.set_xlabel("Steps")
-    # Plot measure over each step
-    ax.scatter(steps, measure, label=f"Model Results ({name})", s=15, c="black")
+    # Plot asymptote
+    if asymptote:
+        bound = 1 - params[2]
+        ax.axhline(y=bound, color="r", label=f"Asymptote: {bound:.4g}", zorder=1)
+    # Calculate error bars
+    # Plot measure over each step with associated error
+    if error_bars:
+        if measures is None:
+            warnings.warn(
+                "Error bars cannot be plotted without full, unaveraged data",
+                UserWarning,
+            )
+        else:
+            error = np.std(measures, axis=0)
+            ax.errorbar(
+                steps,
+                averaged_measure,
+                yerr=error,
+                capsize=7,
+                capthick=1.5,
+                elinewidth=1.5,
+                fmt="o",
+                label=f"Model Results ({name})",
+                markersize=5,
+                color="black",
+                ecolor="orange",
+                zorder=3,
+            )
+    else:
+        ax.scatter(steps, averaged_measure, label=f"Model Results ({name})", zorder=3, c="black")
     # Plot extrapolation
     ax.plot(
         projection,
         project_steps(params, projection),
         linestyle="dashed",
         label=f"Potential Model Results ({name})",
+        linewidth=2,
+        zorder=2,
     )
+    ax.set_xscale("log")
-    ax.legend()
+    ax.legend(loc="best")
     return fig
@@ -145,7 +177,7 @@ def inv_project_steps(params: NDArray[Any], targets: NDArray[Any]) -> NDArray[np
     return np.ceil(steps)
-def calc_params(p_i: NDArray[Any], n_i: NDArray[Any], niter: int) -> NDArray[Any]:
+def calc_params(p_i: NDArray[Any], n_i: NDArray[Any], niter: int) -> NDArray[np.float64]:
     """
     Retrieves the inverse power curve coefficients for the line of best fit.
     Global minimization is done via basin hopping. More info on this algorithm
@@ -191,11 +223,11 @@ def calc_params(p_i: NDArray[Any], n_i: NDArray[Any], niter: int) -> NDArray[Any
 def get_curve_params(
-    measures: Mapping[str, NDArray[Any]], ranges: NDArray[Any], niter: int
-) -> Mapping[str, NDArray[Any]]:
+    averaged_measures: MutableMapping[str, NDArray[Any]], ranges: NDArray[Any], niter: int
+) -> Mapping[str, NDArray[np.float64]]:
     """Calculates and aggregates parameters for both single and multi-class metrics"""
     output = {}
-    for name, measure in measures.items():
+    for name, measure in averaged_measures.items():
         measure = cast(np.ndarray, measure)
         if measure.ndim > 1:
             result = []
@@ -216,19 +248,25 @@ class SufficiencyOutput(Output):
     ----------
     steps : NDArray
         Array of sample sizes
-    measures : Dict[str, NDArray]
-        Average of values observed for each sample size step for each measure
+    measures : dict[str, NDArray]
+        3D array [runs, substep, classes] of values for all runs observed for each sample size step for each measure
+    averaged_measures : dict[str, NDArray]
+        Average of values for all runs observed for each sample size step for each measure
     n_iter : int, default 1000
         Number of iterations to perform in the basin-hopping curve-fit process
     """
     steps: NDArray[np.uint32]
-    measures: Mapping[str, NDArray[np.float64]]
+    measures: Mapping[str, NDArray[Any]]
+    averaged_measures: MutableMapping[str, NDArray[Any]] = field(default_factory=lambda: {})
     n_iter: int = 1000
     def __post_init__(self) -> None:
+        if len(self.averaged_measures) == 0:
+            for metric, values in self.measures.items():
+                self.averaged_measures[metric] = np.asarray(np.mean(values, axis=0)).T
         c = len(self.steps)
-        for m, v in self.measures.items():
+        for m, v in self.averaged_measures.items():
             c_v = v.shape[1] if v.ndim > 1 else len(v)
             if c != c_v:
                 raise ValueError(f"{m} does not contain the expected number ({c}) of data points.")
@@ -239,7 +277,7 @@ class SufficiencyOutput(Output):
         if self._params is None:
             self._params = {}
         if self.n_iter not in self._params:
-            self._params[self.n_iter] = get_curve_params(self.measures, self.steps, self.n_iter)
+            self._params[self.n_iter] = get_curve_params(self.averaged_measures, self.steps, self.n_iter)
         return self._params[self.n_iter]
     @set_metadata
@@ -272,20 +310,22 @@ class SufficiencyOutput(Output):
             raise ValueError("'projection' must consist of numerical values")
         output = {}
-        for name, measures in self.measures.items():
-            if measures.ndim > 1:
+        for name, averaged_measures in self.averaged_measures.items():
+            if averaged_measures.ndim > 1:
                 result = []
-                for i in range(len(measures)):
+                for i in range(len(averaged_measures)):
                     projected = project_steps(self.params[name][i], projection)
                     result.append(projected)
                 output[name] = np.array(result)
             else:
                 output[name] = project_steps(self.params[name], projection)
-        proj = SufficiencyOutput(projection, output, self.n_iter)
+        proj = SufficiencyOutput(projection, {}, output, self.n_iter)
         proj._params = self._params
         return proj
-    def plot(self, class_names: Sequence[str] | None = None) -> Sequence[Figure]:
+    def plot(
+        self, class_names: Sequence[str] | None = None, error_bars: bool = False, asymptote: bool = False
+    ) -> Sequence[Figure]:
         """
         Plotting function for data :term:`sufficience<Sufficiency>` tasks.
@@ -293,6 +333,10 @@ class SufficiencyOutput(Output):
         ----------
         class_names : Sequence[str] | None, default None
             List of class names
+        error_bars : bool, default False
+            True if error bars should be plotted, False if not
+        asymptote : bool, default False
+            True if asymptote should be plotted, False if not
         Returns
         -------
@@ -315,25 +359,36 @@ class SufficiencyOutput(Output):
         # Stores all plots
         plots = []
         # Create a plot for each measure on one figure
-        for name, measures in self.measures.items():
+        for name, measures in self.averaged_measures.items():
             if measures.ndim > 1:
                 if class_names is not None and len(measures) != len(class_names):
                     raise IndexError("Class name count does not align with measures")
-                for i, measure in enumerate(measures):
+                for i, values in enumerate(measures):
                     class_name = str(i) if class_names is None else class_names[i]
                     fig = plot_measure(
                         f"{name}_{class_name}",
                         self.steps,
-                        measure,
+                        values,
+                        self.measures[name][:, :, i] if len(self.measures) else None,
                         self.params[name][i],
                         extrapolated,
+                        error_bars,
+                        asymptote,
                     )
                     plots.append(fig)
             else:
-                fig = plot_measure(name, self.steps, measures, self.params[name], extrapolated)
+                fig = plot_measure(
+                    name,
+                    self.steps,
+                    measures,
+                    self.measures.get(name),
+                    self.params[name],
+                    extrapolated,
+                    error_bars,
+                    asymptote,
+                )
                 plots.append(fig)
         return plots
@@ -363,10 +418,10 @@ class SufficiencyOutput(Output):
         for name, target in targets.items():
             tarray = as_numpy(target)
-            if name not in self.measures:
+            if name not in self.averaged_measures:
                 continue
-            measure = self.measures[name]
+            measure = self.averaged_measures[name]
             if measure.ndim > 1:
                 projection[name] = np.zeros((len(measure), len(tarray)))
                 for i in range(len(measure)):

dataeval 0.87.0__py3-none-any.whl → 0.88.1__py3-none-any.whl

dataeval 0.87.0__py3-none-any.whl → 0.88.1__py3-none-any.whl