anemoi-datasets 0.5.26__py3-none-any.whl → 0.5.27__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- anemoi/datasets/__init__.py +1 -2
- anemoi/datasets/_version.py +16 -3
- anemoi/datasets/commands/check.py +1 -1
- anemoi/datasets/commands/copy.py +1 -2
- anemoi/datasets/commands/create.py +1 -1
- anemoi/datasets/commands/inspect.py +27 -35
- anemoi/datasets/commands/validate.py +59 -0
- anemoi/datasets/compute/recentre.py +3 -6
- anemoi/datasets/create/__init__.py +22 -25
- anemoi/datasets/create/check.py +10 -12
- anemoi/datasets/create/chunks.py +1 -2
- anemoi/datasets/create/config.py +3 -6
- anemoi/datasets/create/filter.py +1 -2
- anemoi/datasets/create/input/__init__.py +1 -2
- anemoi/datasets/create/input/action.py +3 -5
- anemoi/datasets/create/input/concat.py +5 -8
- anemoi/datasets/create/input/context.py +3 -6
- anemoi/datasets/create/input/data_sources.py +5 -8
- anemoi/datasets/create/input/empty.py +1 -2
- anemoi/datasets/create/input/filter.py +2 -3
- anemoi/datasets/create/input/function.py +1 -2
- anemoi/datasets/create/input/join.py +4 -5
- anemoi/datasets/create/input/misc.py +4 -6
- anemoi/datasets/create/input/repeated_dates.py +13 -18
- anemoi/datasets/create/input/result.py +29 -33
- anemoi/datasets/create/input/step.py +4 -8
- anemoi/datasets/create/input/template.py +3 -4
- anemoi/datasets/create/input/trace.py +1 -1
- anemoi/datasets/create/patch.py +1 -2
- anemoi/datasets/create/persistent.py +3 -5
- anemoi/datasets/create/size.py +1 -3
- anemoi/datasets/create/sources/accumulations.py +47 -52
- anemoi/datasets/create/sources/accumulations2.py +4 -8
- anemoi/datasets/create/sources/constants.py +1 -3
- anemoi/datasets/create/sources/empty.py +1 -2
- anemoi/datasets/create/sources/fdb.py +133 -0
- anemoi/datasets/create/sources/forcings.py +1 -2
- anemoi/datasets/create/sources/grib.py +6 -10
- anemoi/datasets/create/sources/grib_index.py +13 -15
- anemoi/datasets/create/sources/hindcasts.py +2 -5
- anemoi/datasets/create/sources/legacy.py +1 -1
- anemoi/datasets/create/sources/mars.py +17 -21
- anemoi/datasets/create/sources/netcdf.py +1 -2
- anemoi/datasets/create/sources/opendap.py +1 -3
- anemoi/datasets/create/sources/patterns.py +4 -6
- anemoi/datasets/create/sources/recentre.py +8 -11
- anemoi/datasets/create/sources/source.py +3 -6
- anemoi/datasets/create/sources/tendencies.py +2 -5
- anemoi/datasets/create/sources/xarray.py +4 -6
- anemoi/datasets/create/sources/xarray_support/__init__.py +12 -13
- anemoi/datasets/create/sources/xarray_support/coordinates.py +8 -12
- anemoi/datasets/create/sources/xarray_support/field.py +16 -12
- anemoi/datasets/create/sources/xarray_support/fieldlist.py +11 -15
- anemoi/datasets/create/sources/xarray_support/flavour.py +42 -42
- anemoi/datasets/create/sources/xarray_support/grid.py +15 -9
- anemoi/datasets/create/sources/xarray_support/metadata.py +19 -128
- anemoi/datasets/create/sources/xarray_support/patch.py +4 -6
- anemoi/datasets/create/sources/xarray_support/time.py +10 -13
- anemoi/datasets/create/sources/xarray_support/variable.py +21 -21
- anemoi/datasets/create/sources/xarray_zarr.py +1 -2
- anemoi/datasets/create/sources/zenodo.py +3 -5
- anemoi/datasets/create/statistics/__init__.py +3 -6
- anemoi/datasets/create/testing.py +4 -0
- anemoi/datasets/create/typing.py +1 -2
- anemoi/datasets/create/utils.py +1 -2
- anemoi/datasets/create/zarr.py +7 -2
- anemoi/datasets/data/__init__.py +15 -6
- anemoi/datasets/data/complement.py +7 -12
- anemoi/datasets/data/concat.py +5 -8
- anemoi/datasets/data/dataset.py +42 -47
- anemoi/datasets/data/debug.py +7 -9
- anemoi/datasets/data/ensemble.py +4 -6
- anemoi/datasets/data/fill_missing.py +7 -10
- anemoi/datasets/data/forwards.py +22 -26
- anemoi/datasets/data/grids.py +12 -16
- anemoi/datasets/data/indexing.py +9 -12
- anemoi/datasets/data/interpolate.py +7 -15
- anemoi/datasets/data/join.py +8 -12
- anemoi/datasets/data/masked.py +6 -11
- anemoi/datasets/data/merge.py +5 -9
- anemoi/datasets/data/misc.py +41 -45
- anemoi/datasets/data/missing.py +11 -16
- anemoi/datasets/data/observations/__init__.py +8 -14
- anemoi/datasets/data/padded.py +3 -5
- anemoi/datasets/data/records/backends/__init__.py +2 -2
- anemoi/datasets/data/rescale.py +5 -12
- anemoi/datasets/data/select.py +13 -16
- anemoi/datasets/data/statistics.py +4 -7
- anemoi/datasets/data/stores.py +16 -21
- anemoi/datasets/data/subset.py +8 -11
- anemoi/datasets/data/unchecked.py +7 -11
- anemoi/datasets/data/xy.py +25 -21
- anemoi/datasets/dates/__init__.py +13 -18
- anemoi/datasets/dates/groups.py +7 -10
- anemoi/datasets/grids.py +5 -9
- anemoi/datasets/testing.py +93 -7
- anemoi/datasets/validate.py +598 -0
- {anemoi_datasets-0.5.26.dist-info → anemoi_datasets-0.5.27.dist-info}/METADATA +4 -4
- anemoi_datasets-0.5.27.dist-info/RECORD +134 -0
- anemoi/datasets/utils/__init__.py +0 -8
- anemoi_datasets-0.5.26.dist-info/RECORD +0 -131
- {anemoi_datasets-0.5.26.dist-info → anemoi_datasets-0.5.27.dist-info}/WHEEL +0 -0
- {anemoi_datasets-0.5.26.dist-info → anemoi_datasets-0.5.27.dist-info}/entry_points.txt +0 -0
- {anemoi_datasets-0.5.26.dist-info → anemoi_datasets-0.5.27.dist-info}/licenses/LICENSE +0 -0
- {anemoi_datasets-0.5.26.dist-info → anemoi_datasets-0.5.27.dist-info}/top_level.txt +0 -0
anemoi/datasets/create/zarr.py
CHANGED
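
The last hunk below extends the registry cleanup so that the "_build" working directory next to the Zarr store is also removed, tolerating its absence. A minimal standalone sketch of that pattern, with a hypothetical store path:

import shutil

zarr_path = "/tmp/example-dataset.zarr"  # hypothetical store location

_build = zarr_path + "/_build"
try:
    shutil.rmtree(_build)  # drop the build working directory if it exists
except FileNotFoundError:
    pass  # nothing to clean up
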
@@ -11,7 +11,6 @@ import datetime
 import logging
 import shutil
 from typing import Any
-from typing import Optional

 import numpy as np
 import zarr
@@ -120,7 +119,7 @@ class ZarrBuiltRegistry:
     flags = None
     z = None

-    def __init__(self, path: str, synchronizer_path:
+    def __init__(self, path: str, synchronizer_path: str | None = None, use_threads: bool = False):
         """Initialize the ZarrBuiltRegistry.

         Parameters
@@ -154,6 +153,12 @@ class ZarrBuiltRegistry:
         except FileNotFoundError:
             pass

+        _build = self.zarr_path + "/_build"
+        try:
+            shutil.rmtree(_build)
+        except FileNotFoundError:
+            pass
+
     def _open_write(self) -> zarr.Group:
         """Open the Zarr store in write mode."""
         import zarr

anemoi/datasets/data/__init__.py
CHANGED
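
The hunks below make open_dataset honour an ANEMOI_DATASETS_TRACE environment variable (wrapping the opened dataset in anemoi.datasets.testing.Trace when the variable is a non-zero integer) and give save_dataset an explicit signature. A hedged usage sketch based only on those signatures; the dataset reference and output path are placeholders:

import os

from anemoi.datasets.data import open_dataset, save_dataset

os.environ["ANEMOI_DATASETS_TRACE"] = "1"  # read at call time inside open_dataset via int(os.environ.get(...))

ds = open_dataset("path/to/some-dataset.zarr")  # placeholder dataset reference
save_dataset(ds, "/tmp/some-dataset-copy.zarr", n_workers=4)
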
@@ -8,9 +8,9 @@
 # nor does it submit to any jurisdiction.

 import logging
+import os
 from typing import TYPE_CHECKING
 from typing import Any
-from typing import Set

 # from .dataset import FullIndex
 # from .dataset import Shape
@@ -82,6 +82,9 @@ def open_dataset(*args: Any, **kwargs: Any) -> "Dataset":
     Dataset
         The opened dataset.
     """
+
+    trace = int(os.environ.get("ANEMOI_DATASETS_TRACE", 0))
+
     # That will get rid of OmegaConf objects

     args, kwargs = _convert(args), _convert(kwargs)
@@ -90,22 +93,28 @@ def open_dataset(*args: Any, **kwargs: Any) -> "Dataset":
     ds = ds.mutate()
     ds.arguments = {"args": args, "kwargs": kwargs}
     ds._check()
+
+    if trace:
+        from anemoi.datasets.testing import Trace
+
+        ds = Trace(ds)
+
     return ds


-def save_dataset(
+def save_dataset(dataset: "Dataset", zarr_path: str, n_workers: int = 1) -> None:
     """Open a dataset and save it to disk.

     Parameters
     ----------
-
-
+    dataset : Dataset
+        anemoi-dataset opened from python to save to Zarr store
     zarr_path : str
         Path to store the obtained anemoi dataset to disk.
     n_workers : int
         Number of workers to use for parallel processing. If none, sequential processing will be performed.
     """
-    _save_dataset(
+    _save_dataset(dataset, zarr_path, n_workers)


 def list_dataset_names(*args: Any, **kwargs: Any) -> list[str]:
@@ -124,6 +133,6 @@ def list_dataset_names(*args: Any, **kwargs: Any) -> list[str]:
         The list of dataset names.
     """
     ds = _open_dataset(*args, **kwargs)
-    names:
+    names: set[str] = set()
     ds.get_dataset_names(names)
     return sorted(names)

anemoi/datasets/data/complement.py
CHANGED

@@ -12,11 +12,6 @@ import logging
 from abc import abstractmethod
 from functools import cached_property
 from typing import Any
-from typing import Dict
-from typing import List
-from typing import Optional
-from typing import Set
-from typing import Tuple

 import numpy as np
 from numpy.typing import NDArray
@@ -91,26 +86,26 @@ class Complement(Combined):
         raise ValueError("Augment: no missing variables")

     @property
-    def variables(self) ->
+    def variables(self) -> list[str]:
         """Returns the list of variables to be added to the target dataset."""
         return self._variables

     @property
-    def statistics(self) ->
+    def statistics(self) -> dict[str, NDArray[Any]]:
         datasets = [self._source, self._target]
         return {
             k: [d.statistics[k][d.name_to_index[i]] for d in datasets for i in d.variables if i in self.variables]
             for k in datasets[0].statistics
         }

-    def statistics_tendencies(self, delta:
+    def statistics_tendencies(self, delta: datetime.timedelta | None = None) -> dict[str, NDArray[Any]]:
         index = [self._source.name_to_index[v] for v in self._variables]
         if delta is None:
             delta = self.frequency
         return {k: v[index] for k, v in self._source.statistics_tendencies(delta).items()}

     @property
-    def name_to_index(self) ->
+    def name_to_index(self) -> dict[str, int]:
         """Returns a dictionary mapping variable names to their indices."""
         return {v: i for i, v in enumerate(self.variables)}

@@ -121,7 +116,7 @@ class Complement(Combined):
         return (shape[0], len(self._variables)) + shape[2:]

     @property
-    def variables_metadata(self) ->
+    def variables_metadata(self) -> dict[str, Any]:
         """Returns the metadata of the variables to be added to the target dataset."""
         # Merge the two dicts first
         all_meta = {**self._source.variables_metadata, **self._target.variables_metadata}
@@ -142,7 +137,7 @@ class Complement(Combined):
         pass

     @cached_property
-    def missing(self) ->
+    def missing(self) -> set[int]:
         """Returns the set of missing indices in the source and target datasets."""
         missing = self._source.missing.copy()
         missing = missing | self._target.missing
@@ -317,7 +312,7 @@ class ComplementNearest(Complement):
         return apply_index_to_slices_changes(result, changes)


-def complement_factory(args:
+def complement_factory(args: tuple, kwargs: dict) -> Dataset:
     """Factory function to create a Complement instance based on the provided arguments.

     Parameters

anemoi/datasets/data/concat.py
CHANGED
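
In ConcatMixin.missing below, the combined set is now built with a comprehension that offsets each dataset's missing indices by the total length of the datasets before it. A standalone sketch of that bookkeeping with toy lengths and missing sets (not the library API):

datasets = [
    {"length": 10, "missing": {2, 7}},  # toy stand-ins for the concatenated datasets
    {"length": 5, "missing": {0}},
]

result: set[int] = set()
offset = 0
for d in datasets:
    result = result | {m + offset for m in d["missing"]}  # same offsetting as ConcatMixin.missing
    offset += d["length"]

print(sorted(result))  # [2, 7, 10]
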
@@ -11,9 +11,6 @@
 import logging
 from functools import cached_property
 from typing import Any
-from typing import List
-from typing import Set
-from typing import Tuple

 import numpy as np
 from anemoi.utils.dates import frequency_to_timedelta
@@ -123,12 +120,12 @@ class ConcatMixin:
         return np.concatenate(result)

     @cached_property
-    def missing(self) ->
+    def missing(self) -> set[int]:
         """Returns the set of missing indices in the concatenated datasets."""
-        result:
+        result: set[int] = set()
         offset = 0
         for d in self.datasets:
-            result = result |
+            result = result | {m + offset for m in d.missing}
             offset += len(d)
         return result

@@ -195,7 +192,7 @@ class Concat(ConcatMixin, Combined):
         return Node(self, [d.tree() for d in self.datasets])

     @classmethod
-    def check_dataset_compatibility(cls, datasets:
+    def check_dataset_compatibility(cls, datasets: list[Any], fill_missing_gaps: bool = False) -> list[Any]:
         """Checks the compatibility of the datasets for concatenation and fills missing gaps if required.

         Parameters
@@ -259,7 +256,7 @@ class Concat(ConcatMixin, Combined):
         return {}


-def concat_factory(args:
+def concat_factory(args: tuple[Any, ...], kwargs: dict) -> Concat:
     """Factory function to create a Concat object.

     Parameters

anemoi/datasets/data/dataset.py
CHANGED
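
Most of the hunks below apply one pattern: typing.List/Dict/Set/Tuple/Optional annotations are replaced by built-in generics (PEP 585) and unions written with "|" (PEP 604). A toy, self-contained illustration of the new style, loosely modelled on _dates_to_indices; the helper and sample data are made up for the example and need Python 3.10 or later:

import datetime


def dates_to_indices(
    dates: list[datetime.datetime],
    start: None | str | datetime.datetime,
    end: None | str | datetime.datetime,
) -> list[int]:
    """Toy stand-in for Dataset._dates_to_indices, written in the new annotation style."""

    def as_datetime(value: None | str | datetime.datetime, default: datetime.datetime) -> datetime.datetime:
        if value is None:
            return default
        if isinstance(value, str):
            return datetime.datetime.fromisoformat(value)
        return value

    lo = as_datetime(start, dates[0])
    hi = as_datetime(end, dates[-1])
    return [i for i, date in enumerate(dates) if lo <= date <= hi]


dates = [datetime.datetime(2020, 1, 1) + datetime.timedelta(hours=6 * i) for i in range(8)]
print(dates_to_indices(dates, "2020-01-01T06:00:00", None))  # [1, 2, 3, 4, 5, 6, 7]
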
@@ -22,15 +22,10 @@ try:
 except ImportError:
     # Python 3.9
     EllipsisType = type(Ellipsis)
+from collections.abc import Sequence
+from collections.abc import Sized
 from typing import TYPE_CHECKING
 from typing import Any
-from typing import Dict
-from typing import List
-from typing import Optional
-from typing import Sequence
-from typing import Set
-from typing import Sized
-from typing import Tuple
 from typing import Union

 import numpy as np
@@ -48,8 +43,8 @@ if TYPE_CHECKING:
 LOG = logging.getLogger(__name__)


-Shape =
-TupleIndex =
+Shape = tuple[int, ...]
+TupleIndex = tuple[Union[int, slice, EllipsisType], ...]
 FullIndex = Union[int, slice, TupleIndex]


@@ -92,8 +87,8 @@ def _tidy(v: Any) -> Any:


 class Dataset(ABC, Sized):
-    arguments:
-    _name:
+    arguments: dict[str, Any] = {}
+    _name: str | None = None

     def mutate(self) -> "Dataset":
         """Give an opportunity to a subclass to return a new Dataset object of a different class, if needed.
@@ -148,7 +143,7 @@ class Dataset(ABC, Sized):
         return result

     @property
-    def name(self) ->
+    def name(self) -> str | None:
         """Return the name of the dataset."""
         return self._name

@@ -360,9 +355,9 @@ class Dataset(ABC, Sized):

     def _dates_to_indices(
         self,
-        start:
-        end:
-    ) ->
+        start: None | str | datetime.datetime,
+        end: None | str | datetime.datetime,
+    ) -> list[int]:
         """Convert date range to a list of indices.

         Parameters
@@ -387,7 +382,7 @@ class Dataset(ABC, Sized):

         return [i for i, date in enumerate(self.dates) if start <= date <= end]

-    def _select_to_columns(self, vars:
+    def _select_to_columns(self, vars: str | list[str] | tuple[str] | set) -> list[int]:
         """Convert variable names to a list of column indices.

         Parameters
@@ -411,7 +406,7 @@ class Dataset(ABC, Sized):

         return [self.name_to_index[v] for v in vars]

-    def _drop_to_columns(self, vars:
+    def _drop_to_columns(self, vars: str | Sequence[str]) -> list[int]:
         """Convert variable names to a list of column indices to drop.

         Parameters
@@ -432,7 +427,7 @@ class Dataset(ABC, Sized):

         return sorted([v for k, v in self.name_to_index.items() if k not in vars])

-    def _reorder_to_columns(self, vars:
+    def _reorder_to_columns(self, vars: str | list[str] | tuple[str] | dict[str, int]) -> list[int]:
         """Convert variable names to a list of reordered column indices.

         Parameters
@@ -465,8 +460,8 @@ class Dataset(ABC, Sized):
         return indices

     def dates_interval_to_indices(
-        self, start:
-    ) ->
+        self, start: None | str | datetime.datetime, end: None | str | datetime.datetime
+    ) -> list[int]:
         """Convert date interval to a list of indices.

         Parameters
@@ -483,7 +478,7 @@ class Dataset(ABC, Sized):
         """
         return self._dates_to_indices(start, end)

-    def provenance(self) ->
+    def provenance(self) -> dict[str, Any]:
         """Return the provenance information of the dataset.

         Returns
@@ -511,7 +506,7 @@ class Dataset(ABC, Sized):
         return tuple(shape)

     @property
-    def typed_variables(self) ->
+    def typed_variables(self) -> dict[str, Any]:
         """Return the variables with their types."""
         from anemoi.transform.variables import Variable

@@ -532,7 +527,7 @@ class Dataset(ABC, Sized):

         return result

-    def _input_sources(self) ->
+    def _input_sources(self) -> list[Any]:
         """Return the input sources of the dataset.

         Returns
@@ -544,7 +539,7 @@ class Dataset(ABC, Sized):
         self.collect_input_sources(sources)
         return sources

-    def metadata(self) ->
+    def metadata(self) -> dict[str, Any]:
         """Return the metadata of the dataset.

         Returns
@@ -588,7 +583,7 @@ class Dataset(ABC, Sized):
         """Return the end date of the dataset."""
         return self.dates[-1]

-    def dataset_metadata(self) ->
+    def dataset_metadata(self) -> dict[str, Any]:
         """Return the metadata of the dataset.

         Returns
@@ -608,7 +603,7 @@ class Dataset(ABC, Sized):
             name=self.name,
         )

-    def _supporting_arrays(self, *path: str) ->
+    def _supporting_arrays(self, *path: str) -> dict[str, NDArray[Any]]:
         """Return the supporting arrays of the dataset.

         Parameters
@@ -646,7 +641,7 @@ class Dataset(ABC, Sized):

         return result

-    def supporting_arrays(self) ->
+    def supporting_arrays(self) -> dict[str, NDArray[Any]]:
         """Return the supporting arrays to be saved in the checkpoints.

         Returns
@@ -657,7 +652,7 @@ class Dataset(ABC, Sized):
         arrays, _ = self._supporting_arrays_and_sources()
         return arrays

-    def _supporting_arrays_and_sources(self) ->
+    def _supporting_arrays_and_sources(self) -> tuple[dict[str, NDArray], dict[int, list[str]]]:
         """Return the supporting arrays and their sources.

         Returns
@@ -684,7 +679,7 @@ class Dataset(ABC, Sized):

         return result, source_to_arrays

-    def collect_supporting_arrays(self, collected:
+    def collect_supporting_arrays(self, collected: list[tuple[tuple[str, ...], str, NDArray[Any]]], *path: str) -> None:
         """Collect supporting arrays.

         Parameters
@@ -697,7 +692,7 @@ class Dataset(ABC, Sized):
         # Override this method to add more arrays
         pass

-    def metadata_specific(self, **kwargs: Any) ->
+    def metadata_specific(self, **kwargs: Any) -> dict[str, Any]:
         """Return specific metadata of the dataset.

         Parameters
@@ -764,7 +759,7 @@ class Dataset(ABC, Sized):
         """Return the label of the dataset."""
         return self.__class__.__name__.lower()

-    def computed_constant_fields(self) ->
+    def computed_constant_fields(self) -> list[str]:
         """Return the computed constant fields of the dataset.

         Returns
@@ -781,7 +776,7 @@ class Dataset(ABC, Sized):

         return sorted(self._compute_constant_fields_from_a_few_samples())

-    def _compute_constant_fields_from_a_few_samples(self) ->
+    def _compute_constant_fields_from_a_few_samples(self) -> list[str]:
         """Compute constant fields from a few samples.

         Returns
@@ -822,7 +817,7 @@ class Dataset(ABC, Sized):

         return [v for i, v in enumerate(self.variables) if constants[i]]

-    def _compute_constant_fields_from_statistics(self) ->
+    def _compute_constant_fields_from_statistics(self) -> list[str]:
         """Compute constant fields from statistics.

         Returns
@@ -842,8 +837,8 @@ class Dataset(ABC, Sized):

     def plot(
         self,
-        date:
-        variable:
+        date: int | datetime.datetime | np.datetime64 | str,
+        variable: int | str,
         member: int = 0,
         **kwargs: Any,
     ) -> "matplotlib.pyplot.Axes":
@@ -873,10 +868,10 @@ class Dataset(ABC, Sized):

     def to_index(
         self,
-        date:
-        variable:
+        date: int | datetime.datetime | np.datetime64 | str,
+        variable: int | str,
         member: int = 0,
-    ) ->
+    ) -> tuple[int, int, int]:
         """Convert date, variable, and member to indices.

         Parameters
@@ -945,7 +940,7 @@ class Dataset(ABC, Sized):

     @property
     @abstractmethod
-    def variables(self) ->
+    def variables(self) -> list[str]:
         """Return the list of variables in the dataset."""
         pass

@@ -969,7 +964,7 @@ class Dataset(ABC, Sized):

     @property
     @abstractmethod
-    def name_to_index(self) ->
+    def name_to_index(self) -> dict[str, int]:
         """Return the mapping of variable names to indices."""
         pass

@@ -1005,30 +1000,30 @@ class Dataset(ABC, Sized):

     @property
     @abstractmethod
-    def variables_metadata(self) ->
+    def variables_metadata(self) -> dict[str, Any]:
         """Return the metadata of the variables in the dataset."""
         pass

     @abstractmethod
     @cached_property
-    def missing(self) ->
+    def missing(self) -> set[int]:
         """Return the set of missing indices in the dataset."""
         pass

     @abstractmethod
     @cached_property
-    def constant_fields(self) ->
+    def constant_fields(self) -> list[str]:
         """Return the list of constant fields in the dataset."""
         pass

     @abstractmethod
     @cached_property
-    def statistics(self) ->
+    def statistics(self) -> dict[str, NDArray[Any]]:
         """Return the statistics of the dataset."""
         pass

     @abstractmethod
-    def statistics_tendencies(self, delta:
+    def statistics_tendencies(self, delta: datetime.timedelta | None = None) -> dict[str, NDArray[Any]]:
         """Return the tendencies of the statistics in the dataset.

         Parameters
@@ -1071,7 +1066,7 @@ class Dataset(ABC, Sized):
         pass

     @abstractmethod
-    def collect_input_sources(self, sources:
+    def collect_input_sources(self, sources: list[Any]) -> None:
         """Collect the input sources of the dataset.

         Parameters
@@ -1082,7 +1077,7 @@ class Dataset(ABC, Sized):
         pass

     @abstractmethod
-    def get_dataset_names(self, names:
+    def get_dataset_names(self, names: set[str]) -> None:
         """Get the names of the datasets.

         Parameters

anemoi/datasets/data/debug.py
CHANGED
@@ -11,12 +11,10 @@
 import logging
 import os
 import textwrap
+from collections.abc import Callable
 from functools import wraps
 from typing import TYPE_CHECKING
 from typing import Any
-from typing import Callable
-from typing import List
-from typing import Optional

 from anemoi.utils.text import Tree
 from numpy.typing import NDArray
@@ -56,7 +54,7 @@ def css(name: str) -> str:
 class Node:
     """A class to represent a node in a dataset tree."""

-    def __init__(self, dataset: "Dataset", kids:
+    def __init__(self, dataset: "Dataset", kids: list[Any], **kwargs: Any) -> None:
         """Initializes a Node object.

         Parameters
@@ -72,7 +70,7 @@ class Node:
         self.kids = kids
         self.kwargs = kwargs

-    def _put(self, indent: int, result:
+    def _put(self, indent: int, result: list[str]) -> None:
         """Helper method to add the node representation to the result list.

         Parameters
@@ -103,11 +101,11 @@ class Node:
         str
             String representation of the node.
         """
-        result:
+        result: list[str] = []
         self._put(0, result)
         return "\n".join(result)

-    def graph(self, digraph:
+    def graph(self, digraph: list[str], nodes: dict) -> None:
         """Generates a graph representation of the node.

         Parameters
@@ -170,7 +168,7 @@ class Node:
         digraph.append("}")
         return "\n".join(digraph)

-    def _html(self, indent: str, rows:
+    def _html(self, indent: str, rows: list[list[str]]) -> None:
         """Helper method to add the node representation to the HTML rows.

         Parameters
@@ -273,7 +271,7 @@ class Node:
 class Source:
     """A class used to follow the provenance of a data point."""

-    def __init__(self, dataset: Any, index: int, source:
+    def __init__(self, dataset: Any, index: int, source: Any | None = None, info: Any | None = None) -> None:
         """Initializes a Source object.

         Parameters

anemoi/datasets/data/ensemble.py
CHANGED
@@ -10,8 +10,6 @@

 import logging
 from typing import Any
-from typing import Dict
-from typing import Tuple

 import numpy as np
 from numpy.typing import NDArray
@@ -105,7 +103,7 @@ class Number(Forwards):
         """
         return Node(self, [self.forward.tree()], numbers=[n + 1 for n in self.members])

-    def metadata_specific(self, **kwargs: Any) ->
+    def metadata_specific(self, **kwargs: Any) -> dict[str, Any]:
         """Returns metadata specific to the Number object.

         Parameters
@@ -122,7 +120,7 @@ class Number(Forwards):
             "numbers": [n + 1 for n in self.members],
         }

-    def forwards_subclass_metadata_specific(self) ->
+    def forwards_subclass_metadata_specific(self) -> dict[str, Any]:
         """Returns metadata specific to the Number object."""
         return {}

@@ -140,7 +138,7 @@ class Ensemble(GivenAxis):
         """
         return Node(self, [d.tree() for d in self.datasets])

-    def forwards_subclass_metadata_specific(self) ->
+    def forwards_subclass_metadata_specific(self) -> dict[str, Any]:
         """Get the metadata specific to the forwards subclass.

         Returns:
@@ -149,7 +147,7 @@ class Ensemble(GivenAxis):
         return {}


-def ensemble_factory(args:
+def ensemble_factory(args: tuple[Any, ...], kwargs: dict[str, Any]) -> Ensemble:
     """Factory function to create an Ensemble object.

     Parameters

anemoi/datasets/data/fill_missing.py
CHANGED

@@ -10,9 +10,6 @@

 import logging
 from typing import Any
-from typing import Dict
-from typing import Optional
-from typing import Set

 import numpy as np
 from numpy.typing import NDArray
@@ -46,7 +43,7 @@ class MissingDatesFill(Forwards):
         """
         super().__init__(dataset)
         self._missing = set(dataset.missing)
-        self._warnings:
+        self._warnings: set[int] = set()

     @debug_indexing
     @expand_list_indexing
@@ -84,7 +81,7 @@ class MissingDatesFill(Forwards):
         return np.stack([self[i] for i in range(*s.indices(self._len))])

     @property
-    def missing(self) ->
+    def missing(self) -> set[int]:
         """Get the set of missing dates."""
         return set()

@@ -153,7 +150,7 @@ class MissingDatesClosest(MissingDatesFill):
         self.closest = closest
         self._closest = {}

-    def _fill_missing(self, n: int, a:
+    def _fill_missing(self, n: int, a: int | None, b: int | None) -> NDArray[Any]:
         """Fill the missing date at the given index.

         Parameters
@@ -189,7 +186,7 @@ class MissingDatesClosest(MissingDatesFill):

         return self.forward[self._closest[n]]

-    def forwards_subclass_metadata_specific(self) ->
+    def forwards_subclass_metadata_specific(self) -> dict[str, Any]:
         """Get metadata specific to the subclass.

         Returns
@@ -224,7 +221,7 @@ class MissingDatesInterpolate(MissingDatesFill):
         super().__init__(dataset)
         self._alpha = {}

-    def _fill_missing(self, n: int, a:
+    def _fill_missing(self, n: int, a: int | None, b: int | None) -> NDArray[Any]:
         """Fill the missing date at the given index using interpolation.

         Parameters
@@ -264,7 +261,7 @@ class MissingDatesInterpolate(MissingDatesFill):
         alpha = self._alpha[n]
         return self.forward[a] * (1 - alpha) + self.forward[b] * alpha

-    def forwards_subclass_metadata_specific(self) ->
+    def forwards_subclass_metadata_specific(self) -> dict[str, Any]:
         """Get metadata specific to the subclass.

         Returns
@@ -285,7 +282,7 @@ class MissingDatesInterpolate(MissingDatesFill):
         return Node(self, [self.forward.tree()])


-def fill_missing_dates_factory(dataset: Any, method: str, kwargs:
+def fill_missing_dates_factory(dataset: Any, method: str, kwargs: dict[str, Any]) -> Dataset:
     """Factory function to create an instance of a class to fill missing dates.

     Parameters