anemoi_datasets-0.5.16-py3-none-any.whl → anemoi_datasets-0.5.17-py3-none-any.whl
This diff compares the contents of two publicly released versions of the package, as published to a supported registry. It is provided for informational purposes only and reflects the changes between the versions as they appear in the public registry.
- anemoi/datasets/__init__.py +4 -1
- anemoi/datasets/__main__.py +12 -2
- anemoi/datasets/_version.py +9 -4
- anemoi/datasets/commands/cleanup.py +17 -2
- anemoi/datasets/commands/compare.py +18 -2
- anemoi/datasets/commands/copy.py +196 -14
- anemoi/datasets/commands/create.py +50 -7
- anemoi/datasets/commands/finalise-additions.py +17 -2
- anemoi/datasets/commands/finalise.py +17 -2
- anemoi/datasets/commands/init-additions.py +17 -2
- anemoi/datasets/commands/init.py +16 -2
- anemoi/datasets/commands/inspect.py +283 -62
- anemoi/datasets/commands/load-additions.py +16 -2
- anemoi/datasets/commands/load.py +16 -2
- anemoi/datasets/commands/patch.py +17 -2
- anemoi/datasets/commands/publish.py +17 -2
- anemoi/datasets/commands/scan.py +31 -3
- anemoi/datasets/compute/recentre.py +47 -11
- anemoi/datasets/create/__init__.py +612 -85
- anemoi/datasets/create/check.py +142 -20
- anemoi/datasets/create/chunks.py +64 -4
- anemoi/datasets/create/config.py +185 -21
- anemoi/datasets/create/filter.py +50 -0
- anemoi/datasets/create/filters/__init__.py +33 -0
- anemoi/datasets/create/filters/empty.py +37 -0
- anemoi/datasets/create/filters/legacy.py +93 -0
- anemoi/datasets/create/filters/noop.py +37 -0
- anemoi/datasets/create/filters/orog_to_z.py +58 -0
- anemoi/datasets/create/{functions/filters → filters}/pressure_level_relative_humidity_to_specific_humidity.py +33 -10
- anemoi/datasets/create/{functions/filters → filters}/pressure_level_specific_humidity_to_relative_humidity.py +32 -8
- anemoi/datasets/create/filters/rename.py +205 -0
- anemoi/datasets/create/{functions/filters → filters}/rotate_winds.py +43 -28
- anemoi/datasets/create/{functions/filters → filters}/single_level_dewpoint_to_relative_humidity.py +32 -9
- anemoi/datasets/create/{functions/filters → filters}/single_level_relative_humidity_to_dewpoint.py +33 -9
- anemoi/datasets/create/{functions/filters → filters}/single_level_relative_humidity_to_specific_humidity.py +55 -7
- anemoi/datasets/create/{functions/filters → filters}/single_level_specific_humidity_to_relative_humidity.py +98 -37
- anemoi/datasets/create/filters/speeddir_to_uv.py +95 -0
- anemoi/datasets/create/{functions/filters → filters}/sum.py +24 -27
- anemoi/datasets/create/filters/transform.py +53 -0
- anemoi/datasets/create/{functions/filters → filters}/unrotate_winds.py +27 -18
- anemoi/datasets/create/filters/uv_to_speeddir.py +94 -0
- anemoi/datasets/create/{functions/filters → filters}/wz_to_w.py +51 -33
- anemoi/datasets/create/input/__init__.py +76 -5
- anemoi/datasets/create/input/action.py +149 -13
- anemoi/datasets/create/input/concat.py +81 -10
- anemoi/datasets/create/input/context.py +39 -4
- anemoi/datasets/create/input/data_sources.py +72 -6
- anemoi/datasets/create/input/empty.py +21 -3
- anemoi/datasets/create/input/filter.py +60 -12
- anemoi/datasets/create/input/function.py +154 -37
- anemoi/datasets/create/input/join.py +86 -14
- anemoi/datasets/create/input/misc.py +67 -17
- anemoi/datasets/create/input/pipe.py +33 -6
- anemoi/datasets/create/input/repeated_dates.py +189 -41
- anemoi/datasets/create/input/result.py +202 -87
- anemoi/datasets/create/input/step.py +119 -22
- anemoi/datasets/create/input/template.py +100 -13
- anemoi/datasets/create/input/trace.py +62 -7
- anemoi/datasets/create/patch.py +52 -4
- anemoi/datasets/create/persistent.py +134 -17
- anemoi/datasets/create/size.py +15 -1
- anemoi/datasets/create/source.py +51 -0
- anemoi/datasets/create/sources/__init__.py +36 -0
- anemoi/datasets/create/{functions/sources → sources}/accumulations.py +296 -30
- anemoi/datasets/create/{functions/sources → sources}/constants.py +27 -2
- anemoi/datasets/create/{functions/sources → sources}/eccc_fstd.py +7 -3
- anemoi/datasets/create/sources/empty.py +37 -0
- anemoi/datasets/create/{functions/sources → sources}/forcings.py +25 -1
- anemoi/datasets/create/sources/grib.py +297 -0
- anemoi/datasets/create/{functions/sources → sources}/hindcasts.py +38 -4
- anemoi/datasets/create/sources/legacy.py +93 -0
- anemoi/datasets/create/{functions/sources → sources}/mars.py +168 -20
- anemoi/datasets/create/sources/netcdf.py +42 -0
- anemoi/datasets/create/sources/opendap.py +43 -0
- anemoi/datasets/create/{functions/sources/__init__.py → sources/patterns.py} +35 -4
- anemoi/datasets/create/sources/recentre.py +150 -0
- anemoi/datasets/create/{functions/sources → sources}/source.py +27 -5
- anemoi/datasets/create/{functions/sources → sources}/tendencies.py +64 -7
- anemoi/datasets/create/sources/xarray.py +92 -0
- anemoi/datasets/create/sources/xarray_kerchunk.py +36 -0
- anemoi/datasets/create/sources/xarray_support/README.md +1 -0
- anemoi/datasets/create/{functions/sources/xarray → sources/xarray_support}/__init__.py +109 -8
- anemoi/datasets/create/sources/xarray_support/coordinates.py +442 -0
- anemoi/datasets/create/{functions/sources/xarray → sources/xarray_support}/field.py +94 -16
- anemoi/datasets/create/{functions/sources/xarray → sources/xarray_support}/fieldlist.py +90 -25
- anemoi/datasets/create/sources/xarray_support/flavour.py +1036 -0
- anemoi/datasets/create/{functions/sources/xarray → sources/xarray_support}/grid.py +92 -31
- anemoi/datasets/create/sources/xarray_support/metadata.py +395 -0
- anemoi/datasets/create/sources/xarray_support/patch.py +91 -0
- anemoi/datasets/create/sources/xarray_support/time.py +391 -0
- anemoi/datasets/create/sources/xarray_support/variable.py +331 -0
- anemoi/datasets/create/sources/xarray_zarr.py +41 -0
- anemoi/datasets/create/{functions/sources → sources}/zenodo.py +34 -5
- anemoi/datasets/create/statistics/__init__.py +233 -44
- anemoi/datasets/create/statistics/summary.py +52 -6
- anemoi/datasets/create/testing.py +76 -0
- anemoi/datasets/create/{functions/filters/noop.py → typing.py} +6 -3
- anemoi/datasets/create/utils.py +97 -6
- anemoi/datasets/create/writer.py +26 -4
- anemoi/datasets/create/zarr.py +170 -23
- anemoi/datasets/data/__init__.py +51 -4
- anemoi/datasets/data/complement.py +191 -40
- anemoi/datasets/data/concat.py +141 -16
- anemoi/datasets/data/dataset.py +552 -61
- anemoi/datasets/data/debug.py +197 -26
- anemoi/datasets/data/ensemble.py +93 -8
- anemoi/datasets/data/fill_missing.py +165 -18
- anemoi/datasets/data/forwards.py +428 -56
- anemoi/datasets/data/grids.py +323 -97
- anemoi/datasets/data/indexing.py +112 -19
- anemoi/datasets/data/interpolate.py +92 -12
- anemoi/datasets/data/join.py +158 -19
- anemoi/datasets/data/masked.py +129 -15
- anemoi/datasets/data/merge.py +137 -23
- anemoi/datasets/data/misc.py +172 -16
- anemoi/datasets/data/missing.py +233 -29
- anemoi/datasets/data/rescale.py +111 -10
- anemoi/datasets/data/select.py +168 -26
- anemoi/datasets/data/statistics.py +67 -6
- anemoi/datasets/data/stores.py +149 -64
- anemoi/datasets/data/subset.py +159 -25
- anemoi/datasets/data/unchecked.py +168 -57
- anemoi/datasets/data/xy.py +168 -25
- anemoi/datasets/dates/__init__.py +191 -16
- anemoi/datasets/dates/groups.py +189 -47
- anemoi/datasets/grids.py +270 -31
- anemoi/datasets/testing.py +28 -1
- {anemoi_datasets-0.5.16.dist-info → anemoi_datasets-0.5.17.dist-info}/METADATA +9 -6
- anemoi_datasets-0.5.17.dist-info/RECORD +137 -0
- {anemoi_datasets-0.5.16.dist-info → anemoi_datasets-0.5.17.dist-info}/WHEEL +1 -1
- anemoi/datasets/create/functions/__init__.py +0 -66
- anemoi/datasets/create/functions/filters/__init__.py +0 -9
- anemoi/datasets/create/functions/filters/empty.py +0 -17
- anemoi/datasets/create/functions/filters/orog_to_z.py +0 -58
- anemoi/datasets/create/functions/filters/rename.py +0 -79
- anemoi/datasets/create/functions/filters/speeddir_to_uv.py +0 -78
- anemoi/datasets/create/functions/filters/uv_to_speeddir.py +0 -56
- anemoi/datasets/create/functions/sources/empty.py +0 -15
- anemoi/datasets/create/functions/sources/grib.py +0 -150
- anemoi/datasets/create/functions/sources/netcdf.py +0 -15
- anemoi/datasets/create/functions/sources/opendap.py +0 -15
- anemoi/datasets/create/functions/sources/recentre.py +0 -60
- anemoi/datasets/create/functions/sources/xarray/coordinates.py +0 -255
- anemoi/datasets/create/functions/sources/xarray/flavour.py +0 -472
- anemoi/datasets/create/functions/sources/xarray/metadata.py +0 -148
- anemoi/datasets/create/functions/sources/xarray/patch.py +0 -44
- anemoi/datasets/create/functions/sources/xarray/time.py +0 -177
- anemoi/datasets/create/functions/sources/xarray/variable.py +0 -188
- anemoi/datasets/create/functions/sources/xarray_kerchunk.py +0 -42
- anemoi/datasets/create/functions/sources/xarray_zarr.py +0 -15
- anemoi/datasets/utils/fields.py +0 -47
- anemoi_datasets-0.5.16.dist-info/RECORD +0 -129
- {anemoi_datasets-0.5.16.dist-info → anemoi_datasets-0.5.17.dist-info}/entry_points.txt +0 -0
- {anemoi_datasets-0.5.16.dist-info → anemoi_datasets-0.5.17.dist-info/licenses}/LICENSE +0 -0
- {anemoi_datasets-0.5.16.dist-info → anemoi_datasets-0.5.17.dist-info}/top_level.txt +0 -0
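
The most visible change in this release is the flattening of the create package: modules under anemoi/datasets/create/functions/filters/ move to anemoi/datasets/create/filters/, and functions/sources/ likewise moves to sources/ (with the xarray helpers gathered under sources/xarray_support/). The new filters/legacy.py and sources/legacy.py modules suggest a compatibility layer for the old layout. As a purely illustrative aid, a hypothetical helper (not part of anemoi-datasets) that maps old module paths to new ones, using two renames taken from the list above:

# Hypothetical helper, not part of the package: map pre-0.5.17 module
# paths to their post-0.5.17 equivalents, following the renames listed above.
MOVED = {
    "anemoi.datasets.create.functions.filters.rotate_winds": "anemoi.datasets.create.filters.rotate_winds",
    "anemoi.datasets.create.functions.sources.mars": "anemoi.datasets.create.sources.mars",
}

def new_module_path(old: str) -> str:
    """Return the 0.5.17 location of a module, or the input unchanged if it did not move."""
    return MOVED.get(old, old)

assert new_module_path("anemoi.datasets.create.functions.sources.mars").endswith(".sources.mars")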
anemoi/datasets/data/grids.py
CHANGED
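The diff below retrofits type hints and numpydoc docstrings onto the dataset-combining classes. The annotations lean on NDArray from numpy.typing and on aliases imported from .dataset. As a rough sketch, those aliases plausibly amount to the following; the real definitions live in anemoi/datasets/data/dataset.py and may differ:

# Assumed definitions, for orientation only; see anemoi/datasets/data/dataset.py.
from typing import List, Tuple, Union

Shape = Tuple[int, ...]                                 # e.g. (dates, variables, ensembles, values)
TupleIndex = Tuple[Union[int, slice, List[int]], ...]   # one entry per axis
FullIndex = Union[int, slice, TupleIndex]               # anything __getitem__ accepts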
--- a/anemoi/datasets/data/grids.py
+++ b/anemoi/datasets/data/grids.py
@@ -10,10 +10,20 @@
 
 import logging
 from functools import cached_property
+from typing import Any
+from typing import Dict
+from typing import List
+from typing import Optional
+from typing import Tuple
 
 import numpy as np
+from numpy.typing import NDArray
 from scipy.spatial import cKDTree
 
+from .dataset import Dataset
+from .dataset import FullIndex
+from .dataset import Shape
+from .dataset import TupleIndex
 from .debug import Node
 from .debug import debug_indexing
 from .forwards import Combined
@@ -30,12 +40,33 @@ LOG = logging.getLogger(__name__)
 
 
 class Concat(Combined):
-    def __len__(self):
+    """A class to represent concatenated datasets."""
+
+    def __len__(self) -> int:
+        """Returns the total length of the concatenated datasets.
+
+        Returns
+        -------
+        int
+            Total length of the concatenated datasets.
+        """
         return sum(len(i) for i in self.datasets)
 
     @debug_indexing
     @expand_list_indexing
-    def _get_tuple(self, index):
+    def _get_tuple(self, index: TupleIndex) -> NDArray[Any]:
+        """Retrieves a tuple of data from the concatenated datasets based on the given index.
+
+        Parameters
+        ----------
+        index : TupleIndex
+            Index specifying the data to retrieve.
+
+        Returns
+        -------
+        NDArray[Any]
+            Concatenated data array from the specified index.
+        """
         index, changes = index_to_slices(index, self.shape)
         # print(index, changes)
         lengths = [d.shape[0] for d in self.datasets]
@@ -46,7 +77,19 @@ class Concat(Combined):
         return apply_index_to_slices_changes(result, changes)
 
     @debug_indexing
-    def __getitem__(self, n):
+    def __getitem__(self, n: FullIndex) -> NDArray[Any]:
+        """Retrieves data from the concatenated datasets based on the given index.
+
+        Parameters
+        ----------
+        n : FullIndex
+            Index specifying the data to retrieve.
+
+        Returns
+        -------
+        NDArray[Any]
+            Data array from the concatenated datasets based on the index.
+        """
         if isinstance(n, tuple):
             return self._get_tuple(n)
 
@@ -61,7 +104,19 @@ class Concat(Combined):
         return self.datasets[k][n]
 
     @debug_indexing
-    def _get_slice(self, s):
+    def _get_slice(self, s: slice) -> NDArray[Any]:
+        """Retrieves a slice of data from the concatenated datasets.
+
+        Parameters
+        ----------
+        s : slice
+            Slice object specifying the range of data to retrieve.
+
+        Returns
+        -------
+        NDArray[Any]
+            Concatenated data array from the specified slice.
+        """
         result = []
 
         lengths = [d.shape[0] for d in self.datasets]
@@ -71,50 +126,134 @@ class Concat(Combined):
 
         return np.concatenate(result)
 
-    def check_compatibility(self, d1, d2):
+    def check_compatibility(self, d1: Dataset, d2: Dataset) -> None:
+        """Check the compatibility of two datasets for concatenation.
+
+        Parameters
+        ----------
+        d1 : Dataset
+            The first dataset.
+        d2 : Dataset
+            The second dataset.
+        """
         super().check_compatibility(d1, d2)
         self.check_same_sub_shapes(d1, d2, drop_axis=0)
 
-    def check_same_lengths(self, d1, d2):
+    def check_same_lengths(self, d1: Dataset, d2: Dataset) -> None:
+        """Check if the lengths of two datasets are the same.
+
+        Parameters
+        ----------
+        d1 : Dataset
+            The first dataset.
+        d2 : Dataset
+            The second dataset.
+        """
         # Turned off because we are concatenating along the first axis
         pass
 
-    def check_same_dates(self, d1, d2):
+    def check_same_dates(self, d1: Dataset, d2: Dataset) -> None:
+        """Check if the dates of two datasets are the same.
+
+        Parameters
+        ----------
+        d1 : Dataset
+            The first dataset.
+        d2 : Dataset
+            The second dataset.
+        """
         # Turned off because we are concatenating along the dates axis
         pass
 
     @property
-    def dates(self):
+    def dates(self) -> NDArray[np.datetime64]:
+        """Returns the concatenated dates of all datasets."""
         return np.concatenate([d.dates for d in self.datasets])
 
     @property
-    def shape(self):
+    def shape(self) -> Shape:
+        """Returns the shape of the concatenated datasets."""
         return (len(self),) + self.datasets[0].shape[1:]
 
-    def tree(self):
+    def tree(self) -> Node:
+        """Generates a hierarchical tree structure for the concatenated datasets.
+
+        Returns
+        -------
+        Node
+            A Node object representing the concatenated datasets.
+        """
         return Node(self, [d.tree() for d in self.datasets])
 
 
 class GridsBase(GivenAxis):
-    def __init__(self, datasets, axis):
+    """A base class for handling grids in datasets."""
+
+    def __init__(self, datasets: List[Any], axis: int) -> None:
+        """Initializes a GridsBase object.
+
+        Parameters
+        ----------
+        datasets : List[Any]
+            List of datasets.
+        axis : int
+            Axis along which to combine the datasets.
+        """
         super().__init__(datasets, axis)
         # Shape: (dates, variables, ensemble, 1d-values)
         assert len(datasets[0].shape) == 4, "Grids must be 1D for now"
 
-    def check_same_grid(self, d1, d2):
+    def check_same_grid(self, d1: Dataset, d2: Dataset) -> None:
+        """Check if the grids of two datasets are the same.
+
+        Parameters
+        ----------
+        d1 : Dataset
+            The first dataset.
+        d2 : Dataset
+            The second dataset.
+        """
         # We don't check the grid, because we want to be able to combine
         pass
 
-    def check_same_resolution(self, d1, d2):
+    def check_same_resolution(self, d1: Dataset, d2: Dataset) -> None:
+        """Check if the resolutions of two datasets are the same.
+
+        Parameters
+        ----------
+        d1 : Dataset
+            The first dataset.
+        d2 : Dataset
+            The second dataset.
+        """
         # We don't check the resolution, because we want to be able to combine
         pass
 
-    def metadata_specific(self):
+    def metadata_specific(self, **kwargs: Any) -> Dict[str, Any]:
+        """Returns metadata specific to the GridsBase object.
+
+        Parameters
+        ----------
+        kwargs : Any
+            Additional keyword arguments.
+
+        Returns
+        -------
+        Dict[str, Any]
+            Metadata specific to the GridsBase object.
+        """
         return super().metadata_specific(
             multi_grids=True,
         )
 
-    def collect_input_sources(self, collected):
+    def collect_input_sources(self, collected: List[Any]) -> None:
+        """Collects input sources from the datasets.
+
+        Parameters
+        ----------
+        collected : List[Any]
+            List to which the input sources are appended.
+        """
         # We assume that,because they have different grids, they have different input sources
         for d in self.datasets:
             collected.append(d)
@@ -122,42 +261,75 @@ class GridsBase(GivenAxis):
 
 
 class Grids(GridsBase):
+    """A class to represent combined grids from multiple datasets."""
+
     # TODO: select the statistics of the most global grid?
     @property
-    def latitudes(self):
+    def latitudes(self) -> NDArray[Any]:
+        """Returns the concatenated latitudes of all datasets."""
         return np.concatenate([d.latitudes for d in self.datasets])
 
     @property
-    def longitudes(self):
+    def longitudes(self) -> NDArray[Any]:
+        """Returns the concatenated longitudes of all datasets."""
         return np.concatenate([d.longitudes for d in self.datasets])
 
     @property
-    def grids(self):
+    def grids(self) -> Tuple[Any, ...]:
+        """Returns the grids of all datasets."""
         result = []
         for d in self.datasets:
             result.extend(d.grids)
         return tuple(result)
 
-    def tree(self):
+    def tree(self) -> Node:
+        """Generates a hierarchical tree structure for the Grids object.
+
+        Returns
+        -------
+        Node
+            A Node object representing the Grids object.
+        """
         return Node(self, [d.tree() for d in self.datasets], mode="concat")
 
+    def forwards_subclass_metadata_specific(self) -> Dict[str, Any]:
+        """Get the metadata specific to the forwards subclass.
+
+        Returns:
+            Dict[str, Any]: The metadata specific to the forwards subclass.
+        """
+        return {}
+
 
 class Cutout(GridsBase):
-    def __init__(self, datasets, axis=3, cropping_distance=2.0, neighbours=5, min_distance_km=None, plot=None):
+    """A class to handle hierarchical management of Limited Area Models (LAMs) and a global dataset."""
+
+    def __init__(
+        self,
+        datasets: List[Any],
+        axis: int = 3,
+        cropping_distance: float = 2.0,
+        neighbours: int = 5,
+        min_distance_km: Optional[float] = None,
+        plot: Optional[bool] = None,
+    ) -> None:
         """Initializes a Cutout object for hierarchical management of Limited Area
         Models (LAMs) and a global dataset, handling overlapping regions.
 
-        [11 lines of the old parameter description not preserved in this extract]
+        Parameters
+        ----------
+        datasets : list
+            List of LAM and global datasets.
+        axis : int
+            Concatenation axis, must be set to 3.
+        cropping_distance : float
+            Distance threshold in degrees for cropping cutouts.
+        neighbours : int
+            Number of neighboring points to consider when constructing masks.
+        min_distance_km : float, optional
+            Minimum distance threshold in km between grid points.
+        plot : bool, optional
+            Flag to enable or disable visualization plots.
         """
         super().__init__(datasets, axis)
        assert len(datasets) >= 2, "CutoutGrids requires at least two datasets"
@@ -179,14 +351,13 @@ class Cutout(GridsBase):
         # Initialize cumulative masks
         self._initialize_masks()
 
-    def _initialize_masks(self):
-        """
-        overlapping regions with previous LAMs and creating a global mask for
-        the global dataset.
+    def _initialize_masks(self) -> None:
+        """Generate hierarchical masks for each LAM dataset by excluding overlapping regions with previous LAMs and creating a global mask for the global dataset.
 
-        Raises
-        [2 lines of the old docstring not preserved in this extract]
+        Raises
+        ------
+        ValueError
+            If the global mask dimension does not match the global dataset grid points.
         """
         from anemoi.datasets.grids import cutout_mask
 
@@ -236,21 +407,33 @@ class Cutout(GridsBase):
         lam_current_mask[~lam_overlap_mask] = False
         self.masks.append(lam_current_mask)
 
-    def has_overlap(
-        [14 lines of the old signature and docstring not preserved in this extract]
+    def has_overlap(
+        self,
+        lats1: NDArray[Any],
+        lons1: NDArray[Any],
+        lats2: NDArray[Any],
+        lons2: NDArray[Any],
+        distance_threshold: float = 1.0,
+    ) -> bool:
+        """Check for overlapping points between two sets of latitudes and longitudes within a specified distance threshold.
+
+        Parameters
+        ----------
+        lats1 : NDArray[Any]
+            Latitude array for the first dataset.
+        lons1 : NDArray[Any]
+            Longitude array for the first dataset.
+        lats2 : NDArray[Any]
+            Latitude array for the second dataset.
+        lons2 : NDArray[Any]
+            Longitude array for the second dataset.
+        distance_threshold : float
+            Distance in degrees to consider as overlapping.
+
+        Returns
+        -------
+        bool
+            True if any points overlap within the distance threshold, otherwise False.
         """
         # Create KDTree for the first set of points
         tree = cKDTree(np.vstack((lats1, lons1)).T)
@@ -261,31 +444,35 @@ class Cutout(GridsBase):
         # Check if any distance is less than the specified threshold
         return np.any(distances < distance_threshold)
 
-    def __getitem__(self, index):
-        """
-        given index.
+    def __getitem__(self, index: FullIndex) -> NDArray[Any]:
+        """Retrieve data from the masked LAMs and global dataset based on the given index.
 
-        [3 lines of the old docstring not preserved in this extract]
+        Parameters
+        ----------
+        index : FullIndex
+            Index specifying the data to retrieve.
 
-        Returns
-        [1 line of the old docstring not preserved in this extract]
+        Returns
+        -------
+        NDArray[Any]
+            Data array from the masked datasets based on the index.
         """
         if isinstance(index, (int, slice)):
             index = (index, slice(None), slice(None), slice(None))
         return self._get_tuple(index)
 
-    def _get_tuple(self, index):
-        """Helper method that applies masks and retrieves data from each dataset
-        according to the specified index.
+    def _get_tuple(self, index: TupleIndex) -> NDArray[Any]:
+        """Helper method that applies masks and retrieves data from each dataset according to the specified index.
 
-        [2 lines of the old docstring not preserved in this extract]
+        Parameters
+        ----------
+        index : TupleIndex
+            Index specifying slices to retrieve data.
 
-        Returns
-        [2 lines of the old docstring not preserved in this extract]
+        Returns
+        -------
+        NDArray[Any]
+            Concatenated data array from all datasets based on the index.
         """
         index, changes = index_to_slices(index, self.shape)
         # Select data from each LAM
@@ -300,13 +487,15 @@ class Cutout(GridsBase):
 
         return apply_index_to_slices_changes(result, changes)
 
-    def collect_supporting_arrays(self, collected, *path):
-        """
-        dataset.
+    def collect_supporting_arrays(self, collected: List[Any], *path: Any) -> None:
+        """Collect supporting arrays, including masks for each LAM and the global dataset.
 
-        [3 lines of the old docstring not preserved in this extract]
+        Parameters
+        ----------
+        collected : List[Any]
+            List to which the supporting arrays are appended.
+        *path : Any
+            Variable length argument list specifying the paths for the masks.
         """
         # Append masks for each LAM
         for i, (lam, mask) in enumerate(zip(self.lams, self.masks)):
@@ -316,41 +505,41 @@ class Cutout(GridsBase):
         collected.append((path + ("global",), "cutout_mask", self.global_mask))
 
     @cached_property
-    def shape(self):
+    def shape(self) -> Shape:
         """Returns the shape of the Cutout, accounting for retained grid points
         across all LAMs and the global dataset.
-
-        Returns:
-            tuple: Shape of the concatenated masked datasets.
         """
         shapes = [np.sum(mask) for mask in self.masks]
         global_shape = np.sum(self.global_mask)
         total_shape = sum(shapes) + global_shape
         return tuple(self.lams[0].shape[:-1] + (int(total_shape),))
 
-    def check_same_resolution(self, d1, d2):
+    def check_same_resolution(self, d1: Dataset, d2: Dataset) -> None:
+        """Checks if the resolutions of two datasets are the same.
+
+        Parameters
+        ----------
+        d1 : Dataset
+            The first dataset.
+        d2 : Dataset
+            The second dataset.
+        """
         # Turned off because we are combining different resolutions
         pass
 
     @property
-    def grids(self):
+    def grids(self) -> TupleIndex:
         """Returns the number of grid points for each LAM and the global dataset
         after applying masks.
-
-        Returns:
-            tuple: Count of retained grid points for each dataset.
         """
         grids = [np.sum(mask) for mask in self.masks]
         grids.append(np.sum(self.global_mask))
         return tuple(grids)
 
     @property
-    def latitudes(self):
+    def latitudes(self) -> NDArray[Any]:
         """Returns the concatenated latitudes of each LAM and the global dataset
         after applying masks.
-
-        Returns:
-            np.ndarray: Concatenated latitude array for the masked datasets.
         """
         lam_latitudes = np.concatenate([lam.latitudes[mask] for lam, mask in zip(self.lams, self.masks)])
 
@@ -362,12 +551,9 @@ class Cutout(GridsBase):
         return latitudes
 
     @property
-    def longitudes(self):
+    def longitudes(self) -> NDArray[Any]:
         """Returns the concatenated longitudes of each LAM and the global dataset
         after applying masks.
-
-        Returns:
-            np.ndarray: Concatenated longitude array for the masked datasets.
         """
         lam_longitudes = np.concatenate([lam.longitudes[mask] for lam, mask in zip(self.lams, self.masks)])
 
@@ -378,19 +564,45 @@ class Cutout(GridsBase):
         longitudes = np.concatenate([lam_longitudes, self.globe.longitudes[self.global_mask]])
         return longitudes
 
-    def tree(self):
+    def tree(self) -> Node:
         """Generates a hierarchical tree structure for the `Cutout` instance and
         its associated datasets.
 
-        Returns
-        [1 line of the old docstring not preserved in this extract]
+        Returns
+        -------
+        Node
+            A `Node` object representing the `Cutout` instance as the root
             node, with each dataset in `self.datasets` represented as a child
             node.
         """
         return Node(self, [d.tree() for d in self.datasets])
 
+    def forwards_subclass_metadata_specific(self) -> Dict[str, Any]:
+        """Returns metadata specific to the Cutout object.
 
-def grids_factory(args, kwargs):
+        Returns
+        -------
+        Dict[str, Any]
+            Metadata specific to the Cutout object.
+        """
+        return {}
+
+
+def grids_factory(args: Tuple[Any, ...], kwargs: dict) -> Dataset:
+    """Factory function to create a Grids object.
+
+    Parameters
+    ----------
+    args : Tuple[Any, ...]
+        Positional arguments.
+    kwargs : dict
+        Keyword arguments.
+
+    Returns
+    -------
+    Dataset
+        A Grids object.
+    """
     if "ensemble" in kwargs:
         raise NotImplementedError("Cannot use both 'ensemble' and 'grids'")
 
@@ -406,7 +618,21 @@ def grids_factory(args, kwargs):
     return Grids(datasets, axis=axis)._subset(**kwargs)
 
 
-def cutout_factory(args, kwargs):
+def cutout_factory(args: Tuple[Any, ...], kwargs: Dict[str, Any]) -> Dataset:
+    """Factory function to create a Cutout object.
+
+    Parameters
+    ----------
+    args : Tuple[Any, ...]
+        Positional arguments.
+    kwargs : Dict[str, Any]
+        Keyword arguments.
+
+    Returns
+    -------
+    Dataset
+        A Cutout object.
+    """
     if "ensemble" in kwargs:
         raise NotImplementedError("Cannot use both 'ensemble' and 'cutout'")
 
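
Beyond the annotations and docstrings, the notable additions in this file are the forwards_subclass_metadata_specific hooks (both returning empty dicts) and the fully spelled-out has_overlap check. The latter is a plain nearest-neighbour query: build a cKDTree over one set of (lat, lon) points and test whether any point of the other set falls within distance_threshold degrees. A self-contained sketch of that logic, with made-up demo grids; note that, as in the source, the distance is Euclidean in degree space, not a great-circle distance:

import numpy as np
from scipy.spatial import cKDTree

def has_overlap(lats1, lons1, lats2, lons2, distance_threshold=1.0):
    # KD-tree over the first set of (lat, lon) points
    tree = cKDTree(np.vstack((lats1, lons1)).T)
    # Distance from every point of the second set to its nearest neighbour
    distances, _ = tree.query(np.vstack((lats2, lons2)).T, k=1)
    # Overlap if any point is closer than the threshold
    return bool(np.any(distances < distance_threshold))

# A small LAM patch against a coarse 5-degree global grid: they overlap
lam_lat, lam_lon = np.meshgrid(np.linspace(40, 50, 11), np.linspace(0, 10, 11))
glo_lat, glo_lon = np.meshgrid(np.arange(-90, 91, 5), np.arange(0, 360, 5))
print(has_overlap(lam_lat.ravel(), lam_lon.ravel(), glo_lat.ravel(), glo_lon.ravel()))  # True

Judging by the kwargs checks in grids_factory and cutout_factory, these classes back the grids and cutout options of open_dataset, neither of which can be combined with ensemble.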