PyPI - ocf-data-sampler - Versions diffs - 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl - Mend

ocf-data-sampler 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of ocf-data-sampler might be problematic. Click here for more details.

Files changed (13) hide show

ocf_data_sampler/constants.py CHANGED Viewed

@@ -86,7 +86,7 @@ ECMWF_STD = {
     "lcc": 0.3791404366493225,
     "mcc": 0.38039860129356384,
     "prate": 9.81039775069803e-05,
-    "sde": 0.000913831521756947,
+    "sd": 0.000913831521756947,
     "sr": 16294988.0,
     "t2m": 3.692270040512085,
     "tcc": 0.37487083673477173,
@@ -110,7 +110,7 @@ ECMWF_MEAN = {
     "lcc": 0.44901806116104126,
     "mcc": 0.3288780450820923,
     "prate": 3.108070450252853e-05,
-    "sde": 8.107526082312688e-05,
+    "sd": 8.107526082312688e-05,
     "sr": 12905302.0,
     "t2m": 283.48333740234375,
     "tcc": 0.7049227356910706,

ocf_data_sampler/sample/base.py CHANGED Viewed

@@ -5,25 +5,34 @@ Handling of both flat and nested structures - consideration for NWP
 import logging
 import numpy as np
+import torch
+import xarray as xr
 from pathlib import Path
-from typing import Any, Dict, Optional, Union
+from typing import Any, Dict, Optional, Union, TypeAlias
 from abc import ABC, abstractmethod
 logger = logging.getLogger(__name__)
+NumpySample: TypeAlias = Dict[str, Union[np.ndarray, Dict[str, np.ndarray]]]
+NumpyBatch: TypeAlias = Dict[str, Union[np.ndarray, Dict[str, np.ndarray]]]
+TensorBatch: TypeAlias = Dict[str, Union[torch.Tensor, Dict[str, torch.Tensor]]]
 class SampleBase(ABC):
     """
     Abstract base class for all sample types
     Provides core data storage functionality
     """
-    def __init__(self):
+    def __init__(self, data: Optional[Union[NumpySample, xr.Dataset]] = None):
         """ Initialise data container """
         logger.debug("Initialising SampleBase instance")
+        self._data = data
     @abstractmethod
-    def to_numpy(self) -> Dict[str, Any]:
+    def to_numpy(self) -> NumpySample:
         """ Convert data to a numpy array representation """
         raise NotImplementedError
@@ -42,3 +51,25 @@ class SampleBase(ABC):
     def load(cls, path: Union[str, Path]) -> 'SampleBase':
         """ Abstract class method for loading sample data """
         raise NotImplementedError
+def batch_to_tensor(batch: NumpyBatch) -> TensorBatch:
+    """
+    Moves ndarrays in a nested dict to torch tensors
+    Args:
+        batch: NumpyBatch with data in numpy arrays
+    Returns:
+        TensorBatch with data in torch tensors
+    """
+    if not batch:
+        raise ValueError("Cannot convert empty batch to tensors")
+    for k, v in batch.items():
+        if isinstance(v, dict):
+            batch[k] = batch_to_tensor(v)
+        elif isinstance(v, np.ndarray):
+            if v.dtype == np.bool_:
+                batch[k] = torch.tensor(v, dtype=torch.bool)
+            elif np.issubdtype(v.dtype, np.number):
+                batch[k] = torch.as_tensor(v)
+    return batch

ocf_data_sampler/torch_datasets/datasets/pvnet_uk.py CHANGED Viewed

@@ -31,10 +31,15 @@ from ocf_data_sampler.torch_datasets.utils.merge_and_fill_utils import (
     merge_dicts,
     fill_nans_in_arrays,
 )
+from ocf_data_sampler.torch_datasets.utils.validate_channels import (
+    validate_nwp_channels,
+    validate_satellite_channels,
+)
 xr.set_options(keep_attrs=True)
 def process_and_combine_datasets(
     dataset_dict: dict,
     config: Configuration,
@@ -47,27 +52,23 @@ def process_and_combine_datasets(
     numpy_modalities = []
     if "nwp" in dataset_dict:
         nwp_numpy_modalities = dict()
         for nwp_key, da_nwp in dataset_dict["nwp"].items():
-            # Standardise
             provider = config.input_data.nwp[nwp_key].provider
-            da_nwp = (da_nwp - NWP_MEANS[provider]) / NWP_STDS[provider]
-            # Convert to NumpyBatch
+            # Standardise and convert to NumpyBatch
+            da_nwp = (da_nwp - NWP_MEANS[provider]) / NWP_STDS[provider]
             nwp_numpy_modalities[nwp_key] = convert_nwp_to_numpy_sample(da_nwp)
         # Combine the NWPs into NumpyBatch
         numpy_modalities.append({NWPSampleKey.nwp: nwp_numpy_modalities})
     if "sat" in dataset_dict:
-        # Standardise
         da_sat = dataset_dict["sat"]
-        da_sat = (da_sat - RSS_MEAN) / RSS_STD
-        # Convert to NumpyBatch
+        # Standardise and convert to NumpyBatch
+        da_sat = (da_sat - RSS_MEAN) / RSS_STD
         numpy_modalities.append(convert_satellite_to_numpy_sample(da_sat))
     gsp_config = config.input_data.gsp
@@ -186,9 +187,13 @@ class PVNetUKRegionalDataset(Dataset):
         """
         config = load_yaml_configuration(config_filename)
+        # Validate channels for NWP and satellite data
+        validate_nwp_channels(config)
+        validate_satellite_channels(config)
         datasets_dict = get_dataset_dict(config.input_data)
         # Get t0 times where all input data is available
         valid_t0_times = find_valid_t0_times(datasets_dict, config)
@@ -294,7 +299,11 @@ class PVNetUKConcurrentDataset(Dataset):
         """
         config = load_yaml_configuration(config_filename)
+        # Validate channels for NWP and satellite data
+        validate_nwp_channels(config)
+        validate_satellite_channels(config)
         datasets_dict = get_dataset_dict(config.input_data)
         # Get t0 times where all input data is available
@@ -361,4 +370,4 @@ class PVNetUKConcurrentDataset(Dataset):
         """
         # Check data is availablle for init-time t0
         assert t0 in self.valid_t0_times
-        return self._get_sample(t0)
+        return self._get_sample(t0)

ocf_data_sampler/torch_datasets/datasets/site.py CHANGED Viewed

@@ -1,4 +1,5 @@
 """Torch dataset for sites"""
 import logging
 import numpy as np
 import pandas as pd
@@ -19,6 +20,8 @@ from ocf_data_sampler.select import (
 from ocf_data_sampler.utils import minutes
 from ocf_data_sampler.torch_datasets.utils.valid_time_periods import find_valid_time_periods
 from ocf_data_sampler.torch_datasets.utils.merge_and_fill_utils import merge_dicts, fill_nans_in_arrays
+from ocf_data_sampler.torch_datasets.utils.validate_channels import validate_nwp_channels
 from ocf_data_sampler.numpy_sample import (
     convert_site_to_numpy_sample,
     convert_satellite_to_numpy_sample,
@@ -29,8 +32,10 @@ from ocf_data_sampler.numpy_sample import (
 from ocf_data_sampler.numpy_sample import NWPSampleKey
 from ocf_data_sampler.constants import NWP_MEANS, NWP_STDS
 xr.set_options(keep_attrs=True)
 class SitesDataset(Dataset):
     def __init__(
         self,
@@ -47,6 +52,10 @@ class SitesDataset(Dataset):
         """
         config: Configuration = load_yaml_configuration(config_filename)
+        # Validate NWP channels
+        validate_nwp_channels(config)
         datasets_dict = get_dataset_dict(config.input_data)
         # Assign config and input data to self
@@ -221,8 +230,9 @@ class SitesDataset(Dataset):
         if "nwp" in dataset_dict:
             for nwp_key, da_nwp in dataset_dict["nwp"].items():
-                # Standardise
                 provider = self.config.input_data.nwp[nwp_key].provider
+                # Standardise
                 da_nwp = (da_nwp - NWP_MEANS[provider]) / NWP_STDS[provider]
                 data_arrays.append((f"nwp-{provider}", da_nwp))

ocf_data_sampler/torch_datasets/utils/validate_channels.py ADDED Viewed

@@ -0,0 +1,82 @@
+import xarray as xr
+from ocf_data_sampler.config import Configuration
+from ocf_data_sampler.constants import NWP_MEANS, NWP_STDS, RSS_MEAN, RSS_STD
+def validate_channels(
+    data_channels: list,
+    means_channels: list,
+    stds_channels: list,
+    source_name: str | None = None
+) -> None:
+    """
+    Validates that all channels in data have corresponding normalisation constants.
+    Args:
+        data_channels: Set of channels from the data
+        means_channels: Set of channels from means constants
+        stds_channels: Set of channels from stds constants
+        source_name: Name of data source (e.g., 'ecmwf', 'satellite') for error messages
+    Raises:
+        ValueError: If there's a mismatch between data channels and normalisation constants
+    """
+    data_set = set(data_channels)
+    means_set = set(means_channels)
+    stds_set = set(stds_channels)
+    # Find missing channels in means
+    missing_in_means = data_set - means_set
+    if missing_in_means:
+        raise ValueError(
+            f"The following channels for {source_name} are missing in normalisation means: "
+            f"{missing_in_means}"
+        )
+    # Find missing channels in stds
+    missing_in_stds = data_set - stds_set
+    if missing_in_stds:
+        raise ValueError(
+            f"The following channels for {source_name} are missing in normalisation stds: "
+            f"{missing_in_stds}"
+        )
+def validate_nwp_channels(config: Configuration) -> None:
+    """Validate that NWP channels in config have corresponding normalisation constants.
+    Args:
+        config: Configuration object containing NWP channel information
+    Raises:
+        ValueError: If there's a mismatch between configured NWP channels and normalisation constants
+    """
+    if hasattr(config.input_data, "nwp"):
+        for nwp_key, nwp_config in config.input_data.nwp.items():
+            provider = nwp_config.provider
+            validate_channels(
+                data_channels=nwp_config.channels,
+                means_channels=NWP_MEANS[provider].channel.values,
+                stds_channels=NWP_STDS[provider].channel.values,
+                source_name=provider
+            )
+def validate_satellite_channels(config: Configuration) -> None:
+    """Validate that satellite channels in config have corresponding normalisation constants.
+    Args:
+        config: Configuration object containing satellite channel information
+    Raises:
+        ValueError: If there's a mismatch between configured satellite channels and normalisation constants
+    """
+    if hasattr(config.input_data, "satellite"):
+        validate_channels(
+            data_channels=config.input_data.satellite.channels,
+            means_channels=RSS_MEAN.channel.values,
+            stds_channels=RSS_STD.channel.values,
+            source_name="satellite"
+        )

{ocf_data_sampler-0.1.6.dist-info → ocf_data_sampler-0.1.8.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.2
 Name: ocf_data_sampler
-Version: 0.1.6
+Version: 0.1.8
 Summary: Sample from weather data for renewable energy prediction
 Author: James Fulton, Peter Dudfield, and the Open Climate Fix team
 Author-email: info@openclimatefix.org

{ocf_data_sampler-0.1.6.dist-info → ocf_data_sampler-0.1.8.dist-info}/RECORD RENAMED Viewed

@@ -1,5 +1,5 @@
 ocf_data_sampler/__init__.py,sha256=AbpHGcgLb-kRsJGnwFEktk7uzpZOCcBY74-YBdrKVGs,1
-ocf_data_sampler/constants.py,sha256=ClteRIgp7EPlUPqIbkel83BfIaD7_VIDjUeHzUfyhnM,5079
+ocf_data_sampler/constants.py,sha256=0HYNmqwBaHVTAEEx9qzk6WD9YInh0gSKLeI3pyq7aNs,5077
 ocf_data_sampler/utils.py,sha256=rKA0BHAyAG4f90zEcgxp25EEYrXS-aOVNzttZ6Mzv2k,250
 ocf_data_sampler/config/__init__.py,sha256=O29mbH0XG2gIY1g3BaveGCnpBO2SFqdu-qzJ7a6evl0,223
 ocf_data_sampler/config/load.py,sha256=sKCKmhkkeFvvkNL5xmnFvdAulaCtV4-rigPsFvVDPDc,634
@@ -27,7 +27,7 @@ ocf_data_sampler/numpy_sample/satellite.py,sha256=8OaTvkPjzSjotcdKsa6BKmmlBKDBun
 ocf_data_sampler/numpy_sample/site.py,sha256=I-cAXCOF0SDdm5Hx43lFqYZ3jh61kltLQK-fc4_nNu0,1314
 ocf_data_sampler/numpy_sample/sun_position.py,sha256=UklhucCxCT6GMlAhCWL6c4cfWrdc1cWgegrYaqUoHOY,1611
 ocf_data_sampler/sample/__init__.py,sha256=02CM7E5nKkGiYbVW-kvzjNd4RaqGuHCkDChtmDBDUoA,248
-ocf_data_sampler/sample/base.py,sha256=4U78tczCRsKMDwU4HkD20nyGyYjIBSZV5neF2mT--2M,1197
+ocf_data_sampler/sample/base.py,sha256=qeKuWyyO8M4QX6QDbItioeCiss0fG05NXRtf0TCMQSc,2246
 ocf_data_sampler/sample/site.py,sha256=0BvDXs0kxTjUq7kWpeoITK_uN4uE0w1IvEFXZUoKOb0,2507
 ocf_data_sampler/sample/uk_regional.py,sha256=D1A6nQB1PYCmxb3FzU9gqbNufQfx__wcprcDm50jCJw,4381
 ocf_data_sampler/select/__init__.py,sha256=E4AJulEbO2K-o0UlG1fgaEteuf_1ZFjHTvrotXSb4YU,332
@@ -41,10 +41,11 @@ ocf_data_sampler/select/select_time_slice.py,sha256=9M-yvDv9K77XfEys_OIR31_aVB56
 ocf_data_sampler/select/spatial_slice_for_dataset.py,sha256=3tRrMBXr7s4CnClbVSIq7hpls3H4Y3qYTDwswcxCCCE,1763
 ocf_data_sampler/select/time_slice_for_dataset.py,sha256=Z7pOiilSHScxmBKZNG18K5J-S4ifdXXAYGZoHRHD3AY,4324
 ocf_data_sampler/torch_datasets/datasets/__init__.py,sha256=jfJSFcR0eO1AqeH7S3KnGjsBqVZT5w3oyi784PUR6Q0,146
-ocf_data_sampler/torch_datasets/datasets/pvnet_uk.py,sha256=xuNJyCXZ4dZ9UldX1lqOoRSRNP39Vcy0DR77Vr7dxlk,11895
-ocf_data_sampler/torch_datasets/datasets/site.py,sha256=ZjvJS0mWUyQE7ZcrhS1TdMHaPrEZXVbBAv2vDwBvQwA,16044
+ocf_data_sampler/torch_datasets/datasets/pvnet_uk.py,sha256=N85duDyEm6LIYgYIpLhrpxHddMIcvFosuZg8rzIztwE,12267
+ocf_data_sampler/torch_datasets/datasets/site.py,sha256=L_4w967ZxPjd7vHRkPtj7ZSmamEShKRT28j9_f-enJY,16228
 ocf_data_sampler/torch_datasets/utils/merge_and_fill_utils.py,sha256=hIbekql64eXsNDFIoEc--GWxwdVWrh2qKegdOi70Bow,874
 ocf_data_sampler/torch_datasets/utils/valid_time_periods.py,sha256=Qo65qUHtle_bW5tLTYr7empHTRv-lpjvfx_6GNJj3Xg,4371
+ocf_data_sampler/torch_datasets/utils/validate_channels.py,sha256=u2EpiFAKAOHpmvINhOUJCT8Vbc-cle6qJ3YNVse4yLs,2884
 scripts/refactor_site.py,sha256=asZ27hQ4IyXgCCUaFJqcz1ObBNcV2W3ywqHBpSXA_fc,1728
 tests/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 tests/conftest.py,sha256=RlC7YYtBLipUzFS1tQxela1SgHCxSpReUKEJ4429PwQ,7689
@@ -67,14 +68,15 @@ tests/select/test_find_contiguous_time_periods.py,sha256=kOga_V7er5We7ewMARXaKdM
 tests/select/test_location.py,sha256=_WZk2FPYeJ-nIfCJS6Sp_yaVEEo7m31DmMFoZzgyCts,2712
 tests/select/test_select_spatial_slice.py,sha256=7EX9b6g-pMdACQx3yefjs5do2s-Rho2UmKevV4oglsU,5147
 tests/select/test_select_time_slice.py,sha256=nYrdlmZlGEygJKiE26bADiluNPN1qt5kD4FrI2vtxUw,9686
-tests/test_sample/test_base.py,sha256=ljtB38MmscTGN6OvUgclBceNnfx6m7AN8iHYDml9XW4,2189
+tests/test_sample/test_base.py,sha256=CkqKCZbrq3Vb4T7bOwPh3_0p8OTl0LfSLNBctYC_jag,4199
 tests/test_sample/test_site_sample.py,sha256=Gln-Or060cUWvA7Q7c1vsthgCttOAM2z9yBI9zUIrDw,6238
 tests/test_sample/test_uk_regional_sample.py,sha256=gkeQWC2wC757jKJz_QBmDMFQjn3R54q_tEo948yyxCY,4840
 tests/torch_datasets/test_merge_and_fill_utils.py,sha256=GtuQg82BM1eHQjT7Ik1x1zaVcuc7KJO4_NC9stXsd4s,1123
-tests/torch_datasets/test_pvnet_uk.py,sha256=loueo7PUUYJVda3-vBn3bQIC_zgrTAThfx-GTDcBOZg,5596
+tests/torch_datasets/test_pvnet_uk.py,sha256=F0D-DugFgVtt8G1q7lylmPLrOZj6H6YPNd9s_6Wn_yM,5594
 tests/torch_datasets/test_site.py,sha256=t57vAR_RRWcbG_kEFk6VrFCYzVxwFG6qJKBnRHF02fM,7000
-ocf_data_sampler-0.1.6.dist-info/LICENSE,sha256=F-Q3UFCR-BECSocV55BFDpn4YKxve9PKrm-lTt6o_Tg,1073
-ocf_data_sampler-0.1.6.dist-info/METADATA,sha256=qltSR8dsD54ufCfXXFFYYLY_l_1saBWGaxwzZDIaJoU,12173
-ocf_data_sampler-0.1.6.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
-ocf_data_sampler-0.1.6.dist-info/top_level.txt,sha256=Faob6N6cFdPc5eUpCTYcXgCaNhi4XLLteUL5W5ayYmg,31
-ocf_data_sampler-0.1.6.dist-info/RECORD,,
+tests/torch_datasets/test_validate_channels_utils.py,sha256=Rzdweu98j1of45jCOUrSiBtyPlf-dDaCceulf0H7ml8,2921
+ocf_data_sampler-0.1.8.dist-info/LICENSE,sha256=F-Q3UFCR-BECSocV55BFDpn4YKxve9PKrm-lTt6o_Tg,1073
+ocf_data_sampler-0.1.8.dist-info/METADATA,sha256=hWohmy0-J73u-uy3MPEG0_tuprAXOh32hX8WyIDPqaU,12173
+ocf_data_sampler-0.1.8.dist-info/WHEEL,sha256=In9FTNxeP60KnTkGw7wk6mJPYd_dQSjEZmXdBdMCI-8,91
+ocf_data_sampler-0.1.8.dist-info/top_level.txt,sha256=Faob6N6cFdPc5eUpCTYcXgCaNhi4XLLteUL5W5ayYmg,31
+ocf_data_sampler-0.1.8.dist-info/RECORD,,

tests/test_sample/test_base.py CHANGED Viewed

@@ -3,11 +3,14 @@ Base class testing - SampleBase
 """
 import pytest
+import torch
 import numpy as np
 from pathlib import Path
-from ocf_data_sampler.sample.base import SampleBase
+from ocf_data_sampler.sample.base import (
+    SampleBase,
+    batch_to_tensor
+)
 class TestSample(SampleBase):
     """
@@ -84,3 +87,61 @@ def test_sample_base_to_numpy():
     assert isinstance(numpy_data, dict)
     assert all(isinstance(value, np.ndarray) for value in numpy_data.values())
     assert np.array_equal(numpy_data['list_data'], np.array([1, 2, 3]))
+def test_batch_to_tensor_nested():
+    """ Test nested dictionary conversion """
+    batch = {
+        'outer': {
+            'inner': np.array([1, 2, 3])
+        }
+    }
+    tensor_batch = batch_to_tensor(batch)
+    assert torch.equal(tensor_batch['outer']['inner'], torch.tensor([1, 2, 3]))
+def test_batch_to_tensor_mixed_types():
+    """ Test handling of mixed data types """
+    batch = {
+        'tensor_data': np.array([1, 2, 3]),
+        'string_data': 'not_a_tensor',
+        'nested': {
+            'numbers': np.array([4, 5, 6]),
+            'text': 'still_not_a_tensor'
+        }
+    }
+    tensor_batch = batch_to_tensor(batch)
+    assert isinstance(tensor_batch['tensor_data'], torch.Tensor)
+    assert isinstance(tensor_batch['string_data'], str)
+    assert isinstance(tensor_batch['nested']['numbers'], torch.Tensor)
+    assert isinstance(tensor_batch['nested']['text'], str)
+def test_batch_to_tensor_different_dtypes():
+    """ Test conversion of arrays with different dtypes """
+    batch = {
+        'float_data': np.array([1.0, 2.0, 3.0], dtype=np.float32),
+        'int_data': np.array([1, 2, 3], dtype=np.int64),
+        'bool_data': np.array([True, False, True], dtype=np.bool_)
+    }
+    tensor_batch = batch_to_tensor(batch)
+    assert isinstance(tensor_batch['bool_data'], torch.Tensor)
+    assert tensor_batch['float_data'].dtype == torch.float32
+    assert tensor_batch['int_data'].dtype == torch.int64
+    assert tensor_batch['bool_data'].dtype == torch.bool
+def test_batch_to_tensor_multidimensional():
+    """ Test conversion of multidimensional arrays """
+    batch = {
+        'matrix': np.array([[1, 2], [3, 4]]),
+        'tensor': np.array([[[1, 2], [3, 4]], [[5, 6], [7, 8]]])
+    }
+    tensor_batch = batch_to_tensor(batch)
+    assert tensor_batch['matrix'].shape == (2, 2)
+    assert tensor_batch['tensor'].shape == (2, 2, 2)
+    assert torch.equal(tensor_batch['matrix'], torch.tensor([[1, 2], [3, 4]]))

tests/torch_datasets/test_pvnet_uk.py CHANGED Viewed

@@ -24,7 +24,7 @@ def test_process_and_combine_datasets(pvnet_config_filename):
         dims=["time_utc", "channel", "y", "x"],
         coords={
             "time_utc": pd.date_range("2024-01-01 00:00", periods=4, freq="h"),
-            "channel": ["t2m", "dswrf"],
+            "channel": ["t", "dswrf"],
             "step": ("time_utc", pd.timedelta_range(start='0h', periods=4, freq='h')),
             "init_time_utc": pd.Timestamp("2024-01-01 00:00")
         }
@@ -54,7 +54,7 @@ def test_process_and_combine_datasets(pvnet_config_filename):
     assert isinstance(sample, dict)
     assert "nwp" in sample
     assert sample["satellite_actual"].shape == (7, 1, 2, 2)
-    assert sample["nwp"]["ukv"]["nwp"].shape == (4, 1, 2, 2)
+    assert sample["nwp"]["ukv"]["nwp"].shape == (4, 2, 2, 2)
     assert "gsp_id" in sample

tests/torch_datasets/test_validate_channels_utils.py ADDED Viewed

@@ -0,0 +1,78 @@
+"""Tests for channel validation utility functions"""
+import pytest
+from ocf_data_sampler.torch_datasets.utils.validate_channels import (
+    validate_channels,
+    validate_nwp_channels,
+    validate_satellite_channels,
+)
+class TestChannelValidation:
+    """Tests for channel validation functions"""
+    @pytest.mark.parametrize("test_case", [
+        # Base validation - success case
+        {
+            "data_channels": ["channel1", "channel2"],
+            "norm_channels": ["channel1", "channel2", "extra"],
+            "source_name": "test_source",
+            "expect_error": False
+        },
+        # Base validation - error case
+        {
+            "data_channels": ["channel1", "missing_channel"],
+            "norm_channels": ["channel1"],
+            "source_name": "test_source",
+            "expect_error": True,
+            "error_match": "following channels for test_source are missing in normalisation means"
+        },
+        # NWP case - success
+        {
+            "data_channels": ["t2m", "dswrf"],
+            "norm_channels": ["t2m", "dswrf", "extra"],
+            "source_name": "ecmwf",
+            "expect_error": False
+        },
+        # NWP case - error
+        {
+            "data_channels": ["t2m", "missing_channel"],
+            "norm_channels": ["t2m"],
+            "source_name": "ecmwf",
+            "expect_error": True,
+            "error_match": "following channels for ecmwf are missing in normalisation means"
+        },
+        # Satellite case - success
+        {
+            "data_channels": ["IR_016", "VIS006"],
+            "norm_channels": ["IR_016", "VIS006", "extra"],
+            "source_name": "satellite",
+            "expect_error": False
+        },
+        # Satellite case - error
+        {
+            "data_channels": ["IR_016", "missing_channel"],
+            "norm_channels": ["IR_016"],
+            "source_name": "satellite",
+            "expect_error": True,
+            "error_match": "following channels for satellite are missing in normalisation means"
+        }
+    ])
+    def test_channel_validation(self, test_case):
+        """Test channel validation for both base, NWP and satellite data"""
+        if test_case["expect_error"]:
+            with pytest.raises(ValueError, match=test_case["error_match"]):
+                validate_channels(
+                    data_channels=test_case["data_channels"],
+                    means_channels=test_case["norm_channels"],
+                    stds_channels=test_case["norm_channels"],
+                    source_name=test_case["source_name"]
+                )
+        else:
+            # Should not raise any exceptions
+            validate_channels(
+                data_channels=test_case["data_channels"],
+                means_channels=test_case["norm_channels"],
+                stds_channels=test_case["norm_channels"],
+                source_name=test_case["source_name"]
+            )

{ocf_data_sampler-0.1.6.dist-info → ocf_data_sampler-0.1.8.dist-info}/LICENSE RENAMED Viewed

File without changes

{ocf_data_sampler-0.1.6.dist-info → ocf_data_sampler-0.1.8.dist-info}/WHEEL RENAMED Viewed

File without changes

{ocf_data_sampler-0.1.6.dist-info → ocf_data_sampler-0.1.8.dist-info}/top_level.txt RENAMED Viewed

File without changes

ocf-data-sampler 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl

Potentially problematic release.

ocf-data-sampler 0.1.6__py3-none-any.whl → 0.1.8__py3-none-any.whl