disdrodb 0.1.4__py3-none-any.whl → 0.2.0__py3-none-any.whl
This diff shows the changes between publicly available package versions as released to a supported registry. It is provided for informational purposes only.
- disdrodb/__init__.py +1 -5
- disdrodb/_version.py +2 -2
- disdrodb/accessor/methods.py +14 -3
- disdrodb/api/checks.py +10 -0
- disdrodb/api/create_directories.py +0 -2
- disdrodb/api/io.py +14 -17
- disdrodb/api/path.py +42 -77
- disdrodb/api/search.py +89 -23
- disdrodb/cli/disdrodb_create_summary.py +11 -1
- disdrodb/cli/disdrodb_create_summary_station.py +10 -0
- disdrodb/cli/disdrodb_run_l0.py +1 -1
- disdrodb/cli/disdrodb_run_l0a.py +1 -1
- disdrodb/cli/disdrodb_run_l0b.py +1 -1
- disdrodb/cli/disdrodb_run_l0c.py +1 -1
- disdrodb/cli/disdrodb_run_l1.py +1 -1
- disdrodb/cli/disdrodb_run_l2e.py +1 -1
- disdrodb/cli/disdrodb_run_l2m.py +1 -1
- disdrodb/configs.py +30 -83
- disdrodb/constants.py +4 -3
- disdrodb/data_transfer/download_data.py +4 -2
- disdrodb/docs.py +2 -2
- disdrodb/etc/products/L1/1MIN.yaml +13 -0
- disdrodb/etc/products/L1/LPM/1MIN.yaml +13 -0
- disdrodb/etc/products/L1/PARSIVEL/1MIN.yaml +13 -0
- disdrodb/etc/products/L1/PARSIVEL2/1MIN.yaml +13 -0
- disdrodb/etc/products/L1/PWS100/1MIN.yaml +13 -0
- disdrodb/etc/products/L1/RD80/1MIN.yaml +13 -0
- disdrodb/etc/products/L1/SWS250/1MIN.yaml +13 -0
- disdrodb/etc/products/L1/global.yaml +7 -1
- disdrodb/etc/products/L2E/10MIN.yaml +1 -12
- disdrodb/etc/products/L2E/5MIN.yaml +1 -0
- disdrodb/etc/products/L2E/global.yaml +1 -1
- disdrodb/etc/products/L2M/MODELS/GAMMA_GS_ND_MAE.yaml +6 -0
- disdrodb/etc/products/L2M/{GAMMA_ML.yaml → MODELS/GAMMA_ML.yaml} +1 -1
- disdrodb/etc/products/L2M/MODELS/LOGNORMAL_GS_LOG_ND_MAE.yaml +6 -0
- disdrodb/etc/products/L2M/MODELS/LOGNORMAL_GS_ND_MAE.yaml +6 -0
- disdrodb/etc/products/L2M/MODELS/LOGNORMAL_ML.yaml +8 -0
- disdrodb/etc/products/L2M/MODELS/NGAMMA_GS_R_MAE.yaml +6 -0
- disdrodb/etc/products/L2M/global.yaml +11 -3
- disdrodb/l0/check_configs.py +49 -16
- disdrodb/l0/configs/LPM/l0a_encodings.yml +2 -2
- disdrodb/l0/configs/LPM/l0b_cf_attrs.yml +2 -2
- disdrodb/l0/configs/LPM/l0b_encodings.yml +2 -2
- disdrodb/l0/configs/LPM/raw_data_format.yml +2 -2
- disdrodb/l0/configs/PARSIVEL/l0b_encodings.yml +1 -1
- disdrodb/l0/configs/PWS100/l0b_encodings.yml +1 -0
- disdrodb/l0/configs/SWS250/bins_diameter.yml +108 -0
- disdrodb/l0/configs/SWS250/bins_velocity.yml +83 -0
- disdrodb/l0/configs/SWS250/l0a_encodings.yml +18 -0
- disdrodb/l0/configs/SWS250/l0b_cf_attrs.yml +72 -0
- disdrodb/l0/configs/SWS250/l0b_encodings.yml +155 -0
- disdrodb/l0/configs/SWS250/raw_data_format.yml +148 -0
- disdrodb/l0/l0_reader.py +2 -2
- disdrodb/l0/l0b_processing.py +70 -15
- disdrodb/l0/l0c_processing.py +7 -3
- disdrodb/l0/readers/LPM/ARM/ARM_LPM.py +1 -1
- disdrodb/l0/readers/LPM/AUSTRALIA/MELBOURNE_2007_LPM.py +2 -2
- disdrodb/l0/readers/LPM/BELGIUM/ULIEGE.py +256 -0
- disdrodb/l0/readers/LPM/BRAZIL/CHUVA_LPM.py +2 -2
- disdrodb/l0/readers/LPM/BRAZIL/GOAMAZON_LPM.py +2 -2
- disdrodb/l0/readers/LPM/GERMANY/DWD.py +491 -0
- disdrodb/l0/readers/LPM/ITALY/GID_LPM.py +2 -2
- disdrodb/l0/readers/LPM/ITALY/GID_LPM_W.py +2 -2
- disdrodb/l0/readers/LPM/KIT/CHWALA.py +2 -2
- disdrodb/l0/readers/LPM/SLOVENIA/ARSO.py +107 -12
- disdrodb/l0/readers/LPM/SLOVENIA/UL.py +3 -3
- disdrodb/l0/readers/LPM/SWITZERLAND/INNERERIZ_LPM.py +2 -2
- disdrodb/l0/readers/PARSIVEL/BASQUECOUNTRY/EUSKALMET_OTT.py +227 -0
- disdrodb/l0/readers/PARSIVEL/{GPM → NASA}/LPVEX.py +1 -1
- disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2010.py +5 -14
- disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2010_UF.py +8 -17
- disdrodb/l0/readers/PARSIVEL/SLOVENIA/UL.py +117 -8
- disdrodb/l0/readers/PARSIVEL2/BASQUECOUNTRY/EUSKALMET_OTT2.py +232 -0
- disdrodb/l0/readers/PARSIVEL2/BRAZIL/CHUVA_PARSIVEL2.py +10 -14
- disdrodb/l0/readers/PARSIVEL2/BRAZIL/GOAMAZON_PARSIVEL2.py +10 -14
- disdrodb/l0/readers/PARSIVEL2/DENMARK/DTU.py +8 -14
- disdrodb/l0/readers/PARSIVEL2/DENMARK/EROSION_raw.py +382 -0
- disdrodb/l0/readers/PARSIVEL2/FINLAND/FMI_PARSIVEL2.py +4 -0
- disdrodb/l0/readers/PARSIVEL2/FRANCE/OSUG.py +1 -1
- disdrodb/l0/readers/PARSIVEL2/GREECE/NOA.py +127 -0
- disdrodb/l0/readers/PARSIVEL2/ITALY/HYDROX.py +239 -0
- disdrodb/l0/readers/PARSIVEL2/NCAR/FARM_PARSIVEL2.py +5 -11
- disdrodb/l0/readers/PARSIVEL2/NCAR/PERILS_MIPS.py +4 -17
- disdrodb/l0/readers/PARSIVEL2/NCAR/RELAMPAGO_PARSIVEL2.py +5 -14
- disdrodb/l0/readers/PARSIVEL2/NCAR/SNOWIE_PJ.py +10 -13
- disdrodb/l0/readers/PARSIVEL2/NCAR/SNOWIE_SB.py +10 -13
- disdrodb/l0/readers/PARSIVEL2/PHILIPPINES/PAGASA.py +232 -0
- disdrodb/l0/readers/PARSIVEL2/SPAIN/CENER.py +6 -18
- disdrodb/l0/readers/PARSIVEL2/{NASA/LPVEX.py → SPAIN/GRANADA.py} +46 -35
- disdrodb/l0/readers/PARSIVEL2/SWEDEN/SMHI.py +189 -0
- disdrodb/l0/readers/PARSIVEL2/USA/{C3WE.py → CW3E.py} +10 -28
- disdrodb/l0/readers/PWS100/AUSTRIA/HOAL.py +321 -0
- disdrodb/l0/readers/SW250/BELGIUM/KMI.py +239 -0
- disdrodb/l1/beard_model.py +31 -129
- disdrodb/l1/fall_velocity.py +136 -83
- disdrodb/l1/filters.py +25 -28
- disdrodb/l1/processing.py +16 -17
- disdrodb/l1/resampling.py +101 -38
- disdrodb/l1_env/routines.py +46 -17
- disdrodb/l2/empirical_dsd.py +6 -0
- disdrodb/l2/processing.py +6 -5
- disdrodb/metadata/geolocation.py +0 -2
- disdrodb/metadata/search.py +3 -4
- disdrodb/psd/fitting.py +16 -13
- disdrodb/routines/l0.py +2 -2
- disdrodb/routines/l1.py +173 -60
- disdrodb/routines/l2.py +148 -284
- disdrodb/routines/options.py +345 -0
- disdrodb/routines/wrappers.py +14 -1
- disdrodb/scattering/axis_ratio.py +90 -84
- disdrodb/scattering/permittivity.py +6 -0
- disdrodb/summary/routines.py +735 -670
- disdrodb/utils/archiving.py +51 -44
- disdrodb/utils/attrs.py +3 -1
- disdrodb/utils/dask.py +4 -4
- disdrodb/utils/dict.py +33 -0
- disdrodb/utils/encoding.py +6 -1
- disdrodb/utils/routines.py +9 -8
- disdrodb/utils/time.py +11 -3
- disdrodb/viz/__init__.py +0 -13
- disdrodb/viz/plots.py +231 -1
- {disdrodb-0.1.4.dist-info → disdrodb-0.2.0.dist-info}/METADATA +2 -1
- {disdrodb-0.1.4.dist-info → disdrodb-0.2.0.dist-info}/RECORD +135 -103
- /disdrodb/etc/products/L2M/{NGAMMA_GS_LOG_ND_MAE.yaml → MODELS/NGAMMA_GS_LOG_ND_MAE.yaml} +0 -0
- /disdrodb/etc/products/L2M/{NGAMMA_GS_ND_MAE.yaml → MODELS/NGAMMA_GS_ND_MAE.yaml} +0 -0
- /disdrodb/etc/products/L2M/{NGAMMA_GS_Z_MAE.yaml → MODELS/NGAMMA_GS_Z_MAE.yaml} +0 -0
- /disdrodb/l0/readers/PARSIVEL/{GPM → NASA}/IFLOODS.py +0 -0
- /disdrodb/l0/readers/PARSIVEL/{GPM → NASA}/MC3E.py +0 -0
- /disdrodb/l0/readers/PARSIVEL/{GPM → NASA}/PIERS.py +0 -0
- /disdrodb/l0/readers/PARSIVEL2/{GPM → NASA}/GCPEX.py +0 -0
- /disdrodb/l0/readers/PARSIVEL2/{GPM → NASA}/NSSTC.py +0 -0
- {disdrodb-0.1.4.dist-info → disdrodb-0.2.0.dist-info}/WHEEL +0 -0
- {disdrodb-0.1.4.dist-info → disdrodb-0.2.0.dist-info}/entry_points.txt +0 -0
- {disdrodb-0.1.4.dist-info → disdrodb-0.2.0.dist-info}/licenses/LICENSE +0 -0
- {disdrodb-0.1.4.dist-info → disdrodb-0.2.0.dist-info}/top_level.txt +0 -0
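Besides the new SWS250 sensor configuration and the batch of new readers, the file list shows three structural moves: the L2M model YAMLs are regrouped under a `MODELS/` subdirectory, the PARSIVEL/PARSIVEL2 `GPM` readers move under `NASA/`, and L2 processing options are centralized in the new `disdrodb/routines/options.py` module (345 added lines). The `disdrodb/routines/l2.py` diff below shows the corresponding import migration; here is a minimal sketch of the new import surface, using only names that appear in the diff's added lines and assuming disdrodb 0.2.0 is installed:

```python
# disdrodb 0.2.0: L2 processing helpers now live in routines.options.
# In 0.1.4 these names came from disdrodb.configs and disdrodb.utils.routines,
# and routines/l2.py defined its own module-local ProcessingOptions class.
from disdrodb.routines.options import (
    L2ProcessingOptions,               # replaces l2.py's ProcessingOptions class
    get_model_options,                 # previously in disdrodb.configs
    get_product_temporal_resolutions,  # previously in disdrodb.configs
    is_possible_product,               # previously in disdrodb.utils.routines
)
```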
disdrodb/routines/l2.py
CHANGED
```diff
@@ -18,7 +18,6 @@
 
 import copy
 import datetime
-import json
 import logging
 import os
 import time
@@ -31,195 +30,51 @@ from disdrodb.api.create_directories import (
     create_logs_directory,
     create_product_directory,
 )
-from disdrodb.api.info import group_filepaths
 from disdrodb.api.io import open_netcdf_files
 from disdrodb.api.path import (
     define_file_folder_path,
     define_l2e_filename,
     define_l2m_filename,
-    define_temporal_resolution,
 )
 from disdrodb.api.search import get_required_product
 from disdrodb.configs import (
     get_data_archive_dir,
     get_metadata_archive_dir,
-    get_model_options,
-    get_product_options,
-    get_product_temporal_resolutions,
 )
-from disdrodb.l1.resampling import resample_dataset
 from disdrodb.l2.processing import (
     generate_l2_radar,
     generate_l2e,
     generate_l2m,
 )
 from disdrodb.metadata import read_station_metadata
+from disdrodb.routines.options import (
+    L2ProcessingOptions,
+    get_model_options,
+    get_product_temporal_resolutions,
+    is_possible_product,
+)
 from disdrodb.scattering.routines import precompute_scattering_tables
-from disdrodb.utils.archiving import define_temporal_partitions, get_files_partitions
 from disdrodb.utils.dask import execute_tasks_safely
 from disdrodb.utils.decorators import delayed_if_parallel, single_threaded_if_parallel
-from disdrodb.utils.list import flatten_list
-
-# Logger
 from disdrodb.utils.logger import (
     create_product_logs,
     log_info,
 )
 from disdrodb.utils.routines import (
-    is_possible_product,
     run_product_generation,
     try_get_required_filepaths,
 )
-from disdrodb.utils.time import (
-    ensure_sample_interval_in_seconds,
-    get_resampling_information,
-)
 from disdrodb.utils.writer import write_product
 
 logger = logging.getLogger(__name__)
 
 
-####----------------------------------------------------------------------------.
-
-
-class ProcessingOptions:
-    """Define L2 products processing options."""
-
-    # TODO: TO MOVE ELSEWHERE (AFTER L1 REFACTORING !)
-
-    def __init__(self, product, filepaths, parallel, temporal_resolutions=None):
-        """Define L2 products processing options."""
-        import disdrodb
-
-        # ---------------------------------------------------------------------.
-        # Define temporal resolutions for which to retrieve processing options
-        if temporal_resolutions is None:
-            temporal_resolutions = get_product_temporal_resolutions(product)
-        elif isinstance(temporal_resolutions, str):
-            temporal_resolutions = [temporal_resolutions]
-
-        # ---------------------------------------------------------------------.
-        # Get product options at various temporal resolutions
-        dict_product_options = {
-            temporal_resolution: get_product_options(product, temporal_resolution=temporal_resolution)
-            for temporal_resolution in temporal_resolutions
-        }
-
-        # ---------------------------------------------------------------------.
-        # Group filepaths by source sample intervals
-        # - Typically the sample interval is fixed and is just one
-        # - Some stations might change the sample interval along the years
-        # - For each sample interval, separated processing take place here after !
-        dict_filepaths = group_filepaths(filepaths, groups="sample_interval")
-
-        # ---------------------------------------------------------------------.
-        # Retrieve processing information for each temporal resolution
-        dict_folder_partitioning = {}
-        dict_files_partitions = {}
-        _cache_dict_list_partitions: dict[str, dict] = {}
-        for temporal_resolution in temporal_resolutions:
-
-            # -------------------------------------------------------------------------.
-            # Retrieve product options
-            product_options = dict_product_options[temporal_resolution].copy()
-
-            # Retrieve accumulation_interval and rolling option
-            accumulation_interval, rolling = get_resampling_information(temporal_resolution)
-
-            # Extract processing options
-            archive_options = product_options.pop("archive_options")
-
-            dict_product_options[temporal_resolution] = product_options
-            # -------------------------------------------------------------------------.
-            # Define folder partitioning
-            if "folder_partitioning" not in archive_options:
-                dict_folder_partitioning[temporal_resolution] = disdrodb.config.get("folder_partitioning")
-            else:
-                dict_folder_partitioning[temporal_resolution] = archive_options.pop("folder_partitioning")
-
-            # -------------------------------------------------------------------------.
-            # Define list of temporal partitions
-            # - [{start_time: np.datetime64, end_time: np.datetime64}, ....]
-            # - Either strategy: "event" or "time_block" or save_by_time_block"
-            # - "event" requires loading data into memory to identify events
-            # --> Does some data filtering on what to process !
-            # - "time_block" does not require loading data into memory
-            # --> Does not do data filtering on what to process !
-            # --> Here we cache dict_list_partitions so that we don't need to recompute
-            #     stuffs if processing options are the same
-            key = json.dumps(archive_options, sort_keys=True)
-            if key not in _cache_dict_list_partitions:
-                _cache_dict_list_partitions[key] = {
-                    sample_interval: define_temporal_partitions(filepaths, parallel=parallel, **archive_options)
-                    for sample_interval, filepaths in dict_filepaths.items()
-                }
-            dict_list_partitions = _cache_dict_list_partitions[key].copy()  # To avoid in-place replacement
-
-            # ------------------------------------------------------------------.
-            # Group filepaths by temporal partitions
-            # - This is done separately for each possible source sample interval
-            # - It groups filepaths by start_time and end_time provided by list_partitions
-            # - Here 'events' can also simply be period of times ('day', 'months', ...)
-            # - When aggregating/resampling/accumulating data, we need to load also
-            #   some data after the actual event end_time to ensure that the resampled dataset
-            #   contains the event_end_time
-            # --> get_files_partitions adjust the event end_time to accounts for the required "border" data.
-            # - ATTENTION: get_files_partitions returns start_time and end_time as datetime objects !
-            files_partitions = [
-                get_files_partitions(
-                    list_partitions=list_partitions,
-                    filepaths=dict_filepaths[sample_interval],
-                    sample_interval=sample_interval,
-                    accumulation_interval=accumulation_interval,
-                    rolling=rolling,
-                )
-                for sample_interval, list_partitions in dict_list_partitions.items()
-                if product != "L2E"
-                or is_possible_product(
-                    accumulation_interval=accumulation_interval,
-                    sample_interval=sample_interval,
-                    rolling=rolling,
-                )
-            ]
-            files_partitions = flatten_list(files_partitions)
-            dict_files_partitions[temporal_resolution] = files_partitions
-
-        # ------------------------------------------------------------------.
-        # Keep only temporal_resolutions for which events could be defined
-        # - Remove e.g when not compatible accumulation_interval with source sample_interval
-        temporal_resolutions = [
-            temporal_resolution
-            for temporal_resolution in temporal_resolutions
-            if len(dict_files_partitions[temporal_resolution]) > 0
-        ]
-        # ------------------------------------------------------------------.
-        # Add attributes
-        self.temporal_resolutions = temporal_resolutions
-        self.dict_files_partitions = dict_files_partitions
-        self.dict_product_options = dict_product_options
-        self.dict_folder_partitioning = dict_folder_partitioning
-
-    def get_files_partitions(self, temporal_resolution):
-        """Return files partitions dictionary for a specific L2E product."""
-        return self.dict_files_partitions[temporal_resolution]
-
-    def get_product_options(self, temporal_resolution):
-        """Return product options dictionary for a specific L2E product."""
-        return self.dict_product_options[temporal_resolution]
-
-    def get_folder_partitioning(self, temporal_resolution):
-        """Return the folder partitioning for a specific L2E product."""
-        # to be used for logs and files !
-        return self.dict_folder_partitioning[temporal_resolution]
-
-
 ####----------------------------------------------------------------------------.
 #### L2E
 
 
-def define_l2e_logs_filename(campaign_name, station_name, start_time, end_time,
+def define_l2e_logs_filename(campaign_name, station_name, start_time, end_time, temporal_resolution):
     """Define L2E logs filename."""
-    temporal_resolution = define_temporal_resolution(seconds=accumulation_interval, rolling=rolling)
     starting_time = pd.to_datetime(start_time).strftime("%Y%m%d%H%M%S")
     ending_time = pd.to_datetime(end_time).strftime("%Y%m%d%H%M%S")
     logs_filename = f"L2E.{temporal_resolution}.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}"
@@ -239,8 +94,7 @@ def _generate_l2e(
     campaign_name,
     station_name,
     # L2E options
-
-    rolling,
+    temporal_resolution,
     product_options,
     # Processing options
     force,
@@ -254,42 +108,28 @@ def _generate_l2e(
     # Define product processing function
     def core(
         filepaths,
+        start_time,
+        end_time,
         campaign_name,
         station_name,
-        product_options,
         # Processing options
         logger,
         parallel,
         verbose,
         force,
-        #
-
-
-        accumulation_interval,
-        rolling,
+        # Product options
+        temporal_resolution,
+        product_options,
         # Archiving arguments
         data_dir,
         folder_partitioning,
     ):
-        """Define
+        """Define L2E product processing."""
         # Copy to avoid in-place replacement (outside this function)
         product_options = product_options.copy()
 
         # Open the dataset over the period of interest
-        ds = open_netcdf_files(filepaths, start_time=start_time, end_time=end_time, parallel=False)
-        ds = ds.load()
-        ds.close()
-
-        # Resample dataset  # TODO: in future to perform in L1
-        # - Define sample interval in seconds
-        sample_interval = ensure_sample_interval_in_seconds(ds["sample_interval"]).to_numpy().item()
-        # - Resample dataset
-        ds = resample_dataset(
-            ds=ds,
-            sample_interval=sample_interval,
-            accumulation_interval=accumulation_interval,
-            rolling=rolling,
-        )
+        ds = open_netcdf_files(filepaths, start_time=start_time, end_time=end_time, parallel=False, compute=True)
 
         # Extract L2E processing options
         l2e_options = product_options.get("product_options")
@@ -320,8 +160,7 @@ def _generate_l2e(
             ds,
             campaign_name=campaign_name,
             station_name=station_name,
-
-            rolling=rolling,
+            temporal_resolution=temporal_resolution,
         )
         folder_path = define_file_folder_path(ds, dir_path=data_dir, folder_partitioning=folder_partitioning)
         filepath = os.path.join(folder_path, filename)
@@ -333,14 +172,14 @@ def _generate_l2e(
     # Define product processing function kwargs
    core_func_kwargs = dict(  # noqa: C408
        filepaths=filepaths,
+        start_time=start_time,
+        end_time=end_time,
+        # Station info
        campaign_name=campaign_name,
        station_name=station_name,
+        # Product options
+        temporal_resolution=temporal_resolution,
        product_options=product_options,
-        # Resampling arguments
-        start_time=start_time,
-        end_time=end_time,
-        accumulation_interval=accumulation_interval,
-        rolling=rolling,
        # Archiving arguments
        data_dir=data_dir,
        folder_partitioning=folder_partitioning,
@@ -449,57 +288,85 @@ def run_l2e_station(
     msg = f"{product} processing of station {station_name} has started."
     log_info(logger=logger, msg=msg, verbose=verbose)
 
-    #
-    #
-    # - If
-
-
-        data_archive_dir=data_archive_dir,
+    # ---------------------------------------------------------------------.
+    # Retrieve source sampling interval
+    # - If a station has varying measurement interval over time, choose the smallest one !
+    metadata = read_station_metadata(
+        metadata_archive_dir=metadata_archive_dir,
         data_source=data_source,
         campaign_name=campaign_name,
         station_name=station_name,
-        product=required_product,
-        # Processing options
-        debugging_mode=debugging_mode,
     )
-
-
-
-    # -------------------------------------------------------------------------.
-    # Retrieve L2E processing options
-    l2e_processing_options = ProcessingOptions(product="L2E", filepaths=filepaths, parallel=parallel)
+    sample_interval = metadata["measurement_interval"]
+    if isinstance(sample_interval, list):
+        sample_interval = min(sample_interval)
 
-    #
+    # ---------------------------------------------------------------------.
     # Generate products for each temporal resolution
-    #
-    # accumulation_interval = 60
+    # temporal_resolution = "1MIN"
     # temporal_resolution = "10MIN"
-
-
+    temporal_resolutions = get_product_temporal_resolutions(product)
+    for temporal_resolution in temporal_resolutions:
 
-
-        #
-
-
+        # ------------------------------------------------------------------.
+        # Check if the product can be generated
+        if not is_possible_product(
+            temporal_resolution=temporal_resolution,
+            sample_interval=sample_interval,
+        ):
+            continue
 
-        #
-
+        # ---------------------------------------------------------------------.
+        # List files to process
+        # - If no data available, print error message and try with other L2E accumulation intervals
+        required_product = get_required_product(product)
+        filepaths = try_get_required_filepaths(
+            data_archive_dir=data_archive_dir,
+            data_source=data_source,
+            campaign_name=campaign_name,
+            station_name=station_name,
+            product=required_product,
+            # Processing options
+            debugging_mode=debugging_mode,
+            # Product options
+            temporal_resolution=temporal_resolution,
+        )
+        if filepaths is None:
+            continue
+
+        # ---------------------------------------------------------------------.
+        # Retrieve L2E processing options
+        l2e_processing_options = L2ProcessingOptions(
+            product=product,
+            temporal_resolution=temporal_resolution,
+            filepaths=filepaths,
+            parallel=parallel,
+        )
+
+        # ---------------------------------------------------------------------.
+        # Retrieve files temporal partitions
+        files_partitions = l2e_processing_options.files_partitions
+
+        if len(files_partitions) == 0:
+            msg = (
+                f"{product} processing of {data_source} {campaign_name} {station_name} "
+                + f"has not been launched because of missing {required_product} {temporal_resolution} data."
+            )
+            log_info(logger=logger, msg=msg, verbose=verbose)
+            continue
 
         # Retrieve folder partitioning (for files and logs)
-        folder_partitioning = l2e_processing_options.
+        folder_partitioning = l2e_processing_options.folder_partitioning
 
         # Retrieve product options
-        product_options = l2e_processing_options.
-
-        # Retrieve accumulation_interval and rolling option
-        accumulation_interval, rolling = get_resampling_information(temporal_resolution)
+        product_options = l2e_processing_options.product_options
 
         # Precompute required scattering tables
         if product_options["radar_enabled"]:
             radar_options = product_options["radar_options"]
             precompute_scattering_tables(verbose=verbose, **radar_options)
 
-        #
+        # ---------------------------------------------------------------------.
         # Create product directory
         data_dir = create_product_directory(
             data_archive_dir=data_archive_dir,
@@ -510,8 +377,7 @@ def run_l2e_station(
             product=product,
             force=force,
             # Option for L2E
-
-            rolling=rolling,
+            temporal_resolution=temporal_resolution,
         )
 
         # Define logs directory
@@ -522,11 +388,10 @@ def run_l2e_station(
             campaign_name=campaign_name,
             station_name=station_name,
             # Option for L2E
-
-            rolling=rolling,
+            temporal_resolution=temporal_resolution,
         )
 
-        #
+        # ---------------------------------------------------------------------.
         # Generate files
         # - L2E product generation is optionally parallelized over events
        # - If parallel=True, it does that in parallel using dask.delayed
@@ -542,15 +407,13 @@ def run_l2e_station(
                 station_name=station_name,
                 start_time=event_info["start_time"],
                 end_time=event_info["end_time"],
-
-                accumulation_interval=accumulation_interval,
+                temporal_resolution=temporal_resolution,
             ),
             folder_partitioning=folder_partitioning,
             campaign_name=campaign_name,
             station_name=station_name,
             # L2E options
-
-            accumulation_interval,
+            temporal_resolution=temporal_resolution,
             product_options=product_options,
             # Processing options
             force=force,
@@ -570,8 +433,7 @@ def run_l2e_station(
             station_name=station_name,
             data_archive_dir=data_archive_dir,
             # Product options
-
-            rolling=rolling,
+            temporal_resolution=temporal_resolution,
             # Logs list
             list_logs=list_logs,
         )
@@ -586,9 +448,8 @@ def run_l2e_station(
 
 ####----------------------------------------------------------------------------.
 #### L2M
-def define_l2m_logs_filename(campaign_name, station_name, start_time, end_time, model_name,
+def define_l2m_logs_filename(campaign_name, station_name, start_time, end_time, model_name, temporal_resolution):
     """Define L2M logs filename."""
-    temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
     starting_time = pd.to_datetime(start_time).strftime("%Y%m%d%H%M%S")
     ending_time = pd.to_datetime(end_time).strftime("%Y%m%d%H%M%S")
     logs_filename = (
@@ -610,8 +471,7 @@ def _generate_l2m(
     campaign_name,
     station_name,
     # L2M options
-
-    rolling,
+    temporal_resolution,
     model_name,
     product_options,
     # Processing options
@@ -636,14 +496,13 @@ def _generate_l2m(
         force,
         # Product options
         product_options,
-
-        rolling,
+        temporal_resolution,
         model_name,
         # Archiving arguments
         data_dir,
         folder_partitioning,
     ):
-        """Define
+        """Define L2M product processing."""
         # Copy to avoid in-place replacement (outside this function)
         product_options = product_options.copy()
 
@@ -655,7 +514,10 @@ def _generate_l2m(
 
         # Define variables to load
         optimization_kwargs = l2m_options["optimization_kwargs"]
-        if "init_method" in optimization_kwargs:
+        if "init_method" in optimization_kwargs and optimization_kwargs["init_method"] is None:
+            optimization_kwargs["init_method"] = "None"
+
+        if optimization_kwargs.get("init_method", "None") != "None":
             init_method = optimization_kwargs["init_method"]
             moments = [f"M{order}" for order in init_method.replace("M", "")] + ["M1"]
         else:
@@ -673,9 +535,14 @@ def _generate_l2m(
 
         ##------------------------------------------------------------------------.
         # Open the netCDF files
-        ds = open_netcdf_files(
-
-
+        ds = open_netcdf_files(
+            filepaths,
+            start_time=start_time,
+            end_time=end_time,
+            variables=variables,
+            parallel=False,
+            compute=True,
+        )
 
         # Produce L2M dataset
         ds = generate_l2m(
@@ -699,8 +566,7 @@ def _generate_l2m(
             ds,
             campaign_name=campaign_name,
             station_name=station_name,
-
-            rolling=rolling,
+            temporal_resolution=temporal_resolution,
             model_name=model_name,
         )
         folder_path = define_file_folder_path(ds, dir_path=data_dir, folder_partitioning=folder_partitioning)
@@ -722,8 +588,7 @@ def _generate_l2m(
         force=force,
         # Product options
        product_options=product_options,
-
-        rolling=rolling,
+        temporal_resolution=temporal_resolution,
        model_name=model_name,
        # Archiving arguments
        data_dir=data_dir,
@@ -835,19 +700,15 @@ def run_l2m_station(
     # Loop
     # temporal_resolution = "1MIN"
     # temporal_resolution = "10MIN"
-    temporal_resolutions = get_product_temporal_resolutions(
+    temporal_resolutions = get_product_temporal_resolutions(product)
     for temporal_resolution in temporal_resolutions:
 
-        # Retrieve accumulation_interval and rolling option
-        accumulation_interval, rolling = get_resampling_information(temporal_resolution)
-
         # ------------------------------------------------------------------.
-        #
-        if
-
-
-
-        if accumulation_interval < sample_interval:
+        # Check if the product can be generated
+        if not is_possible_product(
+            temporal_resolution=temporal_resolution,
+            sample_interval=sample_interval,
+        ):
             continue
 
         # -----------------------------------------------------------------.
@@ -863,29 +724,28 @@ def run_l2m_station(
             # Processing options
             debugging_mode=debugging_mode,
             # Product options
-
-            rolling=rolling,
+            temporal_resolution=temporal_resolution,
         )
         if filepaths is None:
             continue
 
         # -------------------------------------------------------------------------.
         # Retrieve L2M processing options
-        l2m_processing_options =
-            product=
-
+        l2m_processing_options = L2ProcessingOptions(
+            product=product,
+            temporal_resolution=temporal_resolution,
            filepaths=filepaths,
            parallel=parallel,
        )
 
        # Retrieve folder partitioning (for files and logs)
-        folder_partitioning = l2m_processing_options.
+        folder_partitioning = l2m_processing_options.folder_partitioning
 
        # Retrieve product options
-        global_product_options = l2m_processing_options.
+        global_product_options = l2m_processing_options.product_options
 
        # Retrieve files temporal partitions
-        files_partitions = l2m_processing_options.
+        files_partitions = l2m_processing_options.files_partitions
 
        if len(files_partitions) == 0:
            msg = (
@@ -898,6 +758,7 @@ def run_l2m_station(
         # -----------------------------------------------------------------.
         # Loop over distributions to fit
         # model_name = "GAMMA_ML"
+        # model_name = "LOGNORMAL_GS_ND_MAE"
         # model_options = l2m_options["models"][model_name]
         # Retrieve list of models to fit
         models = global_product_options.pop("models")
@@ -917,30 +778,37 @@ def run_l2m_station(
             precompute_scattering_tables(verbose=verbose, **radar_options)
 
             # -----------------------------------------------------------------.
-            msg = f"Production of L2M_{model_name} for
+            msg = f"Production of L2M_{model_name} for {temporal_resolution} has started."
             log_info(logger=logger, msg=msg, verbose=verbose)
             msg = f"Estimating {psd_model} parameters using {optimization}."
             log_info(logger=logger, msg=msg, verbose=verbose)
 
             # -------------------------------------------------------------.
             # Create product directory
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
+            try:
+                data_dir = create_product_directory(
+                    # DISDRODB root directories
+                    data_archive_dir=data_archive_dir,
+                    metadata_archive_dir=metadata_archive_dir,
+                    # Station arguments
+                    data_source=data_source,
+                    campaign_name=campaign_name,
+                    station_name=station_name,
+                    # Processing options
+                    product=product,
+                    force=force,
+                    # Option for L2E
+                    temporal_resolution=temporal_resolution,
+                    # Option for L2M
+                    model_name=model_name,
+                )
+            except Exception:
+                msg = (
+                    f"Production of L2M_{model_name} for {temporal_resolution} data has been "
+                    + "skipped because the product already exists and force=False."
+                )
+                log_info(logger=logger, msg=msg, verbose=verbose)
+                continue
 
             # Define logs directory
             logs_dir = create_logs_directory(
@@ -951,8 +819,7 @@ def run_l2m_station(
                 campaign_name=campaign_name,
                 station_name=station_name,
                 # Option for L2E
-
-                rolling=rolling,
+                temporal_resolution=temporal_resolution,
                 # Option for L2M
                 model_name=model_name,
             )
@@ -973,15 +840,13 @@ def run_l2m_station(
                     start_time=event_info["start_time"],
                     end_time=event_info["end_time"],
                     model_name=model_name,
-
-                    rolling=rolling,
+                    temporal_resolution=temporal_resolution,
                 ),
                 folder_partitioning=folder_partitioning,
                 campaign_name=campaign_name,
                 station_name=station_name,
                 # L2M options
-
-                rolling=rolling,
+                temporal_resolution=temporal_resolution,
                 model_name=model_name,
                 product_options=product_options,
                 # Processing options
@@ -1005,8 +870,7 @@ def run_l2m_station(
             data_archive_dir=data_archive_dir,
             # Product options
             model_name=model_name,
-
-            rolling=rolling,
+            temporal_resolution=temporal_resolution,
             # Logs list
             list_logs=list_logs,
         )
```
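Taken together, the l2.py changes replace every `(accumulation_interval, rolling)` argument pair with a single `temporal_resolution` string and move partition and option lookup into `L2ProcessingOptions`, whose per-resolution getter methods become plain attributes bound at construction. Below is a condensed sketch of the resulting driver loop; the function name `sketch_l2e_driver` is illustrative and not part of disdrodb, while the imported names and attributes all appear in the diff above:

```python
from disdrodb.routines.options import (
    L2ProcessingOptions,
    get_product_temporal_resolutions,
    is_possible_product,
)


def sketch_l2e_driver(filepaths, sample_interval, parallel=False):
    """Condensed form of the 0.2.0 run_l2e_station() loop (illustrative)."""
    for temporal_resolution in get_product_temporal_resolutions("L2E"):
        # Skip resolutions the source sampling interval cannot support
        # (0.1.4 used an explicit `accumulation_interval < sample_interval` check).
        if not is_possible_product(
            temporal_resolution=temporal_resolution,
            sample_interval=sample_interval,
        ):
            continue

        # One options object per (product, temporal_resolution) pair.
        options = L2ProcessingOptions(
            product="L2E",
            temporal_resolution=temporal_resolution,
            filepaths=filepaths,
            parallel=parallel,
        )
        if len(options.files_partitions) == 0:
            continue  # no input data at this temporal resolution

        # 0.1.4 exposed these via getter methods taking temporal_resolution;
        # 0.2.0 binds the resolution at construction and exposes attributes.
        yield (
            temporal_resolution,
            options.files_partitions,
            options.product_options,
            options.folder_partitioning,
        )
```

Binding the resolution at construction also removes the repeated `get_resampling_information()` decoding that 0.1.4 scattered through both the L2E and L2M routines.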