PyPI - disdrodb - Versions diffs - 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl - Mend

disdrodb 0.1.2py3-none-any.whl → 0.1.4py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (142) hide show

disdrodb/__init__.py +68 -34
disdrodb/_config.py +5 -4
disdrodb/_version.py +16 -3
disdrodb/accessor/__init__.py +20 -0
disdrodb/accessor/methods.py +125 -0
disdrodb/api/checks.py +177 -24
disdrodb/api/configs.py +3 -3
disdrodb/api/info.py +13 -13
disdrodb/api/io.py +281 -22
disdrodb/api/path.py +184 -195
disdrodb/api/search.py +18 -9
disdrodb/cli/disdrodb_create_summary.py +103 -0
disdrodb/cli/disdrodb_create_summary_station.py +91 -0
disdrodb/cli/disdrodb_run_l0.py +1 -1
disdrodb/cli/disdrodb_run_l0_station.py +1 -1
disdrodb/cli/disdrodb_run_l0a_station.py +1 -1
disdrodb/cli/disdrodb_run_l0b.py +1 -1
disdrodb/cli/disdrodb_run_l0b_station.py +3 -3
disdrodb/cli/disdrodb_run_l0c.py +1 -1
disdrodb/cli/disdrodb_run_l0c_station.py +3 -3
disdrodb/cli/disdrodb_run_l1_station.py +2 -2
disdrodb/cli/disdrodb_run_l2e_station.py +2 -2
disdrodb/cli/disdrodb_run_l2m_station.py +2 -2
disdrodb/configs.py +149 -4
disdrodb/constants.py +61 -0
disdrodb/data_transfer/download_data.py +127 -11
disdrodb/etc/configs/attributes.yaml +339 -0
disdrodb/etc/configs/encodings.yaml +473 -0
disdrodb/etc/products/L1/global.yaml +13 -0
disdrodb/etc/products/L2E/10MIN.yaml +12 -0
disdrodb/etc/products/L2E/1MIN.yaml +1 -0
disdrodb/etc/products/L2E/global.yaml +22 -0
disdrodb/etc/products/L2M/10MIN.yaml +12 -0
disdrodb/etc/products/L2M/GAMMA_ML.yaml +8 -0
disdrodb/etc/products/L2M/NGAMMA_GS_LOG_ND_MAE.yaml +6 -0
disdrodb/etc/products/L2M/NGAMMA_GS_ND_MAE.yaml +6 -0
disdrodb/etc/products/L2M/NGAMMA_GS_Z_MAE.yaml +6 -0
disdrodb/etc/products/L2M/global.yaml +26 -0
disdrodb/issue/writer.py +2 -0
disdrodb/l0/__init__.py +13 -0
disdrodb/l0/configs/LPM/l0b_cf_attrs.yml +4 -4
disdrodb/l0/configs/PARSIVEL/l0b_cf_attrs.yml +1 -1
disdrodb/l0/configs/PARSIVEL/l0b_encodings.yml +3 -3
disdrodb/l0/configs/PARSIVEL/raw_data_format.yml +1 -1
disdrodb/l0/configs/PARSIVEL2/l0b_cf_attrs.yml +5 -5
disdrodb/l0/configs/PARSIVEL2/l0b_encodings.yml +3 -3
disdrodb/l0/configs/PARSIVEL2/raw_data_format.yml +1 -1
disdrodb/l0/configs/PWS100/l0b_cf_attrs.yml +4 -4
disdrodb/l0/configs/PWS100/raw_data_format.yml +1 -1
disdrodb/l0/l0a_processing.py +37 -32
disdrodb/l0/l0b_nc_processing.py +118 -8
disdrodb/l0/l0b_processing.py +30 -65
disdrodb/l0/l0c_processing.py +369 -259
disdrodb/l0/readers/LPM/ARM/ARM_LPM.py +7 -0
disdrodb/l0/readers/LPM/NETHERLANDS/DELFT_LPM_NC.py +66 -0
disdrodb/l0/readers/LPM/SLOVENIA/{CRNI_VRH.py → UL.py} +3 -0
disdrodb/l0/readers/LPM/SWITZERLAND/INNERERIZ_LPM.py +195 -0
disdrodb/l0/readers/PARSIVEL/GPM/PIERS.py +0 -2
disdrodb/l0/readers/PARSIVEL/JAPAN/JMA.py +4 -1
disdrodb/l0/readers/PARSIVEL/NCAR/PECAN_MOBILE.py +1 -1
disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2009.py +1 -1
disdrodb/l0/readers/PARSIVEL2/ARM/ARM_PARSIVEL2.py +4 -0
disdrodb/l0/readers/PARSIVEL2/BELGIUM/ILVO.py +168 -0
disdrodb/l0/readers/PARSIVEL2/CANADA/UQAM_NC.py +69 -0
disdrodb/l0/readers/PARSIVEL2/DENMARK/DTU.py +165 -0
disdrodb/l0/readers/PARSIVEL2/FINLAND/FMI_PARSIVEL2.py +69 -0
disdrodb/l0/readers/PARSIVEL2/FRANCE/ENPC_PARSIVEL2.py +255 -134
disdrodb/l0/readers/PARSIVEL2/FRANCE/OSUG.py +525 -0
disdrodb/l0/readers/PARSIVEL2/FRANCE/SIRTA_PARSIVEL2.py +1 -1
disdrodb/l0/readers/PARSIVEL2/GPM/GCPEX.py +9 -7
disdrodb/l0/readers/PARSIVEL2/KIT/BURKINA_FASO.py +1 -1
disdrodb/l0/readers/PARSIVEL2/KIT/TEAMX.py +123 -0
disdrodb/l0/readers/PARSIVEL2/{NETHERLANDS/DELFT.py → MPI/BCO_PARSIVEL2.py} +41 -71
disdrodb/l0/readers/PARSIVEL2/MPI/BOWTIE.py +220 -0
disdrodb/l0/readers/PARSIVEL2/NASA/APU.py +120 -0
disdrodb/l0/readers/PARSIVEL2/NASA/LPVEX.py +109 -0
disdrodb/l0/readers/PARSIVEL2/NCAR/FARM_PARSIVEL2.py +1 -0
disdrodb/l0/readers/PARSIVEL2/NCAR/PECAN_FP3.py +1 -1
disdrodb/l0/readers/PARSIVEL2/NCAR/PERILS_MIPS.py +126 -0
disdrodb/l0/readers/PARSIVEL2/NCAR/PERILS_PIPS.py +165 -0
disdrodb/l0/readers/PARSIVEL2/NCAR/VORTEX_SE_2016_P2.py +1 -1
disdrodb/l0/readers/PARSIVEL2/NCAR/VORTEX_SE_2016_PIPS.py +20 -12
disdrodb/l0/readers/PARSIVEL2/NETHERLANDS/DELFT_NC.py +5 -0
disdrodb/l0/readers/PARSIVEL2/SPAIN/CENER.py +144 -0
disdrodb/l0/readers/PARSIVEL2/SPAIN/CR1000DL.py +201 -0
disdrodb/l0/readers/PARSIVEL2/SPAIN/LIAISE.py +137 -0
disdrodb/l0/readers/PARSIVEL2/USA/C3WE.py +146 -0
disdrodb/l0/readers/PWS100/FRANCE/ENPC_PWS100.py +105 -99
disdrodb/l0/readers/PWS100/FRANCE/ENPC_PWS100_SIRTA.py +151 -0
disdrodb/l1/__init__.py +5 -0
disdrodb/l1/fall_velocity.py +46 -0
disdrodb/l1/filters.py +34 -20
disdrodb/l1/processing.py +46 -45
disdrodb/l1/resampling.py +77 -66
disdrodb/l1_env/routines.py +18 -3
disdrodb/l2/__init__.py +7 -0
disdrodb/l2/empirical_dsd.py +58 -10
disdrodb/l2/processing.py +268 -117
disdrodb/metadata/checks.py +132 -125
disdrodb/metadata/standards.py +3 -1
disdrodb/psd/fitting.py +631 -345
disdrodb/psd/models.py +9 -6
disdrodb/routines/__init__.py +54 -0
disdrodb/{l0/routines.py → routines/l0.py} +316 -355
disdrodb/{l1/routines.py → routines/l1.py} +76 -116
disdrodb/routines/l2.py +1019 -0
disdrodb/{routines.py → routines/wrappers.py} +98 -10
disdrodb/scattering/__init__.py +16 -4
disdrodb/scattering/axis_ratio.py +61 -37
disdrodb/scattering/permittivity.py +504 -0
disdrodb/scattering/routines.py +746 -184
disdrodb/summary/__init__.py +17 -0
disdrodb/summary/routines.py +4196 -0
disdrodb/utils/archiving.py +434 -0
disdrodb/utils/attrs.py +68 -125
disdrodb/utils/cli.py +5 -5
disdrodb/utils/compression.py +30 -1
disdrodb/utils/dask.py +121 -9
disdrodb/utils/dataframe.py +61 -7
disdrodb/utils/decorators.py +31 -0
disdrodb/utils/directories.py +35 -15
disdrodb/utils/encoding.py +37 -19
disdrodb/{l2 → utils}/event.py +15 -173
disdrodb/utils/logger.py +14 -7
disdrodb/utils/manipulations.py +81 -0
disdrodb/utils/routines.py +166 -0
disdrodb/utils/subsetting.py +214 -0
disdrodb/utils/time.py +35 -177
disdrodb/utils/writer.py +20 -7
disdrodb/utils/xarray.py +5 -4
disdrodb/viz/__init__.py +13 -0
disdrodb/viz/plots.py +398 -0
{disdrodb-0.1.2.dist-info → disdrodb-0.1.4.dist-info}/METADATA +4 -3
{disdrodb-0.1.2.dist-info → disdrodb-0.1.4.dist-info}/RECORD +139 -98
{disdrodb-0.1.2.dist-info → disdrodb-0.1.4.dist-info}/entry_points.txt +2 -0
disdrodb/l1/encoding_attrs.py +0 -642
disdrodb/l2/processing_options.py +0 -213
disdrodb/l2/routines.py +0 -868
/disdrodb/l0/readers/PARSIVEL/SLOVENIA/{UL_FGG.py → UL.py} +0 -0
{disdrodb-0.1.2.dist-info → disdrodb-0.1.4.dist-info}/WHEEL +0 -0
{disdrodb-0.1.2.dist-info → disdrodb-0.1.4.dist-info}/licenses/LICENSE +0 -0
{disdrodb-0.1.2.dist-info → disdrodb-0.1.4.dist-info}/top_level.txt +0 -0

disdrodb/api/path.py CHANGED Viewed

@@ -20,11 +20,12 @@
 import os
 from disdrodb.configs import get_data_archive_dir, get_metadata_archive_dir
+from disdrodb.constants import ARCHIVE_VERSION
 from disdrodb.utils.directories import check_directory_exists
 from disdrodb.utils.time import (
     ensure_sample_interval_in_seconds,
     get_file_start_end_time,
-    seconds_to_acronym,
+    seconds_to_temporal_resolution,
 )
 ####--------------------------------------------------------------------------.
@@ -62,14 +63,13 @@ def define_disdrodb_path(
         The campaign name.
     check_exists : bool, optional
         Whether to check if the directory exists. The default value is ``True``.
+        Raise error if the directory does not exist.
     Returns
     -------
     dir_path : str
         Directory path
     """
-    from disdrodb import ARCHIVE_VERSION
     if len(campaign_name) > 0 and len(data_source) == 0:
         raise ValueError("If campaign_name is specified, data_source must be specified.")
@@ -82,7 +82,7 @@ def define_disdrodb_path(
         dir_path = os.path.join(archive_dir, ARCHIVE_VERSION, data_source, campaign_name)
     if check_exists:
         check_directory_exists(dir_path)
-    return dir_path
+    return os.path.normpath(dir_path)
 def define_data_source_dir(
@@ -108,6 +108,7 @@ def define_data_source_dir(
         If not specified, the path specified in the DISDRODB active configuration will be used.
     check_exists : bool, optional
         Whether to check if the directory exists. The default value is ``False``.
+        Raise error if the directory does not exist.
     Returns
     -------
@@ -349,7 +350,56 @@ def define_config_dir(product):
 #### Directory/Filepaths L0A and L0B products
-def define_file_folder_path(obj, data_dir, folder_partitioning):
+def define_partitioning_tree(time, folder_partitioning):
+    """Define the time directory tree given a timestep.
+    Parameters
+    ----------
+    time : datetime.datetime
+        Timestep.
+    folder_partitioning : str or None
+        Define the subdirectory structure where saving files.
+        Allowed values are:
+          - "": No partitioning. An empty directory tree is returned.
+          - "year": Files are saved under a subdirectory for the year.
+          - "year/month": Files are saved under subdirectories for year and month.
+          - "year/month/day": Files are saved under subdirectories for year, month and day
+          - "year/month_name": Files are stored under subdirectories by year and month name
+          - "year/quarter": Files are saved under subdirectories for year and quarter.
+    Returns
+    -------
+    str
+        A time partitioned directory tree.
+    """
+    if folder_partitioning == "":
+        return ""
+    if folder_partitioning == "year":
+        year = str(time.year)
+        return year
+    if folder_partitioning == "year/month":
+        year = str(time.year)
+        month = str(time.month).zfill(2)
+        return os.path.join(year, month)
+    if folder_partitioning == "year/month/day":
+        year = str(time.year)
+        month = str(time.month).zfill(2)
+        day = str(time.day).zfill(2)
+        return os.path.join(year, month, day)
+    if folder_partitioning == "year/month_name":
+        year = str(time.year)
+        month = time.strftime("%B")
+        return os.path.join(year, month)
+    if folder_partitioning == "year/quarter":
+        year = str(time.year)
+        # Calculate quarter: months 1-3 => Q1, 4-6 => Q2, etc.
+        quarter = (time.month - 1) // 3 + 1
+        quarter_dir = f"Q{quarter}"
+        return os.path.join(year, quarter_dir)
+    raise NotImplementedError(f"Unrecognized '{folder_partitioning}' folder partitioning scheme.")
+def define_file_folder_path(obj, dir_path, folder_partitioning):
     """
     Define the folder path where saving a file based on the dataset's starting time.
@@ -357,12 +407,13 @@ def define_file_folder_path(obj, data_dir, folder_partitioning):
     ----------
     ds : xarray.Dataset or pandas.DataFrame
         The object containing time information.
-    data_dir : str
+    dir_path : str
         Directory within the DISDRODB Data Archive where DISDRODB product files are to be saved.
+        It can be a product directory or a logs directory.
     folder_partitioning : str or None
         Define the subdirectory structure where saving files.
         Allowed values are:
-          - None: Files are saved directly in data_dir.
+          - None or "": Files are saved directly in dir_path.
           - "year": Files are saved under a subdirectory for the year.
           - "year/month": Files are saved under subdirectories for year and month.
           - "year/month/day": Files are saved under subdirectories for year, month and day
@@ -382,32 +433,9 @@ def define_file_folder_path(obj, data_dir, folder_partitioning):
     # Retrieve the starting time from the dataset.
     starting_time, _ = get_file_start_end_time(obj)
-    # Build the folder path based on the chosen partition scheme.
-    if folder_partitioning == "":
-        return data_dir
-    if folder_partitioning == "year":
-        year = str(starting_time.year)
-        return os.path.join(data_dir, year)
-    if folder_partitioning == "year/month":
-        year = str(starting_time.year)
-        month = str(starting_time.month).zfill(2)
-        return os.path.join(data_dir, year, month)
-    if folder_partitioning == "year/month/day":
-        year = str(starting_time.year)
-        month = str(starting_time.month).zfill(2)
-        day = str(starting_time.day).zfill(2)
-        return os.path.join(data_dir, year, month, day)
-    if folder_partitioning == "year/month_name":
-        year = str(starting_time.year)
-        month = str(starting_time.month_name())
-        return os.path.join(data_dir, year, month)
-    if folder_partitioning == "year/quarter":
-        year = str(starting_time.year)
-        # Calculate quarter: months 1-3 => Q1, 4-6 => Q2, etc.
-        quarter = (starting_time.month - 1) // 3 + 1
-        quarter_dir = f"Q{quarter}"
-        return os.path.join(data_dir, year, quarter_dir)
-    raise NotImplementedError(f"Unrecognized '{folder_partitioning}' folder partitioning scheme.")
+    # Build the folder path based on the chosen partition scheme
+    partitioning_tree = define_partitioning_tree(time=starting_time, folder_partitioning=folder_partitioning)
+    return os.path.normpath(os.path.join(dir_path, partitioning_tree))
 def define_product_dir_tree(
@@ -448,17 +476,16 @@ def define_product_dir_tree(
         sample_interval = product_kwargs.get("sample_interval")
         check_rolling(rolling)
         check_sample_interval(sample_interval)
-        sample_interval_acronym = define_accumulation_acronym(seconds=sample_interval, rolling=rolling)
-        return os.path.join(sample_interval_acronym)
-    if product == "L2M":
-        rolling = product_kwargs.get("rolling")
-        sample_interval = product_kwargs.get("sample_interval")
-        model_name = product_kwargs.get("model_name")
-        check_rolling(rolling)
-        check_sample_interval(sample_interval)
-        sample_interval_acronym = define_accumulation_acronym(seconds=sample_interval, rolling=rolling)
-        return os.path.join(model_name, sample_interval_acronym)
-    raise ValueError(f"The product {product} is not defined.")
+        temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
+        return os.path.join(temporal_resolution)
+    # Remaining case: product == "L2M"
+    rolling = product_kwargs.get("rolling")
+    sample_interval = product_kwargs.get("sample_interval")
+    model_name = product_kwargs.get("model_name")
+    check_rolling(rolling)
+    check_sample_interval(sample_interval)
+    temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
+    return os.path.join(model_name, temporal_resolution)
 def define_logs_dir(
@@ -504,7 +531,7 @@ def define_logs_dir(
         product=product,
         **product_kwargs,
     )
-    logs_dir = os.path.join(campaign_dir, "logs", "files", product, product_dir_tree, station_name)
+    logs_dir = os.path.normpath(os.path.join(campaign_dir, "logs", "files", product, product_dir_tree, station_name))
     if check_exists:
         check_directory_exists(logs_dir)
     return str(logs_dir)
@@ -618,7 +645,7 @@ def define_data_dir(
         **product_kwargs,
     )
     # Define data directory
-    data_dir = os.path.join(station_dir, product_dir_tree)
+    data_dir = os.path.normpath(os.path.join(station_dir, product_dir_tree))
     # Check if directory exists
     if check_exists:
         check_directory_exists(data_dir)
@@ -629,15 +656,15 @@ def define_data_dir(
 #### Filenames for DISDRODB products
-def define_accumulation_acronym(seconds, rolling):
-    """Define the accumulation acronnym.
+def define_temporal_resolution(seconds, rolling):
+    """Define the DISDRODB product temporal resolution.
-    Prefix the accumulation interval acronym with ROLL if rolling=True.
+    Prefix the measurement interval with ROLL if rolling=True.
     """
-    accumulation_acronym = seconds_to_acronym(seconds)
+    temporal_resolution = seconds_to_temporal_resolution(seconds)
     if rolling:
-        accumulation_acronym = f"ROLL{accumulation_acronym}"
-    return accumulation_acronym
+        temporal_resolution = f"ROLL{temporal_resolution}"
+    return temporal_resolution
 ####--------------------------------------------------------------------------.
@@ -649,7 +676,8 @@ def define_filename(
     campaign_name: str,
     station_name: str,
     # Filename options
-    obj=None,
+    start_time=None,
+    end_time=None,
     add_version=True,
     add_time_period=True,
     add_extension=True,
@@ -663,19 +691,22 @@ def define_filename(
     Parameters
     ----------
-    obj  : xarray.Dataset or pandas.DataFrame
-        xarray Dataset or pandas DataFrame.
-        Required if add_time_period = True.
     campaign_name : str
        Name of the campaign.
     station_name : str
        Name of the station.
+    start_time : datetime.datetime, optional
+        Start time.
+        Required if add_time_period = True.
+    end_time : datetime.datetime, optional
+        End time.
+        Required if add_time_period = True.
     sample_interval : int, optional
         The sampling interval in seconds of the product.
-        It must be specified only for product L2E and L2M !
+        It must be specified only for product L0C, L1, L2E and L2M !
     rolling : bool, optional
         Whether the dataset has been resampled by aggregating or rolling.
-        It must be specified only for product L2E and L2M !
+        It must be specified only for product L1, L2E and L2M !
     model_name : str
         The model name of the fitted statistical distribution for the DSD.
         It must be specified only for product L2M !
@@ -685,32 +716,37 @@ def define_filename(
     str
         L0B file name.
     """
-    from disdrodb import ARCHIVE_VERSION
     from disdrodb.api.checks import check_product, check_product_kwargs
     product = check_product(product)
     product_kwargs = check_product_kwargs(product, product_kwargs)
-    # -----------------------------------------.
-    # TODO: Define sample_interval_acronym
-    # - ADD sample_interval_acronym also to L0A and L0B
-    # - Add sample_interval_acronym also to L0C and L1
+    if add_time_period and (start_time is None or end_time is None):
+        raise ValueError("If add_time_period=True, specify start_time and end_time.")
     # -----------------------------------------.
-    # Define product acronym
-    product_acronym = f"{product}"
+    # Define product name
+    product_name = f"{product}"
+    # L0C ... sample interval known only per-file
+    # L1 ... in future known a priori
+    # if product in ["L1"]:
+    #     # TODO: HACK FOR CURRENT L0C and L1 log files in create_product_logs
+    #     sample_interval = product_kwargs.get("sample_interval",  0)
+    #     temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=False)
+    #     product_name = f"{product}.{temporal_resolution}"
     if product in ["L2E", "L2M"]:
         rolling = product_kwargs.get("rolling")
         sample_interval = product_kwargs.get("sample_interval")
-        sample_interval_acronym = define_accumulation_acronym(seconds=sample_interval, rolling=rolling)
-        product_acronym = f"L2E.{sample_interval_acronym}"
+        temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
+        product_name = f"{product}.{temporal_resolution}"
     if product in ["L2M"]:
         model_name = product_kwargs.get("model_name")
-        product_acronym = f"L2M_{model_name}.{sample_interval_acronym}"
+        product_name = f"L2M_{model_name}.{temporal_resolution}"
     # -----------------------------------------.
     # Define base filename
-    filename = f"{product_acronym}.{campaign_name}.{station_name}"
+    filename = f"{product_name}.{campaign_name}.{station_name}"
     # -----------------------------------------.
     # Add prefix
@@ -720,10 +756,9 @@ def define_filename(
     # -----------------------------------------.
     # Add time period information
     if add_time_period:
-        starting_time, ending_time = get_file_start_end_time(obj)
-        starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-        ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-        filename = f"{filename}.s{starting_time}.e{ending_time}"
+        start_time = start_time.strftime("%Y%m%d%H%M%S")
+        end_time = end_time.strftime("%Y%m%d%H%M%S")
+        filename = f"{filename}.s{start_time}.e{end_time}"
     # -----------------------------------------.
     # Add product version
@@ -759,133 +794,97 @@ def define_l0a_filename(df, campaign_name: str, station_name: str) -> str:
     str
         L0A file name.
     """
-    from disdrodb import ARCHIVE_VERSION
     starting_time, ending_time = get_file_start_end_time(df)
-    starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-    ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-    version = ARCHIVE_VERSION
-    filename = f"L0A.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.parquet"
+    filename = define_filename(
+        product="L0A",
+        campaign_name=campaign_name,
+        station_name=station_name,
+        # Filename options
+        start_time=starting_time,
+        end_time=ending_time,
+        add_version=True,
+        add_time_period=True,
+        add_extension=True,
+    )
     return filename
 def define_l0b_filename(ds, campaign_name: str, station_name: str) -> str:
-    """Define L0B file name.
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L0B xarray Dataset.
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station.
-    Returns
-    -------
-    str
-        L0B file name.
-    """
-    from disdrodb import ARCHIVE_VERSION
+    """Define L0B file name."""
     starting_time, ending_time = get_file_start_end_time(ds)
-    starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-    ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-    version = ARCHIVE_VERSION
-    filename = f"L0B.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
+    filename = define_filename(
+        product="L0B",
+        campaign_name=campaign_name,
+        station_name=station_name,
+        # Filename options
+        start_time=starting_time,
+        end_time=ending_time,
+        add_version=True,
+        add_time_period=True,
+        add_extension=True,
+    )
     return filename
 def define_l0c_filename(ds, campaign_name: str, station_name: str) -> str:
-    """Define L0C file name.
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L0B xarray Dataset.
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station.
-    Returns
-    -------
-    str
-        L0B file name.
-    """
-    from disdrodb import ARCHIVE_VERSION
-    # TODO: add sample_interval as argument
+    """Define L0C file name."""
+    # TODO: add sample_interval as function argument
     sample_interval = int(ensure_sample_interval_in_seconds(ds["sample_interval"]).data.item())
-    sample_interval_acronym = define_accumulation_acronym(sample_interval, rolling=False)
+    temporal_resolution = define_temporal_resolution(sample_interval, rolling=False)
     starting_time, ending_time = get_file_start_end_time(ds)
     starting_time = starting_time.strftime("%Y%m%d%H%M%S")
     ending_time = ending_time.strftime("%Y%m%d%H%M%S")
     version = ARCHIVE_VERSION
-    filename = (
-        f"L0C.{sample_interval_acronym}.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
-    )
+    filename = f"L0C.{temporal_resolution}.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
     return filename
 def define_l1_filename(ds, campaign_name, station_name: str) -> str:
-    """Define L1 file name.
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L1 xarray Dataset.
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station.
+    """Define L1 file name."""
+    # TODO: add sample_interval and rolling as function argument
-    Returns
-    -------
-    str
-        L1 file name.
-    """
-    from disdrodb import ARCHIVE_VERSION
-    # TODO: add sample_interval as argument
+    starting_time, ending_time = get_file_start_end_time(ds)
     sample_interval = int(ensure_sample_interval_in_seconds(ds["sample_interval"]).data.item())
-    sample_interval_acronym = define_accumulation_acronym(sample_interval, rolling=False)
+    temporal_resolution = define_temporal_resolution(sample_interval, rolling=False)
     starting_time, ending_time = get_file_start_end_time(ds)
     starting_time = starting_time.strftime("%Y%m%d%H%M%S")
     ending_time = ending_time.strftime("%Y%m%d%H%M%S")
     version = ARCHIVE_VERSION
-    filename = (
-        f"L1.{sample_interval_acronym}.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
-    )
+    filename = f"L1.{temporal_resolution}.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
+    # filename = define_filename(
+    #     product="L1",
+    #     campaign_name=campaign_name,
+    #     station_name=station_name,
+    #     # Filename options
+    #     start_time=starting_time,
+    #     end_time=ending_time,
+    #     add_version=True,
+    #     add_time_period=True,
+    #     add_extension=True,
+    #     # Product options
+    #     # sample_interval=sample_interval,
+    #     # rolling=rolling,
+    # )
     return filename
 def define_l2e_filename(ds, campaign_name: str, station_name: str, sample_interval: int, rolling: bool) -> str:
-    """Define L2E file name.
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L1 xarray Dataset
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station
-    Returns
-    -------
-    str
-        L0B file name.
-    """
-    from disdrodb import ARCHIVE_VERSION
-    sample_interval_acronym = define_accumulation_acronym(seconds=sample_interval, rolling=rolling)
+    """Define L2E file name."""
     starting_time, ending_time = get_file_start_end_time(ds)
-    starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-    ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-    version = ARCHIVE_VERSION
-    filename = (
-        f"L2E.{sample_interval_acronym}.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
+    filename = define_filename(
+        product="L2E",
+        campaign_name=campaign_name,
+        station_name=station_name,
+        # Filename options
+        start_time=starting_time,
+        end_time=ending_time,
+        add_version=True,
+        add_time_period=True,
+        add_extension=True,
+        # Product options
+        sample_interval=sample_interval,
+        rolling=rolling,
     )
     return filename
@@ -898,31 +897,21 @@ def define_l2m_filename(
     rolling: bool,
     model_name: str,
 ) -> str:
-    """Define L2M file name.
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L1 xarray Dataset
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station
-    Returns
-    -------
-    str
-        L0B file name.
-    """
-    from disdrodb import ARCHIVE_VERSION
-    sample_interval_acronym = define_accumulation_acronym(seconds=sample_interval, rolling=rolling)
+    """Define L2M file name."""
     starting_time, ending_time = get_file_start_end_time(ds)
-    starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-    ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-    version = ARCHIVE_VERSION
-    filename = (
-        f"L2M_{model_name}.{sample_interval_acronym}.{campaign_name}."
-        + f"{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
+    filename = define_filename(
+        product="L2M",
+        campaign_name=campaign_name,
+        station_name=station_name,
+        # Filename options
+        start_time=starting_time,
+        end_time=ending_time,
+        add_version=True,
+        add_time_period=True,
+        add_extension=True,
+        # Product options
+        sample_interval=sample_interval,
+        rolling=rolling,
+        model_name=model_name,
     )
     return filename

disdrodb/api/search.py CHANGED Viewed

@@ -16,14 +16,15 @@ from disdrodb.api.path import (
     define_station_dir,
 )
 from disdrodb.configs import get_data_archive_dir, get_metadata_archive_dir
-from disdrodb.utils.directories import contains_files, contains_netcdf_or_parquet_files
+from disdrodb.constants import PRODUCTS_REQUIREMENTS
+from disdrodb.utils.directories import contains_files, contains_netcdf_or_parquet_files, list_directories, list_files
 from disdrodb.utils.yaml import read_yaml
+####-------------------------------------------------------------------------
 def get_required_product(product):
     """Determine the required product for input product processing."""
-    from disdrodb import PRODUCTS_REQUIREMENTS
     # Check input
     check_product(product)
     # Determine required product
@@ -32,12 +33,13 @@ def get_required_product(product):
 ####-------------------------------------------------------------------------
-#### List DISDRODB infrastructure directories
+#### List DISDRODB Metadata directories
 def list_data_sources(metadata_archive_dir, data_sources=None, invalid_fields_policy="raise"):
     """List data sources names in the DISDRODB Metadata Archive."""
-    available_data_sources = os.listdir(os.path.join(metadata_archive_dir, "METADATA"))
+    path = os.path.join(metadata_archive_dir, "METADATA")
+    available_data_sources = sorted(list_directories(path, return_paths=False))
     # Filter by optionally specified data_sources
     if data_sources is not None:
         available_data_sources = check_valid_fields(
@@ -52,7 +54,7 @@ def list_data_sources(metadata_archive_dir, data_sources=None, invalid_fields_po
 def _list_campaign_names(metadata_archive_dir, data_source):
     data_source_dir = define_data_source_dir(metadata_archive_dir, product="METADATA", data_source=data_source)
-    campaign_names = os.listdir(data_source_dir)
+    campaign_names = sorted(list_directories(data_source_dir, return_paths=False))
     return campaign_names
@@ -109,7 +111,7 @@ def _list_station_names(metadata_archive_dir, data_source, campaign_name):
         data_source=data_source,
         campaign_name=campaign_name,
     )
-    metadata_filenames = os.listdir(metadata_dir)
+    metadata_filenames = sorted(list_files(metadata_dir, glob_pattern="*.yml", return_paths=False))
     station_names = [fname.replace(".yml", "").replace(".yaml", "") for fname in metadata_filenames]
     return station_names
@@ -167,6 +169,10 @@ def list_station_names(
     return station_names
+####-------------------------------------------------------------------------
+#### Filtering utilities for available_stations
 def _finalize_output(list_info, return_tuple):
     # - Return the (data_source, campaign_name, station_name) tuple
     if return_tuple:
@@ -228,7 +234,6 @@ def keep_list_info_elements_with_product_data(data_archive_dir, product, list_in
     checking_function = contains_files if product == "RAW" else contains_netcdf_or_parquet_files
     # Check presence of data for each station
-    # TODO: - In parallel over stations to speed up ?
     list_info_with_product_data = []
     for data_source, campaign_name, station_name in list_info:
         data_dir = define_data_dir(
@@ -362,10 +367,11 @@ def available_stations(
     metadata_archive_dir = get_metadata_archive_dir(metadata_archive_dir)
     product = check_product(product) if product is not None else None
     invalid_fields_policy = check_invalid_fields_policy(invalid_fields_policy)
     # Retrieve available stations from the Metadata Archive
     # - Raise error if no stations are available!
     list_info = list_station_names(
-        metadata_archive_dir,
+        metadata_archive_dir=metadata_archive_dir,
         data_sources=data_sources,
         campaign_names=campaign_names,
         station_names=station_names,
@@ -484,3 +490,6 @@ def available_campaigns(
     campaign_names = [info[1] for info in list_info]
     campaign_names = np.unique(campaign_names).tolist()
     return campaign_names
+####-------------------------------------------------------------------------

disdrodb 0.1.2__py3-none-any.whl → 0.1.4__py3-none-any.whl

disdrodb 0.1.2py3-none-any.whl → 0.1.4py3-none-any.whl