PyPI - disdrodb - Versions diffs - 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl - Mend

disdrodb 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (124) hide show

disdrodb/__init__.py +4 -0
disdrodb/_version.py +2 -2
disdrodb/api/checks.py +70 -47
disdrodb/api/configs.py +0 -2
disdrodb/api/create_directories.py +0 -2
disdrodb/api/info.py +3 -3
disdrodb/api/io.py +48 -8
disdrodb/api/path.py +116 -133
disdrodb/api/search.py +12 -3
disdrodb/cli/disdrodb_create_summary.py +113 -0
disdrodb/cli/disdrodb_create_summary_station.py +11 -1
disdrodb/cli/disdrodb_run_l0a_station.py +1 -1
disdrodb/cli/disdrodb_run_l0b_station.py +2 -2
disdrodb/cli/disdrodb_run_l0c_station.py +2 -2
disdrodb/cli/disdrodb_run_l1_station.py +2 -2
disdrodb/cli/disdrodb_run_l2e_station.py +2 -2
disdrodb/cli/disdrodb_run_l2m_station.py +2 -2
disdrodb/constants.py +1 -1
disdrodb/data_transfer/download_data.py +123 -7
disdrodb/etc/products/L1/global.yaml +1 -1
disdrodb/etc/products/L2E/5MIN.yaml +1 -0
disdrodb/etc/products/L2E/global.yaml +1 -1
disdrodb/etc/products/L2M/GAMMA_GS_ND_MAE.yaml +6 -0
disdrodb/etc/products/L2M/GAMMA_ML.yaml +1 -1
disdrodb/etc/products/L2M/LOGNORMAL_GS_LOG_ND_MAE.yaml +6 -0
disdrodb/etc/products/L2M/LOGNORMAL_GS_ND_MAE.yaml +6 -0
disdrodb/etc/products/L2M/LOGNORMAL_ML.yaml +8 -0
disdrodb/etc/products/L2M/global.yaml +11 -3
disdrodb/issue/writer.py +2 -0
disdrodb/l0/check_configs.py +49 -16
disdrodb/l0/configs/LPM/l0a_encodings.yml +2 -2
disdrodb/l0/configs/LPM/l0b_cf_attrs.yml +2 -2
disdrodb/l0/configs/LPM/l0b_encodings.yml +2 -2
disdrodb/l0/configs/LPM/raw_data_format.yml +2 -2
disdrodb/l0/configs/PWS100/l0b_encodings.yml +1 -0
disdrodb/l0/configs/SWS250/bins_diameter.yml +108 -0
disdrodb/l0/configs/SWS250/bins_velocity.yml +83 -0
disdrodb/l0/configs/SWS250/l0a_encodings.yml +18 -0
disdrodb/l0/configs/SWS250/l0b_cf_attrs.yml +72 -0
disdrodb/l0/configs/SWS250/l0b_encodings.yml +155 -0
disdrodb/l0/configs/SWS250/raw_data_format.yml +148 -0
disdrodb/l0/l0a_processing.py +10 -5
disdrodb/l0/l0b_nc_processing.py +10 -6
disdrodb/l0/l0b_processing.py +92 -72
disdrodb/l0/l0c_processing.py +369 -251
disdrodb/l0/readers/LPM/ARM/ARM_LPM.py +8 -1
disdrodb/l0/readers/LPM/AUSTRALIA/MELBOURNE_2007_LPM.py +2 -2
disdrodb/l0/readers/LPM/BELGIUM/ULIEGE.py +256 -0
disdrodb/l0/readers/LPM/BRAZIL/CHUVA_LPM.py +2 -2
disdrodb/l0/readers/LPM/BRAZIL/GOAMAZON_LPM.py +2 -2
disdrodb/l0/readers/LPM/GERMANY/DWD.py +491 -0
disdrodb/l0/readers/LPM/ITALY/GID_LPM.py +2 -2
disdrodb/l0/readers/LPM/ITALY/GID_LPM_W.py +2 -2
disdrodb/l0/readers/LPM/KIT/CHWALA.py +2 -2
disdrodb/l0/readers/LPM/SLOVENIA/ARSO.py +107 -12
disdrodb/l0/readers/LPM/SLOVENIA/UL.py +3 -3
disdrodb/l0/readers/LPM/SWITZERLAND/INNERERIZ_LPM.py +2 -2
disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2010.py +5 -14
disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2010_UF.py +5 -14
disdrodb/l0/readers/PARSIVEL/SLOVENIA/UL.py +117 -8
disdrodb/l0/readers/PARSIVEL2/ARM/ARM_PARSIVEL2.py +4 -0
disdrodb/l0/readers/PARSIVEL2/BRAZIL/CHUVA_PARSIVEL2.py +10 -14
disdrodb/l0/readers/PARSIVEL2/BRAZIL/GOAMAZON_PARSIVEL2.py +10 -14
disdrodb/l0/readers/PARSIVEL2/CANADA/UQAM_NC.py +69 -0
disdrodb/l0/readers/PARSIVEL2/DENMARK/DTU.py +8 -14
disdrodb/l0/readers/PARSIVEL2/DENMARK/EROSION_raw.py +382 -0
disdrodb/l0/readers/PARSIVEL2/FINLAND/FMI_PARSIVEL2.py +4 -0
disdrodb/l0/readers/PARSIVEL2/FRANCE/OSUG.py +1 -1
disdrodb/l0/readers/PARSIVEL2/GREECE/NOA.py +127 -0
disdrodb/l0/readers/PARSIVEL2/ITALY/HYDROX.py +239 -0
disdrodb/l0/readers/PARSIVEL2/MPI/BCO_PARSIVEL2.py +136 -0
disdrodb/l0/readers/PARSIVEL2/MPI/BOWTIE.py +220 -0
disdrodb/l0/readers/PARSIVEL2/NASA/LPVEX.py +109 -0
disdrodb/l0/readers/PARSIVEL2/NCAR/FARM_PARSIVEL2.py +5 -11
disdrodb/l0/readers/PARSIVEL2/NCAR/PERILS_MIPS.py +4 -17
disdrodb/l0/readers/PARSIVEL2/NCAR/RELAMPAGO_PARSIVEL2.py +5 -14
disdrodb/l0/readers/PARSIVEL2/NCAR/SNOWIE_PJ.py +10 -13
disdrodb/l0/readers/PARSIVEL2/NCAR/SNOWIE_SB.py +10 -13
disdrodb/l0/readers/PARSIVEL2/NETHERLANDS/DELFT_NC.py +3 -0
disdrodb/l0/readers/PARSIVEL2/PHILIPPINES/PANGASA.py +232 -0
disdrodb/l0/readers/PARSIVEL2/SPAIN/CENER.py +6 -18
disdrodb/l0/readers/PARSIVEL2/SPAIN/GRANADA.py +120 -0
disdrodb/l0/readers/PARSIVEL2/USA/C3WE.py +7 -25
disdrodb/l0/readers/PWS100/AUSTRIA/HOAL.py +321 -0
disdrodb/l0/readers/SW250/BELGIUM/KMI.py +239 -0
disdrodb/l1/beard_model.py +31 -129
disdrodb/l1/fall_velocity.py +156 -57
disdrodb/l1/filters.py +25 -28
disdrodb/l1/processing.py +12 -14
disdrodb/l1_env/routines.py +46 -17
disdrodb/l2/empirical_dsd.py +6 -0
disdrodb/l2/processing.py +3 -3
disdrodb/metadata/checks.py +132 -125
disdrodb/metadata/geolocation.py +0 -2
disdrodb/psd/fitting.py +180 -210
disdrodb/psd/models.py +1 -1
disdrodb/routines/__init__.py +54 -0
disdrodb/{l0/routines.py → routines/l0.py} +288 -418
disdrodb/{l1/routines.py → routines/l1.py} +60 -92
disdrodb/{l2/routines.py → routines/l2.py} +284 -485
disdrodb/{routines.py → routines/wrappers.py} +100 -7
disdrodb/scattering/axis_ratio.py +95 -85
disdrodb/scattering/permittivity.py +24 -0
disdrodb/scattering/routines.py +56 -36
disdrodb/summary/routines.py +147 -45
disdrodb/utils/archiving.py +434 -0
disdrodb/utils/attrs.py +2 -0
disdrodb/utils/cli.py +5 -5
disdrodb/utils/dask.py +62 -1
disdrodb/utils/decorators.py +31 -0
disdrodb/utils/encoding.py +10 -1
disdrodb/{l2 → utils}/event.py +1 -66
disdrodb/utils/logger.py +1 -1
disdrodb/utils/manipulations.py +22 -12
disdrodb/utils/routines.py +166 -0
disdrodb/utils/time.py +5 -293
disdrodb/utils/xarray.py +3 -0
disdrodb/viz/plots.py +109 -15
{disdrodb-0.1.3.dist-info → disdrodb-0.1.5.dist-info}/METADATA +3 -2
{disdrodb-0.1.3.dist-info → disdrodb-0.1.5.dist-info}/RECORD +124 -96
{disdrodb-0.1.3.dist-info → disdrodb-0.1.5.dist-info}/entry_points.txt +1 -0
{disdrodb-0.1.3.dist-info → disdrodb-0.1.5.dist-info}/WHEEL +0 -0
{disdrodb-0.1.3.dist-info → disdrodb-0.1.5.dist-info}/licenses/LICENSE +0 -0
{disdrodb-0.1.3.dist-info → disdrodb-0.1.5.dist-info}/top_level.txt +0 -0

disdrodb/api/path.py CHANGED Viewed

@@ -63,6 +63,7 @@ def define_disdrodb_path(
         The campaign name.
     check_exists : bool, optional
         Whether to check if the directory exists. The default value is ``True``.
+        Raise error if the directory does not exist.
     Returns
     -------
@@ -81,7 +82,7 @@ def define_disdrodb_path(
         dir_path = os.path.join(archive_dir, ARCHIVE_VERSION, data_source, campaign_name)
     if check_exists:
         check_directory_exists(dir_path)
-    return dir_path
+    return os.path.normpath(dir_path)
 def define_data_source_dir(
@@ -107,6 +108,7 @@ def define_data_source_dir(
         If not specified, the path specified in the DISDRODB active configuration will be used.
     check_exists : bool, optional
         Whether to check if the directory exists. The default value is ``False``.
+        Raise error if the directory does not exist.
     Returns
     -------
@@ -386,7 +388,7 @@ def define_partitioning_tree(time, folder_partitioning):
         return os.path.join(year, month, day)
     if folder_partitioning == "year/month_name":
         year = str(time.year)
-        month = str(time.month_name())
+        month = time.strftime("%B")
         return os.path.join(year, month)
     if folder_partitioning == "year/quarter":
         year = str(time.year)
@@ -397,7 +399,7 @@ def define_partitioning_tree(time, folder_partitioning):
     raise NotImplementedError(f"Unrecognized '{folder_partitioning}' folder partitioning scheme.")
-def define_file_folder_path(obj, data_dir, folder_partitioning):
+def define_file_folder_path(obj, dir_path, folder_partitioning):
     """
     Define the folder path where saving a file based on the dataset's starting time.
@@ -405,12 +407,13 @@ def define_file_folder_path(obj, data_dir, folder_partitioning):
     ----------
     ds : xarray.Dataset or pandas.DataFrame
         The object containing time information.
-    data_dir : str
+    dir_path : str
         Directory within the DISDRODB Data Archive where DISDRODB product files are to be saved.
+        It can be a product directory or a logs directory.
     folder_partitioning : str or None
         Define the subdirectory structure where saving files.
         Allowed values are:
-          - None: Files are saved directly in data_dir.
+          - None or "": Files are saved directly in dir_path.
           - "year": Files are saved under a subdirectory for the year.
           - "year/month": Files are saved under subdirectories for year and month.
           - "year/month/day": Files are saved under subdirectories for year, month and day
@@ -432,7 +435,7 @@ def define_file_folder_path(obj, data_dir, folder_partitioning):
     # Build the folder path based on the chosen partition scheme
     partitioning_tree = define_partitioning_tree(time=starting_time, folder_partitioning=folder_partitioning)
-    return os.path.join(data_dir, partitioning_tree)
+    return os.path.normpath(os.path.join(dir_path, partitioning_tree))
 def define_product_dir_tree(
@@ -475,15 +478,14 @@ def define_product_dir_tree(
         check_sample_interval(sample_interval)
         temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
         return os.path.join(temporal_resolution)
-    if product == "L2M":
-        rolling = product_kwargs.get("rolling")
-        sample_interval = product_kwargs.get("sample_interval")
-        model_name = product_kwargs.get("model_name")
-        check_rolling(rolling)
-        check_sample_interval(sample_interval)
-        temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
-        return os.path.join(model_name, temporal_resolution)
-    raise ValueError(f"The product {product} is not defined.")
+    # L2M if product == "L2M":
+    rolling = product_kwargs.get("rolling")
+    sample_interval = product_kwargs.get("sample_interval")
+    model_name = product_kwargs.get("model_name")
+    check_rolling(rolling)
+    check_sample_interval(sample_interval)
+    temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
+    return os.path.join(model_name, temporal_resolution)
 def define_logs_dir(
@@ -529,7 +531,7 @@ def define_logs_dir(
         product=product,
         **product_kwargs,
     )
-    logs_dir = os.path.join(campaign_dir, "logs", "files", product, product_dir_tree, station_name)
+    logs_dir = os.path.normpath(os.path.join(campaign_dir, "logs", "files", product, product_dir_tree, station_name))
     if check_exists:
         check_directory_exists(logs_dir)
     return str(logs_dir)
@@ -643,7 +645,7 @@ def define_data_dir(
         **product_kwargs,
     )
     # Define data directory
-    data_dir = os.path.join(station_dir, product_dir_tree)
+    data_dir = os.path.normpath(os.path.join(station_dir, product_dir_tree))
     # Check if directory exists
     if check_exists:
         check_directory_exists(data_dir)
@@ -674,7 +676,8 @@ def define_filename(
     campaign_name: str,
     station_name: str,
     # Filename options
-    obj=None,
+    start_time=None,
+    end_time=None,
     add_version=True,
     add_time_period=True,
     add_extension=True,
@@ -688,19 +691,22 @@ def define_filename(
     Parameters
     ----------
-    obj  : xarray.Dataset or pandas.DataFrame
-        xarray Dataset or pandas DataFrame.
-        Required if add_time_period = True.
     campaign_name : str
        Name of the campaign.
     station_name : str
        Name of the station.
+    start_time : datetime.datetime, optional
+        Start time.
+        Required if add_time_period = True.
+    end_time : datetime.datetime, optional
+        End time.
+        Required if add_time_period = True.
     sample_interval : int, optional
         The sampling interval in seconds of the product.
-        It must be specified only for product L2E and L2M !
+        It must be specified only for product L0C, L1, L2E and L2M !
     rolling : bool, optional
         Whether the dataset has been resampled by aggregating or rolling.
-        It must be specified only for product L2E and L2M !
+        It must be specified only for product L1, L2E and L2M !
     model_name : str
         The model name of the fitted statistical distribution for the DSD.
         It must be specified only for product L2M !
@@ -715,19 +721,25 @@ def define_filename(
     product = check_product(product)
     product_kwargs = check_product_kwargs(product, product_kwargs)
-    # -----------------------------------------.
-    # TODO: Define temporal_resolution
-    # - ADD temporal_resolution also to L0A and L0B
-    # - Add temporal_resolution also to L0C and L1
+    if add_time_period and (start_time is None or end_time is None):
+        raise ValueError("If add_time_period=True, specify start_time and end_time.")
     # -----------------------------------------.
     # Define product name
     product_name = f"{product}"
+    # L0C ... sample interval known only per-file
+    # L1 ... in future known a priori
+    # if product in ["L1"]:
+    #     # TODO: HACK FOR CURRENT L0C and L1 log files in create_product_logs
+    #     sample_interval = product_kwargs.get("sample_interval",  0)
+    #     temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=False)
+    #     product_name = f"{product}.{temporal_resolution}"
     if product in ["L2E", "L2M"]:
         rolling = product_kwargs.get("rolling")
         sample_interval = product_kwargs.get("sample_interval")
         temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
-        product_name = f"L2E.{temporal_resolution}"
+        product_name = f"{product}.{temporal_resolution}"
     if product in ["L2M"]:
         model_name = product_kwargs.get("model_name")
         product_name = f"L2M_{model_name}.{temporal_resolution}"
@@ -744,10 +756,9 @@ def define_filename(
     # -----------------------------------------.
     # Add time period information
     if add_time_period:
-        starting_time, ending_time = get_file_start_end_time(obj)
-        starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-        ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-        filename = f"{filename}.s{starting_time}.e{ending_time}"
+        start_time = start_time.strftime("%Y%m%d%H%M%S")
+        end_time = end_time.strftime("%Y%m%d%H%M%S")
+        filename = f"{filename}.s{start_time}.e{end_time}"
     # -----------------------------------------.
     # Add product version
@@ -784,56 +795,40 @@ def define_l0a_filename(df, campaign_name: str, station_name: str) -> str:
         L0A file name.
     """
     starting_time, ending_time = get_file_start_end_time(df)
-    starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-    ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-    version = ARCHIVE_VERSION
-    filename = f"L0A.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.parquet"
+    filename = define_filename(
+        product="L0A",
+        campaign_name=campaign_name,
+        station_name=station_name,
+        # Filename options
+        start_time=starting_time,
+        end_time=ending_time,
+        add_version=True,
+        add_time_period=True,
+        add_extension=True,
+    )
     return filename
 def define_l0b_filename(ds, campaign_name: str, station_name: str) -> str:
-    """Define L0B file name.
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L0B xarray Dataset.
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station.
-    Returns
-    -------
-    str
-        L0B file name.
-    """
+    """Define L0B file name."""
     starting_time, ending_time = get_file_start_end_time(ds)
-    starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-    ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-    version = ARCHIVE_VERSION
-    filename = f"L0B.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
+    filename = define_filename(
+        product="L0B",
+        campaign_name=campaign_name,
+        station_name=station_name,
+        # Filename options
+        start_time=starting_time,
+        end_time=ending_time,
+        add_version=True,
+        add_time_period=True,
+        add_extension=True,
+    )
     return filename
 def define_l0c_filename(ds, campaign_name: str, station_name: str) -> str:
-    """Define L0C file name.
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L0B xarray Dataset.
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station.
-    Returns
-    -------
-    str
-        L0B file name.
-    """
-    # TODO: add sample_interval as argument
+    """Define L0C file name."""
+    # TODO: add sample_interval as function argument
     sample_interval = int(ensure_sample_interval_in_seconds(ds["sample_interval"]).data.item())
     temporal_resolution = define_temporal_resolution(sample_interval, rolling=False)
     starting_time, ending_time = get_file_start_end_time(ds)
@@ -845,23 +840,10 @@ def define_l0c_filename(ds, campaign_name: str, station_name: str) -> str:
 def define_l1_filename(ds, campaign_name, station_name: str) -> str:
-    """Define L1 file name.
+    """Define L1 file name."""
+    # TODO: add sample_interval and rolling as function argument
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L1 xarray Dataset.
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station.
-    Returns
-    -------
-    str
-        L1 file name.
-    """
-    # TODO: add sample_interval as argument
+    starting_time, ending_time = get_file_start_end_time(ds)
     sample_interval = int(ensure_sample_interval_in_seconds(ds["sample_interval"]).data.item())
     temporal_resolution = define_temporal_resolution(sample_interval, rolling=False)
     starting_time, ending_time = get_file_start_end_time(ds)
@@ -869,32 +851,41 @@ def define_l1_filename(ds, campaign_name, station_name: str) -> str:
     ending_time = ending_time.strftime("%Y%m%d%H%M%S")
     version = ARCHIVE_VERSION
     filename = f"L1.{temporal_resolution}.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
+    # filename = define_filename(
+    #     product="L1",
+    #     campaign_name=campaign_name,
+    #     station_name=station_name,
+    #     # Filename options
+    #     start_time=starting_time,
+    #     end_time=ending_time,
+    #     add_version=True,
+    #     add_time_period=True,
+    #     add_extension=True,
+    #     # Product options
+    #     # sample_interval=sample_interval,
+    #     # rolling=rolling,
+    # )
     return filename
 def define_l2e_filename(ds, campaign_name: str, station_name: str, sample_interval: int, rolling: bool) -> str:
-    """Define L2E file name.
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L1 xarray Dataset
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station
-    Returns
-    -------
-    str
-        L0B file name.
-    """
-    temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
+    """Define L2E file name."""
     starting_time, ending_time = get_file_start_end_time(ds)
-    starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-    ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-    version = ARCHIVE_VERSION
-    filename = f"L2E.{temporal_resolution}.{campaign_name}.{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
+    filename = define_filename(
+        product="L2E",
+        campaign_name=campaign_name,
+        station_name=station_name,
+        # Filename options
+        start_time=starting_time,
+        end_time=ending_time,
+        add_version=True,
+        add_time_period=True,
+        add_extension=True,
+        # Product options
+        sample_interval=sample_interval,
+        rolling=rolling,
+    )
     return filename
@@ -906,29 +897,21 @@ def define_l2m_filename(
     rolling: bool,
     model_name: str,
 ) -> str:
-    """Define L2M file name.
-    Parameters
-    ----------
-    ds  : xarray.Dataset
-        L1 xarray Dataset
-    campaign_name : str
-        Name of the campaign.
-    station_name : str
-        Name of the station
-    Returns
-    -------
-    str
-        L0B file name.
-    """
-    temporal_resolution = define_temporal_resolution(seconds=sample_interval, rolling=rolling)
+    """Define L2M file name."""
     starting_time, ending_time = get_file_start_end_time(ds)
-    starting_time = starting_time.strftime("%Y%m%d%H%M%S")
-    ending_time = ending_time.strftime("%Y%m%d%H%M%S")
-    version = ARCHIVE_VERSION
-    filename = (
-        f"L2M_{model_name}.{temporal_resolution}.{campaign_name}."
-        + f"{station_name}.s{starting_time}.e{ending_time}.{version}.nc"
+    filename = define_filename(
+        product="L2M",
+        campaign_name=campaign_name,
+        station_name=station_name,
+        # Filename options
+        start_time=starting_time,
+        end_time=ending_time,
+        add_version=True,
+        add_time_period=True,
+        add_extension=True,
+        # Product options
+        sample_interval=sample_interval,
+        rolling=rolling,
+        model_name=model_name,
     )
     return filename

disdrodb/api/search.py CHANGED Viewed

@@ -20,6 +20,8 @@ from disdrodb.constants import PRODUCTS_REQUIREMENTS
 from disdrodb.utils.directories import contains_files, contains_netcdf_or_parquet_files, list_directories, list_files
 from disdrodb.utils.yaml import read_yaml
+####-------------------------------------------------------------------------
 def get_required_product(product):
     """Determine the required product for input product processing."""
@@ -31,7 +33,7 @@ def get_required_product(product):
 ####-------------------------------------------------------------------------
-#### List DISDRODB infrastructure directories
+#### List DISDRODB Metadata directories
 def list_data_sources(metadata_archive_dir, data_sources=None, invalid_fields_policy="raise"):
@@ -167,6 +169,10 @@ def list_station_names(
     return station_names
+####-------------------------------------------------------------------------
+#### Filtering utilities for available_stations
 def _finalize_output(list_info, return_tuple):
     # - Return the (data_source, campaign_name, station_name) tuple
     if return_tuple:
@@ -228,7 +234,6 @@ def keep_list_info_elements_with_product_data(data_archive_dir, product, list_in
     checking_function = contains_files if product == "RAW" else contains_netcdf_or_parquet_files
     # Check presence of data for each station
-    # TODO: - In parallel over stations to speed up ?
     list_info_with_product_data = []
     for data_source, campaign_name, station_name in list_info:
         data_dir = define_data_dir(
@@ -362,10 +367,11 @@ def available_stations(
     metadata_archive_dir = get_metadata_archive_dir(metadata_archive_dir)
     product = check_product(product) if product is not None else None
     invalid_fields_policy = check_invalid_fields_policy(invalid_fields_policy)
     # Retrieve available stations from the Metadata Archive
     # - Raise error if no stations are available!
     list_info = list_station_names(
-        metadata_archive_dir,
+        metadata_archive_dir=metadata_archive_dir,
         data_sources=data_sources,
         campaign_names=campaign_names,
         station_names=station_names,
@@ -484,3 +490,6 @@ def available_campaigns(
     campaign_names = [info[1] for info in list_info]
     campaign_names = np.unique(campaign_names).tolist()
     return campaign_names
+####-------------------------------------------------------------------------

disdrodb/cli/disdrodb_create_summary.py ADDED Viewed

@@ -0,0 +1,113 @@
+# -----------------------------------------------------------------------------.
+# Copyright (c) 2021-2023 DISDRODB developers
+#
+# This program is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program.  If not, see <http://www.gnu.org/licenses/>.
+# -----------------------------------------------------------------------------.
+"""Script to create summary figures and tables for DISDRODB stations."""
+import sys
+from typing import Optional
+import click
+from disdrodb.utils.cli import (
+    click_data_archive_dir_option,
+    click_metadata_archive_dir_option,
+    click_stations_options,
+    parse_archive_dir,
+    parse_arg_to_list,
+)
+sys.tracebacklimit = 0  # avoid full traceback error if occur
+# -------------------------------------------------------------------------.
+# Click Command Line Interface decorator
+@click.command()
+@click_stations_options
+@click_data_archive_dir_option
+@click_metadata_archive_dir_option
+@click.option("-p", "--parallel", type=bool, show_default=True, default=False, help="Read files in parallel")
+@click.option(
+    "-t",
+    "--temporal_resolution",
+    type=str,
+    show_default=True,
+    default="1MIN",
+    help="Temporal resolution of the L2E product to be used for the summary.",
+)
+def disdrodb_create_summary(
+    # Stations options
+    data_sources: Optional[str] = None,
+    campaign_names: Optional[str] = None,
+    station_names: Optional[str] = None,
+    # Processing options:
+    parallel=False,
+    temporal_resolution="1MIN",
+    # DISDRODB root directories
+    data_archive_dir: Optional[str] = None,
+    metadata_archive_dir: Optional[str] = None,
+):
+    r"""Create summary figures and tables for a specific set of DISDRODB stations.
+    Parameters \n
+    ---------- \n
+    data_sources : str
+        Name of data source(s) to process.
+        The name(s) must be UPPER CASE.
+        If campaign_names and station_names are not specified, process all stations.
+        To specify multiple data sources, write i.e.: --data_sources 'GPM EPFL NCAR'
+    campaign_names : str
+        Name of the campaign(s) for which to create stations summaries.
+        The name(s) must be UPPER CASE.
+        To specify multiple campaigns, write i.e.: --campaign_names 'IPEX IMPACTS'
+    station_names : str
+        Station names.
+        To specify multiple stations, write i.e.: --station_names 'station1 station2'
+    data_archive_dir : str \n
+        DISDRODB Data Archive directory \n
+        Format: <...>/DISDRODB \n
+        If not specified, uses path specified in the DISDRODB active configuration. \n
+    """
+    from disdrodb.routines import create_summary
+    from disdrodb.utils.dask import close_dask_cluster, initialize_dask_cluster
+    data_archive_dir = parse_archive_dir(data_archive_dir)
+    data_sources = parse_arg_to_list(data_sources)
+    campaign_names = parse_arg_to_list(campaign_names)
+    station_names = parse_arg_to_list(station_names)
+    # -------------------------------------------------------------------------.
+    # If parallel=True, set the dask environment
+    if parallel:
+        cluster, client = initialize_dask_cluster()
+    # -------------------------------------------------------------------------.
+    create_summary(
+        # Station arguments
+        data_sources=data_sources,
+        campaign_names=campaign_names,
+        station_names=station_names,
+        # Options
+        parallel=parallel,
+        temporal_resolution=temporal_resolution,
+        # DISDRODB root directory
+        data_archive_dir=data_archive_dir,
+        metadata_archive_dir=metadata_archive_dir,
+    )
+    # -------------------------------------------------------------------------.
+    # Close the cluster
+    if parallel:
+        close_dask_cluster(cluster, client)

disdrodb/cli/disdrodb_create_summary_station.py CHANGED Viewed

@@ -14,7 +14,7 @@
 # You should have received a copy of the GNU General Public License
 # along with this program.  If not, see <http://www.gnu.org/licenses/>.
 # -----------------------------------------------------------------------------.
-"""Script to run the DISDRODB L0 station processing."""
+"""Script to create summary figures and tables for a DISDRODB station."""
 import sys
 from typing import Optional
@@ -36,6 +36,14 @@ sys.tracebacklimit = 0  # avoid full traceback error if occur
 @click_station_arguments
 @click_data_archive_dir_option
 @click.option("-p", "--parallel", type=bool, show_default=True, default=False, help="Read files in parallel")
+@click.option(
+    "-t",
+    "--temporal_resolution",
+    type=str,
+    show_default=True,
+    default="1MIN",
+    help="Temporal resolution of the L2E product to be used for the summary.",
+)
 def disdrodb_create_summary_station(
     # Station arguments
     data_source: str,
@@ -43,6 +51,7 @@ def disdrodb_create_summary_station(
     station_name: str,
     # Processing options:
     parallel=False,
+    temporal_resolution="1MIN",
     # DISDRODB root directories
     data_archive_dir: Optional[str] = None,
 ):
@@ -81,6 +90,7 @@ def disdrodb_create_summary_station(
         station_name=station_name,
         # Options
         parallel=parallel,
+        temporal_resolution=temporal_resolution,
         # DISDRODB root directory
         data_archive_dir=data_archive_dir,
     )

disdrodb/cli/disdrodb_run_l0a_station.py CHANGED Viewed

@@ -89,7 +89,7 @@ def disdrodb_run_l0a_station(
         Format: <...>/DISDRODB
         If not specified, uses path specified in the DISDRODB active configuration.
     """
-    from disdrodb.l0.routines import run_l0a_station
+    from disdrodb.routines.l0 import run_l0a_station
     from disdrodb.utils.dask import close_dask_cluster, initialize_dask_cluster
     data_archive_dir = parse_archive_dir(data_archive_dir)

disdrodb/cli/disdrodb_run_l0b_station.py CHANGED Viewed

@@ -91,7 +91,7 @@ def disdrodb_run_l0b_station(
         Format: <...>/DISDRODB
         If not specified, uses path specified in the DISDRODB active configuration.
     """
-    from disdrodb.l0.routines import run_l0b_station
+    from disdrodb.routines.l0 import run_l0b_station
     from disdrodb.utils.dask import close_dask_cluster, initialize_dask_cluster
     data_archive_dir = parse_archive_dir(data_archive_dir)
@@ -100,7 +100,7 @@ def disdrodb_run_l0b_station(
     # -------------------------------------------------------------------------.
     # If parallel=True, set the dask environment
     if parallel:
-        cluster, client = initialize_dask_cluster()
+        cluster, client = initialize_dask_cluster(minimum_memory="4GB")
     # -------------------------------------------------------------------------.
     run_l0b_station(

disdrodb/cli/disdrodb_run_l0c_station.py CHANGED Viewed

@@ -94,7 +94,7 @@ def disdrodb_run_l0c_station(
         Format: <...>/DISDRODB
         If not specified, uses path specified in the DISDRODB active configuration.
     """
-    from disdrodb.l0.routines import run_l0c_station
+    from disdrodb.routines.l0 import run_l0c_station
     from disdrodb.utils.dask import close_dask_cluster, initialize_dask_cluster
     data_archive_dir = parse_archive_dir(data_archive_dir)
@@ -103,7 +103,7 @@ def disdrodb_run_l0c_station(
     # -------------------------------------------------------------------------.
     # If parallel=True, set the dask environment
     if parallel:
-        cluster, client = initialize_dask_cluster()
+        cluster, client = initialize_dask_cluster(minimum_memory="4GB")
     # -------------------------------------------------------------------------.
     run_l0c_station(

disdrodb/cli/disdrodb_run_l1_station.py CHANGED Viewed

@@ -89,7 +89,7 @@ def disdrodb_run_l1_station(
         Format: <...>/DISDRODB
         If not specified, uses path specified in the DISDRODB active configuration.
     """
-    from disdrodb.l1.routines import run_l1_station
+    from disdrodb.routines.l1 import run_l1_station
     from disdrodb.utils.dask import close_dask_cluster, initialize_dask_cluster
     data_archive_dir = parse_archive_dir(data_archive_dir)
@@ -97,7 +97,7 @@ def disdrodb_run_l1_station(
     # -------------------------------------------------------------------------.
     # If parallel=True, set the dask environment
     if parallel:
-        cluster, client = initialize_dask_cluster()
+        cluster, client = initialize_dask_cluster(minimum_memory="4GB")
     # -------------------------------------------------------------------------.
     run_l1_station(

disdrodb 0.1.3__py3-none-any.whl → 0.1.5__py3-none-any.whl

disdrodb 0.1.3py3-none-any.whl → 0.1.5py3-none-any.whl