PyPI - disdrodb - Versions diffs - 0.5.0__py3-none-any.whl → 0.5.1__py3-none-any.whl - Mend

disdrodb 0.5.0__py3-none-any.whl → 0.5.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (75)

disdrodb/__init__.py +4 -0
disdrodb/_version.py +2 -2
disdrodb/accessor/methods.py +14 -0
disdrodb/api/checks.py +8 -7
disdrodb/api/io.py +81 -29
disdrodb/api/path.py +17 -14
disdrodb/api/search.py +15 -18
disdrodb/cli/disdrodb_open_products_options.py +38 -0
disdrodb/cli/disdrodb_run.py +2 -2
disdrodb/cli/disdrodb_run_station.py +4 -4
disdrodb/configs.py +1 -1
disdrodb/data_transfer/download_data.py +70 -1
disdrodb/etc/configs/attributes.yaml +62 -8
disdrodb/etc/configs/encodings.yaml +28 -0
disdrodb/etc/products/L2M/MODELS/GAMMA_GS_ND_SSE.yaml +8 -0
disdrodb/etc/products/L2M/MODELS/GAMMA_ML.yaml +1 -1
disdrodb/etc/products/L2M/MODELS/LOGNORMAL_GS_LOG_ND_SSE.yaml +8 -0
disdrodb/etc/products/L2M/MODELS/LOGNORMAL_GS_ND_SSE.yaml +8 -0
disdrodb/etc/products/L2M/MODELS/LOGNORMAL_ML.yaml +1 -1
disdrodb/etc/products/L2M/MODELS/NGAMMA_GS_LOG_ND_SSE.yaml +8 -0
disdrodb/etc/products/L2M/MODELS/NGAMMA_GS_ND_SSE.yaml +8 -0
disdrodb/etc/products/L2M/global.yaml +4 -4
disdrodb/fall_velocity/graupel.py +8 -8
disdrodb/fall_velocity/hail.py +2 -2
disdrodb/fall_velocity/rain.py +33 -5
disdrodb/issue/checks.py +1 -1
disdrodb/l0/l0_reader.py +1 -1
disdrodb/l0/l0a_processing.py +2 -2
disdrodb/l0/l0b_nc_processing.py +5 -5
disdrodb/l0/l0b_processing.py +20 -24
disdrodb/l0/l0c_processing.py +18 -13
disdrodb/l0/readers/LPM/SLOVENIA/ARSO.py +4 -0
disdrodb/l0/readers/PARSIVEL2/VIETNAM/IGE_PARSIVEL2.py +239 -0
disdrodb/l0/template_tools.py +13 -13
disdrodb/l1/classification.py +10 -6
disdrodb/l2/empirical_dsd.py +25 -15
disdrodb/l2/processing.py +32 -14
disdrodb/metadata/download.py +1 -1
disdrodb/metadata/geolocation.py +4 -4
disdrodb/metadata/reader.py +3 -3
disdrodb/metadata/search.py +10 -8
disdrodb/psd/__init__.py +4 -0
disdrodb/psd/fitting.py +2660 -592
disdrodb/psd/gof_metrics.py +389 -0
disdrodb/psd/grid_search.py +1066 -0
disdrodb/psd/models.py +1281 -145
disdrodb/routines/l2.py +6 -6
disdrodb/routines/options_validation.py +8 -8
disdrodb/scattering/axis_ratio.py +70 -2
disdrodb/scattering/permittivity.py +13 -10
disdrodb/scattering/routines.py +10 -10
disdrodb/summary/routines.py +23 -20
disdrodb/utils/archiving.py +29 -22
disdrodb/utils/attrs.py +6 -4
disdrodb/utils/dataframe.py +4 -4
disdrodb/utils/encoding.py +3 -1
disdrodb/utils/event.py +9 -9
disdrodb/utils/logger.py +4 -7
disdrodb/utils/manipulations.py +2 -2
disdrodb/utils/subsetting.py +1 -1
disdrodb/utils/time.py +8 -7
disdrodb/viz/plots.py +25 -17
{disdrodb-0.5.0.dist-info → disdrodb-0.5.1.dist-info}/METADATA +44 -33
{disdrodb-0.5.0.dist-info → disdrodb-0.5.1.dist-info}/RECORD +68 -66
{disdrodb-0.5.0.dist-info → disdrodb-0.5.1.dist-info}/entry_points.txt +1 -0
disdrodb/etc/products/L2M/MODELS/GAMMA_GS_ND_MAE.yaml +0 -6
disdrodb/etc/products/L2M/MODELS/LOGNORMAL_GS_LOG_ND_MAE.yaml +0 -6
disdrodb/etc/products/L2M/MODELS/LOGNORMAL_GS_ND_MAE.yaml +0 -6
disdrodb/etc/products/L2M/MODELS/NGAMMA_GS_LOG_ND_MAE.yaml +0 -6
disdrodb/etc/products/L2M/MODELS/NGAMMA_GS_ND_MAE.yaml +0 -6
disdrodb/etc/products/L2M/MODELS/NGAMMA_GS_R_MAE.yaml +0 -6
disdrodb/etc/products/L2M/MODELS/NGAMMA_GS_Z_MAE.yaml +0 -6
{disdrodb-0.5.0.dist-info → disdrodb-0.5.1.dist-info}/WHEEL +0 -0
{disdrodb-0.5.0.dist-info → disdrodb-0.5.1.dist-info}/licenses/LICENSE +0 -0
{disdrodb-0.5.0.dist-info → disdrodb-0.5.1.dist-info}/top_level.txt +0 -0

disdrodb/routines/l2.py CHANGED Viewed

@@ -514,12 +514,12 @@ def _generate_l2m(
         radar_options = product_options.get("radar_options")
         # Define variables to load
-        optimization_kwargs = l2m_options["optimization_kwargs"]
-        if "init_method" in optimization_kwargs and optimization_kwargs["init_method"] is None:
-            optimization_kwargs["init_method"] = "None"
+        optimization_settings = l2m_options["optimization_settings"]
+        if "init_method" in optimization_settings and optimization_settings["init_method"] is None:
+            optimization_settings["init_method"] = "None"
-        if optimization_kwargs.get("init_method", "None") != "None":
-            init_method = optimization_kwargs["init_method"]
+        if optimization_settings.get("init_method", "None") != "None":
+            init_method = optimization_settings["init_method"]
             moments = [f"M{order}" for order in init_method.replace("M", "")] + ["M1"]
         else:
             moments = ["M1"]
@@ -761,7 +761,7 @@ def run_l2m_station(
         # -----------------------------------------------------------------.
         # Loop over distributions to fit
         # model_name = "GAMMA_ML"
-        # model_name = "LOGNORMAL_GS_ND_MAE"
+        # model_name = "LOGNORMAL_GS_ND_SSE"
         # model_options =  l2m_options["models"][model_name]
         # Retrieve list of models to fit
         models = global_product_options.pop("models")

disdrodb/routines/options_validation.py CHANGED Viewed

@@ -8,7 +8,7 @@ from disdrodb.api.checks import check_folder_partitioning, check_temporal_resolu
 from disdrodb.api.configs import available_sensor_names
 from disdrodb.configs import get_products_configs_dir
 from disdrodb.fall_velocity.rain import check_rain_fall_velocity_model
-from disdrodb.psd.fitting import PSD_MODELS, check_optimization, check_optimization_kwargs
+from disdrodb.psd.fitting import PSD_MODELS, check_optimization, check_optimization_settings
 from disdrodb.routines.options import get_l2m_model_settings_files, get_model_options, get_product_options
 from disdrodb.scattering.axis_ratio import check_axis_ratio_model
 from disdrodb.scattering.permittivity import check_permittivity_model
@@ -464,7 +464,7 @@ class L2MModelConfig(CustomBaseModel):
     psd_model: str = Field(..., description="PSD model name")
     optimization: str = Field(..., description="Optimization method")
-    optimization_kwargs: dict[str, Any] = Field(..., description="Optimization-specific parameters")
+    optimization_settings: dict[str, Any] = Field(..., description="Optimization-specific parameters")
     @field_validator("psd_model")
     @classmethod
@@ -482,11 +482,11 @@ class L2MModelConfig(CustomBaseModel):
         return check_optimization(optimization)
     @model_validator(mode="after")
-    def validate_optimization_kwargs(self):
-        """Validate that optimization_kwargs matches the optimization method."""
+    def validate_optimization_settings(self):
+        """Validate that optimization_settings matches the optimization method."""
         # Use the existing validation function
-        check_optimization_kwargs(
-            optimization_kwargs=self.optimization_kwargs,
+        check_optimization_settings(
+            optimization_settings=self.optimization_settings,
             optimization=self.optimization,
             psd_model=self.psd_model,
         )
@@ -504,7 +504,7 @@ def validate_l2m_model_configs(products_configs_dir: str):
     Raises
     ------
-    ValidationError
+    pydantic.ValidationError
         If any L2M model configuration is invalid.
     """
     # Get all L2M model configuration files
@@ -622,7 +622,7 @@ def validate_all_product_yaml_files(products_configs_dir):
     Raises
     ------
-    ValidationError
+    pydantic.ValidationError
         If any YAML file validation fails with detailed information.
     """
     # Define product validators mapping

disdrodb/scattering/axis_ratio.py CHANGED Viewed

@@ -276,6 +276,72 @@ def get_axis_ratio_thurai_2007(diameter):
     return axis_ratio
+def get_axis_ratio_chang_2009(diameter):
+    """
+    Compute the axis ratio of raindrops using the Chang et al. (2009) model.
+    Parameters
+    ----------
+    diameter : array-like
+        Diameter of the raindrops in millimeters.
+    Returns
+    -------
+    axis_ratio : array-like
+        Calculated axis ratios corresponding to the input diameters.
+    References
+    ----------
+    Chang, W. Y., T. C. C. Wang, and P. L. Lin, 2009.
+    Characteristics of the Raindrop Size Distribution and Drop Shape Relation
+    in Typhoon Systems in the Western Pacific from the 2D Video Disdrometer and NCU C-Band Polarimetric Radar.
+    Journal of Atmospheric and Oceanic Technology, 26, 1973-1993.
+    https://doi.org/10.1175/2009JTECHA1236.1, 2009.
+    """
+    axis_ratio = (
+        0.98287 + 4.2514e-2 * diameter - 3.3439e-2 * diameter**2 + 4.3402e-3 * diameter**3 - 1.9223e-4 * diameter**4
+    )
+    return axis_ratio
+# def get_axis_ratio_wen_2018(diameter):
+#     """
+#     Compute the axis ratio of raindrops using the Wen et al. (2018) relationship.
+#     Parameters
+#     ----------
+#     diameter : array-like
+#         Diameter of the raindrops in millimeters.
+#     Returns
+#     -------
+#     axis_ratio : array-like
+#         Calculated axis ratios corresponding to the input diameters.
+#     References
+#     ----------
+#     Wen, L., Zhao, K., Chen, G., Wang, M., Zhou, B., Huang, H., Hu, D., Lee, W., and Hu, H., 2018.
+#     Drop Size Distribution Characteristics of Seven Typhoons in China.
+#     Journal of Geophysical Research: Atmospheres, 123, 6529-6548.
+#     https://doi.org/10.1029/2017JD027950
+#     Notes
+#     ------
+#     The polynomial formula presented in Wen et al., 2018
+#     does not correspond to the illustration in figure 9 of the manuscript.
+#     The resulting axis-ratio parameterization appears to be incorrect and
+#     therefore is not made available in disdrodb.
+#     """
+#     axis_ratio = (
+#         0.9946
+#         + 2.745e-2 * diameter
+#         - 1.868e-2 * diameter**2
+#         + 1.159e-3 * diameter**3
+#         - 2.143e-4 * diameter**4
+#     )
+#     return axis_ratio
 AXIS_RATIO_MODELS = {
     "Thurai2005": get_axis_ratio_thurai_2005,
     "Thurai2007": get_axis_ratio_thurai_2007,
@@ -284,6 +350,8 @@ AXIS_RATIO_MODELS = {
     "Pruppacher1970": get_axis_ratio_pruppacher_1970,
     "Beard1987": get_axis_ratio_beard_1987,
     "Andsager1999": get_axis_ratio_andsager_1999,
+    "Chang2009": get_axis_ratio_chang_2009,
+    # "Wen2018": get_axis_ratio_wen_2018,
 }
@@ -308,7 +376,7 @@ def get_axis_ratio_model(model):
     model : str
         The model to use for calculating the axis ratio. Available models are:
         'Thurai2005', 'Thurai2007', 'Parsivel', 'Brandes2002',
-        'Pruppacher1970', 'Beard1987', 'Andsager1999'.
+        'Pruppacher1970', 'Beard1987', 'Andsager1999', 'Chang2009'.
     Returns
     -------
@@ -340,7 +408,7 @@ def get_axis_ratio(diameter, model):
     model : str
         The axis ratio model to use for calculating the axis ratio. Available models are:
         'Thurai2005', 'Thurai2007', 'Parsivel', 'Brandes2002',
-        'Pruppacher1970', 'Beard1987', 'Andsager1999'.
+        'Pruppacher1970', 'Beard1987', 'Andsager1999', 'Chang2009'.
     Returns
     -------

disdrodb/scattering/permittivity.py CHANGED Viewed

@@ -19,6 +19,8 @@
 import numpy as np
 import xarray as xr
+from disdrodb.utils.warnings import suppress_warnings
 # Definitions
 # - Complex_refractive_index: m
 # - Complex dielectric constant = complex relative permittivity: eps
@@ -203,7 +205,7 @@ def get_rain_refractive_index_liebe1991_single(temperature, frequency):
     Notes
     -----
-    - The code of this function has been derived from RainSense code of Thomas van Leth available at
+    The code of this function has been derived from RainSense code of Thomas van Leth available at
     https://github.com/temperatureCvanLeth/RainSense/blob/master/rainsense/scattering.py#L149
     References
@@ -256,9 +258,9 @@ def get_rain_refractive_index_liebe1991(temperature, frequency):
     Notes
     -----
-    - The code of this function has been derived from pyradsim code of Daniel Wolfensberger available at
+    The code of this function has been derived from pyradsim code of Daniel Wolfensberger available at
     https://github.com/wolfidan/pyradsim/blob/master/pyradsim/permittivity_models.py#L37
-    - The Liebe et al. (1991) replaces the work of Ray et al. (1972).
+    The Liebe et al. (1991) replaces the work of Ray et al. (1972).
     References
     ----------
@@ -327,8 +329,8 @@ def get_rain_refractive_index_ellison2007(temperature, frequency):
     Notes
     -----
-    - The model is designed to operate only up to 1000 GHz and temperature ranging from 0 degC to 100 degC.
-    - The code of this function has been derived from Davide Ori raincoat code available at
+    The model is designed to operate only up to 1000 GHz and temperature ranging from 0 degC to 100 degC.
+    The code of this function has been derived from Davide Ori raincoat code available at
     https://github.com/OPTIMICe-team/raincoat/blob/master/raincoat/scatTable/water.py#L160
     References
@@ -380,7 +382,8 @@ def get_rain_refractive_index_ellison2007(temperature, frequency):
     eps = eps_real + 1j * eps_imag
     # Compute the refractive index
-    m = np.sqrt(eps)
+    with suppress_warnings():
+        m = np.sqrt(eps)  # on windows sqrt of eps=np.complex128(nan+nanj) raise warning
     return m
@@ -409,7 +412,7 @@ def get_rain_refractive_index_turner2016(frequency, temperature):
     Notes
     -----
-    - The code of this function has been checked against Joseph Hardin pyDSD and Davide Ori raincoat codes
+    The code of this function has been checked against Joseph Hardin pyDSD and Davide Ori raincoat codes
     available at:
     https://github.com/josephhardinee/PyDSD/blob/main/pydsd/utility/dielectric.py#L36
     https://github.com/OPTIMICe-team/raincoat/blob/master/raincoat/scatTable/water.py#L54
@@ -478,7 +481,7 @@ def get_rain_refractive_index_turner2016(frequency, temperature):
 ####----------------------------------------------------------------------------------------
 def get_rayleigh_dielectric_factor(m):
-    """Compute the Rayleigh dielectric factor |K|**2 from the complex refractive index.
+    r"""Compute the Rayleigh dielectric factor :math:`|K|^2` from the complex refractive index.
     The magnitude squared of the complex dielectric constant factor for liquid water,
     relative to the surrounding medium (typically air).
@@ -493,9 +496,9 @@ def get_rayleigh_dielectric_factor(m):
     Returns
     -------
     float
-        Dielectric factor |K|^2 used in Rayleigh scattering.
+        Dielectric factor :math:`|K|^2` used in Rayleigh scattering.
         Often also called the radar dieletric factor.
-        In pytmatrix, correspond to the Kw_sqr argument of the Scatterer object.
+        In pytmatrix, correspond to the ``Kw_sqr`` argument of the Scatterer object.
     """
     eps = m**2
     K_complex = (eps - 1.0) / (eps + 2.0)

disdrodb/scattering/routines.py CHANGED Viewed

@@ -197,7 +197,7 @@ def initialize_scatterer(
         Radar elevation angle in degrees.
         Specify 90 degrees for vertically pointing radars.
         The default is 0 degrees.
-    scattering_table_dir : str or Path, optional
+    scattering_table_dir : str or pathlib.Path, optional
         Directory path where T-Matrix scattering tables are stored. If None, the default
         location will be used.
     verbose: bool
@@ -205,7 +205,7 @@ def initialize_scatterer(
     Returns
     -------
-    scatterer : Scatterer
+    pytmatrix.Scatterer
         A scatterer object with the PSD integrator configured and scattering
         table loaded or generated.
     """
@@ -303,7 +303,7 @@ def calculate_scatterer(
     Returns
     -------
-    scatterer : Scatterer
+    pytmatrix.Scatterer
         A scatterer object with the PSD integrator configured and scattering
         table loaded or generated.
     """
@@ -369,7 +369,7 @@ def load_scatterer(
         Radar elevation angle in degrees.
         Specify 90 degrees for vertically pointing radars.
         The default is 0 degrees.
-    scattering_table_dir : str or Path, optional
+    scattering_table_dir : str or pathlib.Path, optional
         Directory path where T-Matrix scattering tables are stored. If None, the default
         location will be used.
     verbose: bool
@@ -377,7 +377,7 @@ def load_scatterer(
     Returns
     -------
-    scatterer : Scatterer
+    pytmatrix.Scatterer
         A scatterer object with the PSD integrator configured and scattering
         table loaded or generated.
     """
@@ -549,7 +549,7 @@ def _estimate_empirical_radar_parameters(
     scatterer,
 ):
     # Assign PSD model to the scatterer object
-    scatterer.psd = BinnedPSD(bin_edges, drop_number_concentration)
+    scatterer.psd = BinnedPSD(bin_edges, np.asarray(drop_number_concentration))
     # Get radar variables
     return _try_compute_radar_variables(scatterer)
@@ -562,7 +562,7 @@ def _estimate_model_radar_parameters(
     scatterer,
 ):
     # Assign PSD model to the scatterer object
-    parameters = dict(zip(psd_parameters_names, parameters, strict=True))
+    parameters = dict(zip(psd_parameters_names, np.asarray(parameters), strict=True))
     scatterer.psd = create_psd(psd_model, parameters)
     # Get radar variables
@@ -919,12 +919,12 @@ def get_radar_parameters(
     ----------
     ds : xarray.Dataset
         Dataset containing the drop number concentration variable.
-    frequency : str, float, or list of str and float, optional
+    frequency : str, float, or list of str or float, optional
         Frequencies in GHz for which to compute the radar parameters.
         Alternatively, also strings can be used to specify common radar frequencies.
         If ``None``, the common radar frequencies will be used.
         See ``disdrodb.scattering.available_radar_bands()``.
-    num_points: int or lis tof integer, optional
+    num_points: int or list of int, optional
         Number of bins into which discretize the PSD.
     diameter_max : float or list of float, optional
         Maximum diameter. The default value is 8 mm.
@@ -933,7 +933,7 @@ def get_radar_parameters(
     axis_ratio_model : str or list of str, optional
         Models to compute the axis ratio. The default model is ``Thurai2007``.
         See available models with ``disdrodb.scattering.available_axis_ratio_models()``.
-    permittivity_model : str str or list of str, optional
+    permittivity_model : str or list of str, optional
         Permittivity model to use to compute the refractive index and the
         rayleigh_dielectric_factor. The default is ``Turner2016``.
         See available models with ``disdrodb.scattering.available_permittivity_models()``.

disdrodb/summary/routines.py CHANGED Viewed

@@ -84,7 +84,7 @@ def save_table_to_pdf(
     Parameters
     ----------
-    df : pd.DataFrame
+    df : pandas.DataFrame
         The data to render.
     filepath : str
         File path where write the final PDF (e.g. '<...>/table.pdf').
@@ -93,8 +93,9 @@ def save_table_to_pdf(
     fontsize : str, optional
         LaTeX font-size command to wrap the table (e.g. '\\small').
         The default is '\\tiny'.
-    orientation : {'portrait', 'landscape'}
-        Page orientation. If 'landscape', the table will be laid out horizontally.
+    orientation : str
+        Page orientation. Allowed values are 'portrait' and 'landscape'.
+        If 'landscape', the table will be laid out horizontally.
         The default is 'landscape'.
     """
     # Export table to LaTeX
@@ -500,11 +501,11 @@ def fit_powerlaw(x, y, xbins, quantile=0.5, min_counts=10, x_in_db=False, use_ra
     Parameters
     ----------
-    x : array_like
+    x : array-like
         Independent variable values. Must be positive and finite after filtering.
-    y : array_like
+    y : array-like
         Dependent variable values. Must be positive and finite after filtering.
-    xbins : array_like
+    xbins : array-like
         Bin edges for grouping ``x`` values (passed to ``pandas.cut``).
     quantile : float, optional
       Quantile of ``y`` to compute in each bin (between 0 and 1).
@@ -642,7 +643,7 @@ def predict_from_powerlaw(x, a, b):
     Parameters
     ----------
-    x : array_like
+    x : array-like
         Independent variable values.
     a : float
         Power-law coefficient.
@@ -651,7 +652,7 @@ def predict_from_powerlaw(x, a, b):
     Returns
     -------
-    y : ndarray
+    y : numpy.ndarray
         Predicted dependent variable values.
     Notes
@@ -697,7 +698,7 @@ def predict_from_inverse_powerlaw(x, a, b):
     Parameters
     ----------
-    x : array_like
+    x : array-like
         Values of ``x`` (independent variable in the original power law).
     a : float
         Power-law coefficient of the inverse power-law model.
@@ -706,7 +707,7 @@ def predict_from_inverse_powerlaw(x, a, b):
     Returns
     -------
-    y : ndarray
+    y : numpy.ndarray
         Predicted dependent variable values.
     """
     return (x ** (1 / b)) / (a ** (1 / b))
@@ -1726,14 +1727,14 @@ def plot_dmax_relationships(df, diameter_bin_edges, dmax="Dmax", diameter_max=10
     Parameters
     ----------
-    df : DataFrame
+    df : pandas.DataFrame
         Input dataframe containing the precipitation data
-    dmax : str, default "Dmax"
-        Column name for maximum diameter
-    vmax : float, default 10
-        Maximum value for Dmax axis limits
-    dpi : int, default 300
-        Resolution for the figure
+    dmax : str, optional
+        Column name for maximum diameter. Default is 'Dmax'.
+    vmax : float, optional
+        Maximum value for Dmax axis limits. Default is 10 mm.
+    dpi : int, optional
+        Resolution for the figure. The default is 300.
     """
     # Compute 2D histograms
     # - Dmax-R
@@ -3739,12 +3740,14 @@ def define_filename(prefix, extension, data_source, campaign_name, station_name,
     """Define filename for summary files."""
     if extension in ["png", "jpeg"]:
         filename = f"Figure.{prefix}.{data_source}.{campaign_name}.{station_name}.{temporal_resolution}.{extension}"
-    if extension in ["csv", "pdf", "yaml", "yml"]:
+    elif extension in ["csv", "pdf", "yaml", "yml"]:
         filename = f"Table.{prefix}.{data_source}.{campaign_name}.{station_name}.{temporal_resolution}.{extension}"
-    if extension in ["nc"]:
+    elif extension in ["nc"]:
         filename = f"Dataset.{prefix}.{data_source}.{campaign_name}.{station_name}.{temporal_resolution}.{extension}"
-    if extension in ["parquet"]:
+    elif extension in ["parquet"]:
         filename = f"Dataframe.{prefix}.{data_source}.{campaign_name}.{station_name}.{temporal_resolution}.{extension}"
+    else:
+        raise NotImplementedError(f"Standardized filename not implemented for extension {extension}.")
     return filename

disdrodb/utils/archiving.py CHANGED Viewed

@@ -81,7 +81,7 @@ def generate_time_blocks(
     # Mapping from our custom freq to pandas frequency codes
     freq_map = {
         "hour": "h",
-        "day": "d",
+        "day": "D",
         "month": "M",
         "quarter": "Q",
         "year": "Y",
@@ -203,12 +203,13 @@ def identify_time_partitions(start_times, end_times, freq: str) -> list[dict]:
     Parameters
     ----------
-    start_times : numpy.ndarray of datetime64[s]
-        Array of inclusive start times for each file.
-    end_times : numpy.ndarray of datetime64[s]
-        Array of inclusive end times for each file.
-    freq : {'none', 'hour', 'day', 'month', 'quarter', 'season', 'year'}
+    start_times : numpy.ndarray
+        Array of inclusive start times in datetime64[s] format for each file.
+    end_times : numpy.ndarray
+        Array of inclusive end times in datetime64[s] format for each file.
+    freq : str
         Frequency determining the granularity of candidate blocks.
+        Allowed values are {'none', 'hour', 'day', 'month', 'quarter', 'season', 'year'}.
         See `generate_time_blocks` for more details.
     Returns
@@ -252,7 +253,9 @@ def define_temporal_partitions(filepaths, strategy, parallel, strategy_options):
         List of files paths to be processed
     strategy : str
-        Which partitioning strategy to apply:
+        Partitioning strategy to apply.
+        Supported values are:
         - ``'time_block'`` defines fixed time intervals (e.g. monthly) covering input files.
         - ``'event'`` detect clusters of precipitation ("events").
@@ -267,42 +270,46 @@ def define_temporal_partitions(filepaths, strategy, parallel, strategy_options):
         - ``freq``: Time unit for blocks. One of {'year', 'season', 'month', 'day'}.
-        See identify_time_partitions for more information.
+        See the ``identify_time_partitions`` function for more information.
         If ``strategy == 'event'``, supported options are:
         - ``variable`` : str
-          Name of the variable to use to apply the event detection.
+            Name of the variable to use to apply the event detection.
         - ``detection_threshold`` : int
-          Minimum number of drops to consider a timestep.
+            Minimum number of drops to consider a timestep.
         - ``neighbor_min_size`` : int
-          Minimum cluster size for merging neighboring events.
+            Minimum cluster size for merging neighboring events.
         - ``neighbor_time_interval`` : str
-          Time window (e.g. "5MIN") to merge adjacent clusters.
+            Time window (e.g. "5MIN") to merge adjacent clusters.
         - ``event_max_time_gap`` : str
-          Maximum allowed gap (e.g. "6H") within a single event.
+            Maximum allowed gap (e.g. "6H") within a single event.
         - ``event_min_duration`` : str
-          Minimum total duration (e.g. "5MIN") of an event.
+            Minimum total duration (e.g. "5MIN") of an event.
         - ``event_min_size`` : int
-          Minimum number of records in an event.
+            Minimum number of records in an event.
-        See identify_events for more information.
+        See the ``identify_events`` function for more information.
     Returns
     -------
     list
         A list of dictionaries, each containing:
-        - ``start_time`` (numpy.datetime64[s])
+        - ``start_time``: numpy.datetime64[s]
             Inclusive start of an event or time block.
-        - ``end_time`` (numpy.datetime64[s])
+        - ``end_time``: numpy.datetime64[s]
             Inclusive end of an event or time block.
     Notes
     -----
-    - The ``'event'`` strategy requires loading data into memory to identify clusters.
-    - The ``'time_block'`` strategy can operate on metadata alone, without full data loading.
-    - The ``'event'`` strategy implicitly performs data selection on which files to process !
-    - The ``'time_block'`` strategy does not performs data selection on which files to process !
+    The ``'event'`` strategy requires loading data into memory to identify clusters.
+    The ``'time_block'`` strategy can operate on metadata alone, without full data loading.
+    The ``'event'`` strategy implicitly performs data selection on which files to process !
+    The ``'time_block'`` strategy does not performs data selection on which files to process !
     """
     if strategy not in ["time_block", "event"]:
         raise ValueError(f"Unknown strategy: {strategy!r}. Must be 'time_block' or 'event'.")

disdrodb/utils/attrs.py CHANGED Viewed

@@ -20,6 +20,7 @@ import os
 from disdrodb.api.checks import get_current_utc_time
 from disdrodb.constants import ARCHIVE_VERSION, CONVENTIONS, COORDINATES, SOFTWARE_VERSION
+from disdrodb.utils.warnings import suppress_warnings
 from disdrodb.utils.yaml import read_yaml
 ####---------------------------------------------------------------------.
@@ -68,14 +69,14 @@ def update_disdrodb_attrs(ds, product: str):
     Parameters
     ----------
-    ds : xarray dataset.
+    ds : xarray.Dataset
         Dataset
     product: str
         DISDRODB product.
     Returns
     -------
-    xarray dataset
+    xarray.Dataset
         Dataset.
     """
     attrs = ds.attrs.copy()
@@ -96,7 +97,8 @@ def update_disdrodb_attrs(ds, product: str):
     if "time" in ds.dims:
         encoding = ds["time"].encoding
         ds["time"] = ds["time"].dt.floor("s")  # ensure no sub-second values
-        ds["time"] = ds["time"].astype("datetime64[s]")
+        with suppress_warnings():
+            ds["time"] = ds["time"].astype("datetime64[s]")
         ds["time"].encoding = encoding  # otherwise time encoding get lost !
         attrs["time_coverage_start"] = str(ds["time"].data[0])
@@ -136,7 +138,7 @@ def set_disdrodb_attrs(ds, product: str):
     Returns
     -------
-    xarray dataset
+    xarray.Dataset
         Dataset.
     """
     # Add dataset conventions

disdrodb/utils/dataframe.py CHANGED Viewed

@@ -39,7 +39,7 @@ def log_arange(start, stop, log_step=0.1, base=10):
     Returns
     -------
-    np.ndarray
+    numpy.ndarray
         Array of values spaced in log scale.
     """
     if start <= 0 or stop <= 0:
@@ -69,7 +69,7 @@ def log_linspace(start, stop, n_bins, base=10):
     Returns
     -------
-    np.ndarray
+    numpy.ndarray
         Array of values spaced evenly in log space.
     """
     if start <= 0 or stop <= 0:
@@ -146,7 +146,7 @@ def compute_1d_histogram(df, column, variables=None, bins=10, labels=None, prefi
     full_index = pd.Index(intervals, name=f"{column}_binned")
     # Define grouping object
-    df_grouped = df.groupby([f"{column}_binned"], observed=False)
+    df_grouped = df.groupby([f"{column}_binned"], observed=True)
     # Compute statistics for specified variables
     variables_stats = []
@@ -311,7 +311,7 @@ def compute_2d_histogram(
     full_index = pd.MultiIndex.from_product([x_intervals, y_intervals], names=[f"{x}_binned", f"{y}_binned"])
     # Define grouping object
-    df_grouped = df.groupby([f"{x}_binned", f"{y}_binned"], observed=False)
+    df_grouped = df.groupby([f"{x}_binned", f"{y}_binned"], observed=True)
     # Compute statistics for specified variables
     variables_stats = []

disdrodb/utils/encoding.py CHANGED Viewed

@@ -21,6 +21,7 @@ import os
 import numpy as np
 import xarray as xr
+from disdrodb.utils.warnings import suppress_warnings
 from disdrodb.utils.yaml import read_yaml
 EPOCH = "seconds since 1970-01-01 00:00:00"
@@ -67,7 +68,8 @@ def set_encodings(ds: xr.Dataset, encodings_dict: dict) -> xr.Dataset:
     # Set time encoding
     if "time" in ds:
         ds["time"] = ds["time"].dt.floor("s")  # ensure no sub-second values
-        ds["time"] = ds["time"].astype("datetime64[s]")
+        with suppress_warnings():
+            ds["time"] = ds["time"].astype("datetime64[s]")
         ds["time"].encoding.update(get_time_encoding())
     # Set the variable encodings

disdrodb 0.5.0__py3-none-any.whl → 0.5.1__py3-none-any.whl

disdrodb 0.5.0__py3-none-any.whl → 0.5.1__py3-none-any.whl