PyPI - disdrodb - Versions diffs - 0.0.20__py3-none-any.whl → 0.1.0__py3-none-any.whl - Mend

disdrodb 0.0.20__py3-none-any.whl → 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (264)

disdrodb/__init__.py +132 -15
disdrodb/_config.py +4 -2
disdrodb/_version.py +9 -4
disdrodb/api/checks.py +264 -237
disdrodb/api/configs.py +4 -8
disdrodb/api/create_directories.py +235 -290
disdrodb/api/info.py +217 -26
disdrodb/api/io.py +295 -269
disdrodb/api/path.py +597 -173
disdrodb/api/search.py +486 -0
disdrodb/{metadata/scripts → cli}/disdrodb_check_metadata_archive.py +12 -7
disdrodb/{utils/pandas.py → cli/disdrodb_data_archive_directory.py} +9 -18
disdrodb/cli/disdrodb_download_archive.py +86 -0
disdrodb/cli/disdrodb_download_metadata_archive.py +53 -0
disdrodb/cli/disdrodb_download_station.py +84 -0
disdrodb/{api/scripts → cli}/disdrodb_initialize_station.py +22 -10
disdrodb/cli/disdrodb_metadata_archive_directory.py +32 -0
disdrodb/{data_transfer/scripts/disdrodb_download_station.py → cli/disdrodb_open_data_archive.py} +22 -22
disdrodb/cli/disdrodb_open_logs_directory.py +69 -0
disdrodb/{data_transfer/scripts/disdrodb_upload_station.py → cli/disdrodb_open_metadata_archive.py} +22 -24
disdrodb/cli/disdrodb_open_metadata_directory.py +71 -0
disdrodb/cli/disdrodb_open_product_directory.py +74 -0
disdrodb/cli/disdrodb_open_readers_directory.py +32 -0
disdrodb/{l0/scripts → cli}/disdrodb_run_l0.py +38 -31
disdrodb/{l0/scripts → cli}/disdrodb_run_l0_station.py +32 -30
disdrodb/{l0/scripts → cli}/disdrodb_run_l0a.py +30 -21
disdrodb/{l0/scripts → cli}/disdrodb_run_l0a_station.py +24 -33
disdrodb/{l0/scripts → cli}/disdrodb_run_l0b.py +30 -21
disdrodb/{l0/scripts → cli}/disdrodb_run_l0b_station.py +25 -34
disdrodb/cli/disdrodb_run_l0c.py +130 -0
disdrodb/cli/disdrodb_run_l0c_station.py +129 -0
disdrodb/cli/disdrodb_run_l1.py +122 -0
disdrodb/cli/disdrodb_run_l1_station.py +121 -0
disdrodb/cli/disdrodb_run_l2e.py +122 -0
disdrodb/cli/disdrodb_run_l2e_station.py +122 -0
disdrodb/cli/disdrodb_run_l2m.py +122 -0
disdrodb/cli/disdrodb_run_l2m_station.py +122 -0
disdrodb/cli/disdrodb_upload_archive.py +105 -0
disdrodb/cli/disdrodb_upload_station.py +98 -0
disdrodb/configs.py +90 -25
disdrodb/data_transfer/__init__.py +22 -0
disdrodb/data_transfer/download_data.py +87 -90
disdrodb/data_transfer/upload_data.py +64 -37
disdrodb/data_transfer/zenodo.py +15 -18
disdrodb/docs.py +1 -1
disdrodb/issue/__init__.py +17 -4
disdrodb/issue/checks.py +10 -23
disdrodb/issue/reader.py +9 -12
disdrodb/issue/writer.py +14 -17
disdrodb/l0/__init__.py +17 -26
disdrodb/l0/check_configs.py +35 -23
disdrodb/l0/check_standards.py +32 -42
disdrodb/l0/configs/{Thies_LPM → LPM}/bins_diameter.yml +44 -44
disdrodb/l0/configs/{Thies_LPM → LPM}/bins_velocity.yml +40 -40
disdrodb/l0/configs/LPM/l0a_encodings.yml +80 -0
disdrodb/l0/configs/{Thies_LPM → LPM}/l0b_cf_attrs.yml +62 -59
disdrodb/l0/configs/{Thies_LPM → LPM}/l0b_encodings.yml +9 -9
disdrodb/l0/configs/{Thies_LPM → LPM}/raw_data_format.yml +245 -245
disdrodb/l0/configs/{OTT_Parsivel → PARSIVEL}/bins_diameter.yml +66 -66
disdrodb/l0/configs/{OTT_Parsivel → PARSIVEL}/bins_velocity.yml +64 -64
disdrodb/l0/configs/PARSIVEL/l0a_encodings.yml +32 -0
disdrodb/l0/configs/{OTT_Parsivel → PARSIVEL}/l0b_cf_attrs.yml +22 -20
disdrodb/l0/configs/{OTT_Parsivel → PARSIVEL}/l0b_encodings.yml +17 -17
disdrodb/l0/configs/{OTT_Parsivel → PARSIVEL}/raw_data_format.yml +77 -77
disdrodb/l0/configs/{OTT_Parsivel2 → PARSIVEL2}/bins_diameter.yml +64 -64
disdrodb/l0/configs/{OTT_Parsivel2 → PARSIVEL2}/bins_velocity.yml +64 -64
disdrodb/l0/configs/PARSIVEL2/l0a_encodings.yml +39 -0
disdrodb/l0/configs/{OTT_Parsivel2 → PARSIVEL2}/l0b_cf_attrs.yml +24 -22
disdrodb/l0/configs/{OTT_Parsivel2 → PARSIVEL2}/l0b_encodings.yml +20 -20
disdrodb/l0/configs/{OTT_Parsivel2 → PARSIVEL2}/raw_data_format.yml +98 -98
disdrodb/l0/configs/{RD_80 → RD80}/bins_diameter.yml +40 -40
disdrodb/l0/configs/RD80/l0a_encodings.yml +16 -0
disdrodb/l0/configs/{RD_80 → RD80}/l0b_cf_attrs.yml +3 -3
disdrodb/l0/configs/RD80/l0b_encodings.yml +135 -0
disdrodb/l0/configs/{RD_80 → RD80}/raw_data_format.yml +48 -48
disdrodb/l0/l0_reader.py +216 -340
disdrodb/l0/l0a_processing.py +237 -208
disdrodb/l0/l0b_nc_processing.py +227 -80
disdrodb/l0/l0b_processing.py +93 -173
disdrodb/l0/l0c_processing.py +627 -0
disdrodb/l0/readers/{ARM → LPM/ARM}/ARM_LPM.py +36 -58
disdrodb/l0/readers/LPM/AUSTRALIA/MELBOURNE_2007_LPM.py +226 -0
disdrodb/l0/readers/LPM/BRAZIL/CHUVA_LPM.py +185 -0
disdrodb/l0/readers/LPM/BRAZIL/GOAMAZON_LPM.py +183 -0
disdrodb/l0/readers/LPM/ITALY/GID_LPM.py +179 -0
disdrodb/l0/readers/{UK → LPM/UK}/DIVEN.py +14 -35
disdrodb/l0/readers/PARSIVEL/AUSTRALIA/MELBOURNE_2007_PARSIVEL.py +157 -0
disdrodb/l0/readers/PARSIVEL/CHINA/CHONGQING.py +113 -0
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/ARCTIC_2021.py +40 -57
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/COMMON_2011.py +37 -54
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/DAVOS_2009_2011.py +34 -51
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/EPFL_2009.py +34 -51
disdrodb/l0/readers/{EPFL/PARADISO_2014.py → PARSIVEL/EPFL/EPFL_ROOF_2008.py} +38 -50
disdrodb/l0/readers/PARSIVEL/EPFL/EPFL_ROOF_2010.py +105 -0
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/EPFL_ROOF_2011.py +34 -51
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/EPFL_ROOF_2012.py +33 -51
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/GENEPI_2007.py +25 -44
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/GRAND_ST_BERNARD_2007.py +25 -44
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/GRAND_ST_BERNARD_2007_2.py +25 -44
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/HPICONET_2010.py +34 -51
disdrodb/l0/readers/{EPFL/EPFL_ROOF_2010.py → PARSIVEL/EPFL/HYMEX_LTE_SOP2.py} +37 -50
disdrodb/l0/readers/PARSIVEL/EPFL/HYMEX_LTE_SOP3.py +111 -0
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/HYMEX_LTE_SOP4.py +36 -54
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/LOCARNO_2018.py +34 -52
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/LOCARNO_2019.py +38 -56
disdrodb/l0/readers/PARSIVEL/EPFL/PARADISO_2014.py +105 -0
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/PARSIVEL_2007.py +27 -45
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/PLATO_2019.py +24 -44
disdrodb/l0/readers/PARSIVEL/EPFL/RACLETS_2019.py +140 -0
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/RACLETS_2019_WJF.py +41 -59
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/RIETHOLZBACH_2011.py +34 -51
disdrodb/l0/readers/PARSIVEL/EPFL/SAMOYLOV_2017.py +117 -0
disdrodb/l0/readers/PARSIVEL/EPFL/SAMOYLOV_2019.py +137 -0
disdrodb/l0/readers/{EPFL → PARSIVEL/EPFL}/UNIL_2022.py +42 -55
disdrodb/l0/readers/PARSIVEL/GPM/IFLOODS.py +104 -0
disdrodb/l0/readers/{GPM → PARSIVEL/GPM}/LPVEX.py +29 -48
disdrodb/l0/readers/PARSIVEL/GPM/MC3E.py +184 -0
disdrodb/l0/readers/PARSIVEL/NCAR/CCOPE_2015.py +113 -0
disdrodb/l0/readers/{NCAR/VORTEX_SE_2016_P1.py → PARSIVEL/NCAR/OWLES_MIPS.py} +46 -72
disdrodb/l0/readers/PARSIVEL/NCAR/PECAN_MOBILE.py +125 -0
disdrodb/l0/readers/{NCAR/OWLES_MIPS.py → PARSIVEL/NCAR/PLOWS_MIPS.py} +45 -64
disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2009.py +114 -0
disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2010.py +176 -0
disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2010_UF.py +183 -0
disdrodb/l0/readers/{ARM/ARM_LD.py → PARSIVEL2/ARM/ARM_PARSIVEL2.py} +27 -50
disdrodb/l0/readers/PARSIVEL2/BRAZIL/CHUVA_PARSIVEL2.py +163 -0
disdrodb/l0/readers/PARSIVEL2/BRAZIL/GOAMAZON_PARSIVEL2.py +163 -0
disdrodb/l0/readers/{DENMARK → PARSIVEL2/DENMARK}/EROSION_nc.py +14 -35
disdrodb/l0/readers/PARSIVEL2/FRANCE/SIRTA_PARSIVEL2.py +119 -0
disdrodb/l0/readers/PARSIVEL2/GPM/GCPEX.py +104 -0
disdrodb/l0/readers/PARSIVEL2/GPM/NSSTC.py +176 -0
disdrodb/l0/readers/PARSIVEL2/ITALY/GID_PARSIVEL2.py +32 -0
disdrodb/l0/readers/PARSIVEL2/MEXICO/OH_IIUNAM_nc.py +56 -0
disdrodb/l0/readers/PARSIVEL2/NCAR/PECAN_FP3.py +120 -0
disdrodb/l0/readers/{NCAR → PARSIVEL2/NCAR}/PECAN_MIPS.py +45 -64
disdrodb/l0/readers/PARSIVEL2/NCAR/RELAMPAGO_PARSIVEL2.py +181 -0
disdrodb/l0/readers/PARSIVEL2/NCAR/SNOWIE_PJ.py +160 -0
disdrodb/l0/readers/PARSIVEL2/NCAR/SNOWIE_SB.py +160 -0
disdrodb/l0/readers/{NCAR/PLOWS_MIPS.py → PARSIVEL2/NCAR/VORTEX_SE_2016_P1.py} +49 -66
disdrodb/l0/readers/PARSIVEL2/NCAR/VORTEX_SE_2016_P2.py +118 -0
disdrodb/l0/readers/PARSIVEL2/NCAR/VORTEX_SE_2016_PIPS.py +152 -0
disdrodb/l0/readers/PARSIVEL2/NETHERLANDS/DELFT.py +166 -0
disdrodb/l0/readers/{NCAR/RELAMPAGO_RD80.py → RD80/BRAZIL/CHUVA_RD80.py} +36 -60
disdrodb/l0/readers/{BRAZIL → RD80/BRAZIL}/GOAMAZON_RD80.py +36 -55
disdrodb/l0/readers/{NCAR → RD80/NCAR}/CINDY_2011_RD80.py +35 -54
disdrodb/l0/readers/{BRAZIL/CHUVA_RD80.py → RD80/NCAR/RELAMPAGO_RD80.py} +40 -54
disdrodb/l0/readers/template_reader_raw_netcdf_data.py +62 -0
disdrodb/l0/readers/{reader_template.py → template_reader_raw_text_data.py} +20 -44
disdrodb/l0/routines.py +885 -581
disdrodb/l0/standards.py +72 -236
disdrodb/l0/template_tools.py +104 -109
disdrodb/l1/__init__.py +17 -0
disdrodb/l1/beard_model.py +716 -0
disdrodb/l1/encoding_attrs.py +620 -0
disdrodb/l1/fall_velocity.py +260 -0
disdrodb/l1/filters.py +192 -0
disdrodb/l1/processing.py +200 -0
disdrodb/l1/resampling.py +236 -0
disdrodb/l1/routines.py +357 -0
disdrodb/l1_env/__init__.py +17 -0
disdrodb/l1_env/routines.py +38 -0
disdrodb/l2/__init__.py +17 -0
disdrodb/l2/empirical_dsd.py +1735 -0
disdrodb/l2/event.py +388 -0
disdrodb/l2/processing.py +519 -0
disdrodb/l2/processing_options.py +213 -0
disdrodb/l2/routines.py +868 -0
disdrodb/metadata/__init__.py +9 -2
disdrodb/metadata/checks.py +165 -118
disdrodb/metadata/download.py +81 -0
disdrodb/metadata/geolocation.py +146 -0
disdrodb/metadata/info.py +20 -13
disdrodb/metadata/manipulation.py +1 -1
disdrodb/metadata/reader.py +59 -8
disdrodb/metadata/search.py +77 -144
disdrodb/metadata/standards.py +7 -8
disdrodb/metadata/writer.py +8 -14
disdrodb/psd/__init__.py +38 -0
disdrodb/psd/fitting.py +2146 -0
disdrodb/psd/models.py +774 -0
disdrodb/routines.py +1176 -0
disdrodb/scattering/__init__.py +28 -0
disdrodb/scattering/axis_ratio.py +344 -0
disdrodb/scattering/routines.py +456 -0
disdrodb/utils/__init__.py +17 -0
disdrodb/utils/attrs.py +208 -0
disdrodb/utils/cli.py +269 -0
disdrodb/utils/compression.py +60 -42
disdrodb/utils/dask.py +62 -0
disdrodb/utils/decorators.py +110 -0
disdrodb/utils/directories.py +107 -46
disdrodb/utils/encoding.py +127 -0
disdrodb/utils/list.py +29 -0
disdrodb/utils/logger.py +168 -46
disdrodb/utils/time.py +657 -0
disdrodb/utils/warnings.py +30 -0
disdrodb/utils/writer.py +57 -0
disdrodb/utils/xarray.py +138 -47
disdrodb/utils/yaml.py +0 -1
disdrodb/viz/__init__.py +17 -0
disdrodb/viz/plots.py +17 -0
disdrodb-0.1.0.dist-info/METADATA +321 -0
disdrodb-0.1.0.dist-info/RECORD +216 -0
{disdrodb-0.0.20.dist-info → disdrodb-0.1.0.dist-info}/WHEEL +1 -1
disdrodb-0.1.0.dist-info/entry_points.txt +30 -0
disdrodb/data_transfer/scripts/disdrodb_download_archive.py +0 -53
disdrodb/data_transfer/scripts/disdrodb_upload_archive.py +0 -57
disdrodb/l0/configs/OTT_Parsivel/l0a_encodings.yml +0 -32
disdrodb/l0/configs/OTT_Parsivel2/l0a_encodings.yml +0 -39
disdrodb/l0/configs/RD_80/l0a_encodings.yml +0 -16
disdrodb/l0/configs/RD_80/l0b_encodings.yml +0 -135
disdrodb/l0/configs/Thies_LPM/l0a_encodings.yml +0 -80
disdrodb/l0/io.py +0 -257
disdrodb/l0/l0_processing.py +0 -1091
disdrodb/l0/readers/AUSTRALIA/MELBOURNE_2007_OTT.py +0 -178
disdrodb/l0/readers/AUSTRALIA/MELBOURNE_2007_THIES.py +0 -247
disdrodb/l0/readers/BRAZIL/CHUVA_LPM.py +0 -204
disdrodb/l0/readers/BRAZIL/CHUVA_OTT.py +0 -183
disdrodb/l0/readers/BRAZIL/GOAMAZON_LPM.py +0 -204
disdrodb/l0/readers/BRAZIL/GOAMAZON_OTT.py +0 -183
disdrodb/l0/readers/CHINA/CHONGQING.py +0 -131
disdrodb/l0/readers/EPFL/EPFL_ROOF_2008.py +0 -128
disdrodb/l0/readers/EPFL/HYMEX_LTE_SOP2.py +0 -127
disdrodb/l0/readers/EPFL/HYMEX_LTE_SOP3.py +0 -129
disdrodb/l0/readers/EPFL/RACLETS_2019.py +0 -158
disdrodb/l0/readers/EPFL/SAMOYLOV_2017.py +0 -136
disdrodb/l0/readers/EPFL/SAMOYLOV_2019.py +0 -158
disdrodb/l0/readers/FRANCE/SIRTA_OTT2.py +0 -138
disdrodb/l0/readers/GPM/GCPEX.py +0 -123
disdrodb/l0/readers/GPM/IFLOODS.py +0 -123
disdrodb/l0/readers/GPM/MC3E.py +0 -123
disdrodb/l0/readers/GPM/NSSTC.py +0 -164
disdrodb/l0/readers/ITALY/GID.py +0 -199
disdrodb/l0/readers/MEXICO/OH_IIUNAM_nc.py +0 -92
disdrodb/l0/readers/NCAR/CCOPE_2015.py +0 -133
disdrodb/l0/readers/NCAR/PECAN_FP3.py +0 -137
disdrodb/l0/readers/NCAR/PECAN_MOBILE.py +0 -144
disdrodb/l0/readers/NCAR/RELAMPAGO_OTT.py +0 -195
disdrodb/l0/readers/NCAR/SNOWIE_PJ.py +0 -172
disdrodb/l0/readers/NCAR/SNOWIE_SB.py +0 -179
disdrodb/l0/readers/NCAR/VORTEX2_2009.py +0 -133
disdrodb/l0/readers/NCAR/VORTEX2_2010.py +0 -188
disdrodb/l0/readers/NCAR/VORTEX2_2010_UF.py +0 -191
disdrodb/l0/readers/NCAR/VORTEX_SE_2016_P2.py +0 -135
disdrodb/l0/readers/NCAR/VORTEX_SE_2016_PIPS.py +0 -170
disdrodb/l0/readers/NETHERLANDS/DELFT.py +0 -187
disdrodb/l0/readers/SPAIN/SBEGUERIA.py +0 -179
disdrodb/l0/scripts/disdrodb_run_l0b_concat.py +0 -93
disdrodb/l0/scripts/disdrodb_run_l0b_concat_station.py +0 -85
disdrodb/utils/netcdf.py +0 -452
disdrodb/utils/scripts.py +0 -102
disdrodb-0.0.20.dist-info/AUTHORS.md +0 -18
disdrodb-0.0.20.dist-info/METADATA +0 -186
disdrodb-0.0.20.dist-info/RECORD +0 -168
disdrodb-0.0.20.dist-info/entry_points.txt +0 -15
/disdrodb/l0/configs/{RD_80 → RD80}/bins_velocity.yml +0 -0
/disdrodb/l0/manuals/{Thies_LPM.pdf → LPM.pdf} +0 -0
/disdrodb/l0/manuals/{ODM_470.pdf → ODM470.pdf} +0 -0
/disdrodb/l0/manuals/{OTT_Parsivel.pdf → PARSIVEL.pdf} +0 -0
/disdrodb/l0/manuals/{OTT_Parsivel2.pdf → PARSIVEL2.pdf} +0 -0
/disdrodb/l0/manuals/{PWS_100.pdf → PWS100.pdf} +0 -0
/disdrodb/l0/manuals/{RD_80.pdf → RD80.pdf} +0 -0
{disdrodb-0.0.20.dist-info → disdrodb-0.1.0.dist-info/licenses}/LICENSE +0 -0
{disdrodb-0.0.20.dist-info → disdrodb-0.1.0.dist-info}/top_level.txt +0 -0

disdrodb/utils/netcdf.py DELETED

@@ -1,452 +0,0 @@
-#!/usr/bin/env python3
-# -----------------------------------------------------------------------------.
-# Copyright (c) 2021-2023 DISDRODB developers
-#
-# This program is free software: you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation, either version 3 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program.  If not, see <http://www.gnu.org/licenses/>.
-# -----------------------------------------------------------------------------.
-"""DISDRODB netCDF utility."""
-import logging
-from typing import Tuple
-import numpy as np
-import pandas as pd
-import xarray as xr
-from disdrodb.utils.logger import log_error, log_info, log_warning
-logger = logging.getLogger(__name__)
-####---------------------------------------------------------------------------.
-def _sort_datasets_by_dim(list_ds: list, filepaths: str, dim: str = "time") -> Tuple[list, list]:
-    """Sort a list of xarray.Dataset and corresponding file paths by the starting value of a specified dimension.
-    Parameters
-    ----------
-    filepaths : list
-        List of netCDFs file paths.
-    list_ds : list
-        List of xarray Dataset.
-    dim : str, optional
-        Dimension name. The default is "time".
-    Returns
-    -------
-    tuple
-        Tuple of sorted list of xarray datasets and sorted list of file paths.
-    """
-    start_values = [ds[dim].values[0] for ds in list_ds]
-    sorted_idx = np.argsort(start_values)
-    sorted_list_ds = [list_ds[i] for i in sorted_idx]
-    sorted_filepaths = [filepaths[i] for i in sorted_idx]
-    return sorted_list_ds, sorted_filepaths
-def _get_dim_values_index(list_ds: list, dim: str) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
-    """Get list and dataset indices associated to the dimension values."""
-    dim_values = np.concatenate([ds[dim].values for ds in list_ds])
-    list_index = np.concatenate([np.ones(len(ds[dim])) * i for i, ds in enumerate(list_ds)])
-    list_index = list_index.astype(int)
-    ds_index = np.concatenate([np.arange(0, len(ds[dim])) for i, ds in enumerate(list_ds)])
-    return dim_values, list_index, ds_index
-def _get_non_monotonic_indices_to_remove(dim_values: np.ndarray) -> np.ndarray:
-    """Returns the indices that cause a non-monotonic increasing series of values.
-    Assume that duplicated values, if present, occurs consecutively !
-    """
-    diff_dim_values = np.diff(dim_values)
-    indices_decreasing = np.where(diff_dim_values.astype(float) <= 0)[0] + 1
-    if len(indices_decreasing) == 0:
-        return []
-    idx_start_decreasing = indices_decreasing[0]
-    idx_restart_increase = np.max(np.where(dim_values <= dim_values[idx_start_decreasing - 1])[0])
-    idx_to_remove = np.arange(idx_start_decreasing, idx_restart_increase + 1)
-    return idx_to_remove
-def _get_duplicated_indices(x, keep="first"):
-    """Return the indices to remove for duplicated values in x such that there is only one value occurrence.
-    Parameters
-    ----------
-    x :  np.array
-        Array of values.
-    keep : str, optional
-        The value to keep, either 'first', 'last' or False.
-        The default is 'first'.
-        ‘first’ : Mark duplicates as True except for the first occurrence.
-        ‘last’ : Mark duplicates as True except for the last occurrence.
-        False : Mark all duplicates as True.
-    Returns
-    -------
-    np.array
-        Array of indices to remove.
-    """
-    # Check 'keep' argument
-    # if not isinstance(keep, str):
-    #     raise TypeError("`keep` must be a string. Either first or last.")
-    # if not np.isin(keep, ["first", "last"]):
-    #     raise ValueError("Invalid value for argument keep. Only 'first' and 'last' are accepted.")
-    # # Get
-    # x_indices = np.arange(len(x))
-    # unique_values, unique_counts = np.unique(x, return_counts=True)
-    # duplicated_values = unique_values[unique_counts > 1]
-    # duplicated_indices = np.array([], dtype=np.int32)
-    # if keep == 'first':
-    #     for value in duplicated_values:
-    #         indices = np.where(x == value)[0]
-    #         duplicated_indices = np.concatenate([duplicated_indices, indices[1:]])
-    # elif keep == 'last':
-    #     indices = np.where(x == value)[0]
-    #     duplicated_indices = np.concatenate([duplicated_indices, indices[:-1]])
-    # return duplicated_indices
-    # Get duplicate indices
-    idx_duplicated = pd.Index(x).duplicated(keep=keep)
-    return np.where(idx_duplicated)[0]
-def _get_bad_info_dict(
-    idx_to_remove: np.ndarray,
-    list_index: np.ndarray,
-    dim_values: np.ndarray,
-    ds_index: np.ndarray,
-) -> Tuple[dict, dict]:
-    """Return two dictionaries mapping, for each dataset, the bad values and indices to remove.
-    Parameters
-    ----------
-    idx_to_remove : np.ndarray
-        Indices to be removed to ensure monotonic dimension.
-    list_index : np.ndarray
-        Indices corresponding to the file in the `list_ds` parameter.
-    ds_index : np.ndarray
-        Indices corresponding to the dataset dimension index in the `list_ds` parameter.
-    Returns
-    -------
-    dict
-        A dictionary mapping the dimension values to remove for each file.
-    dict
-        A dictionary mapping the dataset dimension indices to remove for each file.
-    """
-    list_index_bad = list_index[idx_to_remove]
-    ds_index_bad = ds_index[idx_to_remove]
-    dim_values_bad = dim_values[idx_to_remove]
-    # Retrieve dictionary with the bad values in each dataset
-    dict_ds_bad_values = {k: dim_values_bad[np.where(list_index_bad == k)[0]] for k in np.unique(list_index_bad)}
-    # Retrieve dictionary with the index with the bad values in each dataset
-    dict_ds_bad_idx = {k: ds_index_bad[np.where(list_index_bad == k)[0]] for k in np.unique(list_index_bad)}
-    return dict_ds_bad_values, dict_ds_bad_idx
-def _remove_dataset_bad_values(list_ds, filepaths, dict_ds_bad_idx, dim):
-    """Remove portions of xarray Datasets corresponding to duplicated values.
-    Parameters
-    ----------
-    list_ds : list
-        List of xarray Dataset.
-    dict_ds_bad_idx : dict
-        Dictionary with the dimension indices corresponding to bad values in each xarray Dataset.
-    Returns
-    -------
-    list_ds : list
-        List of xarray Dataset without bad values.
-    """
-    list_index_valid = list(range(len(list_ds)))
-    for list_index_bad, bad_idx in dict_ds_bad_idx.items():
-        # Get dataset
-        ds = list_ds[list_index_bad]
-        # If resulting in a empty dataset, drop index from list_index_valid
-        if len(bad_idx) == len(list_ds[list_index_bad][dim]):
-            list_index_valid.remove(list_index_bad)
-        # Remove invalid indices
-        list_ds[list_index_bad] = ds.drop_isel({dim: bad_idx})
-    # Keep non-empty datasets
-    new_list_ds = [list_ds[idx] for idx in list_index_valid]
-    new_filepaths = [filepaths[idx] for idx in list_index_valid]
-    return new_list_ds, new_filepaths
-def ensure_unique_dimension_values(list_ds: list, filepaths: str, dim: str = "time", verbose: bool = False) -> list:
-    """Ensure that a list of xr.Dataset has non duplicated dimension values.
-    Parameters
-    ----------
-    list_ds : list
-        List of xarray Dataset.
-    filepaths : list
-        List of netCDFs file paths.
-    dim : str, optional
-        Dimension name.
-        The default is "time".
-    Returns
-    -------
-    list
-        List of xarray Dataset.
-    list
-        List of netCDFs file paths.
-    """
-    # Reorder the files and filepaths by the starting dimension value (time)
-    list_ds, filepaths = _sort_datasets_by_dim(list_ds=list_ds, filepaths=filepaths, dim=dim)
-    # Get the datasets dimension values array (and associated list_ds/xr.Dataset indices)
-    dim_values, list_index, ds_index = _get_dim_values_index(list_ds, dim=dim)
-    # Get duplicated indices
-    idx_duplicated = _get_duplicated_indices(dim_values, keep="first")
-    # Remove duplicated indices
-    if len(idx_duplicated) > 0:
-        # Retrieve dictionary providing bad values and indexes for each dataset
-        dict_ds_bad_values, dict_ds_bad_idx = _get_bad_info_dict(
-            idx_to_remove=idx_duplicated,
-            list_index=list_index,
-            dim_values=dim_values,
-            ds_index=ds_index,
-        )
-        # Report for each dataset, the duplicates values occurring
-        for list_index_bad, bad_values in dict_ds_bad_values.items():
-            # Retrieve dataset filepath
-            filepath = filepaths[list_index_bad]
-            # If all values inside the file are duplicated, report it
-            if len(bad_values) == len(list_ds[list_index_bad][dim]):
-                msg = (
-                    f"{filepath} is excluded from concatenation. All {dim} values are already present in some other"
-                    " file."
-                )
-                log_warning(logger=logger, msg=msg, verbose=verbose)
-            else:
-                if np.issubdtype(bad_values.dtype, np.datetime64):
-                    bad_values = bad_values.astype("M8[s]")
-                msg = f"In {filepath}, dropping {dim} values {bad_values} to avoid duplicated {dim} values."
-                log_warning(logger=logger, msg=msg, verbose=verbose)
-        # Remove duplicated values
-        list_ds, filepaths = _remove_dataset_bad_values(
-            list_ds=list_ds, filepaths=filepaths, dict_ds_bad_idx=dict_ds_bad_idx, dim=dim
-        )
-    return list_ds, filepaths
-def ensure_monotonic_dimension(list_ds: list, filepaths: str, dim: str = "time", verbose: bool = False) -> list:
-    """Ensure that a list of xr.Dataset has a monotonic increasing (non duplicated) dimension values.
-    Parameters
-    ----------
-    list_ds : list
-        List of xarray Dataset.
-    filepaths : list
-        List of netCDFs file paths.
-    dim : str, optional
-        Dimension name.
-        The default is "time".
-    Returns
-    -------
-    list
-        List of xarray Dataset.
-    list
-        List of netCDFs file paths.
-    """
-    # Reorder the files and filepaths by the starting dimension value (time)
-    # TODO: should maybe also split by non-continuous time ...
-    list_ds, filepaths = _sort_datasets_by_dim(list_ds=list_ds, filepaths=filepaths, dim=dim)
-    # Get the datasets dimension values array (and associated list_ds/xr.Dataset indices)
-    dim_values, list_index, ds_index = _get_dim_values_index(list_ds, dim=dim)
-    # Identify the indices to remove to ensure monotonic values
-    idx_to_remove = _get_non_monotonic_indices_to_remove(dim_values)
-    # Remove indices causing the values to be non-monotonic increasing
-    if len(idx_to_remove) > 0:
-        # Retrieve dictionary providing bad values and indexes for each dataset
-        dict_ds_bad_values, dict_ds_bad_idx = _get_bad_info_dict(
-            idx_to_remove=idx_to_remove,
-            list_index=list_index,
-            dim_values=dim_values,
-            ds_index=ds_index,
-        )
-        # Report for each dataset, the values to be dropped
-        for list_index_bad, bad_values in dict_ds_bad_values.items():
-            # Retrieve dataset filepath
-            filepath = filepaths[list_index_bad]
-            # If all values inside the file should be dropped, report it
-            if len(bad_values) == len(list_ds[list_index_bad][dim]):
-                msg = (
-                    f"{filepath} is excluded from concatenation. All {dim} values cause the dimension to be"
-                    " non-monotonic."
-                )
-                log_warning(logger=logger, msg=msg, verbose=verbose)
-            else:
-                if np.issubdtype(bad_values.dtype, np.datetime64):
-                    bad_values = bad_values.astype("M8[s]")
-                msg = f"In {filepath}, dropping {dim} values {bad_values} to ensure monotonic {dim} dimension."
-                log_warning(logger=logger, msg=msg, verbose=verbose)
-        # Remove duplicated values
-        list_ds, filepaths = _remove_dataset_bad_values(
-            list_ds=list_ds, filepaths=filepaths, dict_ds_bad_idx=dict_ds_bad_idx, dim=dim
-        )
-        # Iterative check
-        list_ds, filepaths = ensure_monotonic_dimension(list_ds=list_ds, filepaths=filepaths, dim=dim)
-    return list_ds, filepaths
-# ds_index = [0,1,2,3,0,1,2,3,4]
-# list_index = [0,0,0,0,1, 1, 1,1, 1]
-# dim_values = [0,1,5,5,5, 5, 6,7,8]
-# list_index = np.array(list_index)
-# dim_values = np.array(dim_values)
-# ds_index = np.array(ds_index)
-####---------------------------------------------------------------------------
-def get_list_ds(filepaths: str) -> list:
-    """Get list of xarray datasets from file paths.
-    Parameters
-    ----------
-    filepaths : list
-        List of netCDFs file paths.
-    Returns
-    -------
-    list
-        List of xarray datasets.
-    """
-    list_ds = []
-    for filepath in filepaths:
-        # This context manager is required to avoid random HDF locking
-        # - cache=True: store data in memory to avoid reading back from disk
-        # --> but LRU cache might cause the netCDF to not be closed !
-        with xr.open_dataset(filepath, cache=False) as data:
-            ds = data.load()
-        list_ds.append(ds)
-    return list_ds
-# def get_list_ds(filepaths: str) -> list:
-#     """Get list of xarray datasets from file paths.
-#     Parameters
-#     ----------
-#     filepaths : list
-#         List of netCDFs file paths.
-#     Returns
-#     -------
-#     list
-#         List of xarray datasets.
-#     """
-#     # WARNING: READING IN PARALLEL USING MULTIPROCESS CAUSE HDF LOCK ERRORS
-#     @dask.delayed
-#     def open_dataset_delayed(filepath):
-#         import os
-#         os.environ["HDF5_USE_FILE_LOCKING"] = "FALSE"
-#
-#         # This context manager is required to avoid random HDF locking
-#         # - cache=True: store data in memory to avoid reading back from disk
-#         # --> but LRU cache might cause the netCDF to not be closed !
-#         with xr.open_dataset(filepath, cache=False) as data:
-#             ds = data.load()
-#         return ds
-#     list_ds_delayed = []
-#     for filepath in filepaths:
-#         list_ds_delayed.append(open_dataset_delayed(filepath))
-#     list_ds = dask.compute(list_ds_delayed)[0]
-#     return list_ds
-####---------------------------------------------------------------------------
-def _concatenate_datasets(list_ds, dim="time", verbose=False):
-    try:
-        msg = "Start concatenating with xr.concat."
-        log_info(logger=logger, msg=msg, verbose=verbose)
-        ds = xr.concat(list_ds, dim="time", coords="minimal", compat="override")
-        msg = "Concatenation with xr.concat has been successful."
-        log_info(logger=logger, msg=msg, verbose=verbose)
-    except Exception as e:
-        msg = f"Concatenation with xr.concat failed. Error is {e}."
-        log_error(logger=logger, msg=msg, verbose=False)
-        raise ValueError(msg)
-    return ds
-def xr_concat_datasets(filepaths: str, verbose=False) -> xr.Dataset:
-    """Concat xr.Dataset in a robust and parallel way.
-    1. It checks for time dimension monotonicity
-    Parameters
-    ----------
-    filepaths : list
-        List of netCDFs file paths.
-    Returns
-    -------
-    xr.Dataset
-        A single xarray dataset.
-    Raises
-    ------
-    ValueError
-        Error if the merging/concatenation operations can not be achieved.
-    """
-    # --------------------------------------.
-    # Open xr.Dataset lazily in parallel using dask delayed
-    list_ds = get_list_ds(filepaths)
-    # --------------------------------------.
-    # Ensure time dimension contains no duplicated values
-    list_ds, filepaths = ensure_unique_dimension_values(
-        list_ds=list_ds, filepaths=filepaths, dim="time", verbose=verbose
-    )
-    # Ensure time dimension is monotonic increasingly
-    list_ds, filepaths = ensure_monotonic_dimension(list_ds=list_ds, filepaths=filepaths, dim="time", verbose=verbose)
-    # --------------------------------------.
-    # Concatenate all netCDFs
-    ds = _concatenate_datasets(list_ds=list_ds, dim="time", verbose=verbose)
-    # --------------------------------------.
-    # Return xr.Dataset
-    return ds

disdrodb/utils/scripts.py DELETED

@@ -1,102 +0,0 @@
-#!/usr/bin/env python3
-# -----------------------------------------------------------------------------.
-# Copyright (c) 2021-2023 DISDRODB developers
-#
-# This program is free software: you can redistribute it and/or modify
-# it under the terms of the GNU General Public License as published by
-# the Free Software Foundation, either version 3 of the License, or
-# (at your option) any later version.
-#
-# This program is distributed in the hope that it will be useful,
-# but WITHOUT ANY WARRANTY; without even the implied warranty of
-# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
-# GNU General Public License for more details.
-#
-# You should have received a copy of the GNU General Public License
-# along with this program.  If not, see <http://www.gnu.org/licenses/>.
-# -----------------------------------------------------------------------------.
-"""DISDRODB scripts utility."""
-import click
-def _execute_cmd(cmd, raise_error=False):
-    """Execute command in the terminal, streaming output in python console."""
-    from subprocess import PIPE, CalledProcessError, Popen
-    with Popen(cmd, shell=True, stdout=PIPE, bufsize=1, universal_newlines=True) as p:
-        for line in p.stdout:
-            print(line, end="")
-    # Raise error if command didn't run successfully
-    if p.returncode != 0 and raise_error:
-        raise CalledProcessError(p.returncode, p.args)
-def _parse_empty_string_and_none(args):
-    """Utility to parse argument passed from the command line.
-    If args = '' --> None
-    If args = 'None' --> None
-    Otherwise return args
-    """
-    # If '', set to 'None'
-    args = None if args == "" else args
-    # - If multiple arguments, split by space
-    if isinstance(args, str):
-        if args == "None":
-            args = None
-    return args
-def parse_arg_to_list(args):
-    """Utility to pass list to command line scripts.
-    If args = '' --> None
-    If args = 'None' --> None
-    If args = 'variable' --> [variable]
-    If args = 'variable1 variable2' --> [variable1, variable2]
-    """
-    # If '' or 'None' --> Set to None
-    args = _parse_empty_string_and_none(args)
-    # - If multiple arguments, split by space
-    if isinstance(args, str):
-        # - Split by space
-        list_args = args.split(" ")
-        # - Remove '' (deal with multi space)
-        args = [args for args in list_args if len(args) > 0]
-    return args
-def parse_base_dir(base_dir):
-    """Utility to parse base_dir provided by command line.
-    If base_dir = 'None' --> None
-    If base_dir = '' --> None
-    """
-    # If '', set to 'None'
-    return _parse_empty_string_and_none(base_dir)
-def click_station_arguments(function: object):
-    """Click command line arguments for DISDRODB station processing.
-    Parameters
-    ----------
-    function : object
-        Function.
-    """
-    function = click.argument("station_name", metavar="<station>")(function)
-    function = click.argument("campaign_name", metavar="<CAMPAIGN_NAME>")(function)
-    function = click.argument("data_source", metavar="<DATA_SOURCE>")(function)
-    return function
-def click_base_dir_option(function: object):
-    function = click.option(
-        "--base_dir",
-        type=str,
-        show_default=True,
-        default=None,
-        help="DISDRODB base directory",
-    )(function)
-    return function

disdrodb-0.0.20.dist-info/AUTHORS.md DELETED

@@ -1,18 +0,0 @@
-# Project Contributors
-The following people have made contributions to this project:
-<!--- Use your GitHub account or any other personal reference URL --->
-<!--- If you wish to not use your real name, please use your github username --->
-<!--- The list should be alphabetical by last name if possible, with github usernames at the bottom  and the istitution --->
-<!--- See https://gist.github.com/djhoese/52220272ec73b12eb8f4a29709be110d for auto-generating parts of this list --->
-- [Alexis Berne](https://people.epfl.ch/alexis.berne?lang=en) - EPFL
-- [Gionata Ghiggi (ghiggi)](https://github.com/ghiggi) - EPFL
-- [Jacopo Grazioli (jacgraz)](https://github.com/jacgraz) - EPFL
-- [Saverio Guzzo  (saveriogzz)](https://github.com/saveriogzz) - TU DELFT
-- [Kim Candolfi (KimCandolfi)](https://github.com/KimCandolfi) - EPFL
-- [Régis Longchamp (regislon)](https://github.com/regislon) - EPFL
-- [Son Pham-Ba (sphamba)](https://github.com/sphamba) - EPFL
-- [Charlotte Gisèle Weil  (charlottegiseleweil)](https://github.com/charlottegiseleweil) - EPFL

disdrodb 0.0.20__py3-none-any.whl → 0.1.0__py3-none-any.whl

disdrodb 0.0.20__py3-none-any.whl → 0.1.0__py3-none-any.whl