disdrodb 0.2.0__py3-none-any.whl → 0.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (315) hide show
  1. disdrodb/__init__.py +1 -1
  2. disdrodb/_config.py +1 -3
  3. disdrodb/_version.py +2 -2
  4. disdrodb/accessor/__init__.py +1 -1
  5. disdrodb/accessor/methods.py +18 -11
  6. disdrodb/api/checks.py +2 -4
  7. disdrodb/api/configs.py +1 -3
  8. disdrodb/api/create_directories.py +4 -6
  9. disdrodb/api/info.py +1 -3
  10. disdrodb/api/io.py +15 -9
  11. disdrodb/api/path.py +1 -3
  12. disdrodb/cli/disdrodb_check_metadata_archive.py +2 -2
  13. disdrodb/cli/disdrodb_check_products_options.py +44 -0
  14. disdrodb/cli/disdrodb_create_summary.py +48 -22
  15. disdrodb/cli/disdrodb_create_summary_station.py +39 -18
  16. disdrodb/cli/disdrodb_data_archive_directory.py +1 -3
  17. disdrodb/cli/disdrodb_download_archive.py +45 -24
  18. disdrodb/cli/disdrodb_download_metadata_archive.py +27 -16
  19. disdrodb/cli/disdrodb_download_station.py +56 -26
  20. disdrodb/cli/disdrodb_initialize_station.py +40 -20
  21. disdrodb/cli/disdrodb_metadata_archive_directory.py +1 -3
  22. disdrodb/cli/disdrodb_open_data_archive.py +16 -11
  23. disdrodb/cli/disdrodb_open_logs_directory.py +29 -18
  24. disdrodb/cli/disdrodb_open_metadata_archive.py +25 -11
  25. disdrodb/cli/disdrodb_open_metadata_directory.py +32 -20
  26. disdrodb/cli/disdrodb_open_product_directory.py +38 -21
  27. disdrodb/cli/disdrodb_open_readers_directory.py +1 -3
  28. disdrodb/cli/disdrodb_run.py +189 -0
  29. disdrodb/cli/disdrodb_run_l0.py +55 -64
  30. disdrodb/cli/disdrodb_run_l0_station.py +47 -52
  31. disdrodb/cli/disdrodb_run_l0a.py +47 -45
  32. disdrodb/cli/disdrodb_run_l0a_station.py +38 -37
  33. disdrodb/cli/disdrodb_run_l0b.py +45 -45
  34. disdrodb/cli/disdrodb_run_l0b_station.py +37 -36
  35. disdrodb/cli/disdrodb_run_l0c.py +50 -47
  36. disdrodb/cli/disdrodb_run_l0c_station.py +41 -38
  37. disdrodb/cli/disdrodb_run_l1.py +49 -45
  38. disdrodb/cli/disdrodb_run_l1_station.py +40 -37
  39. disdrodb/cli/disdrodb_run_l2e.py +50 -45
  40. disdrodb/cli/disdrodb_run_l2e_station.py +41 -37
  41. disdrodb/cli/disdrodb_run_l2m.py +49 -45
  42. disdrodb/cli/disdrodb_run_l2m_station.py +40 -37
  43. disdrodb/cli/disdrodb_run_station.py +184 -0
  44. disdrodb/cli/disdrodb_upload_archive.py +45 -35
  45. disdrodb/cli/disdrodb_upload_station.py +39 -32
  46. disdrodb/configs.py +13 -8
  47. disdrodb/constants.py +4 -2
  48. disdrodb/data_transfer/__init__.py +1 -3
  49. disdrodb/data_transfer/download_data.py +38 -54
  50. disdrodb/data_transfer/upload_data.py +1 -3
  51. disdrodb/data_transfer/zenodo.py +1 -3
  52. disdrodb/docs.py +1 -3
  53. disdrodb/etc/configs/attributes.yaml +52 -2
  54. disdrodb/etc/configs/encodings.yaml +45 -1
  55. disdrodb/etc/products/L0C/ODM470/global.yaml +5 -0
  56. disdrodb/etc/products/L0C/global.yaml +5 -0
  57. disdrodb/etc/products/L1/ODM470/global.yaml +6 -0
  58. disdrodb/etc/products/L1/global.yaml +1 -14
  59. disdrodb/etc/products/L2E/LPM/1MIN.yaml +1 -0
  60. disdrodb/etc/products/L2E/LPM/global.yaml +36 -0
  61. disdrodb/etc/products/L2E/LPM_V0/1MIN.yaml +1 -0
  62. disdrodb/etc/products/L2E/LPM_V0/global.yaml +36 -0
  63. disdrodb/etc/products/L2E/ODM470/1MIN.yaml +1 -0
  64. disdrodb/etc/products/L2E/ODM470/global.yaml +36 -0
  65. disdrodb/etc/products/L2E/PARSIVEL/1MIN.yaml +1 -0
  66. disdrodb/etc/products/L2E/PARSIVEL/global.yaml +36 -0
  67. disdrodb/etc/products/L2E/PARSIVEL2/1MIN.yaml +1 -0
  68. disdrodb/etc/products/L2E/PARSIVEL2/global.yaml +36 -0
  69. disdrodb/etc/products/L2E/PWS100/1MIN.yaml +1 -0
  70. disdrodb/etc/products/L2E/PWS100/global.yaml +36 -0
  71. disdrodb/etc/products/L2E/RD80/1MIN.yaml +19 -0
  72. disdrodb/etc/products/L2E/SWS250/1MIN.yaml +19 -0
  73. disdrodb/etc/products/L2E/global.yaml +17 -3
  74. disdrodb/etc/products/L2M/global.yaml +1 -1
  75. disdrodb/fall_velocity/__init__.py +46 -0
  76. disdrodb/fall_velocity/graupel.py +483 -0
  77. disdrodb/fall_velocity/hail.py +287 -0
  78. disdrodb/{l1/fall_velocity.py → fall_velocity/rain.py} +265 -50
  79. disdrodb/issue/__init__.py +1 -3
  80. disdrodb/issue/checks.py +3 -5
  81. disdrodb/issue/reader.py +1 -3
  82. disdrodb/issue/writer.py +1 -3
  83. disdrodb/l0/__init__.py +1 -1
  84. disdrodb/l0/check_configs.py +26 -17
  85. disdrodb/l0/check_standards.py +1 -3
  86. disdrodb/l0/configs/LPM/l0a_encodings.yml +0 -1
  87. disdrodb/l0/configs/LPM/l0b_cf_attrs.yml +0 -4
  88. disdrodb/l0/configs/LPM/l0b_encodings.yml +9 -9
  89. disdrodb/l0/configs/LPM/raw_data_format.yml +11 -11
  90. disdrodb/l0/configs/LPM_V0/bins_diameter.yml +103 -0
  91. disdrodb/l0/configs/LPM_V0/bins_velocity.yml +103 -0
  92. disdrodb/l0/configs/LPM_V0/l0a_encodings.yml +45 -0
  93. disdrodb/l0/configs/LPM_V0/l0b_cf_attrs.yml +180 -0
  94. disdrodb/l0/configs/LPM_V0/l0b_encodings.yml +410 -0
  95. disdrodb/l0/configs/LPM_V0/raw_data_format.yml +474 -0
  96. disdrodb/l0/configs/ODM470/bins_diameter.yml +643 -0
  97. disdrodb/l0/configs/ODM470/bins_velocity.yml +0 -0
  98. disdrodb/l0/configs/ODM470/l0a_encodings.yml +11 -0
  99. disdrodb/l0/configs/ODM470/l0b_cf_attrs.yml +46 -0
  100. disdrodb/l0/configs/ODM470/l0b_encodings.yml +106 -0
  101. disdrodb/l0/configs/ODM470/raw_data_format.yml +111 -0
  102. disdrodb/l0/configs/PARSIVEL/l0b_cf_attrs.yml +1 -1
  103. disdrodb/l0/configs/PARSIVEL/raw_data_format.yml +8 -8
  104. disdrodb/l0/configs/PARSIVEL2/raw_data_format.yml +9 -9
  105. disdrodb/l0/l0_reader.py +1 -3
  106. disdrodb/l0/l0a_processing.py +7 -5
  107. disdrodb/l0/l0b_nc_processing.py +2 -4
  108. disdrodb/l0/l0b_processing.py +27 -22
  109. disdrodb/l0/l0c_processing.py +37 -11
  110. disdrodb/l0/manuals/LPM_V0.pdf +0 -0
  111. disdrodb/l0/readers/LPM/ARM/ARM_LPM.py +1 -1
  112. disdrodb/l0/readers/LPM/AUSTRALIA/MELBOURNE_2007_LPM.py +1 -1
  113. disdrodb/l0/readers/LPM/BRAZIL/CHUVA_LPM.py +1 -1
  114. disdrodb/l0/readers/LPM/BRAZIL/GOAMAZON_LPM.py +1 -1
  115. disdrodb/l0/readers/LPM/GERMANY/DWD.py +190 -12
  116. disdrodb/l0/readers/LPM/ITALY/GID_LPM.py +63 -14
  117. disdrodb/l0/readers/LPM/ITALY/GID_LPM_PI.py +279 -0
  118. disdrodb/l0/readers/LPM/ITALY/GID_LPM_T.py +279 -0
  119. disdrodb/l0/readers/LPM/ITALY/GID_LPM_W.py +3 -5
  120. disdrodb/l0/readers/LPM/KIT/CHWALA.py +1 -3
  121. disdrodb/l0/readers/LPM/NETHERLANDS/DELFT_LPM_NC.py +1 -1
  122. disdrodb/l0/readers/LPM/NETHERLANDS/DELFT_RWANDA_LPM_NC.py +103 -0
  123. disdrodb/l0/readers/LPM/NORWAY/HAUKELISETER_LPM.py +214 -0
  124. disdrodb/l0/readers/LPM/NORWAY/NMBU_LPM.py +206 -0
  125. disdrodb/l0/readers/LPM/SLOVENIA/ARSO.py +1 -3
  126. disdrodb/l0/readers/LPM/SLOVENIA/UL.py +1 -3
  127. disdrodb/l0/readers/LPM/SWITZERLAND/INNERERIZ_LPM.py +1 -3
  128. disdrodb/l0/readers/LPM/UK/DIVEN.py +1 -1
  129. disdrodb/l0/readers/LPM/UK/WITHWORTH_LPM.py +217 -0
  130. disdrodb/l0/readers/LPM/USA/CHARLESTON.py +227 -0
  131. disdrodb/l0/readers/{LPM → LPM_V0}/BELGIUM/ULIEGE.py +34 -52
  132. disdrodb/l0/readers/LPM_V0/ITALY/GID_LPM_V0.py +240 -0
  133. disdrodb/l0/readers/ODM470/OCEAN/OCEANRAIN.py +123 -0
  134. disdrodb/l0/readers/PARSIVEL/AUSTRALIA/MELBOURNE_2007_PARSIVEL.py +1 -1
  135. disdrodb/l0/readers/PARSIVEL/BASQUECOUNTRY/EUSKALMET_OTT.py +1 -1
  136. disdrodb/l0/readers/PARSIVEL/CHINA/CHONGQING.py +1 -3
  137. disdrodb/l0/readers/PARSIVEL/EPFL/ARCTIC_2021.py +1 -1
  138. disdrodb/l0/readers/PARSIVEL/EPFL/COMMON_2011.py +1 -1
  139. disdrodb/l0/readers/PARSIVEL/EPFL/DAVOS_2009_2011.py +1 -1
  140. disdrodb/l0/readers/PARSIVEL/EPFL/EPFL_2009.py +1 -1
  141. disdrodb/l0/readers/PARSIVEL/EPFL/EPFL_ROOF_2008.py +1 -1
  142. disdrodb/l0/readers/PARSIVEL/EPFL/EPFL_ROOF_2010.py +1 -1
  143. disdrodb/l0/readers/PARSIVEL/EPFL/EPFL_ROOF_2011.py +1 -1
  144. disdrodb/l0/readers/PARSIVEL/EPFL/EPFL_ROOF_2012.py +1 -1
  145. disdrodb/l0/readers/PARSIVEL/EPFL/GENEPI_2007.py +1 -1
  146. disdrodb/l0/readers/PARSIVEL/EPFL/GRAND_ST_BERNARD_2007.py +1 -1
  147. disdrodb/l0/readers/PARSIVEL/EPFL/GRAND_ST_BERNARD_2007_2.py +1 -1
  148. disdrodb/l0/readers/PARSIVEL/EPFL/HPICONET_2010.py +1 -1
  149. disdrodb/l0/readers/PARSIVEL/EPFL/HYMEX_LTE_SOP2.py +1 -1
  150. disdrodb/l0/readers/PARSIVEL/EPFL/HYMEX_LTE_SOP3.py +1 -1
  151. disdrodb/l0/readers/PARSIVEL/EPFL/HYMEX_LTE_SOP4.py +1 -1
  152. disdrodb/l0/readers/PARSIVEL/EPFL/LOCARNO_2018.py +1 -1
  153. disdrodb/l0/readers/PARSIVEL/EPFL/LOCARNO_2019.py +1 -1
  154. disdrodb/l0/readers/PARSIVEL/EPFL/PARADISO_2014.py +1 -1
  155. disdrodb/l0/readers/PARSIVEL/EPFL/PARSIVEL_2007.py +1 -1
  156. disdrodb/l0/readers/PARSIVEL/EPFL/PLATO_2019.py +1 -1
  157. disdrodb/l0/readers/PARSIVEL/EPFL/RACLETS_2019.py +1 -1
  158. disdrodb/l0/readers/PARSIVEL/EPFL/RACLETS_2019_WJF.py +1 -1
  159. disdrodb/l0/readers/PARSIVEL/EPFL/RIETHOLZBACH_2011.py +1 -1
  160. disdrodb/l0/readers/PARSIVEL/EPFL/SAMOYLOV_2017.py +1 -1
  161. disdrodb/l0/readers/PARSIVEL/EPFL/SAMOYLOV_2019.py +1 -1
  162. disdrodb/l0/readers/PARSIVEL/EPFL/UNIL_2022.py +1 -1
  163. disdrodb/l0/readers/PARSIVEL/JAPAN/JMA.py +1 -1
  164. disdrodb/l0/readers/PARSIVEL/KOREA/ICEPOP_MSC.py +159 -0
  165. disdrodb/l0/readers/PARSIVEL/NASA/LPVEX.py +26 -14
  166. disdrodb/l0/readers/PARSIVEL/NASA/MC3E.py +2 -2
  167. disdrodb/l0/readers/PARSIVEL/NCAR/CCOPE_2015.py +1 -1
  168. disdrodb/l0/readers/PARSIVEL/NCAR/OWLES_MIPS.py +1 -1
  169. disdrodb/l0/readers/PARSIVEL/NCAR/PECAN_MOBILE.py +1 -1
  170. disdrodb/l0/readers/PARSIVEL/NCAR/PLOWS_MIPS.py +1 -1
  171. disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2009.py +1 -1
  172. disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2010.py +1 -3
  173. disdrodb/l0/readers/PARSIVEL/NCAR/VORTEX2_2010_UF.py +1 -3
  174. disdrodb/l0/readers/PARSIVEL/SLOVENIA/UL.py +1 -1
  175. disdrodb/l0/readers/PARSIVEL2/ARM/ARM_PARSIVEL2.py +1 -1
  176. disdrodb/l0/readers/PARSIVEL2/BASQUECOUNTRY/EUSKALMET_OTT2.py +2 -2
  177. disdrodb/l0/readers/PARSIVEL2/BELGIUM/ILVO.py +1 -3
  178. disdrodb/l0/readers/PARSIVEL2/BRAZIL/CHUVA_PARSIVEL2.py +1 -1
  179. disdrodb/l0/readers/PARSIVEL2/BRAZIL/GOAMAZON_PARSIVEL2.py +1 -1
  180. disdrodb/l0/readers/PARSIVEL2/CANADA/UQAM_NC.py +1 -1
  181. disdrodb/l0/readers/PARSIVEL2/DENMARK/DTU.py +1 -1
  182. disdrodb/l0/readers/PARSIVEL2/DENMARK/EROSION_nc.py +1 -1
  183. disdrodb/l0/readers/PARSIVEL2/DENMARK/EROSION_raw.py +1 -1
  184. disdrodb/l0/readers/PARSIVEL2/FINLAND/FMI_PARSIVEL2.py +1 -1
  185. disdrodb/l0/readers/PARSIVEL2/FRANCE/ENPC_PARSIVEL2.py +1 -3
  186. disdrodb/l0/readers/PARSIVEL2/FRANCE/OSUG.py +1 -1
  187. disdrodb/l0/readers/PARSIVEL2/FRANCE/SIRTA_PARSIVEL2.py +1 -3
  188. disdrodb/l0/readers/PARSIVEL2/GREECE/NOA.py +4 -3
  189. disdrodb/l0/readers/PARSIVEL2/ITALY/GID_PARSIVEL2.py +1 -3
  190. disdrodb/l0/readers/PARSIVEL2/ITALY/HYDROX.py +5 -3
  191. disdrodb/l0/readers/PARSIVEL2/JAPAN/PRECIP.py +155 -0
  192. disdrodb/l0/readers/PARSIVEL2/KIT/BURKINA_FASO.py +1 -1
  193. disdrodb/l0/readers/PARSIVEL2/KIT/TEAMX.py +1 -1
  194. disdrodb/l0/readers/PARSIVEL2/KOREA/ICEPOP_MSC.py +161 -0
  195. disdrodb/l0/readers/PARSIVEL2/{NASA/GCPEX.py → KOREA/ICEPOP_UCLM.py} +51 -31
  196. disdrodb/l0/readers/PARSIVEL2/MEXICO/OH_IIUNAM_nc.py +1 -1
  197. disdrodb/l0/readers/PARSIVEL2/MPI/BCO_PARSIVEL2.py +15 -8
  198. disdrodb/l0/readers/PARSIVEL2/MPI/BOWTIE.py +9 -4
  199. disdrodb/l0/readers/PARSIVEL2/NASA/APU.py +31 -6
  200. disdrodb/l0/readers/PARSIVEL2/NASA/NSSTC.py +1 -1
  201. disdrodb/l0/readers/PARSIVEL2/NCAR/FARM_PARSIVEL2.py +1 -1
  202. disdrodb/l0/readers/PARSIVEL2/NCAR/PECAN_FP3.py +1 -1
  203. disdrodb/l0/readers/PARSIVEL2/NCAR/PECAN_MIPS.py +1 -1
  204. disdrodb/l0/readers/PARSIVEL2/NCAR/PERILS_MIPS.py +1 -1
  205. disdrodb/l0/readers/PARSIVEL2/NCAR/PERILS_PIPS.py +1 -1
  206. disdrodb/l0/readers/PARSIVEL2/NCAR/RELAMPAGO_PARSIVEL2.py +2 -2
  207. disdrodb/l0/readers/PARSIVEL2/NCAR/SNOWIE_PJ.py +1 -1
  208. disdrodb/l0/readers/PARSIVEL2/NCAR/SNOWIE_SB.py +1 -1
  209. disdrodb/l0/readers/PARSIVEL2/NCAR/VORTEX_SE_2016_P1.py +1 -3
  210. disdrodb/l0/readers/PARSIVEL2/NCAR/VORTEX_SE_2016_P2.py +1 -1
  211. disdrodb/l0/readers/PARSIVEL2/NCAR/VORTEX_SE_2016_PIPS.py +1 -1
  212. disdrodb/l0/readers/PARSIVEL2/NETHERLANDS/DELFT_NC.py +1 -1
  213. disdrodb/l0/readers/{PARSIVEL/NASA/PIERS.py → PARSIVEL2/NORWAY/UIB.py} +65 -31
  214. disdrodb/l0/readers/PARSIVEL2/PHILIPPINES/PAGASA.py +7 -6
  215. disdrodb/l0/readers/PARSIVEL2/SPAIN/CENER.py +1 -1
  216. disdrodb/l0/readers/PARSIVEL2/SPAIN/CR1000DL.py +1 -1
  217. disdrodb/l0/readers/PARSIVEL2/SPAIN/GRANADA.py +1 -3
  218. disdrodb/l0/readers/PARSIVEL2/SPAIN/LIAISE.py +1 -1
  219. disdrodb/l0/readers/PARSIVEL2/SWEDEN/SMHI.py +1 -1
  220. disdrodb/l0/readers/PARSIVEL2/USA/CSU.py +138 -0
  221. disdrodb/l0/readers/PARSIVEL2/USA/CW3E.py +49 -22
  222. disdrodb/l0/readers/PWS100/AUSTRIA/HOAL.py +1 -3
  223. disdrodb/l0/readers/PWS100/FRANCE/ENPC_PWS100.py +1 -3
  224. disdrodb/l0/readers/PWS100/FRANCE/ENPC_PWS100_SIRTA.py +1 -1
  225. disdrodb/l0/readers/{PARSIVEL/NASA/IFLOODS.py → RD80/BRAZIL/ATTO_RD80.py} +50 -36
  226. disdrodb/l0/readers/RD80/BRAZIL/CHUVA_RD80.py +1 -3
  227. disdrodb/l0/readers/RD80/BRAZIL/GOAMAZON_RD80.py +1 -3
  228. disdrodb/l0/readers/RD80/NCAR/CINDY_2011_RD80.py +1 -3
  229. disdrodb/l0/readers/RD80/NCAR/RELAMPAGO_RD80.py +1 -3
  230. disdrodb/l0/readers/RD80/NOAA/PSL_RD80.py +1 -3
  231. disdrodb/l0/readers/{SW250 → SWS250}/BELGIUM/KMI.py +2 -4
  232. disdrodb/l0/readers/template_reader_raw_netcdf_data.py +1 -3
  233. disdrodb/l0/readers/template_reader_raw_text_data.py +1 -3
  234. disdrodb/l0/standards.py +4 -5
  235. disdrodb/l0/template_tools.py +1 -3
  236. disdrodb/l1/__init__.py +1 -1
  237. disdrodb/l1/classification.py +913 -0
  238. disdrodb/l1/processing.py +36 -106
  239. disdrodb/l1/resampling.py +8 -3
  240. disdrodb/l1_env/__init__.py +1 -1
  241. disdrodb/l1_env/routines.py +6 -6
  242. disdrodb/l2/__init__.py +1 -1
  243. disdrodb/l2/empirical_dsd.py +61 -31
  244. disdrodb/l2/processing.py +327 -62
  245. disdrodb/metadata/checks.py +1 -3
  246. disdrodb/metadata/download.py +4 -4
  247. disdrodb/metadata/geolocation.py +1 -3
  248. disdrodb/metadata/info.py +1 -3
  249. disdrodb/metadata/manipulation.py +1 -3
  250. disdrodb/metadata/reader.py +1 -3
  251. disdrodb/metadata/search.py +1 -3
  252. disdrodb/metadata/standards.py +1 -3
  253. disdrodb/metadata/writer.py +1 -3
  254. disdrodb/physics/__init__.py +17 -0
  255. disdrodb/physics/atmosphere.py +272 -0
  256. disdrodb/physics/water.py +130 -0
  257. disdrodb/physics/wrappers.py +62 -0
  258. disdrodb/psd/__init__.py +1 -1
  259. disdrodb/psd/fitting.py +22 -9
  260. disdrodb/psd/models.py +1 -1
  261. disdrodb/routines/__init__.py +5 -1
  262. disdrodb/routines/l0.py +28 -18
  263. disdrodb/routines/l1.py +8 -6
  264. disdrodb/routines/l2.py +8 -4
  265. disdrodb/routines/options.py +116 -71
  266. disdrodb/routines/options_validation.py +728 -0
  267. disdrodb/routines/wrappers.py +431 -11
  268. disdrodb/scattering/__init__.py +1 -1
  269. disdrodb/scattering/axis_ratio.py +9 -6
  270. disdrodb/scattering/permittivity.py +8 -8
  271. disdrodb/scattering/routines.py +32 -14
  272. disdrodb/summary/__init__.py +1 -1
  273. disdrodb/summary/routines.py +146 -86
  274. disdrodb/utils/__init__.py +1 -1
  275. disdrodb/utils/archiving.py +16 -9
  276. disdrodb/utils/attrs.py +4 -3
  277. disdrodb/utils/cli.py +8 -10
  278. disdrodb/utils/compression.py +13 -13
  279. disdrodb/utils/dask.py +33 -14
  280. disdrodb/utils/dataframe.py +1 -3
  281. disdrodb/utils/decorators.py +1 -3
  282. disdrodb/utils/dict.py +1 -1
  283. disdrodb/utils/directories.py +3 -5
  284. disdrodb/utils/encoding.py +2 -4
  285. disdrodb/utils/event.py +1 -1
  286. disdrodb/utils/list.py +1 -3
  287. disdrodb/utils/logger.py +1 -3
  288. disdrodb/utils/manipulations.py +182 -6
  289. disdrodb/utils/pydantic.py +80 -0
  290. disdrodb/utils/routines.py +1 -3
  291. disdrodb/utils/subsetting.py +1 -1
  292. disdrodb/utils/time.py +3 -2
  293. disdrodb/utils/warnings.py +1 -3
  294. disdrodb/utils/writer.py +1 -3
  295. disdrodb/utils/xarray.py +30 -3
  296. disdrodb/utils/yaml.py +1 -3
  297. disdrodb/viz/__init__.py +1 -1
  298. disdrodb/viz/plots.py +197 -21
  299. {disdrodb-0.2.0.dist-info → disdrodb-0.3.0.dist-info}/METADATA +2 -2
  300. disdrodb-0.3.0.dist-info/RECORD +358 -0
  301. {disdrodb-0.2.0.dist-info → disdrodb-0.3.0.dist-info}/entry_points.txt +3 -0
  302. disdrodb/etc/products/L1/1MIN.yaml +0 -13
  303. disdrodb/etc/products/L1/LPM/1MIN.yaml +0 -13
  304. disdrodb/etc/products/L1/PARSIVEL/1MIN.yaml +0 -13
  305. disdrodb/etc/products/L1/PARSIVEL2/1MIN.yaml +0 -13
  306. disdrodb/etc/products/L1/PWS100/1MIN.yaml +0 -13
  307. disdrodb/etc/products/L1/RD80/1MIN.yaml +0 -13
  308. disdrodb/etc/products/L1/SWS250/1MIN.yaml +0 -13
  309. disdrodb/etc/products/L2M/10MIN.yaml +0 -12
  310. disdrodb/l1/beard_model.py +0 -618
  311. disdrodb/l1/filters.py +0 -203
  312. disdrodb-0.2.0.dist-info/RECORD +0 -312
  313. {disdrodb-0.2.0.dist-info → disdrodb-0.3.0.dist-info}/WHEEL +0 -0
  314. {disdrodb-0.2.0.dist-info → disdrodb-0.3.0.dist-info}/licenses/LICENSE +0 -0
  315. {disdrodb-0.2.0.dist-info → disdrodb-0.3.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,206 @@
1
+ # -----------------------------------------------------------------------------.
2
+ # Copyright (c) 2021-2026 DISDRODB developers
3
+ #
4
+ # This program is free software: you can redistribute it and/or modify
5
+ # it under the terms of the GNU General Public License as published by
6
+ # the Free Software Foundation, either version 3 of the License, or
7
+ # (at your option) any later version.
8
+ #
9
+ # This program is distributed in the hope that it will be useful,
10
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
11
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12
+ # GNU General Public License for more details.
13
+ #
14
+ # You should have received a copy of the GNU General Public License
15
+ # along with this program. If not, see <http://www.gnu.org/licenses/>.
16
+ # -----------------------------------------------------------------------------.
17
+ """DISDRODB reader for NMBU BIOKLIM LPM sensor."""
18
+ import os
19
+
20
+ import pandas as pd
21
+
22
+ from disdrodb.l0.l0_reader import is_documented_by, reader_generic_docstring
23
+ from disdrodb.l0.l0a_processing import read_raw_text_file
24
+
25
+
26
+ @is_documented_by(reader_generic_docstring)
27
+ def reader(
28
+ filepath,
29
+ logger=None,
30
+ ):
31
+ """Reader."""
32
+ ##------------------------------------------------------------------------.
33
+ #### - Define raw data headers
34
+ column_names = ["TO_PARSE"]
35
+
36
+ ##------------------------------------------------------------------------.
37
+ #### Define reader options
38
+ # - For more info: https://pandas.pydata.org/docs/reference/api/pandas.read_csv.html
39
+ reader_kwargs = {}
40
+
41
+ # - Define delimiter
42
+ reader_kwargs["delimiter"] = "\\n"
43
+
44
+ # - Avoid first column to become df index !!!
45
+ reader_kwargs["index_col"] = False
46
+
47
+ # Since column names are expected to be passed explicitly, header is set to None
48
+ reader_kwargs["header"] = None
49
+
50
+ # - Number of rows to be skipped at the beginning of the file
51
+ reader_kwargs["skiprows"] = None
52
+
53
+ # - Define behaviour when encountering bad lines
54
+ reader_kwargs["on_bad_lines"] = "skip"
55
+
56
+ # - Define reader engine
57
+ # - C engine is faster
58
+ # - Python engine is more feature-complete
59
+ reader_kwargs["engine"] = "python"
60
+
61
+ # - Define on-the-fly decompression of on-disk data
62
+ # - Available: gzip, bz2, zip
63
+ reader_kwargs["compression"] = "infer"
64
+
65
+ # - Strings to recognize as NA/NaN and replace with standard NA flags
66
+ # - Already included: '#N/A', '#N/A N/A', '#NA', '-1.#IND', '-1.#QNAN',
67
+ # '-NaN', '-nan', '1.#IND', '1.#QNAN', '<NA>', 'N/A',
68
+ # 'NA', 'NULL', 'NaN', 'n/a', 'nan', 'null'
69
+ reader_kwargs["na_values"] = ["na", "", "error"]
70
+
71
+ ##------------------------------------------------------------------------.
72
+ #### Read the data
73
+ df = read_raw_text_file(
74
+ filepath=filepath,
75
+ column_names=column_names,
76
+ reader_kwargs=reader_kwargs,
77
+ logger=logger,
78
+ )
79
+
80
+ ##------------------------------------------------------------------------.
81
+ #### Adapt the dataframe to adhere to DISDRODB L0 standards
82
+ # Raise error if empty file
83
+ if len(df) == 0:
84
+ raise ValueError(f"{filepath} is empty.")
85
+
86
+ # Select only rows with expected number of delimiters
87
+ df = df[df["TO_PARSE"].str.count(";") == 525]
88
+
89
+ # Raise error if no data left
90
+ if len(df) == 0:
91
+ raise ValueError(f"No valid data in {filepath}.")
92
+
93
+ # Split by ; delimiter (before raw drop number)
94
+ df = df["TO_PARSE"].str.split(";", expand=True, n=80)
95
+
96
+ # Assign column names
97
+ names = [
98
+ "time",
99
+ "start_identifier",
100
+ "device_address",
101
+ "sensor_serial_number",
102
+ "sensor_date",
103
+ "sensor_time",
104
+ "weather_code_synop_4677_5min",
105
+ "weather_code_synop_4680_5min",
106
+ "weather_code_metar_4678_5min",
107
+ "precipitation_rate_5min",
108
+ "weather_code_synop_4677",
109
+ "weather_code_synop_4680",
110
+ "weather_code_metar_4678",
111
+ "precipitation_rate",
112
+ "rainfall_rate",
113
+ "snowfall_rate",
114
+ "precipitation_accumulated",
115
+ "mor_visibility",
116
+ "reflectivity",
117
+ "quality_index",
118
+ "max_hail_diameter",
119
+ "laser_status",
120
+ "static_signal_status",
121
+ "laser_temperature_analog_status",
122
+ "laser_temperature_digital_status",
123
+ "laser_current_analog_status",
124
+ "laser_current_digital_status",
125
+ "sensor_voltage_supply_status",
126
+ "current_heating_pane_transmitter_head_status",
127
+ "current_heating_pane_receiver_head_status",
128
+ "temperature_sensor_status",
129
+ "current_heating_voltage_supply_status",
130
+ "current_heating_house_status",
131
+ "current_heating_heads_status",
132
+ "current_heating_carriers_status",
133
+ "control_output_laser_power_status",
134
+ "reserved_status",
135
+ "temperature_interior",
136
+ "laser_temperature",
137
+ "laser_current_average",
138
+ "control_voltage",
139
+ "optical_control_voltage_output",
140
+ "sensor_voltage_supply",
141
+ "current_heating_pane_transmitter_head",
142
+ "current_heating_pane_receiver_head",
143
+ "temperature_ambient",
144
+ "current_heating_voltage_supply",
145
+ "current_heating_house",
146
+ "current_heating_heads",
147
+ "current_heating_carriers",
148
+ "number_particles",
149
+ "number_particles_internal_data",
150
+ "number_particles_min_speed",
151
+ "number_particles_min_speed_internal_data",
152
+ "number_particles_max_speed",
153
+ "number_particles_max_speed_internal_data",
154
+ "number_particles_min_diameter",
155
+ "number_particles_min_diameter_internal_data",
156
+ "number_particles_no_hydrometeor",
157
+ "number_particles_no_hydrometeor_internal_data",
158
+ "number_particles_unknown_classification",
159
+ "number_particles_unknown_classification_internal_data",
160
+ "number_particles_class_1",
161
+ "number_particles_class_1_internal_data",
162
+ "number_particles_class_2",
163
+ "number_particles_class_2_internal_data",
164
+ "number_particles_class_3",
165
+ "number_particles_class_3_internal_data",
166
+ "number_particles_class_4",
167
+ "number_particles_class_4_internal_data",
168
+ "number_particles_class_5",
169
+ "number_particles_class_5_internal_data",
170
+ "number_particles_class_6",
171
+ "number_particles_class_6_internal_data",
172
+ "number_particles_class_7",
173
+ "number_particles_class_7_internal_data",
174
+ "number_particles_class_8",
175
+ "number_particles_class_8_internal_data",
176
+ "number_particles_class_9",
177
+ "number_particles_class_9_internal_data",
178
+ "raw_drop_number",
179
+ ]
180
+ df.columns = names
181
+
182
+ # Remove checksum from raw_drop_number
183
+ df["raw_drop_number"] = df["raw_drop_number"].str.rsplit(";", n=6, expand=True)[0]
184
+
185
+ # Define datetime "time" column
186
+ # df["time"] = df["sensor_date"] + "-" + df["sensor_time"]
187
+ date_str = os.path.basename(filepath).split(".")[0]
188
+ time_str = date_str + "T" + df["time"]
189
+ df["time"] = pd.to_datetime(time_str, format="%Y-%m-%dT%H:%M:%S", errors="coerce")
190
+
191
+ # Drop row if start_identifier different than 00
192
+ # df = df[df["start_identifier"].astype(str) == "00"]
193
+
194
+ # Drop rows with invalid raw_drop_number
195
+ df = df[df["raw_drop_number"].astype(str).str.len() == 1759]
196
+
197
+ # Drop columns not agreeing with DISDRODB L0 standards
198
+ columns_to_drop = [
199
+ "start_identifier",
200
+ "device_address",
201
+ "sensor_serial_number",
202
+ "sensor_date",
203
+ "sensor_time",
204
+ ]
205
+ df = df.drop(columns=columns_to_drop)
206
+ return df
@@ -1,7 +1,5 @@
1
- #!/usr/bin/env python3
2
-
3
1
  # -----------------------------------------------------------------------------.
4
- # Copyright (c) 2021-2023 DISDRODB developers
2
+ # Copyright (c) 2021-2026 DISDRODB developers
5
3
  #
6
4
  # This program is free software: you can redistribute it and/or modify
7
5
  # it under the terms of the GNU General Public License as published by
@@ -1,7 +1,5 @@
1
- #!/usr/bin/env python3
2
-
3
1
  # -----------------------------------------------------------------------------.
4
- # Copyright (c) 2021-2023 DISDRODB developers
2
+ # Copyright (c) 2021-2026 DISDRODB developers
5
3
  #
6
4
  # This program is free software: you can redistribute it and/or modify
7
5
  # it under the terms of the GNU General Public License as published by
@@ -1,7 +1,5 @@
1
- #!/usr/bin/env python3
2
-
3
1
  # -----------------------------------------------------------------------------.
4
- # Copyright (c) 2021-2023 DISDRODB developers
2
+ # Copyright (c) 2021-2026 DISDRODB developers
5
3
  #
6
4
  # This program is free software: you can redistribute it and/or modify
7
5
  # it under the terms of the GNU General Public License as published by
@@ -1,6 +1,6 @@
1
1
  #!/usr/bin/env python3
2
2
  # -----------------------------------------------------------------------------.
3
- # Copyright (c) 2021-2023 DISDRODB developers
3
+ # Copyright (c) 2021-2026 DISDRODB developers
4
4
  #
5
5
  # This program is free software: you can redistribute it and/or modify
6
6
  # it under the terms of the GNU General Public License as published by
@@ -0,0 +1,217 @@
1
+ # -----------------------------------------------------------------------------.
2
+ # Copyright (c) 2021-2026 DISDRODB developers
3
+ #
4
+ # This program is free software: you can redistribute it and/or modify
5
+ # it under the terms of the GNU General Public License as published by
6
+ # the Free Software Foundation, either version 3 of the License, or
7
+ # (at your option) any later version.
8
+ #
9
+ # This program is distributed in the hope that it will be useful,
10
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
11
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12
+ # GNU General Public License for more details.
13
+ #
14
+ # You should have received a copy of the GNU General Public License
15
+ # along with this program. If not, see <http://www.gnu.org/licenses/>.
16
+ # -----------------------------------------------------------------------------.
17
+ """DISDRODB reader for the MANCHESTER Withworth Meteorological Observatory LPM sensor."""
18
+ import pandas as pd
19
+
20
+ from disdrodb.l0.l0_reader import is_documented_by, reader_generic_docstring
21
+ from disdrodb.l0.l0a_processing import read_raw_text_file
22
+
23
+
24
+ @is_documented_by(reader_generic_docstring)
25
+ def reader(
26
+ filepath,
27
+ logger=None,
28
+ ):
29
+ """Reader."""
30
+ ##------------------------------------------------------------------------.
31
+ #### - Define raw data headers
32
+ column_names = ["TO_PARSE"]
33
+
34
+ ##------------------------------------------------------------------------.
35
+ #### Define reader options
36
+ # - For more info: https://pandas.pydata.org/docs/reference/api/pandas.read_csv.html
37
+ reader_kwargs = {}
38
+
39
+ # - Define delimiter
40
+ reader_kwargs["delimiter"] = "\\n"
41
+
42
+ # - Avoid first column to become df index !!!
43
+ reader_kwargs["index_col"] = False
44
+
45
+ # - Define encoding
46
+ reader_kwargs["encoding"] = "latin"
47
+
48
+ # Since column names are expected to be passed explicitly, header is set to None
49
+ reader_kwargs["header"] = None
50
+
51
+ # - Number of rows to be skipped at the beginning of the file
52
+ reader_kwargs["skiprows"] = None
53
+
54
+ # - Define behaviour when encountering bad lines
55
+ reader_kwargs["on_bad_lines"] = "skip"
56
+
57
+ # - Define reader engine
58
+ # - C engine is faster
59
+ # - Python engine is more feature-complete
60
+ reader_kwargs["engine"] = "python"
61
+
62
+ # - Define on-the-fly decompression of on-disk data
63
+ # - Available: gzip, bz2, zip
64
+ reader_kwargs["compression"] = "infer"
65
+
66
+ # - Strings to recognize as NA/NaN and replace with standard NA flags
67
+ # - Already included: '#N/A', '#N/A N/A', '#NA', '-1.#IND', '-1.#QNAN',
68
+ # '-NaN', '-nan', '1.#IND', '1.#QNAN', '<NA>', 'N/A',
69
+ # 'NA', 'NULL', 'NaN', 'n/a', 'nan', 'null'
70
+ reader_kwargs["na_values"] = ["na", "", "error"]
71
+
72
+ ##------------------------------------------------------------------------.
73
+ #### Read the data
74
+ df = read_raw_text_file(
75
+ filepath=filepath,
76
+ column_names=column_names,
77
+ reader_kwargs=reader_kwargs,
78
+ logger=logger,
79
+ )
80
+
81
+ ##------------------------------------------------------------------------.
82
+ #### Adapt the dataframe to adhere to DISDRODB L0 standards
83
+ # Raise error if empty file
84
+ if len(df) == 0:
85
+ raise ValueError(f"{filepath} is empty.")
86
+
87
+ # Select only rows with expected number of delimiters
88
+ df = df[df["TO_PARSE"].str.count(";").isin([45, 522])]
89
+
90
+ # Raise error if no data left
91
+ if len(df) == 0:
92
+ raise ValueError(f"No valid data in {filepath}.")
93
+
94
+ # Split by ; delimiter (before raw drop number)
95
+ # - Add a dummy row with 82 delimiters so that str.split expand also if only 45 delimiters are present
96
+ dummy_row = ";".join(["DUMMY"] * 82)
97
+ df = pd.concat([df, pd.DataFrame({"TO_PARSE": [dummy_row]})], ignore_index=True)
98
+ # - Split columns
99
+ df = df["TO_PARSE"].str.split(";", expand=True, n=81)
100
+ # - Drop the dummy row (last one)
101
+ df = df.iloc[:-1, :]
102
+ # - Fill empty columns
103
+ df.loc[:, 46:50] = df.loc[:, 46:50].fillna("NaN")
104
+ df.loc[:, 51:] = df.loc[:, 51:].fillna("0")
105
+
106
+ # Assign column names
107
+ names = [
108
+ "date",
109
+ "time",
110
+ "start_identifier",
111
+ "device_address",
112
+ "sensor_serial_number",
113
+ "sensor_date",
114
+ "sensor_time",
115
+ "weather_code_synop_4677_5min",
116
+ "weather_code_synop_4680_5min",
117
+ "weather_code_metar_4678_5min",
118
+ "precipitation_rate_5min",
119
+ "weather_code_synop_4677",
120
+ "weather_code_synop_4680",
121
+ "weather_code_metar_4678",
122
+ "precipitation_rate",
123
+ "rainfall_rate",
124
+ "snowfall_rate",
125
+ "precipitation_accumulated",
126
+ "mor_visibility",
127
+ "reflectivity",
128
+ "quality_index",
129
+ "max_hail_diameter",
130
+ "laser_status",
131
+ "static_signal_status",
132
+ "laser_temperature_analog_status",
133
+ "laser_temperature_digital_status",
134
+ "laser_current_analog_status",
135
+ "laser_current_digital_status",
136
+ "sensor_voltage_supply_status",
137
+ "current_heating_pane_transmitter_head_status",
138
+ "current_heating_pane_receiver_head_status",
139
+ "temperature_sensor_status",
140
+ "current_heating_voltage_supply_status",
141
+ "current_heating_house_status",
142
+ "current_heating_heads_status",
143
+ "current_heating_carriers_status",
144
+ "control_output_laser_power_status",
145
+ "reserved_status",
146
+ "temperature_interior",
147
+ "laser_temperature",
148
+ "laser_current_average",
149
+ "control_voltage",
150
+ "optical_control_voltage_output",
151
+ "sensor_voltage_supply",
152
+ "current_heating_pane_transmitter_head",
153
+ "current_heating_pane_receiver_head",
154
+ "temperature_ambient",
155
+ "current_heating_voltage_supply",
156
+ "current_heating_house",
157
+ "current_heating_heads",
158
+ "current_heating_carriers",
159
+ "number_particles",
160
+ "number_particles_internal_data",
161
+ "number_particles_min_speed",
162
+ "number_particles_min_speed_internal_data",
163
+ "number_particles_max_speed",
164
+ "number_particles_max_speed_internal_data",
165
+ "number_particles_min_diameter",
166
+ "number_particles_min_diameter_internal_data",
167
+ "number_particles_no_hydrometeor",
168
+ "number_particles_no_hydrometeor_internal_data",
169
+ "number_particles_unknown_classification",
170
+ "number_particles_unknown_classification_internal_data",
171
+ "number_particles_class_1",
172
+ "number_particles_class_1_internal_data",
173
+ "number_particles_class_2",
174
+ "number_particles_class_2_internal_data",
175
+ "number_particles_class_3",
176
+ "number_particles_class_3_internal_data",
177
+ "number_particles_class_4",
178
+ "number_particles_class_4_internal_data",
179
+ "number_particles_class_5",
180
+ "number_particles_class_5_internal_data",
181
+ "number_particles_class_6",
182
+ "number_particles_class_6_internal_data",
183
+ "number_particles_class_7",
184
+ "number_particles_class_7_internal_data",
185
+ "number_particles_class_8",
186
+ "number_particles_class_8_internal_data",
187
+ "number_particles_class_9",
188
+ "number_particles_class_9_internal_data",
189
+ "raw_drop_number",
190
+ ]
191
+ df.columns = names
192
+
193
+ # Define datetime "time" column
194
+ time_str = df["date"] + " " + df["time"]
195
+ df["time"] = pd.to_datetime(time_str, format="%d/%m/%Y %H:%M:%S", errors="coerce")
196
+
197
+ # Remove checksum from raw_drop_number
198
+ df["raw_drop_number"] = df["raw_drop_number"].str.rsplit(";", n=2, expand=True)[0]
199
+
200
+ # Drop rows with invalid raw_drop_number
201
+ df = df[df["raw_drop_number"].astype(str).str.len().isin([1, 1759])]
202
+
203
+ # Drop row if start_identifier different than 00
204
+ # df["start_identifier"] = df["start_identifier"].astype(str).str[-2:]
205
+ # df = df[df["start_identifier"] == "00"]
206
+
207
+ # Drop columns not agreeing with DISDRODB L0 standards
208
+ columns_to_drop = [
209
+ "start_identifier",
210
+ "device_address",
211
+ "sensor_serial_number",
212
+ "sensor_date",
213
+ "sensor_time",
214
+ "date",
215
+ ]
216
+ df = df.drop(columns=columns_to_drop)
217
+ return df
@@ -0,0 +1,227 @@
1
+ # -----------------------------------------------------------------------------.
2
+ # Copyright (c) 2021-2026 DISDRODB developers
3
+ #
4
+ # This program is free software: you can redistribute it and/or modify
5
+ # it under the terms of the GNU General Public License as published by
6
+ # the Free Software Foundation, either version 3 of the License, or
7
+ # (at your option) any later version.
8
+ #
9
+ # This program is distributed in the hope that it will be useful,
10
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
11
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12
+ # GNU General Public License for more details.
13
+ #
14
+ # You should have received a copy of the GNU General Public License
15
+ # along with this program. If not, see <http://www.gnu.org/licenses/>.
16
+ # -----------------------------------------------------------------------------.
17
+ """DISDRODB reader for CHARLESTON experiment LPM sensors."""
18
+ import os
19
+
20
+ import numpy as np
21
+ import pandas as pd
22
+
23
+ from disdrodb.l0.l0_reader import is_documented_by, reader_generic_docstring
24
+ from disdrodb.l0.l0a_processing import read_raw_text_file
25
+
26
+
27
@is_documented_by(reader_generic_docstring)
def reader(
    filepath,
    logger=None,
):
    """Read a CHARLESTON LPM raw text file into a DISDRODB L0 dataframe.

    Each line of the file is read as a single string, split on ``;`` into
    the telegram fields, filtered for well-formed records, and given a
    ``time`` column derived from the file name and the sensor clock.

    Parameters
    ----------
    filepath : str
        Path of the raw file. The file name (without extension) must consist
        of four ``_``-separated parts: a prefix, an offset in seconds, the
        day of year and a two-digit year.
    logger : optional
        Logger forwarded to ``read_raw_text_file``.

    Returns
    -------
    pandas.DataFrame
        Parsed records, without the identifier and sensor date/time columns.

    Raises
    ------
    ValueError
        If the file is empty, contains no line with the expected number of
        delimiters, or contains no valid spectrum.
    """
    ##------------------------------------------------------------------------.
    #### - Define raw data headers
    # - Every line is loaded as one string and parsed further below
    column_names = ["TO_PARSE"]

    ##------------------------------------------------------------------------.
    #### Define reader options
    # - For more info: https://pandas.pydata.org/docs/reference/api/pandas.read_csv.html
    reader_kwargs = {
        # Split on newlines only, so that each record ends up in one cell
        "delimiter": "\\n",
        # Avoid first column to become df index
        "index_col": False,
        "encoding": "ISO-8859-1",
        # Column names are passed explicitly
        "header": None,
        # No rows are skipped at the beginning of the file
        "skiprows": None,
        "on_bad_lines": "skip",
        # The python engine is slower than the C one but more feature-complete
        "engine": "python",
        # On-the-fly decompression of on-disk data (gzip, bz2, zip)
        "compression": "infer",
        # Extra strings to treat as NA on top of the pandas defaults
        "na_values": ["na", "", "error"],
    }

    ##------------------------------------------------------------------------.
    #### Read the data
    df = read_raw_text_file(
        filepath=filepath,
        column_names=column_names,
        reader_kwargs=reader_kwargs,
        logger=logger,
    )

    ##------------------------------------------------------------------------.
    #### Adapt the dataframe to adhere to DISDRODB L0 standards
    # Raise error if empty file
    if df.shape[0] == 0:
        raise ValueError(f"{filepath} is empty.")

    # Select only rows with expected number of delimiters
    # - 79 field separators + 439 inside the spectrum + 2 trailing ones
    has_expected_delimiters = df["TO_PARSE"].str.count(";") == 520
    df = df[has_expected_delimiters]

    # Raise error if no data left
    if df.shape[0] == 0:
        raise ValueError(f"No valid data in {filepath}.")

    # Split by ; delimiter (before raw drop number)
    # - n=79 keeps the whole spectrum (and what follows it) in the last column
    df = df["TO_PARSE"].str.split(";", expand=True, n=79)

    # Assign column names
    leading_labels = [
        "start_identifier",
        "device_address",
        "sensor_serial_number",
        "sensor_date",
        "sensor_time",
        "weather_code_synop_4677_5min",
        "weather_code_synop_4680_5min",
        "weather_code_metar_4678_5min",
        "precipitation_rate_5min",
        "weather_code_synop_4677",
        "weather_code_synop_4680",
        "weather_code_metar_4678",
        "precipitation_rate",
        "rainfall_rate",
        "snowfall_rate",
        "precipitation_accumulated",
        "mor_visibility",
        "reflectivity",
        "quality_index",
        "max_hail_diameter",
        "laser_status",
        "static_signal_status",
        "laser_temperature_analog_status",
        "laser_temperature_digital_status",
        "laser_current_analog_status",
        "laser_current_digital_status",
        "sensor_voltage_supply_status",
        "current_heating_pane_transmitter_head_status",
        "current_heating_pane_receiver_head_status",
        "temperature_sensor_status",
        "current_heating_voltage_supply_status",
        "current_heating_house_status",
        "current_heating_heads_status",
        "current_heating_carriers_status",
        "control_output_laser_power_status",
        "reserved_status",
        "temperature_interior",
        "laser_temperature",
        "laser_current_average",
        "control_voltage",
        "optical_control_voltage_output",
        "sensor_voltage_supply",
        "current_heating_pane_transmitter_head",
        "current_heating_pane_receiver_head",
        "temperature_ambient",
        "current_heating_voltage_supply",
        "current_heating_house",
        "current_heating_heads",
        "current_heating_carriers",
    ]
    # - Each particle counter is followed by its "_internal_data" companion
    particle_groups = [
        "",
        "_min_speed",
        "_max_speed",
        "_min_diameter",
        "_no_hydrometeor",
        "_unknown_classification",
    ]
    particle_groups += [f"_class_{class_id}" for class_id in range(1, 10)]
    particle_labels = [
        f"number_particles{group}{suffix}" for group in particle_groups for suffix in ("", "_internal_data")
    ]
    df.columns = [*leading_labels, *particle_labels, "raw_drop_number"]

    # Remove checksum from raw_drop_number
    # - Everything after the second-to-last ";" is discarded
    spectrum_parts = df["raw_drop_number"].str.rsplit(";", n=2, expand=True)
    df["raw_drop_number"] = spectrum_parts[0]

    # Remove corrupted characters
    df = df.replace("°", "", regex=True)  # station N

    # Keep only rows where sensor_time matches HH:MM:SS format
    time_pattern = r"^\d{2}:\d{2}:\d{2}$"
    has_valid_time = df["sensor_time"].astype(str).str.match(time_pattern)
    df = df[has_valid_time]

    # Keep only rows with valid spectrum
    spectrum_pattern = r"^(?:\d{3};)*\d{3};?$"
    has_valid_spectrum = df["raw_drop_number"].astype(str).str.match(spectrum_pattern)
    df = df[has_valid_spectrum]
    if df.shape[0] == 0:
        raise ValueError("Spectra is corrupted")

    # Define datetime "time" column
    # - Define start time from the file name: <prefix>_<seconds>_<day of year>_<yy>
    file_stem = os.path.basename(filepath).split(".")[0]
    _, delta_dt, doy, year = file_stem.split("_")
    day_start = pd.to_datetime(f"{year}_{doy}", format="%y_%j")
    start_time = day_start + pd.to_timedelta(int(delta_dt), unit="s")
    # - Define timedelta based on sensor_time
    elapsed = pd.to_timedelta(df["sensor_time"]).to_numpy().astype("m8[s]")
    # --> Add +24h to subsequent times when time resets
    #     (number of backward jumps seen so far = number of days to add)
    clock_went_back = np.diff(elapsed) < np.timedelta64(0, "s")
    days_to_add = np.concatenate(([0], np.cumsum(clock_went_back)))
    elapsed = elapsed + days_to_add * np.timedelta64(24, "h")
    # - Express the timedeltas relative to the first retained record
    elapsed = elapsed - elapsed[0]
    # - Define measurement datetime
    df["time"] = start_time + elapsed

    # Drop rows with invalid raw_drop_number
    # - 440 three-digit counts joined by ";" give 1759 characters
    has_full_spectrum = df["raw_drop_number"].astype(str).str.len() == 1759
    df = df[has_full_spectrum]

    # Drop columns not agreeing with DISDRODB L0 standards
    unwanted_columns = [
        "start_identifier",
        "device_address",
        "sensor_serial_number",
        "sensor_date",
        "sensor_time",
    ]
    return df.drop(columns=unwanted_columns)