PyPI - cloudnetpy-qc - Versions diffs - 1.24.3__tar.gz → 1.25.0__tar.gz - Mend

cloudnetpy-qc 1.24.3 (tar.gz) → 1.25.0 (tar.gz)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24)

{cloudnetpy_qc-1.24.3/cloudnetpy_qc.egg-info → cloudnetpy_qc-1.25.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: cloudnetpy_qc
-Version: 1.24.3
+Version: 1.25.0
 Summary: Quality control routines for CloudnetPy products
 Author-email: Finnish Meteorological Institute <actris-cloudnet@fmi.fi>
 License: MIT License
@@ -80,6 +80,7 @@ print(json_object)
 - `timestamp`: UTC timestamp of the test
 - `qcVersion`: `cloudnetpy-qc` version
 - `tests`: `Test[]`
+- `data_coverage`: float
 ### `Test`

{cloudnetpy_qc-1.24.3 → cloudnetpy_qc-1.25.0}/README.md RENAMED Viewed

@@ -27,6 +27,7 @@ print(json_object)
 - `timestamp`: UTC timestamp of the test
 - `qcVersion`: `cloudnetpy-qc` version
 - `tests`: `Test[]`
+- `data_coverage`: float
 ### `Test`

cloudnetpy_qc-1.25.0/cloudnetpy_qc/coverage.py ADDED Viewed

@@ -0,0 +1,66 @@
+import datetime
+import netCDF4
+import numpy as np
+from cloudnetpy_qc.variables import Product
+RESOLUTIONS = {
+    Product.DISDROMETER: datetime.timedelta(minutes=1),
+    Product.L3_CF: datetime.timedelta(hours=1),
+    Product.L3_IWC: datetime.timedelta(hours=1),
+    Product.L3_LWC: datetime.timedelta(hours=1),
+    Product.MWR: datetime.timedelta(minutes=5),
+    Product.MWR_MULTI: datetime.timedelta(minutes=30),
+    Product.MWR_SINGLE: datetime.timedelta(minutes=5),
+    Product.WEATHER_STATION: datetime.timedelta(minutes=10),
+    Product.RAIN_GAUGE: datetime.timedelta(minutes=1),
+    Product.DOPPLER_LIDAR_WIND: datetime.timedelta(hours=1.5),
+}
+DEFAULT_RESOLUTION = datetime.timedelta(seconds=30)
+def data_coverage(
+    nc: netCDF4.Dataset,
+) -> tuple[float, datetime.timedelta, datetime.timedelta] | None:
+    time = np.array(nc["time"][:])
+    time_unit = datetime.timedelta(hours=1)
+    try:
+        n_time = len(time)
+    except (TypeError, ValueError):
+        return None
+    if n_time < 2:
+        return None
+    if nc.cloudnet_file_type == "model":
+        expected_res = _model_resolution(nc)
+    else:
+        product = Product(nc.cloudnet_file_type)
+        expected_res = RESOLUTIONS.get(product, DEFAULT_RESOLUTION)
+    duration = get_duration(nc)
+    bins = max(1, duration // expected_res)
+    hist, _ = np.histogram(time, bins=bins, range=(0, duration / time_unit))
+    coverage = np.count_nonzero(hist > 0) / len(hist)
+    actual_res = np.median(np.diff(time)) * time_unit
+    return coverage, expected_res, actual_res
+def _model_resolution(nc: netCDF4.Dataset) -> datetime.timedelta:
+    source = nc.source.lower()
+    if "gdas" in source or "ecmwf open" in source:
+        return datetime.timedelta(hours=3)
+    return datetime.timedelta(hours=1)
+def get_duration(nc: netCDF4.Dataset) -> datetime.timedelta:
+    now = datetime.datetime.now(tz=datetime.timezone.utc)
+    if now.date() == _get_date(nc):
+        midnight = now.replace(hour=0, minute=0, second=0, microsecond=0)
+        duration = now - midnight
+    else:
+        duration = datetime.timedelta(days=1)
+    return duration
+def _get_date(nc: netCDF4.Dataset) -> datetime.date:
+    date_in_file = [int(getattr(nc, x)) for x in ("year", "month", "day")]
+    return datetime.date(*date_in_file)

{cloudnetpy_qc-1.24.3 → cloudnetpy_qc-1.25.0}/cloudnetpy_qc/quality.py RENAMED Viewed

@@ -17,6 +17,8 @@ import scipy.stats
 from numpy import ma
 from requests import RequestException
+from cloudnetpy_qc.coverage import data_coverage, get_duration
 from . import utils
 from .variables import LEVELS, VARIABLES, Product
 from .version import __version__
@@ -53,6 +55,7 @@ class FileReport(NamedTuple):
     timestamp: datetime.datetime
     qc_version: str
     tests: list[TestReport]
+    data_coverage: float | None
     def to_dict(self) -> dict:
         return {
@@ -84,6 +87,7 @@ def run_tests(
     ignore_tests: list[str] | None = None,
 ) -> FileReport:
     filename = Path(filename)
+    coverage = None
     if isinstance(product, str):
         product = Product(product)
     with netCDF4.Dataset(filename) as nc:
@@ -111,10 +115,13 @@ def run_tests(
                     f"Failed to run test: {err} ({type(err).__name__})"
                 )
             test_reports.append(test_instance.report)
+            if test_instance.coverage is not None:
+                coverage = test_instance.coverage
     return FileReport(
         timestamp=datetime.datetime.now(tz=datetime.timezone.utc),
         qc_version=__version__,
         tests=test_reports,
+        data_coverage=coverage,
     )
@@ -124,6 +131,7 @@ class Test:
     name: str
     description: str
     products: Iterable[Product] = Product.all()
+    coverage: float | None = None
     def __init__(
         self, nc: netCDF4.Dataset, filename: Path, product: Product, site_meta: SiteMeta
@@ -190,19 +198,6 @@ class Test:
                     )
                     self._add_warning(msg)
-    def _get_date(self):
-        date_in_file = [int(getattr(self.nc, x)) for x in ("year", "month", "day")]
-        return datetime.date(*date_in_file)
-    def _get_duration(self) -> datetime.timedelta:
-        now = datetime.datetime.now(tz=datetime.timezone.utc)
-        if now.date() == self._get_date():
-            midnight = now.replace(hour=0, minute=0, second=0, microsecond=0)
-            duration = now - midnight
-        else:
-            duration = datetime.timedelta(days=1)
-        return duration
 # --------------------#
 # ------ Infos ------ #
@@ -287,45 +282,12 @@ class TestDataCoverage(Test):
     name = "Data coverage"
     description = "Test that file contains enough data."
-    RESOLUTIONS = {
-        Product.DISDROMETER: datetime.timedelta(minutes=1),
-        Product.L3_CF: datetime.timedelta(hours=1),
-        Product.L3_IWC: datetime.timedelta(hours=1),
-        Product.L3_LWC: datetime.timedelta(hours=1),
-        Product.MWR: datetime.timedelta(minutes=5),
-        Product.MWR_MULTI: datetime.timedelta(minutes=30),
-        Product.MWR_SINGLE: datetime.timedelta(minutes=5),
-        Product.WEATHER_STATION: datetime.timedelta(minutes=10),
-        Product.RAIN_GAUGE: datetime.timedelta(minutes=1),
-        Product.DOPPLER_LIDAR_WIND: datetime.timedelta(hours=1.5),
-    }
-    DEFAULT_RESOLUTION = datetime.timedelta(seconds=30)
-    def _model_resolution(self):
-        source = self.nc.source.lower()
-        if "gdas" in source or "ecmwf open" in source:
-            return datetime.timedelta(hours=3)
-        return datetime.timedelta(hours=1)
     def run(self):
-        time = np.array(self.nc["time"][:])
-        time_unit = datetime.timedelta(hours=1)
-        try:
-            n_time = len(time)
-        except (TypeError, ValueError):
+        coverage, expected_res, actual_res = data_coverage(self.nc)
+        if coverage is None:
             return
-        if n_time < 2:
-            return
-        if self.nc.cloudnet_file_type == "model":
-            expected_res = self._model_resolution()
-        else:
-            expected_res = self.RESOLUTIONS.get(self.product, self.DEFAULT_RESOLUTION)
-        duration = self._get_duration()
-        bins = max(1, duration // expected_res)
-        hist, _bin_edges = np.histogram(
-            time, bins=bins, range=(0, duration / time_unit)
-        )
-        missing = np.count_nonzero(hist == 0) / len(hist) * 100
+        self.coverage = coverage
+        missing = (1 - coverage) * 100
         if missing > 20:
             message = f"{round(missing)}% of day's data is missing."
             if missing > 60:
@@ -333,7 +295,6 @@ class TestDataCoverage(Test):
             else:
                 self._add_info(message)
-        actual_res = np.median(np.diff(time)) * time_unit
         if actual_res > expected_res * 1.05:
             self._add_warning(
                 f"Expected a measurement with interval at least {expected_res},"
@@ -789,7 +750,7 @@ class TestModelData(Test):
         if n_time < 2:
             return
-        duration = self._get_duration()
+        duration = get_duration(self.nc)
         should_be_data_until = duration / time_unit
         for key in ("temperature", "pressure", "q"):

{cloudnetpy_qc-1.24.3 → cloudnetpy_qc-1.25.0}/cloudnetpy_qc/version.py RENAMED Viewed

@@ -1,6 +1,6 @@
 """Cloudnetpy-QC version."""
 MAJOR = 1
-MINOR = 24
-PATCH = 3
+MINOR = 25
+PATCH = 0
 __version__ = f"{MAJOR}.{MINOR}.{PATCH}"

{cloudnetpy_qc-1.24.3 → cloudnetpy_qc-1.25.0/cloudnetpy_qc.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: cloudnetpy_qc
-Version: 1.24.3
+Version: 1.25.0
 Summary: Quality control routines for CloudnetPy products
 Author-email: Finnish Meteorological Institute <actris-cloudnet@fmi.fi>
 License: MIT License
@@ -80,6 +80,7 @@ print(json_object)
 - `timestamp`: UTC timestamp of the test
 - `qcVersion`: `cloudnetpy-qc` version
 - `tests`: `Test[]`
+- `data_coverage`: float
 ### `Test`

{cloudnetpy_qc-1.24.3 → cloudnetpy_qc-1.25.0}/cloudnetpy_qc.egg-info/SOURCES.txt RENAMED Viewed

@@ -3,6 +3,7 @@ MANIFEST.in
 README.md
 pyproject.toml
 cloudnetpy_qc/__init__.py
+cloudnetpy_qc/coverage.py
 cloudnetpy_qc/py.typed
 cloudnetpy_qc/quality.py
 cloudnetpy_qc/utils.py