doppy-0.5.9-cp310-abi3-macosx_10_12_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,308 @@
+ from __future__ import annotations
+
+ from dataclasses import dataclass
+ from io import BufferedIOBase
+ from pathlib import Path
+ from typing import Sequence
+
+ import numpy as np
+ import numpy.typing as npt
+
+ import doppy
+ from doppy import options
+ from doppy.product.stare import PulsesPerRay, RayAccumulationTime, Stare
+
+
+ @dataclass
+ class StareDepol:
+     """
+     Stare product with depolarisation ratio derived from co-polarised and
+     cross-polarised stare data.
+
+     Attributes:
+     -----------
+     time
+         An array of datetime64 objects representing the observation times.
+     radial_distance
+         An array of radial distances from the observation point, in meters.
+     elevation
+         An array of elevation angles corresponding to the observation points, in
+         degrees.
+     beta
+         An array of backscatter coefficients for the co-polarised signal, in
+         sr-1 m-1.
+     beta_cross
+         An array of backscatter coefficients for the cross-polarised signal, in
+         sr-1 m-1.
+     radial_velocity
+         An array of radial velocities of the co-polarised signal, in m s-1.
+     mask_beta
+         A boolean array indicating signal (True) or noise (False) data points.
+     mask_radial_velocity
+         A boolean array indicating signal (True) or noise (False) data points.
+     depolarisation
+         An array of depolarisation ratios calculated as the ratio of
+         cross-polarised to co-polarised backscatter coefficients.
+     wavelength
+         The wavelength of the lidar, in meters.
+     system_id
+         A string identifier for the lidar.
+
+
+     Raises
+     ------
+     ValueError
+         If the input `co` and `cross` products have mismatched wavelengths,
+         system IDs, radial distances, or elevation angles, this exception is
+         raised.
+
+
+     References
+     ----------
+     Aerosol particle depolarization ratio at 1565 nm measured with a Halo Doppler lidar
+     authors: Ville Vakkari, Holger Baars, Stephanie Bohlmann, Johannes Bühl,
+     Mika Komppula, Rodanthi-Elisavet Mamouri, and Ewan James O'Connor
+     doi: https://doi.org/10.5194/acp-21-5807-2021
+     """
+
+     time: npt.NDArray[np.datetime64]
+     radial_distance: npt.NDArray[np.float64]
+     elevation: npt.NDArray[np.float64]
+     beta: npt.NDArray[np.float64]
+     beta_cross: npt.NDArray[np.float64]
+     radial_velocity: npt.NDArray[np.float64]
+     mask_beta: npt.NDArray[np.bool_]
+     mask_radial_velocity: npt.NDArray[np.bool_]
+     depolarisation: npt.NDArray[np.float64]
+     polariser_bleed_through: float
+     wavelength: float
+     system_id: str
+     ray_info: RayAccumulationTime | PulsesPerRay
+
+     def __init__(
+         self,
+         co: Stare,
+         cross: Stare,
+         polariser_bleed_through: float = 0.0,
+     ):
+         """
+         Parameters
+         ----------
+         co: Stare
+             The co-polarised data.
+         cross: Stare
+             The cross-polarised data. The `cross.time` array is expected to be sorted.
+         polariser_bleed_through: float, default=0.0
+             The amount of bleed-through from the polariser.
+         """
+
+         if co.beta.shape[1] != cross.beta.shape[1]:
+             raise doppy.exceptions.ShapeError(
+                 "Range dimension mismatch in co and cross: "
+                 f"{co.beta.shape[1]} vs {cross.beta.shape[1]}"
+             )
+
+         if not np.isclose(co.wavelength, cross.wavelength):
+             raise ValueError(
+                 "Different wavelength in co and cross: "
+                 f"{co.wavelength} vs {cross.wavelength}"
+             )
+         if co.system_id != cross.system_id:
+             raise ValueError(
+                 "Different system ID in co and cross: "
+                 f"{co.system_id} vs {cross.system_id}"
+             )
+         if not np.allclose(co.radial_distance, cross.radial_distance, atol=1):
+             raise ValueError("Different radial distance in co and cross")
+
+         ind = np.searchsorted(cross.time, co.time, side="left")
+         pick_ind = ind < len(cross.time)
+         time_diff_threshold = 2 * np.median(np.diff(co.time))
+         co_cross_timediff_below_threshold = (
+             cross.time[ind[pick_ind]] - co.time[pick_ind] < time_diff_threshold
+         )
+         pick_ind[pick_ind] &= co_cross_timediff_below_threshold
+
+         if not np.allclose(
+             co.elevation[pick_ind], cross.elevation[ind[pick_ind]], atol=1
+         ):
+             raise ValueError("Different elevation in co and cross")
+
+         depolarisation = np.full_like(co.beta, np.nan)
+         co_beta = co.beta[pick_ind]
+         depolarisation[pick_ind] = (
+             cross.beta[ind[pick_ind]] - polariser_bleed_through * co_beta
+         ) / co_beta
+         cross_beta = np.full_like(co.beta, np.nan)
+         cross_beta[pick_ind] = cross.beta[ind[pick_ind]]
+
+         self.time = co.time
+         self.radial_distance = co.radial_distance
+         self.elevation = co.elevation
+         self.beta = co.beta
+         self.beta_cross = cross_beta
+         self.radial_velocity = co.radial_velocity
+         self.mask_beta = co.mask_beta
+         self.mask_radial_velocity = co.mask_radial_velocity
+         self.depolarisation = depolarisation
+         self.polariser_bleed_through = polariser_bleed_through
+         self.wavelength = co.wavelength
+         self.system_id = co.system_id
+         self.ray_info = co.ray_info
+
+     @property
+     def mask_depolarisation(self) -> npt.NDArray[np.bool_]:
+         return np.isnan(self.depolarisation)
+
+     @property
+     def mask_beta_cross(self) -> npt.NDArray[np.bool_]:
+         return np.isnan(self.beta_cross)
+
+     @classmethod
+     def from_halo_data(
+         cls,
+         co_data: Sequence[str]
+         | Sequence[Path]
+         | Sequence[bytes]
+         | Sequence[BufferedIOBase],
+         co_data_bg: Sequence[str]
+         | Sequence[Path]
+         | Sequence[tuple[bytes, str]]
+         | Sequence[tuple[BufferedIOBase, str]],
+         cross_data: Sequence[str]
+         | Sequence[Path]
+         | Sequence[bytes]
+         | Sequence[BufferedIOBase],
+         cross_data_bg: Sequence[str]
+         | Sequence[Path]
+         | Sequence[tuple[bytes, str]]
+         | Sequence[tuple[BufferedIOBase, str]],
+         bg_correction_method: options.BgCorrectionMethod,
+         polariser_bleed_through: float = 0,
+     ) -> StareDepol:
+         co = Stare.from_halo_data(
+             data=co_data, data_bg=co_data_bg, bg_correction_method=bg_correction_method
+         )
+         cross = Stare.from_halo_data(
+             data=cross_data,
+             data_bg=cross_data_bg,
+             bg_correction_method=bg_correction_method,
+         )
+         return cls(co, cross, polariser_bleed_through)
+
+     def write_to_netcdf(self, filename: str | Path) -> None:
+         with doppy.netcdf.Dataset(filename) as nc:
+             nc.add_dimension("time")
+             nc.add_dimension("range")
+             nc.add_time(
+                 name="time",
+                 dimensions=("time",),
+                 standard_name="time",
+                 long_name="Time UTC",
+                 data=self.time,
+                 dtype="f8",
+             )
+             nc.add_variable(
+                 name="range",
+                 dimensions=("range",),
+                 units="m",
+                 data=self.radial_distance,
+                 dtype="f4",
+             )
+             nc.add_variable(
+                 name="elevation",
+                 dimensions=("time",),
+                 units="degrees",
+                 data=self.elevation,
+                 dtype="f4",
+                 long_name="elevation from horizontal",
+             )
+             nc.add_variable(
+                 name="beta_raw",
+                 dimensions=("time", "range"),
+                 units="sr-1 m-1",
+                 data=self.beta,
+                 dtype="f4",
+             )
+             nc.add_variable(
+                 name="beta",
+                 dimensions=("time", "range"),
+                 units="sr-1 m-1",
+                 data=self.beta,
+                 dtype="f4",
+                 mask=self.mask_beta,
+             )
+             nc.add_variable(
+                 name="v",
+                 dimensions=("time", "range"),
+                 units="m s-1",
+                 long_name="Doppler velocity",
+                 data=self.radial_velocity,
+                 dtype="f4",
+                 mask=self.mask_radial_velocity,
+             )
+             nc.add_scalar_variable(
+                 name="wavelength",
+                 units="m",
+                 standard_name="radiation_wavelength",
+                 data=self.wavelength,
+                 dtype="f4",
+             )
+             nc.add_variable(
+                 name="depolarisation_raw",
+                 dimensions=("time", "range"),
+                 units="1",
+                 data=self.depolarisation,
+                 dtype="f4",
+                 mask=self.mask_depolarisation,
+             )
+             nc.add_variable(
+                 name="depolarisation",
+                 dimensions=("time", "range"),
+                 units="1",
+                 data=self.depolarisation,
+                 dtype="f4",
+                 mask=self.mask_beta | self.mask_depolarisation,
+             )
+             nc.add_variable(
+                 name="beta_cross_raw",
+                 dimensions=("time", "range"),
+                 units="sr-1 m-1",
+                 data=self.beta_cross,
+                 mask=self.mask_beta_cross,
+                 dtype="f4",
+             )
+             nc.add_variable(
+                 name="beta_cross",
+                 dimensions=("time", "range"),
+                 units="sr-1 m-1",
+                 data=self.beta_cross,
+                 mask=self.mask_beta | self.mask_beta_cross,
+                 dtype="f4",
+             )
+             nc.add_scalar_variable(
+                 name="polariser_bleed_through",
+                 units="1",
+                 long_name="Polariser bleed-through",
+                 data=self.polariser_bleed_through,
+                 dtype="f4",
+             )
+             match self.ray_info:
+                 case RayAccumulationTime(value):
+                     nc.add_scalar_variable(
+                         name="ray_accumulation_time",
+                         units="s",
+                         long_name="ray accumulation time",
+                         data=value,
+                         dtype="f4",
+                     )
+                 case PulsesPerRay(value):
+                     nc.add_scalar_variable(
+                         name="pulses_per_ray",
+                         units="1",
+                         long_name="pulses per ray",
+                         data=value,
+                         dtype="u4",
+                     )
+             nc.add_attribute("serial_number", self.system_id)
+             nc.add_attribute("doppy_version", doppy.__version__)
@@ -0,0 +1,264 @@
+ from __future__ import annotations
+
+ from dataclasses import dataclass
+
+ import numpy as np
+ import numpy.typing as npt
+ from scipy.interpolate import RegularGridInterpolator
+
+
+ @dataclass
+ class HorizontalWind:
+     time: npt.NDArray[np.datetime64]
+     height: npt.NDArray[np.float64]  # Height in meters from reference
+     V: npt.NDArray[np.float64]  # Horizontal wind speed in m/s
+
+
+ @dataclass
+ class VerticalWind:
+     time: npt.NDArray[np.datetime64]
+     height: npt.NDArray[np.float64]  # Height in meters from reference
+     w: npt.NDArray[np.float64]  # Vertical wind speed in m/s
+     mask: npt.NDArray[np.bool_]  # mask[t,h] = True iff w[t,h] should be masked
+
+
+ @dataclass
+ class Options:
+     ray_accumulation_time: float  # in seconds
+     period: float = 600  # period for computing the variance in seconds
+     beam_divergence: float = 33e-6  # radians
+
+
+ @dataclass
+ class Turbulence:
+     time: npt.NDArray[np.datetime64]
+     height: npt.NDArray[np.float64]
+     turbulent_kinetic_energy_dissipation_rate: npt.NDArray[np.float64]
+     mask: npt.NDArray[np.bool_]
+
+     @classmethod
+     def from_winds(
+         cls, vert: VerticalWind, hori: HorizontalWind, options: Options
+     ) -> Turbulence:
+         V = _preprocess_horiontal_wind(vert, hori, options)
+         ls_low = _length_scale_low(V, vert.height, options)
+         res = _compute_variance(vert, options.period)
+         sampling_time = _sampling_time_in_seconds(res)
+         ls_up = V * sampling_time
+         dissipation_rate = _compute_dissipation_rate(res.variance, ls_low, ls_up)
+         mask = np.isnan(dissipation_rate) | vert.mask
+         return cls(
+             time=vert.time.copy(),
+             height=vert.height.copy(),
+             turbulent_kinetic_energy_dissipation_rate=dissipation_rate,
+             mask=mask,
+         )
+
+
+ def _sampling_time_in_seconds(r: VarResult) -> npt.NDArray[np.float64]:
+     if not all(
+         (
+             t == np.dtype("datetime64[us]")
+             for t in (r.period_start.dtype, r.period_stop.dtype)
+         )
+     ):
+         raise ValueError("period times must be of dtype datetime64[us]")
+     td = r.period_stop - r.period_start
+     td_in_seconds = td / np.timedelta64(1, "s")
+     return np.array(td_in_seconds, dtype=np.float64)
+
+
+ @dataclass
+ class VarResult:
+     variance: npt.NDArray[np.float64]
+     period_start: npt.NDArray[np.datetime64]
+     period_stop: npt.NDArray[np.datetime64]
+     nsamples: npt.NDArray[np.int64]
+
+
+ def _compute_variance(vert: VerticalWind, period: float) -> VarResult:
+     # NOTE: numerically unstable
+
+     # To compute actual time window
+     next_valid = _next_valid_from_mask(vert.mask)
+     prev_valid = _prev_valid_from_mask(vert.mask)
+
+     X = vert.w.copy()
+     X[vert.mask] = 0
+     X2 = X**2
+     X_cumsum = X.cumsum(axis=0)
+     X2_cumsum = X2.cumsum(axis=0)
+
+     N_i = (~vert.mask).astype(int)
+     N_cumsum = N_i.cumsum(axis=0)
+
+     def N_func(i: int, j: int) -> npt.NDArray[np.float64]:
+         return np.array(N_cumsum[j] - N_cumsum[i] + N_i[i], dtype=np.float64)
+
+     def S(i: int, j: int) -> npt.NDArray[np.float64]:
+         return np.array(X_cumsum[j] - X_cumsum[i] + X[i], dtype=np.float64)
+
+     def S2(i: int, j: int) -> npt.NDArray[np.float64]:
+         return np.array(X2_cumsum[j] - X2_cumsum[i] + X2[i], dtype=np.float64)
+
+     def var_ij(i: int, j: int) -> npt.NDArray[np.float64]:
+         N = N_func(i, j)
+         with np.errstate(invalid="ignore"):
+             return np.array((S2(i, j) - S(i, j) ** 2 / N) / N, dtype=np.float64)
+
+     half_period = np.timedelta64(int(1e6 * period / 2), "us")
+     period_start = np.full(vert.w.shape, np.datetime64("NaT", "us"))
+     period_stop = np.full(vert.w.shape, np.datetime64("NaT", "us"))
+     var = np.full(vert.w.shape, np.nan, dtype=np.float64)
+     nsamples = np.zeros_like(vert.w, dtype=np.int64)
+     i = 0
+     j = 0
+     n = len(vert.time)
+     for k, t in enumerate(vert.time):
+         while i + 1 < n and t - vert.time[i + 1] >= half_period:
+             i += 1
+         while j + 1 < n and vert.time[j] - t < half_period:
+             j += 1
+         i_valid = next_valid[i]
+         i_inbound = (0 <= i_valid) & (i_valid < n)
+         j_valid = prev_valid[j]
+         j_inbound = (0 <= j_valid) & (j_valid < n)
+         period_start[k][i_inbound] = vert.time[i_valid[i_inbound]]
+         period_stop[k][j_inbound] = vert.time[j_valid[j_inbound]]
+         var[k] = var_ij(i, j)
+         nsamples[k] = N_func(i, j)
+     return VarResult(
+         variance=var,
+         period_start=period_start,
+         period_stop=period_stop,
+         nsamples=nsamples,
+     )
+
+
+ def _length_scale_low(
+     V: npt.NDArray[np.float64], height: npt.NDArray[np.float64], opts: Options
+ ) -> npt.NDArray[np.float64]:
+     integration_time = opts.ray_accumulation_time
+     from_beam = 2 * height * np.sin(opts.beam_divergence / 2)
+     from_wind = V * integration_time
+     return np.array(from_wind + from_beam[np.newaxis, :], dtype=np.float64)
+
+
+ def _preprocess_horiontal_wind(
+     vert: VerticalWind, hori: HorizontalWind, options: Options
+ ) -> npt.NDArray[np.float64]:
+     if np.isnan(hori.V).any():
+         raise ValueError("horizontal wind speed cannot contain NaNs")
+     trg_points = np.meshgrid(vert.time, vert.height, indexing="ij")
+     src_points = (hori.time, hori.height)
+     src_vals = hori.V
+
+     interp_nearest = RegularGridInterpolator(
+         src_points,
+         src_vals,
+         method="nearest",
+         bounds_error=False,
+         fill_value=None,
+     )
+     interp_linear = RegularGridInterpolator(
+         src_points, src_vals, method="linear", bounds_error=False
+     )
+     V_nearest = interp_nearest(trg_points)
+     V_linear = interp_linear(trg_points)
+     V = V_linear
+     V[np.isnan(V)] = V_nearest[np.isnan(V)]
+     if np.isnan(V).any():
+         raise ValueError("Unexpected NaNs")
+     V_rmean = _rolling_mean_over_time(vert.time, V, options.period)
+     return V_rmean
+
+
+ def _rolling_mean_over_time(
+     time: npt.NDArray[np.datetime64], arr: npt.NDArray[np.float64], period: float
+ ) -> npt.NDArray[np.float64]:
+     if arr.ndim != 2:
+         raise ValueError("number of dims on arr should be 2")
+     if time.ndim != 1 or time.shape[0] != arr.shape[0]:
+         raise ValueError("time and arr dimensions do not match")
+     if time.dtype != np.dtype("datetime64[us]"):
+         raise TypeError(f"Invalid time type: {time.dtype}")
+
+     S = arr.cumsum(axis=0)
+
+     def rolling_mean(i: int, j: int) -> npt.NDArray[np.float64]:
+         return np.array((S[j] - S[i] + arr[i]) / (j - i + 1), dtype=np.float64)
+
+     half_period = np.timedelta64(int(period * 0.5e6), "us")
+     rol_mean = np.full(arr.shape, np.nan, dtype=np.float64)
+
+     i = 0
+     j = 0
+     n = len(time)
+     for k, t in enumerate(time):
+         while i + 1 < n and t - time[i + 1] >= half_period:
+             i += 1
+         while j + 1 < n and time[j] - t < half_period:
+             j += 1
+         rol_mean[k] = rolling_mean(i, j)
+     return rol_mean
+
+
+ def _compute_dissipation_rate(
+     variance: npt.NDArray[np.float64],
+     length_scale_lower: npt.NDArray[np.float64],
+     length_scale_upper: npt.NDArray[np.float64],
+ ) -> npt.NDArray[np.float64]:
+     """
+     Parameters
+     ----------
+     variance, length_scale_lower, and length_scale_upper
+         dimensions: (time,range)
+     """
+     kolmogorov_constant = 0.55
+     with np.errstate(invalid="ignore"):
+         dr = (
+             2
+             * np.pi
+             * (2 / (3 * kolmogorov_constant)) ** (3 / 2)
+             * variance ** (3 / 2)
+             * (length_scale_upper ** (2 / 3) - length_scale_lower ** (2 / 3))
+             ** (-3 / 2)
+         )
+     return np.array(dr, dtype=np.float64)
+
+
+ def _next_valid_from_mask(mask: npt.NDArray[np.bool_]) -> npt.NDArray[np.int64]:
+     """
+     mask[t,v] (time,value)
+
+     returns N[t,v] = i where i = min { j | j >= t and mask[j,v] == False}
+     if the set is non-empty, and N[t,v] = len(mask) otherwise
+     """
+     n = len(mask)
+     N = np.full(mask.shape, n)
+     if mask.size == 0:
+         return N
+     N[-1][~mask[-1]] = n - 1
+
+     for t in reversed(range(n - 1)):
+         N[t][~mask[t]] = t
+         N[t][mask[t]] = N[t + 1][mask[t]]
+     return np.array(N, dtype=np.int64)
+
+
+ def _prev_valid_from_mask(mask: npt.NDArray[np.bool_]) -> npt.NDArray[np.int64]:
+     """
+     mask[t,v] (time,value)
+
+     returns N[t,v] = i where i = max { j | j <= t and mask[j,v] == False}
+     if the set is non-empty, and N[t,v] = -1 otherwise
+     """
+     n = len(mask)
+     N = np.full(mask.shape, -1)
+     if mask.size == 0:
+         return N
+     N[0][~mask[0]] = 0
+     for t in range(1, n):
+         N[t][~mask[t]] = t
+         N[t][mask[t]] = N[t - 1][mask[t]]
+     return np.array(N, dtype=np.int64)
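_compute_dissipation_rate applies a Kolmogorov-scaling variance method: epsilon = 2*pi * (2 / (3*C))**(3/2) * sigma_w**3 / (L_upper**(2/3) - L_lower**(2/3))**(3/2) with C = 0.55, where L_lower comes from _length_scale_low (beam width plus wind advection during one ray) and L_upper is the wind advection over the actual sampling period. A small numeric sketch of that formula with made-up input values:

import numpy as np

# Made-up inputs: vertical-velocity variance over the averaging period (m2 s-2)
variance = 0.25
# lower length scale: beam broadening plus advection during one ray (m)
length_scale_lower = 5.0
# upper length scale: advection over the sampling period (m)
length_scale_upper = 3000.0

kolmogorov_constant = 0.55
dissipation_rate = (
    2
    * np.pi
    * (2 / (3 * kolmogorov_constant)) ** (3 / 2)
    * variance ** (3 / 2)
    * (length_scale_upper ** (2 / 3) - length_scale_lower ** (2 / 3)) ** (-3 / 2)
)
# dissipation_rate is roughly 3.6e-4 m2 s-3 for these values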
doppy/product/utils.py ADDED
@@ -0,0 +1,12 @@
+ from collections import Counter
+
+ import numpy as np
+ import numpy.typing as npt
+
+
+ def arr_to_rounded_set(arr: npt.NDArray[np.float64]) -> set[int]:
+     return set(int(x) for x in np.round(arr))
+
+
+ def count_rounded(arr: npt.NDArray[np.float64]) -> Counter[int]:
+     return Counter(int(x) for x in np.round(arr))
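A quick sketch of the two helpers above, summarising which integer-rounded values occur in an array; the input values are made up:

import numpy as np

gate_lengths = np.array([29.98, 30.01, 30.02, 59.97])
arr_to_rounded_set(gate_lengths)  # -> {30, 60}
count_rounded(gate_lengths)  # -> Counter({30: 3, 60: 1})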