PyPI - legend-pydataobj - Versions diffs - 1.0.0__py3-none-any.whl - Mend

legend-pydataobj 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

legend_pydataobj-1.0.0.dist-info/LICENSE +674 -0
legend_pydataobj-1.0.0.dist-info/METADATA +63 -0
legend_pydataobj-1.0.0.dist-info/RECORD +26 -0
legend_pydataobj-1.0.0.dist-info/WHEEL +5 -0
legend_pydataobj-1.0.0.dist-info/top_level.txt +1 -0
lgdo/__init__.py +75 -0
lgdo/_version.py +4 -0
lgdo/compression/__init__.py +36 -0
lgdo/compression/base.py +29 -0
lgdo/compression/generic.py +77 -0
lgdo/compression/radware.py +579 -0
lgdo/compression/utils.py +34 -0
lgdo/compression/varlen.py +449 -0
lgdo/lgdo_utils.py +196 -0
lgdo/lh5_store.py +1711 -0
lgdo/types/__init__.py +30 -0
lgdo/types/array.py +140 -0
lgdo/types/arrayofequalsizedarrays.py +133 -0
lgdo/types/encoded.py +390 -0
lgdo/types/fixedsizearray.py +43 -0
lgdo/types/lgdo.py +51 -0
lgdo/types/scalar.py +59 -0
lgdo/types/struct.py +108 -0
lgdo/types/table.py +349 -0
lgdo/types/vectorofvectors.py +627 -0
lgdo/types/waveform_table.py +264 -0

lgdo/types/waveform_table.py ADDED Viewed

@@ -0,0 +1,264 @@
+"""
+Implements a LEGEND Data Object representing a special
+:class:`~.lgdo.table.Table` to store blocks of one-dimensional time-series
+data.
+"""
+from __future__ import annotations
+import logging
+from typing import Any
+import numpy as np
+from .array import Array
+from .arrayofequalsizedarrays import ArrayOfEqualSizedArrays
+from .encoded import ArrayOfEncodedEqualSizedArrays, VectorOfEncodedVectors
+from .table import Table
+from .vectorofvectors import VectorOfVectors
+# Module-level logger, named after this module via ``__name__``.
+log = logging.getLogger(__name__)
+class WaveformTable(Table):
+    r"""An LGDO for storing blocks of (1D) time-series data.
+    A :class:`WaveformTable` is an LGDO :class:`.Table` with the 3
+    columns ``t0``, ``dt``, and ``values``:
+    * ``t0[i]`` is a time offset (relative to a user-defined global reference)
+      for the sample in ``values[i][0]``. Implemented as an LGDO
+      :class:`.Array` with optional attribute ``units``.
+    * ``dt[i]`` is the sampling period for the waveform at ``values[i]``.
+      Implemented as an LGDO :class:`.Array` with optional attribute ``units``.
+    * ``values[i]`` is the ``i``'th waveform in the table. Internally, the
+      waveforms values may be either an LGDO :class:`.ArrayOfEqualSizedArrays`\
+      ``<1,1>``, an LGDO :class:`.VectorOfVectors` or
+      :class:`.VectorOfEncodedVectors` that supports waveforms of unequal
+      length. Can optionally be given a ``units`` attribute.
+    Note
+    ----
+    On-disk and in-memory versions could be different e.g. if a compression
+    routine is used.
+    """
+    def __init__(
+        self,
+        size: int = None,
+        t0: float | Array | np.ndarray = 0,
+        t0_units: str = None,
+        dt: float | Array | np.ndarray = 1,
+        dt_units: str = None,
+        values: ArrayOfEqualSizedArrays | VectorOfVectors | np.ndarray = None,
+        values_units: str = None,
+        wf_len: int = None,
+        dtype: np.dtype = None,
+        attrs: dict[str, Any] = None,
+    ) -> None:
+        r"""
+        Parameters
+        ----------
+        size
+            sets the number of rows in the table. If ``None``, the size will be
+            determined from the first among `t0`, `dt`, or `values` to return a
+            valid length. If not ``None``, `t0`, `dt`, and values will be
+            resized as necessary to match `size`. If `size` is ``None`` and
+            `t0`, `dt`, and `values` are all non-array-like, a default size of
+            1024 is used.
+        t0
+            :math:`t_0` values to be used (or broadcast) to the `t0` column.
+        t0_units
+            units for the :math:`t_0` values. If not ``None`` and `t0` is an
+            LGDO :class:`.Array`, overrides what's in `t0`.
+        dt
+            :math:`\delta t` values (sampling period) to be used (or
+            broadcasted) to the `t0` column.
+        dt_units
+            units for the `dt` values. If not ``None`` and `dt` is an LGDO
+            :class:`.Array`, overrides what's in `dt`.
+        values
+            The waveform data to be stored in the table. If ``None`` a block of
+            data is prepared based on the `wf_len` and `dtype` arguments.
+        values_units
+            units for the waveform values. If not ``None`` and `values` is an
+            LGDO :class:`.Array`, overrides what's in `values`.
+        wf_len
+            The length of the waveforms in each entry of a table. If ``None``
+            (the default), unequal lengths are assumed and
+            :class:`.VectorOfVectors` is used for the `values` column. Ignored
+            if `values` is a 2D ndarray, in which case ``values.shape[1]`` is
+            used.
+        dtype
+            The NumPy :class:`numpy.dtype` of the waveform data. If `values` is
+            not ``None``, this argument is ignored. If both `values` and
+            `dtype` are ``None``, :class:`numpy.float64` is used.
+        attrs
+            A set of user attributes to be carried along with this LGDO.
+        """
+        if size is None:
+            if hasattr(t0, "__len__"):
+                size = len(t0)
+            elif hasattr(dt, "__len__"):
+                size = len(dt)
+            elif hasattr(values, "__len__"):
+                size = len(values)
+            if size is None:
+                size = 1024
+        if not isinstance(t0, Array):
+            shape = (size,)
+            t0_dtype = t0.dtype if hasattr(t0, "dtype") else np.float32
+            nda = (
+                t0 if isinstance(t0, np.ndarray) else np.full(shape, t0, dtype=t0_dtype)
+            )
+            if nda.shape != shape:
+                nda.resize(shape, refcheck=True)
+            t0 = Array(nda=nda)
+        if t0_units is not None:
+            t0.attrs["units"] = f"{t0_units}"
+        if not isinstance(dt, Array):
+            shape = (size,)
+            dt_dtype = dt.dtype if hasattr(dt, "dtype") else np.float32
+            nda = (
+                dt if isinstance(dt, np.ndarray) else np.full(shape, dt, dtype=dt_dtype)
+            )
+            if nda.shape != shape:
+                nda.resize(shape, refcheck=True)
+            dt = Array(nda=nda)
+        if dt_units is not None:
+            dt.attrs["units"] = f"{dt_units}"
+        if not isinstance(
+            values,
+            (
+                ArrayOfEqualSizedArrays,
+                VectorOfVectors,
+                VectorOfEncodedVectors,
+                ArrayOfEncodedEqualSizedArrays,
+            ),
+        ):
+            if isinstance(values, np.ndarray):
+                try:
+                    wf_len = values.shape[1]
+                except Exception:
+                    wf_len = None
+            if wf_len is None:  # make a VectorOfVectors
+                shape_guess = (size, 100)
+                if dtype is None:
+                    dtype = np.dtype(np.float64)
+                if values is None:
+                    values = VectorOfVectors(shape_guess=shape_guess, dtype=dtype)
+                else:
+                    flattened_data = np.concatenate(values)
+                    length = 0
+                    cumulative_length = []
+                    for i in range(size):
+                        length += len(values[i])
+                        cumulative_length.append(length)
+                    values = VectorOfVectors(
+                        flattened_data=flattened_data,
+                        cumulative_length=cumulative_length,
+                        dtype=dtype,
+                    )
+            else:  # make a ArrayOfEqualSizedArrays
+                shape = (size, wf_len)
+                if dtype is None:
+                    dtype = (
+                        values.dtype
+                        if hasattr(values, "dtype")
+                        else np.dtype(np.float64)
+                    )
+                nda = (
+                    values
+                    if isinstance(values, np.ndarray)
+                    else np.zeros(shape, dtype=dtype)
+                )
+                if nda.shape != shape:
+                    nda.resize(shape, refcheck=True)
+                values = ArrayOfEqualSizedArrays(dims=(1, 1), nda=nda)
+        if values_units is not None:
+            values.attrs["units"] = f"{values_units}"
+        col_dict = {}
+        col_dict["t0"] = t0
+        col_dict["dt"] = dt
+        col_dict["values"] = values
+        super().__init__(size=size, col_dict=col_dict, attrs=attrs)
+    @property
+    def values(self) -> ArrayOfEqualSizedArrays | VectorOfVectors:
+        return self["values"]
+    @property
+    def values_units(self) -> str:
+        return self.values.attrs.get("units", None)
+    @values_units.setter
+    def values_units(self, units) -> None:
+        self.values.attrs["units"] = f"{units}"
+    @property
+    def wf_len(self) -> int:
+        if isinstance(self.values, VectorOfVectors):
+            return -1
+        return self.values.nda.shape[1]
+    @wf_len.setter
+    def wf_len(self, wf_len) -> None:
+        if isinstance(self.values, VectorOfVectors):
+            return
+        shape = self.values.nda.shape
+        shape = (shape[0], wf_len)
+        self.values.nda.resize(shape, refcheck=True)
+    def resize_wf_len(self, new_len: int) -> None:
+        """Alias for `wf_len.setter`, for when we want to make it clear in
+        the code that memory is being reallocated.
+        """
+        self.wf_len = new_len
+    @property
+    def t0(self) -> Array:
+        return self["t0"]
+    @property
+    def t0_units(self) -> str:
+        return self.t0.attrs.get("units", None)
+    @t0_units.setter
+    def t0_units(self, units: str) -> None:
+        self.t0.attrs["units"] = f"{units}"
+    @property
+    def dt(self) -> Array:
+        return self["dt"]
+    @property
+    def dt_units(self) -> str:
+        return self.dt.attrs.get("units", None)
+    @dt_units.setter
+    def dt_units(self, units: str) -> None:
+        self.dt.attrs["units"] = f"{units}"
+    def __str__(self):
+        npopt = np.get_printoptions()
+        np.set_printoptions(threshold=100)
+        string = ""
+        for i in range(self.size):
+            string += f"{self.values[i]}, dt={self.dt[i]}"
+            if self.dt_units:
+                string += f" {self.dt_units}"
+            string += f", t0={self.t0[i]}"
+            if self.t0_units:
+                string += f" {self.t0_units}"
+            if i < self.size - 1:
+                string += "\n"
+        np.set_printoptions(**npopt)
+        return string