PyPI - reboost - Versions diffs - 0.6.2__py3-none-any.whl → 0.8.0__py3-none-any.whl - Mend

reboost 0.6.2__py3-none-any.whl → 0.8.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30) hide show

reboost/_version.py +16 -3
reboost/build_hit.py +102 -58
reboost/cli.py +1 -0
reboost/core.py +18 -9
reboost/daq/__init__.py +5 -0
reboost/daq/core.py +262 -0
reboost/daq/utils.py +28 -0
reboost/hpge/psd.py +444 -94
reboost/hpge/surface.py +34 -1
reboost/hpge/utils.py +2 -1
reboost/iterator.py +4 -1
reboost/math/stats.py +2 -2
reboost/optmap/cli.py +40 -101
reboost/optmap/convolve.py +206 -233
reboost/optmap/create.py +41 -124
reboost/optmap/evt.py +5 -2
reboost/optmap/mapview.py +9 -7
reboost/optmap/optmap.py +13 -14
reboost/shape/cluster.py +4 -4
reboost/spms/__init__.py +5 -0
reboost/spms/pe.py +178 -0
reboost/units.py +40 -8
reboost/utils.py +65 -3
{reboost-0.6.2.dist-info → reboost-0.8.0.dist-info}/METADATA +7 -5
reboost-0.8.0.dist-info/RECORD +42 -0
reboost-0.6.2.dist-info/RECORD +0 -37
{reboost-0.6.2.dist-info → reboost-0.8.0.dist-info}/WHEEL +0 -0
{reboost-0.6.2.dist-info → reboost-0.8.0.dist-info}/entry_points.txt +0 -0
{reboost-0.6.2.dist-info → reboost-0.8.0.dist-info}/licenses/LICENSE +0 -0
{reboost-0.6.2.dist-info → reboost-0.8.0.dist-info}/top_level.txt +0 -0

reboost/optmap/convolve.py CHANGED Viewed

@@ -2,17 +2,17 @@ from __future__ import annotations
 import logging
 import re
+from typing import NamedTuple
+import awkward as ak
 import legendoptics.scintillate as sc
 import numba
 import numpy as np
-import pint
-from legendoptics import lar
+from legendoptics import fibers, lar, pen
 from lgdo import lh5
-from lgdo.lh5 import LH5Iterator
 from lgdo.types import Array, Histogram, Table
-from numba import njit, prange
-from numpy.lib.recfunctions import structured_to_unstructured
+from numba import njit
+from numpy.typing import NDArray
 from .numba_pdg import numba_pdgid_funcs
@@ -23,22 +23,31 @@ OPTMAP_ANY_CH = -1
 OPTMAP_SUM_CH = -2
-def open_optmap(optmap_fn: str):
+class OptmapForConvolve(NamedTuple):
+    """A loaded optmap for convolving."""
+    detids: NDArray
+    detidx: NDArray
+    edges: NDArray
+    weights: NDArray
+def open_optmap(optmap_fn: str) -> OptmapForConvolve:
     maps = lh5.ls(optmap_fn)
     # only accept _<number> (/all is read separately)
     det_ntuples = [m for m in maps if re.match(r"_\d+$", m)]
     detids = np.array([int(m.lstrip("_")) for m in det_ntuples])
     detidx = np.arange(0, detids.shape[0])
-    optmap_all = lh5.read("/all/p_det", optmap_fn)
+    optmap_all = lh5.read("/all/prob", optmap_fn)
     assert isinstance(optmap_all, Histogram)
     optmap_edges = tuple([b.edges for b in optmap_all.binning])
     ow = np.empty((detidx.shape[0] + 2, *optmap_all.weights.nda.shape), dtype=np.float64)
     # 0, ..., len(detidx)-1 AND OPTMAP_ANY_CH might be negative.
     ow[OPTMAP_ANY_CH] = optmap_all.weights.nda
-    for i, nt in zip(detidx, det_ntuples):
-        optmap = lh5.read(f"/{nt}/p_det", optmap_fn)
+    for i, nt in zip(detidx, det_ntuples, strict=True):
+        optmap = lh5.read(f"/{nt}/prob", optmap_fn)
         assert isinstance(optmap, Histogram)
         ow[i] = optmap.weights.nda
@@ -69,38 +78,67 @@ def open_optmap(optmap_fn: str):
         if np.isfinite(optmap_multi_det_exp):
             msg = f"found finite _hitcounts_exp {optmap_multi_det_exp} which is not supported any more"
             raise RuntimeError(msg)
-    except KeyError:  # the _hitcounts_exp might not be always present.
+    except lh5.exceptions.LH5DecodeError:  # the _hitcounts_exp might not be always present.
         pass
-    return detids, detidx, optmap_edges, ow
+    return OptmapForConvolve(detids, detidx, optmap_edges, ow)
-def iterate_stepwise_depositions(
-    edep_df: np.rec.recarray,
-    optmap_for_convolve,
+def open_optmap_single(optmap_fn: str, spm_det_uid: int) -> OptmapForConvolve:
+    try:
+        # check the exponent from the optical map file
+        optmap_multi_det_exp = lh5.read("/_hitcounts_exp", optmap_fn).value
+        assert isinstance(optmap_multi_det_exp, float)
+        if np.isfinite(optmap_multi_det_exp):
+            msg = f"found finite _hitcounts_exp {optmap_multi_det_exp} which is not supported any more"
+            raise RuntimeError(msg)
+    except lh5.exceptions.LH5DecodeError:  # the _hitcounts_exp might not be always present.
+        pass
+    optmap = lh5.read(f"/_{spm_det_uid}/prob", optmap_fn)
+    assert isinstance(optmap, Histogram)
+    ow = np.empty((1, *optmap.weights.nda.shape), dtype=np.float64)
+    ow[0] = optmap.weights.nda
+    optmap_edges = tuple([b.edges for b in optmap.binning])
+    return OptmapForConvolve(np.array([spm_det_uid]), np.array([0]), optmap_edges, ow)
+def iterate_stepwise_depositions_pois(
+    edep_hits: ak.Array,
+    optmap: OptmapForConvolve,
     scint_mat_params: sc.ComputedScintParams,
-    rng: np.random.Generator = None,
-    dist: str = "poisson",
-    mode: str = "no-fano",
+    det_uid: int,
+    map_scaling: float = 1,
+    map_scaling_sigma: float = 0,
+    rng: np.random.Generator | None = None,
 ):
-    # those np functions are not supported by numba, but needed for efficient array access below.
-    if "xloc_pre" in edep_df.dtype.names:
-        x0 = structured_to_unstructured(edep_df[["xloc_pre", "yloc_pre", "zloc_pre"]], np.float64)
-        x1 = structured_to_unstructured(
-            edep_df[["xloc_post", "yloc_post", "zloc_post"]], np.float64
-        )
-    else:
-        x0 = structured_to_unstructured(edep_df[["xloc", "yloc", "zloc"]], np.float64)
-        x1 = None
+    if edep_hits.particle.ndim == 1:
+        msg = "the pe processors only support already reshaped output"
+        raise ValueError(msg)
     rng = np.random.default_rng() if rng is None else rng
-    output_map, res = _iterate_stepwise_depositions(
-        edep_df, x0, x1, rng, *optmap_for_convolve, scint_mat_params, dist, mode
+    res, output_list = _iterate_stepwise_depositions_pois(
+        edep_hits,
+        rng,
+        np.where(optmap.detids == det_uid)[0][0],
+        map_scaling,
+        map_scaling_sigma,
+        optmap.edges,
+        optmap.weights,
+        scint_mat_params,
     )
-    if res["any_no_stats"] > 0 or res["det_no_stats"] > 0:
+    # convert the numba result back into an awkward array.
+    builder = ak.ArrayBuilder()
+    for r in output_list:
+        with builder.list():
+            for a in r:
+                builder.extend(a)
+    if res["det_no_stats"] > 0:
         log.warning(
-            "had edep out in voxels without stats: %d (%.2f%%)",
-            res["any_no_stats"],
+            "had edep out in voxels without stats: %d",
             res["det_no_stats"],
         )
     if res["oob"] > 0:
@@ -110,14 +148,34 @@ def iterate_stepwise_depositions(
             (res["oob"] / (res["ib"] + res["oob"])) * 100,
         )
     log.debug(
-        "VUV_primary %d ->hits_any %d ->hits %d (%.2f %% primaries detected)",
+        "VUV_primary %d ->hits %d (%.2f %% primaries detected in this channel)",
         res["vuv_primary"],
-        res["hits_any"],
         res["hits"],
-        (res["hits_any"] / res["vuv_primary"]) * 100,
+        (res["hits"] / res["vuv_primary"]) * 100,
     )
-    log.debug("hits/hits_any %.2f", res["hits"] / res["hits_any"])
-    return output_map
+    return builder.snapshot()
+def iterate_stepwise_depositions_scintillate(
+    edep_hits: ak.Array,
+    scint_mat_params: sc.ComputedScintParams,
+    rng: np.random.Generator | None = None,
+    mode: str = "no-fano",
+):
+    if edep_hits.particle.ndim == 1:
+        msg = "the pe processors only support already reshaped output"
+        raise ValueError(msg)
+    rng = np.random.default_rng() if rng is None else rng
+    output_list = _iterate_stepwise_depositions_scintillate(edep_hits, rng, scint_mat_params, mode)
+    # convert the numba result back into an awkward array.
+    builder = ak.ArrayBuilder()
+    for r in output_list:
+        with builder.list():
+            builder.extend(r)
+    return builder.snapshot()
 _pdg_func = numba_pdgid_funcs()
@@ -144,178 +202,116 @@ __counts_per_bin_key_type = numba.types.UniTuple(numba.types.int64, 3)
 # - cache=True does not work with outer prange, i.e. loading the cached file fails (numba bug?)
 # - the output dictionary is not threadsafe, so parallel=True is not working with it.
 @njit(parallel=False, nogil=True, cache=True)
-def _iterate_stepwise_depositions(
-    edep_df,
-    x0,
-    x1,
+def _iterate_stepwise_depositions_pois(
+    edep_hits,
     rng,
-    detids,
-    detidx,
+    detidx: int,
+    map_scaling: float,
+    map_scaling_sigma: float,
     optmap_edges,
     optmap_weights,
     scint_mat_params: sc.ComputedScintParams,
-    dist: str,
-    mode: str,
 ):
     pdgid_map = {}
-    output_map = {}
-    oob = ib = ph_cnt = ph_det = ph_det2 = any_no_stats = det_no_stats = 0  # for statistics
-    for rowid in prange(edep_df.shape[0]):
-        # if rowid % 100000 == 0:
-        #     print(rowid)
-        t = edep_df[rowid]
-        # get the particle information.
-        if t.particle not in pdgid_map:
-            pdgid_map[t.particle] = (_pdgid_to_particle(t.particle), _pdg_func.charge(t.particle))
-        # do the scintillation.
-        part, charge = pdgid_map[t.particle]
-        # if we have both pre and post step points use them
-        # else pass as None
-        scint_times = sc.scintillate(
-            scint_mat_params,
-            x0[rowid],
-            x1[rowid] if x1 is not None else None,
-            t.v_pre if x1 is not None else None,
-            t.v_post if x1 is not None else None,
-            t.time,
-            part,
-            charge,
-            t.edep,
-            rng,
-            emission_term_model=("poisson" if mode == "no-fano" else "normal_fano"),
-        )
-        if scint_times.shape[0] == 0:  # short-circuit if we have no photons at all.
-            continue
-        ph_cnt += scint_times.shape[0]
-        # coordinates -> bins of the optical map.
-        bins = np.empty((scint_times.shape[0], 3), dtype=np.int64)
-        for j in range(3):
-            bins[:, j] = np.digitize(scint_times[:, j + 1], optmap_edges[j])
-            # normalize all out-of-bounds bins just to one end.
-            bins[:, j][bins[:, j] == optmap_edges[j].shape[0]] = 0
-        # there are _much_ less unique bins, unfortunately np.unique(..., axis=n) does not work
-        # with numba; also np.sort(..., axis=n) also does not work.
-        counts_per_bin = numba.typed.Dict.empty(
-            key_type=__counts_per_bin_key_type,
-            value_type=np.int64,
-        )
+    oob = ib = ph_cnt = ph_det2 = det_no_stats = 0  # for statistics
+    output_list = []
+    for rowid in range(len(edep_hits)):  # iterate hits
+        hit = edep_hits[rowid]
+        hit_output = []
+        map_scaling_evt = map_scaling
+        if map_scaling_sigma > 0:
+            map_scaling_evt = rng.normal(loc=map_scaling, scale=map_scaling_sigma)
+        assert len(hit.particle) == len(hit.num_scint_ph)
+        # iterate steps inside the hit
+        for si in range(len(hit.particle)):
+            loc = np.array([hit.xloc[si], hit.yloc[si], hit.zloc[si]])
+            # coordinates -> bins of the optical map.
+            bins = np.empty(3, dtype=np.int64)
+            for j in range(3):
+                bins[j] = np.digitize(loc[j], optmap_edges[j])
+                # normalize all out-of-bounds bins just to one end.
+                if bins[j] == optmap_edges[j].shape[0]:
+                    bins[j] = 0
-        # get probabilities from map.
-        hitcount = np.zeros((detidx.shape[0], bins.shape[0]), dtype=np.int64)
-        for j in prange(bins.shape[0]):
             # note: subtract 1 from bins, to account for np.digitize output.
-            cur_bins = (bins[j, 0] - 1, bins[j, 1] - 1, bins[j, 2] - 1)
+            cur_bins = (bins[0] - 1, bins[1] - 1, bins[2] - 1)
             if cur_bins[0] == -1 or cur_bins[1] == -1 or cur_bins[2] == -1:
                 oob += 1
                 continue  # out-of-bounds of optmap
             ib += 1
-            px_any = optmap_weights[OPTMAP_ANY_CH, cur_bins[0], cur_bins[1], cur_bins[2]]
-            if px_any < 0.0:
-                any_no_stats += 1
-                continue
-            if px_any == 0.0:
+            # get probabilities from map.
+            detp = optmap_weights[detidx, cur_bins[0], cur_bins[1], cur_bins[2]] * map_scaling_evt
+            if detp < 0.0:
+                det_no_stats += 1
                 continue
-            if dist == "multinomial":
-                if rng.uniform() >= px_any:
-                    continue
-                ph_det += 1
-                # we detect this energy deposition; we should at least get one photon out here!
-                detsel_size = 1
-                px_sum = optmap_weights[OPTMAP_SUM_CH, cur_bins[0], cur_bins[1], cur_bins[2]]
-                assert px_sum >= 0.0  # should not be negative.
-                detp = np.empty(detidx.shape, dtype=np.float64)
-                had_det_no_stats = 0
-                for d in detidx:
-                    # normalize so that sum(detp) = 1
-                    detp[d] = optmap_weights[d, cur_bins[0], cur_bins[1], cur_bins[2]] / px_sum
-                    if detp[d] < 0.0:
-                        had_det_no_stats = 1
-                        detp[d] = 0.0
-                det_no_stats += had_det_no_stats
-                # should be equivalent to rng.choice(detidx, size=detsel_size, p=detp)
-                detsel = detidx[
-                    np.searchsorted(np.cumsum(detp), rng.random(size=(detsel_size,)), side="right")
-                ]
-                for d in detsel:
-                    hitcount[d, j] += 1
-                ph_det2 += detsel.shape[0]
-            elif dist == "poisson":
-                # store the photon count in each bin, to sample them all at once below.
-                if cur_bins not in counts_per_bin:
-                    counts_per_bin[cur_bins] = 1
-                else:
-                    counts_per_bin[cur_bins] += 1
-            else:
-                msg = "unknown distribution"
-                raise RuntimeError(msg)
-        if dist == "poisson":
-            for j, (cur_bins, ph_counts_to_poisson) in enumerate(counts_per_bin.items()):
-                had_det_no_stats = 0
-                had_any = 0
-                for d in detidx:
-                    detp = optmap_weights[d, cur_bins[0], cur_bins[1], cur_bins[2]]
-                    if detp < 0.0:
-                        had_det_no_stats = 1
-                        continue
-                    pois_cnt = rng.poisson(lam=ph_counts_to_poisson * detp)
-                    hitcount[d, j] += pois_cnt
-                    ph_det2 += pois_cnt
-                    had_any = 1
-                ph_det += had_any
-                det_no_stats += had_det_no_stats
-        assert scint_times.shape[0] >= hitcount.shape[1]  # TODO: use the right assertion here.
-        out_hits_len = np.sum(hitcount)
-        if out_hits_len > 0:
-            out_times = np.empty(out_hits_len, dtype=np.float64)
-            out_det = np.empty(out_hits_len, dtype=np.int64)
-            out_idx = 0
-            for d in detidx:
-                hc_d_plane_max = np.max(hitcount[d, :])
-                # untangle the hitcount array in "planes" that only contain the given number of hits per
-                # channel. example: assume a "histogram" of hits per channel:
-                #     x |   |    <-- this is plane 2 with 1 hit ("max plane")
-                #     x |   | x  <-- this is plane 1 with 2 hits
-                # ch: 1 | 2 | 3
-                for hc_d_plane_cnt in range(1, hc_d_plane_max + 1):
-                    hc_d_plane = hitcount[d, :] >= hc_d_plane_cnt
-                    hc_d_plane_len = np.sum(hc_d_plane)
-                    if hc_d_plane_len == 0:
-                        continue
-                    # note: we assume "immediate" propagation after scintillation. Here, a single timestamp
-                    # might be coipied to output/"detected" twice.
-                    out_times[out_idx : out_idx + hc_d_plane_len] = scint_times[hc_d_plane, 0]
-                    out_det[out_idx : out_idx + hc_d_plane_len] = detids[d]
-                    out_idx += hc_d_plane_len
-            assert out_idx == out_hits_len  # ensure that all of out_{det,times} is filled.
-            output_map[np.int64(rowid)] = (t.evtid, out_det, out_times)
+            pois_cnt = rng.poisson(lam=hit.num_scint_ph[si] * detp)
+            ph_cnt += hit.num_scint_ph[si]
+            ph_det2 += pois_cnt
+            # get the particle information.
+            particle = hit.particle[si]
+            if particle not in pdgid_map:
+                pdgid_map[particle] = (_pdgid_to_particle(particle), _pdg_func.charge(particle))
+            part, _charge = pdgid_map[particle]
+            # get time spectrum.
+            # note: we assume "immediate" propagation after scintillation.
+            scint_times = sc.scintillate_times(scint_mat_params, part, pois_cnt, rng) + hit.time[si]
+            hit_output.append(scint_times)
+        output_list.append(hit_output)
     stats = {
         "oob": oob,
         "ib": ib,
         "vuv_primary": ph_cnt,
-        "hits_any": ph_det,
         "hits": ph_det2,
-        "any_no_stats": any_no_stats,
         "det_no_stats": det_no_stats,
     }
-    return output_map, stats
+    return stats, output_list
+# - run with NUMBA_FULL_TRACEBACKS=1 NUMBA_BOUNDSCHECK=1 for testing/checking
+# - cache=True does not work with outer prange, i.e. loading the cached file fails (numba bug?)
+@njit(parallel=False, nogil=True, cache=True)
+def _iterate_stepwise_depositions_scintillate(
+    edep_hits, rng, scint_mat_params: sc.ComputedScintParams, mode: str
+):
+    pdgid_map = {}
+    output_list = []
+    for rowid in range(len(edep_hits)):  # iterate hits
+        hit = edep_hits[rowid]
+        hit_output = []
+        # iterate steps inside the hit
+        for si in range(len(hit.particle)):
+            # get the particle information.
+            particle = hit.particle[si]
+            if particle not in pdgid_map:
+                pdgid_map[particle] = (_pdgid_to_particle(particle), _pdg_func.charge(particle))
+            part, _charge = pdgid_map[particle]
+            # do the scintillation.
+            num_phot = sc.scintillate_numphot(
+                scint_mat_params,
+                part,
+                hit.edep[si],
+                rng,
+                emission_term_model=("poisson" if mode == "no-fano" else "normal_fano"),
+            )
+            hit_output.append(num_phot)
+        assert len(hit_output) == len(hit.particle)
+        output_list.append(hit_output)
+    return output_list
 def get_output_table(output_map):
@@ -338,58 +334,35 @@ def get_output_table(output_map):
     return ph_count_o, tbl
-def convolve(
-    map_file: str,
-    edep_file: str,
-    edep_path: str,
-    material: str,
-    output_file: str | None = None,
-    buffer_len: int = int(1e6),
-    dist_mode: str = "poisson+no-fano",
-):
-    if material not in ["lar", "pen"]:
-        msg = f"unknown material {material} for scintillation"
-        raise ValueError(msg)
+def _reflatten_scint_vov(arr: ak.Array) -> ak.Array:
+    if all(arr[f].ndim == 1 for f in ak.fields(arr)):
+        return arr
+    group_num = ak.num(arr["edep"]).to_numpy()
+    flattened = {
+        f: ak.flatten(arr[f]) if arr[f].ndim > 1 else np.repeat(arr[f].to_numpy(), group_num)
+        for f in ak.fields(arr)
+    }
+    return ak.Array(flattened)
+def _get_scint_params(material: str):
     if material == "lar":
-        scint_mat_params = sc.precompute_scintillation_params(
+        return sc.precompute_scintillation_params(
             lar.lar_scintillation_params(),
             lar.lar_lifetimes().as_tuple(),
         )
-    elif material == "pen":
-        scint_mat_params = sc.precompute_scintillation_params(
-            lar.pen_scintillation_params(),
-            (1 * pint.get_application_registry().ns),  # dummy!
-        )
-    # special handling of distributions and flags.
-    dist, mode = dist_mode.split("+")
-    if (
-        dist not in ("multinomial", "poisson")
-        or mode not in ("", "no-fano")
-        or (dist == "poisson" and mode != "no-fano")
-    ):
-        msg = f"unsupported statistical distribution {dist_mode} for scintillation emission"
-        raise ValueError(msg)
-    log.info("opening map %s", map_file)
-    optmap_for_convolve = open_optmap(map_file)
-    log.info("opening energy deposition hit output %s", edep_file)
-    it = LH5Iterator(edep_file, edep_path, buffer_len=buffer_len)
-    for it_count, edep_lgdo in enumerate(it):
-        edep_df = edep_lgdo.view_as("pd").to_records()
-        log.info("start event processing (%d)", it_count)
-        output_map = iterate_stepwise_depositions(
-            edep_df, optmap_for_convolve, scint_mat_params, dist=dist, mode=mode
+    if material == "pen":
+        return sc.precompute_scintillation_params(
+            pen.pen_scintillation_params(),
+            (pen.pen_scint_timeconstant(),),
         )
-        log.info("store output photon hits (%d)", it_count)
-        ph_count_o, tbl = get_output_table(output_map)
-        log.debug(
-            "output photons: %d energy depositions -> %d photons", len(output_map), ph_count_o
+    if material == "fiber":
+        return sc.precompute_scintillation_params(
+            fibers.fiber_core_scintillation_params(),
+            (fibers.fiber_wls_timeconstant(),),
         )
-        if output_file is not None:
-            lh5.write(tbl, "optical", lh5_file=output_file, group="stp", wo_mode="append")
+    if isinstance(material, str):
+        msg = f"unknown material {material} for scintillation"
+        raise ValueError(msg)
+    return sc.precompute_scintillation_params(*material)

reboost 0.6.2__py3-none-any.whl → 0.8.0__py3-none-any.whl

reboost 0.6.2__py3-none-any.whl → 0.8.0__py3-none-any.whl