legend-dataflow-scripts 0.1.4__py3-none-any.whl → 0.1.6__py3-none-any.whl

This diff compares two publicly released versions of the package as published to their public registry. It is provided for informational purposes only and reflects the changes between those versions.
@@ -1,6 +1,6 @@
  Metadata-Version: 2.4
  Name: legend-dataflow-scripts
- Version: 0.1.4
+ Version: 0.1.6
  Summary: Python package for the processing scripts for LEGEND-200 data
  Author-email: George Marshall <ggmarsh@uw.edu>, Luigi Pertoldi <gipert@pm.me>
  Maintainer: The LEGEND Collaboration
@@ -1,37 +1,37 @@
  legenddataflowscripts/__init__.py,sha256=hlpvTxSBjOyXlZUyOyYx3VwT5LS6zNzhAZnTmfT3NjU,303
- legenddataflowscripts/_version.py,sha256=hcPkC9vIGgfrKK6ft7ysLT7iOCjpFmCBmyKLmXiaZ1g,511
+ legenddataflowscripts/_version.py,sha256=ESbJO0YD7TYfOUv_WDIJJgWELGepEWsoyhqVifEcXPA,511
  legenddataflowscripts/par/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
  legenddataflowscripts/par/geds/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
  legenddataflowscripts/par/geds/dsp/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
  legenddataflowscripts/par/geds/dsp/dplms.py,sha256=OOvnN_OcU046zhuyNTGxcmGYLCZ7YseK4rNyMDaRsC4,5314
- legenddataflowscripts/par/geds/dsp/eopt.py,sha256=UklMozVw57X8EhOVjOxwKSXtuHkX45iJ2YMLx69TQps,13680
+ legenddataflowscripts/par/geds/dsp/eopt.py,sha256=jmljkIPamz-L1lX8kEqSdmRuZJ-a9---9Qj-1ACghNQ,13792
  legenddataflowscripts/par/geds/dsp/evtsel.py,sha256=qheFqGezjRxW9UNf9DV1n8VuZjCLGZT-WaWyhrfgPJ4,16485
  legenddataflowscripts/par/geds/dsp/nopt.py,sha256=K7R4OBfO0wek03VvhBoYXDP7lURi_Xoph9Kb3iMkfx4,4263
  legenddataflowscripts/par/geds/dsp/pz.py,sha256=sucYUtsgWKYtR-GbmRh5b61EYHqNRMWGckD3DJdHUvs,8273
  legenddataflowscripts/par/geds/dsp/svm.py,sha256=eDneRB_PQZp8Q4n2VheTX3kbu4ufZQ-jnuCCjvtwFpk,826
  legenddataflowscripts/par/geds/dsp/svm_build.py,sha256=8K0NUpQqL2HUWRKjMpM5H-TienVPUzIuKED94ZZnIzA,2227
  legenddataflowscripts/par/geds/hit/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
- legenddataflowscripts/par/geds/hit/aoe.py,sha256=4sXRz6UaPD7phihAO3_C42l7fJT8UrhhOZswzO8rAqw,11387
- legenddataflowscripts/par/geds/hit/ecal.py,sha256=tsIL9FP-aXgM2B1K8ygjcsLeNZ9Yv7je84fT-K7m3vQ,26194
- legenddataflowscripts/par/geds/hit/lq.py,sha256=td0qVvVRwYbhiA-IhAZYLgTdW6xpTeeE3mrSoWeLw2U,11307
+ legenddataflowscripts/par/geds/hit/aoe.py,sha256=lkA7cgSRdyDt58AYOIuPoCBxiClVJU-6wwYSImpdVFg,11413
+ legenddataflowscripts/par/geds/hit/ecal.py,sha256=HogjtX-QUkwogh-jA9F0jTTvEjEfCUK5GY4cHGUBaAw,27854
+ legenddataflowscripts/par/geds/hit/lq.py,sha256=TW3vu0UFYgQz2-vrb_ic8ghIpe3ukKMF4Kt-iFP7VAQ,11346
  legenddataflowscripts/par/geds/hit/qc.py,sha256=16RWhybvnODv4dUuSkO6EDtPvJJJmeFwFaPTgS9N7cs,12746
  legenddataflowscripts/tier/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
  legenddataflowscripts/tier/dsp.py,sha256=J_ABEqbQurZHJOg8LV2aporNjZQpPg2bDZG6DkmuAL4,8633
  legenddataflowscripts/tier/hit.py,sha256=-LCfsqYAYPAuN2OKbPuh4G2P5B4uA4YmQGcqUtbZxis,4989
  legenddataflowscripts/utils/__init__.py,sha256=NPpxqapio8CeQIbG8gYnz-OPoUbOlDT6tjXV-lJrKWc,426
- legenddataflowscripts/utils/alias_table.py,sha256=e0wRiDcpje8VVr_PlcbkA0kPz0qSGpGX4vJ3tfGefMA,742
+ legenddataflowscripts/utils/alias_table.py,sha256=OfET_-ZG6FfXL9JRqPJiSWUdDrDQlNnz5RsLkH2sk5Y,1605
  legenddataflowscripts/utils/cfgtools.py,sha256=_1yxw_eJ08AihONhJ9sWet5HQZpOagj8Yg8y9LS3zX4,381
- legenddataflowscripts/utils/convert_np.py,sha256=8q_K3w3jAREG-9CJlErP3Vca0OYTYAYJIK4g_TClvBU,819
+ legenddataflowscripts/utils/convert_np.py,sha256=qw-pX9345lhzLAwERLjEJtnikzAWWIeD9lyDre2n9P0,853
  legenddataflowscripts/utils/log.py,sha256=5v8J7PZJHHoSy12w9e9DkYmqdPvYXj6YfVaMbhvX614,2230
  legenddataflowscripts/utils/plot_dict.py,sha256=-wfJC5U9OTE1Asazz64kT5Ta008w6UJmDSsr3YAubRM,449
  legenddataflowscripts/utils/pulser_removal.py,sha256=kuARdp1jf-lsUWcb0_KRDp-ZXzkHNrDCXUc3h7TJm7Q,424
  legenddataflowscripts/workflow/__init__.py,sha256=JhudKYhBT8bXtX4LCqxQCHzUiITpugAtFxePWEtphC4,474
- legenddataflowscripts/workflow/execenv.py,sha256=O6Z6EH6Yp0JXnwX2wTzduHC9Q9gu-_d1RuuE2pQ5caE,9061
+ legenddataflowscripts/workflow/execenv.py,sha256=qTG4N9ovEPxA0QtqG0wWUIuK50BZIcYvpVlpy-XgxPw,9257
  legenddataflowscripts/workflow/filedb.py,sha256=rbvOcXUxLbHz177QuDIDAL3aysz-bZDjHOiMsRHssZo,3434
  legenddataflowscripts/workflow/pre_compile_catalog.py,sha256=cEK0KXh-ClSE2Bo9MK471o79XG22bMY5r-2tIihtCfk,790
  legenddataflowscripts/workflow/utils.py,sha256=eKE8KIG2ffynZt9fTbI1SVQV85i3aW9GFGh1Nio1iDo,3118
- legend_dataflow_scripts-0.1.4.dist-info/METADATA,sha256=kCV4uTOiqJBCGvMteN0O5b0YGwLCMrZR8DF3LytqCF4,3122
- legend_dataflow_scripts-0.1.4.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
- legend_dataflow_scripts-0.1.4.dist-info/entry_points.txt,sha256=B197waSm-orA_ZS-9rkxNDsmOHdCn8CbWodnlqXQKRg,1313
- legend_dataflow_scripts-0.1.4.dist-info/top_level.txt,sha256=s8E2chjJNYUbrN6whFG_VCsJKySFp1IOXLcUefA7DB0,22
- legend_dataflow_scripts-0.1.4.dist-info/RECORD,,
+ legend_dataflow_scripts-0.1.6.dist-info/METADATA,sha256=PTXbBwFCBHDbdxQamprkPrSTly1YVydK5y0HUb__9Bk,3122
+ legend_dataflow_scripts-0.1.6.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+ legend_dataflow_scripts-0.1.6.dist-info/entry_points.txt,sha256=B197waSm-orA_ZS-9rkxNDsmOHdCn8CbWodnlqXQKRg,1313
+ legend_dataflow_scripts-0.1.6.dist-info/top_level.txt,sha256=s8E2chjJNYUbrN6whFG_VCsJKySFp1IOXLcUefA7DB0,22
+ legend_dataflow_scripts-0.1.6.dist-info/RECORD,,
@@ -17,5 +17,5 @@ __version__: str
  __version_tuple__: VERSION_TUPLE
  version_tuple: VERSION_TUPLE

- __version__ = version = '0.1.4'
- __version_tuple__ = version_tuple = (0, 1, 4)
+ __version__ = version = '0.1.6'
+ __version_tuple__ = version_tuple = (0, 1, 6)
@@ -23,7 +23,10 @@ from pygama.pargen.dsp_optimize import (
  from ....utils import build_log

  warnings.filterwarnings(action="ignore", category=RuntimeWarning)
- warnings.filterwarnings(action="ignore", category=np.exceptions.RankWarning)
+ try:
+     warnings.filterwarnings(action="ignore", category=np.exceptions.RankWarning)
+ except AttributeError:  # np < 2
+     warnings.filterwarnings(action="ignore", category=np.RankWarning)


  def par_geds_dsp_eopt() -> None:
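The same NumPy-compatibility guard is added here and in ecal.py below: NumPy 2 removed the top-level np.RankWarning alias in favour of np.exceptions.RankWarning, which older NumPy releases may not provide, so the filter now tries the new location first. A minimal standalone sketch of the pattern (not package code):

    import warnings

    import numpy as np

    # Pick RankWarning from wherever the installed NumPy provides it:
    # np.exceptions.RankWarning on recent releases, np.RankWarning on older ones.
    try:
        _rank_warning = np.exceptions.RankWarning
    except AttributeError:  # older NumPy without the np.exceptions namespace
        _rank_warning = np.RankWarning

    warnings.filterwarnings(action="ignore", category=_rank_warning)

    # A rank-deficient polynomial fit would normally emit a RankWarning;
    # with the filter installed it stays silent.
    np.polyfit([1.0, 1.0, 1.0], [2.0, 2.0, 2.0], deg=2)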
@@ -297,6 +297,7 @@ def par_geds_hit_aoe() -> None:
      else:
          aoe = None
          plot_dict = out_plot_dict
+         results_dict = {}

      if args.plot_file:
          common_dict = plot_dict.pop("common") if "common" in list(plot_dict) else None
@@ -33,7 +33,10 @@ mpl.use("agg")
  sto = lh5.LH5Store()

  warnings.filterwarnings(action="ignore", category=RuntimeWarning)
- warnings.filterwarnings(action="ignore", category=np.exceptions.RankWarning)
+ try:
+     warnings.filterwarnings(action="ignore", category=np.exceptions.RankWarning)
+ except AttributeError:  # np < 2
+     warnings.filterwarnings(action="ignore", category=np.RankWarning)


  def plot_2614_timemap(
@@ -485,7 +488,7 @@ def par_geds_hit_ecal() -> None:
          msg = "invalid tier"
          raise ValueError(msg)

-     build_log(config_dict, args.log)
+     log = build_log(config_dict, args.log)

      chmap = LegendMetadata(args.metadata).channelmap(
          args.timestamp, system=args.datatype
@@ -575,14 +578,23 @@ def par_geds_hit_ecal() -> None:
      ):
          e_uncal = data.query(selection_string)[energy_param].to_numpy()

-         hist, bins, bar = pgh.get_hist(
-             e_uncal[
-                 (e_uncal > np.nanpercentile(e_uncal, 95))
-                 & (e_uncal < np.nanpercentile(e_uncal, 99.9))
-             ],
-             dx=1,
-             range=[np.nanpercentile(e_uncal, 95), np.nanpercentile(e_uncal, 99.9)],
-         )
+         if len(e_uncal) > 0:
+             if isinstance(e_uncal[0], np.ndarray | list):
+                 e_uncal = np.concatenate([arr for arr in e_uncal if len(arr) > 0])
+             hist, bins, _ = pgh.get_hist(
+                 e_uncal[
+                     (e_uncal > np.nanpercentile(e_uncal, 95))
+                     & (e_uncal < np.nanpercentile(e_uncal, 99.9))
+                 ],
+                 dx=1,
+                 range=[
+                     np.nanpercentile(e_uncal, 95),
+                     np.nanpercentile(e_uncal, 99.9),
+                 ],
+             )
+         else:
+             msg = f"e_uncal should not be empty! energy_param: {energy_param}"
+             raise ValueError(msg)

          guess = 2614.511 / bins[np.nanargmax(hist)]
          full_object_dict[cal_energy_param] = HPGeCalibration(
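The histogram that seeds the 2614 keV gain guess is now built only after checking that the uncalibrated energy array is non-empty, and ragged input (entries that are themselves arrays of hits) is flattened first. A toy sketch of that flatten-and-check step, independent of the package:

    import numpy as np

    def flatten_energies(e_uncal: np.ndarray) -> np.ndarray:
        # Illustrative helper (not from the package): mirror the new guard in
        # ecal.py. Ragged input is flattened to 1-D; empty input is rejected
        # up front so the percentile selection cannot operate on nothing.
        if len(e_uncal) == 0:
            raise ValueError("e_uncal should not be empty!")
        if isinstance(e_uncal[0], (np.ndarray, list)):
            e_uncal = np.concatenate([arr for arr in e_uncal if len(arr) > 0])
        return e_uncal

    e = flatten_energies(np.array([[1.0, 2.0], [3.0, 4.0, 5.0], []], dtype=object))
    print(e)  # -> [1. 2. 3. 4. 5.]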
@@ -644,8 +656,21 @@ def par_geds_hit_ecal() -> None:
              interp_energy_kev={"Qbb": 2039.0},
          )

+         energy = data[energy_param].to_numpy()
+         if isinstance(energy[0], np.ndarray | list):
+             energy = np.concatenate(energy)
+
+         if len(energy) < len(data):
+             log.warning("len(energy) and len(data) are not the same")
+             energy = np.pad(
+                 energy, (0, len(data) - len(energy)), constant_values=np.nan
+             )
+
+         if len(data) < len(energy):
+             energy = energy[: len(data)]
+
          data[cal_energy_param] = nb_poly(
-             data[energy_param].to_numpy(), full_object_dict[cal_energy_param].pars
+             energy, full_object_dict[cal_energy_param].pars
          )

          results_dict[cal_energy_param] = get_results_dict(
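Before the calibration polynomial is applied, the energy array is now forced to have exactly one entry per dataframe row: ragged input is flattened, a short array is NaN-padded, a long one is truncated. A small illustrative sketch of the same alignment; np.polynomial.polynomial.polyval stands in for the package's nb_poly, and the column names and coefficients are made up:

    import numpy as np
    import pandas as pd

    def align_to_frame(energy: np.ndarray, n_rows: int) -> np.ndarray:
        # One calibrated value per dataframe row: flatten, pad with NaN if
        # short, truncate if long.
        if len(energy) > 0 and isinstance(energy[0], (np.ndarray, list)):
            energy = np.concatenate(energy)
        if len(energy) < n_rows:
            energy = np.pad(energy, (0, n_rows - len(energy)), constant_values=np.nan)
        return energy[:n_rows]

    data = pd.DataFrame({"evt": [0, 1, 2]})
    raw = np.array([1050.0, 1061.5])   # one value short of len(data)
    pars = [0.0, 0.4]                  # hypothetical linear calibration c0 + c1 * adc
    data["e_cal"] = np.polynomial.polynomial.polyval(align_to_frame(raw, len(data)), pars)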
@@ -655,18 +680,32 @@ def par_geds_hit_ecal() -> None:
          hit_dict.update(
              {cal_energy_param: full_object_dict[cal_energy_param].gen_pars_dict()}
          )
-         if "ctc" in cal_energy_param:
-             no_ctc_dict = full_object_dict[cal_energy_param].gen_pars_dict()
-             no_ctc_dict["expression"] = no_ctc_dict["expression"].replace("_ctc", "")
-             hit_dict.update({cal_energy_param.replace("ctc", "noctc"): no_ctc_dict})
-             hit_dict.update(
-                 {
-                     cal_energy_param.replace("_ctc", ""): {
-                         "expression": f"where({cal_energy_param.replace('ctc', 'noctc')}>{kwarg_dict.get('dt_theshold_kev', 100)}, {cal_energy_param}, {cal_energy_param.replace('ctc', 'noctc')})",
-                         "parameters": {},
-                     }
-                 }
-             )
+         if "copy_calibration" in kwarg_dict:
+             for copy_cal_param, _copy_to_cal_param in kwarg_dict[
+                 "copy_calibration"
+             ].items():
+                 if copy_cal_param not in full_object_dict:
+                     msg = f"copy_calibration parameter {copy_cal_param} not found in full_object_dict"
+                     raise ValueError(msg)
+                 if isinstance(_copy_to_cal_param, str):
+                     copy_to_cal_param = [_copy_to_cal_param]
+                 else:
+                     copy_to_cal_param = _copy_to_cal_param
+                 for cal_par in copy_to_cal_param:
+                     if cal_par in full_object_dict:
+                         msg = f"copy_calibration parameter {cal_par} already exists in full_object_dict"
+                         raise ValueError(msg)
+                     copy_dict = {cal_par: full_object_dict[cal_par].gen_pars_dict()}
+                     copy_dict["expression"] = copy_dict[cal_par]["expression"].replace(
+                         copy_cal_param, cal_par
+                     )
+                     hit_dict.update({cal_par: copy_dict[cal_par]})
+         if "extra_blocks" in kwarg_dict:
+             if isinstance(kwarg_dict["extra_blocks"], dict):
+                 kwarg_dict["extra_blocks"] = [kwarg_dict["extra_blocks"]]
+             for extra_block in kwarg_dict["extra_blocks"]:
+                 hit_dict.update(extra_block)
+
          if args.plot_path:
              param_plot_dict = {}
              if ~np.isnan(full_object_dict[cal_energy_param].pars).all():
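The hard-coded ctc/noctc duplication is replaced by two generic hooks read from kwarg_dict: copy_calibration maps an existing calibrated parameter to one or more additional output names, and extra_blocks is a dict (or list of dicts) merged verbatim into hit_dict. A purely illustrative configuration fragment; the parameter names and the expression below are invented and not taken from any LEGEND configuration:

    # Hypothetical kwarg_dict fragment exercising the two new keys.
    kwarg_dict = {
        "copy_calibration": {
            # reuse the calibration derived for one energy estimator under an
            # additional output name (a single string is also accepted)
            "cuspEmax_ctc_cal": ["cuspEmax_ctc_runcal"],
        },
        "extra_blocks": [
            # each block is merged into hit_dict as-is
            {"is_valid_cal": {"expression": "~np.isnan(cuspEmax_ctc_cal)", "parameters": {}}},
        ],
    }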
@@ -295,7 +295,7 @@ def par_geds_hit_lq() -> None:

          data["run_timestamp"] = args.timestamp

-         out_dicts, eres_dicts, plot_dicts, lq_dict = run_lq_calibration(
+         out_dicts, results_dicts, plot_dicts, lq_dict = run_lq_calibration(
              data,
              cal_dicts={args.timestamp: cal_dict},
              results_dicts={args.timestamp: eres_dict},
@@ -305,12 +305,13 @@ def par_geds_hit_lq() -> None:
              debug_mode=args.debug,
          )
          cal_dict = out_dicts[args.timestamp]
-         eres_dict = eres_dicts[args.timestamp]
+         results_dict = results_dicts[args.timestamp]
          plot_dict = plot_dicts[args.timestamp]
          lq = lq_dict[args.timestamp]

      else:
          lq = None
+         results_dict = {}

      if args.plot_file:
          Path(args.plot_file).parent.mkdir(parents=True, exist_ok=True)
@@ -320,7 +321,7 @@ def par_geds_hit_lq() -> None:
      final_hit_dict = convert_dict_np_to_float(
          {
              "pars": {"operations": cal_dict},
-             "results": dict(**ecal_dict["results"], lq=eres_dict),
+             "results": dict(**ecal_dict["results"], lq=results_dict),
          }
      )
      Path(args.hit_pars).parent.mkdir(parents=True, exist_ok=True)
@@ -1,11 +1,35 @@
  from __future__ import annotations

  import json
+ from pathlib import Path

  import h5py


- def alias_table(file, mapping):
+ def convert_parents_to_structs(h5group):
+     if h5group.parent.name != "/" and len(h5group.parent.attrs) == 0:
+         h5group.parent.attrs.update(
+             {"datatype": "struct{" + h5group.name.split("/")[-1] + "}"}
+         )
+     elif (
+         len(h5group.parent.attrs) > 0
+         and h5group.name.split("/")[-1] not in h5group.parent.attrs["datatype"]
+     ):
+         h5group.parent.attrs.update(
+             {
+                 "datatype": h5group.parent.attrs["datatype"][:-1]
+                 + ","
+                 + h5group.name.split("/")[-1]
+                 + "}"
+             }
+         )
+     else:
+         return
+     convert_parents_to_structs(h5group.parent)
+     return
+
+
+ def alias_table(file: str | Path, mapping: str):
      """
      Create an alias table for the given file and mapping.

@@ -13,16 +37,19 @@ def alias_table(file, mapping):
          file (str): Path to the input file.
          mapping (dict): Mapping of current table name and alias table name.

-     Returns:
-         dict: A dictionary containing the alias table.
      """
      if isinstance(mapping, str):
          mapping = json.loads(mapping)
+     if isinstance(mapping, list):
+         for m in mapping:
+             alias_table(file, m)
      with h5py.File(file, "a") as f:
          for raw_id, alias in mapping.items():
              if raw_id in f:
                  if isinstance(alias, list | tuple):
                      for a in alias:
                          f[a] = f[raw_id]
+                         convert_parents_to_structs(f[a])
                  else:
                      f[alias] = f[raw_id]
+                     convert_parents_to_structs(f[alias])
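alias_table now also accepts a list of mappings and, after creating each alias, walks up the parent groups so their LEGEND-style struct{...} datatype attribute lists the new member. A standalone sketch of the two underlying ideas, with made-up group names (an alias is an h5py hard link, and the enclosing group's attribute must mention it):

    import h5py
    import numpy as np

    # Independent illustration, not package code.
    with h5py.File("alias_demo.lh5", "w") as f:
        grp = f.create_group("ch1027200/dsp")
        grp.create_dataset("trapEmax", data=np.arange(5.0))
        f.attrs["datatype"] = "struct{ch1027200}"

        f["det001"] = f["ch1027200"]                      # hard link: same data, second name
        f.attrs["datatype"] = "struct{ch1027200,det001}"  # register the alias in the parent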
@@ -24,7 +24,7 @@ def convert_dict_np_to_float(dic: dict) -> dict:
              convert_dict_np_to_float(value)
          elif isinstance(value, np.float32 | np.float64):
              dic[key] = float(value)
-         elif isinstance(dic[key], Sequence):
+         elif isinstance(dic[key], Sequence) and not isinstance(dic[key], str):
              dic[key] = [
                  float(x) if isinstance(x, np.float32 | np.float64) else x for x in value
              ]
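The added guard matters because str is itself a collections.abc.Sequence, so the list branch would previously decompose string values into lists of characters. A minimal sketch showing why the check is needed:

    from collections.abc import Sequence

    import numpy as np

    def to_float(value):
        # str is a Sequence; without the extra check the comprehension below
        # would turn "keV" into ['k', 'e', 'V'].
        if isinstance(value, Sequence) and not isinstance(value, str):
            return [float(x) if isinstance(x, (np.float32, np.float64)) else x for x in value]
        return value

    assert to_float([np.float32(1.5), "a"]) == [1.5, "a"]
    assert to_float("keV") == "keV"  # strings are left untouched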
@@ -316,10 +316,16 @@ def cmdexec(args) -> None:
      )
      config_dict["execenv"] = config_dict["execenv"][args.system]

+     exe_path = Path(config_dict.paths.install).resolve() / "bin"
+
      cmd_prefix, cmd_env = execenv_prefix(config_dict, as_string=False)
      cmd_expr = [*cmd_prefix, *args.command]

      msg = "running: " + _execenv2str(cmd_expr, cmd_env)
      log.debug(msg)

-     subprocess.run(cmd_expr, env=os.environ | cmd_env, check=True)
+     env_dict = os.environ | cmd_env
+     env_dict["PATH"] = (
+         f"{exe_path}:{env_dict['PATH']}"  # prepend the virtualenv bin dir
+     )
+     subprocess.run(cmd_expr, env=env_dict, check=True)
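cmdexec now prepends the managed install's bin directory to PATH before launching the subprocess, so executables installed there shadow system ones. A generic sketch of the pattern, with a hypothetical install prefix standing in for config_dict.paths.install (assumes a python executable is on PATH):

    import os
    import subprocess
    from pathlib import Path

    install_prefix = Path("/tmp/legend-env")   # hypothetical install prefix
    exe_path = install_prefix.resolve() / "bin"

    env = os.environ.copy()
    env["PATH"] = f"{exe_path}:{env['PATH']}"  # managed bin dir wins over system PATH

    subprocess.run(["python", "--version"], env=env, check=True)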