PyPI - smftools - Versions diffs - 0.2.4__py3-none-any.whl → 0.3.0__py3-none-any.whl - Mend

smftools 0.2.4__py3-none-any.whl → 0.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (181) hide show

smftools/__init__.py +43 -13
smftools/_settings.py +6 -6
smftools/_version.py +3 -1
smftools/cli/__init__.py +1 -0
smftools/cli/archived/cli_flows.py +2 -0
smftools/cli/helpers.py +9 -1
smftools/cli/hmm_adata.py +905 -242
smftools/cli/load_adata.py +432 -280
smftools/cli/preprocess_adata.py +287 -171
smftools/cli/spatial_adata.py +141 -53
smftools/cli_entry.py +119 -178
smftools/config/__init__.py +3 -1
smftools/config/conversion.yaml +5 -1
smftools/config/deaminase.yaml +1 -1
smftools/config/default.yaml +26 -18
smftools/config/direct.yaml +8 -3
smftools/config/discover_input_files.py +19 -5
smftools/config/experiment_config.py +511 -276
smftools/constants.py +37 -0
smftools/datasets/__init__.py +4 -8
smftools/datasets/datasets.py +32 -18
smftools/hmm/HMM.py +2133 -1428
smftools/hmm/__init__.py +24 -14
smftools/hmm/archived/apply_hmm_batched.py +2 -0
smftools/hmm/archived/calculate_distances.py +2 -0
smftools/hmm/archived/call_hmm_peaks.py +18 -1
smftools/hmm/archived/train_hmm.py +2 -0
smftools/hmm/call_hmm_peaks.py +176 -193
smftools/hmm/display_hmm.py +23 -7
smftools/hmm/hmm_readwrite.py +20 -6
smftools/hmm/nucleosome_hmm_refinement.py +104 -14
smftools/informatics/__init__.py +55 -13
smftools/informatics/archived/bam_conversion.py +2 -0
smftools/informatics/archived/bam_direct.py +2 -0
smftools/informatics/archived/basecall_pod5s.py +2 -0
smftools/informatics/archived/basecalls_to_adata.py +2 -0
smftools/informatics/archived/conversion_smf.py +2 -0
smftools/informatics/archived/deaminase_smf.py +1 -0
smftools/informatics/archived/direct_smf.py +2 -0
smftools/informatics/archived/fast5_to_pod5.py +2 -0
smftools/informatics/archived/helpers/archived/__init__.py +2 -0
smftools/informatics/archived/helpers/archived/align_and_sort_BAM.py +16 -1
smftools/informatics/archived/helpers/archived/aligned_BAM_to_bed.py +2 -0
smftools/informatics/archived/helpers/archived/bam_qc.py +14 -1
smftools/informatics/archived/helpers/archived/bed_to_bigwig.py +2 -0
smftools/informatics/archived/helpers/archived/canoncall.py +2 -0
smftools/informatics/archived/helpers/archived/concatenate_fastqs_to_bam.py +8 -1
smftools/informatics/archived/helpers/archived/converted_BAM_to_adata.py +2 -0
smftools/informatics/archived/helpers/archived/count_aligned_reads.py +2 -0
smftools/informatics/archived/helpers/archived/demux_and_index_BAM.py +2 -0
smftools/informatics/archived/helpers/archived/extract_base_identities.py +2 -0
smftools/informatics/archived/helpers/archived/extract_mods.py +2 -0
smftools/informatics/archived/helpers/archived/extract_read_features_from_bam.py +2 -0
smftools/informatics/archived/helpers/archived/extract_read_lengths_from_bed.py +2 -0
smftools/informatics/archived/helpers/archived/extract_readnames_from_BAM.py +2 -0
smftools/informatics/archived/helpers/archived/find_conversion_sites.py +2 -0
smftools/informatics/archived/helpers/archived/generate_converted_FASTA.py +2 -0
smftools/informatics/archived/helpers/archived/get_chromosome_lengths.py +2 -0
smftools/informatics/archived/helpers/archived/get_native_references.py +2 -0
smftools/informatics/archived/helpers/archived/index_fasta.py +2 -0
smftools/informatics/archived/helpers/archived/informatics.py +2 -0
smftools/informatics/archived/helpers/archived/load_adata.py +5 -3
smftools/informatics/archived/helpers/archived/make_modbed.py +2 -0
smftools/informatics/archived/helpers/archived/modQC.py +2 -0
smftools/informatics/archived/helpers/archived/modcall.py +2 -0
smftools/informatics/archived/helpers/archived/ohe_batching.py +2 -0
smftools/informatics/archived/helpers/archived/ohe_layers_decode.py +2 -0
smftools/informatics/archived/helpers/archived/one_hot_decode.py +2 -0
smftools/informatics/archived/helpers/archived/one_hot_encode.py +2 -0
smftools/informatics/archived/helpers/archived/plot_bed_histograms.py +5 -1
smftools/informatics/archived/helpers/archived/separate_bam_by_bc.py +2 -0
smftools/informatics/archived/helpers/archived/split_and_index_BAM.py +2 -0
smftools/informatics/archived/print_bam_query_seq.py +9 -1
smftools/informatics/archived/subsample_fasta_from_bed.py +2 -0
smftools/informatics/archived/subsample_pod5.py +2 -0
smftools/informatics/bam_functions.py +1059 -269
smftools/informatics/basecalling.py +53 -9
smftools/informatics/bed_functions.py +357 -114
smftools/informatics/binarize_converted_base_identities.py +21 -7
smftools/informatics/complement_base_list.py +9 -6
smftools/informatics/converted_BAM_to_adata.py +324 -137
smftools/informatics/fasta_functions.py +251 -89
smftools/informatics/h5ad_functions.py +202 -30
smftools/informatics/modkit_extract_to_adata.py +623 -274
smftools/informatics/modkit_functions.py +87 -44
smftools/informatics/ohe.py +46 -21
smftools/informatics/pod5_functions.py +114 -74
smftools/informatics/run_multiqc.py +20 -14
smftools/logging_utils.py +51 -0
smftools/machine_learning/__init__.py +23 -12
smftools/machine_learning/data/__init__.py +2 -0
smftools/machine_learning/data/anndata_data_module.py +157 -50
smftools/machine_learning/data/preprocessing.py +4 -1
smftools/machine_learning/evaluation/__init__.py +3 -1
smftools/machine_learning/evaluation/eval_utils.py +13 -14
smftools/machine_learning/evaluation/evaluators.py +52 -34
smftools/machine_learning/inference/__init__.py +3 -1
smftools/machine_learning/inference/inference_utils.py +9 -4
smftools/machine_learning/inference/lightning_inference.py +14 -13
smftools/machine_learning/inference/sklearn_inference.py +8 -8
smftools/machine_learning/inference/sliding_window_inference.py +37 -25
smftools/machine_learning/models/__init__.py +12 -5
smftools/machine_learning/models/base.py +34 -43
smftools/machine_learning/models/cnn.py +22 -13
smftools/machine_learning/models/lightning_base.py +78 -42
smftools/machine_learning/models/mlp.py +18 -5
smftools/machine_learning/models/positional.py +10 -4
smftools/machine_learning/models/rnn.py +8 -3
smftools/machine_learning/models/sklearn_models.py +46 -24
smftools/machine_learning/models/transformer.py +75 -55
smftools/machine_learning/models/wrappers.py +8 -3
smftools/machine_learning/training/__init__.py +4 -2
smftools/machine_learning/training/train_lightning_model.py +42 -23
smftools/machine_learning/training/train_sklearn_model.py +11 -15
smftools/machine_learning/utils/__init__.py +3 -1
smftools/machine_learning/utils/device.py +12 -5
smftools/machine_learning/utils/grl.py +8 -2
smftools/metadata.py +443 -0
smftools/optional_imports.py +31 -0
smftools/plotting/__init__.py +32 -17
smftools/plotting/autocorrelation_plotting.py +153 -48
smftools/plotting/classifiers.py +175 -73
smftools/plotting/general_plotting.py +350 -168
smftools/plotting/hmm_plotting.py +53 -14
smftools/plotting/position_stats.py +155 -87
smftools/plotting/qc_plotting.py +25 -12
smftools/preprocessing/__init__.py +35 -37
smftools/preprocessing/append_base_context.py +105 -79
smftools/preprocessing/append_binary_layer_by_base_context.py +75 -37
smftools/preprocessing/{archives → archived}/add_read_length_and_mapping_qc.py +2 -0
smftools/preprocessing/{archives → archived}/calculate_complexity.py +5 -1
smftools/preprocessing/{archives → archived}/mark_duplicates.py +2 -0
smftools/preprocessing/{archives → archived}/preprocessing.py +10 -6
smftools/preprocessing/{archives → archived}/remove_duplicates.py +2 -0
smftools/preprocessing/binarize.py +21 -4
smftools/preprocessing/binarize_on_Youden.py +127 -31
smftools/preprocessing/binary_layers_to_ohe.py +18 -11
smftools/preprocessing/calculate_complexity_II.py +89 -59
smftools/preprocessing/calculate_consensus.py +28 -19
smftools/preprocessing/calculate_coverage.py +44 -22
smftools/preprocessing/calculate_pairwise_differences.py +4 -1
smftools/preprocessing/calculate_pairwise_hamming_distances.py +7 -3
smftools/preprocessing/calculate_position_Youden.py +110 -55
smftools/preprocessing/calculate_read_length_stats.py +52 -23
smftools/preprocessing/calculate_read_modification_stats.py +91 -57
smftools/preprocessing/clean_NaN.py +38 -28
smftools/preprocessing/filter_adata_by_nan_proportion.py +24 -12
smftools/preprocessing/filter_reads_on_length_quality_mapping.py +72 -37
smftools/preprocessing/filter_reads_on_modification_thresholds.py +183 -73
smftools/preprocessing/flag_duplicate_reads.py +708 -303
smftools/preprocessing/invert_adata.py +26 -11
smftools/preprocessing/load_sample_sheet.py +40 -22
smftools/preprocessing/make_dirs.py +9 -3
smftools/preprocessing/min_non_diagonal.py +4 -1
smftools/preprocessing/recipes.py +58 -23
smftools/preprocessing/reindex_references_adata.py +93 -27
smftools/preprocessing/subsample_adata.py +33 -16
smftools/readwrite.py +264 -109
smftools/schema/__init__.py +11 -0
smftools/schema/anndata_schema_v1.yaml +227 -0
smftools/tools/__init__.py +25 -18
smftools/tools/archived/apply_hmm.py +2 -0
smftools/tools/archived/classifiers.py +165 -0
smftools/tools/archived/classify_methylated_features.py +2 -0
smftools/tools/archived/classify_non_methylated_features.py +2 -0
smftools/tools/archived/subset_adata_v1.py +12 -1
smftools/tools/archived/subset_adata_v2.py +14 -1
smftools/tools/calculate_umap.py +56 -15
smftools/tools/cluster_adata_on_methylation.py +122 -47
smftools/tools/general_tools.py +70 -25
smftools/tools/position_stats.py +220 -99
smftools/tools/read_stats.py +50 -29
smftools/tools/spatial_autocorrelation.py +365 -192
smftools/tools/subset_adata.py +23 -21
smftools-0.3.0.dist-info/METADATA +147 -0
smftools-0.3.0.dist-info/RECORD +182 -0
smftools-0.2.4.dist-info/METADATA +0 -141
smftools-0.2.4.dist-info/RECORD +0 -176
{smftools-0.2.4.dist-info → smftools-0.3.0.dist-info}/WHEEL +0 -0
{smftools-0.2.4.dist-info → smftools-0.3.0.dist-info}/entry_points.txt +0 -0
{smftools-0.2.4.dist-info → smftools-0.3.0.dist-info}/licenses/LICENSE +0 -0

smftools/plotting/autocorrelation_plotting.py CHANGED Viewed

@@ -1,5 +1,13 @@
+from __future__ import annotations
 from typing import Optional
+import numpy as np
+import pandas as pd
+from smftools.optional_imports import require
 def plot_spatial_autocorr_grid(
     adata,
     out_dir: str,
@@ -14,6 +22,7 @@ def plot_spatial_autocorr_grid(
     references: Optional[list] = None,
     annotate_periodicity: bool = True,
     counts_key_suffix: str = "_counts",
+    normalization_method: str = "pearson",
     # plotting thresholds
     plot_min_count: int = 10,
 ):
@@ -28,14 +37,15 @@ def plot_spatial_autocorr_grid(
     fall back to running the analyzer for that group (slow) and cache the result into adata.uns.
     """
     import os
-    import numpy as np
-    import pandas as pd
-    import matplotlib.pyplot as plt
     import warnings
+    plt = require("matplotlib.pyplot", extra="plotting", purpose="autocorrelation plots")
     # Try importing analyzer (used only as fallback)
     try:
-        from ..tools.spatial_autocorrelation import analyze_autocorr_matrix  # prefer packaged analyzer
+        from ..tools.spatial_autocorrelation import (
+            analyze_autocorr_matrix,
+        )  # prefer packaged analyzer
     except Exception:
         analyze_autocorr_matrix = globals().get("analyze_autocorr_matrix", None)
@@ -44,6 +54,7 @@ def plot_spatial_autocorr_grid(
     # small rolling average helper for smoother visualization
     def _rolling_1d(arr: np.ndarray, win: int) -> np.ndarray:
+        """Compute a rolling mean with NaN-aware normalization."""
         if win <= 1:
             return arr
         valid = np.isfinite(arr).astype(float)
@@ -58,6 +69,7 @@ def plot_spatial_autocorr_grid(
     # group summary extractor: returns (lags, mean_curve_smoothed, std_curve_smoothed, counts_block_or_None)
     def _compute_group_summary_for_mask(site: str, mask: np.ndarray):
+        """Extract summary curves for a site and mask."""
         obsm_key = f"{site}_spatial_autocorr"
         lags_key = f"{site}_spatial_autocorr_lags"
         counts_key = f"{site}_spatial_autocorr{counts_key_suffix}"
@@ -75,7 +87,12 @@ def plot_spatial_autocorr_grid(
         if counts_key in adata.obsm:
             counts_mat = np.asarray(adata.obsm[counts_key])
             counts = counts_mat[mask, :].astype(int)
-        return np.asarray(adata.uns[lags_key]), _rolling_1d(mean_per_lag, window), _rolling_1d(std_per_lag, window), counts
+        return (
+            np.asarray(adata.uns[lags_key]),
+            _rolling_1d(mean_per_lag, window),
+            _rolling_1d(std_per_lag, window),
+            counts,
+        )
     # samples meta
     if sample_col not in adata.obs:
@@ -116,7 +133,8 @@ def plot_spatial_autocorr_grid(
         nrows = len(chunk)
         fig, axes = plt.subplots(
-            nrows=nrows, ncols=ncols,
+            nrows=nrows,
+            ncols=ncols,
             figsize=(4.2 * ncols, 2.4 * nrows),
             dpi=dpi,
             squeeze=False,
@@ -141,9 +159,9 @@ def plot_spatial_autocorr_grid(
                     ax = axes[r, col_idx]
                     # compute mask
-                    sample_mask = (adata.obs[sample_col].values == sample_name)
+                    sample_mask = adata.obs[sample_col].values == sample_name
                     if col_kind == "ref":
-                        ref_mask = (adata.obs[reference_col].values == col_val)
+                        ref_mask = adata.obs[reference_col].values == col_val
                         mask = sample_mask & ref_mask
                     else:
                         mask = sample_mask
@@ -152,7 +170,9 @@ def plot_spatial_autocorr_grid(
                     n_reads_grp = int(mask.sum())
                     # group summary (mean/std and counts_block)
-                    lags_local, mean_curve, std_curve, counts_block = _compute_group_summary_for_mask(site, mask)
+                    lags_local, mean_curve, std_curve, counts_block = (
+                        _compute_group_summary_for_mask(site, mask)
+                    )
                     # plot title for top row
                     if r == 0:
@@ -164,9 +184,12 @@ def plot_spatial_autocorr_grid(
                         ax.text(0.5, 0.5, "No data", ha="center", va="center", fontsize=8)
                         ax.set_xlim(0, 1)
                         ax.set_xlabel("Lag (bp)", fontsize=7)
-                        ax.tick_params(axis='both', which='major', labelsize=6)
+                        ax.set_ylabel(
+                            f"Autocorrelation {normalization_method} normalized", fontsize=7
+                        )
+                        ax.tick_params(axis="both", which="major", labelsize=6)
                         ax.grid(True, alpha=0.22)
-                        #col_idx += 1
+                        # col_idx += 1
                         continue
                     # mask low-support lags if counts available
@@ -186,7 +209,13 @@ def plot_spatial_autocorr_grid(
                         # plot a faint grey line for the low-support regions (context only)
                         if low_support.any():
-                            ax.plot(lags_local[low_support], mean_curve_smooth[low_support], color="0.85", lw=0.6, label="_nolegend_")
+                            ax.plot(
+                                lags_local[low_support],
+                                mean_curve_smooth[low_support],
+                                color="0.85",
+                                lw=0.6,
+                                label="_nolegend_",
+                            )
                     # plot mean (high-support only) and +/- std (std is computed from all molecules)
                     ax.plot(lags_local, mean_plot, lw=1.1)
@@ -201,16 +230,25 @@ def plot_spatial_autocorr_grid(
                         # metrics_by_group_precomp can be dict-like
                         res = metrics_by_group_precomp.get(group_key, None)
-                    if res is None and annotate_periodicity and (analyze_autocorr_matrix is not None) and (ac_full is not None):
+                    if (
+                        res is None
+                        and annotate_periodicity
+                        and (analyze_autocorr_matrix is not None)
+                        and (ac_full is not None)
+                    ):
                         # fallback: run analyzer on the subset (warn + cache)
                         ac_sel = ac_full[mask, :]
                         cnt_sel = counts_full[mask, :] if counts_full is not None else None
                         if ac_sel.size:
-                            warnings.warn(f"Precomputed periodicity metrics for {site} {group_key} not found — running analyzer as fallback (slow).")
+                            warnings.warn(
+                                f"Precomputed periodicity metrics for {site} {group_key} not found — running analyzer as fallback (slow)."
+                            )
                             try:
                                 res = analyze_autocorr_matrix(
                                     ac_sel,
-                                    cnt_sel if cnt_sel is not None else np.zeros_like(ac_sel, dtype=int),
+                                    cnt_sel
+                                    if cnt_sel is not None
+                                    else np.zeros_like(ac_sel, dtype=int),
                                     lags_local,
                                     nrl_search_bp=(120, 260),
                                     pad_factor=4,
@@ -239,19 +277,38 @@ def plot_spatial_autocorr_grid(
                         # vertical NRL line & harmonics (safe check)
                         if (nrl is not None) and np.isfinite(nrl):
-                            ax.axvline(float(nrl), color="C3", linestyle="--", linewidth=1.0, alpha=0.9)
+                            ax.axvline(
+                                float(nrl), color="C3", linestyle="--", linewidth=1.0, alpha=0.9
+                            )
                             for m in range(2, 5):
-                                ax.axvline(float(nrl) * m, color="C3", linestyle=":", linewidth=0.7, alpha=0.6)
+                                ax.axvline(
+                                    float(nrl) * m,
+                                    color="C3",
+                                    linestyle=":",
+                                    linewidth=0.7,
+                                    alpha=0.6,
+                                )
                         # envelope points + fitted exponential
                         if sample_lags.size:
                             ax.scatter(sample_lags, envelope_heights, s=18, color="C2")
-                            if (xi_val is not None) and np.isfinite(xi_val) and np.isfinite(res.get("xi_A", np.nan)):
+                            if (
+                                (xi_val is not None)
+                                and np.isfinite(xi_val)
+                                and np.isfinite(res.get("xi_A", np.nan))
+                            ):
                                 A = float(res.get("xi_A", np.nan))
                                 xi_val = float(xi_val)
                                 env_x = np.linspace(np.min(sample_lags), np.max(sample_lags), 200)
                                 env_y = A * np.exp(-env_x / xi_val)
-                                ax.plot(env_x, env_y, linestyle="--", color="C2", linewidth=1.0, alpha=0.9)
+                                ax.plot(
+                                    env_x,
+                                    env_y,
+                                    linestyle="--",
+                                    color="C2",
+                                    linewidth=1.0,
+                                    alpha=0.9,
+                                )
                         # inset PSD plotted vs NRL (linear x-axis)
                         freqs = res.get("freqs", None)
@@ -266,7 +323,12 @@ def plot_spatial_autocorr_grid(
                                 nrl_vals = 1.0 / freqs[valid]  # convert freq -> NRL (bp)
                                 inset.plot(nrl_vals, power[valid], lw=0.7)
                                 if peak_f is not None and peak_f > 0:
-                                    inset.axvline(1.0 / float(peak_f), color="C3", linestyle="--", linewidth=0.8)
+                                    inset.axvline(
+                                        1.0 / float(peak_f),
+                                        color="C3",
+                                        linestyle="--",
+                                        linewidth=0.8,
+                                    )
                                 # choose a reasonable linear x-limits (prefer typical NRL range but fallback to data)
                                 default_xlim = (60, 400)
                                 data_xlim = (float(np.nanmin(nrl_vals)), 600)
@@ -278,17 +340,29 @@ def plot_spatial_autocorr_grid(
                                 inset.set_ylabel("power", fontsize=6)
                                 inset.tick_params(labelsize=6)
                                 if (snr is not None) and np.isfinite(snr):
-                                    inset.text(0.95, 0.95, f"SNR={float(snr):.1f}", transform=inset.transAxes,
-                                            ha="right", va="top", fontsize=6, bbox=dict(facecolor="white", alpha=0.6, edgecolor="none"))
+                                    inset.text(
+                                        0.95,
+                                        0.95,
+                                        f"SNR={float(snr):.1f}",
+                                        transform=inset.transAxes,
+                                        ha="right",
+                                        va="top",
+                                        fontsize=6,
+                                        bbox=dict(facecolor="white", alpha=0.6, edgecolor="none"),
+                                    )
                     # set x-limits based on finite lags
                     finite_mask = np.isfinite(lags_local)
                     if finite_mask.any():
-                        ax.set_xlim(float(np.nanmin(lags_local[finite_mask])), float(np.nanmax(lags_local[finite_mask])))
+                        ax.set_xlim(
+                            float(np.nanmin(lags_local[finite_mask])),
+                            float(np.nanmax(lags_local[finite_mask])),
+                        )
                     # small cosmetics
                     ax.set_xlabel("Lag (bp)", fontsize=7)
-                    ax.tick_params(axis='both', which='major', labelsize=6)
+                    ax.set_ylabel(f"Autocorrelation {normalization_method} normalized", fontsize=7)
+                    ax.tick_params(axis="both", which="major", labelsize=6)
                     ax.grid(True, alpha=0.22)
                 col_idx += 1
@@ -301,9 +375,13 @@ def plot_spatial_autocorr_grid(
             ycenter = pos.y0 + pos.height / 2.0
             n_reads_grp = int((adata.obs[sample_col].values == sample_name).sum())
             label = f"{sample_name}\n(n={n_reads_grp})"
-            fig.text(0.02, ycenter, label, va='center', ha='left', rotation='vertical', fontsize=9)
+            fig.text(0.02, ycenter, label, va="center", ha="left", rotation="vertical", fontsize=9)
-        fig.suptitle("Spatial autocorrelation by sample × (site_type × reference)", y=0.995, fontsize=11)
+        fig.suptitle(
+            f"Spatial autocorrelation ({normalization_method}) by sample × (site_type × reference)",
+            y=0.995,
+            fontsize=11,
+        )
         page_idx = start_idx // rows_per_fig + 1
         out_png = os.path.join(out_dir, f"{filename_prefix}_page{page_idx}.png")
@@ -365,6 +443,7 @@ def plot_spatial_autocorr_grid(
                     return arr.tolist()
                 def _safe_float(x):
+                    """Coerce a value to float, returning NaN on failure."""
                     try:
                         return float(x)
                     except Exception:
@@ -381,15 +460,33 @@ def plot_spatial_autocorr_grid(
                     "site": site,
                     "sample": sample_name,
                     "reference": ref,
-                    "nrl_bp": _safe_float(entry.get("nrl_bp", float("nan"))) if entry is not None else float("nan"),
-                    "snr": _safe_float(entry.get("snr", float("nan"))) if entry is not None else float("nan"),
-                    "fwhm_bp": _safe_float(entry.get("fwhm_bp", float("nan"))) if entry is not None else float("nan"),
-                    "xi": _safe_float(entry.get("xi", float("nan"))) if entry is not None else float("nan"),
-                    "xi_A": _safe_float(entry.get("xi_A", float("nan"))) if entry is not None else float("nan"),
-                    "xi_r2": _safe_float(entry.get("xi_r2", float("nan"))) if entry is not None else float("nan"),
-                    "envelope_sample_lags": ";".join(map(str, env_lags_list)) if len(env_lags_list) else "",
-                    "envelope_heights": ";".join(map(str, env_heights_list)) if len(env_heights_list) else "",
-                    "analyzer_error": entry.get("error", entry.get("analyzer_error", None)) if entry is not None else "no_metrics",
+                    "nrl_bp": _safe_float(entry.get("nrl_bp", float("nan")))
+                    if entry is not None
+                    else float("nan"),
+                    "snr": _safe_float(entry.get("snr", float("nan")))
+                    if entry is not None
+                    else float("nan"),
+                    "fwhm_bp": _safe_float(entry.get("fwhm_bp", float("nan")))
+                    if entry is not None
+                    else float("nan"),
+                    "xi": _safe_float(entry.get("xi", float("nan")))
+                    if entry is not None
+                    else float("nan"),
+                    "xi_A": _safe_float(entry.get("xi_A", float("nan")))
+                    if entry is not None
+                    else float("nan"),
+                    "xi_r2": _safe_float(entry.get("xi_r2", float("nan")))
+                    if entry is not None
+                    else float("nan"),
+                    "envelope_sample_lags": ";".join(map(str, env_lags_list))
+                    if len(env_lags_list)
+                    else "",
+                    "envelope_heights": ";".join(map(str, env_heights_list))
+                    if len(env_heights_list)
+                    else "",
+                    "analyzer_error": entry.get("error", entry.get("analyzer_error", None))
+                    if entry is not None
+                    else "no_metrics",
                 }
                 rows.append(row)
                 combined_rows.append(row)
@@ -404,6 +501,7 @@ def plot_spatial_autocorr_grid(
             except Exception as e:
                 # don't fail the whole pipeline for a single write error; log and continue
                 import warnings
                 warnings.warn(f"Failed to write {out_csv}: {e}")
     # write the single combined CSV (one row per sample x ref x site)
@@ -413,16 +511,19 @@ def plot_spatial_autocorr_grid(
         combined_df.to_csv(combined_out, index=False)
     except Exception as e:
         import warnings
         warnings.warn(f"Failed to write combined CSV {combined_out}: {e}")
     return saved_pages
 def plot_rolling_metrics(df, out_png=None, title=None, figsize=(10, 3.5), dpi=160, show=False):
     """
     Plot NRL and SNR vs window center from the dataframe returned by rolling_autocorr_metrics.
     If out_png is None, returns the matplotlib Figure object; otherwise saves PNG and returns path.
     """
-    import matplotlib.pyplot as plt
+    plt = require("matplotlib.pyplot", extra="plotting", purpose="autocorrelation plots")
     # sort by center
     df2 = df.sort_values("center")
     x = df2["center"].values
@@ -446,16 +547,16 @@ def plot_rolling_metrics(df, out_png=None, title=None, figsize=(10, 3.5), dpi=16
     if out_png:
         fig.savefig(out_png, bbox_inches="tight")
         if not show:
-            import matplotlib
+            matplotlib = require("matplotlib", extra="plotting", purpose="autocorrelation plots")
             matplotlib.pyplot.close(fig)
         return out_png
     if not show:
-        import matplotlib
+        matplotlib = require("matplotlib", extra="plotting", purpose="autocorrelation plots")
         matplotlib.pyplot.close(fig)
     return fig
-import numpy as np
-import pandas as pd
 def plot_rolling_grid(
     rolling_dict,
@@ -502,10 +603,8 @@ def plot_rolling_grid(
     pages_by_metric : dict mapping metric -> [out_png_paths]
     """
     import os
-    import math
-    import matplotlib.pyplot as plt
-    import numpy as np
-    import pandas as pd
+    plt = require("matplotlib.pyplot", extra="plotting", purpose="autocorrelation plots")
     if per_metric_ylim is None:
         per_metric_ylim = {}
@@ -520,7 +619,7 @@ def plot_rolling_grid(
     # normalize reference labels and keep mapping to original
     label_to_orig = {}
-    for (_sample, ref) in keys:
+    for _sample, ref in keys:
         label = "all" if (ref is None) else str(ref)
         if label not in label_to_orig:
             label_to_orig[label] = ref
@@ -532,7 +631,11 @@ def plot_rolling_grid(
     # reference labels ordering
     default_ref_labels = sorted(label_to_orig.keys(), key=lambda s: s)
     if reference_order is not None:
-        ref_labels = [("all" if r is None else str(r)) for r in reference_order if (("all" if r is None else str(r)) in label_to_orig)]
+        ref_labels = [
+            ("all" if r is None else str(r))
+            for r in reference_order
+            if (("all" if r is None else str(r)) in label_to_orig)
+        ]
     else:
         ref_labels = default_ref_labels
@@ -553,9 +656,11 @@ def plot_rolling_grid(
             nrows = len(page_samples)
             fig, axes = plt.subplots(
-                nrows=nrows, ncols=cols_per_page,
+                nrows=nrows,
+                ncols=cols_per_page,
                 figsize=(figsize_per_panel[0] * cols_per_page, figsize_per_panel[1] * nrows),
-                dpi=dpi, squeeze=False
+                dpi=dpi,
+                squeeze=False,
             )
             for i, sample in enumerate(page_samples):

smftools 0.2.4__py3-none-any.whl → 0.3.0__py3-none-any.whl

smftools 0.2.4__py3-none-any.whl → 0.3.0__py3-none-any.whl