smftools 0.2.3__py3-none-any.whl → 0.2.5__py3-none-any.whl
This diff shows the changes between two publicly released versions of the package, as they appear in their public registry. It is provided for informational purposes only.
- smftools/__init__.py +6 -8
- smftools/_settings.py +4 -6
- smftools/_version.py +1 -1
- smftools/cli/helpers.py +54 -0
- smftools/cli/hmm_adata.py +937 -256
- smftools/cli/load_adata.py +448 -268
- smftools/cli/preprocess_adata.py +469 -263
- smftools/cli/spatial_adata.py +536 -319
- smftools/cli_entry.py +97 -182
- smftools/config/__init__.py +1 -1
- smftools/config/conversion.yaml +17 -6
- smftools/config/deaminase.yaml +12 -10
- smftools/config/default.yaml +142 -33
- smftools/config/direct.yaml +11 -3
- smftools/config/discover_input_files.py +19 -5
- smftools/config/experiment_config.py +594 -264
- smftools/constants.py +37 -0
- smftools/datasets/__init__.py +2 -8
- smftools/datasets/datasets.py +32 -18
- smftools/hmm/HMM.py +2128 -1418
- smftools/hmm/__init__.py +2 -9
- smftools/hmm/archived/call_hmm_peaks.py +121 -0
- smftools/hmm/call_hmm_peaks.py +299 -91
- smftools/hmm/display_hmm.py +19 -6
- smftools/hmm/hmm_readwrite.py +13 -4
- smftools/hmm/nucleosome_hmm_refinement.py +102 -14
- smftools/informatics/__init__.py +30 -7
- smftools/informatics/archived/helpers/archived/align_and_sort_BAM.py +14 -1
- smftools/informatics/archived/helpers/archived/bam_qc.py +14 -1
- smftools/informatics/archived/helpers/archived/concatenate_fastqs_to_bam.py +8 -1
- smftools/informatics/archived/helpers/archived/load_adata.py +3 -3
- smftools/informatics/archived/helpers/archived/plot_bed_histograms.py +3 -1
- smftools/informatics/archived/print_bam_query_seq.py +7 -1
- smftools/informatics/bam_functions.py +397 -175
- smftools/informatics/basecalling.py +51 -9
- smftools/informatics/bed_functions.py +90 -57
- smftools/informatics/binarize_converted_base_identities.py +18 -7
- smftools/informatics/complement_base_list.py +7 -6
- smftools/informatics/converted_BAM_to_adata.py +265 -122
- smftools/informatics/fasta_functions.py +161 -83
- smftools/informatics/h5ad_functions.py +196 -30
- smftools/informatics/modkit_extract_to_adata.py +609 -270
- smftools/informatics/modkit_functions.py +85 -44
- smftools/informatics/ohe.py +44 -21
- smftools/informatics/pod5_functions.py +112 -73
- smftools/informatics/run_multiqc.py +20 -14
- smftools/logging_utils.py +51 -0
- smftools/machine_learning/__init__.py +2 -7
- smftools/machine_learning/data/anndata_data_module.py +143 -50
- smftools/machine_learning/data/preprocessing.py +2 -1
- smftools/machine_learning/evaluation/__init__.py +1 -1
- smftools/machine_learning/evaluation/eval_utils.py +11 -14
- smftools/machine_learning/evaluation/evaluators.py +46 -33
- smftools/machine_learning/inference/__init__.py +1 -1
- smftools/machine_learning/inference/inference_utils.py +7 -4
- smftools/machine_learning/inference/lightning_inference.py +9 -13
- smftools/machine_learning/inference/sklearn_inference.py +6 -8
- smftools/machine_learning/inference/sliding_window_inference.py +35 -25
- smftools/machine_learning/models/__init__.py +10 -5
- smftools/machine_learning/models/base.py +28 -42
- smftools/machine_learning/models/cnn.py +15 -11
- smftools/machine_learning/models/lightning_base.py +71 -40
- smftools/machine_learning/models/mlp.py +13 -4
- smftools/machine_learning/models/positional.py +3 -2
- smftools/machine_learning/models/rnn.py +3 -2
- smftools/machine_learning/models/sklearn_models.py +39 -22
- smftools/machine_learning/models/transformer.py +68 -53
- smftools/machine_learning/models/wrappers.py +2 -1
- smftools/machine_learning/training/__init__.py +2 -2
- smftools/machine_learning/training/train_lightning_model.py +29 -20
- smftools/machine_learning/training/train_sklearn_model.py +9 -15
- smftools/machine_learning/utils/__init__.py +1 -1
- smftools/machine_learning/utils/device.py +7 -4
- smftools/machine_learning/utils/grl.py +3 -1
- smftools/metadata.py +443 -0
- smftools/plotting/__init__.py +19 -5
- smftools/plotting/autocorrelation_plotting.py +145 -44
- smftools/plotting/classifiers.py +162 -72
- smftools/plotting/general_plotting.py +422 -197
- smftools/plotting/hmm_plotting.py +42 -13
- smftools/plotting/position_stats.py +147 -87
- smftools/plotting/qc_plotting.py +20 -12
- smftools/preprocessing/__init__.py +10 -12
- smftools/preprocessing/append_base_context.py +115 -80
- smftools/preprocessing/append_binary_layer_by_base_context.py +77 -39
- smftools/preprocessing/{calculate_complexity.py → archived/calculate_complexity.py} +3 -1
- smftools/preprocessing/{archives → archived}/preprocessing.py +8 -6
- smftools/preprocessing/binarize.py +21 -4
- smftools/preprocessing/binarize_on_Youden.py +129 -31
- smftools/preprocessing/binary_layers_to_ohe.py +17 -11
- smftools/preprocessing/calculate_complexity_II.py +86 -59
- smftools/preprocessing/calculate_consensus.py +28 -19
- smftools/preprocessing/calculate_coverage.py +50 -25
- smftools/preprocessing/calculate_pairwise_differences.py +2 -1
- smftools/preprocessing/calculate_pairwise_hamming_distances.py +4 -3
- smftools/preprocessing/calculate_position_Youden.py +118 -54
- smftools/preprocessing/calculate_read_length_stats.py +52 -23
- smftools/preprocessing/calculate_read_modification_stats.py +91 -57
- smftools/preprocessing/clean_NaN.py +38 -28
- smftools/preprocessing/filter_adata_by_nan_proportion.py +24 -12
- smftools/preprocessing/filter_reads_on_length_quality_mapping.py +71 -38
- smftools/preprocessing/filter_reads_on_modification_thresholds.py +181 -73
- smftools/preprocessing/flag_duplicate_reads.py +689 -272
- smftools/preprocessing/invert_adata.py +26 -11
- smftools/preprocessing/load_sample_sheet.py +40 -22
- smftools/preprocessing/make_dirs.py +8 -3
- smftools/preprocessing/min_non_diagonal.py +2 -1
- smftools/preprocessing/recipes.py +56 -23
- smftools/preprocessing/reindex_references_adata.py +103 -0
- smftools/preprocessing/subsample_adata.py +33 -16
- smftools/readwrite.py +331 -82
- smftools/schema/__init__.py +11 -0
- smftools/schema/anndata_schema_v1.yaml +227 -0
- smftools/tools/__init__.py +3 -4
- smftools/tools/archived/classifiers.py +163 -0
- smftools/tools/archived/subset_adata_v1.py +10 -1
- smftools/tools/archived/subset_adata_v2.py +12 -1
- smftools/tools/calculate_umap.py +54 -15
- smftools/tools/cluster_adata_on_methylation.py +115 -46
- smftools/tools/general_tools.py +70 -25
- smftools/tools/position_stats.py +229 -98
- smftools/tools/read_stats.py +50 -29
- smftools/tools/spatial_autocorrelation.py +365 -192
- smftools/tools/subset_adata.py +23 -21
- {smftools-0.2.3.dist-info → smftools-0.2.5.dist-info}/METADATA +17 -39
- smftools-0.2.5.dist-info/RECORD +181 -0
- smftools-0.2.3.dist-info/RECORD +0 -173
- /smftools/cli/{cli_flows.py → archived/cli_flows.py} +0 -0
- /smftools/hmm/{apply_hmm_batched.py → archived/apply_hmm_batched.py} +0 -0
- /smftools/hmm/{calculate_distances.py → archived/calculate_distances.py} +0 -0
- /smftools/hmm/{train_hmm.py → archived/train_hmm.py} +0 -0
- /smftools/preprocessing/{add_read_length_and_mapping_qc.py → archived/add_read_length_and_mapping_qc.py} +0 -0
- /smftools/preprocessing/{archives → archived}/mark_duplicates.py +0 -0
- /smftools/preprocessing/{archives → archived}/remove_duplicates.py +0 -0
- {smftools-0.2.3.dist-info → smftools-0.2.5.dist-info}/WHEEL +0 -0
- {smftools-0.2.3.dist-info → smftools-0.2.5.dist-info}/entry_points.txt +0 -0
- {smftools-0.2.3.dist-info → smftools-0.2.5.dist-info}/licenses/LICENSE +0 -0
Only a handful of the changed files have hunks rendered below; judging by the class names, they come from the `smftools/machine_learning` models. Nearly every change is mechanical Black-style formatting: imports sorted and split one per line, keyword defaults spaced as `arg = default`, long calls wrapped with trailing commas, and quotes normalized to double quotes.

Hunks for the `TorchClassifierWrapper` Lightning module:

@@ -1,10 +1,16 @@
-import torch
-import pytorch_lightning as pl
 import matplotlib.pyplot as plt
+import numpy as np
+import pytorch_lightning as pl
+import torch
 from sklearn.metrics import (
-    auc, confusion_matrix, f1_score, precision_recall_curve, roc_auc_score, roc_curve
+    auc,
+    confusion_matrix,
+    f1_score,
+    precision_recall_curve,
+    roc_auc_score,
+    roc_curve,
 )
-
+
 
 class TorchClassifierWrapper(pl.LightningModule):
     """
@@ -16,25 +22,26 @@ class TorchClassifierWrapper(pl.LightningModule):
     - Can pass the index of the class label to use as the focus class when calculating precision/recall.
     - Contains a prediction step to run inference with.
     """
+
     def __init__(
         self,
         model: torch.nn.Module,
         label_col: str,
         num_classes: int,
-        class_names: list=None,
+        class_names: list = None,
         optimizer_cls=torch.optim.AdamW,
         optimizer_kwargs=None,
         criterion_kwargs=None,
         lr: float = 1e-3,
         focus_class: int = 1,  # used for binary or multiclass precision-recall
         class_weights=None,
-        enforce_eval_balance: bool=False,
-        target_eval_freq: float=0.3,
-        max_eval_positive: int=None
+        enforce_eval_balance: bool = False,
+        target_eval_freq: float = 0.3,
+        max_eval_positive: int = None,
    ):
        super().__init__()
        self.model = model
-        self.save_hyperparameters(ignore=['model'])  # logs all except actual model instance
+        self.save_hyperparameters(ignore=["model"])  # logs all except actual model instance
        self.optimizer_cls = optimizer_cls
        self.optimizer_kwargs = optimizer_kwargs or {"weight_decay": 1e-4}
        self.criterion = None
@@ -57,14 +64,17 @@
                 if torch.is_tensor(class_weights[self.focus_class]):
                     self.criterion_kwargs["pos_weight"] = class_weights[self.focus_class]
                 else:
-                    self.criterion_kwargs["pos_weight"] = torch.tensor(class_weights[self.focus_class], dtype=torch.float32, device=self.device)
+                    self.criterion_kwargs["pos_weight"] = torch.tensor(
+                        class_weights[self.focus_class], dtype=torch.float32, device=self.device
+                    )
             else:
                 # CrossEntropyLoss expects weight tensor of size C
                 if torch.is_tensor(class_weights):
                     self.criterion_kwargs["weight"] = class_weights
                 else:
-                    self.criterion_kwargs["weight"] = torch.tensor(
-                        class_weights, dtype=torch.float32)
+                    self.criterion_kwargs["weight"] = torch.tensor(
+                        class_weights, dtype=torch.float32
+                    )
 
         self._val_outputs = []
         self._test_outputs = []
@@ -78,12 +88,20 @@
 
     def _init_criterion(self):
         if self.num_classes == 2:
-            if "pos_weight" in self.criterion_kwargs and not torch.is_tensor(self.criterion_kwargs["pos_weight"]):
-                self.criterion_kwargs["pos_weight"] = torch.tensor(self.criterion_kwargs["pos_weight"], dtype=torch.float32, device=self.device)
+            if "pos_weight" in self.criterion_kwargs and not torch.is_tensor(
+                self.criterion_kwargs["pos_weight"]
+            ):
+                self.criterion_kwargs["pos_weight"] = torch.tensor(
+                    self.criterion_kwargs["pos_weight"], dtype=torch.float32, device=self.device
+                )
             self.criterion = torch.nn.BCEWithLogitsLoss(**self.criterion_kwargs)
         else:
-            if "weight" in self.criterion_kwargs and not torch.is_tensor(self.criterion_kwargs["weight"]):
-                self.criterion_kwargs["weight"] = torch.tensor(self.criterion_kwargs["weight"], dtype=torch.float32, device=self.device)
+            if "weight" in self.criterion_kwargs and not torch.is_tensor(
+                self.criterion_kwargs["weight"]
+            ):
+                self.criterion_kwargs["weight"] = torch.tensor(
+                    self.criterion_kwargs["weight"], dtype=torch.float32, device=self.device
+                )
             self.criterion = torch.nn.CrossEntropyLoss(**self.criterion_kwargs)
 
     def _resolve_focus_class(self, focus_class):
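A note on the loss setup these hunks reformat: for binary heads the wrapper passes a scalar `pos_weight` to `BCEWithLogitsLoss` (a multiplier on the positive-class term), while multiclass heads pass a size-C `weight` tensor to `CrossEntropyLoss`. A minimal standalone sketch of those two conventions, with made-up class counts:

```python
import torch

# Binary head: pos_weight multiplies the positive-class term of the loss.
# With 300 negatives and 100 positives, pos_weight = 300 / 100 = 3.0 (illustrative).
binary_criterion = torch.nn.BCEWithLogitsLoss(pos_weight=torch.tensor(3.0))
logits = torch.randn(8)                        # raw scores; sigmoid is applied inside the loss
targets = torch.randint(0, 2, (8,)).float()
print(binary_criterion(logits, targets))

# Multiclass head: CrossEntropyLoss expects one weight per class (size C).
class_counts = torch.tensor([500.0, 300.0, 200.0])               # illustrative
weights = class_counts.sum() / (len(class_counts) * class_counts)
multi_criterion = torch.nn.CrossEntropyLoss(weight=weights)
logits = torch.randn(8, 3)
targets = torch.randint(0, 3, (8,))
print(multi_criterion(logits, targets))
```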
`TorchClassifierWrapper`, continued:

@@ -93,11 +111,13 @@
             if self.class_names is None:
                 raise ValueError("class_names must be provided if focus_class is a string.")
             if focus_class not in self.class_names:
-                raise ValueError(f"focus_class '{focus_class}' not found in class_names {self.class_names}.")
+                raise ValueError(
+                    f"focus_class '{focus_class}' not found in class_names {self.class_names}."
+                )
             return self.class_names.index(focus_class)
         else:
             raise ValueError(f"focus_class must be int or str, got {type(focus_class)}")
-
+
     def set_training_indices(self, datamodule):
         """
         Store obs_names for train/val/test subsets used during training.
@@ -140,7 +160,7 @@
         self.log_dict({"val_loss": loss, "val_acc": acc}, prog_bar=False)
         self._val_outputs.append((logits.detach(), y.detach()))
         return loss
-
+
     def test_step(self, batch, batch_idx):
         """
         Test step for a batch through the Lightning Trainer.
@@ -189,7 +209,7 @@
             return self.criterion(logits.view(-1, 1), y)
         else:
             return self.criterion(logits, y)
-
+
     def _get_probs(self, logits):
         """
         A helper function for getting class probabilities for binary vs multiclass classifications.
@@ -207,8 +227,10 @@
             return (torch.sigmoid(logits.view(-1)) >= 0.5).long()
         else:
             return logits.argmax(dim=1)
-
-    def _subsample_for_fixed_positive_frequency(self, y_true, probs, target_freq=0.3, max_positive=None):
+
+    def _subsample_for_fixed_positive_frequency(
+        self, y_true, probs, target_freq=0.3, max_positive=None
+    ):
         pos_idx = np.where(y_true == self.focus_class)[0]
         neg_idx = np.where(y_true != self.focus_class)[0]
 
@@ -216,16 +238,20 @@
         max_positives_possible = len(pos_idx)
 
         # maximum achievable positive class frequency
-        max_possible_freq = max_positives_possible / (max_positives_possible + max_negatives_possible)
+        max_possible_freq = max_positives_possible / (
+            max_positives_possible + max_negatives_possible
+        )
 
         if target_freq > max_possible_freq:
             target_freq = max_possible_freq  # clip if you ask for impossible freq
 
         # now calculate positive count
-        num_pos_target = min(int(target_freq * max_negatives_possible / (1 - target_freq)), max_positives_possible)
+        num_pos_target = min(
+            int(target_freq * max_negatives_possible / (1 - target_freq)), max_positives_possible
+        )
         num_neg_target = int(num_pos_target * (1 - target_freq) / target_freq)
         num_neg_target = min(num_neg_target, max_negatives_possible)
-
+
         pos_sampled = np.random.choice(pos_idx, size=num_pos_target, replace=False)
         neg_sampled = np.random.choice(neg_idx, size=num_neg_target, replace=False)
 
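The subsampling hunk above solves freq = P / (P + N) for the positive count: `num_pos_target = int(target_freq * N / (1 - target_freq))`, clipped to what is available. For example, with 1,000 negatives and `target_freq=0.3`, that gives `int(0.3 * 1000 / 0.7) = 428` positives and `int(428 * 0.7 / 0.3) = 998` negatives, an actual frequency of 428/1426 ≈ 0.300. The same arithmetic as a standalone sketch (illustrative counts only):

```python
def fixed_freq_counts(n_pos_avail, n_neg_avail, target_freq):
    """Pick counts so that sampled positives / total ≈ target_freq (mirrors the hunk's formulas)."""
    max_freq = n_pos_avail / (n_pos_avail + n_neg_avail)
    target_freq = min(target_freq, max_freq)  # clip impossible requests
    num_pos = min(int(target_freq * n_neg_avail / (1 - target_freq)), n_pos_avail)
    num_neg = min(int(num_pos * (1 - target_freq) / target_freq), n_neg_avail)
    return num_pos, num_neg

num_pos, num_neg = fixed_freq_counts(n_pos_avail=500, n_neg_avail=1000, target_freq=0.3)
print(num_pos, num_neg, num_pos / (num_pos + num_neg))  # 428 998 0.3001...
```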
`TorchClassifierWrapper`, continued:

@@ -235,7 +261,7 @@
         actual_freq = len(pos_sampled) / len(sampled_idx)
 
         return sampled_idx
-
+
     def _log_classification_metrics(self, logits, targets, prefix="val"):
         """
         A helper function for logging validation and testing split model evaluations.
@@ -252,9 +278,12 @@
         num_pos = binary_focus.sum()
 
         # Subsample if you want to enforce a fixed proportion of the positive class
-        if prefix == 'test' and self.enforce_eval_balance:
+        if prefix == "test" and self.enforce_eval_balance:
             sampled_idx = self._subsample_for_fixed_positive_frequency(
-                y_true, probs, target_freq=self.target_eval_freq, max_positive=self.max_eval_positive
+                y_true,
+                probs,
+                target_freq=self.target_eval_freq,
+                max_positive=self.max_eval_positive,
             )
             y_true = y_true[sampled_idx]
             probs = probs[sampled_idx]
@@ -289,7 +318,7 @@
         cm = confusion_matrix(y_true, preds)
 
         # Save attributes for later plotting
-        if prefix == 'test':
+        if prefix == "test":
             self.test_roc_curve = (fpr, tpr)
             self.test_pr_curve = (rc, pr)
             self.test_roc_auc = roc_auc
@@ -298,19 +327,21 @@
             self.test_num_pos = num_pos
             self.test_acc = acc
             self.test_f1 = f1
-        elif prefix == 'val':
+        elif prefix == "val":
             pass
 
         # Logging
-        self.log_dict({
-            f"{prefix}_acc": acc,
-            f"{prefix}_f1": f1,
-            f"{prefix}_auc": roc_auc,
-            f"{prefix}_pr_auc": pr_auc,
-            f"{prefix}_pr_auc_norm": pr_auc_norm,
-            f"{prefix}_pos_freq": pos_freq,
-            f"{prefix}_num_pos": num_pos
-        })
+        self.log_dict(
+            {
+                f"{prefix}_acc": acc,
+                f"{prefix}_f1": f1,
+                f"{prefix}_auc": roc_auc,
+                f"{prefix}_pr_auc": pr_auc,
+                f"{prefix}_pr_auc_norm": pr_auc_norm,
+                f"{prefix}_pos_freq": pos_freq,
+                f"{prefix}_num_pos": num_pos,
+            }
+        )
         setattr(self, f"{prefix}_confusion_matrix", cm)
 
     def _plot_roc_pr_curves(self, logits, targets):
@@ -334,7 +365,7 @@
         pos_freq = self.test_pos_freq
         plt.subplot(1, 2, 2)
         plt.plot(rc, pr, label=f"PR AUC={pr_auc:.3f}")
-        plt.axhline(pos_freq, linestyle='--', color='gray')
+        plt.axhline(pos_freq, linestyle="--", color="gray")
         plt.xlabel("Recall")
         plt.ylabel("Precision")
         plt.ylim(0, 1.05)
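Taken together, the `__init__` hunk implies usage along the following lines. This is a sketch, not the package's documented API: the import path, the backbone module, and the label and class names are all assumptions.

```python
import torch

from smftools.machine_learning.models.lightning_base import TorchClassifierWrapper  # assumed path

# Hypothetical logits-producing backbone; any nn.Module would do.
backbone = torch.nn.Sequential(
    torch.nn.Linear(128, 64), torch.nn.ReLU(), torch.nn.Linear(64, 1)
)

wrapper = TorchClassifierWrapper(
    model=backbone,
    label_col="label",                 # assumed obs column name
    num_classes=2,
    class_names=["unbound", "bound"],  # illustrative
    focus_class="bound",               # resolved to an index via class_names
    class_weights=[1.0, 3.0],          # binary case: converted to a pos_weight tensor (per the hunk)
    enforce_eval_balance=True,         # test-time subsampling to a fixed positive frequency
    target_eval_freq=0.3,
)
# pl.Trainer(max_epochs=10).fit(wrapper, datamodule=...)  # datamodule elided
```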
Hunks for `MLPClassifier`:

@@ -1,9 +1,18 @@
-import torch
 import torch.nn as nn
+
 from .base import BaseTorchModel
-
+
+
 class MLPClassifier(BaseTorchModel):
-    def __init__(self, input_dim, num_classes=2, hidden_dims=[64, 64], dropout=0.2, use_batchnorm=True, **kwargs):
+    def __init__(
+        self,
+        input_dim,
+        num_classes=2,
+        hidden_dims=[64, 64],
+        dropout=0.2,
+        use_batchnorm=True,
+        **kwargs,
+    ):
         super().__init__(**kwargs)
         layers = []
         in_dim = input_dim
@@ -23,4 +32,4 @@ class MLPClassifier(BaseTorchModel):
         self.model = nn.Sequential(*layers)
 
     def forward(self, x):
-        return self.model(x)
+        return self.model(x)
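From the signature in this hunk, constructing the MLP might look as follows. The import path and the feature dimension are assumptions, and the head's output shape for `num_classes=2` is not visible in the diff:

```python
import torch

from smftools.machine_learning.models.mlp import MLPClassifier  # assumed path

model = MLPClassifier(
    input_dim=256,          # features per read; illustrative
    num_classes=2,
    hidden_dims=[64, 64],   # two hidden layers, matching the default
    dropout=0.2,
    use_batchnorm=True,
)
logits = model(torch.randn(32, 256))  # [batch, input_dim] -> logits
```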
Hunks for `PositionalEncoding`:

@@ -2,6 +2,7 @@ import numpy as np
 import torch
 import torch.nn as nn
 
+
 class PositionalEncoding(nn.Module):
     def __init__(self, d_model, max_len=5000):
         super().__init__()
@@ -14,5 +15,5 @@ class PositionalEncoding(nn.Module):
         self.register_buffer("pe", pe)
 
     def forward(self, x):
-        x = x + self.pe[:, :x.size(1)]
-        return x
+        x = x + self.pe[:, : x.size(1)]
+        return x
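The `forward` above adds a precomputed table `pe` to the first `x.size(1)` positions. For reference, a self-contained version of the standard sinusoidal construction consistent with the buffer registered above (a sketch, not necessarily byte-identical to the module):

```python
import math

import torch

def sinusoidal_pe(max_len: int, d_model: int) -> torch.Tensor:
    """Standard sin/cos positional table of shape [1, max_len, d_model]."""
    position = torch.arange(max_len).unsqueeze(1).float()
    div_term = torch.exp(torch.arange(0, d_model, 2).float() * (-math.log(10000.0) / d_model))
    pe = torch.zeros(max_len, d_model)
    pe[:, 0::2] = torch.sin(position * div_term)  # even channels
    pe[:, 1::2] = torch.cos(position * div_term)  # odd channels
    return pe.unsqueeze(0)

x = torch.randn(8, 100, 64)          # [batch, seq_len, d_model]
pe = sinusoidal_pe(max_len=5000, d_model=64)
x = x + pe[:, : x.size(1)]           # same slicing as the diff's forward()
```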
Hunks for `RNNClassifier`:

@@ -1,7 +1,8 @@
-import torch
 import torch.nn as nn
+
 from .base import BaseTorchModel
 
+
 class RNNClassifier(BaseTorchModel):
     def __init__(self, input_size, hidden_dim, num_classes, **kwargs):
         super().__init__(**kwargs)
@@ -14,4 +15,4 @@ class RNNClassifier(BaseTorchModel):
     def forward(self, x):
         x = x.unsqueeze(1)  # [B, 1, L] → for LSTM expecting batch_first
         _, (h_n, _) = self.lstm(x)  # h_n: [1, B, H]
-        return self.fc(h_n.squeeze(0))  # [B, H] → [B, num_classes]
+        return self.fc(h_n.squeeze(0))  # [B, H] → [B, num_classes]
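The shape comments in `forward` spell out the flow: a flat `[B, L]` batch is unsqueezed to `[B, 1, L]`, so the LSTM (with `batch_first=True`) sees a single timestep of `L` features, and its final hidden state feeds the classifier head. A minimal shape check under those assumptions:

```python
import torch
import torch.nn as nn

B, L, H, C = 4, 128, 32, 2
lstm = nn.LSTM(input_size=L, hidden_size=H, batch_first=True)
fc = nn.Linear(H, C)

x = torch.randn(B, L).unsqueeze(1)  # [B, L] -> [B, 1, L]: one timestep of L features
_, (h_n, _) = lstm(x)               # h_n: [num_layers=1, B, H]
logits = fc(h_n.squeeze(0))         # [B, H] -> [B, C]
print(logits.shape)                 # torch.Size([4, 2])
```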
Hunks for `SklearnModelWrapper`:

@@ -1,23 +1,30 @@
-import numpy as np
 import matplotlib.pyplot as plt
+import numpy as np
 from sklearn.metrics import (
-    auc, confusion_matrix, f1_score, precision_recall_curve, roc_auc_score, roc_curve
+    auc,
+    confusion_matrix,
+    f1_score,
+    precision_recall_curve,
+    roc_auc_score,
+    roc_curve,
 )
 
+
 class SklearnModelWrapper:
     """
     Unified sklearn wrapper matching TorchClassifierWrapper interface.
     """
+
     def __init__(
-        self,
-        model,
+        self,
+        model,
         label_col: str,
-        num_classes: int,
-        class_names=None,
-        focus_class: int=1,
-        enforce_eval_balance: bool=False,
-        target_eval_freq: float=0.3,
-        max_eval_positive=None
+        num_classes: int,
+        class_names=None,
+        focus_class: int = 1,
+        enforce_eval_balance: bool = False,
+        target_eval_freq: float = 0.3,
+        max_eval_positive=None,
     ):
         self.model = model
         self.label_col = label_col
@@ -37,7 +44,9 @@ class SklearnModelWrapper:
             if self.class_names is None:
                 raise ValueError("class_names must be provided if focus_class is a string.")
             if focus_class not in self.class_names:
-                raise ValueError(f"focus_class '{focus_class}' not found in class_names {self.class_names}.")
+                raise ValueError(
+                    f"focus_class '{focus_class}' not found in class_names {self.class_names}."
+                )
             return self.class_names.index(focus_class)
         else:
             raise ValueError(f"focus_class must be int or str, got {type(focus_class)}")
@@ -130,7 +139,7 @@
             f"{prefix}_pr_auc": pr_auc,
             f"{prefix}_pr_auc_norm": pr_auc_norm,
             f"{prefix}_pos_freq": pos_freq,
-            f"{prefix}_num_pos": num_pos
+            f"{prefix}_num_pos": num_pos,
         }
 
         return self.metrics
@@ -166,7 +175,10 @@
 
     def fit_from_datamodule(self, datamodule):
         datamodule.setup()
-        X_tensor, y_tensor = datamodule.train_set.dataset.X_tensor, datamodule.train_set.dataset.y_tensor
+        X_tensor, y_tensor = (
+            datamodule.train_set.dataset.X_tensor,
+            datamodule.train_set.dataset.y_tensor,
+        )
         indices = datamodule.train_set.indices
         X_train = X_tensor[indices].numpy()
         y_train = y_tensor[indices].numpy()
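`fit_from_datamodule` is unchanged in behavior: it pulls the full tensors off the underlying dataset, slices them with the train-split indices, and hands numpy arrays to the sklearn estimator. The equivalent flow written against plain objects (the `Subset` and `LogisticRegression` here are stand-ins for `datamodule.train_set` and the wrapped model):

```python
import torch
from sklearn.linear_model import LogisticRegression
from torch.utils.data import Subset, TensorDataset

# Stand-ins for datamodule.train_set.dataset.X_tensor / .y_tensor
X_tensor = torch.randn(100, 16)
y_tensor = torch.randint(0, 2, (100,))
train_set = Subset(TensorDataset(X_tensor, y_tensor), indices=list(range(80)))

# Mirrors the hunk: index the full tensors with the subset's indices, then convert.
X_train = X_tensor[train_set.indices].numpy()
y_train = y_tensor[train_set.indices].numpy()

clf = LogisticRegression().fit(X_train, y_train)
```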
`SklearnModelWrapper`, continued:

@@ -190,11 +202,11 @@
         y_eval = y_tensor[indices].numpy()
 
         return self.evaluate(X_eval, y_eval, prefix=split)
-
+
     def compute_shap(self, X, background=None, nsamples=100, target_class=None):
         """
         Compute SHAP values on input X, optionally for a specified target class.
-
+
         Parameters
         ----------
         X : array-like
@@ -225,7 +237,7 @@
             shap_values = explainer.shap_values(X)
         else:
             shap_values = explainer.shap_values(X, nsamples=nsamples)
-
+
         if isinstance(shap_values, np.ndarray):
             if shap_values.ndim == 3:
                 if isinstance(target_class, int):
@@ -234,10 +246,7 @@
                 # target_class is per-sample
                 if np.any(target_class >= shap_values.shape[2]):
                     raise ValueError(f"target_class values exceed {shap_values.shape[2]}")
-                selected = np.array([
-                    shap_values[i, :, c]
-                    for i, c in enumerate(target_class)
-                ])
+                selected = np.array([shap_values[i, :, c] for i, c in enumerate(target_class)])
                 return selected
             else:
                 # fallback to class 0
@@ -246,7 +255,15 @@
             # 2D shape (samples, features), no class dimension
             return shap_values
 
-    def apply_shap_to_adata(self, dataloader, adata, background=None, adata_key="shap_values", target_class=None, normalize=True):
+    def apply_shap_to_adata(
+        self,
+        dataloader,
+        adata,
+        background=None,
+        adata_key="shap_values",
+        target_class=None,
+        normalize=True,
+    ):
         """
         Compute SHAP from a DataLoader and store in AnnData if provided.
         """
@@ -270,4 +287,4 @@
         row_max[row_max == 0] = 1  # avoid divide by zero
         normalized = arr / row_max
 
-        adata.obsm[f"{adata_key}_normalized"] = normalized
+        adata.obsm[f"{adata_key}_normalized"] = normalized
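The final hunk stores a row-scaled copy of the SHAP matrix in `adata.obsm`: each read's vector is divided by its own row maximum, with zero rows guarded against divide-by-zero. A toy version of that scaling (whether the maximum is taken over absolute values is not visible in the hunk; the sketch assumes it is):

```python
import numpy as np

arr = np.array([[0.2, -0.8, 0.4],
                [0.0,  0.0, 0.0]])  # an all-zero row would otherwise divide by zero

row_max = np.abs(arr).max(axis=1, keepdims=True)  # assumption: max of |SHAP| per row
row_max[row_max == 0] = 1                         # same guard as the hunk
normalized = arr / row_max
print(normalized)  # each row scaled so its largest-magnitude entry is ±1
```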