smftools 0.2.3__py3-none-any.whl → 0.2.5__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (137)
  1. smftools/__init__.py +6 -8
  2. smftools/_settings.py +4 -6
  3. smftools/_version.py +1 -1
  4. smftools/cli/helpers.py +54 -0
  5. smftools/cli/hmm_adata.py +937 -256
  6. smftools/cli/load_adata.py +448 -268
  7. smftools/cli/preprocess_adata.py +469 -263
  8. smftools/cli/spatial_adata.py +536 -319
  9. smftools/cli_entry.py +97 -182
  10. smftools/config/__init__.py +1 -1
  11. smftools/config/conversion.yaml +17 -6
  12. smftools/config/deaminase.yaml +12 -10
  13. smftools/config/default.yaml +142 -33
  14. smftools/config/direct.yaml +11 -3
  15. smftools/config/discover_input_files.py +19 -5
  16. smftools/config/experiment_config.py +594 -264
  17. smftools/constants.py +37 -0
  18. smftools/datasets/__init__.py +2 -8
  19. smftools/datasets/datasets.py +32 -18
  20. smftools/hmm/HMM.py +2128 -1418
  21. smftools/hmm/__init__.py +2 -9
  22. smftools/hmm/archived/call_hmm_peaks.py +121 -0
  23. smftools/hmm/call_hmm_peaks.py +299 -91
  24. smftools/hmm/display_hmm.py +19 -6
  25. smftools/hmm/hmm_readwrite.py +13 -4
  26. smftools/hmm/nucleosome_hmm_refinement.py +102 -14
  27. smftools/informatics/__init__.py +30 -7
  28. smftools/informatics/archived/helpers/archived/align_and_sort_BAM.py +14 -1
  29. smftools/informatics/archived/helpers/archived/bam_qc.py +14 -1
  30. smftools/informatics/archived/helpers/archived/concatenate_fastqs_to_bam.py +8 -1
  31. smftools/informatics/archived/helpers/archived/load_adata.py +3 -3
  32. smftools/informatics/archived/helpers/archived/plot_bed_histograms.py +3 -1
  33. smftools/informatics/archived/print_bam_query_seq.py +7 -1
  34. smftools/informatics/bam_functions.py +397 -175
  35. smftools/informatics/basecalling.py +51 -9
  36. smftools/informatics/bed_functions.py +90 -57
  37. smftools/informatics/binarize_converted_base_identities.py +18 -7
  38. smftools/informatics/complement_base_list.py +7 -6
  39. smftools/informatics/converted_BAM_to_adata.py +265 -122
  40. smftools/informatics/fasta_functions.py +161 -83
  41. smftools/informatics/h5ad_functions.py +196 -30
  42. smftools/informatics/modkit_extract_to_adata.py +609 -270
  43. smftools/informatics/modkit_functions.py +85 -44
  44. smftools/informatics/ohe.py +44 -21
  45. smftools/informatics/pod5_functions.py +112 -73
  46. smftools/informatics/run_multiqc.py +20 -14
  47. smftools/logging_utils.py +51 -0
  48. smftools/machine_learning/__init__.py +2 -7
  49. smftools/machine_learning/data/anndata_data_module.py +143 -50
  50. smftools/machine_learning/data/preprocessing.py +2 -1
  51. smftools/machine_learning/evaluation/__init__.py +1 -1
  52. smftools/machine_learning/evaluation/eval_utils.py +11 -14
  53. smftools/machine_learning/evaluation/evaluators.py +46 -33
  54. smftools/machine_learning/inference/__init__.py +1 -1
  55. smftools/machine_learning/inference/inference_utils.py +7 -4
  56. smftools/machine_learning/inference/lightning_inference.py +9 -13
  57. smftools/machine_learning/inference/sklearn_inference.py +6 -8
  58. smftools/machine_learning/inference/sliding_window_inference.py +35 -25
  59. smftools/machine_learning/models/__init__.py +10 -5
  60. smftools/machine_learning/models/base.py +28 -42
  61. smftools/machine_learning/models/cnn.py +15 -11
  62. smftools/machine_learning/models/lightning_base.py +71 -40
  63. smftools/machine_learning/models/mlp.py +13 -4
  64. smftools/machine_learning/models/positional.py +3 -2
  65. smftools/machine_learning/models/rnn.py +3 -2
  66. smftools/machine_learning/models/sklearn_models.py +39 -22
  67. smftools/machine_learning/models/transformer.py +68 -53
  68. smftools/machine_learning/models/wrappers.py +2 -1
  69. smftools/machine_learning/training/__init__.py +2 -2
  70. smftools/machine_learning/training/train_lightning_model.py +29 -20
  71. smftools/machine_learning/training/train_sklearn_model.py +9 -15
  72. smftools/machine_learning/utils/__init__.py +1 -1
  73. smftools/machine_learning/utils/device.py +7 -4
  74. smftools/machine_learning/utils/grl.py +3 -1
  75. smftools/metadata.py +443 -0
  76. smftools/plotting/__init__.py +19 -5
  77. smftools/plotting/autocorrelation_plotting.py +145 -44
  78. smftools/plotting/classifiers.py +162 -72
  79. smftools/plotting/general_plotting.py +422 -197
  80. smftools/plotting/hmm_plotting.py +42 -13
  81. smftools/plotting/position_stats.py +147 -87
  82. smftools/plotting/qc_plotting.py +20 -12
  83. smftools/preprocessing/__init__.py +10 -12
  84. smftools/preprocessing/append_base_context.py +115 -80
  85. smftools/preprocessing/append_binary_layer_by_base_context.py +77 -39
  86. smftools/preprocessing/{calculate_complexity.py → archived/calculate_complexity.py} +3 -1
  87. smftools/preprocessing/{archives → archived}/preprocessing.py +8 -6
  88. smftools/preprocessing/binarize.py +21 -4
  89. smftools/preprocessing/binarize_on_Youden.py +129 -31
  90. smftools/preprocessing/binary_layers_to_ohe.py +17 -11
  91. smftools/preprocessing/calculate_complexity_II.py +86 -59
  92. smftools/preprocessing/calculate_consensus.py +28 -19
  93. smftools/preprocessing/calculate_coverage.py +50 -25
  94. smftools/preprocessing/calculate_pairwise_differences.py +2 -1
  95. smftools/preprocessing/calculate_pairwise_hamming_distances.py +4 -3
  96. smftools/preprocessing/calculate_position_Youden.py +118 -54
  97. smftools/preprocessing/calculate_read_length_stats.py +52 -23
  98. smftools/preprocessing/calculate_read_modification_stats.py +91 -57
  99. smftools/preprocessing/clean_NaN.py +38 -28
  100. smftools/preprocessing/filter_adata_by_nan_proportion.py +24 -12
  101. smftools/preprocessing/filter_reads_on_length_quality_mapping.py +71 -38
  102. smftools/preprocessing/filter_reads_on_modification_thresholds.py +181 -73
  103. smftools/preprocessing/flag_duplicate_reads.py +689 -272
  104. smftools/preprocessing/invert_adata.py +26 -11
  105. smftools/preprocessing/load_sample_sheet.py +40 -22
  106. smftools/preprocessing/make_dirs.py +8 -3
  107. smftools/preprocessing/min_non_diagonal.py +2 -1
  108. smftools/preprocessing/recipes.py +56 -23
  109. smftools/preprocessing/reindex_references_adata.py +103 -0
  110. smftools/preprocessing/subsample_adata.py +33 -16
  111. smftools/readwrite.py +331 -82
  112. smftools/schema/__init__.py +11 -0
  113. smftools/schema/anndata_schema_v1.yaml +227 -0
  114. smftools/tools/__init__.py +3 -4
  115. smftools/tools/archived/classifiers.py +163 -0
  116. smftools/tools/archived/subset_adata_v1.py +10 -1
  117. smftools/tools/archived/subset_adata_v2.py +12 -1
  118. smftools/tools/calculate_umap.py +54 -15
  119. smftools/tools/cluster_adata_on_methylation.py +115 -46
  120. smftools/tools/general_tools.py +70 -25
  121. smftools/tools/position_stats.py +229 -98
  122. smftools/tools/read_stats.py +50 -29
  123. smftools/tools/spatial_autocorrelation.py +365 -192
  124. smftools/tools/subset_adata.py +23 -21
  125. {smftools-0.2.3.dist-info → smftools-0.2.5.dist-info}/METADATA +17 -39
  126. smftools-0.2.5.dist-info/RECORD +181 -0
  127. smftools-0.2.3.dist-info/RECORD +0 -173
  128. /smftools/cli/{cli_flows.py → archived/cli_flows.py} +0 -0
  129. /smftools/hmm/{apply_hmm_batched.py → archived/apply_hmm_batched.py} +0 -0
  130. /smftools/hmm/{calculate_distances.py → archived/calculate_distances.py} +0 -0
  131. /smftools/hmm/{train_hmm.py → archived/train_hmm.py} +0 -0
  132. /smftools/preprocessing/{add_read_length_and_mapping_qc.py → archived/add_read_length_and_mapping_qc.py} +0 -0
  133. /smftools/preprocessing/{archives → archived}/mark_duplicates.py +0 -0
  134. /smftools/preprocessing/{archives → archived}/remove_duplicates.py +0 -0
  135. {smftools-0.2.3.dist-info → smftools-0.2.5.dist-info}/WHEEL +0 -0
  136. {smftools-0.2.3.dist-info → smftools-0.2.5.dist-info}/entry_points.txt +0 -0
  137. {smftools-0.2.3.dist-info → smftools-0.2.5.dist-info}/licenses/LICENSE +0 -0
@@ -1,9 +1,11 @@
+ import numpy as np
  import torch
  import torch.nn as nn
- from .base import BaseTorchModel
- from .positional import PositionalEncoding
+
  from ..utils.grl import grad_reverse
- import numpy as np
+ from .base import BaseTorchModel
+ from .positional import PositionalEncoding
+

  class TransformerEncoderLayerWithAttn(nn.TransformerEncoderLayer):
  def __init__(self, *args, **kwargs):

@@ -11,12 +13,14 @@ class TransformerEncoderLayerWithAttn(nn.TransformerEncoderLayer):

  def forward(self, src, src_mask=None, is_causal=False, src_key_padding_mask=None):
  self_attn_output, attn_weights = self.self_attn(
- src, src, src,
+ src,
+ src,
+ src,
  attn_mask=src_mask,
  key_padding_mask=src_key_padding_mask,
  need_weights=True,
  average_attn_weights=False, # preserve [B, num_heads, S, S]
- is_causal=is_causal
+ is_causal=is_causal,
  )
  src = src + self.dropout1(self_attn_output)
  src = self.norm1(src)

@@ -27,18 +31,21 @@ class TransformerEncoderLayerWithAttn(nn.TransformerEncoderLayer):
  # Save attention weights to module
  self.attn_weights = attn_weights # Save to layer
  return src
-
+
+
  class BaseTransformer(BaseTorchModel):
- def __init__(self,
- input_dim=1,
- model_dim=64,
- num_heads=4,
- num_layers=2,
- dropout=0.2,
- seq_len=None,
- use_learnable_pos=False,
- use_cls_token=True,
- **kwargs):
+ def __init__(
+ self,
+ input_dim=1,
+ model_dim=64,
+ num_heads=4,
+ num_layers=2,
+ dropout=0.2,
+ seq_len=None,
+ use_learnable_pos=False,
+ use_cls_token=True,
+ **kwargs,
+ ):
  super().__init__(**kwargs)
  # Input FC layer to map D_input to D_model
  self.model_dim = model_dim

@@ -52,7 +59,9 @@ class BaseTransformer(BaseTorchModel):

  if use_learnable_pos:
  assert seq_len is not None, "Must provide seq_len if use_learnable_pos=True"
- self.pos_embed = nn.Parameter(torch.randn(seq_len + (1 if use_cls_token else 0), model_dim))
+ self.pos_embed = nn.Parameter(
+ torch.randn(seq_len + (1 if use_cls_token else 0), model_dim)
+ )
  self.pos_encoder = None
  else:
  self.pos_encoder = PositionalEncoding(model_dim)

@@ -62,7 +71,13 @@ class BaseTransformer(BaseTorchModel):
  self.cls_token = nn.Parameter(torch.zeros(1, 1, model_dim)) # (1, 1, D)

  # Specify the transformer encoder structure
- encoder_layer = TransformerEncoderLayerWithAttn(d_model=model_dim, nhead=num_heads, batch_first=True, dim_feedforward=self.ff_dim, dropout=self.dropout)
+ encoder_layer = TransformerEncoderLayerWithAttn(
+ d_model=model_dim,
+ nhead=num_heads,
+ batch_first=True,
+ dim_feedforward=self.ff_dim,
+ dropout=self.dropout,
+ )
  # Stack the transformer encoder layers
  self.transformer = nn.TransformerEncoder(encoder_layer, num_layers=num_layers)

@@ -95,7 +110,7 @@ class BaseTransformer(BaseTorchModel):
  x = torch.cat([cls, x], dim=1) # (B, S+1, D)

  if self.pos_embed is not None:
- x = x + self.pos_embed.unsqueeze(0)[:, :x.shape[1], :]
+ x = x + self.pos_embed.unsqueeze(0)[:, : x.shape[1], :]
  elif self.pos_encoder is not None:
  x = self.pos_encoder(x)

@@ -106,8 +121,8 @@ class BaseTransformer(BaseTorchModel):

  encoded = self.transformer(x)
  return encoded
-
- def compute_attn_grad(self, reduction='mean'):
+
+ def compute_attn_grad(self, reduction="mean"):
  """
  Computes attention × gradient scores across layers.
  Returns: [B, S] tensor of importance scores

@@ -116,19 +131,19 @@ class BaseTransformer(BaseTorchModel):
  for attn, grad in zip(self.attn_weights, self.attn_grads):
  # attn: [B, H, S, S]
  # grad: [B, S, D]
- attn = attn.mean(dim=1) # [B, S, S]
- grad_norm = grad.norm(dim=-1) # [B, S]
+ attn = attn.mean(dim=1) # [B, S, S]
+ grad_norm = grad.norm(dim=-1) # [B, S]
  attn_grad_score = (attn * grad_norm.unsqueeze(1)).sum(dim=-1) # [B, S]
  scores.append(attn_grad_score)

  # Combine across layers
  stacked = torch.stack(scores, dim=0) # [L, B, S]
  if reduction == "mean":
- return stacked.mean(dim=0) # [B, S]
+ return stacked.mean(dim=0) # [B, S]
  elif reduction == "sum":
- return stacked.sum(dim=0) # [B, S]
+ return stacked.sum(dim=0) # [B, S]
  else:
- return stacked # [L, B, S]
+ return stacked # [L, B, S]

  def compute_rollout(self):
  """

@@ -143,9 +158,9 @@ class BaseTransformer(BaseTorchModel):
  attn_heads = attn_heads + torch.eye(S, device=device).unsqueeze(0) # add residual
  attn_heads = attn_heads / attn_heads.sum(dim=-1, keepdim=True).clamp(min=1e-6)
  rollout = torch.bmm(attn_heads, rollout) # [B, S, S]
-
+
  return rollout # [B, S, S]
-
+
  def reset_attn_buffers(self):
  self.attn_weights = []
  self.attn_grads = []

@@ -158,11 +173,15 @@ class BaseTransformer(BaseTorchModel):
  if head_idx is not None:
  attn = attn[:, head_idx] # [B, S, S]
  return attn
-
- def apply_attn_interpretations_to_adata(self, dataloader, adata,
- obsm_key_grad="attn_grad",
- obsm_key_rollout="attn_rollout",
- device="cpu"):
+
+ def apply_attn_interpretations_to_adata(
+ self,
+ dataloader,
+ adata,
+ obsm_key_grad="attn_grad",
+ obsm_key_rollout="attn_rollout",
+ device="cpu",
+ ):
  self.to(device)
  self.eval()
  grad_maps = []

@@ -193,12 +212,10 @@ class BaseTransformer(BaseTorchModel):
  # add per-row normalized version
  grad_normed = grad_concat / (np.max(grad_concat, axis=1, keepdims=True) + 1e-8)
  adata.obsm[f"{obsm_key_grad}_normalized"] = grad_normed
-
+
+
  class TransformerClassifier(BaseTransformer):
- def __init__(self,
- input_dim,
- num_classes,
- **kwargs):
+ def __init__(self, input_dim, num_classes, **kwargs):
  super().__init__(input_dim, **kwargs)
  # Classification head
  output_size = 1 if num_classes == 2 else num_classes

@@ -215,7 +232,7 @@ class TransformerClassifier(BaseTransformer):
  x = x.unsqueeze(0).unsqueeze(-1) # just in case (S,) → (1, S, 1)
  else:
  pass
- encoded = self.encode(x) # -> (B, S, D_model)
+ encoded = self.encode(x) # -> (B, S, D_model)
  if self.use_cls_token:
  pooled = encoded[:, 0] # (B, D)
  else:

@@ -223,14 +240,13 @@ class TransformerClassifier(BaseTransformer):

  out = self.cls_head(pooled) # (B, C)
  return out
-
+
+
  class DANNTransformerClassifier(TransformerClassifier):
  def __init__(self, input_dim, model_dim, num_classes, n_domains, **kwargs):
  super().__init__(input_dim, model_dim, num_classes, **kwargs)
  self.domain_classifier = nn.Sequential(
- nn.Linear(model_dim, 128),
- nn.ReLU(),
- nn.Linear(128, n_domains)
+ nn.Linear(model_dim, 128), nn.ReLU(), nn.Linear(128, n_domains)
  )

  def forward(self, x, alpha=1.0):

@@ -242,6 +258,7 @@ class DANNTransformerClassifier(TransformerClassifier):

  return class_logits, domain_logits

+
  class MaskedTransformerPretrainer(BaseTransformer):
  def __init__(self, input_dim, model_dim, num_heads=4, num_layers=2, **kwargs):
  super().__init__(input_dim, model_dim, num_heads, num_layers, **kwargs)

@@ -254,12 +271,13 @@ class MaskedTransformerPretrainer(BaseTransformer):
  """
  if x.dim() == 2:
  x = x.unsqueeze(-1)
- encoded = self.encode(x, mask=mask) # -> (B, S, D_model)
- return self.decoder(encoded) # -> (B, D_input)
-
+ encoded = self.encode(x, mask=mask) # -> (B, S, D_model)
+ return self.decoder(encoded) # -> (B, D_input)
+
+
  class DANNTransformer(BaseTransformer):
- """
- """
+ """ """
+
  def __init__(self, seq_len, model_dim, n_heads, n_layers, n_domains):
  super().__init__(
  input_dim=1, # 1D scalar input per token

@@ -267,7 +285,7 @@ class DANNTransformer(BaseTransformer):
  num_heads=n_heads,
  num_layers=n_layers,
  seq_len=seq_len,
- use_learnable_pos=True # enables learnable pos_embed in base
+ use_learnable_pos=True, # enables learnable pos_embed in base
  )

  # Reconstruction head

@@ -275,9 +293,7 @@ class DANNTransformer(BaseTransformer):

  # Domain classification head
  self.domain_classifier = nn.Sequential(
- nn.Linear(model_dim, 128),
- nn.ReLU(),
- nn.Linear(128, n_domains)
+ nn.Linear(model_dim, 128), nn.ReLU(), nn.Linear(128, n_domains)
  )

  def forward(self, x, alpha=1.0):

@@ -300,4 +316,3 @@ class DANNTransformer(BaseTransformer):
  domain_logits = self.domain_classifier(rev) # (B, n_batches)

  return recon, domain_logits
-

@@ -1,6 +1,7 @@
  import torch
  import torch.nn as nn

+
  class ScaledModel(nn.Module):
  def __init__(self, model, mean, std):
  super().__init__()

@@ -17,4 +18,4 @@ class ScaledModel(nn.Module):
  x = (x - mean[None, None, :]) / std[None, None, :]
  else:
  raise ValueError(f"Unsupported input shape {x.shape}")
- return self.model(x)
+ return self.model(x)

@@ -1,2 +1,2 @@
- from .train_lightning_model import train_lightning_model, run_sliding_window_lightning_training
- from .train_sklearn_model import train_sklearn_model, run_sliding_window_sklearn_training
+ from .train_lightning_model import run_sliding_window_lightning_training, train_lightning_model
+ from .train_sklearn_model import run_sliding_window_sklearn_training, train_sklearn_model

@@ -1,9 +1,11 @@
  import torch
  from pytorch_lightning import Trainer
  from pytorch_lightning.callbacks import EarlyStopping, ModelCheckpoint
+
  from ..data import AnnDataModule
  from ..models import TorchClassifierWrapper

+
  def train_lightning_model(
  model,
  datamodule,

@@ -12,7 +14,7 @@ def train_lightning_model(
  monitor_metric="val_loss",
  checkpoint_path=None,
  evaluate_test=True,
- devices=1
+ devices=1,
  ):
  """
  Takes a PyTorch Lightning Model and a Lightning DataLoader module to define a Lightning Trainer.

@@ -39,13 +41,15 @@ def train_lightning_model(
  EarlyStopping(monitor=monitor_metric, patience=patience, mode="min"),
  ]
  if checkpoint_path:
- callbacks.append(ModelCheckpoint(
- dirpath=checkpoint_path,
- filename="{epoch}-{val_loss:.4f}",
- monitor=monitor_metric,
- save_top_k=1,
- mode="min",
- ))
+ callbacks.append(
+ ModelCheckpoint(
+ dirpath=checkpoint_path,
+ filename="{epoch}-{val_loss:.4f}",
+ monitor=monitor_metric,
+ save_top_k=1,
+ mode="min",
+ )
+ )

  # Trainer setup
  trainer = Trainer(

@@ -54,7 +58,7 @@ def train_lightning_model(
  accelerator=accelerator,
  devices=devices,
  log_every_n_steps=10,
- enable_progress_bar=False
+ enable_progress_bar=False,
  )

  # Fit model with trainer

@@ -63,7 +67,7 @@ def train_lightning_model(
  # Test model (if applicable)
  if evaluate_test and hasattr(datamodule, "test_dataloader"):
  trainer.test(model, datamodule=datamodule)
-
+
  # Return best checkpoint path
  best_ckpt = None
  for cb in callbacks:

@@ -72,6 +76,7 @@ def train_lightning_model(

  return trainer, best_ckpt

+
  def run_sliding_window_lightning_training(
  adata,
  tensor_source,

@@ -86,13 +91,13 @@ def run_sliding_window_lightning_training(
  stride,
  max_epochs=30,
  patience=5,
- enforce_eval_balance: bool=False,
- target_eval_freq: float=0.3,
- max_eval_positive: int=None
+ enforce_eval_balance: bool = False,
+ target_eval_freq: float = 0.3,
+ max_eval_positive: int = None,
  ):
  input_len = adata.shape[1]
  results = {}
-
+
  for start in range(0, input_len - window_size + 1, stride):
  center_idx = start + window_size // 2
  center_varname = adata.var_names[center_idx]

@@ -106,18 +111,22 @@ def run_sliding_window_lightning_training(
  label_col=label_col,
  batch_size=64,
  window_start=start,
- window_size=window_size
+ window_size=window_size,
  )
  datamodule.setup()

  # Build model for this window
  model = model_class(window_size, num_classes)
  wrapper = TorchClassifierWrapper(
- model, label_col=label_col, num_classes=num_classes,
+ model,
+ label_col=label_col,
+ num_classes=num_classes,
  class_names=class_names,
  class_weights=class_weights,
- focus_class=focus_class, enforce_eval_balance=enforce_eval_balance,
- target_eval_freq=target_eval_freq, max_eval_positive=max_eval_positive
+ focus_class=focus_class,
+ enforce_eval_balance=enforce_eval_balance,
+ target_eval_freq=target_eval_freq,
+ max_eval_positive=max_eval_positive,
  )

  # Train model

@@ -129,7 +138,7 @@ def run_sliding_window_lightning_training(
  "model": wrapper,
  "trainer": trainer,
  "checkpoint": ckpt,
- "metrics": trainer.callback_metrics
+ "metrics": trainer.callback_metrics,
  }
-
+
  return results

@@ -1,16 +1,12 @@
  from ..data import AnnDataModule
  from ..models import SklearnModelWrapper

- def train_sklearn_model(
- model_wrapper,
- datamodule,
- evaluate_test=True,
- evaluate_val=False
- ):
+
+ def train_sklearn_model(model_wrapper, datamodule, evaluate_test=True, evaluate_val=False):
  """
  Fits a SklearnModelWrapper on the train split from datamodule.
  Evaluates on test and/or val set.
-
+
  Parameters:
  model_wrapper: SklearnModelWrapper instance
  datamodule: AnnDataModule instance (with setup() method)

@@ -39,6 +35,7 @@ def train_sklearn_model(

  return metrics

+
  def run_sliding_window_sklearn_training(
  adata,
  tensor_source,

@@ -58,7 +55,7 @@ def run_sliding_window_sklearn_training(
  enforce_eval_balance=False,
  target_eval_freq=0.3,
  max_eval_positive=None,
- **model_kwargs
+ **model_kwargs,
  ):
  """
  Sliding window training for sklearn models using AnnData.

@@ -86,29 +83,26 @@ def run_sliding_window_sklearn_training(
  train_frac=train_frac,
  val_frac=val_frac,
  test_frac=test_frac,
- random_seed=random_seed
+ random_seed=random_seed,
  )
  datamodule.setup()

  # Build model wrapper
  sklearn_model = model_class(**model_kwargs)
  wrapper = SklearnModelWrapper(
- sklearn_model,
+ sklearn_model,
  num_classes=num_classes,
  label_col=label_col,
  class_names=class_names,
  focus_class=focus_class,
  enforce_eval_balance=enforce_eval_balance,
  target_eval_freq=target_eval_freq,
- max_eval_positive=max_eval_positive
+ max_eval_positive=max_eval_positive,
  )

  # Fit and evaluate
  metrics = train_sklearn_model(wrapper, datamodule, evaluate_test=True, evaluate_val=False)

- results[center_varname] = {
- "model": wrapper,
- "metrics": metrics
- }
+ results[center_varname] = {"model": wrapper, "metrics": metrics}

  return results

@@ -1,2 +1,2 @@
  from .device import detect_device
- from .grl import GradReverse
+ from .grl import GradReverse

@@ -1,10 +1,13 @@
  import torch

+
  def detect_device():
  device = (
- torch.device('cuda') if torch.cuda.is_available() else
- torch.device('mps') if torch.backends.mps.is_available() else
- torch.device('cpu')
+ torch.device("cuda")
+ if torch.cuda.is_available()
+ else torch.device("mps")
+ if torch.backends.mps.is_available()
+ else torch.device("cpu")
  )
  print(f"Detected device: {device}")
- return device
+ return device

@@ -1,5 +1,6 @@
  import torch

+
  class GradReverse(torch.autograd.Function):
  @staticmethod
  def forward(ctx, x, alpha):

@@ -10,5 +11,6 @@ class GradReverse(torch.autograd.Function):
  def backward(ctx, grad_output):
  return -ctx.alpha * grad_output, None

+
  def grad_reverse(x, alpha=1.0):
- return GradReverse.apply(x, alpha)
+ return GradReverse.apply(x, alpha)