pg-sui: pg_sui-1.6.16a3-py3-none-any.whl → pg_sui-1.7.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (33)
  1. {pg_sui-1.6.16a3.dist-info → pg_sui-1.7.0.dist-info}/METADATA +26 -30
  2. {pg_sui-1.6.16a3.dist-info → pg_sui-1.7.0.dist-info}/RECORD +29 -33
  3. pgsui/__init__.py +0 -8
  4. pgsui/_version.py +2 -2
  5. pgsui/cli.py +577 -125
  6. pgsui/data_processing/config.py +1 -2
  7. pgsui/data_processing/containers.py +203 -530
  8. pgsui/data_processing/transformers.py +44 -20
  9. pgsui/impute/deterministic/imputers/mode.py +475 -182
  10. pgsui/impute/deterministic/imputers/ref_allele.py +454 -147
  11. pgsui/impute/supervised/imputers/hist_gradient_boosting.py +4 -3
  12. pgsui/impute/supervised/imputers/random_forest.py +3 -2
  13. pgsui/impute/unsupervised/base.py +1269 -534
  14. pgsui/impute/unsupervised/callbacks.py +28 -33
  15. pgsui/impute/unsupervised/imputers/autoencoder.py +870 -841
  16. pgsui/impute/unsupervised/imputers/vae.py +931 -787
  17. pgsui/impute/unsupervised/loss_functions.py +156 -202
  18. pgsui/impute/unsupervised/models/autoencoder_model.py +7 -49
  19. pgsui/impute/unsupervised/models/vae_model.py +40 -221
  20. pgsui/impute/unsupervised/nn_scorers.py +53 -13
  21. pgsui/utils/classification_viz.py +240 -97
  22. pgsui/utils/misc.py +201 -3
  23. pgsui/utils/plotting.py +73 -58
  24. pgsui/utils/pretty_metrics.py +2 -6
  25. pgsui/utils/scorers.py +39 -0
  26. pgsui/impute/unsupervised/imputers/nlpca.py +0 -1666
  27. pgsui/impute/unsupervised/imputers/ubp.py +0 -1660
  28. pgsui/impute/unsupervised/models/nlpca_model.py +0 -206
  29. pgsui/impute/unsupervised/models/ubp_model.py +0 -200
  30. {pg_sui-1.6.16a3.dist-info → pg_sui-1.7.0.dist-info}/WHEEL +0 -0
  31. {pg_sui-1.6.16a3.dist-info → pg_sui-1.7.0.dist-info}/entry_points.txt +0 -0
  32. {pg_sui-1.6.16a3.dist-info → pg_sui-1.7.0.dist-info}/licenses/LICENSE +0 -0
  33. {pg_sui-1.6.16a3.dist-info → pg_sui-1.7.0.dist-info}/top_level.txt +0 -0
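Note: the 1.7.0 wheel removes the NLPCA and UBP imputer modules outright (entries 26-29 above). A minimal, hypothetical guard for downstream code that still imports the removed classes; this assumes they are simply absent in 1.7.0 and names no replacement, since the diff shows none:

    # Hypothetical compatibility shim for code written against pg-sui <= 1.6.x.
    # The module below is deleted in 1.7.0 (entry 27), so the import fails there.
    try:
        from pgsui.impute.unsupervised.imputers.ubp import ImputeUBP
    except ImportError:  # pg-sui >= 1.7.0
        ImputeUBP = None  # caller must select a different imputer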
pgsui/impute/unsupervised/imputers/ubp.py (file deleted)
@@ -1,1660 +0,0 @@
1
- import copy
2
- from typing import TYPE_CHECKING, Any, Dict, Literal, Optional, Tuple
3
-
4
- from fastapi import params
5
- import numpy as np
6
- import optuna
7
- import torch
8
- import torch.nn.functional as F
9
- from sklearn.decomposition import PCA
10
- from sklearn.exceptions import NotFittedError
11
- from sklearn.model_selection import train_test_split
12
- from snpio.analysis.genotype_encoder import GenotypeEncoder
13
- from snpio.utils.logging import LoggerManager
14
-
15
- from pgsui.data_processing.config import apply_dot_overrides, load_yaml_to_dataclass
16
- from pgsui.data_processing.containers import UBPConfig
17
- from pgsui.data_processing.transformers import SimMissingTransformer
18
- from pgsui.impute.unsupervised.base import BaseNNImputer
19
- from pgsui.impute.unsupervised.callbacks import EarlyStopping
20
- from pgsui.impute.unsupervised.loss_functions import SafeFocalCELoss
21
- from pgsui.impute.unsupervised.models.ubp_model import UBPModel
22
- from pgsui.utils.logging_utils import configure_logger
23
- from pgsui.utils.pretty_metrics import PrettyMetrics
24
-
25
- if TYPE_CHECKING:
26
- from snpio import TreeParser
27
- from snpio.read_input.genotype_data import GenotypeData
28
-
29
-
30
- def ensure_ubp_config(config: UBPConfig | dict | str | None) -> UBPConfig:
31
- """Return a concrete UBPConfig from dataclass, dict, YAML path, or None.
32
-
33
-     This function normalizes the input configuration for the UBP imputer. It accepts a UBPConfig instance, a dictionary, a YAML file path, or None. If None is provided, it returns a default UBPConfig instance. If a YAML path is given, it loads the configuration from the file, supporting top-level presets. If a dictionary is provided, it flattens any nested structures and applies dot-key overrides to a base configuration, which can also be influenced by a preset if specified. The function ensures that the final output is a fully populated UBPConfig instance.
34
-
35
- Args:
36
- config: UBPConfig | dict | YAML path | None.
37
-
38
- Returns:
39
- UBPConfig: Normalized configuration instance.
40
- """
41
- if config is None:
42
- return UBPConfig()
43
- if isinstance(config, UBPConfig):
44
- return config
45
- if isinstance(config, str):
46
- # YAML path — support top-level `preset`
47
- return load_yaml_to_dataclass(config, UBPConfig)
48
- if isinstance(config, dict):
49
- base = UBPConfig()
50
-
51
- def _flatten(prefix: str, d: dict, out: dict) -> dict:
52
- for k, v in d.items():
53
- kk = f"{prefix}.{k}" if prefix else k
54
- if isinstance(v, dict):
55
- _flatten(kk, v, out)
56
- else:
57
- out[kk] = v
58
- return out
59
-
60
- preset_name = config.pop("preset", None)
61
- if "io" in config and isinstance(config["io"], dict):
62
- preset_name = preset_name or config["io"].pop("preset", None)
63
- if preset_name:
64
- base = UBPConfig.from_preset(preset_name)
65
-
66
- flat = _flatten("", config, {})
67
- return apply_dot_overrides(base, flat)
68
-
69
- raise TypeError("config must be a UBPConfig, dict, YAML path, or None.")
70
-
71
-
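The ensure_ubp_config helper above accepts a UBPConfig instance, a nested dict, a YAML path, or None; nested dicts are flattened to dot-keyed overrides, and a top-level `preset` is resolved through UBPConfig.from_preset. A hedged usage sketch (the preset name "fast" is an assumption; model.latent_dim and train.learning_rate match fields read in __init__ below):

    # Sketch only: "fast" is an assumed preset name, not taken from the package.
    cfg = ensure_ubp_config(
        {
            "preset": "fast",                  # resolved via UBPConfig.from_preset(...)
            "model": {"latent_dim": 8},        # flattened to "model.latent_dim"
            "train": {"learning_rate": 1e-3},  # flattened to "train.learning_rate"
        }
    )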
72
- class ImputeUBP(BaseNNImputer):
73
- """UBP imputer for 0/1/2 genotypes with a three-phase decoder schedule.
74
-
75
- This imputer follows the training recipe from Unsupervised Backpropagation:
76
-
77
- 1. Phase 1 (joint warm start): Learn latent codes and the shallow linear decoder together.
78
- 2. Phase 2 (deep decoder reset): Reinitialize the deeper decoder, freeze the latent codes, and train only the decoder parameters.
79
- 3. Phase 3 (joint fine-tune): Unfreeze everything and jointly refine latent codes plus the deep decoder before evaluation/reporting.
80
-
81
- References:
82
- - Gashler, Michael S., Smith, Michael R., Morris, R., and Martinez, T. (2016) Missing Value Imputation with Unsupervised Backpropagation. Computational Intelligence, 32: 196-215. doi: 10.1111/coin.12048.
83
- """
84
-
85
- def __init__(
86
- self,
87
- genotype_data: "GenotypeData",
88
- *,
89
- tree_parser: Optional["TreeParser"] = None,
90
- config: UBPConfig | dict | str | None = None,
91
- overrides: dict | None = None,
92
- simulate_missing: bool | None = None,
93
- sim_strategy: (
94
- Literal[
95
- "random",
96
- "random_weighted",
97
- "random_weighted_inv",
98
- "nonrandom",
99
- "nonrandom_weighted",
100
- ]
101
- | None
102
- ) = None,
103
- sim_prop: float | None = None,
104
- sim_kwargs: dict | None = None,
105
- ):
106
- """Initialize the UBP imputer via dataclass/dict/YAML config with overrides.
107
-
108
- This constructor allows for flexible initialization of the UBP imputer by accepting various forms of configuration input. It ensures that the configuration is properly normalized and any specified overrides are applied. The method also sets up logging and initializes various attributes related to the model, training, tuning, and evaluation based on the provided configuration.
109
-
110
- Args:
111
- genotype_data (GenotypeData): Backing genotype data object.
112
-             tree_parser (TreeParser | None): Optional SNPio phylogenetic tree parser, required for the nonrandom sim_strategy modes.
113
- config (UBPConfig | dict | str | None): UBP configuration.
114
- overrides (dict | None): Flat dot-key overrides applied after `config`.
115
- simulate_missing (bool | None): Whether to simulate missing data during training.
116
- sim_strategy (Literal[...] | None): Simulated missing strategy if simulating.
117
- sim_prop (float | None): Proportion of data to simulate as missing if simulating.
118
- sim_kwargs (dict | None): Additional kwargs for SimMissingTransformer.
119
- """
120
- self.model_name = "ImputeUBP"
121
- self.genotype_data = genotype_data
122
- self.tree_parser = tree_parser
123
-
124
- # ---- normalize config, then apply overrides ----
125
- cfg = ensure_ubp_config(config)
126
- if overrides:
127
- cfg = apply_dot_overrides(cfg, overrides)
128
- self.cfg = cfg
129
-
130
- # ---- logging ----
131
- logman = LoggerManager(
132
- __name__,
133
- prefix=self.cfg.io.prefix,
134
- debug=self.cfg.io.debug,
135
- verbose=self.cfg.io.verbose,
136
- )
137
- self.logger = configure_logger(
138
- logman.get_logger(),
139
- verbose=self.cfg.io.verbose,
140
- debug=self.cfg.io.debug,
141
- )
142
-
143
- # ---- Base init ----
144
- super().__init__(
145
- model_name=self.model_name,
146
- genotype_data=self.genotype_data,
147
- prefix=self.cfg.io.prefix,
148
- device=self.cfg.train.device,
149
- verbose=self.cfg.io.verbose,
150
- debug=self.cfg.io.debug,
151
- )
152
-
153
- # ---- model/meta ----
154
- self.Model = UBPModel
155
- self.pgenc = GenotypeEncoder(genotype_data)
156
-
157
- self.seed = self.cfg.io.seed
158
- self.n_jobs = self.cfg.io.n_jobs
159
- self.prefix = self.cfg.io.prefix
160
- self.scoring_averaging = self.cfg.io.scoring_averaging
161
- self.verbose = self.cfg.io.verbose
162
- self.debug = self.cfg.io.debug
163
- self.rng = np.random.default_rng(self.seed)
164
- self.pos_weights_: torch.Tensor | None = None
165
-
166
- # Simulated-missing controls (config defaults w/ overrides)
167
- sim_cfg = getattr(self.cfg, "sim", None)
168
- sim_cfg_kwargs = copy.deepcopy(getattr(sim_cfg, "sim_kwargs", None) or {})
169
- if sim_kwargs:
170
- sim_cfg_kwargs.update(sim_kwargs)
171
- if sim_cfg is None:
172
- default_sim_flag = bool(simulate_missing)
173
- default_strategy = "random"
174
- default_prop = 0.10
175
- else:
176
- default_sim_flag = sim_cfg.simulate_missing
177
- default_strategy = sim_cfg.sim_strategy
178
- default_prop = sim_cfg.sim_prop
179
- self.simulate_missing = (
180
- default_sim_flag if simulate_missing is None else bool(simulate_missing)
181
- )
182
- self.sim_strategy = sim_strategy or default_strategy
183
- self.sim_prop = float(sim_prop if sim_prop is not None else default_prop)
184
- self.sim_kwargs = sim_cfg_kwargs
185
-
186
- # ---- model hyperparams ----
187
- self.latent_dim = self.cfg.model.latent_dim
188
- self.dropout_rate = self.cfg.model.dropout_rate
189
- self.num_hidden_layers = self.cfg.model.num_hidden_layers
190
- self.layer_scaling_factor = self.cfg.model.layer_scaling_factor
191
- self.layer_schedule = self.cfg.model.layer_schedule
192
- self.latent_init: Literal["pca", "random"] = self.cfg.model.latent_init
193
- self.activation = self.cfg.model.hidden_activation
194
- self.gamma = self.cfg.model.gamma
195
-
196
- # ---- training ----
197
- self.batch_size = self.cfg.train.batch_size
198
- self.learning_rate = self.cfg.train.learning_rate
199
- self.lr_input_factor = self.cfg.train.lr_input_factor
200
- self.l1_penalty = self.cfg.train.l1_penalty
201
- self.early_stop_gen = self.cfg.train.early_stop_gen
202
- self.min_epochs = self.cfg.train.min_epochs
203
- self.epochs = self.cfg.train.max_epochs
204
- self.validation_split = self.cfg.train.validation_split
205
- self.beta = self.cfg.train.weights_beta
206
- self.max_ratio = self.cfg.train.weights_max_ratio
207
-
208
- # ---- tuning ----
209
- self.tune = self.cfg.tune.enabled
210
- self.tune_fast = self.cfg.tune.fast
211
- self.tune_proxy_metric_batch = self.cfg.tune.proxy_metric_batch
212
- self.tune_batch_size = self.cfg.tune.batch_size
213
- self.tune_epochs = self.cfg.tune.epochs
214
- self.tune_eval_interval = self.cfg.tune.eval_interval
215
- self.tune_metric: Literal[
216
- "pr_macro",
217
- "f1",
218
- "accuracy",
219
- "average_precision",
220
- "precision",
221
- "recall",
222
- "roc_auc",
223
- ] = self.cfg.tune.metric
224
- self.n_trials = self.cfg.tune.n_trials
225
- self.tune_save_db = self.cfg.tune.save_db
226
- self.tune_resume = self.cfg.tune.resume
227
- self.tune_max_samples = self.cfg.tune.max_samples
228
- self.tune_max_loci = self.cfg.tune.max_loci
229
- self.tune_infer_epochs = getattr(self.cfg.tune, "infer_epochs", 100)
230
- self.tune_patience = self.cfg.tune.patience
231
-
232
- # ---- evaluation ----
233
- self.eval_latent_steps = self.cfg.evaluate.eval_latent_steps
234
- self.eval_latent_lr = self.cfg.evaluate.eval_latent_lr
235
- self.eval_latent_weight_decay = self.cfg.evaluate.eval_latent_weight_decay
236
-
237
- # ---- plotting ----
238
- self.plot_format = self.cfg.plot.fmt
239
- self.plot_dpi = self.cfg.plot.dpi
240
- self.plot_fontsize = self.cfg.plot.fontsize
241
- self.title_fontsize = self.cfg.plot.fontsize
242
- self.despine = self.cfg.plot.despine
243
- self.show_plots = self.cfg.plot.show
244
-
245
- # ---- core runtime ----
246
- self.is_haploid = False
247
- self.num_classes_ = False
248
- self.model_params: Dict[str, Any] = {}
249
- self.sim_mask_global_: np.ndarray | None = None
250
- self.sim_mask_train_: np.ndarray | None = None
251
- self.sim_mask_test_: np.ndarray | None = None
252
-
253
- if self.tree_parser is None and self.sim_strategy.startswith("nonrandom"):
254
- msg = "tree_parser is required for nonrandom and nonrandom_weighted simulated missing strategies."
255
- self.logger.error(msg)
256
- raise ValueError(msg)
257
-
258
- def fit(self) -> "ImputeUBP":
259
- """Fit the UBP decoder on 0/1/2 encodings (missing = -1) via three phases.
260
-
261
- 1. Phase 1 initializes latent vectors alongside the linear decoder.
262
- 2. Phase 2 resets and trains the deeper decoder while latents remain fixed.
263
- 3. Phase 3 jointly fine-tunes latents plus the deep decoder before evaluation.
264
-
265
- Returns:
266
- ImputeUBP: Fitted instance.
267
-
268
- Raises:
269
- NotFittedError: If training fails.
270
- """
271
- self.logger.info(f"Fitting {self.model_name} model...")
272
-
273
- # --- Use 0/1/2 with -1 for missing ---
274
- X012 = self._get_float_genotypes(copy=True)
275
- GT_full = np.nan_to_num(X012, nan=-1.0, copy=True)
276
- self.ground_truth_ = GT_full.astype(np.int64, copy=False)
277
-
278
- cache_key = self._sim_mask_cache_key()
279
- self.sim_mask_global_ = None
280
- if self.simulate_missing:
281
- cached_mask = (
282
- None if cache_key is None else self._sim_mask_cache.get(cache_key)
283
- )
284
- if cached_mask is not None:
285
- self.sim_mask_global_ = cached_mask.copy()
286
- else:
287
- tr = SimMissingTransformer(
288
- genotype_data=self.genotype_data,
289
- tree_parser=self.tree_parser,
290
- prop_missing=self.sim_prop,
291
- strategy=self.sim_strategy,
292
- missing_val=-9,
293
- mask_missing=True,
294
- verbose=self.verbose,
295
- **self.sim_kwargs,
296
- )
297
- tr.fit(X012.copy())
298
- self.sim_mask_global_ = tr.sim_missing_mask_.astype(bool)
299
- if cache_key is not None:
300
- self._sim_mask_cache[cache_key] = self.sim_mask_global_.copy()
301
-
302
- X_for_model = self.ground_truth_.copy()
303
- if self.sim_mask_global_ is not None:
304
- X_for_model[self.sim_mask_global_] = -1
305
-
306
- # --- Determine ploidy (haploid vs diploid) and classes ---
307
- self.is_haploid = bool(
308
- np.all(
309
- np.isin(
310
- self.genotype_data.snp_data,
311
- ["A", "C", "G", "T", "N", "-", ".", "?"],
312
- )
313
- )
314
- )
315
- self.ploidy = 1 if self.is_haploid else 2
316
-
317
- if self.is_haploid:
318
- self.num_classes_ = 2
319
- self.ground_truth_[self.ground_truth_ == 2] = 1
320
- X_for_model[X_for_model == 2] = 1
321
- self.logger.info("Haploid data detected. Using 2 classes (REF=0, ALT=1).")
322
- else:
323
- self.num_classes_ = 3
324
- self.logger.info(
325
- "Diploid data detected. Using 3 classes (REF=0, HET=1, ALT=2) for scoring."
326
- )
327
- # Model head always uses two channels; scoring uses num_classes_
328
- self.output_classes_ = 2
329
-
330
- n_samples, self.num_features_ = X_for_model.shape
331
-
332
- # --- model params (decoder: Z -> L * num_classes) ---
333
- self.model_params = {
334
- "n_features": self.num_features_,
335
- "num_classes": self.output_classes_,
336
- "latent_dim": self.latent_dim,
337
- "dropout_rate": self.dropout_rate,
338
- "activation": self.activation,
339
- # hidden_layer_sizes injected later
340
- }
341
-
342
- # --- split ---
343
- indices = np.arange(n_samples)
344
- train_idx, test_idx = train_test_split(
345
- indices, test_size=self.validation_split, random_state=self.seed
346
- )
347
- self.train_idx_, self.test_idx_ = train_idx, test_idx
348
- self.X_train_ = X_for_model[train_idx]
349
- self.X_test_ = X_for_model[test_idx]
350
- self.GT_train_full_ = self.ground_truth_[train_idx]
351
- self.GT_test_full_ = self.ground_truth_[test_idx]
352
-
353
- if self.sim_mask_global_ is not None:
354
- self.sim_mask_train_ = self.sim_mask_global_[train_idx]
355
- self.sim_mask_test_ = self.sim_mask_global_[test_idx]
356
- else:
357
- self.sim_mask_train_ = None
358
- self.sim_mask_test_ = None
359
-
360
- # pos weights for diploid multilabel path
361
- if not self.is_haploid:
362
- self.pos_weights_ = self._compute_pos_weights(self.X_train_)
363
- else:
364
- self.pos_weights_ = None
365
-
366
- # --- plotting/scorers & tuning ---
367
- self.plotter_, self.scorers_ = self.initialize_plotting_and_scorers()
368
- if self.tune:
369
- self.tune_hyperparameters()
370
-
371
- # Fall back to default model params when none have been selected yet.
372
- if not getattr(self, "best_params_", None):
373
- self.best_params_ = self._set_best_params_default()
374
-
375
- # --- class weights for 0/1/2 ---
376
- self.class_weights_ = self._normalize_class_weights(
377
- self._class_weights_from_zygosity(self.X_train_)
378
- )
379
-
380
- # --- latent init & loader ---
381
- train_latent_vectors = self._create_latent_space(
382
- self.best_params_, len(self.X_train_), self.X_train_, self.latent_init
383
- )
384
- train_loader = self._get_data_loaders(self.X_train_)
385
-
386
- # --- final training (three-phase under the hood) ---
387
- (self.best_loss_, self.model_, self.history_, self.train_latent_vectors_) = (
388
- self._train_final_model(
389
- loader=train_loader,
390
- best_params=self.best_params_,
391
- initial_latent_vectors=train_latent_vectors,
392
- )
393
- )
394
-
395
- self.is_fit_ = True
396
- self.plotter_.plot_history(self.history_)
397
- eval_mask = (
398
- self.sim_mask_test_
399
- if (self.simulate_missing and self.sim_mask_test_ is not None)
400
- else None
401
- )
402
- self._evaluate_model(
403
- self.X_test_,
404
- self.model_,
405
- self.best_params_,
406
- eval_mask_override=eval_mask,
407
- )
408
- self._save_best_params(self.best_params_)
409
- return self
410
-
411
- def transform(self) -> np.ndarray:
412
- """Impute missing genotypes (0/1/2) and return IUPAC strings.
413
-
414
- This method first checks if the model has been fitted. It then imputes the entire dataset by optimizing latent vectors for the ground truth data and predicting the missing genotypes using the trained UBP model. The imputed genotypes are decoded to IUPAC format, and genotype distributions are plotted only when ``self.show_plots`` is enabled.
415
-
416
- Returns:
417
- np.ndarray: IUPAC single-character array (n_samples x L).
418
-
419
- Raises:
420
- NotFittedError: If called before fit().
421
- """
422
- if not getattr(self, "is_fit_", False):
423
- raise NotFittedError("Model is not fitted. Call fit() before transform().")
424
-
425
- self.logger.info(f"Imputing entire dataset with {self.model_name}...")
426
- X_to_impute = self.ground_truth_.copy()
427
-
428
- optimized_latents = self._optimize_latents_for_inference(
429
- X_to_impute, self.model_, self.best_params_
430
- )
431
-
432
- if not isinstance(optimized_latents, torch.nn.Parameter):
433
- optimized_latents = torch.nn.Parameter(
434
- optimized_latents, requires_grad=False
435
- )
436
-
437
- pred_labels, _ = self._predict(self.model_, latent_vectors=optimized_latents)
438
-
439
- missing_mask = X_to_impute == -1
440
- imputed_array = X_to_impute.copy()
441
- imputed_array[missing_mask] = pred_labels[missing_mask]
442
-
443
- # Decode to IUPAC for return & optional plots
444
- imputed_genotypes = self.pgenc.decode_012(imputed_array)
445
- if self.show_plots:
446
- original_genotypes = self.pgenc.decode_012(X_to_impute)
447
- self.plotter_.plot_gt_distribution(original_genotypes, is_imputed=False)
448
- self.plotter_.plot_gt_distribution(imputed_genotypes, is_imputed=True)
449
- return imputed_genotypes
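Together, fit() and transform() give the class its two-call workflow. A hypothetical driver for the code being removed here, assuming an already-loaded SNPio GenotypeData object `gd`:

    # Hypothetical usage sketch; `gd` is a snpio GenotypeData object loaded elsewhere.
    imputer = ImputeUBP(gd, config={"train": {"max_epochs": 100}})
    imputer.fit()                 # three-phase training plus held-out evaluation
    iupac = imputer.transform()   # (n_samples x n_loci) array of IUPAC characters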
450
-
451
- def _train_step(
452
- self,
453
- loader: torch.utils.data.DataLoader,
454
- optimizer: torch.optim.Optimizer,
455
- latent_optimizer: torch.optim.Optimizer,
456
- model: torch.nn.Module,
457
- l1_penalty: float,
458
- latent_vectors: torch.nn.Parameter,
459
- class_weights: torch.Tensor,
460
- phase: int,
461
- ) -> Tuple[float, torch.nn.Parameter]:
462
- """One epoch with stable focal CE, grad clipping, and NaN guards.
463
-
464
- Returns:
465
- Tuple[float, torch.nn.Parameter]: Mean loss and updated latents.
466
- """
467
- model.train()
468
- running, used = 0.0, 0
469
-
470
- if not isinstance(latent_vectors, torch.nn.Parameter):
471
- latent_vectors = torch.nn.Parameter(latent_vectors, requires_grad=True)
472
-
473
- gamma = float(getattr(model, "gamma", getattr(self, "gamma", 0.0)))
474
- gamma = max(0.0, min(gamma, 10.0))
475
- l1_params = tuple(p for p in model.parameters() if p.requires_grad)
476
- if class_weights is not None and class_weights.device != self.device:
477
- class_weights = class_weights.to(self.device)
478
-
479
- criterion = SafeFocalCELoss(gamma=gamma, weight=class_weights, ignore_index=-1)
480
- decoder: torch.Tensor | torch.nn.Module = (
481
- model.phase1_decoder if phase == 1 else model.phase23_decoder
482
- )
483
-
484
- if not isinstance(decoder, torch.nn.Module):
485
- msg = f"{self.model_name} Decoder is not a torch.nn.Module."
486
- self.logger.error(msg)
487
- raise TypeError(msg)
488
-
489
- for batch_indices, y_batch in loader:
490
- optimizer.zero_grad(set_to_none=True)
491
- latent_optimizer.zero_grad(set_to_none=True)
492
-
493
- batch_indices = batch_indices.to(latent_vectors.device, non_blocking=True)
494
- z = latent_vectors[batch_indices]
495
- y = y_batch.to(self.device, non_blocking=True).long()
496
-
497
- logits = decoder(z).view(
498
- len(batch_indices), self.num_features_, self.output_classes_
499
- )
500
-
501
- # Guard upstream explosions
502
- if not torch.isfinite(logits).all():
503
- continue
504
-
505
- if self.is_haploid:
506
- loss = criterion(logits.view(-1, self.output_classes_), y.view(-1))
507
- else:
508
- targets = self._multi_hot_targets(y)
509
- bce = F.binary_cross_entropy_with_logits(
510
- logits, targets, pos_weight=self.pos_weights_, reduction="none"
511
- )
512
- mask = (y != -1).unsqueeze(-1).float()
513
- loss = (bce * mask).sum() / mask.sum().clamp_min(1e-8)
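    # Annotation (inference, not part of the removed file): _multi_hot_targets is not
    # shown in this diff, but the composition used in _predict (p_het = p_ref * p_alt)
    # implies a two-channel multi-hot target, i.e. 0 -> [1, 0], 1 -> [1, 1], 2 -> [0, 1];
    # entries with y == -1 are excluded from the BCE by the mask above.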
514
-
515
- if l1_penalty > 0:
516
- l1 = torch.zeros((), device=self.device)
517
- for p in l1_params:
518
- l1 = l1 + p.abs().sum()
519
- loss = loss + l1_penalty * l1
520
-
521
- if not torch.isfinite(loss):
522
- continue
523
-
524
- loss.backward()
525
-
526
- # Clip returns the Total Norm
527
- model_norm = torch.nn.utils.clip_grad_norm_(model.parameters(), 1.0)
528
- latent_norm = torch.nn.utils.clip_grad_norm_([latent_vectors], 1.0)
529
-
530
- # Skip update on non-finite grads
531
- # Check norms instead of iterating all parameters
532
- if torch.isfinite(model_norm) and torch.isfinite(latent_norm):
533
- optimizer.step()
534
- if phase != 2:
535
- latent_optimizer.step()
536
- else:
537
- # Logic to handle bad grads (zero out, skip, etc)
538
- optimizer.zero_grad(set_to_none=True)
539
- latent_optimizer.zero_grad(set_to_none=True)
540
-
541
- running += float(loss.detach().item())
542
- used += 1
543
-
544
- return (running / used if used > 0 else float("inf")), latent_vectors
545
-
546
- def _predict(
547
- self,
548
- model: torch.nn.Module,
549
- latent_vectors: Optional[torch.nn.Parameter | torch.Tensor] = None,
550
- ) -> Tuple[np.ndarray, np.ndarray]:
551
- """Predict 0/1/2 labels & probabilities from latents via phase23 decoder. This method requires a trained model and latent vectors.
552
-
553
- Args:
554
- model (torch.nn.Module): Trained model.
555
- latent_vectors (torch.nn.Parameter | None): Latent vectors.
556
-
557
- Returns:
558
- Tuple[np.ndarray, np.ndarray]: Predicted labels and probabilities.
559
- """
560
- if model is None or latent_vectors is None:
561
- msg = "Model and latent vectors must be provided for prediction. Fit the model first."
562
- self.logger.error(msg)
563
- raise NotFittedError(msg)
564
-
565
- model.eval()
566
- nF = getattr(model, "n_features", self.num_features_)
567
- with torch.no_grad():
568
- decoder = model.phase23_decoder
569
-
570
- if not isinstance(decoder, torch.nn.Module):
571
- msg = f"{self.model_name} decoder is not a valid torch.nn.Module."
572
- self.logger.error(msg)
573
- raise TypeError(msg)
574
-
575
- logits = decoder(latent_vectors.to(self.device)).view(
576
- len(latent_vectors), nF, self.output_classes_
577
- )
578
- if self.is_haploid:
579
- probas = torch.softmax(logits, dim=-1)
580
- labels = torch.argmax(probas, dim=-1)
581
- else:
582
- probas2 = torch.sigmoid(logits)
583
- p_ref = probas2[..., 0]
584
- p_alt = probas2[..., 1]
585
- p_het = p_ref * p_alt
586
- p_ref_only = p_ref * (1 - p_alt)
587
- p_alt_only = p_alt * (1 - p_ref)
588
- probas = torch.stack([p_ref_only, p_het, p_alt_only], dim=-1)
589
- probas = probas / probas.sum(dim=-1, keepdim=True).clamp_min(1e-8)
590
- labels = torch.argmax(probas, dim=-1)
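    # Worked example (annotation, not part of the removed file): with per-channel
    # sigmoids p_ref = 0.9 and p_alt = 0.4, the stacked vector [p_ref_only, p_het,
    # p_alt_only] is [0.54, 0.36, 0.04]; renormalizing gives ~[0.574, 0.383, 0.043],
    # so argmax selects REF (class 0).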
591
-
592
- return labels.cpu().numpy(), probas.cpu().numpy()
593
-
594
- def _evaluate_model(
595
- self,
596
- X_val: np.ndarray,
597
- model: torch.nn.Module,
598
- params: dict,
599
- objective_mode: bool = False,
600
- latent_vectors_val: torch.Tensor | None = None,
601
- *,
602
- eval_mask_override: np.ndarray | None = None,
603
- ) -> Dict[str, float]:
604
- """Evaluates the model on a validation set.
605
-
606
- This method evaluates the trained UBP model on a validation dataset by optimizing latent vectors for the validation samples, predicting genotypes, and computing various performance metrics. It can operate in an objective mode that suppresses logging for automated evaluations.
607
-
608
- Args:
609
- X_val (np.ndarray): Validation data in 0/1/2 encoding with -1 for missing.
610
- model (torch.nn.Module): Trained UBP model.
611
- params (dict): Model parameters.
612
- objective_mode (bool): If True, suppresses logging and reports only the metric.
613
- latent_vectors_val (torch.Tensor | None): Pre-optimized latent vectors for validation data.
614
- eval_mask_override (np.ndarray | None): Boolean mask to specify which entries to evaluate.
615
-
616
- Returns:
617
- Dict[str, float]: Dictionary of evaluation metrics.
618
- """
619
- if latent_vectors_val is not None:
620
- test_latent_vectors = latent_vectors_val
621
- else:
622
- test_latent_vectors = self._optimize_latents_for_inference(
623
- X_val, model, params
624
- )
625
-
626
- pred_labels, pred_probas = self._predict(
627
- model=model, latent_vectors=test_latent_vectors
628
- )
629
-
630
- if eval_mask_override is not None:
631
- # Validate row counts to allow feature subsetting during tuning
632
- if eval_mask_override.shape[0] != X_val.shape[0]:
633
- msg = (
634
- f"eval_mask_override rows {eval_mask_override.shape[0]} "
635
- f"does not match X_val rows {X_val.shape[0]}"
636
- )
637
- self.logger.error(msg)
638
- raise ValueError(msg)
639
-
640
- # FIX: Slice mask columns if override is wider than current X_val (tune_fast)
641
- if eval_mask_override.shape[1] > X_val.shape[1]:
642
- eval_mask = eval_mask_override[:, : X_val.shape[1]].astype(bool)
643
- else:
644
- eval_mask = eval_mask_override.astype(bool)
645
- else:
646
- # Default: score only observed entries
647
- eval_mask = X_val != -1
648
-
649
- # y_true should be drawn from the pre-mask ground truth
650
- # Map X_val back to the correct full ground truth slice
651
- # FIX: Check shape[0] (n_samples) only.
652
- if X_val.shape[0] == self.X_test_.shape[0]:
653
- GT_ref = self.GT_test_full_
654
- elif X_val.shape[0] == self.X_train_.shape[0]:
655
- GT_ref = self.GT_train_full_
656
- else:
657
- GT_ref = self.ground_truth_
658
-
659
- # FIX: Slice Ground Truth columns if it is wider than X_val (tune_fast)
660
- if GT_ref.shape[1] > X_val.shape[1]:
661
- GT_ref = GT_ref[:, : X_val.shape[1]]
662
-
663
- # Fallback safeguard
664
- if GT_ref.shape != X_val.shape:
665
- GT_ref = X_val
666
-
667
- y_true_flat = GT_ref[eval_mask]
668
- pred_labels_flat = pred_labels[eval_mask]
669
- pred_probas_flat = pred_probas[eval_mask]
670
-
671
- if y_true_flat.size == 0:
672
- return {self.tune_metric: 0.0}
673
-
674
- # For haploids, remap class 2 to 1 for scoring (e.g., f1-score)
675
- labels_for_scoring = [0, 1] if self.is_haploid else [0, 1, 2]
676
- target_names = ["REF", "ALT"] if self.is_haploid else ["REF", "HET", "ALT"]
677
-
678
- y_true_ohe = np.eye(len(labels_for_scoring))[y_true_flat]
679
-
680
- metrics = self.scorers_.evaluate(
681
- y_true_flat,
682
- pred_labels_flat,
683
- y_true_ohe,
684
- pred_probas_flat,
685
- objective_mode,
686
- self.tune_metric,
687
- )
688
-
689
- if not objective_mode:
690
- pm = PrettyMetrics(
691
- metrics, precision=3, title=f"{self.model_name} Validation Metrics"
692
- )
693
- pm.render() # prints a command-line table
694
-
695
- self._make_class_reports(
696
- y_true=y_true_flat,
697
- y_pred_proba=pred_probas_flat,
698
- y_pred=pred_labels_flat,
699
- metrics=metrics,
700
- labels=target_names,
701
- )
702
-
703
- # FIX: Use X_val dimensions for reshaping, not self.num_features_
704
- y_true_dec = self.pgenc.decode_012(
705
- GT_ref.reshape(X_val.shape[0], X_val.shape[1])
706
- )
707
-
708
- X_pred = X_val.copy()
709
- X_pred[eval_mask] = pred_labels_flat
710
-
711
- y_pred_dec = self.pgenc.decode_012(
712
- X_pred.reshape(X_val.shape[0], X_val.shape[1])
713
- )
714
-
715
- encodings_dict = {
716
- "A": 0,
717
- "C": 1,
718
- "G": 2,
719
- "T": 3,
720
- "W": 4,
721
- "R": 5,
722
- "M": 6,
723
- "K": 7,
724
- "Y": 8,
725
- "S": 9,
726
- "N": -1,
727
- }
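    # Annotation: the two-base IUPAC ambiguity codes above encode heterozygous calls
    # (W = A/T, R = A/G, M = A/C, K = G/T, Y = C/T, S = C/G); N maps to -1 (missing).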
728
-
729
- y_true_int = self.pgenc.convert_int_iupac(
730
- y_true_dec, encodings_dict=encodings_dict
731
- )
732
- y_pred_int = self.pgenc.convert_int_iupac(
733
- y_pred_dec, encodings_dict=encodings_dict
734
- )
735
-
736
- # For IUPAC report
737
- valid_true = y_true_int[eval_mask]
738
- valid_true = valid_true[valid_true >= 0] # drop -1 (N)
739
- iupac_label_set = ["A", "C", "G", "T", "W", "R", "M", "K", "Y", "S"]
740
-
741
- # For numeric report
742
- if (
743
- np.intersect1d(np.unique(y_true_flat), labels_for_scoring).size == 0
744
- or valid_true.size == 0
745
- ):
746
- if not objective_mode:
747
- self.logger.warning(
748
- "Skipped numeric confusion matrix: no y_true labels present."
749
- )
750
- else:
751
- self._make_class_reports(
752
- y_true=valid_true,
753
- y_pred=y_pred_int[eval_mask][y_true_int[eval_mask] >= 0],
754
- metrics=metrics,
755
- y_pred_proba=None,
756
- labels=iupac_label_set,
757
- )
758
-
759
- return metrics
760
-
761
- def _get_data_loaders(self, y: np.ndarray) -> torch.utils.data.DataLoader:
762
- """Create DataLoader over indices + 0/1/2 target matrix.
763
-
764
- This method creates a PyTorch DataLoader for the given genotype matrix, which contains 0/1/2 encodings with -1 for missing values. The DataLoader is constructed to yield batches of data during training, where each batch consists of indices and the corresponding genotype values. The genotype matrix is converted to a PyTorch tensor and moved to the appropriate device (CPU or GPU) before being wrapped in a TensorDataset. The DataLoader is configured to shuffle the data and use the specified batch size.
765
-
766
- Args:
767
- y (np.ndarray): (n_samples x L) int matrix with -1 missing.
768
-
769
- Returns:
770
- torch.utils.data.DataLoader: Shuffled mini-batches.
771
- """
772
- y_tensor = torch.from_numpy(y).long()
773
- indices = torch.arange(len(y), dtype=torch.long)
774
- dataset = torch.utils.data.TensorDataset(indices, y_tensor)
775
- pin_memory = self.device.type == "cuda"
776
- return torch.utils.data.DataLoader(
777
- dataset,
778
- batch_size=self.batch_size,
779
- shuffle=True,
780
- pin_memory=pin_memory,
781
- )
782
-
783
- def _objective(self, trial: optuna.Trial) -> float:
784
- """Optuna objective using the UBP training loop.
785
-
786
- This method defines the objective function for hyperparameter tuning using Optuna. It prepares the necessary artifacts for tuning, samples a set of hyperparameters for the current trial, and trains the UBP model using these hyperparameters. The model is evaluated on a validation set, and the specified tuning metric is returned as the objective value. If any exception occurs during the process, the trial is pruned.
787
- """
788
- try:
789
- self._prepare_tuning_artifacts()
790
- trial_params = self._sample_hyperparameters(trial)
791
- model_params = trial_params["model_params"]
792
-
793
- nfeat = self._tune_num_features
794
- if self.tune and self.tune_fast:
795
- model_params["n_features"] = nfeat
796
-
797
- X_train_trial = getattr(
798
- self, "X_train_", self.ground_truth_[self.train_idx_]
799
- )
800
- X_test_trial = getattr(self, "X_test_", self.ground_truth_[self.test_idx_])
801
-
802
- class_weights = self._normalize_class_weights(
803
- self._class_weights_from_zygosity(X_train_trial)
804
- )
805
- if not self.is_haploid:
806
- self.pos_weights_ = self._compute_pos_weights(X_train_trial)
807
- else:
808
- self.pos_weights_ = None
809
- train_loader = self._get_data_loaders(X_train_trial)
810
-
811
- train_latent_vectors = self._create_latent_space(
812
- model_params,
813
- len(X_train_trial),
814
- X_train_trial,
815
- trial_params["latent_init"],
816
- )
817
-
818
- model = self.build_model(self.Model, model_params)
819
- model.n_features = model_params["n_features"]
820
- model.apply(self.initialize_weights)
821
-
822
- _, model, __ = self._train_and_validate_model(
823
- model=model,
824
- loader=train_loader,
825
- lr=trial_params["lr"],
826
- l1_penalty=trial_params["l1_penalty"],
827
- trial=trial,
828
- return_history=False,
829
- latent_vectors=train_latent_vectors,
830
- lr_input_factor=trial_params["lr_input_factor"],
831
- class_weights=class_weights,
832
- X_val=X_test_trial,
833
- params=model_params,
834
- prune_metric=self.tune_metric,
835
- prune_warmup_epochs=10,
836
- eval_interval=self.tune_eval_interval,
837
- eval_requires_latents=True,
838
- eval_latent_steps=self.eval_latent_steps,
839
- eval_latent_lr=self.eval_latent_lr,
840
- eval_latent_weight_decay=self.eval_latent_weight_decay,
841
- )
842
-
843
- eval_mask = (
844
- self.sim_mask_test_
845
- if (
846
- self.simulate_missing
847
- and getattr(self, "sim_mask_test_", None) is not None
848
- )
849
- else None
850
- )
851
- metrics = self._evaluate_model(
852
- X_test_trial,
853
- model,
854
- model_params,
855
- objective_mode=True,
856
- eval_mask_override=eval_mask,
857
- )
858
- self._clear_resources(
859
- model, train_loader, latent_vectors=train_latent_vectors
860
- )
861
- return metrics[self.tune_metric]
862
- except Exception as e:
863
- raise optuna.exceptions.TrialPruned(f"Trial failed with error: {e}")
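The objective returns the configured tuning metric and converts any failure into a pruned trial. A minimal sketch of how such an objective is typically driven; in practice fit() calls self.tune_hyperparameters() (defined in the base class, not shown in this diff), which presumably wraps an equivalent of the standard Optuna pattern:

    # Sketch under assumptions: the study setup here is illustrative, not the package's own code.
    import optuna

    study = optuna.create_study(
        direction="maximize", pruner=optuna.pruners.MedianPruner()
    )
    study.optimize(imputer._objective, n_trials=imputer.n_trials)
    best = study.best_trial.params  # later folded back in via _set_best_params(...)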
864
-
865
- def _sample_hyperparameters(self, trial: optuna.Trial) -> dict:
866
- """Sample UBP hyperparameters; compute hidden sizes for model_params.
867
-
868
- This method samples a set of hyperparameters for the UBP model using the provided Optuna trial object. It defines a search space for various hyperparameters, including latent dimension, learning rate, dropout rate, number of hidden layers, activation function, and others. After sampling the hyperparameters, it computes the sizes of the hidden layers based on the sampled values and constructs the model parameters dictionary. The method returns a dictionary containing all sampled hyperparameters along with the computed model parameters.
869
-
870
- Args:
871
- trial (optuna.Trial): Current trial.
872
-
873
- Returns:
874
- Dict[str, int | float | str | list]: Sampled hyperparameters.
875
- """
876
- params = {
877
- "latent_dim": trial.suggest_int("latent_dim", 4, 16, step=2),
878
- "lr": trial.suggest_float("learning_rate", 3e-4, 1e-3, log=True),
879
- "dropout_rate": trial.suggest_float("dropout_rate", 0.0, 0.30, step=0.05),
880
- "num_hidden_layers": trial.suggest_int("num_hidden_layers", 1, 6),
881
- "activation": trial.suggest_categorical(
882
- "activation", ["relu", "elu", "selu", "leaky_relu"]
883
- ),
884
- "gamma": trial.suggest_float("gamma", 0.5, 3.0, step=0.5),
885
- "lr_input_factor": trial.suggest_float(
886
- "lr_input_factor", 0.3, 3.0, log=True
887
- ),
888
- "l1_penalty": trial.suggest_float("l1_penalty", 1e-6, 1e-3, log=True),
889
- "layer_scaling_factor": trial.suggest_float(
890
- "layer_scaling_factor", 2.0, 4.0, step=0.5
891
- ),
892
- "layer_schedule": trial.suggest_categorical(
893
- "layer_schedule", ["pyramid", "linear"]
894
- ),
895
- "latent_init": trial.suggest_categorical("latent_init", ["random", "pca"]),
896
- }
897
-
898
- hidden_layer_sizes = self._compute_hidden_layer_sizes(
899
- n_inputs=params["latent_dim"],
900
- n_outputs=self.num_features_ * self.output_classes_,
901
- n_samples=len(self.train_idx_),
902
- n_hidden=params["num_hidden_layers"],
903
- alpha=params["layer_scaling_factor"],
904
- schedule=params["layer_schedule"],
905
- )
906
- # Keep the latent_dim as the first element,
907
- # then the interior hidden widths.
908
- # If there are no interior widths (very small nets),
909
- # this still leaves [latent_dim].
910
- hidden_only = [hidden_layer_sizes[0]] + hidden_layer_sizes[1:-1]
911
-
912
- params["model_params"] = {
913
- "n_features": self.num_features_,
914
- "num_classes": self.output_classes_,
915
- "latent_dim": params["latent_dim"],
916
- "dropout_rate": params["dropout_rate"],
917
- "hidden_layer_sizes": hidden_only,
918
- "activation": params["activation"],
919
- }
920
-
921
- return params
922
-
923
- def _set_best_params(self, best_params: dict) -> dict:
924
- """Set best params onto instance; return model_params payload.
925
-
926
- This method sets the best hyperparameters found during tuning onto the instance attributes of the ImputeUBP class. It extracts the relevant hyperparameters from the provided dictionary and updates the corresponding instance variables. Additionally, it computes the sizes of the hidden layers based on the best hyperparameters and constructs the model parameters dictionary. The method returns a dictionary containing the model parameters that can be used to build the UBP model.
927
-
928
- Args:
929
- best_params (dict): Best hyperparameters.
930
-
931
- Returns:
932
- dict: model_params payload.
933
-
934
- Raises:
935
- ValueError: If best_params is missing required keys.
936
- """
937
- self.latent_dim = best_params["latent_dim"]
938
- self.dropout_rate = best_params["dropout_rate"]
939
- self.learning_rate = best_params["learning_rate"]
940
- self.gamma = best_params["gamma"]
941
- self.lr_input_factor = best_params["lr_input_factor"]
942
- self.l1_penalty = best_params["l1_penalty"]
943
- self.activation = best_params["activation"]
944
- self.latent_init = best_params["latent_init"]
945
-
946
- hidden_layer_sizes = self._compute_hidden_layer_sizes(
947
- n_inputs=self.latent_dim,
948
- n_outputs=self.num_features_ * self.output_classes_,
949
- n_samples=len(self.train_idx_),
950
- n_hidden=best_params["num_hidden_layers"],
951
- alpha=best_params["layer_scaling_factor"],
952
- schedule=best_params["layer_schedule"],
953
- )
954
-
955
- hidden_only = [hidden_layer_sizes[0]] + hidden_layer_sizes[1:-1]
956
-
957
- return {
958
- "n_features": self.num_features_,
959
- "latent_dim": self.latent_dim,
960
- "hidden_layer_sizes": hidden_only,
961
- "dropout_rate": self.dropout_rate,
962
- "activation": self.activation,
963
- "gamma": self.gamma,
964
- "num_classes": self.output_classes_,
965
- }
966
-
967
- def _set_best_params_default(self) -> dict:
968
- """Default (no-tuning) model_params aligned with current attributes.
969
-
970
- This method constructs the model parameters dictionary using the current instance attributes of the ImputeUBP class. It computes the sizes of the hidden layers based on the instance's latent dimension, dropout rate, learning rate, and other relevant attributes. The method returns a dictionary containing the model parameters that can be used to build the UBP model when no hyperparameter tuning has been performed.
971
-
972
- Returns:
973
- dict: model_params payload.
974
- """
975
- hidden_layer_sizes = self._compute_hidden_layer_sizes(
976
- n_inputs=self.latent_dim,
977
- n_outputs=self.num_features_ * self.output_classes_,
978
- n_samples=len(self.ground_truth_),
979
- n_hidden=self.num_hidden_layers,
980
- alpha=self.layer_scaling_factor,
981
- schedule=self.layer_schedule,
982
- )
983
-
984
- hidden_only = [hidden_layer_sizes[0]] + hidden_layer_sizes[1:-1]
985
-
986
- return {
987
- "n_features": self.num_features_,
988
- "latent_dim": self.latent_dim,
989
- "hidden_layer_sizes": hidden_only,
990
- "dropout_rate": self.dropout_rate,
991
- "activation": self.activation,
992
- "gamma": self.gamma,
993
- "num_classes": self.output_classes_,
994
- }
995
-
996
- def _train_and_validate_model(
997
- self,
998
- model: torch.nn.Module,
999
- loader: torch.utils.data.DataLoader,
1000
- lr: float,
1001
- l1_penalty: float,
1002
- trial: optuna.Trial | None = None,
1003
- return_history: bool = False,
1004
- latent_vectors: torch.nn.Parameter | None = None,
1005
- lr_input_factor: float = 1.0,
1006
- class_weights: torch.Tensor | None = None,
1007
- *,
1008
- X_val: np.ndarray | None = None,
1009
- params: dict | None = None,
1010
- prune_metric: str | None = None, # "f1" | "accuracy" | "pr_macro"
1011
- prune_warmup_epochs: int = 10,
1012
- eval_interval: int = 1,
1013
- eval_requires_latents: bool = True, # UBP needs latent eval
1014
- eval_latent_steps: int = 50,
1015
- eval_latent_lr: float = 1e-2,
1016
- eval_latent_weight_decay: float = 0.0,
1017
- ) -> tuple:
1018
- """Train & validate UBP model with three-phase loop.
1019
-
1020
- This method trains and validates the UBP model using a three-phase training loop. It sets up the latent optimizer and invokes the training loop, which includes pre-training, fine-tuning, and joint training phases. The method ensures that the necessary latent vectors and class weights are provided before proceeding with training. It also incorporates new parameters for evaluation and pruning during training. The final best loss, best model, training history, and optimized latent vectors are returned.
1021
-
1022
- Args:
1023
- model (torch.nn.Module): UBP model with phase1_decoder & phase23_decoder.
1024
- loader (torch.utils.data.DataLoader): DataLoader for training data.
1025
- lr (float): Learning rate for decoder.
1026
- l1_penalty (float): L1 regularization weight.
1027
- trial (optuna.Trial | None): Current trial or None.
1028
- return_history (bool): If True, return loss history.
1029
- latent_vectors (torch.nn.Parameter | None): Trainable Z.
1030
- lr_input_factor (float): LR factor for latents.
1031
- class_weights (torch.Tensor | None): Class weights for 0/1/2.
1032
- X_val (np.ndarray | None): Validation set for pruning/eval.
1033
- params (dict | None): Model params for eval.
1034
- prune_metric (str | None): Metric to monitor for pruning.
1035
- prune_warmup_epochs (int): Epochs before pruning starts.
1036
- eval_interval (int): Epochs between evaluations.
1037
- eval_requires_latents (bool): If True, optimize latents for eval.
1038
- eval_latent_steps (int): Latent optimization steps for eval.
1039
- eval_latent_lr (float): Latent optimization LR for eval.
1040
- eval_latent_weight_decay (float): Latent optimization weight decay for eval.
1041
-
1042
- Returns:
1043
- Tuple[float, torch.nn.Module, dict, torch.nn.Parameter]: (best_loss, best_model, history, latents).
1044
-
1045
- Raises:
1046
- TypeError: If latent_vectors or class_weights are
1047
- not provided.
1048
- ValueError: If X_val is not provided for evaluation.
1049
- RuntimeError: If eval_latent_steps is not positive.
1050
- """
1051
- if latent_vectors is None or class_weights is None:
1052
- msg = "Must provide latent_vectors and class_weights."
1053
- self.logger.error(msg)
1054
- raise TypeError(msg)
1055
-
1056
- latent_optimizer = torch.optim.Adam([latent_vectors], lr=lr * lr_input_factor)
1057
-
1058
- result = self._execute_training_loop(
1059
- loader=loader,
1060
- latent_optimizer=latent_optimizer,
1061
- lr=lr,
1062
- model=model,
1063
- l1_penalty=l1_penalty,
1064
- trial=trial,
1065
- return_history=return_history,
1066
- latent_vectors=latent_vectors,
1067
- class_weights=class_weights,
1068
- # NEW ↓↓↓
1069
- X_val=X_val,
1070
- params=params,
1071
- prune_metric=prune_metric,
1072
- prune_warmup_epochs=prune_warmup_epochs,
1073
- eval_interval=eval_interval,
1074
- eval_requires_latents=eval_requires_latents,
1075
- eval_latent_steps=eval_latent_steps,
1076
- eval_latent_lr=eval_latent_lr,
1077
- eval_latent_weight_decay=eval_latent_weight_decay,
1078
- )
1079
-
1080
- if return_history:
1081
- return result
1082
-
1083
- return result[0], result[1], result[3]
1084
-
1085
- def _train_final_model(
1086
- self,
1087
- loader: torch.utils.data.DataLoader,
1088
- best_params: dict,
1089
- initial_latent_vectors: torch.nn.Parameter,
1090
- ) -> tuple:
1091
- """Train final UBP model with best params; save weights to disk.
1092
-
1093
- This method trains the final UBP model using the best hyperparameters found during tuning. It builds the model with the specified parameters, initializes the weights, and invokes the training and validation process. The method saves the trained model's state dictionary to disk and returns the final loss, trained model, training history, and optimized latent vectors.
1094
-
1095
- Args:
1096
- loader (torch.utils.data.DataLoader): DataLoader for training data.
1097
- best_params (Dict[str, int | float | str | list]): Best hyperparameters.
1098
- initial_latent_vectors (torch.nn.Parameter): Initialized latent vectors.
1099
-
1100
- Returns:
1101
- Tuple[float, torch.nn.Module, dict, torch.nn.Parameter]: (loss, model, {"Train": history}, latents).
1102
- """
1103
- self.logger.info(f"Training the final {self.model_name} model...")
1104
-
1105
- model = self.build_model(self.Model, best_params)
1106
- model.n_features = best_params["n_features"]
1107
- model.apply(self.initialize_weights)
1108
-
1109
- loss, trained_model, history, latent_vectors = self._train_and_validate_model(
1110
- model=model,
1111
- loader=loader,
1112
- lr=self.learning_rate,
1113
- l1_penalty=self.l1_penalty,
1114
- return_history=True,
1115
- latent_vectors=initial_latent_vectors,
1116
- lr_input_factor=self.lr_input_factor,
1117
- class_weights=self.class_weights_,
1118
- X_val=self.X_test_,
1119
- params=best_params,
1120
- prune_metric=self.tune_metric,
1121
- prune_warmup_epochs=10,
1122
- eval_interval=1,
1123
- eval_requires_latents=True,
1124
- eval_latent_steps=self.eval_latent_steps,
1125
- eval_latent_lr=self.eval_latent_lr,
1126
- eval_latent_weight_decay=self.eval_latent_weight_decay,
1127
- )
1128
-
1129
- if trained_model is None:
1130
- msg = "Final model training failed."
1131
- self.logger.error(msg)
1132
- raise RuntimeError(msg)
1133
-
1134
- fout = self.models_dir / "final_model.pt"
1135
- torch.save(trained_model.state_dict(), fout)
1136
- return loss, trained_model, {"Train": history}, latent_vectors
1137
-
1138
- def _execute_training_loop(
1139
- self,
1140
- loader: torch.utils.data.DataLoader,
1141
- latent_optimizer: torch.optim.Optimizer,
1142
- lr: float,
1143
- model: torch.nn.Module,
1144
- l1_penalty: float,
1145
- trial: optuna.Trial | None,
1146
- return_history: bool,
1147
- latent_vectors: torch.nn.Parameter,
1148
- class_weights: torch.Tensor,
1149
- *,
1150
- X_val: np.ndarray | None = None,
1151
- params: dict | None = None,
1152
- prune_metric: str | None = None,
1153
- prune_warmup_epochs: int = 10,
1154
- eval_interval: int = 1,
1155
- eval_requires_latents: bool = True,
1156
- eval_latent_steps: int = 50,
1157
- eval_latent_lr: float = 1e-2,
1158
- eval_latent_weight_decay: float = 0.0,
1159
- ) -> Tuple[float, torch.nn.Module, dict, torch.nn.Parameter]:
1160
- """Three-phase UBP with numeric guards, LR warmup, and pruning.
1161
-
1162
- This method executes the three-phase training loop for the UBP model, incorporating numeric stability guards, learning rate warmup, and Optuna pruning. It iterates through three training phases: pre-training the phase 1 decoder, fine-tuning the phase 2 and 3 decoders, and joint training of all components. The method monitors training loss, applies early stopping, and evaluates the model on a validation set for pruning purposes. The final best loss, best model, training history, and optimized latent vectors are returned.
1163
-
1164
- Args:
1165
- loader (torch.utils.data.DataLoader): DataLoader for training data.
1166
- latent_optimizer (torch.optim.Optimizer): Optimizer for latent vectors.
1167
- lr (float): Learning rate for decoder.
1168
- model (torch.nn.Module): UBP model with phase1_decoder & phase23_decoder.
1169
- l1_penalty (float): L1 regularization weight.
1170
- trial (optuna.Trial | None): Current trial or None.
1171
- return_history (bool): If True, return loss history.
1172
- latent_vectors (torch.nn.Parameter): Trainable Z.
1173
- class_weights (torch.Tensor): Class weights for
1174
- 0/1/2.
1175
- X_val (np.ndarray | None): Validation set for pruning/eval.
1176
- params (dict | None): Model params for eval.
1177
- prune_metric (str | None): Metric to monitor for pruning.
1178
- prune_warmup_epochs (int): Epochs before pruning starts.
1179
- eval_interval (int): Epochs between evaluations.
1180
- eval_requires_latents (bool): If True, optimize latents for eval.
1181
- eval_latent_steps (int): Latent optimization steps for eval.
1182
- eval_latent_lr (float): Latent optimization LR for eval.
1183
- eval_latent_weight_decay (float): Latent optimization weight decay for eval.
1184
-
1185
- Returns:
1186
- Tuple[float, torch.nn.Module, dict, torch.nn.Parameter]: (best_loss, best_model, history, latents).
1187
-
1188
- Raises:
1189
- ValueError: If X_val is not provided for evaluation.
1190
- RuntimeError: If eval_latent_steps is not positive.
1191
- """
1192
- history: dict[str, list[float]] = {}
1193
- final_best_loss, final_best_model = float("inf"), None
1194
-
1195
- warm, ramp, gamma_final = 50, 100, torch.tensor(self.gamma, device=self.device)
1196
-
1197
- # Schema-aware latent cache for eval
1198
- _latent_cache: dict = {}
1199
- nF = getattr(model, "n_features", self.num_features_)
1200
- cache_key_root = f"{self.prefix}_ubp_val_latents_L{nF}_K{self.output_classes_}"
1201
-
1202
- E = int(self.epochs)
1203
- phase_epochs = {
1204
- 1: max(1, int(0.15 * E)),
1205
- 2: max(1, int(0.35 * E)),
1206
- 3: max(1, E - int(0.15 * E) - int(0.35 * E)),
1207
- }
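    # Worked example (annotation, not part of the removed file): with E = 100 total
    # epochs, phase_epochs = {1: 15, 2: 35, 3: 50}, i.e. ~15% joint warm start,
    # ~35% decoder-only refit, and the remainder for joint fine-tuning.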
1208
-
1209
- for phase in (1, 2, 3):
1210
- steps_this_phase = phase_epochs[phase]
1211
- warmup_epochs = getattr(self, "lr_warmup_epochs", 5) if phase == 1 else 0
1212
-
1213
- early_stopping = EarlyStopping(
1214
- patience=self.early_stop_gen,
1215
- min_epochs=self.min_epochs,
1216
- verbose=self.verbose,
1217
- prefix=self.prefix,
1218
- debug=self.debug,
1219
- )
1220
-
1221
- if phase == 2:
1222
- self._reset_weights(model)
1223
-
1224
- decoder: torch.Tensor | torch.nn.Module = (
1225
- model.phase1_decoder if phase == 1 else model.phase23_decoder
1226
- )
1227
-
1228
- if not isinstance(decoder, torch.nn.Module):
1229
- msg = f"{self.model_name} Decoder is not a torch.nn.Module."
1230
- self.logger.error(msg)
1231
- raise TypeError(msg)
1232
-
1233
- decoder_params = decoder.parameters()
1234
- optimizer = torch.optim.AdamW(decoder_params, lr=lr, eps=1e-7)
1235
- scheduler = torch.optim.lr_scheduler.CosineAnnealingLR(
1236
- optimizer, T_max=steps_this_phase
1237
- )
1238
-
1239
- # Cache base LRs for warmup
1240
- dec_lr0 = optimizer.param_groups[0]["lr"]
1241
- lat_lr0 = latent_optimizer.param_groups[0]["lr"]
1242
- dec_lr_min, lat_lr_min = dec_lr0 * 0.1, lat_lr0 * 0.1
1243
-
1244
- phase_hist: list[float] = []
1245
- gamma_init = torch.tensor(0.0, device=self.device)
1246
-
1247
- for epoch in range(steps_this_phase):
1248
- # Focal gamma warm/ramp
1249
- if epoch < warm:
1250
- model.gamma = gamma_init.cpu().numpy().item()
1251
- elif epoch < warm + ramp:
1252
- model.gamma = gamma_final * ((epoch - warm) / ramp)
1253
- else:
1254
- model.gamma = gamma_final
1255
-
1256
- # Linear warmup for both optimizers
1257
- if warmup_epochs and epoch < warmup_epochs:
1258
- scale = float(epoch + 1) / warmup_epochs
1259
- for g in optimizer.param_groups:
1260
- g["lr"] = dec_lr_min + (dec_lr0 - dec_lr_min) * scale
1261
- for g in latent_optimizer.param_groups:
1262
- g["lr"] = lat_lr_min + (lat_lr0 - lat_lr_min) * scale
1263
-
1264
- train_loss, latent_vectors = self._train_step(
1265
- loader=loader,
1266
- optimizer=optimizer,
1267
- latent_optimizer=latent_optimizer,
1268
- model=model,
1269
- l1_penalty=l1_penalty,
1270
- latent_vectors=latent_vectors,
1271
- class_weights=class_weights,
1272
- phase=phase,
1273
- )
1274
-
1275
- if not np.isfinite(train_loss):
1276
- if trial:
1277
- raise optuna.exceptions.TrialPruned("Epoch loss non-finite.")
1278
- # reduce LRs and continue
1279
- for g in optimizer.param_groups:
1280
- g["lr"] *= 0.5
1281
- for g in latent_optimizer.param_groups:
1282
- g["lr"] *= 0.5
1283
- continue
1284
-
1285
- scheduler.step()
1286
- if return_history:
1287
- phase_hist.append(train_loss)
1288
-
1289
- early_stopping(train_loss, model)
1290
- if early_stopping.early_stop:
1291
- self.logger.info(
1292
- f"Early stopping at epoch {epoch + 1} (phase {phase})."
1293
- )
1294
- break
1295
-
1296
- # Validation + pruning
1297
- if (
1298
- trial is not None
1299
- and X_val is not None
1300
- and ((epoch + 1) % eval_interval == 0)
1301
- ):
1302
- metric_key = prune_metric or getattr(self, "tune_metric", "f1")
1303
- zdim = self._first_linear_in_features(model)
1304
- schema_key = f"{cache_key_root}_z{zdim}"
1305
- mask_override = None
1306
- if (
1307
- self.simulate_missing
1308
- and getattr(self, "sim_mask_test_", None) is not None
1309
- and getattr(self, "X_test_", None) is not None
1310
- and X_val.shape == self.X_test_.shape
1311
- ):
1312
- mask_override = self.sim_mask_test_
1313
-
1314
- metric_val = self._eval_for_pruning(
1315
- model=model,
1316
- X_val=X_val,
1317
- params=params or getattr(self, "best_params_", {}),
1318
- metric=metric_key,
1319
- objective_mode=True,
1320
- do_latent_infer=eval_requires_latents,
1321
- latent_steps=eval_latent_steps,
1322
- latent_lr=eval_latent_lr,
1323
- latent_weight_decay=eval_latent_weight_decay,
1324
- latent_seed=self.seed, # type: ignore
1325
- _latent_cache=_latent_cache,
1326
- _latent_cache_key=schema_key,
1327
- eval_mask_override=mask_override,
1328
- )
1329
-
1330
- if phase == 3:
1331
- trial.report(metric_val, step=epoch + 1)
1332
- if (epoch + 1) >= prune_warmup_epochs and trial.should_prune():
1333
- raise optuna.exceptions.TrialPruned(
1334
- f"Pruned at epoch {epoch + 1} (phase {phase}): {metric_key}={metric_val:.5f}"
1335
- )
1336
-
1337
- history[f"Phase {phase}"] = phase_hist
1338
- final_best_loss = early_stopping.best_score
1339
- if early_stopping.best_model is not None:
1340
- final_best_model = copy.deepcopy(early_stopping.best_model)
1341
- else:
1342
- final_best_model = copy.deepcopy(model)
1343
-
1344
- if final_best_model is None:
1345
- final_best_model = copy.deepcopy(model)
1346
-
1347
- return final_best_loss, final_best_model, history, latent_vectors
1348
-
1349
- def _optimize_latents_for_inference(
1350
- self,
1351
- X_new: np.ndarray,
1352
- model: torch.nn.Module,
1353
- params: dict,
1354
- inference_epochs: int = 200,
1355
- ) -> torch.Tensor:
1356
- """Optimize latents for new 0/1/2 data with guards.
1357
-
1358
- This method optimizes the latent vectors for new genotype data using the trained UBP model. It initializes the latent space based on the provided data and iteratively updates the latent vectors to minimize the cross-entropy loss between the model's predictions and the true genotype values. The optimization process includes numeric stability guards to ensure that gradients and losses remain finite. The optimized latent vectors are returned as a PyTorch tensor.
1359
-
1360
- Args:
1361
- X_new (np.ndarray): New 0/1/2 data with -1 for missing.
1362
- model (torch.nn.Module): Trained UBP model.
1363
- params (dict): Model params.
1364
- inference_epochs (int): Number of optimization epochs.
1365
-
1366
- Returns:
1367
- torch.Tensor: Optimized latent vectors.
1368
- """
1369
- model.eval()
1370
- nF = getattr(model, "n_features", self.num_features_)
1371
-
1372
- if self.tune and self.tune_fast:
1373
- inference_epochs = min(
1374
- inference_epochs, getattr(self, "tune_infer_epochs", 20)
1375
- )
1376
-
1377
- X_new = X_new.astype(np.int64, copy=False)
1378
- X_new[X_new < 0] = -1
1379
- y = torch.from_numpy(X_new).long().to(self.device)
1380
-
1381
- z = self._create_latent_space(
1382
- params, len(X_new), X_new, self.latent_init
1383
- ).requires_grad_(True)
1384
- opt = torch.optim.AdamW(
1385
- [z], lr=self.learning_rate * self.lr_input_factor, eps=1e-7
1386
- )
1387
-
1388
- for _ in range(inference_epochs):
1389
- decoder = model.phase23_decoder
1390
-
1391
- if not isinstance(decoder, torch.nn.Module):
1392
- msg = f"{self.model_name} Decoder is not a torch.nn.Module."
1393
- self.logger.error(msg)
1394
- raise TypeError(msg)
1395
-
1396
- opt.zero_grad(set_to_none=True)
1397
- logits = decoder(z).view(len(X_new), nF, self.output_classes_)
1398
-
1399
- if not torch.isfinite(logits).all():
1400
- break
1401
-
1402
- if self.is_haploid:
1403
- loss = F.cross_entropy(
1404
- logits.view(-1, self.output_classes_), y.view(-1), ignore_index=-1
1405
- )
1406
- else:
1407
- targets = self._multi_hot_targets(y)
1408
- bce = F.binary_cross_entropy_with_logits(
1409
- logits, targets, pos_weight=self.pos_weights_, reduction="none"
1410
- )
1411
- mask = (y != -1).unsqueeze(-1).float()
1412
- loss = (bce * mask).sum() / mask.sum().clamp_min(1e-8)
1413
-
1414
- if not torch.isfinite(loss):
1415
- break
1416
-
1417
- loss.backward()
1418
-
1419
- torch.nn.utils.clip_grad_norm_([z], 1.0)
1420
-
1421
- if z.grad is None or not torch.isfinite(z.grad).all():
1422
- break
1423
-
1424
- opt.step()
1425
-
1426
- return z.detach()
1427
-
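For context, here is a minimal, self-contained sketch of the decoder-frozen latent optimization that `_optimize_latents_for_inference` performs, shown only for the haploid cross-entropy branch. The linear decoder, data sizes, epoch count, and learning rate are synthetic stand-ins, not the UBP architecture or its defaults.

```python
import numpy as np
import torch
import torch.nn.functional as F

torch.manual_seed(0)
n_samples, n_loci, n_classes, latent_dim = 8, 20, 3, 4

decoder = torch.nn.Linear(latent_dim, n_loci * n_classes)  # stand-in decoder
for p in decoder.parameters():
    p.requires_grad_(False)  # the network stays fixed; only the latents move

X_new = np.random.randint(-1, 3, size=(n_samples, n_loci))  # 0/1/2 with -1 missing
y = torch.from_numpy(X_new).long()

z = torch.nn.Parameter(torch.randn(n_samples, latent_dim))
opt = torch.optim.AdamW([z], lr=0.05)

for _ in range(100):
    opt.zero_grad(set_to_none=True)
    logits = decoder(z).view(n_samples, n_loci, n_classes)
    # ignore_index=-1 masks missing genotypes, as in the haploid branch above.
    loss = F.cross_entropy(logits.view(-1, n_classes), y.view(-1), ignore_index=-1)
    loss.backward()
    torch.nn.utils.clip_grad_norm_([z], 1.0)
    opt.step()

print("final masked CE loss:", float(loss))
```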
1428
- def _create_latent_space(
1429
- self,
1430
- params: dict,
1431
- n_samples: int,
1432
- X: np.ndarray,
1433
- latent_init: Literal["random", "pca"],
1434
- ) -> torch.nn.Parameter:
1435
- """Initialize latent space via random Xavier or PCA on 0/1/2 matrix.
1436
-
1437
- This method initializes the latent space for the UBP model using either random Xavier initialization or PCA-based initialization. The choice of initialization strategy is determined by the latent_init parameter. If PCA is selected, the method handles missing values by imputing them with column means before performing PCA. The resulting latent vectors are standardized and converted to a PyTorch parameter that can be optimized during training.
1438
-
1439
- Args:
1440
- params (dict): Contains 'latent_dim'.
1441
- n_samples (int): Number of samples.
1442
- X (np.ndarray): (n_samples x L) 0/1/2 with -1 missing.
1443
- latent_init (Literal["random","pca"]): Init strategy.
1444
-
1445
- Returns:
1446
- torch.nn.Parameter: Trainable latent matrix.
1447
- """
1448
- latent_dim = int(params["latent_dim"])
1449
-
1450
- if latent_init == "pca":
1451
- X_pca = X.astype(np.float32, copy=True)
1452
- # mark missing
1453
- X_pca[X_pca < 0] = np.nan
1454
-
1455
- # ---- SAFE column means without warnings ----
1456
- valid_counts = np.sum(~np.isnan(X_pca), axis=0)
1457
- col_sums = np.nansum(X_pca, axis=0)
1458
- col_means = np.divide(
1459
- col_sums,
1460
- valid_counts,
1461
- out=np.zeros_like(col_sums, dtype=np.float32),
1462
- where=valid_counts > 0,
1463
- )
1464
-
1465
- # impute NaNs with per-column means
1466
- # (all-NaN cols -> 0.0 by the divide above)
1467
- nan_r, nan_c = np.where(np.isnan(X_pca))
1468
- if nan_r.size:
1469
- X_pca[nan_r, nan_c] = col_means[nan_c]
1470
-
1471
- # center columns
1472
- X_pca = X_pca - X_pca.mean(axis=0, keepdims=True)
1473
-
1474
- # guard: degenerate / all-zero after centering ->
1475
- # fall back to random
1476
- if (not np.isfinite(X_pca).all()) or np.allclose(X_pca, 0.0):
1477
- latents = torch.empty(n_samples, latent_dim, device=self.device)
1478
- torch.nn.init.xavier_uniform_(latents)
1479
- return torch.nn.Parameter(latents, requires_grad=True)
1480
-
1481
- # rank-aware component count, at least 1
1482
- try:
1483
- est_rank = np.linalg.matrix_rank(X_pca)
1484
- except Exception:
1485
- est_rank = min(n_samples, X_pca.shape[1])
1486
-
1487
- n_components = max(1, min(latent_dim, est_rank, n_samples, X_pca.shape[1]))
1488
-
1489
- # randomized SVD with a fixed random_state for reproducibility
1490
- pca = PCA(
1491
- n_components=n_components,
1492
- svd_solver="randomized",
1493
- random_state=self.seed,
1494
- )
1495
- initial = pca.fit_transform(X_pca) # (n_samples, n_components)
1496
-
1497
- # pad if latent_dim > n_components
1498
- if n_components < latent_dim:
1499
- pad = self.rng.standard_normal(
1500
- size=(n_samples, latent_dim - n_components)
1501
- )
1502
- initial = np.hstack([initial, pad])
1503
-
1504
- # standardize latent dims
1505
- initial = (initial - initial.mean(axis=0)) / (initial.std(axis=0) + 1e-6)
1506
-
1507
- latents = torch.from_numpy(initial).float().to(self.device)
1508
- return torch.nn.Parameter(latents, requires_grad=True)
1509
-
1510
- else:
1511
- latents = torch.empty(n_samples, latent_dim, device=self.device)
1512
- torch.nn.init.xavier_uniform_(latents)
1513
- return torch.nn.Parameter(latents, requires_grad=True)
1514
-
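As a companion to the PCA branch above, this is a compact sketch of column-mean imputation followed by rank-aware PCA on a synthetic 0/1/2 matrix with -1 for missing. The matrix size, missing rate, and `latent_dim` are arbitrary illustration choices.

```python
import numpy as np
from sklearn.decomposition import PCA

rng = np.random.default_rng(42)
X = rng.integers(0, 3, size=(30, 50)).astype(np.float32)  # 0/1/2 genotypes
X[rng.random(X.shape) < 0.1] = -1.0                       # ~10% missing
latent_dim = 8

X[X < 0] = np.nan
valid_counts = np.sum(~np.isnan(X), axis=0)
col_means = np.divide(
    np.nansum(X, axis=0),
    valid_counts,
    out=np.zeros(X.shape[1], dtype=np.float32),
    where=valid_counts > 0,
)
nan_r, nan_c = np.where(np.isnan(X))
X[nan_r, nan_c] = col_means[nan_c]          # impute with per-column means
X -= X.mean(axis=0, keepdims=True)          # center columns

# Rank-aware component count, padded back up to latent_dim with noise if needed.
n_components = int(max(1, min(latent_dim, np.linalg.matrix_rank(X), *X.shape)))
pca = PCA(n_components=n_components, svd_solver="randomized", random_state=42)
latents = pca.fit_transform(X)
if n_components < latent_dim:
    pad = rng.standard_normal((X.shape[0], latent_dim - n_components))
    latents = np.hstack([latents, pad])
latents = (latents - latents.mean(axis=0)) / (latents.std(axis=0) + 1e-6)
print(latents.shape)  # (30, 8)
```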
1515
- def _multi_hot_targets(self, y: torch.Tensor) -> torch.Tensor:
1516
- """Two-channel multi-hot for diploid: REF-only, ALT-only; HET sets both."""
1517
- if self.is_haploid:
1518
- raise RuntimeError("_multi_hot_targets called for haploid data.")
1519
- y = y.to(self.device)
1520
- out = torch.zeros(y.shape + (2,), device=self.device, dtype=torch.float32)
1521
- valid = y != -1
1522
- ref_mask = valid & (y != 2)
1523
- alt_mask = valid & (y != 0)
1524
- out[ref_mask, 0] = 1.0
1525
- out[alt_mask, 1] = 1.0
1526
- return out
1527
-
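A tiny worked example of that two-channel encoding, with arbitrarily chosen genotype values:

```python
import torch

# 0 (hom REF) -> [1, 0], 1 (het) -> [1, 1], 2 (hom ALT) -> [0, 1], -1 (missing) -> [0, 0]
y = torch.tensor([[0, 1, 2, -1]])
out = torch.zeros(y.shape + (2,))
valid = y != -1
out[valid & (y != 2), 0] = 1.0  # REF allele present
out[valid & (y != 0), 1] = 1.0  # ALT allele present
print(out)
# tensor([[[1., 0.],
#          [1., 1.],
#          [0., 1.],
#          [0., 0.]]])
```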
1528
- def _compute_pos_weights(self, X: np.ndarray) -> torch.Tensor:
1529
- """Balance REF/ALT channels for multilabel BCE."""
1530
- ref_pos = np.count_nonzero((X == 0) | (X == 1))
1531
- alt_pos = np.count_nonzero((X == 2) | (X == 1))
1532
- total_valid = np.count_nonzero(X != -1)
1533
- pos_counts = np.array([ref_pos, alt_pos], dtype=np.float32)
1534
- neg_counts = np.maximum(total_valid - pos_counts, 1.0)
1535
- pos_counts = np.maximum(pos_counts, 1.0)
1536
- weights = neg_counts / pos_counts
1537
- return torch.tensor(weights, device=self.device, dtype=torch.float32)
1538
-
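A small worked example of the per-channel `pos_weight = negatives / positives` rule above, on a toy genotype matrix whose counts are easy to verify by hand:

```python
import numpy as np

X = np.array([[0, 0, 1, 2, -1],
              [0, 1, 2, 2, -1]])                 # 0/1/2 with -1 missing
ref_pos = np.count_nonzero((X == 0) | (X == 1))  # genotypes carrying REF -> 5
alt_pos = np.count_nonzero((X == 2) | (X == 1))  # genotypes carrying ALT -> 5
total_valid = np.count_nonzero(X != -1)          # 8 observed genotypes

pos = np.maximum(np.array([ref_pos, alt_pos], dtype=float), 1.0)
neg = np.maximum(total_valid - pos, 1.0)
print(neg / pos)  # [0.6 0.6] -> pos_weight for the REF and ALT channels
```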
1539
- def _reset_weights(self, model: torch.nn.Module) -> None:
1540
- """Selectively resets only the weights of the phase 2/3 decoder.
1541
-
1542
- This method targets only the `phase23_decoder` attribute of the UBPModel, leaving the `phase1_decoder` and any other model components untouched, so the deep decoder can be re-initialized ahead of the later training phases without disturbing the rest of the model.
1543
-
1544
- Args:
1545
- model (torch.nn.Module): The PyTorch model whose parameters are to be reset.
1546
- """
1547
- if hasattr(model, "phase23_decoder"):
1548
- decoder = model.phase23_decoder
1549
- if not isinstance(decoder, torch.nn.Module):
1550
- msg = f"{self.model_name} phase23_decoder is not a torch.nn.Module."
1551
- self.logger.error(msg)
1552
- raise TypeError(msg)
1553
- # Iterate through only the modules of the second decoder
1554
- for layer in decoder.modules():
1555
- if hasattr(layer, "reset_parameters") and isinstance(
1556
- layer.reset_parameters, torch.nn.Module
1557
- ):
1558
- layer.reset_parameters()
1559
- else:
1560
- self.logger.warning(
1561
- "Model does not have a 'phase23_decoder' attribute; skipping weight reset."
1562
- )
1563
-
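A minimal sketch of that selective re-initialization, using a hypothetical two-decoder module named `Toy` in place of the real UBPModel:

```python
import torch


class Toy(torch.nn.Module):
    """Hypothetical stand-in with a shallow phase-1 decoder and a deep phase-2/3 decoder."""

    def __init__(self) -> None:
        super().__init__()
        self.phase1_decoder = torch.nn.Linear(4, 8)
        self.phase23_decoder = torch.nn.Sequential(
            torch.nn.Linear(4, 16), torch.nn.ReLU(), torch.nn.Linear(16, 8)
        )


model = Toy()
before = model.phase1_decoder.weight.clone()

# Reset only the phase-2/3 decoder; callable() skips layers without the hook (e.g. ReLU).
for layer in model.phase23_decoder.modules():
    if callable(getattr(layer, "reset_parameters", None)):
        layer.reset_parameters()

assert torch.equal(before, model.phase1_decoder.weight)  # phase-1 weights untouched
```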
1564
- def _latent_infer_for_eval(
1565
- self,
1566
- model: torch.nn.Module,
1567
- X_val: np.ndarray,
1568
- *,
1569
- steps: int,
1570
- lr: float,
1571
- weight_decay: float,
1572
- seed: int,
1573
- cache: dict | None,
1574
- cache_key: str | None,
1575
- ) -> None:
1576
- """Freeze network; refine validation latents only with guards.
1577
-
1578
- This method refines the latent vectors for the validation dataset using the trained UBP model. It freezes the model parameters so that only the latents are updated, and optimizes them to minimize the masked loss between the model's predictions and the observed genotypes (cross-entropy for haploid data, multi-label BCE for diploid data). Numeric stability checks stop the refinement early if logits, losses, or gradients become non-finite. If a cache is provided, the optimized latents are stored under a schema-derived key and reused as a warm start on subsequent calls.
1579
-
1580
- Args:
1581
- model (torch.nn.Module): Trained UBP model.
1582
- X_val (np.ndarray): Validation set of 0/1/2 genotypes with -1 for missing.
1583
- steps (int): Number of optimization steps.
1584
- lr (float): Learning rate for latent optimization.
1585
- weight_decay (float): Weight decay for latent optimization.
1586
- seed (int): Random seed for reproducibility.
1587
- cache (dict | None): Optional cache for latent vectors.
1588
- cache_key (str | None): Key for storing/retrieving from cache.
1589
- """
1590
- if seed is None:
1591
- seed = np.random.randint(0, 999_999)
1592
-
1593
- torch.manual_seed(seed)
1594
- np.random.seed(seed)
1595
-
1596
- model.eval()
1597
- for p in model.parameters():
1598
- p.requires_grad_(False)
1599
-
1600
- nF = getattr(model, "n_features", self.num_features_)
1601
- X_val = X_val.astype(np.int64, copy=False)
1602
- X_val[X_val < 0] = -1
1603
- y = torch.from_numpy(X_val).long().to(self.device)
1604
-
1605
- zdim = self._first_linear_in_features(model)
1606
- schema_key = (
1607
- f"{self.prefix}_ubp_val_latents_z{zdim}_L{nF}_K{self.output_classes_}"
1608
- )
1609
-
1610
- if cache is not None and schema_key in cache:
1611
- z = cache[schema_key].detach().clone().requires_grad_(True)
1612
- else:
1613
- z = self._create_latent_space(
1614
- {"latent_dim": zdim}, X_val.shape[0], X_val, self.latent_init
1615
- ).requires_grad_(True)
1616
-
1617
- opt = torch.optim.AdamW([z], lr=lr, weight_decay=weight_decay, eps=1e-7)
1618
-
1619
- for _ in range(max(int(steps), 0)):
1620
- opt.zero_grad(set_to_none=True)
1621
-
1622
- decoder = model.phase23_decoder
1623
-
1624
- if not isinstance(decoder, torch.nn.Module):
1625
- msg = f"{self.model_name} Decoder is not a torch.nn.Module."
1626
- self.logger.error(msg)
1627
- raise TypeError(msg)
1628
-
1629
- logits = decoder(z).view(X_val.shape[0], nF, self.output_classes_)
1630
- if not torch.isfinite(logits).all():
1631
- break
1632
- if self.is_haploid:
1633
- loss = F.cross_entropy(
1634
- logits.view(-1, self.output_classes_), y.view(-1), ignore_index=-1
1635
- )
1636
- else:
1637
- targets = self._multi_hot_targets(y)
1638
- bce = F.binary_cross_entropy_with_logits(
1639
- logits, targets, pos_weight=self.pos_weights_, reduction="none"
1640
- )
1641
- mask = (y != -1).unsqueeze(-1).float()
1642
- loss = (bce * mask).sum() / mask.sum().clamp_min(1e-8)
1643
-
1644
- if not torch.isfinite(loss):
1645
- break
1646
-
1647
- loss.backward()
1648
-
1649
- torch.nn.utils.clip_grad_norm_([z], 1.0)
1650
-
1651
- if z.grad is None or not torch.isfinite(z.grad).all():
1652
- break
1653
-
1654
- opt.step()
1655
-
1656
- if cache is not None:
1657
- cache[schema_key] = z.detach().clone()
1658
-
1659
- for p in model.parameters():
1660
- p.requires_grad_(True)
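Finally, a self-contained sketch of the masked multi-label BCE used in the diploid branch of this method; the logits, targets, and `pos_weight` values are random stand-ins with matching shapes, not outputs of a trained model.

```python
import torch
import torch.nn.functional as F

torch.manual_seed(0)
n_samples, n_loci = 4, 6
y = torch.randint(-1, 3, (n_samples, n_loci))      # 0/1/2 genotypes with -1 missing

targets = torch.zeros(y.shape + (2,))
valid = y != -1
targets[valid & (y != 2), 0] = 1.0                 # REF channel
targets[valid & (y != 0), 1] = 1.0                 # ALT channel

logits = torch.randn(n_samples, n_loci, 2)
pos_weight = torch.tensor([1.0, 1.5])              # e.g. from _compute_pos_weights

bce = F.binary_cross_entropy_with_logits(
    logits, targets, pos_weight=pos_weight, reduction="none"
)
mask = valid.unsqueeze(-1).float()                 # zero out missing genotypes
loss = (bce * mask).sum() / mask.sum().clamp_min(1e-8)
print(float(loss))
```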