pg-sui 0.2.3__py3-none-any.whl → 1.6.14.dev9__py3-none-any.whl
This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.
- {pg_sui-0.2.3.dist-info → pg_sui-1.6.14.dev9.dist-info}/METADATA +99 -77
- pg_sui-1.6.14.dev9.dist-info/RECORD +81 -0
- {pg_sui-0.2.3.dist-info → pg_sui-1.6.14.dev9.dist-info}/WHEEL +1 -1
- pg_sui-1.6.14.dev9.dist-info/entry_points.txt +4 -0
- {pg_sui-0.2.3.dist-info → pg_sui-1.6.14.dev9.dist-info/licenses}/LICENSE +0 -0
- pg_sui-1.6.14.dev9.dist-info/top_level.txt +1 -0
- pgsui/__init__.py +35 -54
- pgsui/_version.py +34 -0
- pgsui/cli.py +909 -0
- pgsui/data_processing/__init__.py +0 -0
- pgsui/data_processing/config.py +565 -0
- pgsui/data_processing/containers.py +1424 -0
- pgsui/data_processing/transformers.py +557 -907
- pgsui/{example_data/trees → electron/app}/__init__.py +0 -0
- pgsui/electron/app/__main__.py +5 -0
- pgsui/electron/app/extra-resources/.gitkeep +1 -0
- pgsui/electron/app/icons/icons/1024x1024.png +0 -0
- pgsui/electron/app/icons/icons/128x128.png +0 -0
- pgsui/electron/app/icons/icons/16x16.png +0 -0
- pgsui/electron/app/icons/icons/24x24.png +0 -0
- pgsui/electron/app/icons/icons/256x256.png +0 -0
- pgsui/electron/app/icons/icons/32x32.png +0 -0
- pgsui/electron/app/icons/icons/48x48.png +0 -0
- pgsui/electron/app/icons/icons/512x512.png +0 -0
- pgsui/electron/app/icons/icons/64x64.png +0 -0
- pgsui/electron/app/icons/icons/icon.icns +0 -0
- pgsui/electron/app/icons/icons/icon.ico +0 -0
- pgsui/electron/app/main.js +227 -0
- pgsui/electron/app/package-lock.json +6894 -0
- pgsui/electron/app/package.json +51 -0
- pgsui/electron/app/preload.js +15 -0
- pgsui/electron/app/server.py +157 -0
- pgsui/electron/app/ui/logo.png +0 -0
- pgsui/electron/app/ui/renderer.js +131 -0
- pgsui/electron/app/ui/styles.css +59 -0
- pgsui/electron/app/ui/ui_shim.js +72 -0
- pgsui/electron/bootstrap.py +43 -0
- pgsui/electron/launch.py +57 -0
- pgsui/electron/package.json +14 -0
- pgsui/example_data/__init__.py +0 -0
- pgsui/example_data/phylip_files/__init__.py +0 -0
- pgsui/example_data/phylip_files/test.phy +0 -0
- pgsui/example_data/popmaps/__init__.py +0 -0
- pgsui/example_data/popmaps/{test.popmap → phylogen_nomx.popmap} +185 -99
- pgsui/example_data/structure_files/__init__.py +0 -0
- pgsui/example_data/structure_files/test.pops.2row.allsites.str +0 -0
- pgsui/example_data/vcf_files/phylogen_subset14K.vcf.gz +0 -0
- pgsui/example_data/vcf_files/phylogen_subset14K.vcf.gz.tbi +0 -0
- pgsui/impute/__init__.py +0 -0
- pgsui/impute/deterministic/imputers/allele_freq.py +725 -0
- pgsui/impute/deterministic/imputers/mode.py +844 -0
- pgsui/impute/deterministic/imputers/nmf.py +221 -0
- pgsui/impute/deterministic/imputers/phylo.py +973 -0
- pgsui/impute/deterministic/imputers/ref_allele.py +669 -0
- pgsui/impute/supervised/__init__.py +0 -0
- pgsui/impute/supervised/base.py +343 -0
- pgsui/impute/{unsupervised/models/in_development → supervised/imputers}/__init__.py +0 -0
- pgsui/impute/supervised/imputers/hist_gradient_boosting.py +317 -0
- pgsui/impute/supervised/imputers/random_forest.py +291 -0
- pgsui/impute/unsupervised/__init__.py +0 -0
- pgsui/impute/unsupervised/base.py +1118 -0
- pgsui/impute/unsupervised/callbacks.py +92 -262
- {simulation → pgsui/impute/unsupervised/imputers}/__init__.py +0 -0
- pgsui/impute/unsupervised/imputers/autoencoder.py +1285 -0
- pgsui/impute/unsupervised/imputers/nlpca.py +1554 -0
- pgsui/impute/unsupervised/imputers/ubp.py +1575 -0
- pgsui/impute/unsupervised/imputers/vae.py +1228 -0
- pgsui/impute/unsupervised/loss_functions.py +261 -0
- pgsui/impute/unsupervised/models/__init__.py +0 -0
- pgsui/impute/unsupervised/models/autoencoder_model.py +215 -567
- pgsui/impute/unsupervised/models/nlpca_model.py +155 -394
- pgsui/impute/unsupervised/models/ubp_model.py +180 -1106
- pgsui/impute/unsupervised/models/vae_model.py +269 -630
- pgsui/impute/unsupervised/nn_scorers.py +255 -0
- pgsui/utils/__init__.py +0 -0
- pgsui/utils/classification_viz.py +608 -0
- pgsui/utils/logging_utils.py +22 -0
- pgsui/utils/misc.py +35 -480
- pgsui/utils/plotting.py +996 -829
- pgsui/utils/pretty_metrics.py +290 -0
- pgsui/utils/scorers.py +213 -666
- pg_sui-0.2.3.dist-info/RECORD +0 -75
- pg_sui-0.2.3.dist-info/top_level.txt +0 -3
- pgsui/example_data/phylip_files/test_n10.phy +0 -118
- pgsui/example_data/phylip_files/test_n100.phy +0 -118
- pgsui/example_data/phylip_files/test_n2.phy +0 -118
- pgsui/example_data/phylip_files/test_n500.phy +0 -118
- pgsui/example_data/structure_files/test.nopops.1row.10sites.str +0 -117
- pgsui/example_data/structure_files/test.nopops.2row.100sites.str +0 -234
- pgsui/example_data/structure_files/test.nopops.2row.10sites.str +0 -234
- pgsui/example_data/structure_files/test.nopops.2row.30sites.str +0 -234
- pgsui/example_data/structure_files/test.nopops.2row.allsites.str +0 -234
- pgsui/example_data/structure_files/test.pops.1row.10sites.str +0 -117
- pgsui/example_data/structure_files/test.pops.2row.10sites.str +0 -234
- pgsui/example_data/trees/test.iqtree +0 -376
- pgsui/example_data/trees/test.qmat +0 -5
- pgsui/example_data/trees/test.rate +0 -2033
- pgsui/example_data/trees/test.tre +0 -1
- pgsui/example_data/trees/test_n10.rate +0 -19
- pgsui/example_data/trees/test_n100.rate +0 -109
- pgsui/example_data/trees/test_n500.rate +0 -509
- pgsui/example_data/trees/test_siterates.txt +0 -2024
- pgsui/example_data/trees/test_siterates_n10.txt +0 -10
- pgsui/example_data/trees/test_siterates_n100.txt +0 -100
- pgsui/example_data/trees/test_siterates_n500.txt +0 -500
- pgsui/example_data/vcf_files/test.vcf +0 -244
- pgsui/example_data/vcf_files/test.vcf.gz +0 -0
- pgsui/example_data/vcf_files/test.vcf.gz.tbi +0 -0
- pgsui/impute/estimators.py +0 -1268
- pgsui/impute/impute.py +0 -1463
- pgsui/impute/simple_imputers.py +0 -1431
- pgsui/impute/supervised/iterative_imputer_fixedparams.py +0 -782
- pgsui/impute/supervised/iterative_imputer_gridsearch.py +0 -1024
- pgsui/impute/unsupervised/keras_classifiers.py +0 -697
- pgsui/impute/unsupervised/models/in_development/cnn_model.py +0 -486
- pgsui/impute/unsupervised/neural_network_imputers.py +0 -1440
- pgsui/impute/unsupervised/neural_network_methods.py +0 -1395
- pgsui/pg_sui.py +0 -261
- pgsui/utils/sequence_tools.py +0 -407
- simulation/sim_benchmarks.py +0 -333
- simulation/sim_treeparams.py +0 -475
- test/__init__.py +0 -0
- test/pg_sui_simtest.py +0 -215
- test/pg_sui_testing.py +0 -523
- test/test.py +0 -151
- test/test_pgsui.py +0 -374
- test/test_tkc.py +0 -185

@@ -1,710 +1,349 @@
-import
-import os
-import sys
-import warnings
+from typing import List, Literal, Tuple
 
-
-
-
-
+import numpy as np
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+from snpio.utils.logging import LoggerManager
+from torch.distributions import Normal
 
-
+from pgsui.impute.unsupervised.loss_functions import MaskedFocalLoss
+from pgsui.utils.logging_utils import configure_logger
 
-# Disable can't find cuda .dll errors. Also turns of GPU support.
-tf.config.set_visible_devices([], "GPU")
 
-
+class Sampling(nn.Module):
+    """A layer that samples from a latent distribution using the reparameterization trick.
 
-
-
-tf.get_logger().setLevel(logging.ERROR)
-
-
-# Monkey patching deprecation utils to supress warnings.
-# noinspection PyUnusedLocal
-def deprecated(
-    date, instructions, warn_once=True
-):  # pylint: disable=unused-argument
-    def deprecated_wrapper(func):
-        return func
-
-    return deprecated_wrapper
-
-
-deprecation.deprecated = deprecated
-
-from tensorflow.keras.layers import (
-    Dropout,
-    Dense,
-    Reshape,
-    Activation,
-    LeakyReLU,
-    PReLU,
-)
-
-from tensorflow.keras.regularizers import l1_l2
-from tensorflow.keras import backend as K
-
-# Custom Modules
-try:
-    from ..neural_network_methods import NeuralNetworkMethods
-except (ModuleNotFoundError, ValueError, ImportError):
-    from impute.unsupervised.neural_network_methods import NeuralNetworkMethods
+    This layer is a core component of a Variational Autoencoder (VAE). It takes the mean and log-variance of a latent distribution as input and generates a sample from that distribution. By using the reparameterization trick ($z = \mu + \sigma \cdot \epsilon$), it allows gradients to be backpropagated through the random sampling process, making the VAE trainable.
+    """
 
+    def forward(self, z_mean: torch.Tensor, z_log_var: torch.Tensor) -> torch.Tensor:
+        """Performs the forward pass to generate a latent sample.
 
-
-
+        Args:
+            z_mean (torch.Tensor): The mean of the latent normal distribution.
+            z_log_var (torch.Tensor): The log of the variance of the latent normal distribution.
 
-
-
-
+        Returns:
+            torch.Tensor: A sampled vector from the latent space.
+        """
+        z_sigma = torch.exp(0.5 * z_log_var)  # Precompute outside
 
-
-
-
-
-        batch = tf.shape(z_mean)[0]
-        dim = tf.shape(z_mean)[1]
-        epsilon = tf.random.normal(shape=(batch, dim))
+        # Ensure on GPU
+        # rand_like takes random values from a normal distribution
+        # of the same shape as z_mean.
+        epsilon = torch.randn_like(z_mean, device=z_mean.device)
         return z_mean + z_sigma * epsilon
 
 
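The new `Sampling` layer replaces the old TensorFlow reparameterization code. A minimal standalone sketch of the same trick in plain PyTorch; the `mu`/`log_var` tensors below are illustrative and not part of the package API:

```python
import torch

# Reparameterization trick: z = mu + sigma * eps, with eps ~ N(0, I).
# Drawing eps outside the graph keeps z differentiable w.r.t. mu and log_var.
mu = torch.zeros(8, 2, requires_grad=True)       # latent means (batch=8, latent_dim=2)
log_var = torch.zeros(8, 2, requires_grad=True)  # latent log-variances

sigma = torch.exp(0.5 * log_var)                 # std dev from log-variance
eps = torch.randn_like(mu)                       # standard-normal noise
z = mu + sigma * eps                             # differentiable latent sample

z.sum().backward()                               # gradients reach mu and log_var
print(mu.grad.shape, log_var.grad.shape)         # torch.Size([8, 2]) torch.Size([8, 2])
```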
-class Encoder(
-    """
-
-    Args:
-        n_features (int): Number of featuresi in input dataset.
-
-        num_classes (int): Number of classes in target data.
-
-        latent_dim (int): Number of latent dimensions to use.
-
-        hidden_layer_sizes (list of int): List of hidden layer sizes to use.
-
-        dropout_rate (float): Dropout rate for Dropout layer.
-
-        activation (str): Hidden activation function to use.
-
-        kernel_initializer (str): Initializer to use for weights.
-
-        kernel_regularizer (tf.keras.regularizers): L1 and/ or L2 objects.
-
-        beta (float, optional): KL divergence beta to use. Defualts to 1.0.
-
-        name (str): Name of model. Defaults to Encoder.
+class Encoder(nn.Module):
+    """The Encoder module of a Variational Autoencoder (VAE).
 
+    This module defines the encoder network, which takes high-dimensional input data and maps it to the parameters of a lower-dimensional latent distribution. The architecture consists of a series of fully-connected hidden layers that process the flattened input. The network culminates in two separate linear layers that output the mean (`z_mean`) and log-variance (`z_log_var`) of the approximate posterior distribution, $q(z|x)$.
     """
 
     def __init__(
         self,
-        n_features,
-        num_classes,
-        latent_dim,
-        hidden_layer_sizes,
-        dropout_rate,
-        activation,
-        kernel_initializer,
-        kernel_regularizer,
-        beta=1.0,
-        name="Encoder",
-        **kwargs,
+        n_features: int,
+        num_classes: int,
+        latent_dim: int,
+        hidden_layer_sizes: List[int],
+        dropout_rate: float,
+        activation: torch.nn.Module,
     ):
-
+        """Initializes the Encoder module.
+
+        Args:
+            n_features (int): The number of features in the input data (e.g., SNPs).
+            num_classes (int): Number of genotype states per locus (2 for haploid, 3 for diploid in practice).
+            latent_dim (int): The dimensionality of the latent space.
+            hidden_layer_sizes (List[int]): A list of integers specifying the size of each hidden layer.
+            dropout_rate (float): The dropout rate for regularization in the hidden layers.
+            activation (torch.nn.Module): An instantiated activation function module (e.g., `nn.ReLU()`) for the hidden layers.
+        """
+        super(Encoder, self).__init__()
+        self.flatten = nn.Flatten()
+        self.activation = (
+            getattr(F, activation) if isinstance(activation, str) else activation
+        )
 
-
+        layers = []
+        # The input dimension accounts for channels
+        input_dim = n_features * num_classes
+        for hidden_size in hidden_layer_sizes:
+            layers.append(nn.Linear(input_dim, hidden_size))
 
-
-
-        self.dense4 = None
-        self.dense5 = None
+            # BatchNorm can lead to faster convergence.
+            layers.append(nn.BatchNorm1d(hidden_size))
 
-
-
+            layers.append(nn.Dropout(dropout_rate))
+            layers.append(activation)
+            input_dim = hidden_size
 
-        self.
-
-
-
-            kernel_initializer=kernel_initializer,
-            kernel_regularizer=kernel_regularizer,
-            name="Encoder1",
-        )
+        self.hidden_layers = nn.Sequential(*layers)
+        self.dense_z_mean = nn.Linear(input_dim, latent_dim)
+        self.dense_z_log_var = nn.Linear(input_dim, latent_dim)
+        self.sampling = Sampling()
 
-
-
-
-
-            kernel_initializer=kernel_initializer,
-            kernel_regularizer=kernel_regularizer,
-            name="Encoder2",
-        )
-
-        if len(hidden_layer_sizes) >= 3:
-            self.dense3 = Dense(
-                hidden_layer_sizes[2],
-                activation=activation,
-                kernel_initializer=kernel_initializer,
-                kernel_regularizer=kernel_regularizer,
-                name="Encoder3",
-            )
-
-        if len(hidden_layer_sizes) >= 4:
-            self.dense4 = Dense(
-                hidden_layer_sizes[3],
-                activation=activation,
-                kernel_initializer=kernel_initializer,
-                kernel_regularizer=kernel_regularizer,
-                name="Encoder4",
-            )
-
-        if len(hidden_layer_sizes) == 5:
-            self.dense5 = Dense(
-                hidden_layer_sizes[4],
-                activation=activation,
-                kernel_initializer=kernel_initializer,
-                kernel_regularizer=kernel_regularizer,
-                name="Encoder5",
-            )
-
-        self.dense_z_mean = Dense(
-            latent_dim,
-            name="z_mean",
-        )
-        self.dense_z_log_var = Dense(
-            latent_dim,
-            name="z_log_var",
-        )
-        # z_mean and z_log_var are inputs.
-        self.sampling = Sampling(
-            name="z",
-        )
+    def forward(
+        self, x: torch.Tensor
+    ) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
+        """Performs the forward pass through the encoder.
 
-
-
-            activation=activation,
-            kernel_initializer=kernel_initializer,
-            kernel_regularizer=kernel_regularizer,
-            name="Encoder5",
-        )
+        Args:
+            x (torch.Tensor): The input data tensor of shape `(batch_size, n_features, num_classes)`.
 
-
-
-
-
-        x = self.
-        x = self.dense1(x)
-        x = self.dropout_layer(x, training=training)
-        if self.dense2 is not None:
-            x = self.dense2(x)
-            x = self.dropout_layer(x, training=training)
-        if self.dense3 is not None:
-            x = self.dense3(x)
-            x = self.dropout_layer(x, training=training)
-        if self.dense4 is not None:
-            x = self.dense4(x)
-            x = self.dropout_layer(x, training=training)
-        if self.dense5 is not None:
-            x = self.dense5(x)
-            x = self.dropout_layer(x, training=training)
-
-        x = self.dense_latent(x)
+        Returns:
+            Tuple[torch.Tensor, torch.Tensor, torch.Tensor]: A tuple containing the latent mean (`z_mean`), latent log-variance (`z_log_var`), and a sample from the latent distribution (`z`).
+        """
+        x = self.flatten(x)
+        x = self.hidden_layers(x)
         z_mean = self.dense_z_mean(x)
         z_log_var = self.dense_z_log_var(x)
-
-        # Compute the KL divergence
-        kl_loss = -0.5 * tf.reduce_sum(
-            1 + z_log_var - tf.square(z_mean) - tf.exp(z_log_var), axis=-1
-        )
-        # Add the KL divergence to the model's total loss
-        self.add_loss(self.beta * tf.reduce_mean(kl_loss))
-
-        z = self.sampling([z_mean, z_log_var])
-
+        z = self.sampling(z_mean, z_log_var)
         return z_mean, z_log_var, z
 
 
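A quick shape check of the rewritten `Encoder` on dummy one-hot genotype data. This is a sketch only, assuming the hunk above is the rewritten `pgsui/impute/unsupervised/models/vae_model.py` listed in the file table; the sizes used are illustrative, not package defaults:

```python
import torch
import torch.nn as nn

# Assumed import path for the module shown in this diff.
from pgsui.impute.unsupervised.models.vae_model import Encoder

enc = Encoder(
    n_features=100,            # number of loci
    num_classes=3,             # diploid genotype states per locus
    latent_dim=2,
    hidden_layer_sizes=[128, 64],
    dropout_rate=0.2,
    activation=nn.ReLU(),      # instantiated module, per the new signature
)

x = torch.randn(16, 100, 3)    # (batch_size, n_features, num_classes)
z_mean, z_log_var, z = enc(x)
print(z_mean.shape, z_log_var.shape, z.shape)  # each torch.Size([16, 2])
```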
-class Decoder(
-    """
-
-    Args:
-        n_features (int): Number of features in input dataset.
+class Decoder(nn.Module):
+    """The Decoder module of a Variational Autoencoder (VAE).
 
-
-
-        latent_dim (int): Number of latent dimensions to use.
-
-        hidden_layer_sizes (list of int): List of hidden layer sizes to use.
-
-        dropout_rate (float): Dropout rate for Dropout layer.
-
-        activation (str): Hidden activation function to use.
-
-        kernel initializer (str): Function for initilizing weights.
-
-        kernel_regularizer (tf.keras.regularizer): Initialized L1 and/ or L2 regularizer.
-
-        name (str): Name of model. Defaults to "Decoder".
+    This module defines the decoder network, which takes a sample from the low-dimensional latent space and maps it back to the high-dimensional data space. It aims to reconstruct the original input data. The architecture consists of a series of fully-connected hidden layers followed by a final linear layer that produces the reconstructed data, which is then reshaped to match the original input's dimensions.
     """
 
     def __init__(
         self,
-        n_features,
-        num_classes,
-        latent_dim,
-        hidden_layer_sizes,
-        dropout_rate,
-        activation,
-
-
-
-
-
-
-
-
-
-
-
-
-        self.dense1 = Dense(
-            hidden_layer_sizes[0],
-            input_shape=(latent_dim,),
-            activation=activation,
-            kernel_initializer=kernel_initializer,
-            kernel_regularizer=kernel_regularizer,
-            name="Decoder1",
-        )
-
-        if len(hidden_layer_sizes) >= 2:
-            self.dense2 = Dense(
-                hidden_layer_sizes[1],
-                activation=activation,
-                kernel_initializer=kernel_initializer,
-                kernel_regularizer=kernel_regularizer,
-                name="Decoder2",
-            )
-
-        if len(hidden_layer_sizes) >= 3:
-            self.dense3 = Dense(
-                hidden_layer_sizes[2],
-                activation=activation,
-                kernel_initializer=kernel_initializer,
-                kernel_regularizer=kernel_regularizer,
-                name="Decoder3",
-            )
-
-        if len(hidden_layer_sizes) >= 4:
-            self.dense4 = Dense(
-                hidden_layer_sizes[3],
-                activation=activation,
-                kernel_initializer=kernel_initializer,
-                kernel_regularizer=kernel_regularizer,
-                name="Decoder4",
-            )
-
-        if len(hidden_layer_sizes) == 5:
-            self.dense5 = Dense(
-                hidden_layer_sizes[4],
-                activation=activation,
-                kernel_initializer=kernel_initializer,
-                kernel_regularizer=kernel_regularizer,
-                name="Decoder5",
-            )
-
-        # No activation for final layer.
-        self.dense_output = Dense(
-            n_features * num_classes,
-            kernel_initializer=kernel_initializer,
-            kernel_regularizer=kernel_regularizer,
-            name="DecoderExpanded",
-        )
-
-        self.rshp = Reshape((n_features, num_classes))
-
-        self.dropout_layer = Dropout(dropout_rate)
-
-    def call(self, inputs, training=None):
-        """Forward pass for model."""
-        x = self.dense1(inputs)
-        x = self.dropout_layer(x, training=training)
-        if self.dense2 is not None:
-            x = self.dense2(x)
-            x = self.dropout_layer(x, training=training)
-        if self.dense3 is not None:
-            x = self.dense3(x)
-            x = self.dropout_layer(x, training=training)
-        if self.dense4 is not None:
-            x = self.dense4(x)
-            x = self.dropout_layer(x, training=training)
-        if self.dense5 is not None:
-            x = self.dense5(x)
-            x = self.dropout_layer(x, training=training)
-
-        x = self.dense_output(x)
-        return self.rshp(x)
-
-
-class VAEModel(tf.keras.Model):
-    """Variational Autoencoder model. Runs the encdoer and decoder and outputs the reconsruction.
-
-    Args:
-        output_shape (tuple): Shape of output. Defaults to None.
-
-        n_components (int): Number of latent dimensions to use. Defaults to 3.
-
-        weights_initializer (str, optional): kernel initializer to use. Defaults to "glorot_normal".
-
-        hidden_layer_sizes (str or list, optional): List of hidden layer sizes to use, or can use "midpoint", "log2", or "sqrt". Defaults to "midpoint".
-
-        num_hidden_layers (int, optional): Number of hidden layers to use. Defaults to 1.
-
-        hidden_activation (str, optional): Hidden activation function to use. Defaults to "elu".
+        n_features: int,
+        num_classes: int,
+        latent_dim: int,
+        hidden_layer_sizes: List[int],
+        dropout_rate: float,
+        activation: torch.nn.Module,
+    ) -> None:
+        """Initializes the Decoder module.
+
+        Args:
+            n_features (int): The number of features in the output data (e.g., SNPs).
+            num_classes (int): Number of genotype states per locus (typically 2 or 3).
+            latent_dim (int): The dimensionality of the input latent space.
+            hidden_layer_sizes (List[int]): A list of integers specifying the size of each hidden layer.
+            dropout_rate (float): The dropout rate for regularization in the hidden layers.
+            activation (torch.nn.Module): An instantiated activation function module (e.g., `nn.ReLU()`) for the hidden layers.
+        """
+        super(Decoder, self).__init__()
 
-
+        layers = []
+        input_dim = latent_dim
+        for hidden_size in hidden_layer_sizes:
+            layers.append(nn.Linear(input_dim, hidden_size))
 
-
+            # BatchNorm can lead to faster convergence.
+            layers.append(nn.BatchNorm1d(hidden_size))
 
-
+            layers.append(nn.Dropout(dropout_rate))
+            layers.append(activation)
+            input_dim = hidden_size
 
-
+        self.hidden_layers = nn.Sequential(*layers)
+        # UPDATED: Output dimension must account for channels
+        output_dim = n_features * num_classes
+        self.dense_output = nn.Linear(input_dim, output_dim)
+        # UPDATED: Reshape must account for channels
+        self.reshape = (n_features, num_classes)
 
-
+    def forward(self, x: torch.Tensor) -> torch.Tensor:
+        """Performs the forward pass through the decoder.
 
-
+        Args:
+            x (torch.Tensor): The input latent tensor of shape `(batch_size, latent_dim)`.
 
-
+        Returns:
+            torch.Tensor: The reconstructed output data of shape `(batch_size, n_features, num_classes)`.
+        """
+        x = self.hidden_layers(x)
+        x = self.dense_output(x)
+        return x.view(-1, *self.reshape)
 
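The matching `Decoder` round trip, mapping latent samples back to per-locus class logits, under the same assumptions as the encoder sketch above:

```python
import torch
import torch.nn as nn

from pgsui.impute.unsupervised.models.vae_model import Decoder  # assumed path

dec = Decoder(
    n_features=100,
    num_classes=3,
    latent_dim=2,
    hidden_layer_sizes=[64, 128],  # reversed encoder sizes, as VAEModel does below
    dropout_rate=0.2,
    activation=nn.ReLU(),
)

z = torch.randn(16, 2)             # latent samples
logits = dec(z)                    # flat output reshaped to per-locus logits
print(logits.shape)                # torch.Size([16, 100, 3])
```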
-        batch_size (int, optional): Batch size to use for training. Defaults to 32.
 
-
+class VAEModel(nn.Module):
+    """A Variational Autoencoder (VAE) model for imputation.
 
-
+    This class combines an `Encoder` and a `Decoder` to form a VAE, a generative model for learning complex data distributions. It is designed for imputing missing values in categorical data, such as genomic SNPs. The model is trained by maximizing the Evidence Lower Bound (ELBO), which is a lower bound on the log-likelihood of the data.
 
+    **Objective Function (ELBO):**
+    The VAE loss function is derived from the ELBO and consists of two main components: a reconstruction term and a regularization term.
+    $$
+    \\mathcal{L}(\\theta, \\phi; x) = \\underbrace{\\mathbb{E}_{q_{\\phi}(z|x)}[\\log p_{\\theta}(x|z)]}_{\\text{Reconstruction Loss}} - \\underbrace{D_{KL}(q_{\\phi}(z|x) || p(z))}_{\\text{KL Divergence}}
+    $$
+    - The **Reconstruction Loss** encourages the decoder to accurately reconstruct the input data from its latent representation. This implementation uses a `MaskedFocalLoss`.
+    - The **KL Divergence** acts as a regularizer, forcing the approximate posterior distribution $q_{\\phi}(z|x)$ learned by the encoder to be close to a prior distribution $p(z)$ (typically a standard normal distribution).
     """
 
     def __init__(
         self,
-
-
-
-
-
-
-
-
-
-
-
-
-
-        batch_size=32,
-        final_activation=None,
-        y=None,
+        n_features: int,
+        prefix: str,
+        *,
+        num_classes: int = 4,
+        hidden_layer_sizes: List[int] | np.ndarray = [128, 64],
+        latent_dim: int = 2,
+        dropout_rate: float = 0.2,
+        activation: Literal["relu", "elu", "selu", "leaky_relu"] = "relu",
+        gamma: float = 2.0,
+        beta: float = 1.0,
+        device: Literal["cpu", "gpu", "mps"] = "cpu",
+        verbose: bool = False,
+        debug: bool = False,
     ):
+        """Initializes the VAEModel.
+
+        Args:
+            n_features (int): The number of features in the input data (e.g., SNPs).
+            prefix (str): A prefix used for logging.
+            num_classes (int): Number of genotype states per locus. Defaults to 4 for backward compatibility, though the imputer passes 2 (haploid) or 3 (diploid).
+            hidden_layer_sizes (List[int] | np.ndarray): A list of integers specifying the size of each hidden layer in the encoder and decoder. Defaults to [128, 64].
+            latent_dim (int): The dimensionality of the latent space. Defaults to 2.
+            dropout_rate (float): The dropout rate for regularization in the hidden layers. Defaults to 0.2.
+            activation (str): The name of the activation function to use in hidden layers. Defaults to "relu".
+            gamma (float): The focusing parameter for the focal loss component. Defaults to 2.0.
+            beta (float): A weighting factor for the KL divergence term in the total loss ($\beta$-VAE). Defaults to 1.0.
+            device (Literal["cpu", "gpu", "mps"]): The device to run the model on.
+            verbose (bool): If True, enables detailed logging. Defaults to False.
+            debug (bool): If True, enables debug mode. Defaults to False.
+        """
         super(VAEModel, self).__init__()
-
-        self.kl_beta = K.variable(0.0)
-        self.kl_beta._trainable = False
-
-        self._sample_weight = sample_weight
-        self._missing_mask = missing_mask
-        self._batch_idx = 0
-        self._batch_size = batch_size
-        self._y = y
-
-        self._final_activation = final_activation
-        if num_classes == 10 or num_classes == 3:
-            self.acc_func = tf.keras.metrics.categorical_accuracy
-        elif num_classes == 4:
-            self.acc_func = tf.keras.metrics.binary_accuracy
-
-        self.nn_ = NeuralNetworkMethods()
-
-        self.total_loss_tracker = tf.keras.metrics.Mean(name="loss")
-        self.reconstruction_loss_tracker = tf.keras.metrics.Mean(
-            name="reconstruction_loss"
-        )
-        # self.kl_loss_tracker = tf.keras.metrics.Mean(name="kl_loss")
-        self.accuracy_tracker = tf.keras.metrics.Mean(name="accuracy")
-
-        # y_train[1] dimension.
-        self.n_features = output_shape
-
-        self.n_components = n_components
-        self.weights_initializer = weights_initializer
-        self.hidden_layer_sizes = hidden_layer_sizes
-        self.num_hidden_layers = num_hidden_layers
-        self.hidden_activation = hidden_activation
-        self.l1_penalty = l1_penalty
-        self.l2_penalty = l2_penalty
-        self.dropout_rate = dropout_rate
         self.num_classes = num_classes
+        self.gamma = gamma
+        self.beta = beta
+        self.device = device
 
-
-
-        hidden_layer_sizes = nn.validate_hidden_layers(
-            self.hidden_layer_sizes, self.num_hidden_layers
+        logman = LoggerManager(
+            name=__name__, prefix=prefix, verbose=verbose, debug=debug
         )
-
-
-            self.n_features, self.n_components, hidden_layer_sizes, vae=True
+        self.logger = configure_logger(
+            logman.get_logger(), verbose=verbose, debug=debug
         )
 
-
+        act = self._resolve_activation(activation)
 
-        if
-
+        if isinstance(hidden_layer_sizes, np.ndarray):
+            hls = hidden_layer_sizes.tolist()
         else:
-
-
-            kernel_initializer = self.weights_initializer
-
-        if self.hidden_activation.lower() == "leaky_relu":
-            activation = LeakyReLU(alpha=0.01)
-
-        elif self.hidden_activation.lower() == "prelu":
-            activation = PReLU()
-
-        elif self.hidden_activation.lower() == "selu":
-            activation = "selu"
-            kernel_initializer = "lecun_normal"
-
-        else:
-            activation = self.hidden_activation
-
-        if num_hidden_layers > 5:
-            raise ValueError(
-                f"The maximum number of hidden layers is 5, but got "
-                f"{num_hidden_layers}"
-            )
+            hls = hidden_layer_sizes
 
         self.encoder = Encoder(
-            self.
-            self.num_classes,
-            self.n_components,
-            hidden_layer_sizes,
-            self.dropout_rate,
-            activation,
-            kernel_initializer,
-            kernel_regularizer,
-            beta=self.kl_beta,
+            n_features, self.num_classes, latent_dim, hls, dropout_rate, act
         )
 
-
+        decoder_layer_sizes = list(reversed(hls))
 
         self.decoder = Decoder(
-
+            n_features,
             self.num_classes,
-
-
-
-
-            kernel_initializer,
-            kernel_regularizer,
+            latent_dim,
+            decoder_layer_sizes,
+            dropout_rate,
+            act,
         )
 
-
-
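Construction of the rewritten `VAEModel` now goes through keyword-only hyperparameters instead of the old Keras-style arguments. A hedged usage sketch; values are illustrative, and the logger setup relies on snpio's `LoggerManager` as imported at the top of the module:

```python
from pgsui.impute.unsupervised.models.vae_model import VAEModel  # assumed path

model = VAEModel(
    n_features=100,            # number of loci
    prefix="pgsui",            # prefix used for logging
    num_classes=3,             # diploid genotype states
    hidden_layer_sizes=[128, 64],
    latent_dim=2,
    dropout_rate=0.2,
    activation="relu",         # resolved to an nn.ReLU() module internally
    gamma=2.0,                 # focal-loss focusing parameter
    beta=1.0,                  # weight on the KL term (beta-VAE)
    device="cpu",
)
```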
+    def forward(
+        self, x: torch.Tensor
+    ) -> Tuple[torch.Tensor, torch.Tensor, torch.Tensor]:
+        """Performs the forward pass through the full VAE model.
 
-
-
-        z_mean, z_log_var, z = self.encoder(inputs)
-        reconstruction = self.decoder(z)
-        if self._final_activation is not None:
-            reconstruction = self.act(reconstruction)
-        return reconstruction
+        Args:
+            x (torch.Tensor): The input data tensor of shape `(batch_size, n_features, num_classes)`.
 
-
-
-        :noindex:
+        Returns:
+            Tuple[torch.Tensor, torch.Tensor, torch.Tensor]: A tuple containing the reconstructed output, the latent mean (`z_mean`), and the latent log-variance (`z_log_var`).
         """
-
-
+        z_mean, z_log_var, z = self.encoder(x)
+        reconstruction = self.decoder(z)
+        return reconstruction, z_mean, z_log_var
 
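As the forward docstring notes, the model returns per-locus class logits plus the latent parameters; imputed genotype calls are then simply the arg-max over the class dimension. A sketch, reusing the `model` built above:

```python
import torch

model.eval()
with torch.no_grad():
    X = torch.randn(16, 100, 3)                     # (batch, loci, classes) input
    reconstruction, z_mean, z_log_var = model(X)
    genotype_calls = reconstruction.argmax(dim=-1)  # most probable class per locus

print(genotype_calls.shape)                         # torch.Size([16, 100])
```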
-    def
-
-    :
+    def compute_loss(
+        self,
+        outputs: Tuple[torch.Tensor, torch.Tensor, torch.Tensor],
+        y: torch.Tensor,
+        mask: torch.Tensor | None = None,
+        class_weights: torch.Tensor | None = None,
+    ) -> torch.Tensor:
+        """Computes the VAE loss function (negative ELBO).
+
+        The loss is the sum of a reconstruction term and a regularizing KL divergence term. The reconstruction loss is calculated using a masked focal loss, and the KL divergence measures the difference between the learned latent distribution and a standard normal prior.
+
+        Args:
+            outputs (Tuple[torch.Tensor, torch.Tensor, torch.Tensor]): The tuple of (reconstruction, z_mean, z_log_var) from the model's forward pass.
+            y (torch.Tensor): The target data tensor, expected to be one-hot encoded. This is converted to class indices internally for the loss function.
+            mask (torch.Tensor | None): A boolean mask to exclude missing values from the reconstruction loss.
+            class_weights (torch.Tensor | None): Weights to apply to each class in the reconstruction loss to handle imbalance.
+
+        Returns:
+            torch.Tensor: The computed scalar loss value.
         """
-
-
-
-
-
-
-
-        return [
-            self.total_loss_tracker,
-            self.reconstruction_loss_tracker,
-            # self.kl_loss_tracker,
-            self.accuracy_tracker,
-        ]
-
-    @tf.function
-    def train_step(self, data):
-        y = self._y
-
-        (
-            y_true,
-            sample_weight,
-            missing_mask,
-        ) = self.nn_.prepare_training_batches(
-            y,
-            y,
-            self._batch_size,
-            self._batch_idx,
-            True,
-            self.n_components,
-            self._sample_weight,
-            self._missing_mask,
-            ubp=False,
+        reconstruction, z_mean, z_log_var = outputs
+
+        # 1. KL Divergence Calculation
+        prior = Normal(torch.zeros_like(z_mean), torch.ones_like(z_log_var))
+        posterior = Normal(z_mean, torch.exp(0.5 * z_log_var))
+        kl_loss = (
+            torch.distributions.kl.kl_divergence(posterior, prior).sum(dim=1).mean()
         )
 
-        if
-
-
-
+        if class_weights is None:
+            class_weights = torch.ones(self.num_classes, device=y.device)
+
+        # 2. Reconstruction Loss Calculation
+        # Reverting to the robust method of flattening tensors and using the
+        # custom loss function.
+        n_classes = reconstruction.shape[-1]
+        logits_flat = reconstruction.reshape(-1, n_classes)
+
+        # Convert one-hot `y` to class indices for the loss function.
+        targets_flat = torch.argmax(y, dim=-1).reshape(-1)
+
+        if mask is None:
+            # If no mask is provided, all targets are considered valid.
+            mask_flat = torch.ones_like(targets_flat, dtype=torch.bool)
         else:
-
+            # The mask needs to be reshaped to match the flattened targets.
+            mask_flat = mask.reshape(-1)
 
-
-
-            tf.reduce_any(tf.not_equal(y_true, -1), axis=-1),
-        )
+        # Logits, class-index targets, and the valid mask.
+        criterion = MaskedFocalLoss(alpha=class_weights, gamma=self.gamma)
 
-
-
-
-
-            reconstruction,
-            tf.reduce_any(tf.not_equal(y_true, -1), axis=-1),
-        )
-
-        # Returns binary crossentropy loss.
-        reconstruction_loss = self.compiled_loss(
-            y_true_masked,
-            y_pred_masked,
-            sample_weight=sample_weight_masked,
-        )
-
-        # Doesn't include KL Divergence Loss.
-        regularization_loss = sum(self.losses)
-
-        total_loss = reconstruction_loss + regularization_loss
-
-        grads = tape.gradient(total_loss, self.trainable_variables)
-        self.optimizer.apply_gradients(zip(grads, self.trainable_variables))
-
-        ### NOTE: If you get the error, "'tuple' object has no attribute
-        ### 'rank', then convert y_true to a tensor object."
-        # self.compiled_metrics.update_state(
-        self.accuracy_tracker.update_state(
-            self.acc_func(
-                y_true_masked,
-                y_pred_masked,
-            )
+        reconstruction_loss = criterion(
+            logits_flat.to(self.device),
+            targets_flat.to(self.device),
+            valid_mask=mask_flat.to(self.device),
         )
 
-        self.
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-        #     y,
-        #     reconstruction,
-        #     sample_weight=sample_weight_masked,
-        # )
-
-        # # Includes KL Divergence Loss.
-        # regularization_loss = sum(self.losses)
-
-        # total_loss = reconstruction_loss + regularization_loss
-
-        # self.accuracy_tracker.update_state(
-        #     self.cateogrical_accuracy(
-        #         y,
-        #         reconstruction,
-        #         sample_weight=sample_weight_masked,
-        #     )
-        # )
-
-        # self.total_loss_tracker.update_state(total_loss)
-        # self.reconstruction_loss_tracker.update_state(reconstruction_loss)
-        # self.kl_loss_tracker.update_state(regularization_loss)
-
-        # return {
-        #     "loss": self.total_loss_tracker.result(),
-        #     "reconstruction_loss": self.reconstruction_loss_tracker.result(),
-        #     "kl_loss": self.kl_loss_tracker.result(),
-        #     "accuracy": self.accuracy_tracker.result(),
-        # }
-
-    @property
-    def batch_size(self):
-        """Batch (=step) size per epoch."""
-        return self._batch_size
-
-    @property
-    def batch_idx(self):
-        """Current batch (=step) index."""
-        return self._batch_idx
-
-    @property
-    def y(self):
-        return self._y
-
-    @property
-    def missing_mask(self):
-        return self._missing_mask
-
-    @property
-    def sample_weight(self):
-        return self._sample_weight
-
-    @batch_size.setter
-    def batch_size(self, value):
-        """Set batch_size parameter."""
-        self._batch_size = int(value)
-
-    @batch_idx.setter
-    def batch_idx(self, value):
-        """Set current batch (=step) index."""
-        self._batch_idx = int(value)
-
-    @y.setter
-    def y(self, value):
-        """Set y after each epoch."""
-        self._y = value
-
-    @missing_mask.setter
-    def missing_mask(self, value):
-        """Set y after each epoch."""
-        self._missing_mask = value
-
-    @sample_weight.setter
-    def sample_weight(self, value):
-        self._sample_weight = value
+        return reconstruction_loss + self.beta * kl_loss
+
+    def _resolve_activation(
+        self, activation: Literal["relu", "elu", "leaky_relu", "selu"]
+    ) -> torch.nn.Module:
+        """Resolves an activation function module from a string name.
+
+        Args:
+            activation (Literal["relu", "elu", "leaky_relu", "selu"]): The name of the activation function.
+
+        Returns:
+            torch.nn.Module: The corresponding instantiated PyTorch activation function module.
+
+        Raises:
+            ValueError: If the provided activation name is not supported.
+        """
+        if isinstance(activation, str):
+            a = activation.lower()
+            if a == "relu":
+                return nn.ReLU()
+            elif a == "elu":
+                return nn.ELU()
+            elif a in {"leaky_relu", "leakyrelu"}:
+                return nn.LeakyReLU()
+            elif a == "selu":
+                return nn.SELU()
+            else:
+                msg = f"Activation {activation} not supported."
+                self.logger.error(msg)
+                raise ValueError(msg)