pg-sui 0.2.0-py3-none-any.whl → 1.6.14.dev9-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {pg_sui-0.2.0.dist-info → pg_sui-1.6.14.dev9.dist-info}/METADATA +101 -79
- pg_sui-1.6.14.dev9.dist-info/RECORD +81 -0
- {pg_sui-0.2.0.dist-info → pg_sui-1.6.14.dev9.dist-info}/WHEEL +1 -1
- pg_sui-1.6.14.dev9.dist-info/entry_points.txt +4 -0
- {pg_sui-0.2.0.dist-info → pg_sui-1.6.14.dev9.dist-info/licenses}/LICENSE +0 -0
- pg_sui-1.6.14.dev9.dist-info/top_level.txt +1 -0
- pgsui/__init__.py +35 -54
- pgsui/_version.py +34 -0
- pgsui/cli.py +909 -0
- pgsui/data_processing/__init__.py +0 -0
- pgsui/data_processing/config.py +565 -0
- pgsui/data_processing/containers.py +1424 -0
- pgsui/data_processing/transformers.py +557 -907
- pgsui/{example_data/trees → electron/app}/__init__.py +0 -0
- pgsui/electron/app/__main__.py +5 -0
- pgsui/electron/app/extra-resources/.gitkeep +1 -0
- pgsui/electron/app/icons/icons/1024x1024.png +0 -0
- pgsui/electron/app/icons/icons/128x128.png +0 -0
- pgsui/electron/app/icons/icons/16x16.png +0 -0
- pgsui/electron/app/icons/icons/24x24.png +0 -0
- pgsui/electron/app/icons/icons/256x256.png +0 -0
- pgsui/electron/app/icons/icons/32x32.png +0 -0
- pgsui/electron/app/icons/icons/48x48.png +0 -0
- pgsui/electron/app/icons/icons/512x512.png +0 -0
- pgsui/electron/app/icons/icons/64x64.png +0 -0
- pgsui/electron/app/icons/icons/icon.icns +0 -0
- pgsui/electron/app/icons/icons/icon.ico +0 -0
- pgsui/electron/app/main.js +227 -0
- pgsui/electron/app/package-lock.json +6894 -0
- pgsui/electron/app/package.json +51 -0
- pgsui/electron/app/preload.js +15 -0
- pgsui/electron/app/server.py +157 -0
- pgsui/electron/app/ui/logo.png +0 -0
- pgsui/electron/app/ui/renderer.js +131 -0
- pgsui/electron/app/ui/styles.css +59 -0
- pgsui/electron/app/ui/ui_shim.js +72 -0
- pgsui/electron/bootstrap.py +43 -0
- pgsui/electron/launch.py +57 -0
- pgsui/electron/package.json +14 -0
- pgsui/example_data/__init__.py +0 -0
- pgsui/example_data/phylip_files/__init__.py +0 -0
- pgsui/example_data/phylip_files/test.phy +0 -0
- pgsui/example_data/popmaps/__init__.py +0 -0
- pgsui/example_data/popmaps/{test.popmap → phylogen_nomx.popmap} +185 -99
- pgsui/example_data/structure_files/__init__.py +0 -0
- pgsui/example_data/structure_files/test.pops.2row.allsites.str +0 -0
- pgsui/example_data/vcf_files/phylogen_subset14K.vcf.gz +0 -0
- pgsui/example_data/vcf_files/phylogen_subset14K.vcf.gz.tbi +0 -0
- pgsui/impute/__init__.py +0 -0
- pgsui/impute/deterministic/imputers/allele_freq.py +725 -0
- pgsui/impute/deterministic/imputers/mode.py +844 -0
- pgsui/impute/deterministic/imputers/nmf.py +221 -0
- pgsui/impute/deterministic/imputers/phylo.py +973 -0
- pgsui/impute/deterministic/imputers/ref_allele.py +669 -0
- pgsui/impute/supervised/__init__.py +0 -0
- pgsui/impute/supervised/base.py +343 -0
- pgsui/impute/{unsupervised/models/in_development → supervised/imputers}/__init__.py +0 -0
- pgsui/impute/supervised/imputers/hist_gradient_boosting.py +317 -0
- pgsui/impute/supervised/imputers/random_forest.py +291 -0
- pgsui/impute/unsupervised/__init__.py +0 -0
- pgsui/impute/unsupervised/base.py +1118 -0
- pgsui/impute/unsupervised/callbacks.py +92 -262
- {simulation → pgsui/impute/unsupervised/imputers}/__init__.py +0 -0
- pgsui/impute/unsupervised/imputers/autoencoder.py +1285 -0
- pgsui/impute/unsupervised/imputers/nlpca.py +1554 -0
- pgsui/impute/unsupervised/imputers/ubp.py +1575 -0
- pgsui/impute/unsupervised/imputers/vae.py +1228 -0
- pgsui/impute/unsupervised/loss_functions.py +261 -0
- pgsui/impute/unsupervised/models/__init__.py +0 -0
- pgsui/impute/unsupervised/models/autoencoder_model.py +215 -567
- pgsui/impute/unsupervised/models/nlpca_model.py +155 -394
- pgsui/impute/unsupervised/models/ubp_model.py +180 -1106
- pgsui/impute/unsupervised/models/vae_model.py +269 -630
- pgsui/impute/unsupervised/nn_scorers.py +255 -0
- pgsui/utils/__init__.py +0 -0
- pgsui/utils/classification_viz.py +608 -0
- pgsui/utils/logging_utils.py +22 -0
- pgsui/utils/misc.py +35 -480
- pgsui/utils/plotting.py +996 -829
- pgsui/utils/pretty_metrics.py +290 -0
- pgsui/utils/scorers.py +213 -666
- pg_sui-0.2.0.dist-info/RECORD +0 -75
- pg_sui-0.2.0.dist-info/top_level.txt +0 -3
- pgsui/example_data/phylip_files/test_n10.phy +0 -118
- pgsui/example_data/phylip_files/test_n100.phy +0 -118
- pgsui/example_data/phylip_files/test_n2.phy +0 -118
- pgsui/example_data/phylip_files/test_n500.phy +0 -118
- pgsui/example_data/structure_files/test.nopops.1row.10sites.str +0 -117
- pgsui/example_data/structure_files/test.nopops.2row.100sites.str +0 -234
- pgsui/example_data/structure_files/test.nopops.2row.10sites.str +0 -234
- pgsui/example_data/structure_files/test.nopops.2row.30sites.str +0 -234
- pgsui/example_data/structure_files/test.nopops.2row.allsites.str +0 -234
- pgsui/example_data/structure_files/test.pops.1row.10sites.str +0 -117
- pgsui/example_data/structure_files/test.pops.2row.10sites.str +0 -234
- pgsui/example_data/trees/test.iqtree +0 -376
- pgsui/example_data/trees/test.qmat +0 -5
- pgsui/example_data/trees/test.rate +0 -2033
- pgsui/example_data/trees/test.tre +0 -1
- pgsui/example_data/trees/test_n10.rate +0 -19
- pgsui/example_data/trees/test_n100.rate +0 -109
- pgsui/example_data/trees/test_n500.rate +0 -509
- pgsui/example_data/trees/test_siterates.txt +0 -2024
- pgsui/example_data/trees/test_siterates_n10.txt +0 -10
- pgsui/example_data/trees/test_siterates_n100.txt +0 -100
- pgsui/example_data/trees/test_siterates_n500.txt +0 -500
- pgsui/example_data/vcf_files/test.vcf +0 -244
- pgsui/example_data/vcf_files/test.vcf.gz +0 -0
- pgsui/example_data/vcf_files/test.vcf.gz.tbi +0 -0
- pgsui/impute/estimators.py +0 -1268
- pgsui/impute/impute.py +0 -1463
- pgsui/impute/simple_imputers.py +0 -1431
- pgsui/impute/supervised/iterative_imputer_fixedparams.py +0 -782
- pgsui/impute/supervised/iterative_imputer_gridsearch.py +0 -1024
- pgsui/impute/unsupervised/keras_classifiers.py +0 -697
- pgsui/impute/unsupervised/models/in_development/cnn_model.py +0 -486
- pgsui/impute/unsupervised/neural_network_imputers.py +0 -1440
- pgsui/impute/unsupervised/neural_network_methods.py +0 -1395
- pgsui/pg_sui.py +0 -261
- pgsui/utils/sequence_tools.py +0 -407
- simulation/sim_benchmarks.py +0 -333
- simulation/sim_treeparams.py +0 -475
- test/__init__.py +0 -0
- test/pg_sui_simtest.py +0 -215
- test/pg_sui_testing.py +0 -523
- test/test.py +0 -151
- test/test_pgsui.py +0 -374
- test/test_tkc.py +0 -185
pgsui/impute/unsupervised/nn_scorers.py (ADDED)

```diff
@@ -0,0 +1,255 @@
+from typing import TYPE_CHECKING, Dict, Literal
+
+import numpy as np
+import pandas as pd
+from sklearn.metrics import (
+    accuracy_score,
+    average_precision_score,
+    f1_score,
+    precision_score,
+    recall_score,
+    roc_auc_score,
+)
+from snpio.utils.logging import LoggerManager
+from torch import Tensor
+
+from pgsui.utils.logging_utils import configure_logger
+from pgsui.utils.misc import validate_input_type
+
+
+class Scorer:
+    """Class for evaluating the performance of a model using various metrics.
+
+    This module provides a unified interface for computing common evaluation metrics. It supports accuracy, F1 score, precision, recall, ROC AUC, average precision, and macro-average precision. The class can handle both raw and one-hot encoded labels and includes options for logging and averaging methods.
+    """
+
+    def __init__(
+        self,
+        prefix: str,
+        average: Literal["weighted", "macro", "micro"] = "macro",
+        verbose: bool = False,
+        debug: bool = False,
+    ) -> None:
+        """Initialize a Scorer object.
+
+        This class provides a unified interface for computing common evaluation metrics. It supports accuracy, F1 score, precision, recall, ROC AUC, average precision, and macro-average precision. The class can handle both raw and one-hot encoded labels and includes options for logging and averaging methods.
+
+        Args:
+            prefix (str): The prefix to use for logging.
+            average (Literal["weighted", "macro", "micro"]): The averaging method to use for metrics. Must be one of 'micro', 'macro', or 'weighted'. Defaults to 'macro'.
+            verbose (bool): If True, enable verbose logging. Defaults to False.
+            debug (bool): If True, enable debug logging. Defaults to False.
+        """
+        logman = LoggerManager(
+            name=__name__, prefix=prefix, debug=debug, verbose=verbose
+        )
+        self.logger = configure_logger(
+            logman.get_logger(), verbose=verbose, debug=debug
+        )
+
+        if average not in {"weighted", "micro", "macro"}:
+            msg = f"Invalid average parameter: {average}. Must be one of 'micro', 'macro', or 'weighted'."
+            self.logger.error(msg)
+            raise ValueError(msg)
+
+        self.average: Literal["micro", "macro", "weighted"] = average
+
+    def accuracy(self, y_true: np.ndarray, y_pred: np.ndarray) -> float:
+        """Compute the accuracy score.
+
+        Args:
+            y_true (np.ndarray): Ground truth (correct) target values.
+            y_pred (np.ndarray): Estimated target values.
+
+        Returns:
+            float: The accuracy score.
+        """
+        return float(accuracy_score(y_true, y_pred))
+
+    def f1(self, y_true: np.ndarray, y_pred: np.ndarray) -> float:
+        """Compute the F1 score.
+
+        Args:
+            y_true (np.ndarray): Ground truth (correct) target values.
+            y_pred (np.ndarray): Estimated target values.
+
+        Returns:
+            float: The F1 score.
+        """
+        return float(f1_score(y_true, y_pred, average=self.average, zero_division=0))
+
+    def precision(self, y_true: np.ndarray, y_pred: np.ndarray) -> float:
+        """Compute the precision score.
+
+        Args:
+            y_true (np.ndarray): Ground truth (correct) target values.
+            y_pred (np.ndarray): Estimated target values.
+
+        Returns:
+            float: The precision score.
+        """
+        return float(
+            precision_score(y_true, y_pred, average=self.average, zero_division=0)
+        )
+
+    def recall(self, y_true: np.ndarray, y_pred: np.ndarray) -> float:
+        """Compute the recall score.
+
+        Args:
+            y_true (np.ndarray): Ground truth (correct) target values.
+            y_pred (np.ndarray): Estimated target values.
+
+        Returns:
+            float: The recall score.
+        """
+        return float(
+            recall_score(y_true, y_pred, average=self.average, zero_division=0)
+        )
+
+    def roc_auc(self, y_true: np.ndarray, y_pred_proba: np.ndarray) -> float:
+        """Compute the ROC AUC score.
+
+        Args:
+            y_true (np.ndarray): Ground truth (correct) target values.
+            y_pred_proba (np.ndarray): Predicted probabilities.
+
+        Returns:
+            float: The ROC AUC score.
+        """
+        if len(np.unique(y_true)) < 2:
+            return 0.5
+
+        if y_pred_proba.shape[-1] == 2:
+            # Binary classification case
+            # Use probabilities for the positive class
+            # Otherwise it throws an error.
+            y_pred_proba = y_pred_proba[:, 1]
+
+        try:
+            return float(
+                roc_auc_score(
+                    y_true, y_pred_proba, average=self.average, multi_class="ovr"
+                )
+            )
+        except Exception:
+            return float(roc_auc_score(y_true, y_pred_proba, average=self.average))
+
+    # This method now correctly expects one-hot encoded true labels
+    def average_precision(
+        self, y_true_ohe: np.ndarray, y_pred_proba: np.ndarray
+    ) -> float:
+        """Compute the average precision score.
+
+        Args:
+            y_true_ohe (np.ndarray): One-hot encoded ground truth target values.
+            y_pred_proba (np.ndarray): Predicted probabilities.
+
+        Returns:
+            float: The average precision score.
+        """
+        if y_pred_proba.shape[-1] == 2:
+            # Binary classification case
+            # Use probabilities for the positive class
+            y_pred_proba = y_pred_proba[:, 1]
+
+        if y_true_ohe.shape[1] == 2:
+            # Binary classification case
+            y_true_ohe = y_true_ohe[:, 1]
+
+        return float(
+            average_precision_score(y_true_ohe, y_pred_proba, average=self.average)
+        )
+
+    def pr_macro(self, y_true_ohe: np.ndarray, y_pred_proba: np.ndarray) -> float:
+        """Compute the macro-average precision score.
+
+        Args:
+            y_true_ohe (np.ndarray): One-hot encoded ground truth target values.
+            y_pred_proba (np.ndarray): Predicted probabilities.
+
+        Returns:
+            float: The macro-average precision score.
+        """
+        if y_pred_proba.shape[-1] == 2:
+            # Binary classification case
+            # Use probabilities for the positive class
+            y_pred_proba = y_pred_proba[:, 1]
+
+        if y_true_ohe.shape[1] == 2:
+            # Binary classification case
+            y_true_ohe = y_true_ohe[:, 1]
+
+        return float(average_precision_score(y_true_ohe, y_pred_proba, average="macro"))
+
+    def evaluate(
+        self,
+        y_true: pd.DataFrame | np.ndarray | Tensor | list,
+        y_pred: pd.DataFrame | np.ndarray | Tensor | list,
+        y_true_ohe: pd.DataFrame | np.ndarray | Tensor | list,
+        y_pred_proba: pd.DataFrame | np.ndarray | Tensor | list,
+        objective_mode: bool = False,
+        tune_metric: Literal[
+            "pr_macro",
+            "roc_auc",
+            "average_precision",
+            "accuracy",
+            "f1",
+            "precision",
+            "recall",
+        ] = "pr_macro",
+    ) -> Dict[str, float]:
+        """Evaluate the model using various metrics.
+
+        Args:
+            y_true: Ground truth (correct) target values.
+            y_pred: Estimated target values.
+            y_true_ohe: One-hot encoded ground truth target values.
+            y_pred_proba: Predicted probabilities.
+            objective_mode: If True, only compute the metric specified by ``tune_metric``. Defaults to False.
+            tune_metric: The metric to optimize during tuning. Defaults to "pr_macro".
+        """
+        y_true, y_pred, y_true_ohe, y_pred_proba = [
+            validate_input_type(x) for x in (y_true, y_pred, y_true_ohe, y_pred_proba)
+        ]
+
+        if objective_mode:
+            metric_calculators = {
+                "pr_macro": lambda: self.pr_macro(
+                    np.asarray(y_true_ohe), np.asarray(y_pred_proba)
+                ),
+                "roc_auc": lambda: self.roc_auc(
+                    np.asarray(y_true), np.asarray(y_pred_proba)
+                ),
+                "average_precision": lambda: self.average_precision(
+                    np.asarray(y_true_ohe), np.asarray(y_pred_proba)
+                ),
+                "accuracy": lambda: self.accuracy(
+                    np.asarray(y_true), np.asarray(y_pred)
+                ),
+                "f1": lambda: self.f1(np.asarray(y_true), np.asarray(y_pred)),
+                "precision": lambda: self.precision(
+                    np.asarray(y_true), np.asarray(y_pred)
+                ),
+                "recall": lambda: self.recall(np.asarray(y_true), np.asarray(y_pred)),
+            }
+            if tune_metric not in metric_calculators:
+                msg = f"Invalid tune_metric provided: '{tune_metric}'."
+                self.logger.error(msg)
+                raise ValueError(msg)
+
+            metrics = {tune_metric: metric_calculators[tune_metric]()}
+        else:
+            metrics = {
+                "accuracy": self.accuracy(np.asarray(y_true), np.asarray(y_pred)),
+                "f1": self.f1(np.asarray(y_true), np.asarray(y_pred)),
+                "precision": self.precision(np.asarray(y_true), np.asarray(y_pred)),
+                "recall": self.recall(np.asarray(y_true), np.asarray(y_pred)),
+                "roc_auc": self.roc_auc(np.asarray(y_true), np.asarray(y_pred_proba)),
+                "average_precision": self.average_precision(
+                    np.asarray(y_true_ohe), np.asarray(y_pred_proba)
+                ),
+                "pr_macro": self.pr_macro(
+                    np.asarray(y_true_ohe), np.asarray(y_pred_proba)
+                ),
+            }
+        return {k: float(v) for k, v in metrics.items()}
```
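The hunk above adds the new `Scorer` metrics class. The snippet below is a minimal usage sketch and is not part of the published diff: the import path `pgsui.impute.unsupervised.nn_scorers` is assumed from the file list above, the toy labels and probabilities are hypothetical, and `snpio` plus `torch` must be installed for the module's own imports to resolve.

```python
# Minimal usage sketch for the Scorer class shown above (assumed import path).
import numpy as np

from pgsui.impute.unsupervised.nn_scorers import Scorer  # path assumed from the file list

# Hypothetical 3-class toy data: integer labels plus per-class probabilities.
y_true = np.array([0, 1, 2, 1, 0])
y_pred_proba = np.array(
    [
        [0.8, 0.1, 0.1],
        [0.2, 0.6, 0.2],
        [0.1, 0.2, 0.7],
        [0.3, 0.4, 0.3],
        [0.6, 0.3, 0.1],
    ]
)
y_pred = y_pred_proba.argmax(axis=1)  # hard labels from the probabilities
y_true_ohe = np.eye(3)[y_true]        # one-hot labels for the PR-based metrics

scorer = Scorer(prefix="example", average="macro")

# Full metric suite: accuracy, f1, precision, recall, roc_auc,
# average_precision, and pr_macro, each returned as a float.
metrics = scorer.evaluate(y_true, y_pred, y_true_ohe, y_pred_proba)

# With objective_mode=True, only the selected tune_metric is computed.
objective = scorer.evaluate(
    y_true,
    y_pred,
    y_true_ohe,
    y_pred_proba,
    objective_mode=True,
    tune_metric="pr_macro",
)
```

Restricting `objective_mode` runs to a single `tune_metric` appears intended to keep hyperparameter-tuning loops cheap, since only the selected metric calculator is invoked.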
pgsui/utils/__init__.py (CHANGED)

File without changes