PyPI - pertpy - Versions diffs - 0.7.0__py3-none-any.whl → 0.8.0__py3-none-any.whl - Mend

pertpy 0.7.0__py3-none-any.whl → 0.8.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (56) hide show

pertpy/__init__.py +2 -1
pertpy/data/__init__.py +61 -0
pertpy/data/_dataloader.py +27 -23
pertpy/data/_datasets.py +58 -0
pertpy/metadata/__init__.py +2 -0
pertpy/metadata/_cell_line.py +39 -70
pertpy/metadata/_compound.py +3 -4
pertpy/metadata/_drug.py +2 -6
pertpy/metadata/_look_up.py +38 -51
pertpy/metadata/_metadata.py +7 -10
pertpy/metadata/_moa.py +2 -6
pertpy/plot/__init__.py +0 -5
pertpy/preprocessing/__init__.py +2 -0
pertpy/preprocessing/_guide_rna.py +2 -3
pertpy/tools/__init__.py +42 -4
pertpy/tools/_augur.py +14 -15
pertpy/tools/_cinemaot.py +2 -2
pertpy/tools/_coda/_base_coda.py +118 -142
pertpy/tools/_coda/_sccoda.py +16 -15
pertpy/tools/_coda/_tasccoda.py +21 -22
pertpy/tools/_dialogue.py +18 -23
pertpy/tools/_differential_gene_expression/__init__.py +20 -0
pertpy/tools/_differential_gene_expression/_base.py +657 -0
pertpy/tools/_differential_gene_expression/_checks.py +41 -0
pertpy/tools/_differential_gene_expression/_dge_comparison.py +86 -0
pertpy/tools/_differential_gene_expression/_edger.py +125 -0
pertpy/tools/_differential_gene_expression/_formulaic.py +189 -0
pertpy/tools/_differential_gene_expression/_pydeseq2.py +95 -0
pertpy/tools/_differential_gene_expression/_simple_tests.py +162 -0
pertpy/tools/_differential_gene_expression/_statsmodels.py +72 -0
pertpy/tools/_distances/_distance_tests.py +21 -16
pertpy/tools/_distances/_distances.py +406 -70
pertpy/tools/_enrichment.py +10 -15
pertpy/tools/_kernel_pca.py +1 -1
pertpy/tools/_milo.py +76 -53
pertpy/tools/_mixscape.py +15 -11
pertpy/tools/_perturbation_space/_clustering.py +5 -2
pertpy/tools/_perturbation_space/_comparison.py +112 -0
pertpy/tools/_perturbation_space/_discriminator_classifiers.py +20 -22
pertpy/tools/_perturbation_space/_perturbation_space.py +23 -21
pertpy/tools/_perturbation_space/_simple.py +3 -3
pertpy/tools/_scgen/__init__.py +1 -1
pertpy/tools/_scgen/_base_components.py +2 -3
pertpy/tools/_scgen/_scgen.py +33 -28
pertpy/tools/_scgen/_utils.py +2 -2
{pertpy-0.7.0.dist-info → pertpy-0.8.0.dist-info}/METADATA +22 -13
pertpy-0.8.0.dist-info/RECORD +57 -0
{pertpy-0.7.0.dist-info → pertpy-0.8.0.dist-info}/WHEEL +1 -1
pertpy/plot/_augur.py +0 -171
pertpy/plot/_coda.py +0 -601
pertpy/plot/_guide_rna.py +0 -64
pertpy/plot/_milopy.py +0 -209
pertpy/plot/_mixscape.py +0 -355
pertpy/tools/_differential_gene_expression.py +0 -325
pertpy-0.7.0.dist-info/RECORD +0 -53
{pertpy-0.7.0.dist-info → pertpy-0.8.0.dist-info}/licenses/LICENSE +0 -0

pertpy/tools/_differential_gene_expression/_statsmodels.py ADDED Viewed

@@ -0,0 +1,72 @@
+import numpy as np
+import pandas as pd
+import scanpy as sc
+import statsmodels
+import statsmodels.api as sm
+from tqdm.auto import tqdm
+from ._base import LinearModelBase
+from ._checks import check_is_integer_matrix
+class Statsmodels(LinearModelBase):
+    """Differential expression test using a statsmodels linear regression.
+    One regression model is fitted per entry of ``adata.var_names`` (see :meth:`fit`);
+    contrasts are then evaluated with a t-test on every fitted model.
+    """
+    def _check_counts(self):
+        """Validate ``self.data`` by delegating to ``check_is_integer_matrix``."""
+        # NOTE(review): an integer-matrix check may be too strict for OLS on
+        # normalized/log-transformed data -- confirm against LinearModelBase's contract.
+        check_is_integer_matrix(self.data)
+    def fit(
+        self,
+        regression_model: type[sm.OLS] | type[sm.GLM] = sm.OLS,
+        **kwargs,
+    ) -> None:
+        """Fit the specified regression model, once per variable.
+        The fitted results are stored in ``self.models``, in the order of ``adata.var_names``.
+        Args:
+            regression_model: A statsmodels regression model class, either OLS or GLM.
+            **kwargs: Additional arguments forwarded to the constructor of ``regression_model``
+                (not to its ``fit`` method). In particular, this is where you can specify
+                the family for GLM.
+        Examples:
+            >>> import numpy as np
+            >>> import statsmodels.api as sm
+            >>> import pertpy as pt
+            >>> model = pt.tl.Statsmodels(adata, design="~condition")
+            >>> model.fit(sm.GLM, family=sm.families.NegativeBinomial(link=sm.families.links.Log()))
+            >>> results = model.test_contrasts(np.array([0, 1]))
+        """
+        self.models = []
+        for var in tqdm(self.adata.var_names):
+            # Endogenous variable: the values of a single variable read from the configured layer.
+            # Exogenous variables: self.design (presumably the design matrix built by the base class).
+            mod = regression_model(
+                sc.get.obs_df(self.adata, keys=[var], layer=self.layer)[var],
+                self.design,
+                **kwargs,
+            )
+            mod = mod.fit()
+            self.models.append(mod)
+    def _test_single_contrast(self, contrast, **kwargs) -> pd.DataFrame:
+        """Run a t-test for ``contrast`` on every fitted model.
+        Args:
+            contrast: Contrast passed unchanged to the ``t_test`` method of each fitted model.
+            **kwargs: Accepted for interface compatibility; not used by this implementation.
+        Returns:
+            A data frame with the columns ``variable``, ``p_value``, ``t_value``, ``sd``,
+            ``log_fc`` and ``adj_p_value``, sorted by ascending ``p_value``.
+            ``adj_p_value`` is the FDR-corrected p-value computed across all variables;
+            variables whose p-value is NaN keep a NaN adjusted p-value.
+        """
+        res = []
+        for var, mod in zip(tqdm(self.adata.var_names), self.models, strict=False):
+            t_test = mod.t_test(contrast)
+            res.append(
+                {
+                    "variable": var,
+                    # Store a plain scalar, consistent with the other statistics below.
+                    "p_value": np.asarray(t_test.pvalue).item(),
+                    "t_value": t_test.tvalue.item(),
+                    "sd": t_test.sd.item(),
+                    "log_fc": t_test.effect.item(),
+                }
+            )
+        # Explicit columns keep the frame well-formed (and sortable) even when there are no variables.
+        res_df = pd.DataFrame(res, columns=["variable", "p_value", "t_value", "sd", "log_fc"])
+        # Multiple-testing correction must see all p-values at once: correcting a
+        # single p-value on its own returns that p-value unchanged.
+        p_values = res_df["p_value"].to_numpy(dtype=float)
+        adj_p_values = np.full(p_values.shape, np.nan)
+        # Exclude NaN p-values so that one undefined test cannot turn every adjusted value into NaN.
+        valid = ~np.isnan(p_values)
+        if valid.any():
+            adj_p_values[valid] = statsmodels.stats.multitest.fdrcorrection(p_values[valid])[1]
+        res_df["adj_p_value"] = adj_p_values
+        return res_df.sort_values("p_value")
+    def contrast(self, column: str, baseline: str, group_to_compare: str) -> np.ndarray:
+        """Build a simple contrast for pairwise comparisons.
+        This is equivalent to
+        ```
+        model.cond(<column> = baseline) - model.cond(<column> = group_to_compare)
+        ```
+        Args:
+            column: Name of the design variable the two groups belong to.
+            baseline: Category used as the first term (minuend) of the contrast.
+            group_to_compare: Category subtracted from the baseline term.
+        Returns:
+            The contrast ``cond(baseline) - cond(group_to_compare)``.
+        """
+        # NOTE(review): the result is baseline minus group_to_compare; confirm this is the
+        # intended direction for the sign of the reported log fold change.
+        return self.cond(**{column: baseline}) - self.cond(**{column: group_to_compare})

pertpy/tools/_distances/_distance_tests.py CHANGED Viewed

@@ -23,20 +23,20 @@ class DistanceTest:
     Args:
         metric: Distance metric to use between groups of cells.
-        n_perms: Number of permutations to run. Defaults to 1000.
+        n_perms: Number of permutations to run.
         layer_key: Name of the counts layer containing raw counts to calculate distances for.
                    Mutually exclusive with 'obsm_key'.
-                   Defaults to None and is then not used.
+                   If equal to `None` the parameter is ignored.
         obsm_key: Name of embedding in adata.obsm to use.
                   Mutually exclusive with 'counts_layer_key'.
                   Defaults to None, but is set to "X_pca" if not set explicitly internally.
-        alpha: Significance level. Defaults to 0.05.
-        correction: Multiple testing correction method. Defaults to 'holm-sidak'.
-        cell_wise_metric: Metric to use between single cells. Defaults to "euclidean".
+        alpha: Significance level.
+        correction: Multiple testing correction method.
+        cell_wise_metric: Metric to use between single cells.
     Examples:
         >>> import pertpy as pt
-        >>> adata = pt.dt.distance_example_data()
+        >>> adata = pt.dt.distance_example()
         >>> distance_test = pt.tl.DistanceTest("edistance", n_perms=1000)
         >>> tab = distance_test(adata, groupby="perturbation", contrast="control")
     """
@@ -66,11 +66,14 @@ class DistanceTest:
         self.alpha = alpha
         self.correction = correction
         self.cell_wise_metric = (
-            cell_wise_metric if cell_wise_metric else Distance(self.metric, self.obsm_key).cell_wise_metric
+            cell_wise_metric if cell_wise_metric else Distance(self.metric, obsm_key=self.obsm_key).cell_wise_metric
         )
         self.distance = Distance(
-            self.metric, layer_key=self.layer_key, obsm_key=self.obsm_key, cell_wise_metric=self.cell_wise_metric
+            self.metric,
+            layer_key=self.layer_key,
+            obsm_key=self.obsm_key,
+            cell_wise_metric=self.cell_wise_metric,
         )
     def __call__(
@@ -87,7 +90,7 @@ class DistanceTest:
             adata: Annotated data matrix.
             groupby: Key in adata.obs for grouping cells.
             contrast: Name of the contrast group.
-            show_progressbar: Whether to print progress. Defaults to True.
+            show_progressbar: Whether to print progress.
         Returns:
             pandas.DataFrame: Results of the permutation test, with columns:
@@ -99,7 +102,7 @@ class DistanceTest:
         Examples:
             >>> import pertpy as pt
-            >>> adata = pt.dt.distance_example_data()
+            >>> adata = pt.dt.distance_example()
             >>> distance_test = pt.tl.DistanceTest("edistance", n_perms=1000)
             >>> tab = distance_test(adata, groupby="perturbation", contrast="control")
         """
@@ -121,7 +124,7 @@ class DistanceTest:
             adata: Annotated data matrix.
             groupby: Key in adata.obs for grouping cells.
             contrast: Name of the contrast group.
-            show_progressbar: Whether to print progress. Defaults to True.
+            show_progressbar: Whether to print progress.
         Returns:
             pandas.DataFrame: Results of the permutation test, with columns:
@@ -133,7 +136,7 @@ class DistanceTest:
         Examples:
             >>> import pertpy as pt
-            >>> adata = pt.dt.distance_example_data()
+            >>> adata = pt.dt.distance_example()
             >>> distance_test = pt.tl.DistanceTest("edistance", n_perms=1000)
             >>> test_results = distance_test.test_xy(adata, groupby="perturbation", contrast="control")
         """
@@ -176,7 +179,8 @@ class DistanceTest:
         # Evaluate the test
         # count times shuffling resulted in larger distance
         comparison_results = np.array(
-            pd.concat([r["distance"] - df["distance"] for r in results], axis=1) > 0, dtype=int
+            pd.concat([r["distance"] - df["distance"] for r in results], axis=1) > 0,
+            dtype=int,
         )
         n_failures = pd.Series(np.clip(np.sum(comparison_results, axis=1), 1, np.inf), index=df.index)
         pvalues = n_failures / self.n_perms
@@ -213,7 +217,7 @@ class DistanceTest:
             groupby: Key in adata.obs for grouping cells.
             contrast: Name of the contrast group.
             cell_wise_metric: Metric to use for pairwise distances.
-            verbose: Whether to print progress. Defaults to True.
+            verbose: Whether to print progress.
         Returns:
             pandas.DataFrame: Results of the permutation test, with columns:
@@ -225,7 +229,7 @@ class DistanceTest:
         Examples:
             >>> import pertpy as pt
-            >>> adata = pt.dt.distance_example_data()
+            >>> adata = pt.dt.distance_example()
             >>> distance_test = pt.tl.DistanceTest("edistance", n_perms=1000)
             >>> test_results = distance_test.test_precomputed(adata, groupby="perturbation", contrast="control")
         """
@@ -284,7 +288,8 @@ class DistanceTest:
         # Evaluate the test
         # count times shuffling resulted in larger distance
         comparison_results = np.array(
-            pd.concat([r["distance"] - df["distance"] for r in results], axis=1) > 0, dtype=int
+            pd.concat([r["distance"] - df["distance"] for r in results], axis=1) > 0,
+            dtype=int,
         )
         n_failures = pd.Series(np.clip(np.sum(comparison_results, axis=1), 1, np.inf), index=df.index)
         pvalues = n_failures / self.n_perms

pertpy 0.7.0__py3-none-any.whl → 0.8.0__py3-none-any.whl

pertpy 0.7.0__py3-none-any.whl → 0.8.0__py3-none-any.whl