PyPI - gsMap - Versions diffs - 1.71.2__py3-none-any.whl → 1.72.3__py3-none-any.whl - Mend

gsMap 1.71.2__py3-none-any.whl → 1.72.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (30) hide show

gsMap/GNN/adjacency_matrix.py +25 -27
gsMap/GNN/model.py +9 -7
gsMap/GNN/train.py +8 -11
gsMap/__init__.py +3 -3
gsMap/__main__.py +3 -2
gsMap/cauchy_combination_test.py +75 -72
gsMap/config.py +822 -316
gsMap/create_slice_mean.py +154 -0
gsMap/diagnosis.py +179 -101
gsMap/find_latent_representation.py +28 -26
gsMap/format_sumstats.py +233 -201
gsMap/generate_ldscore.py +353 -209
gsMap/latent_to_gene.py +92 -60
gsMap/main.py +23 -14
gsMap/report.py +39 -25
gsMap/run_all_mode.py +86 -46
gsMap/setup.py +1 -1
gsMap/spatial_ldsc_multiple_sumstats.py +154 -80
gsMap/utils/generate_r2_matrix.py +173 -140
gsMap/utils/jackknife.py +84 -80
gsMap/utils/manhattan_plot.py +180 -207
gsMap/utils/regression_read.py +105 -122
gsMap/visualize.py +82 -64
{gsmap-1.71.2.dist-info → gsmap-1.72.3.dist-info}/METADATA +21 -6
gsmap-1.72.3.dist-info/RECORD +31 -0
{gsmap-1.71.2.dist-info → gsmap-1.72.3.dist-info}/WHEEL +1 -1
gsMap/utils/make_annotations.py +0 -518
gsmap-1.71.2.dist-info/RECORD +0 -31
{gsmap-1.71.2.dist-info → gsmap-1.72.3.dist-info}/LICENSE +0 -0
{gsmap-1.71.2.dist-info → gsmap-1.72.3.dist-info}/entry_points.txt +0 -0

gsMap/find_latent_representation.py CHANGED Viewed

@@ -1,13 +1,15 @@
 import logging
 import random
 import numpy as np
 import scanpy as sc
 import torch
 from sklearn.decomposition import PCA
 from sklearn.preprocessing import LabelEncoder
+from gsMap.config import FindLatentRepresentationsConfig
 from gsMap.GNN.adjacency_matrix import construct_adjacency_matrix
 from gsMap.GNN.train import ModelTrainer
-from gsMap.config import FindLatentRepresentationsConfig
 logger = logging.getLogger(__name__)
@@ -20,41 +22,40 @@ def set_seed(seed_value):
     np.random.seed(seed_value)
     random.seed(seed_value)
     if torch.cuda.is_available():
-        logger.info('Using GPU for computations.')
+        logger.info("Using GPU for computations.")
         torch.cuda.manual_seed(seed_value)
         torch.cuda.manual_seed_all(seed_value)
     else:
-        logger.info('Using CPU for computations.')
+        logger.info("Using CPU for computations.")
 def preprocess_data(adata, params):
     """
     Preprocess the AnnData
     """
-    logger.info('Preprocessing data...')
+    logger.info("Preprocessing data...")
     adata.var_names_make_unique()
     if params.data_layer in adata.layers.keys():
-        logger.info(f'Using data layer: {params.data_layer}...')
+        logger.info(f"Using data layer: {params.data_layer}...")
         adata.X = adata.layers[params.data_layer]
-        sc.pp.filter_genes(adata, min_cells=30)
-    elif params.data_layer == 'X':
-        logger.info(f'Using data layer: {params.data_layer}...')
-        if adata.X.dtype == 'float32' or adata.X.dtype == 'float64':
-            logger.warning(f'The data layer should be raw count data')
-        sc.pp.filter_genes(adata, min_cells=30)
+    elif params.data_layer == "X":
+        logger.info(f"Using data layer: {params.data_layer}...")
+        if adata.X.dtype == "float32" or adata.X.dtype == "float64":
+            logger.warning("The data layer should be raw count data")
     else:
-        raise ValueError(f'Invalid data layer: {params.data_layer}, please check the input data.')
+        raise ValueError(f"Invalid data layer: {params.data_layer}, please check the input data.")
-    if params.data_layer in ['count', 'counts', 'X']:
+    if params.data_layer in ["count", "counts", "X"]:
         # HVGs based on count
-        logger.info('Dealing with count data...')
-        sc.pp.highly_variable_genes(adata,flavor="seurat_v3",n_top_genes=params.feat_cell)
+        logger.info("Dealing with count data...")
+        sc.pp.highly_variable_genes(adata, flavor="seurat_v3", n_top_genes=params.feat_cell)
         # Normalize the data
         sc.pp.normalize_total(adata, target_sum=1e4)
         sc.pp.log1p(adata)
     elif params.data_layer in adata.layers.keys():
-        sc.pp.highly_variable_genes(adata,flavor="seurat",n_top_genes=params.feat_cell)
+        sc.pp.highly_variable_genes(adata, flavor="seurat", n_top_genes=params.feat_cell)
     return adata
@@ -70,11 +71,12 @@ class LatentRepresentationFinder:
         self.graph_dict = construct_adjacency_matrix(adata, self.params)
     def compute_pca(self):
-        self.latent_pca = PCA(n_components=self.params.n_comps).fit_transform(self.expression_array)
+        self.latent_pca = PCA(n_components=self.params.n_comps).fit_transform(
+            self.expression_array
+        )
         return self.latent_pca
-    def run_gnn_vae(self, label, verbose='whole ST data'):
+    def run_gnn_vae(self, label, verbose="whole ST data"):
         # Use PCA if specified
         if self.params.input_pca:
             node_X = self.compute_pca()
@@ -86,7 +88,7 @@ class LatentRepresentationFinder:
         self.params.feat_cell = node_X.shape[1]
         # Run GNN
-        logger.info(f'Finding latent representations for {verbose}...')
+        logger.info(f"Finding latent representations for {verbose}...")
         gvae = ModelTrainer(node_X, self.graph_dict, self.params, label)
         gvae.run_train()
@@ -99,9 +101,9 @@ def run_find_latent_representation(args: FindLatentRepresentationsConfig):
     set_seed(2024)
     # Load the ST data
-    logger.info(f'Loading ST data of {args.sample_name}...')
+    logger.info(f"Loading ST data of {args.sample_name}...")
     adata = sc.read_h5ad(args.input_hdf5_path)
-    logger.info(f'The ST data contains {adata.shape[0]} cells, {adata.shape[1]} genes.')
+    logger.info(f"The ST data contains {adata.shape[0]} cells, {adata.shape[1]} genes.")
     # Load the cell type annotation
     if args.annotation is not None:
@@ -112,7 +114,7 @@ def run_find_latent_representation(args: FindLatentRepresentationsConfig):
         adata = adata[adata.obs[args.annotation].isin(valid_annotations)]
         le = LabelEncoder()
-        label =  le.fit_transform(adata.obs[args.annotation])
+        label = le.fit_transform(adata.obs[args.annotation])
     else:
         label = None
@@ -124,16 +126,16 @@ def run_find_latent_representation(args: FindLatentRepresentationsConfig):
     latent_pca = latent_rep.latent_pca
     # Add latent representations to the AnnData object
-    logger.info('Adding latent representations...')
+    logger.info("Adding latent representations...")
     adata.obsm["latent_GVAE"] = latent_gvae
     adata.obsm["latent_PCA"] = latent_pca
     # Run UMAP based on latent representations
-    #for name in ['latent_GVAE', 'latent_PCA']:
+    # for name in ['latent_GVAE', 'latent_PCA']:
     #    sc.pp.neighbors(adata, n_neighbors=10, use_rep=name)
     #    sc.tl.umap(adata)
     #    adata.obsm['X_umap_' + name] = adata.obsm['X_umap']
     # Save the AnnData object
-    logger.info('Saving ST data...')
+    logger.info("Saving ST data...")
     adata.write(args.hdf5_with_latent_path)

gsMap 1.71.2__py3-none-any.whl → 1.72.3__py3-none-any.whl

gsMap 1.71.2__py3-none-any.whl → 1.72.3__py3-none-any.whl