PyPI - biopipen - Versions diffs - 0.27.6__py3-none-any.whl → 0.27.8__py3-none-any.whl - Mend

biopipen 0.27.6__py3-none-any.whl → 0.27.8__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biopipen might be problematic. Click here for more details.

Files changed (19) hide show

biopipen/__init__.py CHANGED Viewed

	@@ -1 +1 @@
1	- __version__ = "0.27.6"
1	+ __version__ = "0.27.8"

biopipen/core/filters.py CHANGED Viewed

@@ -235,8 +235,8 @@ def _render_fgsea(
     with Path(cont["dir"]).joinpath("fgsea.txt").open() as f:
         next(f)  # skip header
         for line in f:
-            pathway, _ = line.split("\t", 1)
-            pathways.append(pathway)
+            items = line.strip().split("\t")
+            pathways.append((items[0], items[-1]))
             if len(pathways) >= n_pathways:
                 break
@@ -263,6 +263,7 @@ def _render_fgsea(
                         {
                             "kind": "table",
                             "src": str(Path(cont["dir"]).joinpath("fgsea.txt")),
+                            "data": {"excluded": {"slug"}},
                         }
                     ],
                 },
@@ -274,10 +275,10 @@ def _render_fgsea(
             "ui": "table_of_images",
             "contents": [
                 {
-                    "src": str(Path(cont["dir"]) / f"fgsea_{pw.replace('/', '-')}.png"),
+                    "src": str(Path(cont["dir"]) / f"fgsea_{slug}.png"),
                     "title": pw,
                 }
-                for pw in pathways
+                for pw, slug in pathways
             ]
         },
     ]

biopipen/ns/scrna.py CHANGED Viewed

@@ -1241,7 +1241,7 @@ class TopExpressingGenes(Proc):
     }
-class ExprImpution(Proc):
+class ExprImputation(Proc):
     """This process imputes the dropout values in scRNA-seq data.
     It takes the Seurat object as input and outputs the Seurat object with
@@ -1317,13 +1317,13 @@ class ExprImpution(Proc):
         },
         "alra_args": {},
     }
-    script = "file://../scripts/scrna/ExprImpution.R"
+    script = "file://../scripts/scrna/ExprImputation.R"
 class SCImpute(Proc):
     """Impute the dropout values in scRNA-seq data.
-    Deprecated. Use `ExprImpution` instead.
+    Deprecated. Use `ExprImputation` instead.
     Input:
         infile: The input file for imputation
@@ -1769,13 +1769,18 @@ class SeuratMap2Ref(Proc):
         sobjfile: The seurat object
     Output:
-        outfile: The rds file of seurat object with cell type annotated
+        outfile: The rds file of seurat object with cell type annotated.
+            Note that the reduction name will be `ref.umap` for the mapping.
+            To visualize the mapping, you should use `ref.umap` as the reduction name.
     Envs:
         ncores (type=int;order=-100): Number of cores to use.
-            Used in `future::plan(strategy = "multicore", workers = <ncores>)`
+            When `split_by` is used, this will be the number of cores for each object to map to the reference.
+            When `split_by` is not used, this is used in `future::plan(strategy = "multicore", workers = <ncores>)`
             to parallelize some Seurat procedures.
-            See also: <https://satijalab.org/seurat/articles/future_vignette.html>
+            See also: <https://satijalab.org/seurat/archive/v3.0/future_vignette.html>
+        mutaters (type=json): The mutaters to mutate the metadata.
+            This is helpful when we want to create new columns for `split_by`.
         use: A column name of metadata from the reference
             (e.g. `celltype.l1`, `celltype.l2`) to transfer to the query as the
             cell types (ident) for downstream analysis. This field is required.
@@ -1787,16 +1792,29 @@ class SeuratMap2Ref(Proc):
             `Seurat::LoadH5Seurat()`.
             The file type is determined by the extension. `.rds` or `.RDS` for
             RDS file, `.h5seurat` or `.h5` for h5seurat file.
+        refnorm (choice): Normalization method the reference used. The same method will be used for the query.
+            - NormalizeData: Using [`NormalizeData`](https://satijalab.org/seurat/reference/normalizedata).
+            - SCTransform: Using [`SCTransform`](https://satijalab.org/seurat/reference/sctransform).
+            - auto: Automatically detect the normalization method.
+                If the default assay of reference is `SCT`, then `SCTransform` will be used.
+        split_by: The column name in metadata to split the query into multiple objects.
+            This helps when the original query is too large to process.
         SCTransform (ns): Arguments for [`SCTransform()`](https://satijalab.org/seurat/reference/sctransform)
             - do-correct-umi (flag): Place corrected UMI matrix in assay counts layer?
             - do-scale (flag): Whether to scale residuals to have unit variance?
             - do-center (flag): Whether to center residuals to have mean zero?
             - <more>: See <https://satijalab.org/seurat/reference/sctransform>.
                 Note that the hyphen (`-`) will be transformed into `.` for the keys.
+        NormalizeData (ns): Arguments for [`NormalizeData()`](https://satijalab.org/seurat/reference/normalizedata)
+            - normalization-method: Normalization method.
+            - <more>: See <https://satijalab.org/seurat/reference/normalizedata>.
+                Note that the hyphen (`-`) will be transformed into `.` for the keys.
         FindTransferAnchors (ns): Arguments for [`FindTransferAnchors()`](https://satijalab.org/seurat/reference/findtransferanchors)
             - normalization-method (choice): Name of normalization method used.
                 - LogNormalize: Log-normalize the data matrix
                 - SCT: Scale data using the SCTransform method
+                - auto: Automatically detect the normalization method.
+                    See `envs.refnorm`.
             - reference-reduction: Name of dimensional reduction to use from the reference if running the pcaproject workflow.
                 Optionally enables reuse of precomputed reference dimensional reduction.
             - <more>: See <https://satijalab.org/seurat/reference/findtransferanchors>.
@@ -1822,14 +1840,19 @@ class SeuratMap2Ref(Proc):
         "ncores": config.misc.ncores,
         "use": None,
         "ident": "seurat_clusters",
+        "mutaters": {},
         "ref": None,
+        "refnorm": "auto",
+        "split_by": None,
         "SCTransform": {
             "do-correct-umi": False,
             "do-scale": False,
             "do-center": True,
         },
+        "NormalizeData": {
+            "normalization-method": "LogNormalize",
+        },
         "FindTransferAnchors": {
-            "normalization-method": "SCT",
             "reference-reduction": "spca",
         },
         "MapQuery": {

biopipen/ns/scrna_metabolic_landscape.py CHANGED Viewed

@@ -566,8 +566,8 @@ class ScrnaMetabolicLandscape(ProcGroup):
             input_data = lambda ch: tibble(
                 srtobj=ch.iloc[:, 0],
                 metafile=[None],
-                mutaters=[self.opts.mutaters],
             )
+            envs = {"mutaters": self.opts.mutaters}
         return MetabolicSeuratMetadataMutater
@@ -577,10 +577,10 @@ class ScrnaMetabolicLandscape(ProcGroup):
         if self.opts.noimpute:
             return self.p_mutater
-        from .scrna import ExprImpution
+        from .scrna import ExprImputation
         @annotate.format_doc(indent=3)
-        class MetabolicExprImpution(ExprImpution):
+        class MetabolicExprImputation(ExprImputation):
             """{{Summary}}
             You can turn off the imputation by setting the `noimpute` option
@@ -588,7 +588,7 @@ class ScrnaMetabolicLandscape(ProcGroup):
             """
             requires = self.p_mutater
-        return MetabolicExprImpution
+        return MetabolicExprImputation
     @ProcGroup.add_proc
     def p_pathway_activity(self) -> Type[Proc]:

biopipen/scripts/scrna/ExprImputation.R ADDED Viewed

@@ -0,0 +1,7 @@
+{% if envs.tool == "rmagic" %}
+{% include biopipen_dir + "/scripts/scrna/ExprImputation-rmagic.R" %}
+{% elif envs.tool == "scimpute" %}
+{% include biopipen_dir + "/scripts/scrna/ExprImputation-scimpute.R" %}
+{% elif envs.tool == "alra" %}
+{% include biopipen_dir + "/scripts/scrna/ExprImputation-alra.R" %}
+{% endif %}

biopipen/scripts/scrna/SeuratClusterStats-stats.R CHANGED Viewed

@@ -38,7 +38,7 @@ do_one_stats = function(name) {
         df_cells = df_cells %>% filter(!!rlang::parse_expr(case$subset))
     }
-    select_cols = c(case$ident, case$group.by, case$split.by)
+    select_cols = unique(c(case$ident, case$group.by, case$split.by))
     if (!is.null(case$split.by)) {
         plot_df = do_call(rbind, lapply(group_split(
             df_cells %>% select(all_of(select_cols)),

biopipen/scripts/scrna/SeuratMap2Ref.R CHANGED Viewed

@@ -1,5 +1,6 @@
 source("{{biopipen_dir}}/utils/misc.R")
+library(parallel)
 library(Seurat)
 library(SeuratDisk)
 library(rlang)
@@ -12,8 +13,12 @@ outfile = {{out.outfile | r}}
 use = {{envs.use | r}}
 ident = {{envs.ident | r}}
 ref = {{envs.ref | r}}
+refnorm = {{envs.refnorm | r}}
 ncores = {{envs.ncores | r}}
+split_by = {{envs.split_by | r}}
+mutaters = {{envs.mutaters | r}}
 sctransform_args = {{envs.SCTransform | r: todot="-"}}
+normalizedata_args = {{envs.NormalizeData | r: todot="-"}}
 findtransferanchors_args = {{envs.FindTransferAnchors | r: todot="-"}}
 mappingscore_args = {{envs.MappingScore | r: todot="-"}}
 mapquery_args = {{envs.MapQuery | r: todot="-"}}
@@ -34,8 +39,10 @@ if (is.null(mapquery_args$refdata) || length(mapquery_args$refdata) == 0) {
 mapquery_args$refdata[[use]] = use
 outdir = dirname(outfile)
-options(future.globals.maxSize = 80000 * 1024^2)
-plan(strategy = "multicore", workers = ncores)
+if (is.null(split_by)) {
+    options(future.globals.maxSize = 80000 * 1024^2)
+    future::plan(strategy = "multicore", workers = ncores)
+}
 .expand_dims = function(args, name = "dims") {
     # Expand dims from 30 to 1:30
@@ -56,52 +63,191 @@ if (endsWith(ref, ".rds") || endsWith(ref, ".RDS")) {
     reference = LoadH5Seurat(ref)
 }
+if (refnorm == "auto" && DefaultAssay(reference) == "SCT") {
+    refnorm = "SCTransform"
+}
+log_info("  Normalization method used: {refnorm}")
+if (refnorm == "SCTransform") {
+    findtransferanchors_args$normalization.method = "SCT"
+} else if (refnorm == "NormalizeData") {
+    findtransferanchors_args$normalization.method = "LogNormalize"
+} else {
+    stop("Unknown normalization method: {refnorm}")
+}
 # Load Seurat object
 log_info("- Loading Seurat object")
 sobj = readRDS(sobjfile)
+if (!is.null(mutaters) && length(mutaters) > 0) {
+    log_info("- Applying mutaters")
+    sobj@meta.data <- sobj@meta.data %>% mutate(!!!lapply(mutaters, parse_expr))
+}
+if (!is.null(split_by)) {
+    # check if each split has more than 100 cells
+    cellno = table(sobj@meta.data[[split_by]])
+    cellno = cellno[cellno < 100]
+    if (length(cellno) > 0) {
+        # stop and print the splits with # cells
+        stop(paste0(
+            "The following splits have less than 100 cells: \n",
+            paste0("- ", names(cellno), ": ", cellno, collapse = "\n"),
+            "\n\n",
+            "You can use `envs.mutaters` to merge these splits and use `newsplit` as `envs.split_by`: \n",
+            "> mutaters = {\n",
+            ">   newsplit = \"if_else(oldsplit %in% c('split1', 'split2'), 'mergedsplit', oldsplit)\"\n",
+            "> }\n"
+        ))
+    }
+    sobj = SplitObject(sobj, split.by = split_by)
+}
 # Normalize data
 log_info("- Normalizing data")
-sctransform_args$object = sobj
-sctransform_args$residual.features = rownames(x = reference)
-query = do_call(SCTransform, sctransform_args)
+if (refnorm == "SCTransform") {
+    log_info("  Using SCTransform normalization")
+    sctransform_args$residual.features = rownames(x = reference)
+    if (is.null(split_by)) {
+        sctransform_args$object = sobj
+        query = do_call(SCTransform, sctransform_args)
+    } else {
+        query = mclapply(
+            X = sobj,
+            FUN = function(x) {
+                sctransform_args$object = x
+                do_call(SCTransform, sctransform_args)
+            },
+            mc.cores = ncores
+        )
+        if (any(unlist(lapply(query, class)) == "try-error")) {
+            stop(paste0("\nmclapply (SCTransform) error:", query))
+        }
+    }
+} else {
+    log_info("  Using NormalizeData normalization")
+    if (is.null(split_by)) {
+        normalizedata_args$object = sobj
+        query = do_call(NormalizeData, normalizedata_args)
+    } else {
+        query = mclapply(
+            X = sobj,
+            FUN = function(x) {
+                normalizedata_args$object = x
+                do_call(NormalizeData, normalizedata_args)
+            },
+            mc.cores = ncores
+        )
+        if (any(unlist(lapply(query, class)) == "try-error")) {
+            stop(paste0("\nmclapply (NormalizeData) error:", query))
+        }
+    }
+}
 # Find anchors between query and reference
 log_info("- Finding anchors")
 findtransferanchors_args$reference = reference
-findtransferanchors_args$query = query
-anchors = do_call(FindTransferAnchors, findtransferanchors_args)
+if (is.null(split_by)) {
+    findtransferanchors_args$query = query
+    anchors = do_call(FindTransferAnchors, findtransferanchors_args)
+} else {
+    anchors = mclapply(
+        X = query,
+        FUN = function(x) {
+            findtransferanchors_args$query = x
+            do_call(FindTransferAnchors, findtransferanchors_args)
+        },
+        mc.cores = ncores
+    )
+    if (any(unlist(lapply(anchors, class)) == "try-error")) {
+        stop(paste0("\nmclapply (FindTransferAnchors) error:", anchors))
+    }
+}
 # Map query to reference
 log_info("- Mapping query to reference")
 mapquery_args$reference = reference
-mapquery_args$query = query
-mapquery_args$anchorset = anchors
-query = do_call(MapQuery, mapquery_args)
+if (is.null(split_by)) {
+    mapquery_args$query = query
+    mapquery_args$anchorset = anchors
+    query = do_call(MapQuery, mapquery_args)
+} else {
+    query = mclapply(
+        X = seq_along(query),
+        FUN = function(i) {
+            mapquery_args$query = query[[i]]
+            mapquery_args$anchorset = anchors[[i]]
+            do_call(MapQuery, mapquery_args)
+        },
+        mc.cores = ncores
+    )
+    if (any(unlist(lapply(query, class)) == "try-error")) {
+        stop(paste0("\nmclapply (MapQuery) error:", query))
+    }
+}
 # Calculating mapping score
 log_info("- Calculating mapping score")
-mappingscore_args$anchors = anchors
-mappingscore = tryCatch({
-    do_call(MappingScore, mappingscore_args)
-}, error = function(e) {
-    if (e$message == "subscript out of bounds") {
-        stop(paste0(
-            "While calculating mapping score, the following error was encountered: \n",
-            "subscript out of bounds.  \n\n",
-            "You may want to try a smaller `ndim` (default: 50) in `envs.MappingScore`."
-        ))
+mappingscore_sob_msg = paste0(
+    "While calculating mapping score, the following error was encountered: \n",
+    "subscript out of bounds.  \n\n",
+    "You may want to try a smaller `ndim` (default: 50) in `envs.MappingScore`."
+)
+if (is.null(split_by)) {
+    mappingscore_args$anchors = anchors
+    mappingscore = tryCatch({
+        do_call(MappingScore, mappingscore_args)
+    }, error = function(e) {
+        if (e$message == "subscript out of bounds") stop(mappingscore_sob_msg)
+        stop(e)
+    })
+} else {
+    mappingscore = mclapply(
+        X = seq_along(query),
+        FUN = function(i) {
+            mappingscore_args$anchors = anchors[[i]]
+            tryCatch({
+                do_call(MappingScore, mappingscore_args)
+            }, error = function(e) {
+                if (e$message == "subscript out of bounds") stop(mappingscore_sob_msg)
+                stop(e)
+            })
+        },
+        mc.cores = ncores
+    )
+    if (any(unlist(lapply(mappingscore, class)) == "try-error")) {
+        stop(paste0("\nmclapply (MappingScore) error:", mappingscore))
     }
-    stop(e)
-})
+}
 # Calculate mapping score and add to metadata
-log_info("- Calculating mapping score")
-query = AddMetaData(
-  object = query,
-  metadata = mappingscore,
-  col.name = "mapping.score"
-)
+log_info("- Adding mapping score to metadata")
+if (is.null(split_by)) {
+    query = AddMetaData(
+        object = query,
+        metadata = mappingscore,
+        col.name = "mapping.score"
+    )
+} else {
+    query = mclapply(
+        X = seq_along(query),
+        FUN = function(i) {
+            AddMetaData(
+                object = query[[i]],
+                metadata = mappingscore[[i]],
+                col.name = "mapping.score"
+            )
+        },
+        mc.cores = ncores
+    )
+    if (any(unlist(lapply(query, class)) == "try-error")) {
+        stop(paste0("\nmclapply (AddMetaData) error:", query))
+    }
+    # Combine the results
+    log_info("- Merging the results")
+    query = merge(query[[1]], query[2:length(query)], merge.dr = "ref.umap")
+}
 # Add the alias to the metadata for the clusters
 log_info("- Adding ident to metadata and set as ident")

biopipen/scripts/scrna_metabolic_landscape/MetabolicFeatures.R CHANGED Viewed

@@ -50,8 +50,18 @@ do_one_group <- function(obj, features, group, outputdir, h1) {
     classes[classes != group] <- "_REST"
     classes[classes == group] <- groupname
     if (any(table(classes) < 5)) {
-        msg <- paste("Group", group, "has less than 5 cells, or only 5 cells left.")
+        msg <- paste("  Skipped. One of the groups has less than 5 cells.")
         log_warn(msg)
+        # write a warning.txt to odir with the message and table(classes)
+        write(paste0(msg, "\n\n"), file = file.path(odir, "warning.txt"))
+        write.table(
+            table(classes),
+            file = file.path(odir, "warning.txt"),
+            sep = "\t",
+            quote = FALSE,
+            row.names = FALSE,
+            append = TRUE
+        )
         return(
             list(
                 list(kind = "error", content = msg),

biopipen/scripts/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.R CHANGED Viewed

@@ -84,14 +84,18 @@ do_one_comparison <- function(
     odir = file.path(groupdir, paste0(subset_prefix, compname))
     dir.create(odir, showWarnings = FALSE)
-    if (ncol(exprs_case) < 3 || ncol(exprs_control) < 3) {
-        log_warn("          Skip (not enough cells)")
-        add_report(
+    if (ncol(exprs_case) < 5 || ncol(exprs_control) < 5) {
+        log_warn("  Skipped (not enough cells).")
+        wfile <- file.path(odir, "warning.txt")
+        write("Skipped (not enough cells)\n\n", file = wfile)
+        write(paste0("n_cells (Case):", ncol(exprs_case)), file = wfile, append = TRUE)
+        write(paste0("n_cells (Control):", ncol(exprs_control)), file = wfile, append = TRUE)
+        return(list(
             list(kind = "error", content = "Not enough cells"),
             h1 = groupname,
             h2 = compname
-        )
-        return (NULL)
+        ))
     }
     if (fgsea) {
         ranks = prerank(

biopipen/utils/gsea.R CHANGED Viewed

@@ -2,11 +2,36 @@ library(ggplot2)
 library(dplyr)
 library(tibble)
-.slugify <- function(x, non_alphanum_replace="-", collapse_replace=TRUE, tolower=FALSE) {
-    x <- gsub("[^[:alnum:]_]", non_alphanum_replace, x)
-    if(collapse_replace) x <- gsub(paste0(non_alphanum_replace, "+"), non_alphanum_replace, x)
-    if(tolower) x <- tolower(x)
-    x
+if (!exists("slugify")) {
+    slugify <- function(x, non_alphanum_replace="-", collapse_replace=TRUE, tolower=FALSE) {
+        subs <- list(
+            "š"="s", "œ"="oe", "ž"="z", "ß"="ss", "þ"="y", "à"="a", "á"="a", "â"="a",
+            "ã"="a", "ä"="a", "å"="a", "æ"="ae", "ç"="c", "è"="e", "é"="e", "ê"="e",
+            "ë"="e", "ì"="i", "í"="i", "î"="i", "ï"="i", "ð"="d", "ñ"="n", "ò"="o",
+            "ó"="o", "ô"="o", "õ"="o", "ö"="o", "ø"="oe", "ù"="u", "ú"="u", "û"="u",
+            "ü"="u", "ý"="y", "ÿ"="y", "ğ"="g", "ı"="i", "ĳ"="ij", "ľ"="l", "ň"="n",
+            "ř"="r", "ş"="s", "ť"="t", "ų"="u", "ů"="u", "ý"="y", "ź"="z", "ż"="z",
+            "ſ"="s", "α"="a", "β"="b", "γ"="g", "δ"="d", "ε"="e", "ζ"="z", "η"="h",
+            "θ"="th", "ι"="i", "κ"="k", "λ"="l", "μ"="m", "ν"="n", "ξ"="x", "ο"="o",
+            "π"="p", "ρ"="r", "σ"="s", "τ"="t", "υ"="u", "φ"="ph", "χ"="ch", "ψ"="ps",
+            "ω"="o", "ά"="a", "έ"="e", "ή"="h", "ί"="i", "ό"="o", "ύ"="u", "ώ"="o",
+            "ϐ"="b", "ϑ"="th", "ϒ"="y", "ϕ"="ph", "ϖ"="p", "Ϛ"="st", "ϛ"="st", "Ϝ"="f",
+            "ϝ"="f", "Ϟ"="k", "ϟ"="k", "Ϡ"="k", "ϡ"="k", "ϰ"="k", "ϱ"="r", "ϲ"="s",
+            "ϳ"="j", "ϴ"="th", "ϵ"="e", "϶"="p"
+        )
+        # replace latin and greek characters to the closest english character
+        for (k in names(subs)) {
+            x <- gsub(k, subs[[k]], x)
+        }
+        x <- gsub("[^[:alnum:]_]", non_alphanum_replace, x)
+        if(collapse_replace) x <- gsub(
+            paste0(gsub("([][{}()+*^$|\\\\?.])", "\\\\\\1", non_alphanum_replace), "+"),
+            non_alphanum_replace,
+            x
+        )
+        if(tolower) x <- tolower(x)
+        x
+    }
 }
 localizeGmtfile <- function(gmturl, cachedir = tempdir()) {
@@ -25,7 +50,12 @@ localizeGmtfile <- function(gmturl, cachedir = tempdir()) {
         if (nrow(items) == 0) {
             stop(paste0("Empty GMT file: ", gmtfile, ", from ", gmturl))
         }
-        if (nchar(items$V2[1]) < nchar(items$V1[1]) && nchar(items$V2[1]) > 0) {
+        if (
+            is.character(items$V2[1]) &&
+            nchar(items$V2[1]) < nchar(items$V1[1]) &&
+            nchar(items$V2[1]) > 0 &&
+            is.na(suppressWarnings(as.numeric(items$V2[1])))
+        ) {
             warning(paste0(
                 "The second column is shorter, switching the first and second columns in GMT file ",
                 gmtfile,
@@ -153,7 +183,8 @@ runFGSEA = function(
     write.table(
         gsea_res %>%
-            mutate(leadingEdge = sapply(leadingEdge, function(x) paste(x, collapse=","))),
+            mutate(leadingEdge = sapply(leadingEdge, function(x) paste(x, collapse=",")),
+                   slug = sapply(pathway, slugify)),
         file = file.path(outdir, "fgsea.txt"),
         row.names = FALSE,
         col.names = TRUE,
@@ -172,16 +203,16 @@ runFGSEA = function(
     tablefig = file.path(outdir, "gsea_table.png")
     png(tablefig, res=100, width=1000, height=200 + 40 * length(topPathways))
-    plotGseaTable(
+    print(plotGseaTable(
         envs$pathways[topPathways],
         ranks,
         gsea_res,
         gseaParam = if (!is.null(envs$gseaParam)) envs$gseaParam else 1
-    )
+    ))
     dev.off()
     for (pathway in topPathways) {
-        enrfig = file.path(outdir, paste0("fgsea_", .slugify(pathway), ".png"))
+        enrfig = file.path(outdir, paste0("fgsea_", slugify(pathway), ".png"))
         png(enrfig, res=100, width=1000, height=800)
         print(plotEnrichment(
             envs$pathways[[pathway]],

biopipen/utils/misc.R CHANGED Viewed

@@ -33,6 +33,7 @@ bQuote <- function(x) {
 }
 #' Slugify a string
+#' Remember also update the one in gsea.R
 #' @param x A string
 #' @param non_alphanum_replace Replace non-alphanumeric characters
 #' @param collapse_replace Collapse consecutive non-alphanumeric character replacements

{biopipen-0.27.6.dist-info → biopipen-0.27.8.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: biopipen
-Version: 0.27.6
+Version: 0.27.8
 Summary: Bioinformatics processes/pipelines that can be run from `pipen run`
 License: MIT
 Author: pwwang

{biopipen-0.27.6.dist-info → biopipen-0.27.8.dist-info}/RECORD RENAMED Viewed

@@ -1,9 +1,9 @@
-biopipen/__init__.py,sha256=BwKhBzWMdVser1JHOUEX0Aa2nBqgua67wsNi17fRle0,23
+biopipen/__init__.py,sha256=tTYofCNMPRiC5Qs7KVRV32NVPrdQ2HjfgoMDf4fChsQ,23
 biopipen/core/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 biopipen/core/config.py,sha256=edK5xnDhM8j27srDzsxubi934NMrglLoKrdcC8qsEPk,1069
 biopipen/core/config.toml,sha256=20RCI30Peee1EQdfb_UbV3Hf74XUPndJnYZlUThytsw,1781
 biopipen/core/defaults.py,sha256=yPeehPLk_OYCf71IgRVCWuQRxLAMixDF81Ium0HtPKI,344
-biopipen/core/filters.py,sha256=HLrjXGsvvjRtTWIAmg_f4IMymWaRD769HlDwsCTh170,12424
+biopipen/core/filters.py,sha256=-OIzS5F_yNZ0Nk5Ci16BepPWqLOGBmYVqX3W98RSK9Y,12488
 biopipen/core/proc.py,sha256=60lUP3PcUAaKbDETo9N5PEIoeOYrLgcSmuytmrhcx8g,912
 biopipen/core/testing.py,sha256=lZ_R5ZbYPO2NPuLHdbzg6HbD_f4j8paVVbyeUqwg6FE,3411
 biopipen/ns/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -21,8 +21,8 @@ biopipen/ns/gsea.py,sha256=EsNRAPYsagaV2KYgr4Jv0KCnZGqayM209v4yOGGTIOI,7423
 biopipen/ns/misc.py,sha256=fzn0pXvdghMkQhu-e3MMapPNMyO6IAJbtTzVU3GbFa0,3246
 biopipen/ns/plot.py,sha256=fzJAKKl4a_tsVkLREGCQTFVHP049m33LdWgeYRb6v7M,5483
 biopipen/ns/rnaseq.py,sha256=bKAa6friFWof4yDTWZQahm1MS-lrdetO1GqDKdfxXYc,7708
-biopipen/ns/scrna.py,sha256=7Gs1xxQoGM3TKxaQvbgKNyMDEsgatFopImzC-RcOEoA,103946
-biopipen/ns/scrna_metabolic_landscape.py,sha256=EhOtHQyoH-jRpzDoOI_06UbjEg6mhvbDEHKhek01bPk,28334
+biopipen/ns/scrna.py,sha256=KL5Eu0mnIITLLSHAIz_sgr4ssmEU6AuBDXwedqYU7BI,105633
+biopipen/ns/scrna_metabolic_landscape.py,sha256=6AhaynGG3lNRi96N2tReVT46BJMuEwooSSd2irBoN80,28347
 biopipen/ns/snp.py,sha256=EQ2FS0trQ7YThPmBVTpS66lc2OSfgQ6lCh6WnyP-C2g,5499
 biopipen/ns/stats.py,sha256=yJ6C1CXF84T7DDs9mgufqUOr89Rl6kybE5ji8Vnx6cw,13693
 biopipen/ns/tcgamaf.py,sha256=AFbUJIxiMSvsVY3RcHgjRFuMnNh2DG3Mr5slLNEyz6o,1455
@@ -126,10 +126,10 @@ biopipen/scripts/scrna/CellTypeAnnotation-sctype.R,sha256=1nKRtzhVoJ9y0yMg1sgI6u
 biopipen/scripts/scrna/CellTypeAnnotation.R,sha256=OwLM_G4D7TG4HhIJjQxgIQM92X86lsWp9MVyXTTkLSc,618
 biopipen/scripts/scrna/CellsDistribution.R,sha256=isDr5-EWvOeWwVZdjOSsdX3QUpEaDvQFulIYawqFaQc,18854
 biopipen/scripts/scrna/DimPlots.R,sha256=-mXOTMnpPxvR30XLjwcohFfFx7xTqWKKiICwJiD6yEo,1554
-biopipen/scripts/scrna/ExprImpution-alra.R,sha256=w3W1txJcdWg52-SETY2Z0lO7maDNfiMjBYIGN587YW0,843
-biopipen/scripts/scrna/ExprImpution-rmagic.R,sha256=jYIfqZpnvjKJkvItLnemPVtUApHBYQi1_L8rHVbEe1M,735
-biopipen/scripts/scrna/ExprImpution-scimpute.R,sha256=mg40qCUW7-nP5oHPvARq7dmtoahM0GRFWXQpum0BXVk,1082
-biopipen/scripts/scrna/ExprImpution.R,sha256=7768ezrr59xUZDXq8lO9jj2XhnkSsx-xxBmOD9_DO7c,313
+biopipen/scripts/scrna/ExprImputation-alra.R,sha256=w3W1txJcdWg52-SETY2Z0lO7maDNfiMjBYIGN587YW0,843
+biopipen/scripts/scrna/ExprImputation-rmagic.R,sha256=jYIfqZpnvjKJkvItLnemPVtUApHBYQi1_L8rHVbEe1M,735
+biopipen/scripts/scrna/ExprImputation-scimpute.R,sha256=mg40qCUW7-nP5oHPvARq7dmtoahM0GRFWXQpum0BXVk,1082
+biopipen/scripts/scrna/ExprImputation.R,sha256=GcdZJpkDpq88hRQjtLZY5-byp8V43stEFm5T-pQbU6A,319
 biopipen/scripts/scrna/MarkersFinder.R,sha256=M7fHTbHHErZ9JbLmjDkx-6yVIay0_h0MkvgFegnqL44,22918
 biopipen/scripts/scrna/MetaMarkers.R,sha256=9ve1X0TrDzS_ZEW6HtU3n8R-uPx7q-hYMMNFVDSE8wQ,11272
 biopipen/scripts/scrna/ModuleScoreCalculator.R,sha256=JSHd-_-KiFqW8avCGxgU4T-C5BtDr2u0kwIvEu2lFIg,4188
@@ -141,12 +141,12 @@ biopipen/scripts/scrna/SeuratClusterStats-dimplots.R,sha256=gViDgQ8NorYD64iK0Fgc
 biopipen/scripts/scrna/SeuratClusterStats-features.R,sha256=W7iYhaFsC5EMZLO50QukYPLYGK4bq9kQc1VT5FwvI68,15496
 biopipen/scripts/scrna/SeuratClusterStats-hists.R,sha256=YhuD-GePjJPSkR0iLRgV_hiGHD_bnOIKp-LB6GCwquo,5037
 biopipen/scripts/scrna/SeuratClusterStats-ngenes.R,sha256=GVKIXFNS_syCuSN8oxoBkjxxAeI5LdSxh-qLVkUsbDA,2146
-biopipen/scripts/scrna/SeuratClusterStats-stats.R,sha256=TxQ0OcLwXwIgwL1mTLArboK0ATJIJhxWiv9DV_jBlhE,9255
+biopipen/scripts/scrna/SeuratClusterStats-stats.R,sha256=bBbvNCvV6dZLg9zvhh2nR48_53md5A5UEqrPXD00MZU,9263
 biopipen/scripts/scrna/SeuratClusterStats.R,sha256=ouWoj7Q644uG3MUlT23AES8f74g38-jPtPhINSvoUas,1267
 biopipen/scripts/scrna/SeuratClustering.R,sha256=kAvQq3RV86_KSv9NlUtUeQrPKkbhSsnv6Q4DoiTu8M0,6403
 biopipen/scripts/scrna/SeuratFilter.R,sha256=BrYK0MLdaTtQvInMaQsmOt7oH_hlks0M1zykkJtg2lM,509
 biopipen/scripts/scrna/SeuratLoading.R,sha256=ekWKnHIqtQb3kHVQiVymAHXXqiUxs6KKefjZKjaykmk,900
-biopipen/scripts/scrna/SeuratMap2Ref.R,sha256=Xn3VnvKqShuC0Ju05380wjuLVSdW0uWVzntdxjme244,4359
+biopipen/scripts/scrna/SeuratMap2Ref.R,sha256=_G8pG7NRV2GOFDzKBLY1nkXR0DO1c-6NkX990_hC8mk,9127
 biopipen/scripts/scrna/SeuratMetadataMutater.R,sha256=Pp4GsF3hZ6ZC2vroC3LSBmVa4B1p2L3hbh981yaAIeQ,1093
 biopipen/scripts/scrna/SeuratPreparing.R,sha256=t6GOcc9ZNwpRLeES7uBWja9RF6u6k5I_TXcdK4Ve7d0,18683
 biopipen/scripts/scrna/SeuratSplit.R,sha256=vdK11V39_Uo_NaOh76QWCtxObGaEr5Ynxqq0hTiSvsU,754
@@ -157,8 +157,8 @@ biopipen/scripts/scrna/Subset10X.R,sha256=T2nJBTwOe12AIKC2FZsMSv6xx3s-67CYZokpz5
 biopipen/scripts/scrna/TopExpressingGenes.R,sha256=kXMCYHVytgVgO_Uq66fKKFCFV2PPXE8VREy_0yYPLpU,7475
 biopipen/scripts/scrna/celltypist-wrapper.py,sha256=f5M8f4rU5nC7l17RS0YVmUPpLLz4D6PIcgWtA77UExM,1722
 biopipen/scripts/scrna/sctype.R,sha256=NaUJkABwF5G1UVm1CCtcMbwLSj94Mo24mbYCKFqo1Bw,6524
-biopipen/scripts/scrna_metabolic_landscape/MetabolicFeatures.R,sha256=nSBNn1BMwqoApTqmvzLeRhFu2JW_mNhOXICxmBYIP6E,4813
-biopipen/scripts/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.R,sha256=ic8Fy8QqYDGh_izmvZVJ3KL66podg_CSF5ITL3FZsvo,5196
+biopipen/scripts/scrna_metabolic_landscape/MetabolicFeatures.R,sha256=sOnHSH0Ld-tXSIXJPnXLYgRtEru5M0g3HRxbrHWQ_0U,5170
+biopipen/scripts/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.R,sha256=RPSxEHWk50Fyw5YPBVVGeWwd55Hi0zjbipLuM5O4tjs,5465
 biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayActivity.R,sha256=95DLX1Rz0tobOuDZ8V9YdGgO0KiNthhccoeeOK21tno,16216
 biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.R,sha256=rQ9iwGh9FNRZlJJzM4QItdyXmebfzLAq05ZAjb1kGUw,9831
 biopipen/scripts/snp/MatrixEQTL.R,sha256=zOR_mhn_sUXuxqgV82TPvDp-E1i5aJVA45QixyRP8no,5930
@@ -230,9 +230,9 @@ biopipen/utils/caching.R,sha256=qANQqH8p-VpvD8V4VSoqSfp0TFr4esujC7x3OFZsJMw,1687
 biopipen/utils/common_docstrs.py,sha256=Ow-g-yS5P7DEO37cP1X-xioRbYWygfQHxIuLIaDdrjs,6288
 biopipen/utils/gene.R,sha256=BzAwlLA8hO12vF-3t6IwEuTEeLa_jBll4zm_5qe3qoE,1243
 biopipen/utils/gene.py,sha256=qE_BqTayrJWxRdniffhcz6OhZcw9GUoOrj2EtFWH9Gw,2246
-biopipen/utils/gsea.R,sha256=2sN3AM0XjLWbTv6cB3JHCBWjuhmD4wEjPaaBY7wkhCI,7542
+biopipen/utils/gsea.R,sha256=BUr4pwfo7ZyinOyNa4O4dDxA1c50qWb3lpph374Yw_A,9239
 biopipen/utils/io.R,sha256=jIYdqdn0iRWfQYAZa5CjXi3fikqmYvPPLIXhobRe8sw,537
-biopipen/utils/misc.R,sha256=jXusPDCxSIaYRq_qm4khUsu9nyMhbpBVcj8BVn4j8Ic,10629
+biopipen/utils/misc.R,sha256=Y9J8gZDuPPYFxYNQtDEvKAk5j-K8j_-n0DunYvu_Hv8,10671
 biopipen/utils/misc.py,sha256=KJziAFY4Kl-0ZsO93vteY9gRLZg9BSYig-TDocHY36k,3601
 biopipen/utils/mutate_helpers.R,sha256=Bqy6Oi4rrPEPJw0Jq32bVAwwBfZv7JJL9jFcK5x-cek,17649
 biopipen/utils/plot.R,sha256=pzl37PomNeUZPxohHZ2w93j3Fc4T0Qrc62FF-9MTKdw,4417
@@ -240,7 +240,7 @@ biopipen/utils/reference.py,sha256=6bPSwQa-GiDfr7xLR9a5T64Ey40y24yn3QfQ5wDFZkU,4
 biopipen/utils/rnaseq.R,sha256=Ro2B2dG-Z2oVaT5tkwp9RHBz4dp_RF-JcizlM5GYXFs,1298
 biopipen/utils/single_cell.R,sha256=pJjYP8bIZpNAtTQ32rOXhZxaM1Y-6D-xUcK3pql9tbk,4316
 biopipen/utils/vcf.py,sha256=ajXs0M_QghEctlvUlSRjWQIABVF02wPdYd-0LP4mIsU,9377
-biopipen-0.27.6.dist-info/METADATA,sha256=t7ROsmFyR6-E4YXGAwiuNxRjZz5IX6_H7mT1rs9OSfE,882
-biopipen-0.27.6.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
-biopipen-0.27.6.dist-info/entry_points.txt,sha256=wu70aoBcv1UahVbB_5237MY-9M9_mzqmWjDD-oi3yz0,621
-biopipen-0.27.6.dist-info/RECORD,,
+biopipen-0.27.8.dist-info/METADATA,sha256=3rTtE5ECOr8Y67BOOCAfleIqkVabeEstjmhzKwxUI-w,882
+biopipen-0.27.8.dist-info/WHEEL,sha256=sP946D7jFCHeNz5Iq4fL4Lu-PrWrFsgfLXbbkciIZwg,88
+biopipen-0.27.8.dist-info/entry_points.txt,sha256=wu70aoBcv1UahVbB_5237MY-9M9_mzqmWjDD-oi3yz0,621
+biopipen-0.27.8.dist-info/RECORD,,

biopipen/scripts/scrna/ExprImpution.R DELETED Viewed

@@ -1,7 +0,0 @@
-{% if envs.tool == "rmagic" %}
-{% include biopipen_dir + "/scripts/scrna/ExprImpution-rmagic.R" %}
-{% elif envs.tool == "scimpute" %}
-{% include biopipen_dir + "/scripts/scrna/ExprImpution-scimpute.R" %}
-{% elif envs.tool == "alra" %}
-{% include biopipen_dir + "/scripts/scrna/ExprImpution-alra.R" %}
-{% endif %}

/biopipen/scripts/scrna/{ExprImpution-alra.R → ExprImputation-alra.R} RENAMED Viewed

File without changes

/biopipen/scripts/scrna/{ExprImpution-rmagic.R → ExprImputation-rmagic.R} RENAMED Viewed

File without changes

/biopipen/scripts/scrna/{ExprImpution-scimpute.R → ExprImputation-scimpute.R} RENAMED Viewed

File without changes

{biopipen-0.27.6.dist-info → biopipen-0.27.8.dist-info}/WHEEL RENAMED Viewed

File without changes

{biopipen-0.27.6.dist-info → biopipen-0.27.8.dist-info}/entry_points.txt RENAMED Viewed

File without changes

biopipen 0.27.6__py3-none-any.whl → 0.27.8__py3-none-any.whl

Potentially problematic release.

biopipen 0.27.6__py3-none-any.whl → 0.27.8__py3-none-any.whl