PyPI - biopipen - Versions diffs - 0.21.2__py3-none-any.whl → 0.22.1__py3-none-any.whl - Mend

biopipen 0.21.2__py3-none-any.whl → 0.22.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of biopipen might be problematic. Click here for more details.

Files changed (62)

biopipen/__init__.py +1 -1
biopipen/core/filters.py +142 -0
biopipen/ns/scrna.py +19 -1
biopipen/ns/tcr.py +30 -10
biopipen/reports/delim/SampleInfo.svelte +2 -22
biopipen/reports/scrna/CellsDistribution.svelte +4 -39
biopipen/reports/scrna/MarkersFinder.svelte +6 -126
biopipen/reports/scrna/MetaMarkers.svelte +3 -75
biopipen/reports/scrna/RadarPlots.svelte +4 -20
biopipen/reports/scrna/ScFGSEA.svelte +4 -23
biopipen/reports/scrna/SeuratClusterStats.svelte +3 -69
biopipen/reports/scrna/SeuratPreparing.svelte +3 -26
biopipen/reports/scrna/TopExpressingGenes.svelte +3 -41
biopipen/reports/scrna_metabolic_landscape/MetabolicFeatures.svelte +17 -16
biopipen/reports/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.svelte +13 -16
biopipen/reports/scrna_metabolic_landscape/MetabolicPathwayActivity.svelte +44 -52
biopipen/reports/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.svelte +2 -8
biopipen/reports/tcr/CDR3AAPhyschem.svelte +18 -65
biopipen/reports/tcr/CloneResidency.svelte +3 -93
biopipen/reports/tcr/Immunarch.svelte +4 -168
biopipen/reports/tcr/TCRClusterStats.svelte +3 -45
biopipen/reports/tcr/TESSA.svelte +11 -28
biopipen/scripts/delim/SampleInfo.R +41 -7
biopipen/scripts/scrna/CellsDistribution.R +127 -16
biopipen/scripts/scrna/MarkersFinder.R +245 -100
biopipen/scripts/scrna/MetaMarkers.R +163 -82
biopipen/scripts/scrna/RadarPlots.R +163 -110
biopipen/scripts/scrna/ScFGSEA.R +51 -11
biopipen/scripts/scrna/SeuratClusterStats-dimplots.R +26 -13
biopipen/scripts/scrna/SeuratClusterStats-features.R +58 -53
biopipen/scripts/scrna/SeuratClusterStats-stats.R +39 -21
biopipen/scripts/scrna/SeuratClusterStats.R +4 -2
biopipen/scripts/scrna/SeuratClustering.R +73 -26
biopipen/scripts/scrna/SeuratMetadataMutater.R +13 -1
biopipen/scripts/scrna/SeuratPreparing.R +93 -19
biopipen/scripts/scrna/TopExpressingGenes.R +100 -18
biopipen/scripts/scrna_metabolic_landscape/MetabolicFeatures.R +21 -8
biopipen/scripts/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.R +25 -3
biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayActivity.R +1 -0
biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.R +14 -3
biopipen/scripts/tcr/Attach2Seurat.R +2 -1
biopipen/scripts/tcr/CDR3AAPhyschem.R +123 -10
biopipen/scripts/tcr/CloneResidency.R +114 -34
biopipen/scripts/tcr/Immunarch-basic.R +18 -4
biopipen/scripts/tcr/Immunarch-clonality.R +14 -0
biopipen/scripts/tcr/Immunarch-diversity.R +123 -18
biopipen/scripts/tcr/Immunarch-geneusage.R +23 -1
biopipen/scripts/tcr/Immunarch-kmer.R +45 -3
biopipen/scripts/tcr/Immunarch-overlap.R +62 -0
biopipen/scripts/tcr/Immunarch-spectratyping.R +18 -2
biopipen/scripts/tcr/Immunarch-tracking.R +24 -1
biopipen/scripts/tcr/Immunarch-vjjunc.R +17 -2
biopipen/scripts/tcr/Immunarch.R +7 -0
biopipen/scripts/tcr/ImmunarchLoading.R +22 -23
biopipen/scripts/tcr/TCRClusterStats.R +124 -11
biopipen/scripts/tcr/TCRClustering.R +8 -9
biopipen/scripts/tcr/TESSA.R +66 -41
biopipen/utils/misc.R +96 -1
{biopipen-0.21.2.dist-info → biopipen-0.22.1.dist-info}/METADATA +1 -1
{biopipen-0.21.2.dist-info → biopipen-0.22.1.dist-info}/RECORD +62 -62
{biopipen-0.21.2.dist-info → biopipen-0.22.1.dist-info}/WHEEL +0 -0
{biopipen-0.21.2.dist-info → biopipen-0.22.1.dist-info}/entry_points.txt +0 -0

biopipen/scripts/scrna/MetaMarkers.R CHANGED Viewed

@@ -12,16 +12,19 @@ library(ggplot2)
 library(ggprism)
 library(parallel)
 library(tidyseurat)
+library(slugify)
 setEnrichrSite("Enrichr")
 srtfile <- {{ in.srtobj | quote }}
 outdir <- {{ out.outdir | quote }}
+joboutdir <- {{ job.outdir | quote }}
 ncores <- {{ envs.ncores | int }}
 mutaters <- {{ envs.mutaters | r }}
 idents <- {{ envs.idents | r }}
 group_by <- {{ envs["group-by"] | r }}
 each <- {{ envs.each | r }}
+subset <- {{ envs.subset | r }}
 prefix_each <- {{ envs.prefix_each | r }}
 p_adjust <- {{ envs.p_adjust | r }}
 section <- {{ envs.section | r }}
@@ -32,15 +35,15 @@ cases <- {{ envs.cases | r: todot = "-" }}
 set.seed(8525)
-print("- Reading Seurat object ...")
+log_info("- Reading Seurat object ...")
 srtobj <- readRDS(srtfile)
-print("- Mutate meta data if needed ...")
+log_info("- Mutate meta data if needed ...")
 if (!is.null(mutaters) && length(mutaters)) {
     srtobj@meta.data <- srtobj@meta.data %>% mutate(!!!lapply(mutaters, parse_expr))
 }
-print("- Expanding cases ...")
+log_info("- Expanding cases ...")
 if (is.null(cases) || length(cases) == 0) {
     cases <- list(
         DEFAULT = list(
@@ -49,6 +52,7 @@ if (is.null(cases) || length(cases) == 0) {
             each = each,
             prefix_each = prefix_each,
             p_adjust = p_adjust,
+            subset = subset,
             section = section,
             dbs = dbs,
             sigmarkers = sigmarkers,
@@ -65,6 +69,7 @@ if (is.null(cases) || length(cases) == 0) {
             prefix_each = prefix_each,
             p_adjust = p_adjust,
             section = section,
+            subset = subset,
             dbs = dbs,
             sigmarkers = sigmarkers,
             method = method
@@ -74,12 +79,19 @@ if (is.null(cases) || length(cases) == 0) {
 }
 newcases <- list()
+sections <- c()
 for (name in names(cases)) {
     case <- cases[[name]]
     if (is.null(case$each)) {
+        sections <- c(sections, case$section)
         newcases[[paste0(case$section, ":", name)]] <- case
     } else {
-        eachs <- srtobj@meta.data %>% pull(case$each) %>% unique() %>% na.omit()
+        if (is.null(case$subset)) {
+            eachs <- srtobj@meta.data %>% pull(case$each) %>% unique() %>% na.omit()
+        } else {
+            eachs <- srtobj@meta.data %>% filter(!!parse_expr(case$subset)) %>% pull(case$each) %>% unique() %>% na.omit()
+        }
+        sections <- c(sections, case$each)
         for (each in eachs) {
             by = make.names(paste0(".", name, "_", case$each, "_", each))
             idents <- case$idents
@@ -111,98 +123,98 @@ for (name in names(cases)) {
     }
 }
 cases <- newcases
+single_section <- length(unique(sections)) == 1
+casename_info <- function(casename, create = FALSE) {
+    sec_case_names <- strsplit(casename, ":")[[1]]
+    cname <- paste(sec_case_names[-1], collapse = ":")
+    out <- list(
+        casename = casename,
+        section = sec_case_names[1],
+        case = cname,
+        section_slug = slugify(sec_case_names[1], tolower = FALSE),
+        case_slug = slugify(cname, tolower = FALSE)
+    )
+    out$casedir <- file.path(outdir, out$section_slug, out$case_slug)
+    if (create) {
+        dir.create(out$casedir, showWarnings = FALSE, recursive = TRUE)
+    }
+    out
+}
 # Do enrichment analysis for a case using Enrichr
 # Args:
 #   case: case name
 #   markers: markers dataframe
 #   sig: The expression to filter significant markers
-do_enrich <- function(case, markers, sig) {
-    print(paste("  Running enrichment for case:", case))
-    parts <- strsplit(case, ":")[[1]]
-    sec <- parts[1]
-    case <- paste0(parts[-1], collapse = ":")
-    casedir <- file.path(outdir, sec, case)
-    dir.create(casedir, showWarnings = FALSE, recursive = TRUE)
+do_enrich <- function(info, markers, sig) {
+    log_info("  Running enrichment for case: {info$casename}")
     if (nrow(markers) == 0) {
-        print(paste("  No markers found for case:", case))
-        cat("No markers found.", file = file.path(casedir, "error.txt"))
-        return()
+        msg <- paste0("No markers found for case: ", info$casename)
+        log_warn("  {msg}")
+        return(msg)
     }
     markers_sig <- markers %>% filter(!!parse_expr(sig))
     if (nrow(markers_sig) == 0) {
-        print(paste("  No significant markers found for case:", case))
-        cat("No significant markers.", file = file.path(casedir, "error.txt"))
-        return()
+        msg <- paste0("No significant markers found for case: ", info$casename)
+        log_warn("  {msg}")
+        return(msg)
     }
     write.table(
         markers_sig,
-        file.path(casedir, "markers.txt"),
+        file.path(info$casedir, "markers.txt"),
         sep = "\t",
         row.names = FALSE,
         col.names = TRUE,
         quote = FALSE
     )
     if (nrow(markers_sig) < 5) {
-        for (db in dbs) {
-            write.table(
-                data.frame(Warning = "Not enough significant markers."),
-                file.path(casedir, paste0("Enrichr-", db, ".txt")),
-                sep = "\t",
-                row.names = FALSE,
-                col.names = TRUE,
-                quote = FALSE
-            )
-            png(
-                file.path(casedir, paste0("Enrichr-", db, ".png")),
-                res = 100, height = 200, width = 1000
-            )
-            print(
-                ggplot() +
-                    annotate(
-                        "text",
-                        x = 1,
-                        y = 1,
-                        label = "Not enough significant markers."
-                    ) +
-                    theme_classic()
-            )
-            dev.off()
-        }
-    } else {
-        enriched <- enrichr(markers_sig$gene, dbs)
-        for (db in dbs) {
-            write.table(
-                enriched[[db]],
-                file.path(casedir, paste0("Enrichr-", db, ".txt")),
-                sep = "\t",
-                row.names = FALSE,
-                col.names = TRUE,
-                quote = FALSE
-            )
-            png(
-                file.path(casedir, paste0("Enrichr-", db, ".png")),
-                res = 100, height = 1000, width = 1000
-            )
-            print(plotEnrich(enriched[[db]], showTerms = 20, title = db))
-            dev.off()
-        }
+        msg <- paste0("Too few significant markers found for case: ", info$casename)
+        log_warn(msg)
+        return(msg)
+    }
+    enriched <- enrichr(markers_sig$gene, dbs)
+    for (db in dbs) {
+        write.table(
+            enriched[[db]],
+            file.path(info$casedir, paste0("Enrichr-", db, ".txt")),
+            sep = "\t",
+            row.names = FALSE,
+            col.names = TRUE,
+            quote = FALSE
+        )
+        png(
+            file.path(info$casedir, paste0("Enrichr-", db, ".png")),
+            res = 100, height = 600, width = 800
+        )
+        print(
+            plotEnrich(enriched[[db]], showTerms = 20, title = db) +
+            theme_prism()
+        )
+        dev.off()
     }
 }
 do_case <- function(casename) {
-    cat(paste("- Dealing with case:", casename, "...\n"))
+    log_info("- Dealing with case: {casename} ...")
+    info <- casename_info(casename, create = TRUE)
     case <- cases[[casename]]
     sobj <- srtobj %>% filter(!is.na(!!sym(case$group_by)))
+    if (!is.null(case$subset)) {
+        sobj <- srtobj %>% filter(!is.na(!!sym(case$group_by)), !!parse_expr(case$subset))
+    }
     df <- GetAssayData(sobj, slot = "data", assay = "RNA")
     genes <- rownames(df)
     # rows: cells, cols: genes
     df <- cbind(as.data.frame(scale(Matrix::t(df))), sobj@meta.data[, case$group_by])
     colnames(df)[ncol(df)] <- "GROUP"
-    cat(paste("  Running tests for case...\n"))
+    log_info("  Running tests for case...")
     test_result <- mclapply(genes, function(gene) {
         fm <- as.formula(paste(bQuote(gene), "~ GROUP"))
         res <- tryCatch({
@@ -230,28 +242,97 @@ do_case <- function(casename) {
     markers <- do_call(rbind, test_result)
     markers$p_adjust <- p.adjust(markers$p.value, method = case$p_adjust)
     markers <- markers %>% arrange(p_adjust)
-    do_enrich(casename, markers, case$sigmarkers)
-    print(paste("  Plotting top 10 genes ...\n"))
-    markers <- markers %>% head(10)
-    parts <- strsplit(casename, ":")[[1]]
-    sec <- parts[1]
-    casename <- paste0(parts[-1], collapse = ":")
-    plotdir <- file.path(outdir, sec, casename, "plots")
-    dir.create(plotdir, showWarnings = FALSE, recursive = TRUE)
+    msg <- do_enrich(info, markers, case$sigmarkers)
+    if (is.null(msg)) {
+        log_info("  Plotting top 10 genes ...")
+        markers <- markers %>% head(10)
+        plotdir <- file.path(info$casedir, "expr_plots")
+        dir.create(plotdir, showWarnings = FALSE, recursive = TRUE)
-    # Plot the top 10 genes in each group with violin plots
-    for (gene in markers$gene) {
-        outfile = file.path(plotdir, paste0(gene, ".png"))
-        p = ggplot(df, aes_string(x="GROUP", y=bQuote(gene), fill="GROUP")) +
-            geom_violin(alpha = .8) +
-            geom_boxplot(width=0.1, fill="white") +
-            theme_prism() +
-            ylab(paste0("Expression of ", gene))
-        png(outfile, res = 100, height = 800, width = 1000)
-        print(p)
-        dev.off()
+        # Plot the top 10 genes in each group with violin plots
+        geneplots = list()
+        for (gene in markers$gene) {
+            outfile = file.path(plotdir, paste0(slugify(gene, tolower = FALSE), ".png"))
+            p = ggplot(df, aes_string(x="GROUP", y=bQuote(gene), fill="GROUP")) +
+                geom_violin(alpha = .8) +
+                geom_boxplot(width=0.1, fill="white") +
+                theme_prism() +
+                ylab(paste0("Expression of ", gene))
+            png(outfile, res = 100, height = 600, width = 800)
+            print(p)
+            dev.off()
+            geneplots[[length(geneplots) + 1]] <- list(
+                kind = "table_image",
+                src = outfile,
+                name = gene
+            )
+        }
+        add_report(
+            list(
+                kind = "descr",
+                content = paste0(
+                    "Top 100 genes selected by ",
+                    "<code>", case$method, "</code> across ",
+                    "<code>", case$group_by, "</code> and filtered by ",
+                    "<code>", html_escape(case$sigmarkers), "</code>"
+                )
+            ),
+            h1 = ifelse(
+                info$section == "DEFAULT",
+                info$case,
+                ifelse(single_section, paste0(info$section, " - ", info$case), info$section)
+            ),
+            h2 = ifelse(single_section, "Meta-Markers", info$case),
+            h3 = ifelse(single_section, "#", "Meta-Markers")
+        )
+        add_report(
+            list(
+                name = "Meta-Markers",
+                contents = list(list(
+                    kind = "table",
+                    src = file.path(info$casedir, "markers.txt"),
+                    data = list(nrows = 100)
+                ))
+            ),
+            list(
+                name = "Volin Plots (Top 10)",
+                ui = "table_of_images:4",
+                contents = geneplots
+            ),
+            h1 = ifelse(
+                info$section == "DEFAULT",
+                info$case,
+                ifelse(single_section, paste0(info$section, " - ", info$case), info$section)
+            ),
+            h2 = ifelse(single_section, "Meta-Markers", info$case),
+            h3 = ifelse(single_section, "#", "Meta-Markers"),
+            ui = "tabs"
+        )
+        add_report(
+            list(kind = "enrichr", dir = info$casedir),
+            h1 = ifelse(
+                info$section == "DEFAULT",
+                info$case,
+                ifelse(single_section, paste0(info$section, " - ", info$case), info$section)
+            ),
+            h2 = ifelse(single_section, "Enrichment Analysis", info$case),
+            h3 = ifelse(single_section, "#", "Enrichment Analysis")
+        )
+    } else {
+        add_report(
+            list(kind = "error", content = msg),
+            h1 = ifelse(
+                info$section == "DEFAULT",
+                info$case,
+                ifelse(single_section, paste0(info$section, " - ", info$case), info$section)
+            ),
+            h2 = ifelse(single_section, "#", info$case)
+        )
     }
 }
 sapply(sort(names(cases)), do_case)
+save_report(joboutdir)

biopipen 0.21.2__py3-none-any.whl → 0.22.1__py3-none-any.whl

Potentially problematic release.

biopipen 0.21.2__py3-none-any.whl → 0.22.1__py3-none-any.whl