PyPI - biopipen - Versions diffs - 0.21.0__py3-none-any.whl → 0.34.26__py3-none-any.whl - Mend

biopipen 0.21.0__py3-none-any.whl → 0.34.26__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (290) hide show

biopipen/__init__.py +1 -1
biopipen/core/config.toml +28 -0
biopipen/core/filters.py +79 -4
biopipen/core/proc.py +12 -3
biopipen/core/testing.py +75 -3
biopipen/ns/bam.py +148 -6
biopipen/ns/bed.py +75 -0
biopipen/ns/cellranger.py +186 -0
biopipen/ns/cellranger_pipeline.py +126 -0
biopipen/ns/cnv.py +19 -3
biopipen/ns/cnvkit.py +1 -1
biopipen/ns/cnvkit_pipeline.py +20 -12
biopipen/ns/delim.py +34 -35
biopipen/ns/gene.py +68 -23
biopipen/ns/gsea.py +63 -37
biopipen/ns/misc.py +39 -14
biopipen/ns/plot.py +304 -1
biopipen/ns/protein.py +183 -0
biopipen/ns/regulatory.py +290 -0
biopipen/ns/rnaseq.py +142 -5
biopipen/ns/scrna.py +2053 -473
biopipen/ns/scrna_metabolic_landscape.py +228 -382
biopipen/ns/snp.py +659 -0
biopipen/ns/stats.py +484 -0
biopipen/ns/tcr.py +683 -98
biopipen/ns/vcf.py +236 -2
biopipen/ns/web.py +97 -6
biopipen/reports/bam/CNVpytor.svelte +4 -9
biopipen/reports/cellranger/CellRangerCount.svelte +18 -0
biopipen/reports/cellranger/CellRangerSummary.svelte +16 -0
biopipen/reports/cellranger/CellRangerVdj.svelte +18 -0
biopipen/reports/cnvkit/CNVkitDiagram.svelte +1 -1
biopipen/reports/cnvkit/CNVkitHeatmap.svelte +1 -1
biopipen/reports/cnvkit/CNVkitScatter.svelte +1 -1
biopipen/reports/common.svelte +15 -0
biopipen/reports/protein/ProdigySummary.svelte +16 -0
biopipen/reports/scrna/CellsDistribution.svelte +4 -39
biopipen/reports/scrna/DimPlots.svelte +1 -1
biopipen/reports/scrna/MarkersFinder.svelte +6 -126
biopipen/reports/scrna/MetaMarkers.svelte +3 -75
biopipen/reports/scrna/RadarPlots.svelte +4 -20
biopipen/reports/scrna_metabolic_landscape/MetabolicFeatures.svelte +61 -22
biopipen/reports/scrna_metabolic_landscape/MetabolicPathwayActivity.svelte +88 -82
biopipen/reports/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.svelte +70 -10
biopipen/reports/snp/PlinkCallRate.svelte +24 -0
biopipen/reports/snp/PlinkFreq.svelte +18 -0
biopipen/reports/snp/PlinkHWE.svelte +18 -0
biopipen/reports/snp/PlinkHet.svelte +18 -0
biopipen/reports/snp/PlinkIBD.svelte +18 -0
biopipen/reports/tcr/CDR3AAPhyschem.svelte +19 -66
biopipen/reports/tcr/ClonalStats.svelte +16 -0
biopipen/reports/tcr/CloneResidency.svelte +3 -93
biopipen/reports/tcr/Immunarch.svelte +4 -155
biopipen/reports/tcr/TCRClusterStats.svelte +3 -45
biopipen/reports/tcr/TESSA.svelte +11 -28
biopipen/reports/utils/misc.liq +22 -7
biopipen/scripts/bam/BamMerge.py +11 -15
biopipen/scripts/bam/BamSampling.py +90 -0
biopipen/scripts/bam/BamSort.py +141 -0
biopipen/scripts/bam/BamSplitChroms.py +10 -10
biopipen/scripts/bam/BamSubsetByBed.py +38 -0
biopipen/scripts/bam/CNAClinic.R +41 -5
biopipen/scripts/bam/CNVpytor.py +153 -54
biopipen/scripts/bam/ControlFREEC.py +13 -14
biopipen/scripts/bam/SamtoolsView.py +33 -0
biopipen/scripts/bed/Bed2Vcf.py +5 -5
biopipen/scripts/bed/BedConsensus.py +5 -5
biopipen/scripts/bed/BedLiftOver.sh +6 -4
biopipen/scripts/bed/BedtoolsIntersect.py +54 -0
biopipen/scripts/bed/BedtoolsMakeWindows.py +47 -0
biopipen/scripts/bed/BedtoolsMerge.py +4 -4
biopipen/scripts/cellranger/CellRangerCount.py +138 -0
biopipen/scripts/cellranger/CellRangerSummary.R +181 -0
biopipen/scripts/cellranger/CellRangerVdj.py +112 -0
biopipen/scripts/cnv/AneuploidyScore.R +55 -20
biopipen/scripts/cnv/AneuploidyScoreSummary.R +221 -163
biopipen/scripts/cnv/TMADScore.R +25 -9
biopipen/scripts/cnv/TMADScoreSummary.R +57 -86
biopipen/scripts/cnvkit/CNVkitAccess.py +7 -6
biopipen/scripts/cnvkit/CNVkitAutobin.py +26 -18
biopipen/scripts/cnvkit/CNVkitBatch.py +6 -6
biopipen/scripts/cnvkit/CNVkitCall.py +3 -3
biopipen/scripts/cnvkit/CNVkitCoverage.py +4 -3
biopipen/scripts/cnvkit/CNVkitDiagram.py +5 -5
biopipen/scripts/cnvkit/CNVkitFix.py +3 -3
biopipen/scripts/cnvkit/CNVkitGuessBaits.py +12 -8
biopipen/scripts/cnvkit/CNVkitHeatmap.py +5 -5
biopipen/scripts/cnvkit/CNVkitReference.py +6 -5
biopipen/scripts/cnvkit/CNVkitScatter.py +5 -5
biopipen/scripts/cnvkit/CNVkitSegment.py +5 -5
biopipen/scripts/cnvkit/guess_baits.py +166 -93
biopipen/scripts/delim/RowsBinder.R +1 -1
biopipen/scripts/delim/SampleInfo.R +116 -118
biopipen/scripts/gene/GeneNameConversion.R +67 -0
biopipen/scripts/gene/GenePromoters.R +61 -0
biopipen/scripts/gsea/Enrichr.R +5 -5
biopipen/scripts/gsea/FGSEA.R +184 -50
biopipen/scripts/gsea/GSEA.R +2 -2
biopipen/scripts/gsea/PreRank.R +5 -5
biopipen/scripts/misc/Config2File.py +2 -2
biopipen/scripts/misc/Plot.R +80 -0
biopipen/scripts/misc/Shell.sh +15 -0
biopipen/scripts/misc/Str2File.py +2 -2
biopipen/scripts/plot/Heatmap.R +3 -3
biopipen/scripts/plot/Manhattan.R +147 -0
biopipen/scripts/plot/QQPlot.R +146 -0
biopipen/scripts/plot/ROC.R +88 -0
biopipen/scripts/plot/Scatter.R +112 -0
biopipen/scripts/plot/VennDiagram.R +5 -9
biopipen/scripts/protein/MMCIF2PDB.py +33 -0
biopipen/scripts/protein/PDB2Fasta.py +60 -0
biopipen/scripts/protein/Prodigy.py +119 -0
biopipen/scripts/protein/ProdigySummary.R +140 -0
biopipen/scripts/protein/RMSD.py +178 -0
biopipen/scripts/regulatory/MotifAffinityTest.R +102 -0
biopipen/scripts/regulatory/MotifAffinityTest_AtSNP.R +127 -0
biopipen/scripts/regulatory/MotifAffinityTest_MotifBreakR.R +104 -0
biopipen/scripts/regulatory/MotifScan.py +159 -0
biopipen/scripts/regulatory/VariantMotifPlot.R +78 -0
biopipen/scripts/regulatory/motifs-common.R +324 -0
biopipen/scripts/rnaseq/Simulation-ESCO.R +180 -0
biopipen/scripts/rnaseq/Simulation-RUVcorr.R +45 -0
biopipen/scripts/rnaseq/Simulation.R +21 -0
biopipen/scripts/rnaseq/UnitConversion.R +325 -54
biopipen/scripts/scrna/AnnData2Seurat.R +40 -0
biopipen/scripts/scrna/CCPlotR-patch.R +161 -0
biopipen/scripts/scrna/CellCellCommunication.py +150 -0
biopipen/scripts/scrna/CellCellCommunicationPlots.R +93 -0
biopipen/scripts/scrna/CellSNPLite.py +30 -0
biopipen/scripts/scrna/CellTypeAnnotation-celltypist.R +185 -0
biopipen/scripts/scrna/CellTypeAnnotation-direct.R +68 -31
biopipen/scripts/scrna/CellTypeAnnotation-hitype.R +27 -22
biopipen/scripts/scrna/CellTypeAnnotation-sccatch.R +28 -20
biopipen/scripts/scrna/CellTypeAnnotation-sctype.R +48 -25
biopipen/scripts/scrna/CellTypeAnnotation.R +37 -1
biopipen/scripts/scrna/CellsDistribution.R +456 -167
biopipen/scripts/scrna/DimPlots.R +1 -1
biopipen/scripts/scrna/ExprImputation-alra.R +109 -0
biopipen/scripts/scrna/ExprImputation-rmagic.R +256 -0
biopipen/scripts/scrna/{ExprImpution-scimpute.R → ExprImputation-scimpute.R} +8 -5
biopipen/scripts/scrna/ExprImputation.R +7 -0
biopipen/scripts/scrna/LoomTo10X.R +51 -0
biopipen/scripts/scrna/MQuad.py +25 -0
biopipen/scripts/scrna/MarkersFinder.R +679 -400
biopipen/scripts/scrna/MetaMarkers.R +265 -161
biopipen/scripts/scrna/ModuleScoreCalculator.R +66 -11
biopipen/scripts/scrna/PseudoBulkDEG.R +678 -0
biopipen/scripts/scrna/RadarPlots.R +355 -134
biopipen/scripts/scrna/ScFGSEA.R +298 -100
biopipen/scripts/scrna/ScSimulation.R +65 -0
biopipen/scripts/scrna/ScVelo.py +617 -0
biopipen/scripts/scrna/Seurat2AnnData.R +7 -0
biopipen/scripts/scrna/SeuratClusterStats-clustree.R +87 -0
biopipen/scripts/scrna/SeuratClusterStats-dimplots.R +36 -30
biopipen/scripts/scrna/SeuratClusterStats-features.R +138 -187
biopipen/scripts/scrna/SeuratClusterStats-ngenes.R +81 -0
biopipen/scripts/scrna/SeuratClusterStats-stats.R +78 -89
biopipen/scripts/scrna/SeuratClusterStats.R +47 -10
biopipen/scripts/scrna/SeuratClustering.R +36 -233
biopipen/scripts/scrna/SeuratLoading.R +2 -2
biopipen/scripts/scrna/SeuratMap2Ref.R +84 -113
biopipen/scripts/scrna/SeuratMetadataMutater.R +16 -6
biopipen/scripts/scrna/SeuratPreparing.R +223 -173
biopipen/scripts/scrna/SeuratSubClustering.R +64 -0
biopipen/scripts/scrna/SeuratTo10X.R +27 -0
biopipen/scripts/scrna/Slingshot.R +65 -0
biopipen/scripts/scrna/Subset10X.R +2 -2
biopipen/scripts/scrna/TopExpressingGenes.R +169 -135
biopipen/scripts/scrna/celltypist-wrapper.py +195 -0
biopipen/scripts/scrna/scvelo_paga.py +313 -0
biopipen/scripts/scrna/seurat_anndata_conversion.py +98 -0
biopipen/scripts/scrna_metabolic_landscape/MetabolicFeatures.R +447 -82
biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayActivity.R +348 -241
biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.R +188 -166
biopipen/scripts/snp/MatrixEQTL.R +217 -0
biopipen/scripts/snp/Plink2GTMat.py +148 -0
biopipen/scripts/snp/PlinkCallRate.R +199 -0
biopipen/scripts/snp/PlinkFilter.py +100 -0
biopipen/scripts/snp/PlinkFreq.R +291 -0
biopipen/scripts/snp/PlinkFromVcf.py +81 -0
biopipen/scripts/snp/PlinkHWE.R +85 -0
biopipen/scripts/snp/PlinkHet.R +96 -0
biopipen/scripts/snp/PlinkIBD.R +196 -0
biopipen/scripts/snp/PlinkSimulation.py +124 -0
biopipen/scripts/snp/PlinkUpdateName.py +124 -0
biopipen/scripts/stats/ChowTest.R +146 -0
biopipen/scripts/stats/DiffCoexpr.R +152 -0
biopipen/scripts/stats/LiquidAssoc.R +135 -0
biopipen/scripts/stats/Mediation.R +108 -0
biopipen/scripts/stats/MetaPvalue.R +130 -0
biopipen/scripts/stats/MetaPvalue1.R +74 -0
biopipen/scripts/tcgamaf/Maf2Vcf.py +2 -2
biopipen/scripts/tcgamaf/MafAddChr.py +2 -2
biopipen/scripts/tcr/Attach2Seurat.R +3 -2
biopipen/scripts/tcr/CDR3AAPhyschem.R +211 -143
biopipen/scripts/tcr/CDR3Clustering.R +343 -0
biopipen/scripts/tcr/ClonalStats.R +526 -0
biopipen/scripts/tcr/CloneResidency.R +255 -131
biopipen/scripts/tcr/CloneSizeQQPlot.R +4 -4
biopipen/scripts/tcr/GIANA/GIANA.py +1356 -797
biopipen/scripts/tcr/GIANA/GIANA4.py +1362 -789
biopipen/scripts/tcr/GIANA/query.py +164 -162
biopipen/scripts/tcr/Immunarch-basic.R +31 -9
biopipen/scripts/tcr/Immunarch-clonality.R +25 -5
biopipen/scripts/tcr/Immunarch-diversity.R +352 -134
biopipen/scripts/tcr/Immunarch-geneusage.R +45 -5
biopipen/scripts/tcr/Immunarch-kmer.R +68 -8
biopipen/scripts/tcr/Immunarch-overlap.R +84 -4
biopipen/scripts/tcr/Immunarch-spectratyping.R +35 -6
biopipen/scripts/tcr/Immunarch-tracking.R +38 -6
biopipen/scripts/tcr/Immunarch-vjjunc.R +165 -0
biopipen/scripts/tcr/Immunarch.R +63 -11
biopipen/scripts/tcr/Immunarch2VDJtools.R +2 -2
biopipen/scripts/tcr/ImmunarchFilter.R +4 -4
biopipen/scripts/tcr/ImmunarchLoading.R +38 -29
biopipen/scripts/tcr/SampleDiversity.R +1 -1
biopipen/scripts/tcr/ScRepCombiningExpression.R +40 -0
biopipen/scripts/tcr/ScRepLoading.R +166 -0
biopipen/scripts/tcr/TCRClusterStats.R +176 -22
biopipen/scripts/tcr/TCRDock.py +110 -0
biopipen/scripts/tcr/TESSA.R +102 -118
biopipen/scripts/tcr/VJUsage.R +5 -5
biopipen/scripts/tcr/immunarch-patched.R +142 -0
biopipen/scripts/tcr/vdjtools-patch.sh +1 -1
biopipen/scripts/vcf/BcftoolsAnnotate.py +91 -0
biopipen/scripts/vcf/BcftoolsFilter.py +90 -0
biopipen/scripts/vcf/BcftoolsMerge.py +31 -0
biopipen/scripts/vcf/BcftoolsSort.py +113 -0
biopipen/scripts/vcf/BcftoolsView.py +73 -0
biopipen/scripts/vcf/TruvariBench.sh +14 -7
biopipen/scripts/vcf/TruvariBenchSummary.R +16 -13
biopipen/scripts/vcf/TruvariConsistency.R +1 -1
biopipen/scripts/vcf/Vcf2Bed.py +2 -2
biopipen/scripts/vcf/VcfAnno.py +11 -11
biopipen/scripts/vcf/VcfDownSample.sh +22 -10
biopipen/scripts/vcf/VcfFilter.py +5 -5
biopipen/scripts/vcf/VcfFix.py +7 -7
biopipen/scripts/vcf/VcfFix_utils.py +13 -4
biopipen/scripts/vcf/VcfIndex.py +3 -3
biopipen/scripts/vcf/VcfIntersect.py +3 -3
biopipen/scripts/vcf/VcfLiftOver.sh +5 -0
biopipen/scripts/vcf/VcfSplitSamples.py +4 -4
biopipen/scripts/vcf/bcftools_utils.py +52 -0
biopipen/scripts/web/Download.py +8 -4
biopipen/scripts/web/DownloadList.py +5 -5
biopipen/scripts/web/GCloudStorageDownloadBucket.py +82 -0
biopipen/scripts/web/GCloudStorageDownloadFile.py +23 -0
biopipen/scripts/web/gcloud_common.py +49 -0
biopipen/utils/gene.py +108 -60
biopipen/utils/misc.py +146 -20
biopipen/utils/reference.py +64 -20
biopipen/utils/reporter.py +177 -0
biopipen/utils/vcf.py +1 -1
biopipen-0.34.26.dist-info/METADATA +27 -0
biopipen-0.34.26.dist-info/RECORD +292 -0
{biopipen-0.21.0.dist-info → biopipen-0.34.26.dist-info}/WHEEL +1 -1
{biopipen-0.21.0.dist-info → biopipen-0.34.26.dist-info}/entry_points.txt +6 -2
biopipen/ns/bcftools.py +0 -111
biopipen/ns/scrna_basic.py +0 -255
biopipen/reports/delim/SampleInfo.svelte +0 -36
biopipen/reports/scrna/GeneExpressionInvistigation.svelte +0 -32
biopipen/reports/scrna/ScFGSEA.svelte +0 -35
biopipen/reports/scrna/SeuratClusterStats.svelte +0 -82
biopipen/reports/scrna/SeuratMap2Ref.svelte +0 -20
biopipen/reports/scrna/SeuratPreparing.svelte +0 -38
biopipen/reports/scrna/TopExpressingGenes.svelte +0 -55
biopipen/reports/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.svelte +0 -31
biopipen/reports/utils/gsea.liq +0 -110
biopipen/scripts/bcftools/BcftoolsAnnotate.py +0 -42
biopipen/scripts/bcftools/BcftoolsFilter.py +0 -79
biopipen/scripts/bcftools/BcftoolsSort.py +0 -19
biopipen/scripts/gene/GeneNameConversion.py +0 -66
biopipen/scripts/scrna/ExprImpution-alra.R +0 -32
biopipen/scripts/scrna/ExprImpution-rmagic.R +0 -29
biopipen/scripts/scrna/ExprImpution.R +0 -7
biopipen/scripts/scrna/GeneExpressionInvistigation.R +0 -132
biopipen/scripts/scrna/Write10X.R +0 -11
biopipen/scripts/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.R +0 -150
biopipen/scripts/tcr/TCRClustering.R +0 -280
biopipen/utils/common_docstrs.py +0 -61
biopipen/utils/gene.R +0 -49
biopipen/utils/gsea.R +0 -193
biopipen/utils/io.R +0 -20
biopipen/utils/misc.R +0 -114
biopipen/utils/mutate_helpers.R +0 -433
biopipen/utils/plot.R +0 -173
biopipen/utils/rnaseq.R +0 -48
biopipen/utils/single_cell.R +0 -115
biopipen-0.21.0.dist-info/METADATA +0 -22
biopipen-0.21.0.dist-info/RECORD +0 -218

biopipen/scripts/scrna/RadarPlots.R CHANGED Viewed

@@ -1,3 +1,6 @@
+{{ biopipen_dir | joinpaths: "utils", "misc.R" | source_r }}
+{{ biopipen_dir | joinpaths: "utils", "repr.R" | source_r }}
 library(Seurat)
 library(rlang)
 library(dplyr)
@@ -5,28 +8,97 @@ library(tidyr)
 library(tibble)
 library(ggplot2)
 library(ggradar)
+library(ggprism)
+library(glue)
+library(gglogger)
 # input/output
 srtfile = {{in.srtobj | r}}
 outdir = {{out.outdir | r}}
+joboutdir = {{job.outdir | r}}
 # envs
 mutaters = {{envs.mutaters | r}}
 by = {{envs.by | r}}
 each = {{envs.each | r}}
+prefix_each = {{envs.prefix_each | r}}
 order = {{envs.order | r}}
-cluster_col = {{envs.cluster_col | r}}
+colors = {{envs.colors | r}}
+ident = {{envs.ident | r}}
 cluster_order = {{envs.cluster_order | r}}
 breaks = {{envs.breaks | r}}
+breakdown = {{envs.breakdown | r}}
+test = {{envs.test | r}}
 direction = {{envs.direction | r}}
 section = {{envs.section | r}}
+subset_ = {{envs.subset | r}}
+bar_devpars = {{envs.bar_devpars | r}}
 devpars = {{envs.devpars | r}}
 cases = {{envs.cases | r}}
-DEFAULT_CASE = "DEFAULT"
+# DEFAULT_CASE = "DEFAULT"
+# sections = c()
+log_info("- Reading srtobj ...")
+srtobj = biopipen.utils::read_obj(srtfile)
+meta = srtobj@meta.data
+log_info("- Mutating meta data if needed ...")
+if (is.list(mutaters) && length(mutaters) > 0) {
+    mutaters <- lapply(mutaters, function(x) parse_expr(x))
+    meta <- meta %>% mutate(!!!mutaters)
+}
-# Used for saving sections
-sections = list()
+defaults <- list(
+    by = by,
+    each = each,
+    prefix_each = prefix_each,
+    order = order,
+    colors = colors,
+    ident = ident,
+    cluster_order = cluster_order,
+    breaks = breaks,
+    breakdown = breakdown,
+    test = test,
+    direction = direction,
+    section = section,
+    subset = subset_,
+    bar_devpars = bar_devpars,
+    devpars = devpars
+)
+expand_each <- function(name,  case) {
+    outcases <- list()
+    if (is.null(case$each) || nchar(case$each) == 0) {
+        if (is.null(case$section) || case$section == "DEFAULT") {
+            outcases[[name]] <- case
+        } else {
+            outcases[[paste0(case$section, "::", name)]] <- case
+        }
+    } else {
+        if (is.null(case$subset)) {
+            eachs <- meta %>%
+                pull(case$each) %>% unique() %>% na.omit() %>% as.vector()
+        } else {
+            eachs <- meta %>% filter(!!parse_expr(case$subset)) %>%
+                pull(case$each) %>% unique() %>% na.omit() %>% as.vector()
+        }
+        for (each in eachs) {
+            if (isTRUE(case$prefix_each)) {
+                key <- paste0(name, "::", case$each, " - ", each)
+            } else {
+                key <- paste0(name, "::", each)
+            }
+            outcases[[key]] <- case
+            outcases[[key]]$section <- name
+            outcases[[key]]$each_value <- each
+        }
+    }
+    outcases
+}
+log_info("- Expanding cases ...")
+cases <- expand_cases(cases, defaults, expand_each)
 auto_breaks = function(maxval) {
     if (maxval <= 0.1) {  # 10%
@@ -52,24 +124,13 @@ auto_breaks = function(maxval) {
     }
 }
-run_one_case = function(casename) {
-    case = newcases[[casename]]
-    print(paste("- Running for case:", casename))
-    # Save the section
-    if (is.character(case$section) && nchar(case$section) > 0) {
-        sections[[case$section]] <<- c(sections[[case$section]], casename)
-    }
-    # Get the counts
-    counts = if (!is.null(case$each)) meta %>% filter(!!sym(case$each) == case$each_value) else meta
-    counts = counts %>%
-        filter(!is.na(!!sym(case$by))) %>%
-        group_by(!!sym(case$cluster_col), !!sym(case$by)) %>%
+do_radarplot <- function(info, case, counts) {
+    rdr_data = counts %>%
+        group_by(!!sym(case$ident), !!sym(case$by)) %>%
         count() %>%
         pivot_wider(
             id_cols = case$by,
-            names_from = !!sym(case$cluster_col),
+            names_from = !!sym(case$ident),
             values_from = n,
             values_fill = 0
         ) %>%
@@ -81,25 +142,26 @@ run_one_case = function(casename) {
     # Reorder the clusters if needed
     if (!is.null(case$cluster_order) && length(case$cluster_order) > 0) {
-        counts = counts[, case$cluster_order]
+        rdr_data = rdr_data[, case$cluster_order]
     }
     # If clusters are numbers, add a prefix "Cluster"
-    if (all(grepl("^\\d+$", colnames(counts)))) {
-        colnames(counts) = paste0("Cluster", colnames(counts))
+    if (all(grepl("^\\d+$", colnames(rdr_data)))) {
+        colnames(rdr_data) = paste0("Cluster", colnames(rdr_data))
     }
     if (!is.null(case$order) && length(case$order) > 0) {
-        counts = counts[case$order, ]
-        if (nrow(counts) == 0) {
+        rdr_data = rdr_data[case$order, ]
+        if (nrow(rdr_data) == 0) {
             stop("No data after reordering. Are items in `order` correct?")
         }
     }
     # Save the counts
+    counts_file = file.path(info$casedir, "counts.tsv")
     write.table(
-        counts,
-        file.path(outdir, paste0(casename, ".counts.tsv")),
+        t(rdr_data),
+        counts_file,
         sep = "\t",
         quote = FALSE,
         col.names = TRUE,
@@ -107,17 +169,18 @@ run_one_case = function(casename) {
     )
     # Calculate the percentage
-    counts = as.matrix(counts)
+    rdr_data = as.matrix(rdr_data)
     if (case$direction == "inter-cluster") {
-        counts = t(t(counts) / rowSums(t(counts)))
+        rdr_data = t(t(rdr_data) / rowSums(t(rdr_data)))
     } else {
-        counts = counts / rowSums(counts)
+        rdr_data = rdr_data / rowSums(rdr_data)
     }
     # Save the percentages
+    perc_file = file.path(info$casedir, "percentages.tsv")
     write.table(
-        counts,
-        file.path(outdir, paste0(casename, ".percentages.tsv")),
+        t(rdr_data),
+        perc_file,
         sep = "\t",
         quote = FALSE,
         col.names = TRUE,
@@ -126,132 +189,290 @@ run_one_case = function(casename) {
     # Get the breaks
     breaks = if (is.null(case$breaks) || length(case$breaks) == 0) {
-        auto_breaks(max(counts))
+        auto_breaks(max(rdr_data))
     } else {
         case$breaks
     }
     # Plot
+    if (!is.null(case$colors) && length(case$colors) == 1 && case$colors == "biopipen") {
+        colors = pal_biopipen()(nrow(rdr_data))
+    } else if (!is.null(case$colors) && length(case$colors) > 0) {
+        colors = trimws(unlist(strsplit(case$colors, ",")))
+    }
+    plotdf <- rdr_data %>%
+        as.data.frame() %>%
+        rownames_to_column("group") %>%
+        mutate(group = factor(group, levels = rownames(rdr_data)))
     p = ggradar(
-        counts %>% as.data.frame() %>% rownames_to_column("group"),
+        plotdf,
         values.radar = paste0(breaks, "%"),
         grid.min = breaks[1] / 100,
         grid.mid = breaks[2] / 100,
         grid.max = breaks[3] / 100,
-        plot.title = casename
+        group.colours = colors
     )
-    png(
-        file.path(outdir, paste0(casename, ".png")),
-        width = case$devpars$width,
-        height = case$devpars$height,
-        res = case$devpars$res
+    prefix <- file.path(info$casedir, "plot")
+    save_plot(p, prefix, case$devpars)
+    code_file <- paste0(prefix, ".R")
+    code = glue(
+        "library(ggradar)
+        plotdf <- {repr(plotdf)}
+        breaks <- {repr(breaks)}
+        colors <- {repr(colors)}
+        ggradar(
+            plotdf,
+            values.radar = paste0(breaks, '%'),
+            grid.min = breaks[1] / 100,
+            grid.mid = breaks[2] / 100,
+            grid.max = breaks[3] / 100,
+            group.colours = colors
+        )"
     )
-    print(p)
-    dev.off()
+    writeLines(code, code_file)
 }
-# fill up the cases
-if (length(cases) == 0) {
-    cases[[DEFAULT_CASE]] = list(
-        by = by,
-        each = each,
-        order = order,
-        cluster_col = cluster_col,
-        cluster_order = cluster_order,
-        breaks = breaks,
-        direction = direction,
-        section = section,
-        devpars = devpars
+do_barplot_and_tests <- function(info, case, counts) {
+    bardata <- counts %>%
+        group_by(!!sym(case$by), !!sym(case$breakdown), !!sym(case$ident)) %>%
+        summarise(.n = n(), .groups = "drop")
+    write.table(
+        bardata,
+        file.path(info$casedir, "breakdown-counts.txt"),
+        sep = "\t",
+        quote = FALSE,
+        col.names = TRUE,
+        row.names = FALSE
     )
-} else {
-    # Use the values given directly under `envs` as default
-    for (key in names(cases)) {
-        if (is.null(cases[[key]]$by)) {
-            cases[[key]]$by = by
-        }
-        if (is.null(cases[[key]]$each)) {
-            cases[[key]]$each = each
-        }
-        if (is.null(cases[[key]]$order)) {
-            cases[[key]]$order = order
-        }
-        if (is.null(cases[[key]]$cluster_col)) {
-            cases[[key]]$cluster_col = cluster_col
-        }
-        if (is.null(cases[[key]]$cluster_order)) {
-            cases[[key]]$cluster_order = cluster_order
-        }
-        if (is.null(cases[[key]]$breaks)) {
-            cases[[key]]$breaks = breaks
-        }
-        if (is.null(cases[[key]]$direction)) {
-            cases[[key]]$direction = direction
-        }
-        if (is.null(cases[[key]]$section)) {
-            cases[[key]]$section = section
-        }
-        if (is.null(cases[[key]]$devpars)) {
-            cases[[key]]$devpars = devpars
-        }
-        if (is.null(cases[[key]]$devpars$width)) {
-            cases[[key]]$devpars$width = devpars$width
-        }
-        if (is.null(cases[[key]]$devpars$height)) {
-            cases[[key]]$devpars$height = devpars$height
-        }
-        if (is.null(cases[[key]]$devpars$res)) {
-            cases[[key]]$devpars$res = devpars$res
-        }
+    if (case$direction == "inter-cluster") {
+        bardata <- bardata %>%
+            group_by(!!sym(case$ident)) %>%
+            mutate(.frac = .n / sum(.n)) %>%
+            ungroup()
+    } else {
+        bardata <- bardata %>%
+            group_by(!!sym(case$by), !!sym(case$breakdown)) %>%
+            mutate(.frac = .n / sum(.n)) %>%
+            ungroup()
     }
-}
-print("- Reading srtobj ...")
-srtobj = readRDS(srtfile)
-meta = srtobj@meta.data
+    # Save the percentages
+    write.table(
+        bardata,
+        file.path(info$casedir, "breakdown-percentages.txt"),
+        sep = "\t",
+        quote = FALSE,
+        col.names = TRUE,
+        row.names = FALSE
+    )
-print("- Mutating meta data if needed ...")
-if (is.list(mutaters) && length(mutaters) > 0) {
-    mutaters = lapply(mutaters, function(x) parse_expr(x))
-    meta = meta %>% mutate(!!!mutaters)
+    # Reorder the clusters if needed
+    if (!is.null(case$cluster_order) && length(case$cluster_order) > 0) {
+        bardata <- bardata %>%
+            mutate(!!sym(case$ident) := factor(!!sym(case$ident), levels = case$cluster_order))
+    }
+    # Calculate the mean, mean-sd, mean+sd
+    plotdata <- bardata %>%
+        group_by(!!sym(case$by), !!sym(case$ident)) %>%
+        summarise(.mean = mean(.frac), .sd = sd(.frac), .groups = "drop") %>%
+        rowwise() %>%
+        mutate(mean_sd1 = max(.mean - .sd, 0), mean_sd2 = .mean + .sd)
+    if (!is.null(case$colors) && length(case$colors) == 1 && case$colors == "biopipen") {
+        colors <- pal_biopipen(.8)(length(unique(plotdata[[case$by]])))
+    } else if (!is.null(case$colors) && length(case$colors) > 0) {
+        colors <- trimws(unlist(strsplit(case$colors, ",")))
+    }
+    # Plot the barplot
+    p = ggplot(plotdata, aes(x = !!sym(case$ident), y = .mean, fill = !!sym(case$by))) +
+        geom_bar(stat = "identity", position = "dodge", color = "#333333") +
+        geom_errorbar(
+            aes(ymin = mean_sd1, ymax = mean_sd2),
+            width = 0.2,
+            alpha = 0.5,
+            linewidth = 0.6,
+            position = position_dodge(0.9),
+            color = "#333333"
+        ) +
+        theme_prism(axis_text_angle = 45) +
+        ylab("Fraction of cells") +
+        scale_fill_manual(values = colors)
+    prefix = file.path(info$casedir, "barplot")
+    save_plot(p, prefix, case$bar_devpars)
+    neat_case <- list(by = case$by, ident = case$ident)
+    save_plotcode(
+        p,
+        setup = c(
+            'library(rlang)',
+            'library(ggplot2)',
+            'library(ggprism)',
+            '',
+            'load("data.RData")',
+            'case <- neat_case'
+        ),
+        prefix,
+        "plotdata", "neat_case", "colors")
+    # Do the tests in each cluster between groups on .frac
+    bys <- bardata %>% pull(!!sym(case$by)) %>% unique()
+    if (!is.null(case$test) && test != "none") {
+        if (length(bys) < 2) {
+            stop("  Cannot do tests with only one group.")
+        }
+        pairs <- combn(bys, 2, simplify = FALSE)
+        test_results <- NULL
+        for (pair in pairs) {
+            dat <- bardata %>%
+                filter(!!sym(case$by) %in% pair) %>%
+                select(!!sym(case$by), !!sym(case$ident), .frac) %>%
+                group_by(!!sym(case$ident)) %>%
+                summarise(
+                    comparison = paste0(pair, collapse = " - "),
+                    n = paste(as.list(table(!!sym(case$by)))[pair], collapse = "; "),
+                    mean = paste(
+                        (tibble(.frac, !!sym(case$by)) %>%
+                            group_by(!!sym(case$by)) %>%
+                            summarise(mean = mean(.frac)) %>%
+                            column_to_rownames(case$by) %>%
+                            t() %>%
+                            as.data.frame() %>%
+                            as.list())[pair] %>% unlist() %>% round(3),
+                        collapse = "; "
+                    ),
+                    !!sym(paste0(case$test, "_pval")) := ifelse(
+                        case$test == "wilcox",
+                        tryCatch(wilcox.test(.frac ~ !!sym(case$by))$p.value, error = function(e) NA),
+                        tryCatch(t.test(.frac ~ !!sym(case$by))$p.value, error = function(e) NA)
+                    )
+                )
+            test_results <- rbind(test_results, dat)
+        }
+        write.table(
+            test_results,
+            file.path(info$casedir, "tests.txt"),
+            sep = "\t",
+            quote = FALSE,
+            col.names = TRUE,
+            row.names = FALSE
+        )
+    }
 }
-# Expand the cases
-newcases = list()
-for (key in names(cases)) {
-    if (is.null(cases[[key]]$each)) {
-        newcases[[key]] = cases[[key]]
-    } else {
-        each_values = meta %>% pull(!!sym(cases[[key]]$each)) %>% unique() %>% na.omit()
-        for (evalue in each_values) {
-            ekey = if (key == DEFAULT_CASE) evalue else paste0(key, "_", evalue)
-            newcases[[ekey]] = cases[[key]]
-            newcases[[ekey]]$each_value = evalue
-            if (!is.null(cases[[key]]$section)) {
-                warn(
-                    sprintf("Case %s: `section` is ignored when `each` is specified.", key),
-                    immediate. = TRUE
+add_case_report = function(info, breakdown, test) {
+    report = list(
+        list(
+            name = "Radar Plot",
+            contents = list(
+                list(
+                    kind = "image",
+                    src = file.path(info$casedir, "plot.png"),
+                    download = list(
+                        file.path(info$casedir, "plot.pdf"),
+                        list(
+                            src = file.path(info$casedir, "plot.R"),
+                            tip = "Download the code used to reproduce the plot",
+                            icon = "Code"))
                 )
-            }
-            newcases[[ekey]]$section = key
+            )
+        ),
+        list(
+            name = "Count Table",
+            contents = list(
+                list(
+                    kind = "table",
+                    data = list(index_col = 0),
+                    src = file.path(info$casedir, "counts.tsv")
+                )
+            )
+        ),
+        list(
+            name = "Percentage Table",
+            contents = list(
+                list(
+                    kind = "table",
+                    data = list(index_col = 0),
+                    src = file.path(info$casedir, "percentages.tsv")
+                )
+            )
+        )
+    )
+    if (!is.null(breakdown)) {
+        report = c(
+            report,
+            list(list(
+                name = "Barplot",
+                contents = list(
+                    list(
+                        kind = "image",
+                        src = file.path(info$casedir, "barplot.png"),
+                        download = list(
+                            file.path(info$casedir, "barplot.pdf"),
+                            list(
+                                src = file.path(info$casedir, "barplot.code.zip"),
+                                tip = "Download the code used to reproduce the plot",
+                                icon = "Code"
+                            )
+                        )
+                    )
+                )
+            ))
+        )
+        if (!is.null(test) && test != "none") {
+            report = c(
+                report,
+                list(list(
+                    name = "Tests",
+                    contents = list(
+                        list(
+                            kind = "table",
+                            src = file.path(info$casedir, "tests.txt")
+                        )
+                    )
+                ))
+            )
         }
     }
+    report$h1 = info$h1
+    report$h2 = info$h2
+    report$ui = "tabs"
+    do_call(add_report, report)
 }
-casenames = names(newcases)
-sapply(casenames, run_one_case)
-print("- Saving sections if any ...")
-if (length(sections) > 0) {
-    # Write as TOML
-    #  section1 = ["case1", "case2"]
-    #  section2 = ["case3", "case4"]
-    #  ...
-    outstr = c()
-    for (sec in names(sections)) {
-        sec_str = paste0(sec, " = ")
-        sec_str = paste0(sec_str, "['", paste(sections[[sec]], collapse = "', '"), "']")
-        outstr = c(outstr, sec_str)
+run_one_case <- function(casename) {
+    info <- casename_info(casename, cases, outdir, create = TRUE)
+    case <- cases[[casename]]
+    log_info("- Running for case: {casename}")
+    if (!is.null(case$subset)) {
+        m <- meta %>% dplyr::filter(!!rlang::parse_expr(case$subset))
+    } else {
+        m <- meta
+    }
+    # Get the counts
+    if (!is.null(case$each)) {
+        counts <- m %>% dplyr::filter(!!sym(case$each) == case$each_value)
+    } else {
+        counts <- m
+    }
+    counts <- counts %>% drop_na(!!sym(case$by)) %>% drop_na(!!sym(case$ident))
+    do_radarplot(info, case, counts)
+    if (!is.null(case$breakdown)) {
+        do_barplot_and_tests(info, case, counts)
     }
-    section_file = file.path(outdir, "sections.toml")
-    writeLines(outstr, section_file)
-}
+    add_case_report(info, case$breakdown, case$test)
+}
+sapply(sort(names(cases)), run_one_case)
+save_report(joboutdir)

biopipen 0.21.0__py3-none-any.whl → 0.34.26__py3-none-any.whl

biopipen 0.21.0__py3-none-any.whl → 0.34.26__py3-none-any.whl