PyPI - biopipen - Versions diffs - 0.21.0__py3-none-any.whl → 0.34.26__py3-none-any.whl - Mend

biopipen 0.21.0__py3-none-any.whl → 0.34.26__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (290)

biopipen/__init__.py +1 -1
biopipen/core/config.toml +28 -0
biopipen/core/filters.py +79 -4
biopipen/core/proc.py +12 -3
biopipen/core/testing.py +75 -3
biopipen/ns/bam.py +148 -6
biopipen/ns/bed.py +75 -0
biopipen/ns/cellranger.py +186 -0
biopipen/ns/cellranger_pipeline.py +126 -0
biopipen/ns/cnv.py +19 -3
biopipen/ns/cnvkit.py +1 -1
biopipen/ns/cnvkit_pipeline.py +20 -12
biopipen/ns/delim.py +34 -35
biopipen/ns/gene.py +68 -23
biopipen/ns/gsea.py +63 -37
biopipen/ns/misc.py +39 -14
biopipen/ns/plot.py +304 -1
biopipen/ns/protein.py +183 -0
biopipen/ns/regulatory.py +290 -0
biopipen/ns/rnaseq.py +142 -5
biopipen/ns/scrna.py +2053 -473
biopipen/ns/scrna_metabolic_landscape.py +228 -382
biopipen/ns/snp.py +659 -0
biopipen/ns/stats.py +484 -0
biopipen/ns/tcr.py +683 -98
biopipen/ns/vcf.py +236 -2
biopipen/ns/web.py +97 -6
biopipen/reports/bam/CNVpytor.svelte +4 -9
biopipen/reports/cellranger/CellRangerCount.svelte +18 -0
biopipen/reports/cellranger/CellRangerSummary.svelte +16 -0
biopipen/reports/cellranger/CellRangerVdj.svelte +18 -0
biopipen/reports/cnvkit/CNVkitDiagram.svelte +1 -1
biopipen/reports/cnvkit/CNVkitHeatmap.svelte +1 -1
biopipen/reports/cnvkit/CNVkitScatter.svelte +1 -1
biopipen/reports/common.svelte +15 -0
biopipen/reports/protein/ProdigySummary.svelte +16 -0
biopipen/reports/scrna/CellsDistribution.svelte +4 -39
biopipen/reports/scrna/DimPlots.svelte +1 -1
biopipen/reports/scrna/MarkersFinder.svelte +6 -126
biopipen/reports/scrna/MetaMarkers.svelte +3 -75
biopipen/reports/scrna/RadarPlots.svelte +4 -20
biopipen/reports/scrna_metabolic_landscape/MetabolicFeatures.svelte +61 -22
biopipen/reports/scrna_metabolic_landscape/MetabolicPathwayActivity.svelte +88 -82
biopipen/reports/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.svelte +70 -10
biopipen/reports/snp/PlinkCallRate.svelte +24 -0
biopipen/reports/snp/PlinkFreq.svelte +18 -0
biopipen/reports/snp/PlinkHWE.svelte +18 -0
biopipen/reports/snp/PlinkHet.svelte +18 -0
biopipen/reports/snp/PlinkIBD.svelte +18 -0
biopipen/reports/tcr/CDR3AAPhyschem.svelte +19 -66
biopipen/reports/tcr/ClonalStats.svelte +16 -0
biopipen/reports/tcr/CloneResidency.svelte +3 -93
biopipen/reports/tcr/Immunarch.svelte +4 -155
biopipen/reports/tcr/TCRClusterStats.svelte +3 -45
biopipen/reports/tcr/TESSA.svelte +11 -28
biopipen/reports/utils/misc.liq +22 -7
biopipen/scripts/bam/BamMerge.py +11 -15
biopipen/scripts/bam/BamSampling.py +90 -0
biopipen/scripts/bam/BamSort.py +141 -0
biopipen/scripts/bam/BamSplitChroms.py +10 -10
biopipen/scripts/bam/BamSubsetByBed.py +38 -0
biopipen/scripts/bam/CNAClinic.R +41 -5
biopipen/scripts/bam/CNVpytor.py +153 -54
biopipen/scripts/bam/ControlFREEC.py +13 -14
biopipen/scripts/bam/SamtoolsView.py +33 -0
biopipen/scripts/bed/Bed2Vcf.py +5 -5
biopipen/scripts/bed/BedConsensus.py +5 -5
biopipen/scripts/bed/BedLiftOver.sh +6 -4
biopipen/scripts/bed/BedtoolsIntersect.py +54 -0
biopipen/scripts/bed/BedtoolsMakeWindows.py +47 -0
biopipen/scripts/bed/BedtoolsMerge.py +4 -4
biopipen/scripts/cellranger/CellRangerCount.py +138 -0
biopipen/scripts/cellranger/CellRangerSummary.R +181 -0
biopipen/scripts/cellranger/CellRangerVdj.py +112 -0
biopipen/scripts/cnv/AneuploidyScore.R +55 -20
biopipen/scripts/cnv/AneuploidyScoreSummary.R +221 -163
biopipen/scripts/cnv/TMADScore.R +25 -9
biopipen/scripts/cnv/TMADScoreSummary.R +57 -86
biopipen/scripts/cnvkit/CNVkitAccess.py +7 -6
biopipen/scripts/cnvkit/CNVkitAutobin.py +26 -18
biopipen/scripts/cnvkit/CNVkitBatch.py +6 -6
biopipen/scripts/cnvkit/CNVkitCall.py +3 -3
biopipen/scripts/cnvkit/CNVkitCoverage.py +4 -3
biopipen/scripts/cnvkit/CNVkitDiagram.py +5 -5
biopipen/scripts/cnvkit/CNVkitFix.py +3 -3
biopipen/scripts/cnvkit/CNVkitGuessBaits.py +12 -8
biopipen/scripts/cnvkit/CNVkitHeatmap.py +5 -5
biopipen/scripts/cnvkit/CNVkitReference.py +6 -5
biopipen/scripts/cnvkit/CNVkitScatter.py +5 -5
biopipen/scripts/cnvkit/CNVkitSegment.py +5 -5
biopipen/scripts/cnvkit/guess_baits.py +166 -93
biopipen/scripts/delim/RowsBinder.R +1 -1
biopipen/scripts/delim/SampleInfo.R +116 -118
biopipen/scripts/gene/GeneNameConversion.R +67 -0
biopipen/scripts/gene/GenePromoters.R +61 -0
biopipen/scripts/gsea/Enrichr.R +5 -5
biopipen/scripts/gsea/FGSEA.R +184 -50
biopipen/scripts/gsea/GSEA.R +2 -2
biopipen/scripts/gsea/PreRank.R +5 -5
biopipen/scripts/misc/Config2File.py +2 -2
biopipen/scripts/misc/Plot.R +80 -0
biopipen/scripts/misc/Shell.sh +15 -0
biopipen/scripts/misc/Str2File.py +2 -2
biopipen/scripts/plot/Heatmap.R +3 -3
biopipen/scripts/plot/Manhattan.R +147 -0
biopipen/scripts/plot/QQPlot.R +146 -0
biopipen/scripts/plot/ROC.R +88 -0
biopipen/scripts/plot/Scatter.R +112 -0
biopipen/scripts/plot/VennDiagram.R +5 -9
biopipen/scripts/protein/MMCIF2PDB.py +33 -0
biopipen/scripts/protein/PDB2Fasta.py +60 -0
biopipen/scripts/protein/Prodigy.py +119 -0
biopipen/scripts/protein/ProdigySummary.R +140 -0
biopipen/scripts/protein/RMSD.py +178 -0
biopipen/scripts/regulatory/MotifAffinityTest.R +102 -0
biopipen/scripts/regulatory/MotifAffinityTest_AtSNP.R +127 -0
biopipen/scripts/regulatory/MotifAffinityTest_MotifBreakR.R +104 -0
biopipen/scripts/regulatory/MotifScan.py +159 -0
biopipen/scripts/regulatory/VariantMotifPlot.R +78 -0
biopipen/scripts/regulatory/motifs-common.R +324 -0
biopipen/scripts/rnaseq/Simulation-ESCO.R +180 -0
biopipen/scripts/rnaseq/Simulation-RUVcorr.R +45 -0
biopipen/scripts/rnaseq/Simulation.R +21 -0
biopipen/scripts/rnaseq/UnitConversion.R +325 -54
biopipen/scripts/scrna/AnnData2Seurat.R +40 -0
biopipen/scripts/scrna/CCPlotR-patch.R +161 -0
biopipen/scripts/scrna/CellCellCommunication.py +150 -0
biopipen/scripts/scrna/CellCellCommunicationPlots.R +93 -0
biopipen/scripts/scrna/CellSNPLite.py +30 -0
biopipen/scripts/scrna/CellTypeAnnotation-celltypist.R +185 -0
biopipen/scripts/scrna/CellTypeAnnotation-direct.R +68 -31
biopipen/scripts/scrna/CellTypeAnnotation-hitype.R +27 -22
biopipen/scripts/scrna/CellTypeAnnotation-sccatch.R +28 -20
biopipen/scripts/scrna/CellTypeAnnotation-sctype.R +48 -25
biopipen/scripts/scrna/CellTypeAnnotation.R +37 -1
biopipen/scripts/scrna/CellsDistribution.R +456 -167
biopipen/scripts/scrna/DimPlots.R +1 -1
biopipen/scripts/scrna/ExprImputation-alra.R +109 -0
biopipen/scripts/scrna/ExprImputation-rmagic.R +256 -0
biopipen/scripts/scrna/{ExprImpution-scimpute.R → ExprImputation-scimpute.R} +8 -5
biopipen/scripts/scrna/ExprImputation.R +7 -0
biopipen/scripts/scrna/LoomTo10X.R +51 -0
biopipen/scripts/scrna/MQuad.py +25 -0
biopipen/scripts/scrna/MarkersFinder.R +679 -400
biopipen/scripts/scrna/MetaMarkers.R +265 -161
biopipen/scripts/scrna/ModuleScoreCalculator.R +66 -11
biopipen/scripts/scrna/PseudoBulkDEG.R +678 -0
biopipen/scripts/scrna/RadarPlots.R +355 -134
biopipen/scripts/scrna/ScFGSEA.R +298 -100
biopipen/scripts/scrna/ScSimulation.R +65 -0
biopipen/scripts/scrna/ScVelo.py +617 -0
biopipen/scripts/scrna/Seurat2AnnData.R +7 -0
biopipen/scripts/scrna/SeuratClusterStats-clustree.R +87 -0
biopipen/scripts/scrna/SeuratClusterStats-dimplots.R +36 -30
biopipen/scripts/scrna/SeuratClusterStats-features.R +138 -187
biopipen/scripts/scrna/SeuratClusterStats-ngenes.R +81 -0
biopipen/scripts/scrna/SeuratClusterStats-stats.R +78 -89
biopipen/scripts/scrna/SeuratClusterStats.R +47 -10
biopipen/scripts/scrna/SeuratClustering.R +36 -233
biopipen/scripts/scrna/SeuratLoading.R +2 -2
biopipen/scripts/scrna/SeuratMap2Ref.R +84 -113
biopipen/scripts/scrna/SeuratMetadataMutater.R +16 -6
biopipen/scripts/scrna/SeuratPreparing.R +223 -173
biopipen/scripts/scrna/SeuratSubClustering.R +64 -0
biopipen/scripts/scrna/SeuratTo10X.R +27 -0
biopipen/scripts/scrna/Slingshot.R +65 -0
biopipen/scripts/scrna/Subset10X.R +2 -2
biopipen/scripts/scrna/TopExpressingGenes.R +169 -135
biopipen/scripts/scrna/celltypist-wrapper.py +195 -0
biopipen/scripts/scrna/scvelo_paga.py +313 -0
biopipen/scripts/scrna/seurat_anndata_conversion.py +98 -0
biopipen/scripts/scrna_metabolic_landscape/MetabolicFeatures.R +447 -82
biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayActivity.R +348 -241
biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.R +188 -166
biopipen/scripts/snp/MatrixEQTL.R +217 -0
biopipen/scripts/snp/Plink2GTMat.py +148 -0
biopipen/scripts/snp/PlinkCallRate.R +199 -0
biopipen/scripts/snp/PlinkFilter.py +100 -0
biopipen/scripts/snp/PlinkFreq.R +291 -0
biopipen/scripts/snp/PlinkFromVcf.py +81 -0
biopipen/scripts/snp/PlinkHWE.R +85 -0
biopipen/scripts/snp/PlinkHet.R +96 -0
biopipen/scripts/snp/PlinkIBD.R +196 -0
biopipen/scripts/snp/PlinkSimulation.py +124 -0
biopipen/scripts/snp/PlinkUpdateName.py +124 -0
biopipen/scripts/stats/ChowTest.R +146 -0
biopipen/scripts/stats/DiffCoexpr.R +152 -0
biopipen/scripts/stats/LiquidAssoc.R +135 -0
biopipen/scripts/stats/Mediation.R +108 -0
biopipen/scripts/stats/MetaPvalue.R +130 -0
biopipen/scripts/stats/MetaPvalue1.R +74 -0
biopipen/scripts/tcgamaf/Maf2Vcf.py +2 -2
biopipen/scripts/tcgamaf/MafAddChr.py +2 -2
biopipen/scripts/tcr/Attach2Seurat.R +3 -2
biopipen/scripts/tcr/CDR3AAPhyschem.R +211 -143
biopipen/scripts/tcr/CDR3Clustering.R +343 -0
biopipen/scripts/tcr/ClonalStats.R +526 -0
biopipen/scripts/tcr/CloneResidency.R +255 -131
biopipen/scripts/tcr/CloneSizeQQPlot.R +4 -4
biopipen/scripts/tcr/GIANA/GIANA.py +1356 -797
biopipen/scripts/tcr/GIANA/GIANA4.py +1362 -789
biopipen/scripts/tcr/GIANA/query.py +164 -162
biopipen/scripts/tcr/Immunarch-basic.R +31 -9
biopipen/scripts/tcr/Immunarch-clonality.R +25 -5
biopipen/scripts/tcr/Immunarch-diversity.R +352 -134
biopipen/scripts/tcr/Immunarch-geneusage.R +45 -5
biopipen/scripts/tcr/Immunarch-kmer.R +68 -8
biopipen/scripts/tcr/Immunarch-overlap.R +84 -4
biopipen/scripts/tcr/Immunarch-spectratyping.R +35 -6
biopipen/scripts/tcr/Immunarch-tracking.R +38 -6
biopipen/scripts/tcr/Immunarch-vjjunc.R +165 -0
biopipen/scripts/tcr/Immunarch.R +63 -11
biopipen/scripts/tcr/Immunarch2VDJtools.R +2 -2
biopipen/scripts/tcr/ImmunarchFilter.R +4 -4
biopipen/scripts/tcr/ImmunarchLoading.R +38 -29
biopipen/scripts/tcr/SampleDiversity.R +1 -1
biopipen/scripts/tcr/ScRepCombiningExpression.R +40 -0
biopipen/scripts/tcr/ScRepLoading.R +166 -0
biopipen/scripts/tcr/TCRClusterStats.R +176 -22
biopipen/scripts/tcr/TCRDock.py +110 -0
biopipen/scripts/tcr/TESSA.R +102 -118
biopipen/scripts/tcr/VJUsage.R +5 -5
biopipen/scripts/tcr/immunarch-patched.R +142 -0
biopipen/scripts/tcr/vdjtools-patch.sh +1 -1
biopipen/scripts/vcf/BcftoolsAnnotate.py +91 -0
biopipen/scripts/vcf/BcftoolsFilter.py +90 -0
biopipen/scripts/vcf/BcftoolsMerge.py +31 -0
biopipen/scripts/vcf/BcftoolsSort.py +113 -0
biopipen/scripts/vcf/BcftoolsView.py +73 -0
biopipen/scripts/vcf/TruvariBench.sh +14 -7
biopipen/scripts/vcf/TruvariBenchSummary.R +16 -13
biopipen/scripts/vcf/TruvariConsistency.R +1 -1
biopipen/scripts/vcf/Vcf2Bed.py +2 -2
biopipen/scripts/vcf/VcfAnno.py +11 -11
biopipen/scripts/vcf/VcfDownSample.sh +22 -10
biopipen/scripts/vcf/VcfFilter.py +5 -5
biopipen/scripts/vcf/VcfFix.py +7 -7
biopipen/scripts/vcf/VcfFix_utils.py +13 -4
biopipen/scripts/vcf/VcfIndex.py +3 -3
biopipen/scripts/vcf/VcfIntersect.py +3 -3
biopipen/scripts/vcf/VcfLiftOver.sh +5 -0
biopipen/scripts/vcf/VcfSplitSamples.py +4 -4
biopipen/scripts/vcf/bcftools_utils.py +52 -0
biopipen/scripts/web/Download.py +8 -4
biopipen/scripts/web/DownloadList.py +5 -5
biopipen/scripts/web/GCloudStorageDownloadBucket.py +82 -0
biopipen/scripts/web/GCloudStorageDownloadFile.py +23 -0
biopipen/scripts/web/gcloud_common.py +49 -0
biopipen/utils/gene.py +108 -60
biopipen/utils/misc.py +146 -20
biopipen/utils/reference.py +64 -20
biopipen/utils/reporter.py +177 -0
biopipen/utils/vcf.py +1 -1
biopipen-0.34.26.dist-info/METADATA +27 -0
biopipen-0.34.26.dist-info/RECORD +292 -0
{biopipen-0.21.0.dist-info → biopipen-0.34.26.dist-info}/WHEEL +1 -1
{biopipen-0.21.0.dist-info → biopipen-0.34.26.dist-info}/entry_points.txt +6 -2
biopipen/ns/bcftools.py +0 -111
biopipen/ns/scrna_basic.py +0 -255
biopipen/reports/delim/SampleInfo.svelte +0 -36
biopipen/reports/scrna/GeneExpressionInvistigation.svelte +0 -32
biopipen/reports/scrna/ScFGSEA.svelte +0 -35
biopipen/reports/scrna/SeuratClusterStats.svelte +0 -82
biopipen/reports/scrna/SeuratMap2Ref.svelte +0 -20
biopipen/reports/scrna/SeuratPreparing.svelte +0 -38
biopipen/reports/scrna/TopExpressingGenes.svelte +0 -55
biopipen/reports/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.svelte +0 -31
biopipen/reports/utils/gsea.liq +0 -110
biopipen/scripts/bcftools/BcftoolsAnnotate.py +0 -42
biopipen/scripts/bcftools/BcftoolsFilter.py +0 -79
biopipen/scripts/bcftools/BcftoolsSort.py +0 -19
biopipen/scripts/gene/GeneNameConversion.py +0 -66
biopipen/scripts/scrna/ExprImpution-alra.R +0 -32
biopipen/scripts/scrna/ExprImpution-rmagic.R +0 -29
biopipen/scripts/scrna/ExprImpution.R +0 -7
biopipen/scripts/scrna/GeneExpressionInvistigation.R +0 -132
biopipen/scripts/scrna/Write10X.R +0 -11
biopipen/scripts/scrna_metabolic_landscape/MetabolicFeaturesIntraSubset.R +0 -150
biopipen/scripts/tcr/TCRClustering.R +0 -280
biopipen/utils/common_docstrs.py +0 -61
biopipen/utils/gene.R +0 -49
biopipen/utils/gsea.R +0 -193
biopipen/utils/io.R +0 -20
biopipen/utils/misc.R +0 -114
biopipen/utils/mutate_helpers.R +0 -433
biopipen/utils/plot.R +0 -173
biopipen/utils/rnaseq.R +0 -48
biopipen/utils/single_cell.R +0 -115
biopipen-0.21.0.dist-info/METADATA +0 -22
biopipen-0.21.0.dist-info/RECORD +0 -218

{biopipen-0.21.0.dist-info → biopipen-0.34.26.dist-info}/WHEEL RENAMED Viewed

@@ -1,4 +1,4 @@
 Wheel-Version: 1.0
-Generator: poetry-core 1.8.1
+Generator: poetry-core 2.2.1
 Root-Is-Purelib: true
 Tag: py3-none-any

{biopipen-0.21.0.dist-info → biopipen-0.34.26.dist-info}/entry_points.txt RENAMED Viewed

@@ -1,7 +1,8 @@
 [pipen_cli_run]
 bam=biopipen.ns.bam
-bcftools=biopipen.ns.bcftools
 bed=biopipen.ns.bed
+cellranger=biopipen.ns.cellranger
+cellranger_pipeline=biopipen.ns.cellranger_pipeline
 cnv=biopipen.ns.cnv
 cnvkit=biopipen.ns.cnvkit
 cnvkit_pipeline=biopipen.ns.cnvkit_pipeline
@@ -10,10 +11,13 @@ gene=biopipen.ns.gene
 gsea=biopipen.ns.gsea
 misc=biopipen.ns.misc
 plot=biopipen.ns.plot
+protein=biopipen.ns.protein
+regulatory=biopipen.ns.regulatory
 rnaseq=biopipen.ns.rnaseq
 scrna=biopipen.ns.scrna
-scrna_basic=biopipen.ns.scrna_basic
 scrna_metabolic_landscape=biopipen.ns.scrna_metabolic_landscape
+snp=biopipen.ns.snp
+stats=biopipen.ns.stats
 tcgamaf=biopipen.ns.tcgamaf
 tcr=biopipen.ns.tcr
 vcf=biopipen.ns.vcf

biopipen/ns/bcftools.py DELETED Viewed

@@ -1,111 +0,0 @@
-"""handling VCF files using bcftools"""
-from ..core.proc import Proc
-from ..core.config import config
-class BcftoolsAnnotate(Proc):
-    """Add or remove annotations from VCF files
-    Input:
-        infile: The input VCF file
-        annfile: The annotation file
-    Output:
-        outfile: The annotated VCF file
-    Envs:
-        bcftools: Path to bcftools
-        tabix: Path to tabix, used to index infile and annfile
-        annfile: The annotation file. If `in.annfile` is provided,
-            this is ignored
-        ncores: Number of cores (`--nthread`) to use
-        cols: Overwrite `-c/--columns`
-        header: Headers to be added
-        args: Other arguments for `bcftools annotate`
-    """
-    input = "infile:file, annfile:file"
-    output = "outfile:file:{{in.infile | basename}}"
-    lang = config.lang.python
-    envs = {
-        "bcftools": config.exe.bcftools,
-        "tabix": config.exe.tabix,
-        "annfile": "",
-        "cols": [],
-        "header": [],
-        "args": {},
-        "ncores": config.misc.ncores,
-    }
-    script = "file://../scripts/bcftools/BcftoolsAnnotate.py"
-class BcftoolsFilter(Proc):
-    """Apply fixed threshold filters to VCF files
-    Input:
-        infile: The input VCF file
-    Output:
-        outfile: The filtered VCF file. If the `in.infile` is gzipped, this is
-            gzipped as well.
-    Envs:
-        bcftools: Path to bcftools
-        ncores: Number of cores (`--nthread`) to use
-        keep: Whether we should keep the filtered variants or not.
-        args: Other arguments for `bcftools annotate`
-        ncores: `nthread`
-        tmpdir: Path to save the intermediate files
-            Since the filters need to be applied one by one by bcftools
-        includes: and
-        excludes: include/exclude only sites for which EXPRESSION is true.
-            See: https://samtools.github.io/bcftools/bcftools.html#expressions
-            If provided, `envs.args.include/exclude` will be ignored.
-            If `str`/`list` used, The filter names will be `Filter%d`
-            A dict is used when keys are filter names and values are expressions
-    """
-    input = "infile:file"
-    output = "outfile:file:{{in.infile | basename}}"
-    lang = config.lang.python
-    envs = {
-        "bcftools": config.exe.bcftools,
-        "keep": True,
-        "ncores": config.misc.ncores,
-        "includes": None,
-        "excludes": None,
-        "tmpdir": config.path.tmpdir,
-        "args": {},
-    }
-    script = "file://../scripts/bcftools/BcftoolsFilter.py"
-class BcftoolsSort(Proc):
-    """Sort VCF files
-    Input:
-        infile: The input VCF file
-    Output:
-        outfile: The sorted VCF file.
-    Envs:
-        bcftools: Path to bcftools
-        gz: Whether to gzip the output file
-        index: Whether to index the output file (tbi) (`envs.gz` forced to True)
-        tmpdir: Path to save the intermediate files
-        args: Other arguments for `bcftools sort`. For example `max-mem`.
-            See also https://samtools.github.io/bcftools/bcftools.html#sort
-    """
-    input = "infile:file"
-    output = (
-        "outfile:file:{{in.infile | stem0}}.vcf"
-        "{% if envs.gz or envs.index %}.gz{% endif %}"
-    )
-    lang = config.lang.python
-    envs = {
-        "bcftools": config.exe.bcftools,
-        "gz": True,
-        "index": True,
-        "tmpdir": config.path.tmpdir,
-        "args": {},
-    }
-    script = "file://../scripts/bcftools/BcftoolsSort.py"

biopipen/ns/scrna_basic.py DELETED Viewed

@@ -1,255 +0,0 @@
-"""Basic analysis for single cell RNA-seq data
-- QC
-- Clustering
-- Marker genes
-- Enrichment analysis
-"""
-from __future__ import annotations
-from pathlib import Path
-from typing import Type
-from pipen.utils import mark, is_loading_pipeline
-from pipen_annotate import annotate
-from pipen_args import ProcGroup
-from ..core.proc import Proc
-class ScrnaBasic(ProcGroup):
-    """Basic analysis for single cell RNA-seq data
-    Including QC, clustering, marker genes, and enrichment analysis.
-    See also the docs for details
-    <https://pwwang.github.io/biopipen/pipelines/scrna_basic/>
-    Args:
-        infile: The input file. Either a tab-delimited file containing
-            the information of metadata and paths to results of cellranger
-            or a seurat object has been saved as RDS file (with extension
-            `.rds` or `.RDS`), which QC is assumed to be done.
-            As for the tab-delimited file, it should have two columns:
-            `Sample` and `RNAData`. `Sample` should be the first column with
-            unique identifiers for the samples and `RNAData` indicates where the
-            barcodes, genes, expression matrices are.
-        is_seurat (flag): Whether the input file is a seurat object
-            in RDS format.
-            If this process group runs independently, this argument should
-            not be set. It will be recognized automatically by the extension
-            of `infile`. However, if this process group is run as a part of
-            a pipeline, this argument should be set manually since `infile`
-            should not be set in this case. It will be passed by other processes
-        clustering (choice;required): Which clustering method to use.
-            - supervised: Mapping the cells to given reference.
-                Using Seurat Reference Mapping procedure.
-                See: <https://satijalab.org/seurat/articles/multimodal_reference_mapping.html>
-            - unsupervised: Clustering the cells without reference.
-                Using Seurat FindClusters procedure.
-            - both: Both supervised and unsupervised clustering.
-                Performing both of the above procedures. The unsupervised
-                clustering will be added as `seurat_clusters_unsupervised`
-                to the metadata.
-        ref: The reference file for supervised clustering. It should be an
-            RDS file (with extension `.rds` or `.RDS`) containing a seurat
-            object, or a h5 file (with extension `.h5` or `.h5seurat`) that
-            can be loaded by `Seurat::LoadH5Seurat()`.
-    """  # noqa: E501
-    DEFAULTS = {
-        "infile": None,
-        "is_seurat": False,
-        "clustering": None,
-        "ref": None,
-    }
-    def post_init(self) -> None:
-        if self.opts.infile:
-            suffix = Path(self.opts.infile).suffix
-            self.opts.is_seurat = suffix in (".rds", ".RDS")
-    @ProcGroup.add_proc
-    def p_input(self) -> Type[Proc]:
-        """Build the input for the process group"""
-        from .misc import File2Proc
-        @mark(board_config_hidden=True)
-        class ScrnaBasicInput(File2Proc):
-            """Input file for scrna_basic process group
-            To specify the input file, use the `infile` argument of the
-            process group.
-            """
-            if self.opts.infile:
-                input_data = [self.opts.infile]
-        return ScrnaBasicInput
-    @ProcGroup.add_proc
-    def p_prepare(self) -> Type[Proc]:
-        """Prepare the input data into a Seurat object and do QC"""
-        if self.opts.is_seurat:
-            return self.p_input
-        from .scrna import SeuratPreparing
-        class ScrnaBasicPrepareAndQC(SeuratPreparing):
-            requires = self.p_input
-        return ScrnaBasicPrepareAndQC
-    @ProcGroup.add_proc
-    def p_supervised(self) -> Type[Proc]:
-        if (
-            self.opts.clustering == "unsupervised"
-            and not is_loading_pipeline()
-        ):
-            return None
-        from .scrna import SeuratMap2Ref
-        @annotate.format_doc(indent=3)
-        class ScrnaBasicSupervised(SeuratMap2Ref):
-            """{{Summary}}
-            **Only available when the group argument `clustering` is set to
-            `supervised` or `both`.**
-            Envs:
-                ref (pgarg): {{Envs.ref.help | indent(20)}}.
-                    Defaults to the `ref` argument of the process group.
-            """
-            requires = self.p_prepare
-            envs = {
-                "ref": self.opts.ref,
-            }
-        return ScrnaBasicSupervised
-    @ProcGroup.add_proc
-    def p_supervised_stats(self) -> Type[Proc]:
-        if not self.p_supervised and not is_loading_pipeline():
-            return None
-        from .scrna import SeuratClusterStats
-        @annotate.format_doc(indent=3)
-        class ScrnaBasicSupervisedStats(SeuratClusterStats):
-            """{{Summary}}
-            **Only available when the group argument `clustering` is set to
-            `supervised` or `both`.**
-            """
-            requires = self.p_supervised
-        return ScrnaBasicSupervisedStats
-    @ProcGroup.add_proc
-    def p_unsupervised(self) -> Type[Proc]:
-        if (
-            self.opts.clustering == "supervised"
-            and not is_loading_pipeline()
-        ):
-            return None
-        from .scrna import SeuratClustering
-        class ScrnaBasicUnsupervised(SeuratClustering):
-            requires = self.p_prepare
-        return ScrnaBasicUnsupervised
-    @ProcGroup.add_proc
-    def p_unsupervised_anno(self) -> Type[Proc]:
-        if not self.p_unsupervised and not is_loading_pipeline():
-            return None
-        from .scrna import CellTypeAnnotation
-        class ScrnaBasicAnnotation(CellTypeAnnotation):
-            requires = self.p_unsupervised
-        return ScrnaBasicAnnotation
-    @ProcGroup.add_proc
-    def p_unsupervised_stats(self) -> Type[Proc]:
-        if not self.p_unsupervised_anno and not is_loading_pipeline():
-            return None
-        from .scrna import SeuratClusterStats
-        class ScrnaBasicUnsupervisedStats(SeuratClusterStats):
-            requires = self.p_unsupervised_anno
-        return ScrnaBasicUnsupervisedStats
-    @ProcGroup.add_proc
-    def p_merge(self) -> Type[Proc]:
-        if self.opts.clustering == "supervised" and not is_loading_pipeline():
-            return self.p_supervised
-        if self.opts.clustering == "unsupervised" and not is_loading_pipeline():
-            return self.p_unsupervised_anno
-        @mark(board_config_hidden=True)
-        class ScrnaBasicMerge(Proc):
-            """Merge the supervised and unsupervised clustering results
-            Add unsupervised clustering as metadata to the seurat object
-            with supervised clustering.
-            The unsupervised clustering results are stored in the metadata
-            `seurat_clusters_unsupervised`.
-            **Only available when the group argument `clustering` is set to
-            `both`.**
-            """
-            requires = [self.p_supervised, self.p_unsupervised_anno]
-            lang = self.p_supervised.lang
-            input = "sobjfile:file, uobjfile:file"
-            output = "outfile:file:{{in.sobjfile | stem}}.rds"
-            script = """
-                library(Seurat)
-                sobj <- readRDS({{in.sobjfile | quote}})
-                uobj <- readRDS({{in.uobjfile | quote}})
-                umeta <- as.list(uobj$seurat_clusters)
-                names(umeta) <- rownames(uobj)
-                sobj <- AddMetaData(
-                    sobj,
-                    metadata=umeta,
-                    col.name="seurat_clusters_unsupervised"
-                )
-                saveRDS(sobj, {{out.outfile | quote}})
-            """
-        return ScrnaBasicMerge
-    @ProcGroup.add_proc
-    def p_findmarkers(self) -> Type[Proc]:
-        from .scrna import MarkersFinder
-        @annotate.format_doc(indent=3)
-        class ScrnaBasicMarkers(MarkersFinder):
-            """{{Summary}}
-            If the group argument `clustering` is set to `"both"`,
-            you can set `group-by` to `"seurat_clusters_unsupervised"` in
-            a different case to find the markers for the unsupervised clusters.
-            """
-            requires = self.p_merge
-        return ScrnaBasicMarkers
-    @ProcGroup.add_proc
-    def p_scgsea(self) -> Type[Proc]:
-        from .scrna import ScFGSEA
-        class ScrnaBasicScGSEA(ScFGSEA):
-            requires = self.p_merge
-        return ScrnaBasicScGSEA
-if __name__ == "__main__":
-    ScrnaBasic().as_pipen().run()

biopipen/reports/delim/SampleInfo.svelte DELETED Viewed

@@ -1,36 +0,0 @@
-{% from "utils/misc.liq" import report_jobs, table_of_images -%}
-<script>
-    import { Image, DataTable } from "$libs";
-</script>
-{%- macro report_job(job, h=1) -%}
-    {% if envs.stats %}
-    <h{{h}}>Sample Information</h{{h}}>
-    {% endif %}
-    {% if envs.exclude_cols and isinstance(envs.exclude_cols, str) %}
-        {% set excluded_cols = envs.exclude_cols | replace: " ", "" | split: "," %}
-    {% else %}
-        {% set excluded_cols = envs.exclude_cols %}
-    {% endif %}
-    <DataTable
-        data={ {{ job.out.outfile | datatable: sep="\t", excluded=excluded_cols }} }
-        pageSize={50}
-        />
-    {% if envs.stats %}
-        <h{{h}}>Statistics</h{{h}}>
-        {%- set stat_imgs = job.outdir | glob: "*.png" -%}
-        {{- table_of_images(stat_imgs) -}}
-    {% endif %}
-{%- endmacro -%}
-{%- macro head_job(job) -%}
-    <h1>{{job.in.infile | stem | escape }}</h1>
-{%- endmacro -%}
-{{ report_jobs(jobs, head_job, report_job) }}

biopipen/reports/scrna/GeneExpressionInvistigation.svelte DELETED Viewed

@@ -1,32 +0,0 @@
-{% from_ os import path %}
-{% from "utils/misc.liq" import report_jobs, table_of_images -%}
-<script>
-    import { Image } from "$libs";
-</script>
-{%- macro report_job(job, h=1) -%}
-{% assign boxplotpng = job.out.outdir | joinpaths: "boxplot.png" %}
-{% assign heatmappng = job.out.outdir | joinpaths: "heatmap.png" %}
-{% if path.exists(boxplotpng) %}
-<Image src={{boxplotpng | quote}} />
-{% endif %}
-{% if path.exists(heatmappng) %}
-<Image src={{heatmappng | quote}} />
-{% endif %}
-{%- endmacro -%}
-{%- macro head_job(job) -%}
-{% if job.in.configfile %}
-{%  assign name = job.in.configfile | toml_load | attr: "name" %}
-{% else %}
-{%  assign name = job.ennvs.config | attr: "name" %}
-{% endif %}
-<h1>{{name | escape}}</h1>
-{%- endmacro -%}
-{{ report_jobs(jobs, head_job, report_job) }}

biopipen/reports/scrna/ScFGSEA.svelte DELETED Viewed

@@ -1,35 +0,0 @@
-{% from "utils/gsea.liq" import fgsea_report -%}
-{% from "utils/misc.liq" import report_jobs -%}
-<script>
-    import { Image, DataTable } from "$libs";
-</script>
-{%- macro report_job(job, h=1) -%}
-    {%- set secdirs = job.out.outdir | glob: "*" -%}
-    {%- if len(secdirs) == 1 -%}
-        {%- set secname = secdirs | first | basename -%}
-        {%- for casedir in secdirs | first | glob: "*" -%}
-            {%- if secname == "DEFAULT" -%}
-                <h{{h}}>{{ casedir | basename | escape }}</h{{h}}>
-            {%- else -%}
-                <h{{h}}>{{secname | escape }} - {{ casedir | basename | escape }}</h{{h}}>
-            {%- endif -%}
-            {{ fgsea_report(casedir, h + 1) }}
-        {%- endfor -%}
-    {%- else -%}
-        {%- for secdir in secdirs -%}
-            {%- set sec = secdir | basename -%}
-            <h{{h}}>{{sec | escape}}</h{{h}}>
-            {%- for casedir in secdir | glob: "*" -%}
-                <h{{h+1}}>{{casedir | basename | escape}}</h{{h+1}}>
-                {{ fgsea_report(casedir, h + 2) }}
-            {%- endfor -%}
-        {%- endfor -%}
-    {%- endif -%}
-{%- endmacro -%}
-{%- macro head_job(job) -%}
-<h1>{{job.in.srtobj | stem0 | escape}}</h1>
-{%- endmacro -%}
-{{ report_jobs(jobs, head_job, report_job) }}

biopipen/reports/scrna/SeuratClusterStats.svelte DELETED Viewed

@@ -1,82 +0,0 @@
-{% from "utils/misc.liq" import report_jobs, table_of_images -%}
-{% from_ os import path %}
-<script>
-    import { DataTable, Image } from "$libs";
-    import { Tabs, Tab, TabContent } from "$ccs";
-</script>
-{%- macro report_job(job, h=1) -%}
-    {%- set stats_reports_file = job.out.outdir | joinpaths: "stats", "report_toc.json" -%}
-    {%- set features_reports_file = job.out.outdir | joinpaths: "features", "report_toc.json" -%}
-    {%- set dimplots_reports_file = job.out.outdir | joinpaths: "dimplots", "report_toc.json" -%}
-    {%- if stats_reports_file | exists -%}
-        {%- set stats = stats_reports_file | config: "json" -%}
-        {% for key, value in stats.items() -%}
-            <h{{h}}>{{key | escape}}</h{{h}}>
-            <Tabs>
-                {% if 'bar' in value -%}
-                    <Tab label="Bar plot" />
-                {% endif -%}
-                {% if 'pie' in value -%}
-                    <Tab label="Pie chart" />
-                {% endif -%}
-                {% if 'table' in value -%}
-                    <Tab label="Table" />
-                {% endif -%}
-                <svelte:fragment slot="content">
-                    {% if 'bar' in value -%}
-                        <TabContent>
-                            <Image src="{{job.out.outdir}}/stats/{{value.bar}}" />
-                        </TabContent>
-                    {% endif -%}
-                    {% if 'pie' in value -%}
-                        <TabContent>
-                            <Image src="{{job.out.outdir}}/stats/{{value.pie}}" />
-                        </TabContent>
-                    {% endif -%}
-                    {% if 'table' in value -%}
-                        <TabContent>
-                            <DataTable src="{{job.out.outdir}}/stats/{{value.table}}"
-                                data={ {{job.out.outdir | joinpaths: "stats", value.table | datatable: sep="\t", nrows=100 }} }
-                                />
-                        </TabContent>
-                    {% endif -%}
-                </svelte:fragment>
-            </Tabs>
-        {%- endfor -%}
-    {%- endif -%}
-    {%- if features_reports_file | exists -%}
-        {%- set features = features_reports_file | config: "json" %}
-        {% for key, value in features.items() -%}
-            <h{{h}}>{{key | escape}}</h{{h}}>
-            {% for val in value -%}
-                {% if "name" in val -%}
-                    <h{{h+1}}>{{val.name | escape}}</h{{h+1}}>
-                {%- endif -%}
-                {% if val.kind == "table" -%}
-                    <DataTable src="{{job.out.outdir}}/features/{{val.file}}"
-                        data={ {{job.out.outdir | joinpaths: "features", val.file | datatable: sep="\t", nrows=100 }} }
-                        />
-                {% else -%}
-                    <Image src="{{job.out.outdir}}/features/{{val.file}}" />
-                {% endif -%}
-            {%- endfor -%}
-        {%- endfor -%}
-    {%- endif -%}
-    {%- if dimplots_reports_file | exists -%}
-        {%- set dimplots = dimplots_reports_file | config: "json" %}
-        {% for key, value in dimplots.items() -%}
-            <h{{h}}>{{key | escape}}</h{{h}}>
-            <Image src="{{job.out.outdir}}/dimplots/{{value}}" />
-        {%- endfor -%}
-    {%- endif -%}
-{%- endmacro -%}
-{%- macro head_job(job) -%}
-<h1>{{job.in.srtobj | stem}}</h1>
-{%- endmacro -%}
-{{ report_jobs(jobs, head_job, report_job) }}

biopipen/reports/scrna/SeuratMap2Ref.svelte DELETED Viewed

@@ -1,20 +0,0 @@
-{% from "utils/misc.liq" import report_jobs, table_of_images -%}
-<script>
-    import { Image } from "$libs";
-</script>
-{%- macro report_job(job, h=1) -%}
-<h{{h}}>Reference UMAP</h{{h}}>
-{% set imgs = job.outdir | glob: "Reference_UMAP_*.png" %}
-{{ table_of_images(imgs) }}
-<h{{h}}>Query UMAP</h{{h}}>
-{% set imgs = job.outdir | glob: "Query_UMAP_*.png" %}
-{{ table_of_images(imgs) }}
-{%- endmacro -%}
-{%- macro head_job(job) -%}
-<h1>{{job.in.sobjfile | stem0 | escape}}</h1>
-{%- endmacro -%}
-{{ report_jobs(jobs, head_job, report_job) }}

biopipen/reports/scrna/SeuratPreparing.svelte DELETED Viewed

@@ -1,38 +0,0 @@
-{% from "utils/misc.liq" import report_jobs, table_of_images -%}
-{% from_ os import path %}
-<script>
-    import { Image, DataTable } from "$libs";
-    import { Tile } from "$ccs";
-</script>
-{%- macro report_job(job, h=1) -%}
-    <h{{h}}>Applied filters</h{{h}}>
-    <Tile>
-        <p>Cell filters: {{envs.cell_qc | str | escape}}</p>
-        <p>Gene filters: {{
-            proc.envs.gene_qc
-            | str
-            | replace: "{", "&#123"
-            | replace: "}", "&#125"
-        }}</p>
-        <DataTable
-            src={{job.outdir | joinpaths: 'plots', 'dim.txt' | quote}}
-            data={ {{job.outdir | joinpaths: 'plots', 'dim.txt' | datatable: sep="\t"}} } />
-    </Tile>
-    <h{{h}}>Violin plots</h{{h}}>
-    {% set qcimgs = job.outdir | glob: "plots", "*.vln.png" %}
-    {{ table_of_images(qcimgs) }}
-    <h{{h}}>Scatter plots</h{{h}}>
-    {% set qcimgs = job.outdir | glob: "plots", "*.scatter.png" %}
-    {{ table_of_images(qcimgs) }}
-{%- endmacro -%}
-{%- macro head_job(job) -%}
-    <h1>{{job.in.metafile | stem}}</h1>
-{%- endmacro -%}
-{{ report_jobs(jobs, head_job, report_job) }}

biopipen 0.21.0__py3-none-any.whl → 0.34.26__py3-none-any.whl

biopipen 0.21.0py3-none-any.whl → 0.34.26py3-none-any.whl