biopipen 0.7.1__tar.gz → 0.8.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of biopipen might be problematic. Click here for more details.
- {biopipen-0.7.1 → biopipen-0.8.0}/PKG-INFO +7 -8
- biopipen-0.8.0/biopipen/__init__.py +2 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/core/config.py +0 -5
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/core/config.toml +2 -4
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/core/defaults.py +3 -3
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/core/filters.py +1 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/core/proc.py +1 -3
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/core/testing.py +1 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/bam.py +10 -14
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/bcftools.py +4 -7
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/bed.py +9 -16
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/cnv.py +8 -11
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/cnvkit.py +32 -59
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/cnvkit_pipeline.py +266 -310
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/csv.py +0 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/gene.py +0 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/gsea.py +4 -10
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/misc.py +0 -5
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/plot.py +2 -4
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/rnaseq.py +0 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/scrna.py +76 -119
- biopipen-0.8.0/biopipen/ns/scrna_metabolic_landscape.py +418 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/tcr.py +5 -15
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/vcf.py +52 -34
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/web.py +8 -19
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/bam/CNAClinic.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/bam/CNVpytor.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/bam/ControlFREEC.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/cnv/AneuploidyScore.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/cnv/AneuploidyScoreSummary.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/cnvkit/CNVkitDiagram.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/cnvkit/CNVkitHeatmap.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/cnvkit/CNVkitScatter.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/gsea/FGSEA.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/gsea/GSEA.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna/CellsDistribution.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna/DimPlots.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna/GeneExpressionInvistigation.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna/MarkersFinder.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna/ScFGSEA.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna/SeuratClusterStats.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna/SeuratPreparing.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna_metabolic_landscape/MetabolicFeaturesIntraSubsets.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna_metabolic_landscape/MetabolicPathwayActivity.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/tcr/CloneResidency.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/tcr/Immunarch.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/tcr/SampleDiversity.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/tcr/TCRClusteringStats.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/tcr/VJUsage.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/utils/gsea.liq +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/utils/misc.liq +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/vcf/TruvariBenchSummary.svelte +1 -1
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/vcf/TruvariConsistency.svelte +2 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcgamaf/maf2vcf.pl +10 -5
- biopipen-0.8.0/biopipen/scripts/vcf/VcfAnno.py +26 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/VcfFix_utils.py +3 -2
- {biopipen-0.7.1 → biopipen-0.8.0}/pyproject.toml +7 -10
- biopipen-0.7.1/biopipen/__init__.py +0 -2
- biopipen-0.7.1/biopipen/ns/scrna_metabolic_landscape.py +0 -460
- biopipen-0.7.1/setup.py +0 -89
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/core/__init__.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/__init__.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/ns/tcgamaf.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/reports/scrna_metabolic_landscape/MetabolicFeatures.svelte +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/bam/CNAClinic.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/bam/CNVpytor.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/bam/ControlFREEC.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/bcftools/BcftoolsAnnotate.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/bcftools/BcftoolsFilter.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/bcftools/BcftoolsSort.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/bed/Bed2Vcf.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/bed/BedConsensus.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/bed/BedLiftOver.sh +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnv/AneuploidyScore.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnv/AneuploidyScoreSummary.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitAccess.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitAutobin.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitBatch.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitCall.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitCoverage.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitDiagram.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitFix.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitGuessBaits.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitHeatmap.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitReference.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitScatter.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/CNVkitSegment.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/cnvkit/guess_baits.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/gene/GeneNameConversion.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/gsea/Enrichr.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/gsea/FGSEA.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/gsea/GSEA.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/gsea/PreRank.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/misc/Config2File.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/misc/Str2File.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/plot/Heatmap.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/plot/VennDiagram.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/rnaseq/UnitConversion.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/CellTypeAnnotate-direct.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/CellTypeAnnotate-sctype.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/CellTypeAnnotate.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/CellsDistribution.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/DimPlots.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/ExprImpute-alra.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/ExprImpute-rmagic.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/ExprImpute-scimpute.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/ExprImpute.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/GeneExpressionInvistigation.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/MarkersFinder.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/SCImpute.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/ScFGSEA.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/SeuratClusterStats.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/SeuratClustering.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/SeuratFilter.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/SeuratLoading.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/SeuratMetadataMutater.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/SeuratPreparing.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/SeuratSplit.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/SeuratSubset.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/Subset10X.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/Write10X.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna/sctype.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna_metabolic_landscape/MetabolicFeatures.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna_metabolic_landscape/MetabolicFeaturesIntraSubsets.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayActivity.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/scrna_metabolic_landscape/MetabolicPathwayHeterogeneity.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcgamaf/Maf2Vcf.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcgamaf/MafAddChr.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/Attach2Seurat.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/CloneResidency.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/CloneSizeQQPlot.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/Immunarch.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/Immunarch2VDJtools.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/ImmunarchFilter.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/ImmunarchLoading.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/ImmunarchSplitIdents.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/SampleDiversity.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/TCRClustering.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/TCRClusteringStats.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/VJUsage.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/tcr/vdjtools-patch.sh +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/TruvariBench.sh +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/TruvariBenchSummary.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/TruvariConsistency.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/Vcf2Bed.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/VcfDownSample.sh +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/VcfFilter.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/VcfFix.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/VcfIndex.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/VcfIntersect.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/VcfLiftOver.sh +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/vcf/VcfSplitSamples.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/web/Download.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/scripts/web/DownloadList.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/utils/gene.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/utils/gene.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/utils/gsea.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/utils/io.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/utils/misc.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/utils/plot.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/utils/reference.py +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/utils/rnaseq.R +0 -0
- {biopipen-0.7.1 → biopipen-0.8.0}/biopipen/utils/vcf.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.1
|
|
2
2
|
Name: biopipen
|
|
3
|
-
Version: 0.
|
|
3
|
+
Version: 0.8.0
|
|
4
4
|
Summary: Bioinformatics processes/pipelines that can be run from `pipen run`
|
|
5
5
|
License: MIT
|
|
6
6
|
Author: pwwang
|
|
@@ -12,12 +12,11 @@ Classifier: Programming Language :: Python :: 3.8
|
|
|
12
12
|
Classifier: Programming Language :: Python :: 3.9
|
|
13
13
|
Classifier: Programming Language :: Python :: 3.10
|
|
14
14
|
Classifier: Programming Language :: Python :: 3.11
|
|
15
|
-
Provides-Extra: test
|
|
16
15
|
Requires-Dist: cmdy (>=0.5,<0.6)
|
|
17
16
|
Requires-Dist: datar[pandas] (>=0.11,<0.12)
|
|
18
|
-
Requires-Dist: pipen (>=0.
|
|
19
|
-
Requires-Dist: pipen-args (>=0.
|
|
20
|
-
Requires-Dist: pipen-cli-run (>=0.
|
|
21
|
-
Requires-Dist: pipen-filters (>=0.
|
|
22
|
-
Requires-Dist: pipen-report (>=0.
|
|
23
|
-
Requires-Dist: pipen-verbose (>=0.
|
|
17
|
+
Requires-Dist: pipen (>=0.5,<0.6)
|
|
18
|
+
Requires-Dist: pipen-args (>=0.6,<0.7)
|
|
19
|
+
Requires-Dist: pipen-cli-run (>=0.5,<0.6)
|
|
20
|
+
Requires-Dist: pipen-filters (>=0.4,<0.5)
|
|
21
|
+
Requires-Dist: pipen-report (>=0.6,<0.7)
|
|
22
|
+
Requires-Dist: pipen-verbose (>=0.3,<0.4)
|
|
@@ -1,6 +1,5 @@
|
|
|
1
1
|
"""Provides the envs from configuration files"""
|
|
2
2
|
|
|
3
|
-
import sys
|
|
4
3
|
from typing import Any
|
|
5
4
|
from pathlib import Path
|
|
6
5
|
from tempfile import gettempdir
|
|
@@ -38,9 +37,5 @@ config_profiles = [
|
|
|
38
37
|
USER_CONFIG_FILE,
|
|
39
38
|
PROJ_CONFIG_FILE,
|
|
40
39
|
]
|
|
41
|
-
# scan sys.argv to see if +config <config file> passed in
|
|
42
|
-
if "+config" in sys.argv:
|
|
43
|
-
cindex = sys.argv.index("+config")
|
|
44
|
-
config_profiles.append(sys.argv[cindex + 1])
|
|
45
40
|
|
|
46
41
|
config = ConfigItems(Config.load(*config_profiles, ignore_nonexist=True))
|
|
@@ -36,6 +36,8 @@ samtools = "samtools"
|
|
|
36
36
|
magic_python = "python"
|
|
37
37
|
# truvari
|
|
38
38
|
truvari = "truvari"
|
|
39
|
+
# vcfanno
|
|
40
|
+
vcfanno = "vcfanno"
|
|
39
41
|
|
|
40
42
|
# Interpreters
|
|
41
43
|
[lang]
|
|
@@ -80,7 +82,3 @@ sctype_db = ""
|
|
|
80
82
|
[misc]
|
|
81
83
|
# Number of cores used for each job
|
|
82
84
|
ncores = 1
|
|
83
|
-
|
|
84
|
-
[pipeline.scrna_metabolic_landscape]
|
|
85
|
-
|
|
86
|
-
[pipeline.cnvkit_pipeline]
|
|
@@ -1,8 +1,8 @@
|
|
|
1
1
|
"""Provide default variables
|
|
2
2
|
|
|
3
|
-
-
|
|
4
|
-
-
|
|
5
|
-
-
|
|
3
|
+
- BIOPIPEN_DIR: the root directory of the biopipen source
|
|
4
|
+
- REPORT_DIR: the root directory of the report
|
|
5
|
+
- SCRIPTS_DIR: the root directory of the scripts
|
|
6
6
|
"""
|
|
7
7
|
from pathlib import Path
|
|
8
8
|
|
|
@@ -10,9 +10,7 @@ class Proc(PipenProc):
|
|
|
10
10
|
"""Base class for all processes in biopipen to subclass"""
|
|
11
11
|
|
|
12
12
|
template_opts = {
|
|
13
|
-
"globals": {
|
|
14
|
-
"biopipen_dir": str(BIOPIPEN_DIR),
|
|
15
|
-
},
|
|
13
|
+
"globals": {"biopipen_dir": str(BIOPIPEN_DIR)},
|
|
16
14
|
"filters": filtermanager.filters.copy(),
|
|
17
15
|
"search_paths": SEARCH_PATHS + [str(REPORT_DIR)],
|
|
18
16
|
}
|
|
@@ -33,11 +33,9 @@ class CNVpytor(Proc):
|
|
|
33
33
|
baf_nomask: Do not use P mask in BAF histograms
|
|
34
34
|
|
|
35
35
|
Requires:
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
{{proc.envs.cnvpytor}} --version
|
|
36
|
+
cnvpytor:
|
|
37
|
+
- check: {{proc.envs.cnvpytor}} --version
|
|
39
38
|
"""
|
|
40
|
-
|
|
41
39
|
input = "bamfile:file, snpfile:file"
|
|
42
40
|
output = "outdir:dir:{{in.bamfile | stem}}.cnvpytor"
|
|
43
41
|
lang = config.lang.python
|
|
@@ -93,9 +91,7 @@ class ControlFREEC(Proc):
|
|
|
93
91
|
freec: Path to Control-FREEC executable
|
|
94
92
|
ncores: Number of cores to use
|
|
95
93
|
arggs: Other arguments for Control-FREEC
|
|
96
|
-
|
|
97
94
|
"""
|
|
98
|
-
|
|
99
95
|
input = "bamfile:file, snpfile:file"
|
|
100
96
|
output = "outdir:dir:{{in.bamfile | stem}}.freec"
|
|
101
97
|
lang = config.lang.python
|
|
@@ -132,14 +128,14 @@ class CNAClinic(Proc):
|
|
|
132
128
|
Input:
|
|
133
129
|
metafile: The meta file, header included, tab-delimited, including
|
|
134
130
|
following columns:
|
|
135
|
-
|
|
136
|
-
|
|
131
|
+
- Bam: The path to bam file
|
|
132
|
+
- Sample: Optional. The sample names,
|
|
137
133
|
if you don't want filename of bam file to be used
|
|
138
|
-
|
|
139
|
-
|
|
134
|
+
- Group: Optional. The group names, either "Case" or "Control"
|
|
135
|
+
- Patient: Optional. The patient names. Since CNAClinic only
|
|
140
136
|
supports paired samples, you need to provide the patient names
|
|
141
137
|
for each sample. Required if "Group" is provided.
|
|
142
|
-
|
|
138
|
+
- Binsizer: Optional. Samples used to estimate the bin size
|
|
143
139
|
"Y", "Yes", "T", "True", will be treated as True
|
|
144
140
|
If not provided, will use `envs.binsizer` to get the samples
|
|
145
141
|
to use. Either this column or `envs.binsizer` should be
|
|
@@ -153,9 +149,9 @@ class CNAClinic(Proc):
|
|
|
153
149
|
seed: The seed for random number generator for choosing samples
|
|
154
150
|
for estimating bin size
|
|
155
151
|
binsizer: The samples used to estimate the bin size, it could be:
|
|
156
|
-
|
|
157
|
-
|
|
158
|
-
|
|
152
|
+
A list of sample names
|
|
153
|
+
A float number (0 < x <= 1), the fraction of samples to use
|
|
154
|
+
A integer number (x > 1), the number of samples to use
|
|
159
155
|
binsize: Directly use this binsize for CNAClinic, in kbp.
|
|
160
156
|
genome: The genome assembly
|
|
161
157
|
run_args: The arguments for CNAClinic::runSegmentation
|
|
@@ -23,7 +23,6 @@ class BcftoolsAnnotate(Proc):
|
|
|
23
23
|
header: Headers to be added
|
|
24
24
|
args: Other arguments for `bcftools annotate`
|
|
25
25
|
"""
|
|
26
|
-
|
|
27
26
|
input = "infile:file, annfile:file"
|
|
28
27
|
output = "outfile:file:{{in.infile | basename}}"
|
|
29
28
|
lang = config.lang.python
|
|
@@ -59,13 +58,11 @@ class BcftoolsFilter(Proc):
|
|
|
59
58
|
Since the filters need to be applied one by one by bcftools
|
|
60
59
|
includes: and
|
|
61
60
|
excludes: include/exclude only sites for which EXPRESSION is true.
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
expressions
|
|
61
|
+
See: https://samtools.github.io/bcftools/bcftools.html#expressions
|
|
62
|
+
If provided, `envs.args.include/exclude` will be ignored.
|
|
63
|
+
If `str`/`list` used, The filter names will be `Filter%d`
|
|
64
|
+
A dict is used when keys are filter names and values are expressions
|
|
67
65
|
"""
|
|
68
|
-
|
|
69
66
|
input = "infile:file"
|
|
70
67
|
output = "outfile:file:{{in.infile | basename}}"
|
|
71
68
|
lang = config.lang.python
|
|
@@ -17,11 +17,9 @@ class BedLiftOver(Proc):
|
|
|
17
17
|
chain: The map chain file for liftover
|
|
18
18
|
|
|
19
19
|
Requires:
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
{{proc.envs.liftover}} 2>&1 | grep "usage"
|
|
20
|
+
liftOver:
|
|
21
|
+
- check: {{proc.envs.liftover}} 2>&1 | grep "usage"
|
|
23
22
|
"""
|
|
24
|
-
|
|
25
23
|
input = "inbed:file"
|
|
26
24
|
output = "outbed:file:{{in.inbed | basename}}"
|
|
27
25
|
envs = {
|
|
@@ -64,18 +62,14 @@ class Bed2Vcf(Proc):
|
|
|
64
62
|
index: Sort and index output file
|
|
65
63
|
|
|
66
64
|
Requires:
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
|
|
71
|
-
|
|
72
|
-
{{proc.
|
|
73
|
-
|
|
74
|
-
if: {{proc.envs.index}}
|
|
75
|
-
check: |
|
|
76
|
-
{{proc.envs.bcftools}} --version
|
|
65
|
+
cyvcf2:
|
|
66
|
+
- check: {{proc.lang}} -c "import cyvcf2"
|
|
67
|
+
pysam:
|
|
68
|
+
- check: {{proc.lang}} -c "import pysam"
|
|
69
|
+
bcftools:
|
|
70
|
+
- if: {{proc.envs.index}}
|
|
71
|
+
- check: {{proc.envs.bcftools}} --version
|
|
77
72
|
"""
|
|
78
|
-
|
|
79
73
|
input = "inbed:file"
|
|
80
74
|
output = (
|
|
81
75
|
"outvcf:file:{{in.inbed | stem}}.vcf{{'.gz' if envs.index else ''}}"
|
|
@@ -141,7 +135,6 @@ class BedConsensus(Proc):
|
|
|
141
135
|
ncores: Number of cores to use to calculate the weights for
|
|
142
136
|
each bed file
|
|
143
137
|
"""
|
|
144
|
-
|
|
145
138
|
input = "bedfiles:files"
|
|
146
139
|
output = (
|
|
147
140
|
"outbed:file:{{in.bedfiles | first | stem | append: '_consensus'}}.bed"
|
|
@@ -19,17 +19,14 @@ class AneuploidyScore(Proc):
|
|
|
19
19
|
plot to show the CAAs for each chromosome arm
|
|
20
20
|
|
|
21
21
|
Requires:
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
{{proc.
|
|
29
|
-
|
|
30
|
-
if: {{ proc.envs.genome == 'hg38' }}
|
|
31
|
-
check: |
|
|
32
|
-
{{proc.lang}} <(echo "library(ucsc.hg38.cytoband)")
|
|
22
|
+
AneuploidyScore:
|
|
23
|
+
- check: {{proc.lang}} <(echo "library(AneuploidyScore)")
|
|
24
|
+
ucsc.hg19.cytoband:
|
|
25
|
+
- if: {{ proc.envs.genome == 'hg19' }}
|
|
26
|
+
- check: {{proc.lang}} <(echo "library(ucsc.hg19.cytoband)")
|
|
27
|
+
ucsc.hg38.cytoband:
|
|
28
|
+
- if: {{ proc.envs.genome == 'hg38' }}
|
|
29
|
+
- check: {{proc.lang}} <(echo "library(ucsc.hg38.cytoband)")
|
|
33
30
|
"""
|
|
34
31
|
input = "segfile:file"
|
|
35
32
|
output = "outdir:dir:{{in.segfile | stem}}.aneuploidy_score"
|
|
@@ -19,11 +19,9 @@ class CNVkitAccess(Proc):
|
|
|
19
19
|
ref: The reference genome fasta file
|
|
20
20
|
|
|
21
21
|
Requires:
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
{{proc.envs.cnvkit}} version
|
|
22
|
+
cnvkit:
|
|
23
|
+
- check: {{proc.envs.cnvkit}} version
|
|
25
24
|
"""
|
|
26
|
-
|
|
27
25
|
input = "excfiles:files"
|
|
28
26
|
output = (
|
|
29
27
|
"outfile:file:{{envs.ref | stem0}}.access.{{envs.min_gap_size}}.bed"
|
|
@@ -71,11 +69,9 @@ class CNVkitAutobin(Proc):
|
|
|
71
69
|
ref: The reference genome fasta file
|
|
72
70
|
|
|
73
71
|
Requires:
|
|
74
|
-
|
|
75
|
-
|
|
76
|
-
{{proc.envs.cnvkit}} version
|
|
72
|
+
cnvkit:
|
|
73
|
+
- check: {{proc.envs.cnvkit}} version
|
|
77
74
|
"""
|
|
78
|
-
|
|
79
75
|
input = "bamfiles:files, accfile:file, baitfile:file"
|
|
80
76
|
output = [
|
|
81
77
|
"target_file:file:{{in.bamfiles | first | stem0}}-etc.target.bed",
|
|
@@ -117,11 +113,9 @@ class CNVkitCoverage(Proc):
|
|
|
117
113
|
ref: The reference genome fasta file
|
|
118
114
|
|
|
119
115
|
Requires:
|
|
120
|
-
|
|
121
|
-
|
|
122
|
-
{{proc.envs.cnvkit}} version
|
|
116
|
+
cnvkit:
|
|
117
|
+
- check: {{proc.envs.cnvkit}} version
|
|
123
118
|
"""
|
|
124
|
-
|
|
125
119
|
input = "bamfile:file, target_file:file"
|
|
126
120
|
output = """
|
|
127
121
|
{%- if "antitarget" in basename(in.target_file) -%}
|
|
@@ -174,11 +168,9 @@ class CNVkitReference(Proc):
|
|
|
174
168
|
ref: The reference genome fasta file
|
|
175
169
|
|
|
176
170
|
Requires:
|
|
177
|
-
|
|
178
|
-
|
|
179
|
-
{{proc.envs.cnvkit}} version
|
|
171
|
+
cnvkit:
|
|
172
|
+
- check: {{proc.envs.cnvkit}} version
|
|
180
173
|
"""
|
|
181
|
-
|
|
182
174
|
input = (
|
|
183
175
|
"covfiles:files, target_file:file, antitarget_file:file, sample_sex:var"
|
|
184
176
|
)
|
|
@@ -221,11 +213,9 @@ class CNVkitFix(Proc):
|
|
|
221
213
|
no_rmask: Skip RepeatMasker correction.
|
|
222
214
|
|
|
223
215
|
Requires:
|
|
224
|
-
|
|
225
|
-
|
|
226
|
-
{{proc.envs.cnvkit}} version
|
|
216
|
+
cnvkit:
|
|
217
|
+
- check: {{proc.envs.cnvkit}} version
|
|
227
218
|
"""
|
|
228
|
-
|
|
229
219
|
input = (
|
|
230
220
|
"target_file:file, antitarget_file:file, reference:file, sample_id:var"
|
|
231
221
|
)
|
|
@@ -286,14 +276,11 @@ class CNVkitSegment(Proc):
|
|
|
286
276
|
zygosity from allele frequencies.
|
|
287
277
|
|
|
288
278
|
Requires:
|
|
289
|
-
|
|
290
|
-
|
|
291
|
-
|
|
292
|
-
|
|
293
|
-
check: |
|
|
294
|
-
{{proc.envs.rscript}} <(echo "library(DNAcopy)")
|
|
279
|
+
cnvkit:
|
|
280
|
+
- check: {{proc.envs.cnvkit}} version
|
|
281
|
+
r-DNAcopy:
|
|
282
|
+
- check: {{proc.envs.rscript}} <(echo "library(DNAcopy)")
|
|
295
283
|
"""
|
|
296
|
-
|
|
297
284
|
input = "cnrfile:file, vcf:file, sample_id:var, normal_id:var"
|
|
298
285
|
output = "outfile:file:{{in.cnrfile | stem0}}.cns"
|
|
299
286
|
lang = config.lang.python
|
|
@@ -366,14 +353,11 @@ class CNVkitScatter(Proc):
|
|
|
366
353
|
if no case specified
|
|
367
354
|
|
|
368
355
|
Requires:
|
|
369
|
-
|
|
370
|
-
|
|
371
|
-
|
|
372
|
-
|
|
373
|
-
check: |
|
|
374
|
-
{{proc.envs.convert}} -version
|
|
356
|
+
cnvkit:
|
|
357
|
+
- check: {{proc.envs.cnvkit}} version
|
|
358
|
+
convert:
|
|
359
|
+
- check: {{proc.envs.convert}} -version
|
|
375
360
|
"""
|
|
376
|
-
|
|
377
361
|
input = (
|
|
378
362
|
"cnrfile:file, cnsfile:file, config:var, "
|
|
379
363
|
"vcf:file, sample_id:var, normal_id:var"
|
|
@@ -439,14 +423,11 @@ class CNVkitDiagram(Proc):
|
|
|
439
423
|
and `title`
|
|
440
424
|
|
|
441
425
|
Requires:
|
|
442
|
-
|
|
443
|
-
|
|
444
|
-
|
|
445
|
-
|
|
446
|
-
check: |
|
|
447
|
-
{{proc.envs.convert}} -version
|
|
426
|
+
cnvkit:
|
|
427
|
+
- check: {{proc.envs.cnvkit}} version
|
|
428
|
+
convert:
|
|
429
|
+
- check: {{proc.envs.convert}} -version
|
|
448
430
|
"""
|
|
449
|
-
|
|
450
431
|
input = "cnrfile:file, cnsfile:file, sample_sex:var"
|
|
451
432
|
output = "outdir:dir:{{in.cnrfile | stem0}}.diagram"
|
|
452
433
|
lang = config.lang.python
|
|
@@ -510,14 +491,11 @@ class CNVkitHeatmap(Proc):
|
|
|
510
491
|
if no case specified
|
|
511
492
|
|
|
512
493
|
Requires:
|
|
513
|
-
|
|
514
|
-
|
|
515
|
-
|
|
516
|
-
|
|
517
|
-
check: |
|
|
518
|
-
{{proc.envs.convert}} -version
|
|
494
|
+
cnvkit:
|
|
495
|
+
- check: {{proc.envs.cnvkit}} version
|
|
496
|
+
convert:
|
|
497
|
+
- check: {{proc.envs.convert}} -version
|
|
519
498
|
"""
|
|
520
|
-
|
|
521
499
|
input = "segfiles:files, sample_sex: var"
|
|
522
500
|
output = "outdir:dir:{{in.segfiles | first | stem0}}-etc.heatmap"
|
|
523
501
|
lang = config.lang.python
|
|
@@ -587,11 +565,9 @@ class CNVkitCall(Proc):
|
|
|
587
565
|
zygosity from allele frequencies.
|
|
588
566
|
|
|
589
567
|
Requires:
|
|
590
|
-
|
|
591
|
-
|
|
592
|
-
{{proc.envs.cnvkit}} version
|
|
568
|
+
cnvkit:
|
|
569
|
+
- check: {{proc.envs.cnvkit}} version
|
|
593
570
|
"""
|
|
594
|
-
|
|
595
571
|
input = [
|
|
596
572
|
"cnrfile:file",
|
|
597
573
|
"cnsfile:file",
|
|
@@ -691,14 +667,11 @@ class CNVkitBatch(Proc):
|
|
|
691
667
|
`in.metafile`
|
|
692
668
|
|
|
693
669
|
Requires:
|
|
694
|
-
|
|
695
|
-
|
|
696
|
-
|
|
697
|
-
|
|
698
|
-
check: |
|
|
699
|
-
{{proc.envs.rscript}} <(echo "library(DNAcopy)")
|
|
670
|
+
cnvkit:
|
|
671
|
+
- check: {{proc.envs.cnvkit}} version
|
|
672
|
+
r-DNAcopy:
|
|
673
|
+
- check: {{proc.envs.rscript}} <(echo "library(DNAcopy)")
|
|
700
674
|
"""
|
|
701
|
-
|
|
702
675
|
input = "metafile:file"
|
|
703
676
|
output = "outdir:dir:{{in.metafile | stem0}}.cnvkit"
|
|
704
677
|
lang = config.lang.python
|