pupmapper 0.0.5__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- pupmapper-0.0.5/.gitignore +164 -0
- pupmapper-0.0.5/Images/Derrien2012.PmapFig.png +0 -0
- pupmapper-0.0.5/Images/pupmapper.logo.png +0 -0
- pupmapper-0.0.5/LICENSE +21 -0
- pupmapper-0.0.5/PKG-INFO +141 -0
- pupmapper-0.0.5/README.md +124 -0
- pupmapper-0.0.5/dev/README.md +3 -0
- pupmapper-0.0.5/pupmapper/__init__.py +420 -0
- pupmapper-0.0.5/pupmapper/_version.py +10 -0
- pupmapper-0.0.5/pupmapper/genmap.py +66 -0
- pupmapper-0.0.5/pupmapper/run_bigtools.py +30 -0
- pupmapper-0.0.5/pupmapper/utils.py +321 -0
- pupmapper-0.0.5/pyproject.toml +32 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1.genome.fasta +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/Ex1.genome.LowPileupMap.Below1.K4_E0.bed +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/Ex1.genome.PileupMap.K4_E0.Summary.tsv +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/Ex1.genome.PileupMap.K4_E0.bedgraph +8 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/Ex1.genome.PileupMap.K4_E0.bigwig +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.ids.concat +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.ids.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.info.concat +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.info.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.lf.drp +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.lf.drp.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.lf.drs +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.lf.drv +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.lf.drv.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.lf.pst +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.rev.lf.drp +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.rev.lf.drp.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.rev.lf.drs +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.rev.lf.drv +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.rev.lf.drv.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.rev.lf.pst +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.sa.ind +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.sa.len +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.sa.val +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.txt.concat +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_index/index.txt.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_kmap_K4_E0/Ex1.genome.kmermap.K4_E0.bedgraph +3 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_kmap_K4_E0/Ex1.genome.kmermap.K4_E0.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_Seq_K4E0_outdir/genmap_kmap_K4_E0/Ex1.genome.kmermap.K4_E0.wig +6 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.ids.concat +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.ids.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.info.concat +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.info.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.lf.drp +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.lf.drp.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.lf.drs +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.lf.drv +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.lf.drv.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.lf.pst +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.rev.lf.drp +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.rev.lf.drp.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.rev.lf.drs +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.rev.lf.drv +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.rev.lf.drv.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.rev.lf.pst +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.sa.ind +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.sa.len +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.sa.val +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.txt.concat +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_index/index.txt.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.bedgraph +3 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.freq.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.nc.bedgraph +3 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.nc.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.nc.freq.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.nc.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.nc.wig +6 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E0.wig +6 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.bedgraph +8 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.freq.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.nc.bedgraph +9 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.nc.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.nc.freq.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.nc.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.nc.wig +14 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Kmap_K4E1.wig +14 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex1/Ex1_gm_output/Ex1_Pmap_K4E0.bedgraph +9 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2.genome.fasta +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/Ex2.genome.LowPileupMap.Below1.K4_E0.bed +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/Ex2.genome.PileupMap.K4_E0.Summary.tsv +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/Ex2.genome.PileupMap.K4_E0.bedgraph +9 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/Ex2.genome.PileupMap.K4_E0.bigwig +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.ids.concat +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.ids.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.info.concat +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.info.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.lf.drp +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.lf.drp.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.lf.drs +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.lf.drv +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.lf.drv.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.lf.pst +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.rev.lf.drp +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.rev.lf.drp.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.rev.lf.drs +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.rev.lf.drv +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.rev.lf.drv.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.rev.lf.pst +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.sa.ind +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.sa.len +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.sa.val +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.txt.concat +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_index/index.txt.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_kmap_K4_E0/Ex2.genome.kmermap.K4_E0.bedgraph +5 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_kmap_K4_E0/Ex2.genome.kmermap.K4_E0.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_Seq_K4E0_outdir/genmap_kmap_K4_E0/Ex2.genome.kmermap.K4_E0.wig +10 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.ids.concat +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.ids.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.info.concat +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.info.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.lf.drp +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.lf.drp.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.lf.drs +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.lf.drv +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.lf.drv.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.lf.pst +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.rev.lf.drp +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.rev.lf.drp.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.rev.lf.drs +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.rev.lf.drv +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.rev.lf.drv.sbl +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.rev.lf.pst +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.sa.ind +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.sa.len +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.sa.val +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.txt.concat +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_index/index.txt.limits +0 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.bedgraph +5 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.freq.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.nc.bedgraph +3 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.nc.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.nc.freq.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.nc.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.nc.wig +6 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E0.wig +10 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.bedgraph +10 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.freq.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.nc.bedgraph +8 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.nc.chrom.sizes +1 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.nc.freq.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.nc.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.nc.wig +13 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.txt +2 -0
- pupmapper-0.0.5/tests/data/Genmap_Ex2/Ex2_gm_output/Ex2_Kmap_K4E1.wig +15 -0
|
@@ -0,0 +1,164 @@
|
|
|
1
|
+
# Byte-compiled / optimized / DLL files
|
|
2
|
+
__pycache__/
|
|
3
|
+
*.py[cod]
|
|
4
|
+
*$py.class
|
|
5
|
+
|
|
6
|
+
# C extensions
|
|
7
|
+
*.so
|
|
8
|
+
|
|
9
|
+
# Distribution / packaging
|
|
10
|
+
.Python
|
|
11
|
+
build/
|
|
12
|
+
develop-eggs/
|
|
13
|
+
dist/
|
|
14
|
+
downloads/
|
|
15
|
+
eggs/
|
|
16
|
+
.eggs/
|
|
17
|
+
lib/
|
|
18
|
+
lib64/
|
|
19
|
+
parts/
|
|
20
|
+
sdist/
|
|
21
|
+
var/
|
|
22
|
+
wheels/
|
|
23
|
+
share/python-wheels/
|
|
24
|
+
*.egg-info/
|
|
25
|
+
.installed.cfg
|
|
26
|
+
*.egg
|
|
27
|
+
MANIFEST
|
|
28
|
+
|
|
29
|
+
# PyInstaller
|
|
30
|
+
# Usually these files are written by a python script from a template
|
|
31
|
+
# before PyInstaller builds the exe, so as to inject date/other infos into it.
|
|
32
|
+
*.manifest
|
|
33
|
+
*.spec
|
|
34
|
+
|
|
35
|
+
# Installer logs
|
|
36
|
+
pip-log.txt
|
|
37
|
+
pip-delete-this-directory.txt
|
|
38
|
+
|
|
39
|
+
# Unit test / coverage reports
|
|
40
|
+
htmlcov/
|
|
41
|
+
.tox/
|
|
42
|
+
.nox/
|
|
43
|
+
.coverage
|
|
44
|
+
.coverage.*
|
|
45
|
+
.cache
|
|
46
|
+
nosetests.xml
|
|
47
|
+
coverage.xml
|
|
48
|
+
*.cover
|
|
49
|
+
*.py,cover
|
|
50
|
+
.hypothesis/
|
|
51
|
+
.pytest_cache/
|
|
52
|
+
cover/
|
|
53
|
+
|
|
54
|
+
# Translations
|
|
55
|
+
*.mo
|
|
56
|
+
*.pot
|
|
57
|
+
|
|
58
|
+
# Django stuff:
|
|
59
|
+
*.log
|
|
60
|
+
local_settings.py
|
|
61
|
+
db.sqlite3
|
|
62
|
+
db.sqlite3-journal
|
|
63
|
+
|
|
64
|
+
# Flask stuff:
|
|
65
|
+
instance/
|
|
66
|
+
.webassets-cache
|
|
67
|
+
|
|
68
|
+
# Scrapy stuff:
|
|
69
|
+
.scrapy
|
|
70
|
+
|
|
71
|
+
# Sphinx documentation
|
|
72
|
+
docs/_build/
|
|
73
|
+
|
|
74
|
+
# PyBuilder
|
|
75
|
+
.pybuilder/
|
|
76
|
+
target/
|
|
77
|
+
|
|
78
|
+
# Jupyter Notebook
|
|
79
|
+
.ipynb_checkpoints
|
|
80
|
+
|
|
81
|
+
# IPython
|
|
82
|
+
profile_default/
|
|
83
|
+
ipython_config.py
|
|
84
|
+
|
|
85
|
+
# pyenv
|
|
86
|
+
# For a library or package, you might want to ignore these files since the code is
|
|
87
|
+
# intended to run in multiple environments; otherwise, check them in:
|
|
88
|
+
# .python-version
|
|
89
|
+
|
|
90
|
+
# pipenv
|
|
91
|
+
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
|
|
92
|
+
# However, in case of collaboration, if having platform-specific dependencies or dependencies
|
|
93
|
+
# having no cross-platform support, pipenv may install dependencies that don't work, or not
|
|
94
|
+
# install all needed dependencies.
|
|
95
|
+
#Pipfile.lock
|
|
96
|
+
|
|
97
|
+
# poetry
|
|
98
|
+
# Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
|
|
99
|
+
# This is especially recommended for binary packages to ensure reproducibility, and is more
|
|
100
|
+
# commonly ignored for libraries.
|
|
101
|
+
# https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
|
|
102
|
+
#poetry.lock
|
|
103
|
+
|
|
104
|
+
# pdm
|
|
105
|
+
# Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
|
|
106
|
+
#pdm.lock
|
|
107
|
+
# pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
|
|
108
|
+
# in version control.
|
|
109
|
+
# https://pdm.fming.dev/#use-with-ide
|
|
110
|
+
.pdm.toml
|
|
111
|
+
|
|
112
|
+
# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
|
|
113
|
+
__pypackages__/
|
|
114
|
+
|
|
115
|
+
# Celery stuff
|
|
116
|
+
celerybeat-schedule
|
|
117
|
+
celerybeat.pid
|
|
118
|
+
|
|
119
|
+
# SageMath parsed files
|
|
120
|
+
*.sage.py
|
|
121
|
+
|
|
122
|
+
# Environments
|
|
123
|
+
.env
|
|
124
|
+
.venv
|
|
125
|
+
env/
|
|
126
|
+
venv/
|
|
127
|
+
ENV/
|
|
128
|
+
env.bak/
|
|
129
|
+
venv.bak/
|
|
130
|
+
|
|
131
|
+
# Spyder project settings
|
|
132
|
+
.spyderproject
|
|
133
|
+
.spyproject
|
|
134
|
+
|
|
135
|
+
# Rope project settings
|
|
136
|
+
.ropeproject
|
|
137
|
+
|
|
138
|
+
# mkdocs documentation
|
|
139
|
+
/site
|
|
140
|
+
|
|
141
|
+
# mypy
|
|
142
|
+
.mypy_cache/
|
|
143
|
+
.dmypy.json
|
|
144
|
+
dmypy.json
|
|
145
|
+
|
|
146
|
+
# Pyre type checker
|
|
147
|
+
.pyre/
|
|
148
|
+
|
|
149
|
+
# pytype static type analyzer
|
|
150
|
+
.pytype/
|
|
151
|
+
|
|
152
|
+
# Cython debug symbols
|
|
153
|
+
cython_debug/
|
|
154
|
+
|
|
155
|
+
# PyCharm
|
|
156
|
+
# JetBrains specific template is maintained in a separate JetBrains.gitignore that can
|
|
157
|
+
# be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
|
|
158
|
+
# and can be added to the global gitignore or merged into this file. For a more nuclear
|
|
159
|
+
# option (not recommended) you can uncomment the following to ignore the entire idea folder.
|
|
160
|
+
#.idea/
|
|
161
|
+
|
|
162
|
+
|
|
163
|
+
.DS_Store
|
|
164
|
+
|
|
Binary file
|
|
Binary file
|
pupmapper-0.0.5/LICENSE
ADDED
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
MIT License
|
|
2
|
+
|
|
3
|
+
Copyright (c) 2024 Maximillian Marin
|
|
4
|
+
|
|
5
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
6
|
+
of this software and associated documentation files (the "Software"), to deal
|
|
7
|
+
in the Software without restriction, including without limitation the rights
|
|
8
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
9
|
+
copies of the Software, and to permit persons to whom the Software is
|
|
10
|
+
furnished to do so, subject to the following conditions:
|
|
11
|
+
|
|
12
|
+
The above copyright notice and this permission notice shall be included in all
|
|
13
|
+
copies or substantial portions of the Software.
|
|
14
|
+
|
|
15
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
16
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
17
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
18
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
19
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
20
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
21
|
+
SOFTWARE.
|
pupmapper-0.0.5/PKG-INFO
ADDED
|
@@ -0,0 +1,141 @@
|
|
|
1
|
+
Metadata-Version: 2.1
|
|
2
|
+
Name: pupmapper
|
|
3
|
+
Version: 0.0.5
|
|
4
|
+
Summary: Tool & python package for calculating genome wide pileup mappability
|
|
5
|
+
Project-URL: Homepage, https://github.com/maxgmarin/pupmapper
|
|
6
|
+
Author-email: Maximillian Marin <maximilliangmarin@gmail.com>
|
|
7
|
+
License-File: LICENSE
|
|
8
|
+
Requires-Python: >=3.8
|
|
9
|
+
Requires-Dist: bioframe>=0.7.2
|
|
10
|
+
Requires-Dist: numpy
|
|
11
|
+
Requires-Dist: pandas
|
|
12
|
+
Requires-Dist: pybigtools==0.2.1
|
|
13
|
+
Requires-Dist: tqdm
|
|
14
|
+
Provides-Extra: test
|
|
15
|
+
Requires-Dist: pytest; extra == 'test'
|
|
16
|
+
Description-Content-Type: text/markdown
|
|
17
|
+
|
|
18
|
+
<img width="500" src="https://github.com/maxgmarin/pupmapper/raw/main/Images/pupmapper.logo.png" alt="pupmapper logo">
|
|
19
|
+
|
|
20
|
+
[](https://opensource.org/licenses/MIT)
|
|
21
|
+

|
|
22
|
+
<!---[![Build Status]()]()
|
|
23
|
+
[![github release version]()]()
|
|
24
|
+
[![DOI]()]()
|
|
25
|
+
--->
|
|
26
|
+
|
|
27
|
+
Pupmapper: A **P**ile**up** **Map**pability Calculato**r**
|
|
28
|
+
|
|
29
|
+
<!---
|
|
30
|
+
> TBD Reference
|
|
31
|
+
--->
|
|
32
|
+
|
|
33
|
+
[TOC]: #
|
|
34
|
+
## Table of Contents
|
|
35
|
+
- [Motivation](#motivation)
|
|
36
|
+
- [Installation](#installation)
|
|
37
|
+
- [Install locally](#install-locally)
|
|
38
|
+
- [`pip`](#pip)
|
|
39
|
+
- [Basic usage](#basic-usage)
|
|
40
|
+
- [test data set](#analyzing-included-test-data-set)
|
|
41
|
+
- [Full usage](#full-usage)
|
|
42
|
+
|
|
43
|
+
|
|
44
|
+
## Motivation
|
|
45
|
+
The Pileup Mappability metric can be used to quickly identify regions which may be more difficult to perform variant calling with short-read WGS data. `pupmapper` was created to allow users to quickly convert k-mer mappability scores to pileup mappability.
|
|
46
|
+
|
|
47
|
+
The first step of the `pupmapper` pipeline is to calculate k-mer uniquness scores using the [Genmap](https://github.com/cpockrandt/genmap) software. Then pupmapper will summarize the pileup mappability of each genomic position using the k-mer uniqueness of all overlapping k-mers.
|
|
48
|
+
|
|
49
|
+
|
|
50
|
+
### How is pileup mappability calculated from individual k-mer uniqueness/mappability scores?
|
|
51
|
+
|
|
52
|
+
<img width="500" src="https://github.com/maxgmarin/pupmapper/raw/main/Images/Derrien2012.PmapFig.png" alt="PmapFig">
|
|
53
|
+
The Pileup mappability of a position is specifically calculated as the mean k-mer mappability of all k-mers overlapping a given position. <br>
|
|
54
|
+
|
|
55
|
+
A pileup mappability score of 1 indicates that all k-mers overlapping with a position are unique within the genome (using the user defined parameters of uniqueness).
|
|
56
|
+
|
|
57
|
+
**Pileup mappability is useful because it gives a sense of uniquemess of all possible reads (of defined length) that could align to a given position.**
|
|
58
|
+
|
|
59
|
+
|
|
60
|
+
### Useful reading for k-mer mappability and pileup mappability:
|
|
61
|
+
|
|
62
|
+
> Derrien, T, (2012). Fast Computation and Applications of Genome Mappability. PLOS ONE 7(1): e30377. [https://doi.org/10.1371/journal.pone.0030377](https://doi.org/10.1371/journal.pone.0030377)
|
|
63
|
+
|
|
64
|
+
> Pockrandt C, (2020) GenMap: ultra-fast computation of genome mappability, Bioinformatics, Volume 36, Issue 12, June 2020, Pages 3687–3692, [https://doi.org/10.1093/bioinformatics/btaa222](https://doi.org/10.1093/bioinformatics/btaa222)
|
|
65
|
+
|
|
66
|
+
> Lee H, Schatz MC. (2012). Genomic dark matter: the reliability of short read mapping illustrated by the genome mappability score, Bioinformatics, Volume 28, Issue 16, August 2012, Pages 2097–2105, [https://doi.org/10.1093/bioinformatics/bts330](https://doi.org/10.1093/bioinformatics/bts330)
|
|
67
|
+
|
|
68
|
+
## Installation
|
|
69
|
+
### Install locally
|
|
70
|
+
`pupmapper` can be installed by cloning this repository and installing with `pip`.
|
|
71
|
+
|
|
72
|
+
```
|
|
73
|
+
git clone git@github.com:maxgmarin/pupmapper.git
|
|
74
|
+
|
|
75
|
+
cd pupmapper
|
|
76
|
+
|
|
77
|
+
pip install .
|
|
78
|
+
```
|
|
79
|
+
|
|
80
|
+
### `pip`
|
|
81
|
+
>🚧 Check back soon 🚧
|
|
82
|
+
|
|
83
|
+
### `conda`
|
|
84
|
+
>🚧 Check back soon 🚧
|
|
85
|
+
|
|
86
|
+
|
|
87
|
+
## Basic usage
|
|
88
|
+
|
|
89
|
+
|
|
90
|
+
#### 1) `run_all` - Run the full pipeline starting with an input genome
|
|
91
|
+
|
|
92
|
+
```
|
|
93
|
+
pupmapper run_all -i Input.Genome.fasta -o output_directory/ -k 50 -e 1
|
|
94
|
+
```
|
|
95
|
+
The above command will first use genmap to calculate k-mer mappability scores for the input genome and then calculate pileup mappability scores.
|
|
96
|
+
|
|
97
|
+
Arguments:
|
|
98
|
+
|
|
99
|
+
`-i, --in_genome_fa`: Input genome FASTA file. <br>
|
|
100
|
+
`-o, --outdir`: Directory for output files. <br>
|
|
101
|
+
`-k, --kmer_len`: K-mer length (e.g., 50 bp). <br>
|
|
102
|
+
`-e, --errors`: Number of allowed mismatches in k-mer mapping. <br>
|
|
103
|
+
`-g, --gff`: (Optional) Input genome annotations in GFF format. <br>
|
|
104
|
+
`--save-numpy`: (Optional) Save results as compressed numpy arrays. <br>
|
|
105
|
+
|
|
106
|
+
|
|
107
|
+
### Analyzing included test sequence
|
|
108
|
+
|
|
109
|
+
If you wish to run an `pupmapper` on a small test sequence (15 bp), you can run the following commands:
|
|
110
|
+
```
|
|
111
|
+
cd tests/data/Genmap_Ex1/
|
|
112
|
+
|
|
113
|
+
pupmapper run_all -i Ex1.genome.fasta -o Ex1_OutputDir -k 4 -e 0
|
|
114
|
+
```
|
|
115
|
+
This command will analyze the pileup mappability of the test sequence with a k-mer size of 4 bp and a max mismatch of 0 (K=4,E=0).
|
|
116
|
+
|
|
117
|
+
|
|
118
|
+
## Full usage
|
|
119
|
+
```
|
|
120
|
+
pupmapper run_all --help
|
|
121
|
+
usage: pupmapper run_all [-h] -i IN_GENOME_FA -o OUTDIR -k KMER_LEN -e ERRORS [-g GFF] [--save-numpy]
|
|
122
|
+
|
|
123
|
+
optional arguments:
|
|
124
|
+
-h, --help show this help message and exit
|
|
125
|
+
-i IN_GENOME_FA, --in_genome_fa IN_GENOME_FA
|
|
126
|
+
Input genome fasta file (.fasta)
|
|
127
|
+
-o OUTDIR, --outdir OUTDIR
|
|
128
|
+
Directory for all outputs of k-mer and pileup mappability processing.
|
|
129
|
+
-k KMER_LEN, --kmer_len KMER_LEN
|
|
130
|
+
k-mer length (bp) used to generate the k-mer mappability values
|
|
131
|
+
-e ERRORS, --errors ERRORS
|
|
132
|
+
Number of errors (mismatches) allowed in Genmap's k-mer mappability calculation
|
|
133
|
+
-g GFF, --gff GFF GFF formatted genome annotations for input genome (.gff) (Optional)
|
|
134
|
+
--save-numpy If enabled, all pileup mappability scores will be output as compressed numpy arrays (.npz).
|
|
135
|
+
```
|
|
136
|
+
|
|
137
|
+
|
|
138
|
+
|
|
139
|
+
|
|
140
|
+
|
|
141
|
+
|
|
@@ -0,0 +1,124 @@
|
|
|
1
|
+
<img width="500" src="https://github.com/maxgmarin/pupmapper/raw/main/Images/pupmapper.logo.png" alt="pupmapper logo">
|
|
2
|
+
|
|
3
|
+
[](https://opensource.org/licenses/MIT)
|
|
4
|
+

|
|
5
|
+
<!---[![Build Status]()]()
|
|
6
|
+
[![github release version]()]()
|
|
7
|
+
[![DOI]()]()
|
|
8
|
+
--->
|
|
9
|
+
|
|
10
|
+
Pupmapper: A **P**ile**up** **Map**pability Calculato**r**
|
|
11
|
+
|
|
12
|
+
<!---
|
|
13
|
+
> TBD Reference
|
|
14
|
+
--->
|
|
15
|
+
|
|
16
|
+
[TOC]: #
|
|
17
|
+
## Table of Contents
|
|
18
|
+
- [Motivation](#motivation)
|
|
19
|
+
- [Installation](#installation)
|
|
20
|
+
- [Install locally](#install-locally)
|
|
21
|
+
- [`pip`](#pip)
|
|
22
|
+
- [Basic usage](#basic-usage)
|
|
23
|
+
- [test data set](#analyzing-included-test-data-set)
|
|
24
|
+
- [Full usage](#full-usage)
|
|
25
|
+
|
|
26
|
+
|
|
27
|
+
## Motivation
|
|
28
|
+
The Pileup Mappability metric can be used to quickly identify regions which may be more difficult to perform variant calling with short-read WGS data. `pupmapper` was created to allow users to quickly convert k-mer mappability scores to pileup mappability.
|
|
29
|
+
|
|
30
|
+
The first step of the `pupmapper` pipeline is to calculate k-mer uniquness scores using the [Genmap](https://github.com/cpockrandt/genmap) software. Then pupmapper will summarize the pileup mappability of each genomic position using the k-mer uniqueness of all overlapping k-mers.
|
|
31
|
+
|
|
32
|
+
|
|
33
|
+
### How is pileup mappability calculated from individual k-mer uniqueness/mappability scores?
|
|
34
|
+
|
|
35
|
+
<img width="500" src="https://github.com/maxgmarin/pupmapper/raw/main/Images/Derrien2012.PmapFig.png" alt="PmapFig">
|
|
36
|
+
The Pileup mappability of a position is specifically calculated as the mean k-mer mappability of all k-mers overlapping a given position. <br>
|
|
37
|
+
|
|
38
|
+
A pileup mappability score of 1 indicates that all k-mers overlapping with a position are unique within the genome (using the user defined parameters of uniqueness).
|
|
39
|
+
|
|
40
|
+
**Pileup mappability is useful because it gives a sense of uniquemess of all possible reads (of defined length) that could align to a given position.**
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
### Useful reading for k-mer mappability and pileup mappability:
|
|
44
|
+
|
|
45
|
+
> Derrien, T, (2012). Fast Computation and Applications of Genome Mappability. PLOS ONE 7(1): e30377. [https://doi.org/10.1371/journal.pone.0030377](https://doi.org/10.1371/journal.pone.0030377)
|
|
46
|
+
|
|
47
|
+
> Pockrandt C, (2020) GenMap: ultra-fast computation of genome mappability, Bioinformatics, Volume 36, Issue 12, June 2020, Pages 3687–3692, [https://doi.org/10.1093/bioinformatics/btaa222](https://doi.org/10.1093/bioinformatics/btaa222)
|
|
48
|
+
|
|
49
|
+
> Lee H, Schatz MC. (2012). Genomic dark matter: the reliability of short read mapping illustrated by the genome mappability score, Bioinformatics, Volume 28, Issue 16, August 2012, Pages 2097–2105, [https://doi.org/10.1093/bioinformatics/bts330](https://doi.org/10.1093/bioinformatics/bts330)
|
|
50
|
+
|
|
51
|
+
## Installation
|
|
52
|
+
### Install locally
|
|
53
|
+
`pupmapper` can be installed by cloning this repository and installing with `pip`.
|
|
54
|
+
|
|
55
|
+
```
|
|
56
|
+
git clone git@github.com:maxgmarin/pupmapper.git
|
|
57
|
+
|
|
58
|
+
cd pupmapper
|
|
59
|
+
|
|
60
|
+
pip install .
|
|
61
|
+
```
|
|
62
|
+
|
|
63
|
+
### `pip`
|
|
64
|
+
>🚧 Check back soon 🚧
|
|
65
|
+
|
|
66
|
+
### `conda`
|
|
67
|
+
>🚧 Check back soon 🚧
|
|
68
|
+
|
|
69
|
+
|
|
70
|
+
## Basic usage
|
|
71
|
+
|
|
72
|
+
|
|
73
|
+
#### 1) `run_all` - Run the full pipeline starting with an input genome
|
|
74
|
+
|
|
75
|
+
```
|
|
76
|
+
pupmapper run_all -i Input.Genome.fasta -o output_directory/ -k 50 -e 1
|
|
77
|
+
```
|
|
78
|
+
The above command will first use genmap to calculate k-mer mappability scores for the input genome and then calculate pileup mappability scores.
|
|
79
|
+
|
|
80
|
+
Arguments:
|
|
81
|
+
|
|
82
|
+
`-i, --in_genome_fa`: Input genome FASTA file. <br>
|
|
83
|
+
`-o, --outdir`: Directory for output files. <br>
|
|
84
|
+
`-k, --kmer_len`: K-mer length (e.g., 50 bp). <br>
|
|
85
|
+
`-e, --errors`: Number of allowed mismatches in k-mer mapping. <br>
|
|
86
|
+
`-g, --gff`: (Optional) Input genome annotations in GFF format. <br>
|
|
87
|
+
`--save-numpy`: (Optional) Save results as compressed numpy arrays. <br>
|
|
88
|
+
|
|
89
|
+
|
|
90
|
+
### Analyzing included test sequence
|
|
91
|
+
|
|
92
|
+
If you wish to run an `pupmapper` on a small test sequence (15 bp), you can run the following commands:
|
|
93
|
+
```
|
|
94
|
+
cd tests/data/Genmap_Ex1/
|
|
95
|
+
|
|
96
|
+
pupmapper run_all -i Ex1.genome.fasta -o Ex1_OutputDir -k 4 -e 0
|
|
97
|
+
```
|
|
98
|
+
This command will analyze the pileup mappability of the test sequence with a k-mer size of 4 bp and a max mismatch of 0 (K=4,E=0).
|
|
99
|
+
|
|
100
|
+
|
|
101
|
+
## Full usage
|
|
102
|
+
```
|
|
103
|
+
pupmapper run_all --help
|
|
104
|
+
usage: pupmapper run_all [-h] -i IN_GENOME_FA -o OUTDIR -k KMER_LEN -e ERRORS [-g GFF] [--save-numpy]
|
|
105
|
+
|
|
106
|
+
optional arguments:
|
|
107
|
+
-h, --help show this help message and exit
|
|
108
|
+
-i IN_GENOME_FA, --in_genome_fa IN_GENOME_FA
|
|
109
|
+
Input genome fasta file (.fasta)
|
|
110
|
+
-o OUTDIR, --outdir OUTDIR
|
|
111
|
+
Directory for all outputs of k-mer and pileup mappability processing.
|
|
112
|
+
-k KMER_LEN, --kmer_len KMER_LEN
|
|
113
|
+
k-mer length (bp) used to generate the k-mer mappability values
|
|
114
|
+
-e ERRORS, --errors ERRORS
|
|
115
|
+
Number of errors (mismatches) allowed in Genmap's k-mer mappability calculation
|
|
116
|
+
-g GFF, --gff GFF GFF formatted genome annotations for input genome (.gff) (Optional)
|
|
117
|
+
--save-numpy If enabled, all pileup mappability scores will be output as compressed numpy arrays (.npz).
|
|
118
|
+
```
|
|
119
|
+
|
|
120
|
+
|
|
121
|
+
|
|
122
|
+
|
|
123
|
+
|
|
124
|
+
|