RubyGems - miga-base - Versions diffs - 0.3.0.0 → 0.3.0.1 - Mend

miga-base 0.3.0.0 → 0.3.0.1

Files changed (260) hide show

checksums.yaml +4 -4
data/README.md +21 -4
data/actions/init.rb +258 -0
data/actions/run_local.rb +1 -2
data/actions/test_taxonomy.rb +4 -1
data/bin/miga +8 -1
data/lib/miga/dataset.rb +4 -4
data/lib/miga/dataset_result.rb +7 -4
data/lib/miga/version.rb +2 -2
data/scripts/_distances_noref_nomulti.bash +3 -1
data/scripts/clade_finding.bash +1 -1
data/scripts/init.bash +1 -1
data/scripts/miga.bash +1 -1
data/scripts/mytaxa.bash +78 -72
data/scripts/mytaxa_scan.bash +67 -62
data/scripts/ogs.bash +1 -1
data/scripts/trimmed_fasta.bash +4 -3
data/utils/enveomics/Examples/aai-matrix.bash +66 -0
data/utils/enveomics/Examples/ani-matrix.bash +66 -0
data/utils/enveomics/Examples/essential-phylogeny.bash +105 -0
data/utils/enveomics/Examples/unus-genome-phylogeny.bash +100 -0
data/utils/enveomics/LICENSE.txt +73 -0
data/utils/enveomics/Makefile +52 -0
data/utils/enveomics/Manifest/Tasks/aasubs.json +103 -0
data/utils/enveomics/Manifest/Tasks/blasttab.json +703 -0
data/utils/enveomics/Manifest/Tasks/distances.json +161 -0
data/utils/enveomics/Manifest/Tasks/fasta.json +571 -0
data/utils/enveomics/Manifest/Tasks/fastq.json +208 -0
data/utils/enveomics/Manifest/Tasks/graphics.json +126 -0
data/utils/enveomics/Manifest/Tasks/ogs.json +339 -0
data/utils/enveomics/Manifest/Tasks/other.json +746 -0
data/utils/enveomics/Manifest/Tasks/remote.json +355 -0
data/utils/enveomics/Manifest/Tasks/sequence-identity.json +454 -0
data/utils/enveomics/Manifest/Tasks/tables.json +308 -0
data/utils/enveomics/Manifest/Tasks/trees.json +68 -0
data/utils/enveomics/Manifest/Tasks/variants.json +111 -0
data/utils/enveomics/Manifest/categories.json +132 -0
data/utils/enveomics/Manifest/examples.json +154 -0
data/utils/enveomics/Manifest/tasks.json +4 -0
data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +69 -0
data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +56 -0
data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +60 -0
data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +38 -0
data/utils/enveomics/Pipelines/assembly.pbs/README.md +189 -0
data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +112 -0
data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +23 -0
data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +44 -0
data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +50 -0
data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +37 -0
data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +68 -0
data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +49 -0
data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +80 -0
data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +57 -0
data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +63 -0
data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +38 -0
data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +73 -0
data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +21 -0
data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +72 -0
data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +98 -0
data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +55 -0
data/utils/enveomics/Pipelines/blast.pbs/README.md +127 -0
data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +109 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +128 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +16 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +22 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +26 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +89 -0
data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +29 -0
data/utils/enveomics/Pipelines/idba.pbs/README.md +49 -0
data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +95 -0
data/utils/enveomics/Pipelines/idba.pbs/run.pbs +56 -0
data/utils/enveomics/Pipelines/trim.pbs/README.md +54 -0
data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +70 -0
data/utils/enveomics/Pipelines/trim.pbs/run.pbs +130 -0
data/utils/enveomics/README.md +40 -0
data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +171 -0
data/utils/enveomics/Scripts/Aln.cat.rb +162 -0
data/utils/enveomics/Scripts/Aln.convert.pl +35 -0
data/utils/enveomics/Scripts/AlphaDiversity.pl +152 -0
data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +102 -0
data/utils/enveomics/Scripts/BlastTab.addlen.rb +61 -0
data/utils/enveomics/Scripts/BlastTab.advance.bash +48 -0
data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +55 -0
data/utils/enveomics/Scripts/BlastTab.catsbj.pl +106 -0
data/utils/enveomics/Scripts/BlastTab.cogCat.rb +76 -0
data/utils/enveomics/Scripts/BlastTab.filter.pl +47 -0
data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +194 -0
data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +104 -0
data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +157 -0
data/utils/enveomics/Scripts/BlastTab.recplot2.R +40 -0
data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +86 -0
data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +119 -0
data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +86 -0
data/utils/enveomics/Scripts/BlastTab.subsample.pl +47 -0
data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +114 -0
data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +90 -0
data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +101 -0
data/utils/enveomics/Scripts/Chao1.pl +97 -0
data/utils/enveomics/Scripts/CharTable.classify.rb +234 -0
data/utils/enveomics/Scripts/EBIseq2tax.rb +83 -0
data/utils/enveomics/Scripts/FastA.N50.pl +56 -0
data/utils/enveomics/Scripts/FastA.filter.pl +52 -0
data/utils/enveomics/Scripts/FastA.filterLen.pl +28 -0
data/utils/enveomics/Scripts/FastA.filterN.pl +60 -0
data/utils/enveomics/Scripts/FastA.fragment.rb +92 -0
data/utils/enveomics/Scripts/FastA.gc.pl +42 -0
data/utils/enveomics/Scripts/FastA.interpose.pl +87 -0
data/utils/enveomics/Scripts/FastA.length.pl +38 -0
data/utils/enveomics/Scripts/FastA.per_file.pl +36 -0
data/utils/enveomics/Scripts/FastA.qlen.pl +57 -0
data/utils/enveomics/Scripts/FastA.rename.pl +65 -0
data/utils/enveomics/Scripts/FastA.revcom.pl +23 -0
data/utils/enveomics/Scripts/FastA.slider.pl +85 -0
data/utils/enveomics/Scripts/FastA.split.pl +55 -0
data/utils/enveomics/Scripts/FastA.subsample.pl +131 -0
data/utils/enveomics/Scripts/FastA.tag.rb +64 -0
data/utils/enveomics/Scripts/FastA.wrap.rb +48 -0
data/utils/enveomics/Scripts/FastQ.filter.pl +54 -0
data/utils/enveomics/Scripts/FastQ.interpose.pl +90 -0
data/utils/enveomics/Scripts/FastQ.offset.pl +90 -0
data/utils/enveomics/Scripts/FastQ.split.pl +53 -0
data/utils/enveomics/Scripts/FastQ.tag.rb +63 -0
data/utils/enveomics/Scripts/FastQ.toFastA.awk +24 -0
data/utils/enveomics/Scripts/GenBank.add_fields.rb +84 -0
data/utils/enveomics/Scripts/HMM.essential.rb +254 -0
data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +83 -0
data/utils/enveomics/Scripts/JPlace.distances.rb +88 -0
data/utils/enveomics/Scripts/JPlace.to_iToL.rb +306 -0
data/utils/enveomics/Scripts/M5nr.getSequences.rb +81 -0
data/utils/enveomics/Scripts/MeTaxa.distribution.pl +198 -0
data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +35 -0
data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +49 -0
data/utils/enveomics/Scripts/NCBIacc2tax.rb +92 -0
data/utils/enveomics/Scripts/Newick.autoprune.R +27 -0
data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +228 -0
data/utils/enveomics/Scripts/RefSeq.download.bash +48 -0
data/utils/enveomics/Scripts/SRA.download.bash +50 -0
data/utils/enveomics/Scripts/TRIBS.plot-test.R +36 -0
data/utils/enveomics/Scripts/TRIBS.test.R +39 -0
data/utils/enveomics/Scripts/Table.barplot.R +30 -0
data/utils/enveomics/Scripts/Table.df2dist.R +30 -0
data/utils/enveomics/Scripts/Table.filter.pl +61 -0
data/utils/enveomics/Scripts/Table.merge.pl +77 -0
data/utils/enveomics/Scripts/Table.replace.rb +69 -0
data/utils/enveomics/Scripts/Table.round.rb +63 -0
data/utils/enveomics/Scripts/Table.split.pl +57 -0
data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +227 -0
data/utils/enveomics/Scripts/VCF.KaKs.rb +147 -0
data/utils/enveomics/Scripts/VCF.SNPs.rb +88 -0
data/utils/enveomics/Scripts/aai.rb +373 -0
data/utils/enveomics/Scripts/ani.rb +362 -0
data/utils/enveomics/Scripts/gi2tax.rb +103 -0
data/utils/enveomics/Scripts/in_silico_GA_GI.pl +96 -0
data/utils/enveomics/Scripts/lib/data/essential.hmm.gz +0 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +26 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +253 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +182 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +74 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +237 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/stat.rb +30 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +135 -0
data/utils/enveomics/Scripts/ogs.annotate.rb +88 -0
data/utils/enveomics/Scripts/ogs.core-pan.rb +160 -0
data/utils/enveomics/Scripts/ogs.extract.rb +125 -0
data/utils/enveomics/Scripts/ogs.mcl.rb +186 -0
data/utils/enveomics/Scripts/ogs.rb +104 -0
data/utils/enveomics/Scripts/ogs.stats.rb +131 -0
data/utils/enveomics/Scripts/rbm.rb +137 -0
data/utils/enveomics/Tests/Makefile +10 -0
data/utils/enveomics/Tests/Mgen_M2288.faa +3189 -0
data/utils/enveomics/Tests/Mgen_M2288.fna +8282 -0
data/utils/enveomics/Tests/Mgen_M2321.fna +8288 -0
data/utils/enveomics/Tests/Nequ_Kin4M.faa +2970 -0
data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +7 -0
data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +17 -0
data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +137 -0
data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +123 -0
data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +200 -0
data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +55 -0
data/utils/enveomics/Tests/alkB.nwk +1 -0
data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +13 -0
data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +17 -0
data/utils/enveomics/Tests/hiv1.faa +59 -0
data/utils/enveomics/Tests/hiv1.fna +134 -0
data/utils/enveomics/Tests/hiv2.faa +70 -0
data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +233 -0
data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +1 -0
data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +233 -0
data/utils/enveomics/Tests/phyla_counts.tsv +10 -0
data/utils/enveomics/Tests/primate_lentivirus.ogs +11 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +9 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +8 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +6 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +9 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +6 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +6 -0
data/utils/enveomics/build_enveomics_r.bash +44 -0
data/utils/enveomics/enveomics.R/DESCRIPTION +31 -0
data/utils/enveomics/enveomics.R/NAMESPACE +35 -0
data/utils/enveomics/enveomics.R/R/autoprune.R +121 -0
data/utils/enveomics/enveomics.R/R/barplot.R +165 -0
data/utils/enveomics/enveomics.R/R/cliopts.R +119 -0
data/utils/enveomics/enveomics.R/R/df2dist.R +117 -0
data/utils/enveomics/enveomics.R/R/growthcurve.R +263 -0
data/utils/enveomics/enveomics.R/R/recplot.R +320 -0
data/utils/enveomics/enveomics.R/R/recplot2.R +745 -0
data/utils/enveomics/enveomics.R/R/tribs.R +423 -0
data/utils/enveomics/enveomics.R/R/utils.R +16 -0
data/utils/enveomics/enveomics.R/README.md +52 -0
data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +30 -0
data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +43 -0
data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +19 -0
data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +37 -0
data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +24 -0
data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +24 -0
data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +33 -0
data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +64 -0
data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +37 -0
data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +19 -0
data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +18 -0
data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +26 -0
data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +25 -0
data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +26 -0
data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +49 -0
data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +28 -0
data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +97 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +40 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +40 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +24 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.__findPeak.Rd +40 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.__findPeaks.Rd +18 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +22 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +20 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +18 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +18 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +27 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +53 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +44 -0
data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +44 -0
data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +21 -0
data/utils/enveomics/enveomics.R/man/enveomics.R-package.Rd +15 -0
data/utils/enveomics/enveomics.R/man/growth.curves.Rd +14 -0
data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +13 -0
data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +43 -0
data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +29 -0
data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +30 -0
data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +71 -0
data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +18 -0
data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +18 -0
data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +18 -0
data/utils/enveomics/enveomics.R/man/z$-methods.Rd +27 -0
data/utils/enveomics/globals.mk +8 -0
data/utils/enveomics/manifest.json +9 -0
data/utils/index_metadata.rb +0 -0
data/utils/plot-taxdist.R +0 -0
data/utils/requirements.txt +19 -19
metadata +242 -2

data/utils/enveomics/enveomics.R/R/recplot.R ADDED Viewed

@@ -0,0 +1,320 @@
+enve.recplot <- structure(function(
+	### Produces recruitment plots provided that BlastTab.catsbj.pl has
+	### been previously executed. Requires the gplots library. The plot is
+	### drawn on the current graphics device as a 2x2 layout: position
+	### histogram (top-left), legend (top-right), recruitment plot
+	### (bottom-left), and identity histogram (bottom-right).
+	prefix,
+	### Path to the prefix of the BlastTab.catsbj.pl output files. At
+	### least the files .rec and .lim must exist with this prefix.
+	# Id. hist.
+	id.min=NULL,
+	### Minimum identity to be considered. By default, the minimum detected
+	### identity. This value is a percentage.
+	id.max=NULL,
+	### Maximum identity to be considered. By default, 100 for the identity
+	### metrics and the maximum observed value for bit score.
+	id.binsize=NULL,
+	### Size of the identity bins (vertical histograms). By default, 0.1 for
+	### identity metrics and 5 for bit score.
+	id.splines=0,
+	### Smoothing parameter for the splines in the identity histogram. Zero (0) for no
+	### splines. A generally good value is 1/2. If non-zero, requires the stats package.
+	id.metric='id',
+	### Metric of identity to be used (Y-axis). It can be any unambiguous prefix
+	### of "identity", "corrected identity", or "bit score".
+	id.summary='sum',
+	### Method used to build the identity histogram (Horizontal axis of the right panel).
+	### It can be any unambiguous prefix of "sum", "average", "median", "90% lower bound",
+	### "90% upper bound", "95% lower bound", and "95% upper bound". The last four options
+	### correspond to the upper and lower boundaries of the 90% and 95% empirical confidence
+	### intervals.
+	# Pos. hist.
+	pos.min=1,
+	### Minimum (leftmost) position in the reference (concatenated) genome (in bp).
+	pos.max=NULL,
+	### Maximum (rightmost) position in the reference (concatenated) genome (in bp).
+	### By default: Length of the genome.
+	pos.binsize=1e3,
+	### Size of the position bins (horizontal histograms) in bp.
+	pos.splines=0,
+	### Smoothing parameter for the splines in the position histogram. Zero (0) for no splines.
+	### If non-zero, requires the stats package.
+	# Rec. plot
+	rec.col1='white',
+	### Lightest color in the recruitment plot.
+	rec.col2='black',
+	### Darkest color in the recruitment plot.
+	# General
+	main=NULL,
+	### Title of the plot. By default, 'Recruitment plot of ' followed by the prefix.
+	contig.col=grey(0.85),
+	### Color of the Contig boundaries. Set to NA to ignore Contig boundaries.
+	# Return
+	ret.recplot=FALSE,
+	### Indicates if the matrix of the recruitment plot is to be returned.
+	ret.hist=FALSE,
+	### Indicates if the vectors of the identity and position histograms are to be returned.
+	ret.mode=FALSE,
+	### Indicates if the mode of the identity is to be computed. It requires the modeest
+	### package.
+	# General
+	id.cutoff=NULL,
+	### Minimum identity to consider an alignment as "top". By default, it is 95 (percent)
+	### for the identity metrics and 95% of the best scoring alignment for bit score.
+	verbose=TRUE,
+	### Indicates if the function should report the advance.
+	...
+	### Any additional graphic parameters to be passed to plot for all panels except the
+	### recruitment plot (lower-left).
+	){
+   # Settings
+   METRICS <- c('identity', 'corrected identity', 'bit score');
+   # Every documented summary must be listed here, in the same order as the branches
+   # below, so that prefix matching can reach the quantile-based options (4 to 7).
+   SUMMARY <- c('sum', 'average', 'median', '90% lower bound', '90% upper bound',
+      '95% lower bound', '95% upper bound');
+   if(is.null(prefix)) stop('Parameter prefix is mandatory.');
+   if(!requireNamespace("gplots", quietly=TRUE)) stop('Unavailable gplots library.');
+   # Read files
+   if(verbose) cat("Reading files.\n")
+   rec <- read.table(paste(prefix, '.rec', sep=''), sep="\t", comment.char='', quote='');
+   lim <- read.table(paste(prefix, '.lim', sep=''), sep="\t", comment.char='', quote='');
+   # Configure ID summary
+   # charmatch returns NA when nothing matches and 0 when the prefix is ambiguous,
+   # which lets both error conditions be reported separately.
+   id.summary <- charmatch(id.summary, SUMMARY);
+   if(is.na(id.summary)) stop('Invalid identity summary.');
+   if(id.summary == 0) stop('Ambiguous identity summary.');
+   if(id.summary==1){
+      id.summary.func <- function(x) colSums(x);
+      id.summary.name <- 'sum'
+   }else if(id.summary==2){
+      id.summary.func <- function(x) colMeans(x);
+      id.summary.name <- 'mean'
+   }else if(id.summary==3){
+      id.summary.func <- function(x) apply(x,2,median);
+      id.summary.name <- 'median'
+   }else if(id.summary==4){
+      id.summary.func <- function(x) apply(x,2,quantile,probs=0.05,names=FALSE);
+      id.summary.name <- '90% LB'
+   }else if(id.summary==5){
+      id.summary.func <- function(x) apply(x,2,quantile,probs=0.95,names=FALSE);
+      id.summary.name <- '90% UB'
+   }else if(id.summary==6){
+      id.summary.func <- function(x) apply(x,2,quantile,probs=0.025,names=FALSE);
+      id.summary.name <- '95% LB'
+   }else if(id.summary==7){
+      id.summary.func <- function(x) apply(x,2,quantile,probs=0.975,names=FALSE);
+      id.summary.name <- '95% UB'
+   }
+   # Configure metrics
+   id.metric <- charmatch(id.metric, METRICS);
+   if(is.na(id.metric)) stop('Invalid identity metric.');
+   if(id.metric == 0) stop('Ambiguous identity metric.');
+   if(id.metric==1){
+      id.reccol <- 3
+      id.shortname <- 'Id.'
+      id.fullname  <- 'Identity'
+      id.units     <- '%'
+      id.hallmarks <- seq(0, 100, by=5)
+      if(is.null(id.max)) id.max <- 100
+      if(is.null(id.cutoff)) id.cutoff <- 95
+      if(is.null(id.binsize)) id.binsize <- 0.1
+   }else if(id.metric==2){
+      if(ncol(rec)<6) stop("Requesting corrected identity, but .rec file doesn't have 6th column")
+      id.reccol <- 6
+      id.shortname <- 'cId.'
+      id.fullname  <- 'Corrected identity'
+      id.units     <- '%'
+      id.hallmarks <- seq(0, 100, by=5)
+      if(is.null(id.max)) id.max <- 100
+      if(is.null(id.cutoff)) id.cutoff <- 95
+      if(is.null(id.binsize)) id.binsize <- 0.1
+   }else if(id.metric==3){
+      id.reccol <- 4
+      id.shortname <- 'BSc.'
+      id.fullname  <- 'Bit score'
+      id.units     <- 'bits'
+      max.bs <- max(rec[, id.reccol])
+      id.hallmarks <- seq(0, max.bs*1.2, by=50)
+      if(is.null(id.max)) id.max <- max.bs
+      if(is.null(id.cutoff)) id.cutoff <- 0.95 * max.bs
+      if(is.null(id.binsize)) id.binsize <- 5
+   }
+   if(is.null(id.min)) id.min <- min(rec[, id.reccol]);
+   if(is.null(pos.max)) pos.max <- max(lim[, 3]);
+   id.lim <- c(id.min, id.max);
+   pos.lim <- c(pos.min, pos.max)/1e6;
+   id.breaks <- round((id.max-id.min)/id.binsize);
+   pos.breaks <- round((pos.max-pos.min)/pos.binsize);
+   if(is.null(main)) main <- paste('Recruitment plot of ', prefix, sep='');
+   # Bin boundaries: positions are expressed in Mbp, identities in the metric units.
+   pos.marks <- seq(pos.min, pos.max, length.out=pos.breaks+1)/1e6;
+   id.marks <- seq(id.min, id.max, length.out=id.breaks+1);
+   # Number of identity boundaries strictly above the cutoff.
+   id.topclasses <- sum(id.marks > id.cutoff);
+   # Set-up image
+   layout(matrix(c(3,4,1,2), nrow=2, byrow=TRUE), widths=c(2,1), heights=c(1,2));
+   out <- list();
+   # Recruitment plot
+   if(verbose) cat("Rec. plot.\n")
+   par(mar=c(5,4,0,0)+0.1);
+   rec.hist <- matrix(0, nrow=pos.breaks, ncol=id.breaks);
+   for(i in seq_len(nrow(rec))){
+      id.class <- ceiling((id.breaks)*((rec[i, id.reccol]-id.min)/(id.max-id.min)));
+      if(id.class<=id.breaks && id.class>0){
+         # Bin every base covered by the alignment at once; bases falling outside
+         # the plotted position range are discarded before counting.
+         pos <- rec[i, 1]:rec[i, 2];
+         pos.class <- ceiling((pos.breaks)*((pos-pos.min)/(pos.max-pos.min)));
+         pos.class <- pos.class[pos.class<=pos.breaks & pos.class>0];
+         rec.hist[, id.class] <- rec.hist[, id.class] + tabulate(pos.class, nbins=pos.breaks);
+      }
+   }
+   # Columns of rec.hist regarded as "top" identity (the last id.topclasses bins).
+   # NOTE(review): when no boundary exceeds id.cutoff (id.topclasses is 0) this
+   # evaluates to c(id.breaks+1, id.breaks), which indexes one column past rec.hist;
+   # confirm whether id.cutoff >= id.max needs to be supported.
+   id.top <- c((1-id.topclasses):0) + id.breaks;
+   rec.col <- gplots::colorpanel(256, rec.col1, rec.col2);
+   image(x=pos.marks, y=id.marks, z=log10(rec.hist),
+         breaks=seq(0, log10(max(rec.hist)), length.out=1+length(rec.col)), col=rec.col,
+         xlim=pos.lim, ylim=id.lim, xlab='Position in genome (Mbp)',
+         ylab=paste(id.fullname, ' (',id.units,')', sep=''), xaxs='i', yaxs='r');
+   if(!is.na(contig.col)) abline(v=c(lim[,2], lim[,3])/1e6, lty=1, col=contig.col);
+   abline(h=id.hallmarks, lty=2, col=grey(0.7));
+   abline(h=id.marks[id.top[1]], lty=3, col=grey(0.5))
+   legend('bottomleft', 'Rec. plot', bg=rgb(1,1,1,2/3));
+   out <- c(out, list(pos.marks=pos.marks, id.marks=id.marks));
+   if(ret.recplot) out <- c(out, list(recplot=rec.hist));
+   # Identity histogram
+   if(verbose) cat(id.shortname, " hist.\n", sep='')
+   par(mar=c(5,0,0,2)+0.1);
+   id.hist <- id.summary.func(rec.hist);
+   plot(1, type='n', xlim=c(1, max(id.hist)), ylim=id.lim, ylab='', yaxt='n', xlab=paste('Sequences (bp),', id.summary.name), log='x', ...);
+   # Duplicate boundaries and values so that the histogram is drawn as steps.
+   id.x <- rep(id.marks, each=2)[2:(id.breaks*2+1)]
+   id.f <- rep(id.hist, each=2)[1:(id.breaks*2)]
+   if(sum(id.f)>0){
+      lines(id.f, id.x, lwd=ifelse(id.splines>0, 1/2, 2), type='o', pch='.');
+      if(id.splines>0){
+         id.spline <- smooth.spline(id.x[id.f>0], log(id.f[id.f>0]), spar=id.splines)
+         lines(exp(id.spline$y), id.spline$x, lwd=2)
+      }
+   }
+   abline(h=id.hallmarks, lty=2, col=grey(0.7));
+   abline(h=id.marks[id.top[1]], lty=3, col=grey(0.5))
+   legend('bottomright', paste(id.shortname, 'histogram'), bg=rgb(1,1,1,2/3));
+   out <- c(out, list(id.mean=mean(rec[, id.reccol])));
+   out <- c(out, list(id.median=median(rec[, id.reccol])));
+   if(ret.mode)   out <- c(out, list(id.mode=modeest::mlv(rec[, id.reccol], method='mfv')$M));
+   if(ret.hist)  out <- c(out, list(id.hist=id.hist));
+   # Position histogram
+   if(verbose) cat("Pos. hist.\n")
+   par(mar=c(0,4,4,0)+0.1);
+   h1 <- rep(0,nrow(rec.hist));
+   h2 <- rep(0,nrow(rec.hist));
+   pos.winsize <- (pos.max-pos.min+1)/pos.breaks;
+   # h1: depth from "top" identity bins; h2: depth from the remaining bins.
+   if(sum(rec.hist[, id.top])>0) h1 <- rowSums(matrix(rec.hist[, id.top], nrow=nrow(rec.hist)))/pos.winsize;
+   if(sum(rec.hist[,-id.top])>0) h2 <- rowSums(matrix(rec.hist[,-id.top], nrow=nrow(rec.hist)))/pos.winsize;
+   ymin <- min(1, h1[h1>0], h2[h2>0]);
+   ymax <- max(10, h1, h2);
+   if(is.na(ymin) || ymin<=0) ymin <- 1e-10;
+   if(is.na(ymax) || ymax<=0) ymax <- 1;
+   plot(1, type='n', xlab='', xaxt='n', ylab='Sequencing depth (X)', log='y', xlim=pos.lim,
+        ylim=c(ymin, ymax), xaxs='i', main=main, ...);
+   if(!is.na(contig.col)) abline(v=c(lim[,2], lim[,3])/1e6, lty=1, col=contig.col);
+   abline(h=10^c(0:5), lty=2, col=grey(0.7));
+   if(sum(h2)>0){
+      h2.x <- rep(pos.marks, each=2)[2:(pos.breaks*2+1)]
+      h2.y <- rep(h2, each=2)[1:(pos.breaks*2)]
+      lines(h2.x, h2.y, lwd=ifelse(pos.splines>0, 1/2, 2), col=grey(0.5));
+      if(pos.splines>0){
+         h2.spline <- smooth.spline(h2.x[h2.y>0], log(h2.y[h2.y>0]), spar=pos.splines)
+         lines(h2.spline$x, exp(h2.spline$y), lwd=2, col=grey(0.5))
+      }
+      if(ret.hist) out <- c(out, list(pos.hist.low=h2.y));
+   }
+   if(sum(h1)>0){
+      h1.x <- rep(pos.marks, each=2)[2:(pos.breaks*2+1)]
+      h1.y <- rep(h1, each=2)[1:(pos.breaks*2)]
+      lines(h1.x, h1.y, lwd=ifelse(pos.splines>0, 1/2, 2), col=grey(0));
+      if(pos.splines>0){
+         h1.spline <- smooth.spline(h1.x[h1.y>0], log(h1.y[h1.y>0]), spar=pos.splines)
+         lines(h1.spline$x, exp(h1.spline$y), lwd=2, col=grey(0))
+      }
+      if(ret.hist) out <- c(out, list(pos.hist.top=h1.y));
+   }
+   legend('topleft', 'Pos. histogram', bg=rgb(1,1,1,2/3));
+   out <- c(out, list(id.max=id.max, id.cutoff=id.marks[id.top[1]]));
+   out <- c(out, list(seqdepth.mean.top=mean(h1)));
+   out <- c(out, list(seqdepth.mean.low=mean(h2)));
+   out <- c(out, list(seqdepth.mean=mean(h1+h2)));
+   out <- c(out, list(seqdepth.median.top=median(h1)));
+   out <- c(out, list(seqdepth.median.low=median(h2)));
+   out <- c(out, list(seqdepth.median=median(h1+h2)));
+   out <- c(out, list(id.metric=id.fullname));
+   out <- c(out, list(id.summary=id.summary.name));
+   # Legend
+   par(mar=c(0,0,4,2)+0.1);
+   plot(1, type='n', xlab='', xaxt='n', ylab='', yaxt='n', xlim=c(0,1), ylim=c(0,1), xaxs='r', yaxs='i', ...);
+   text(1/2, 5/6, labels=paste('Reads per ', signif((pos.max-pos.min)/pos.breaks, 2), ' bp (rec. plot)', sep=''), pos=3);
+   leg.col <- gplots::colorpanel(100, rec.col1, rec.col2);
+   leg.lab <- signif(10^seq(0, log10(max(rec.hist)), length.out=10), 2);
+   # Color ramp made of 100 thin rectangles, labelled once every 10 rectangles.
+   for(i in 1:10){
+      for(j in 1:10){
+         k <- (i-1)*10 + j;
+         polygon(c(k-1, k, k, k-1)/100, c(2/3, 2/3, 5/6, 5/6), border=leg.col[k], col=leg.col[k]);
+      }
+      text((i-0.5)/10, 2/3, labels=paste(leg.lab[i], ''), srt=90, pos=2, offset=0, cex=3/4);
+   }
+   legend('bottom',
+        legend=c('Contig boundary', 'Hallmark', paste(id.fullname, 'cutoff'),
+                paste('Pos. hist.: ',id.shortname,' > ',signif(id.marks[id.top[1]],2),id.units,sep=''),
+                paste('Pos. hist.: ',id.shortname,' < ',signif(id.marks[id.top[1]],2),id.units,sep='')), ncol=2,
+        col=grey(c(0.85, 0.7, 0.5, 0, 0.5)), lty=c(1,2,3,1,1), lwd=c(1,1,1,2,2), bty='n', inset=0.05, cex=5/6);
+   return(out);
+   ### A list with the following elements:
+   ###
+   ### pos.marks: Boundaries of the position bins (in Mbp).
+   ###
+   ### id.marks: Boundaries of the identity bins.
+   ###
+   ### recplot (if ret.recplot=TRUE): Matrix containing the recruitment plot values.
+   ###
+   ### id.mean: Mean identity.
+   ###
+   ### id.median: Median identity.
+   ###
+   ### id.mode (if ret.mode=TRUE): Mode of the identity.
+   ###
+   ### id.hist (if ret.hist=TRUE): Values of the identity histogram.
+   ###
+   ### pos.hist.low (if ret.hist=TRUE): Values of the position histogram (depth) with "low"
+   ### identity (i.e., below id.cutoff). Only present if any such depth is non-zero.
+   ###
+   ### pos.hist.top (if ret.hist=TRUE): Values of the position histogram (depth) with "top"
+   ### identity (i.e., above id.cutoff). Only present if any such depth is non-zero.
+   ###
+   ### id.max: Value of id.max. This is returned because id.max=NULL may vary.
+   ###
+   ### id.cutoff: Identity cutoff actually used, i.e., the boundary of the identity bins
+   ### at which the "top" bins start. This is returned because id.cutoff=NULL may vary.
+   ###
+   ### seqdepth.mean.top: Average sequencing depth with identity above id.cutoff.
+   ###
+   ### seqdepth.mean.low: Average sequencing depth with identity below id.cutoff.
+   ###
+   ### seqdepth.mean: Average sequencing depth without identity filtering.
+   ###
+   ### seqdepth.median.top: Median sequencing depth with identity above id.cutoff.
+   ###
+   ### seqdepth.median.low: Median sequencing depth with identity below id.cutoff.
+   ###
+   ### seqdepth.median: Median sequencing depth without identity filtering.
+   ###
+   ### id.metric: Full name of the used identity metric.
+   ###
+   ### id.summary: Short name of the summary method used to build the identity plot.
+});

data/utils/enveomics/enveomics.R/R/recplot2.R ADDED Viewed

@@ -0,0 +1,745 @@
+#==============> Define S4 classes
+setClass("enve.RecPlot2",
+   ### Enve-omics representation of Recruitment plots. This object can
+   ### be produced by `enve.recplot2` and supports S4 method plot. Slots can
+   ### also be read with the `$` operator (e.g., `x$counts`).
+   representation(
+   counts='matrix',		##<< Counts as a two-dimensional histogram (rows: position bins, columns: identity bins).
+   pos.counts.in='numeric',	##<< Counts of in-group hits per position bin.
+   pos.counts.out='numeric',	##<< Counts of out-group hits per position bin.
+   id.counts='numeric',		##<< Counts per ID bin.
+   id.breaks='numeric',		##<< Breaks of identity bins.
+   pos.breaks='numeric',	##<< Breaks of position bins.
+   seq.breaks='numeric',
+   ### Limits of the subject sequences after concatenation.
+   peaks='list',                ##<< Peaks identified in the recplot.
+   seq.names='character',	##<< Names of the subject sequences.
+   id.metric='character',	##<< Metric used as 'identity'.
+   id.ingroup='logical',	##<< Identity bins considered in-group.
+   call='call')			##<< Call producing this object.
+   ,package='enveomics.R'
+   );
+setClass("enve.RecPlot2.Peak",
+### Enve-omics representation of a peak in the sequencing depth histogram
+### of a Recruitment plot (see `enve.recplot2.findPeaks`). Slots can also be
+### read with the `$` operator (e.g., `peak$param.hat`).
+   representation(
+   dist='character',
+   ### Distribution of the peak. Currently supported: 'norm' (normal) and 'sn'
+   ### (skew-normal).
+   values='numeric',
+   ### Sequencing depth values predicted to make up the peak.
+   values.res='numeric',
+   ### Sequencing depth values not explained by this or previously identified
+   ### peaks.
+   mode='numeric',
+   ### Seed-value of mode anchoring the peak.
+   param.hat='list',
+   ### Parameters of the distribution. A list of two values if dist='norm' (sd
+   ### and mean), or three values if dist='sn' (omega=scale, alpha=shape, and
+   ### xi=location). Note that the "dispersion" parameter is always first and
+   ### the "location" parameter is always last.
+   n.hat='numeric',
+   ### Number of bins estimated to be explained by this peak. This should
+   ### ideally be equal to the length of `values`, but it is not necessarily
+   ### an integer.
+   n.total='numeric',
+   ### Total number of bins from which the peak was extracted. I.e., total
+   ### number of position bins with non-zero sequencing depth in the recruitment
+   ### plot (regardless of peak count).
+   err.res='numeric',
+   ### Error left after adding the peak.
+   merge.logdist='numeric'
+   ### Attempted `merge.logdist` parameter.
+   ));
+# `$` accessors: `obj$name` reads the attribute called `name` from the object,
+# which is how the rest of this file reads the slots of both classes.
+setMethod("$", "enve.RecPlot2",
+   function(x, name){
+      attr(x, name)
+   })
+setMethod("$", "enve.RecPlot2.Peak",
+   function(x, name){
+      attr(x, name)
+   })
+#==============> Define S4 methods
+plot.enve.RecPlot2 <- function
+   ### Plots an `enve.RecPlot2` object as a multi-panel figure (counts matrix,
+   ### position histogram, identity histogram, populations histogram and color
+   ### scales). The 'mar' graphical parameter found on entry is restored when
+   ### the function exits, including when plotting fails midway.
+      (x,
+      ### `enve.RecPlot2` object to plot.
+      layout=matrix(c(5,5,2,1,4,3), nrow=2),
+      ### Matrix indicating the position of the different panels in the layout,
+      ### where:
+      ###   0: Empty space,
+      ###   1: Counts matrix,
+      ###   2: position histogram (sequencing depth),
+      ###   3: identity histogram,
+      ###   4: Populations histogram (histogram of sequencing depths),
+      ###   5: Color scale for the counts matrix (vertical),
+      ###   6: Color scale of the counts
+      ### matrix (horizontal). Only panels indicated here will be plotted. To
+      ### plot only one panel simply set this to the number of the panel you
+      ### want to plot.
+      widths=c(1,7,2),
+      ### Relative widths of the columns of `layout`.
+      heights=c(1,2),
+      ### Relative heights of the rows of `layout`.
+      palette=grey((100:0)/100),
+      ### Colors to be used to represent the counts matrix, sorted from no hits
+      ### to the maximum sequencing depth.
+      underlay.group=TRUE,
+      ### If TRUE, it indicates the in-group and out-group areas coloured based
+      ### on `in.col` and `out.col`. Requires support for semi-transparency.
+      peaks.col='darkred',
+      ### If not NA, it attempts to represent peaks in the population histogram
+      ### in the specified color. Set to NA to avoid peak-finding.
+      id.lim=range(x$id.breaks),
+      ### Limits of identities to represent.
+      pos.lim=range(x$pos.breaks),
+      ### Limits of positions to represent (in bp, regardless of `pos.units`).
+      pos.units=c('Mbp','Kbp','bp'),
+      ### Units in which the positions should be represented (powers of 1,000
+      ### base pairs).
+      mar=list('1'=c(5,4,1,1)+.1, '2'=c(ifelse(any(layout==1),1,5),4,4,1)+.1,
+         '3'=c(5,ifelse(any(layout==1),1,4),1,2)+0.1,
+         '4'=c(ifelse(any(layout==1),1,5),ifelse(any(layout==2),1,4),4,2)+0.1,
+         '5'=c(5,3,4,1)+0.1, '6'=c(5,4,4,2)+0.1),
+      ### Margins of the panels as a list, with the character representation of
+      ### the number of the panel as index (see `layout`).
+      pos.splines=0,
+      ### Smoothing parameter for the splines in the position histogram. Zero
+      ### (0) for no splines. If non-zero, requires the stats package.
+      id.splines=1/2,
+      ### Smoothing parameter for the splines in the identity histogram. Zero
+      ### (0) for no splines. If non-zero, requires the stats package.
+      in.lwd=ifelse(pos.splines>0, 1/2, 2),
+      ### Line width for the sequencing depth of in-group matches.
+      out.lwd=ifelse(pos.splines>0, 1/2, 2),
+      ### Line width for the sequencing depth of out-group matches.
+      id.lwd=ifelse(id.splines>0, 1/2, 2),
+      ### Line width for the identity histogram.
+      in.col='darkblue',
+      ### Color associated to in-group matches.
+      out.col='lightblue',
+      ### Color associated to out-group matches.
+      id.col='black',
+      ### Color for the identity histogram.
+      breaks.col='#AAAAAA40',
+      ### Color of the vertical lines indicating sequence breaks.
+      peaks.opts=list(),
+      ### Options passed to `enve.recplot2.findPeaks`, if `peaks.col` is not NA.
+      ...
+      ### Any other graphic parameters (currently ignored).
+   ){
+   pos.units  <- match.arg(pos.units);
+   pos.factor <- switch(pos.units, bp=1, Kbp=1e3, Mbp=1e6);
+   pos.lim    <- pos.lim/pos.factor;
+   # Renumber the panels so that the layout only uses consecutive integers
+   # (panels that are not requested leave no gap in the numbering).
+   lmat <- layout;
+   for(i in 1:6) if(!any(layout==i)) lmat[layout>i] <- lmat[layout>i]-1;
+   layout(lmat, widths=widths, heights=heights);
+   # Restore the margins on exit, even if one of the panels fails to plot.
+   ori.mar <- par('mar');
+   on.exit(par(mar=ori.mar), add=TRUE);
+   # Essential vars
+   counts         <- x$counts
+   id.ingroup     <- x$id.ingroup
+   id.counts      <- x$id.counts
+   id.breaks      <- x$id.breaks
+   id.mids        <- (id.breaks[-length(id.breaks)]+id.breaks[-1])/2
+   id.binsize     <- id.breaks[-1] - id.breaks[-length(id.breaks)]
+   pos.counts.in  <- x$pos.counts.in
+   pos.counts.out <- x$pos.counts.out
+   pos.breaks     <- x$pos.breaks/pos.factor
+   pos.mids       <- (pos.breaks[-length(pos.breaks)]+pos.breaks[-1])/2
+   # Bin sizes are kept in bp (not in `pos.units`) so depth is hits per bp.
+   pos.binsize    <- (pos.breaks[-1] - pos.breaks[-length(pos.breaks)])*pos.factor
+   seqdepth.in    <- pos.counts.in/pos.binsize
+   seqdepth.out   <- pos.counts.out/pos.binsize
+   # Depth axis: range of non-zero depths, padded by a factor of two on each
+   # side. The lower padding is used below to flag zero-depth windows.
+   seqdepth.lim   <- range(c(seqdepth.in[seqdepth.in>0],
+                     seqdepth.out[seqdepth.out>0]))*c(1/2,2)
+   # Lowest identity break that belongs to the in-group.
+   ingroup.floor  <- min(id.breaks[c(id.ingroup,TRUE)])
+   if(underlay.group){
+      in.bg  <- do.call(rgb, c(as.list(col2rgb(in.col)[,1]),
+                  list(maxColorValue=256, alpha=62)));
+      out.bg <- do.call(rgb, c(as.list(col2rgb(out.col)[,1]),
+                  list(maxColorValue=256, alpha=52)));
+   }
+   # Counts matrix
+   if(any(layout==1)){
+      par(mar=mar[['1']]);
+      plot(1, t='n', bty='l',
+         xlim=pos.lim, xlab=paste('Position in genome (',pos.units,')',sep=''),
+         xaxs='i', ylim=id.lim,  ylab=x$id.metric, yaxs='i');
+      if(underlay.group){
+         rect(pos.lim[1], id.lim[1], pos.lim[2], ingroup.floor,
+            col=out.bg, border=NA);
+         rect(pos.lim[1], ingroup.floor, pos.lim[2], id.lim[2],
+            col=in.bg,  border=NA);
+      }
+      abline(v=x$seq.breaks/pos.factor, col=breaks.col);
+      image(x=pos.breaks, y=id.breaks, z=log10(counts),col=palette,
+         bg=grey(1,0), breaks=seq(-.1,log10(max(counts)),
+         length.out=1+length(palette)), add=TRUE);
+   }
+   # Position histogram
+   if(any(layout==2)){
+      par(mar=mar[['2']]);
+      # The X axis is shared with the counts matrix when that panel is present.
+      if(any(layout==1)){
+         xlab <- ''
+         xaxt <- 'n'
+      }else{
+         xlab <- paste('Position in genome (',pos.units,')',sep='')
+         xaxt <- 's'
+      }
+      plot(1,t='n', bty='l', log='y',
+         xlim=pos.lim, xlab=xlab, xaxt=xaxt, xaxs='i',
+         ylim=seqdepth.lim, yaxs='i', ylab='Sequencing depth (X)');
+      abline(v=x$seq.breaks/pos.factor, col=breaks.col)
+      # Step function: every bin contributes its two edges.
+      pos.x <- rep(pos.breaks,each=2)[-c(1,2*length(pos.breaks))]
+      pos.f <- rep(seqdepth.in,each=2)
+      lines(pos.x, rep(seqdepth.out,each=2), lwd=out.lwd, col=out.col);
+      lines(pos.x, pos.f, lwd=in.lwd, col=in.col);
+      if(pos.splines > 0){
+         pos.spline <- smooth.spline(pos.x[pos.f>0], log(pos.f[pos.f>0]),
+            spar=pos.splines)
+         lines(pos.spline$x, exp(pos.spline$y), lwd=2, col=in.col)
+      }
+      # Zero-depth windows cannot be drawn in log scale: mark them as boxes at
+      # the bottom of the panel.
+      if(any(pos.counts.out==0)) rect(pos.breaks[c(pos.counts.out==0,FALSE)],
+               seqdepth.lim[1], pos.breaks[c(FALSE,pos.counts.out==0)],
+               seqdepth.lim[1]*3/2, col=out.col, border=NA);
+      if(any(pos.counts.in==0))  rect(pos.breaks[c(pos.counts.in==0,FALSE)],
+               seqdepth.lim[1], pos.breaks[c(FALSE,pos.counts.in==0)],
+               seqdepth.lim[1]*3/2, col=in.col,  border=NA);
+   }
+   # Identity histogram
+   if(any(layout==3)){
+      par(mar=mar[['3']]);
+      # The Y axis is shared with the counts matrix when that panel is present.
+      if(any(layout==1)){
+         ylab <- ''
+         yaxt <- 'n'
+      }else{
+         ylab <- x$id.metric
+         yaxt <- 's'
+      }
+      if(sum(id.counts>0) >= 4){
+         id.counts.range <- range(id.counts[id.counts>0])*c(1/2,2);
+         plot(1,t='n', bty='l', log='x',
+               xlim=id.counts.range, xlab='bps per bin', xaxs='i',
+               ylim=id.lim, yaxs='i', ylab=ylab, yaxt=yaxt);
+         if(underlay.group){
+            rect(id.counts.range[1], id.lim[1], id.counts.range[2],
+               ingroup.floor, col=out.bg, border=NA);
+            rect(id.counts.range[1], ingroup.floor,
+               id.counts.range[2], id.lim[2], col=in.bg,  border=NA);
+         }
+         id.f <- rep(id.counts,each=2)
+         id.x <- rep(id.breaks,each=2)[-c(1,2*length(id.breaks))]
+         lines(id.f, id.x, lwd=id.lwd, col=id.col);
+         if(id.splines > 0){
+            id.spline <- smooth.spline(id.x[id.f>0], log(id.f[id.f>0]),
+               spar=id.splines)
+            lines(exp(id.spline$y), id.spline$x, lwd=2, col=id.col)
+         }
+      }else{
+         plot(1,t='n',bty='l',xlab='', xaxt='n', ylab='', yaxt='n')
+         text(1,1,labels='Insufficient data', srt=90)
+      }
+   }
+   # Populations histogram
+   peaks <- NA;
+   if(any(layout==4)){
+      par(mar=mar[['4']]);
+      # The Y axis is shared with the position histogram when it is present.
+      if(any(layout==2)){
+         ylab <- ''
+         yaxt <- 'n'
+      }else{
+         ylab <- 'Sequencing depth (X)'
+         yaxt <- 's'
+      }
+      # 200 break points spanning the observed (unpadded) non-zero depths.
+      h.breaks <- seq(log10(seqdepth.lim[1]*2), log10(seqdepth.lim[2]/2),
+         length.out=200);
+      h.in  <- hist(log10(seqdepth.in), breaks=h.breaks, plot=FALSE);
+      h.out <- hist(log10(seqdepth.out), breaks=h.breaks, plot=FALSE);
+      plot(1, t='n', log='y',
+         xlim=range(c(h.in$counts,h.out$counts,sum(pos.counts.in==0))),
+         xaxs='r', xlab='', xaxt='n', ylim=seqdepth.lim, yaxs='i', ylab=ylab,
+         yaxt=yaxt)
+      # The last four coordinates draw the box counting zero-depth windows.
+      y.tmp.in  <- c(rep(10^h.in$breaks,each=2),seqdepth.lim[1]*c(1,1,3/2,3/2))
+      y.tmp.out <- c(rep(10^h.out$breaks,each=2),seqdepth.lim[1]*c(1,1,3/2,3/2))
+      lines(c(0,rep(h.out$counts,each=2),0,0,rep(sum(pos.counts.out==0),2),0),
+         y.tmp.out, col=out.col)
+      polygon(c(0,rep(h.in$counts,each=2),0,0,rep(sum(pos.counts.in==0),2),0),
+         y.tmp.in, border=NA, col=in.col)
+      if(!is.na(peaks.col)){
+         o      <- peaks.opts; o$x <- x;
+         peaks  <- do.call(enve.recplot2.findPeaks, o);
+         h.mids <- (10^h.breaks[-1] + 10^h.breaks[-length(h.breaks)])/2
+         if(!is.null(peaks) && length(peaks)>0){
+            # Individual peaks, plus their sum (`pf`) as a thicker line.
+            pf <- h.mids*0;
+            for(i in seq_along(peaks)){
+               cnt <- enve.recplot2.__peakHist(peaks[[i]], h.mids)
+               lines(cnt, h.mids, col=peaks.col);
+               pf <- pf+cnt;
+               # Label each peak at its location parameter (last in param.hat).
+               axis(4, at=peaks[[i]]$param.hat[[length(peaks[[i]]$param.hat)]],
+                  labels=letters[i], las=1, hadj=1/2)
+            }
+            lines(pf, h.mids, col=peaks.col, lwd=1.5);
+            legend('bottomright', legend=paste(
+               letters[seq_along(peaks)],'. ',
+               signif(as.numeric(lapply(peaks,
+                  function(pk) tail(as.numeric(pk$param.hat),n=1))),3),'X (',
+               signif(100*as.numeric(lapply(peaks,
+                  function(pk) (length(pk$values)/pk$n.total))), 3), '%, err: ',
+               signif(as.numeric(lapply(peaks, function(pk) pk$err.res)), 3), ')',
+               sep=''), bty='n');
+         }
+      }
+   }
+   # Color scale
+   count.bins <- 10^seq(log10(min(counts[counts>0])), log10(max(counts)),
+      length.out=1+length(palette))
+   if(any(layout==5)){
+      par(mar=mar[['5']]);
+      plot(1,t='n',log='y',xlim=0:1,xaxt='n',xlab='',xaxs='i',
+         ylim=range(count.bins), yaxs='i', ylab='')
+      rect(0,count.bins[-length(count.bins)],1,count.bins[-1],col=palette,
+         border=NA)
+   }
+   if(any(layout==6)){
+      par(mar=mar[['6']]);
+      plot(1,t='n',log='x',ylim=0:1,yaxt='n',ylab='',yaxs='i',
+         xlim=range(count.bins), xaxs='i',xlab='');
+      rect(count.bins[-length(count.bins)],0,count.bins[-1],1,col=palette,
+         border=NA);
+   }
+   return(peaks);
+   ### Returns a list of `enve.RecPlot2.Peak` objects (see
+   ### `enve.recplot2.findPeaks`). If `peaks.col`=NA or `layout` doesn't include
+   ### 4, returns NA.
+}
+#==============> Define core functions
+enve.recplot2 <- function(
+   ### Produces recruitment plots provided that BlastTab.catsbj.pl has
+   ### been previously executed.
+      prefix,
+      ### Path to the prefix of the BlastTab.catsbj.pl output files. At
+      ### least the files .rec and .lim must exist with this prefix.
+      plot=TRUE,
+      ### Should the object be plotted?
+      pos.breaks=1e3,
+      ### Breaks in the positions histogram. It can also be a vector of break
+      ### points, and values outside the range are ignored. If zero (0), it
+      ### uses the sequence breaks as defined in the .lim file, which means
+      ### one bin per contig (or gene, if the mapping is against genes).
+      id.breaks=300,
+      ### Breaks in the identity histogram. It can also be a vector of break
+      ### points, and values outside the range are ignored.
+      id.metric=c('identity', 'corrected identity', 'bit score'),
+      ### Metric of identity to be used (Y-axis). Corrected identity is only
+      ### supported if the original BLAST file included sequence lengths.
+      id.summary=sum,
+      ### Function summarizing the identity bins. Other recommended options
+      ### include: `median` to estimate the median instead of total bins, and
+      ### `function(x) mlv(x,method='parzen')$M` to estimate the mode.
+      id.cutoff=95,
+      ### Cutoff of identity metric above which the hits are considered
+      ### 'in-group'. The 95% identity corresponds to the expectation of
+      ### ANI<95% within species.
+      threads=2,
+      ### Number of threads to use. Fewer workers are started when there are
+      ### not enough hits to give each of them a non-empty chunk.
+      verbose=TRUE,
+      ### Indicates if the function should report the advance.
+      ...
+      ### Any additional parameters supported by `plot.enve.RecPlot2`.
+   ){
+   # Settings
+   id.metric <- match.arg(id.metric);
+   # Read files
+   if(verbose) cat("Reading files.\n")
+   rec <- read.table(paste(prefix, ".rec", sep=""), sep="\t", comment.char="",
+      quote="");
+   lim <- read.table(paste(prefix, ".lim", sep=""), sep="\t", comment.char="",
+      quote="", as.is=TRUE);
+   # Build matrix
+   if(verbose) cat("Building counts matrix.\n")
+   if(id.metric=="corrected identity" && ncol(rec)<6){
+      stop("Requesting corr. identity, but .rec file doesn't have 6th column")
+   }
+   # Column of the .rec file holding the selected metric.
+   rec.idcol <- switch(id.metric, 'identity'=3, 'corrected identity'=6, 4);
+   if(length(pos.breaks)==1){
+      if(pos.breaks>0){
+         pos.breaks <- seq(min(lim[,2]), max(lim[,3]), length.out=pos.breaks+1);
+      }else{
+         pos.breaks <- c(lim[,2], tail(lim[,3], n=1))
+      }
+   }
+   if(length(id.breaks)==1){
+      id.breaks <- seq(min(rec[,rec.idcol]), max(rec[,rec.idcol]),
+         length.out=id.breaks+1);
+   }
+   # Run in parallel
+   n.rec <- nrow(rec)
+   if(n.rec < 200) threads <- 1 # Not worth the overhead
+   thl     <- ceiling(n.rec/threads)
+   # First row of each chunk. Only non-empty chunks are created, so the number
+   # of workers can be smaller than requested (a chunk starting past the last
+   # row would otherwise select NA rows and duplicate hits).
+   starts  <- seq(1, n.rec, by=thl)
+   threads <- length(starts)
+   rec.l   <- lapply(seq_along(starts), function(k)
+      list(rec=rec[ starts[k]:min(starts[k]+thl-1, n.rec), ],
+         verbose=if(k==1) verbose else FALSE)) # only one worker reports
+   cl       <- makeCluster(threads)
+   # Always release the workers, also if one of them fails.
+   counts.l <- tryCatch(
+      clusterApply(cl, rec.l, enve.recplot2.__counts,
+         pos.breaks=pos.breaks, id.breaks=id.breaks, rec.idcol=rec.idcol),
+      finally=stopCluster(cl))
+   counts   <- Reduce(`+`, counts.l)
+   # Estimate 1D histograms
+   if(verbose) cat("Building histograms.\n")
+   id.mids    <- (id.breaks[-length(id.breaks)]+id.breaks[-1])/2;
+   id.ingroup <- (id.mids > id.cutoff);
+   id.counts  <- apply(counts, 2, id.summary);
+   # drop=FALSE keeps the matrix shape when zero or one identity bins fall in
+   # a group, so the result always has one value per position bin.
+   pos.counts.in  <- rowSums(counts[, id.ingroup, drop=FALSE]);
+   pos.counts.out <- rowSums(counts[, !id.ingroup, drop=FALSE]);
+   # Plot and return
+   recplot <- new('enve.RecPlot2',
+      counts=counts, id.counts=id.counts, pos.counts.in=pos.counts.in,
+      pos.counts.out=pos.counts.out,
+      id.breaks=id.breaks, pos.breaks=pos.breaks,
+      seq.breaks=c(lim[1,2], lim[,3]), seq.names=lim[,1],
+      id.ingroup=id.ingroup,id.metric=id.metric,
+      call=match.call());
+   if(plot){
+      if(verbose) cat("Plotting.\n")
+      peaks <- plot(recplot, ...);
+      attr(recplot, "peaks") <- peaks
+   }
+   return(recplot);
+   ### Returns an object of class `enve.RecPlot2`.
+}
+enve.recplot2.findPeaks <- function(
+   ### Identifies peaks in the population histogram potentially indicating
+   ### sub-population mixtures.
+      x,
+      ### An `enve.RecPlot2` object.
+      min.points=10,
+      ### Minimum number of points in the quantile-estimation-range
+      ### (`quant.est`) to estimate a peak.
+      quant.est=c(0.002, 0.998),
+      ### Range of quantiles to be used in the estimation of a peak's
+      ### parameters.
+      mlv.opts=list(method='parzen'),
+      ### Options passed to `mlv` to estimate the mode.
+      fitdist.opts.sn=list(distr='sn', method='qme', probs=c(0.1,0.5,0.8),
+         start=list(omega=1, alpha=-1), lower=c(1e-6, -Inf, 0),
+         upper=c(Inf, 0, Inf)),
+      ### Options passed to `fitdist` to estimate the standard deviation if
+      ### with.skewness=TRUE. Note that the `start` parameter will be amended
+      ### with xi=estimated mode for each peak.
+      fitdist.opts.norm=list(distr='norm', method='qme', probs=c(.4,.6),
+         start=list(sd=1), lower=c(1e-8, 0)),
+      ### Options passed to `fitdist` to estimate the standard deviation if
+      ### with.skewness=FALSE. Note that the `start` parameter will be amended
+      ### with mean=estimated mode for each peak.
+      rm.top=0.05,
+      ### Top-values to remove before finding peaks, as a quantile probability.
+      ### This step is useful to remove highly conserved regions, but can be
+      ### turned off by setting rm.top=0. The quantile is determined *after*
+      ### removing zero-coverage windows.
+      with.skewness=TRUE,
+      ### Allow skewness correction of the peaks. Typically, the
+      ### sequencing-depth distribution for a single peak is left-skewed, due
+      ### partly (but not exclusively) to fragmentation and mapping sensitivity.
+      ### See Lindner et al 2013, Bioinformatics 29(10):1260-7 for an
+      ### alternative solution for the first problem (fragmentation) called
+      ### "tail distribution".
+      optim.rounds=200,
+      ### Maximum rounds of peak optimization.
+      optim.epsilon=1e-8,
+      ### Trace change at which optimization stops (unless `optim.rounds` is
+      ### reached first). The trace change is estimated as the sum of square
+      ### differences between parameters in one round and those from two rounds
+      ### earlier (to avoid infinite loops from approximation).
+      merge.logdist=log(1.75),
+      ### Maximum value of |log-ratio| between centrality parameters in peaks to
+      ### attempt merging. The default of ~0.56 corresponds to a maximum
+      ### difference of 75%.
+      verbose=FALSE
+      ### Display (mostly debugging) information.
+   ){
+   # Essential vars
+   pos.binsize <- x$pos.breaks[-1] - x$pos.breaks[-length(x$pos.breaks)];
+   seqdepth.in <- x$pos.counts.in/pos.binsize;
+   lsd1 <- seqdepth.in[seqdepth.in>0];
+   # rm.top=0 turns the trimming off (the strict comparison below would
+   # otherwise still discard the maximum value).
+   if(rm.top > 0) lsd1 <- lsd1[ lsd1 < quantile(lsd1, 1-rm.top, names=FALSE) ]
+   if(with.skewness){
+      fitdist.opts <- fitdist.opts.sn
+   }else{
+      fitdist.opts <- fitdist.opts.norm
+   }
+   peaks.opts <- list(lsd1=lsd1, min.points=min.points, quant.est=quant.est,
+      mlv.opts=mlv.opts, fitdist.opts=fitdist.opts, with.skewness=with.skewness,
+      optim.rounds=optim.rounds, optim.epsilon=optim.epsilon, verbose=verbose,
+      n.total=length(lsd1), merge.logdist=merge.logdist)
+   # Find seed peaks
+   if(verbose) cat('Mowing peaks for n =',length(lsd1),'\n')
+   peaks <- enve.recplot2.__findPeaks(peaks.opts);
+   # Merge overlapping peaks
+   if(verbose) cat('Trying to merge',length(peaks),'peaks\n')
+   # Rounds are repeated for as long as the previous one merged something.
+   again <- (length(peaks)>1)
+   while(again){
+      again  <- FALSE
+      peaks2 <- list()
+      # done[k]: the values of peak k are already represented in `peaks2`.
+      # slot[k]: index in `peaks2` where peak k sits unmerged (0 otherwise).
+      done   <- rep(FALSE, length(peaks))
+      slot   <- integer(length(peaks))
+      for(i in seq_along(peaks)){
+         if(done[i]) next
+         p <- peaks[[ i ]]
+         done[i] <- TRUE
+         j <- enve.recplot2.__whichClosestPeak(p, peaks)
+         merged.now <- FALSE
+         # Never merge a peak with itself, nor with a neighbour that was
+         # already absorbed by another merge in this round: its values would
+         # be counted twice.
+         if(j != i && (!done[j] || slot[j] > 0)){
+            p2 <- peaks[[ j ]]
+            dst.a <- p$param.hat[[ length(p$param.hat) ]]
+            dst.b <- p2$param.hat[[ length(p2$param.hat) ]]
+            if( abs(log(dst.a/dst.b)) < merge.logdist ){
+               if(verbose) cat('==> Attempting a merge at', dst.a, '&', dst.b,
+                     'X\n');
+               # The merge succeeds if the pooled values yield a single peak.
+               peaks.opts$lsd1 <- c(p$values, p2$values)
+               p.new <- enve.recplot2.__findPeaks(peaks.opts)
+               if(length(p.new)==1){
+                  if(done[j]){
+                     # The neighbour was already emitted on its own: replace it.
+                     peaks2[[ slot[j] ]] <- p.new[[ 1 ]]
+                     slot[j] <- 0L
+                  }else{
+                     peaks2[[ length(peaks2)+1 ]] <- p.new[[ 1 ]]
+                     done[j] <- TRUE
+                  }
+                  merged.now <- TRUE
+                  again <- TRUE
+               }
+            }
+         }
+         # Peaks that were not merged are carried over unchanged, regardless
+         # of whether other peaks were merged earlier in this round.
+         if(!merged.now){
+            peaks2[[ length(peaks2)+1 ]] <- p
+            slot[i] <- length(peaks2)
+         }
+      }
+      peaks <- peaks2
+      if(length(peaks)==1) break
+   }
+   if(verbose) cat('Found',length(peaks),'peak(s)\n')
+   return(peaks);
+   ### Returns a list of `enve.RecPlot2.Peak` objects.
+}
+#==============> Define utils
+enve.recplot2.corePeak <- function
+   ### Selects, from a list of peaks, the one most likely to represent the
+   ### "core genome" of a population.
+      (x
+      ### `list` of `enve.RecPlot2.Peak` objects.
+   ){
+   # The location ("centrality") parameter is always last in `param.hat`.
+   centre <- function(pk) pk$param.hat[[ length(pk$param.hat) ]]
+   # Start from the peak with the highest sequencing depth
+   depths     <- as.numeric(lapply(x, centre))
+   deepest    <- x[[ which.max(depths) ]]
+   deepest.at <- centre(deepest)
+   # Prefer a peak explaining at least as many bins as the current choice if
+   # it lies close enough to the deepest peak. The tolerance grows with the
+   # log-ratio of sizes (a fifth of it is added to `merge.logdist`).
+   chosen <- deepest
+   for(cand in x){
+      gain <- log(length(cand$values)/length(chosen$values))
+      if(gain >= 0){
+         gap <- abs(log(centre(cand)/deepest.at))
+         if(gap < deepest$merge.logdist+gain/5){
+            chosen <- cand
+         }
+      }
+   }
+   return(chosen)
+   ### Returns the selected element of `x`.
+}
+enve.recplot2.changeCutoff <- function
+   ### Change the intra-species cutoff of an existing recruitment plot.
+      (rp,
+      ### enve.RecPlot2 object.
+      new.cutoff=98
+      ### New cutoff to use.
+      ){
+   # Re-calculate vectors
+   id.mids    <- (rp$id.breaks[-length(rp$id.breaks)]+rp$id.breaks[-1])/2
+   id.ingroup <- (id.mids > new.cutoff)
+   # drop=FALSE keeps the matrix shape when the new cutoff leaves zero or one
+   # identity bins in a group, so there is always one value per position bin.
+   pos.counts.in  <- rowSums(rp$counts[, id.ingroup, drop=FALSE])
+   pos.counts.out <- rowSums(rp$counts[, !id.ingroup, drop=FALSE])
+   # Update object
+   attr(rp, "id.ingroup")     <- id.ingroup
+   attr(rp, "pos.counts.in")  <- pos.counts.in
+   attr(rp, "pos.counts.out") <- pos.counts.out
+   attr(rp, "call")           <- match.call()
+   return(rp)
+   ### Returns `rp` with `id.ingroup`, `pos.counts.in`, `pos.counts.out` and
+   ### `call` updated.
+}
+enve.recplot2.extractWindows <- function
+   ### Extract windows significantly below (or above) the peak in sequencing
+   ### depth.
+      (rp,
+      ### Recruitment plot, a enve.RecPlot2 object.
+      peak,
+      ### Peak, a enve.RecPlot2.Peak object. If list, it is assumed to be a list
+      ### of enve.RecPlot2.Peak objects, in which case the core peak is used
+      ### (see enve.recplot2.corePeak).
+      lower.tail=TRUE,
+      ### If FALSE, it returns windows significantly above the peak in
+      ### sequencing depth.
+      significance=0.05,
+      ### Significance threshold (alpha) to select windows.
+      seq.names=FALSE
+      ### Returns subject sequence names instead of a vector of Booleans. It
+      ### assumes that the recruitment plot was generated with pos.breaks=0.
+      ){
+   # Determine the threshold
+   if(is.list(peak)) peak <- enve.recplot2.corePeak(peak)
+   q.args <- peak$param.hat
+   q.args[["p"]] <- if(lower.tail) significance else 1-significance
+   # Three fitted parameters plus `p` means skew-normal; otherwise normal.
+   # A plain if/else is required here: `ifelse` cannot return a function.
+   q.fun <- if(length(q.args)==4) qsn else qnorm
+   thr <- do.call(q.fun, q.args)
+   # Estimate sequencing depths per window
+   pos.cnts.in <- rp$pos.counts.in
+   pos.breaks  <- rp$pos.breaks
+   pos.binsize <- (pos.breaks[-1] - pos.breaks[-length(pos.breaks)])
+   seqdepth.in <- pos.cnts.in/pos.binsize
+   # Select windows past the threshold
+   if(lower.tail){
+      sel <- seqdepth.in < thr
+   }else{
+      sel <- seqdepth.in > thr
+   }
+   if(!seq.names) return(sel)
+   # Names can only be mapped when there is exactly one window per sequence.
+   if(length(seqdepth.in) != length(rp$seq.names))
+      stop(paste("Requesting subject sequence names, but the recruitment plot",
+         "was not generated with pos.breaks=0."))
+   return(rp$seq.names[sel])
+   ### Returns a vector of Booleans (one per window), or the names of the
+   ### selected subject sequences if `seq.names=TRUE`.
+}
+#==============> Define internal functions
+enve.recplot2.__counts <- function
+   ### Internal ancillary function (see `enve.recplot2`). Builds the
+   ### two-dimensional histogram (position bins in rows, identity bins in
+   ### columns) for one chunk of hits: `x$rec` holds the hits (columns 1 and 2
+   ### are the first and last positions, column `rec.idcol` is the identity
+   ### metric) and `x$verbose` indicates if the advance should be reported.
+   ### Hits and positions outside the breaks are ignored, and an empty chunk
+   ### yields an all-zero matrix.
+      (x, pos.breaks, id.breaks, rec.idcol){
+   rec <- x$rec
+   verbose <- x$verbose
+   counts <- matrix(0, nrow=length(pos.breaks)-1, ncol=length(id.breaks)-1);
+   # Lower and upper edge of every bin (both edges are inclusive; a value
+   # sitting on a shared edge goes to the first matching bin).
+   pos.lo <- pos.breaks[-length(pos.breaks)]
+   pos.hi <- pos.breaks[-1]
+   id.lo  <- id.breaks[-length(id.breaks)]
+   id.hi  <- id.breaks[-1]
+   n.rec  <- nrow(rec)
+   for(i in seq_len(n.rec)){
+      if(verbose && i%%100==0) cat("   [",signif(i*100/n.rec,3),"% ]   \r");
+      id.val <- rec[i,rec.idcol]
+      y.bin <- which(id.val>=id.lo & id.val<=id.hi)[1] ;
+      if(is.na(y.bin)) next # identity outside the breaks
+      # Every position covered by the hit adds one to its position bin.
+      for(pos in rec[i,1]:rec[i,2]){
+         x.bin <- which(pos>=pos.lo & pos<=pos.hi)[1] ;
+         if(is.na(x.bin)) next # position outside the breaks
+         counts[x.bin, y.bin] <- counts[x.bin, y.bin]+1 ;
+      }
+   }
+   return(counts);
+}
+enve.recplot2.__peakHist <- function
+   ### Internal ancillary function (see `enve.RecPlot2.Peak`). Evaluates the
+   ### density of the peak's distribution at `mids`. With `counts=TRUE`, the
+   ### densities are rescaled to add up to the number of values in the peak
+   ### (or to `n.hat` if the peak holds no values).
+      (x, mids, counts=TRUE){
+   # Density function of the peak's distribution, e.g. 'dnorm' or 'dsn'
+   dens.fun  <- paste('d', x$dist, sep='')
+   dens.args <- c(x$param.hat, list(x=mids))
+   dens      <- do.call(dens.fun, dens.args)
+   if(counts){
+      n.obs <- length(x$values)
+      total <- if(n.obs>0) n.obs else x$n.hat
+      return(dens*total/sum(dens))
+   }
+   return(dens)
+}
+enve.recplot2.__findPeak <- function
+   ### Internal ancillary function (see `enve.recplot2.findPeaks`). Extracts
+   ### one peak from the sequencing depths in `lsd1`: it anchors a distribution
+   ### at the mode, iteratively re-fits its parameters, and then randomly
+   ### splits `lsd1` between the peak and the residual. Returns an
+   ### `enve.RecPlot2.Peak` object, or NULL if no peak could be estimated or
+   ### the peak holds fewer than `min.points` values.
+      (lsd1, min.points, quant.est, mlv.opts, fitdist.opts, with.skewness,
+      optim.rounds, optim.epsilon, n.total, merge.logdist, verbose
+   ){
+   dist	<- ifelse(with.skewness, 'sn', 'norm');
+   # Find peak
+   o <- mlv.opts; o$x = lsd1;
+   mode1 <- do.call(mlv, o)$M;
+   if(verbose) cat('Anchoring at mode =',mode1,'\n')
+   # Initial parameters: the `start` values of the fit, plus the location
+   # parameter (xi or mean) set to the mode.
+   param.hat <- fitdist.opts$start; last.hat <- param.hat;
+   lim <- NA;
+   if(with.skewness){ param.hat$xi <- mode1 }else{ param.hat$mean <- mode1 }
+   # Refine peak parameters
+   for(round in 1:optim.rounds){
+      param.hat[[ 1 ]] <- param.hat[[ 1 ]]/diff(quant.est)# <- expand dispersion
+      # Quantiles of the current distribution at `quant.est`: only the values
+      # strictly between them are used to re-fit the parameters.
+      lim.o <- param.hat
+      lim.o$p <- quant.est; lim <- do.call(paste('q',dist,sep=''), lim.o)
+      lsd1.pop <- lsd1[(lsd1>lim[1]) & (lsd1<lim[2])];
+      if(verbose) cat(' Round', round, 'with n =',length(lsd1.pop),
+	    'and params =',as.numeric(param.hat),' \r')
+      if(length(lsd1.pop) < min.points) break;
+      o <- fitdist.opts; o$data = lsd1.pop; o$start = param.hat;
+      # Keep the parameters from the last two rounds: the previous ones are the
+      # fallback for a failed fit, the ones before are used to test convergence.
+      last.last.hat <- last.hat
+      last.hat <- param.hat
+      param.hat <- as.list(do.call(fitdist, o)$estimate);
+      if(any(is.na(param.hat))){
+	 if(round>1) param.hat <- last.hat;
+	 break;
+      }
+      # Convergence is tested against the parameters from two rounds earlier,
+      # and only from the third round on.
+      epsilon <- sum((as.numeric(last.last.hat)-as.numeric(param.hat))^2)
+      if(round>2) if(epsilon < optim.epsilon) break;
+   }
+   if(verbose) cat('\n')
+   if(is.na(param.hat[1]) | is.na(lim[1])) return(NULL);
+   # Mow distribution
+   lsd2 <- c();    # values left out of the peak (residual)
+   lsd.pop <- c(); # values assigned to the peak
+   # Expected size of the peak, extrapolated from the values observed within
+   # the `quant.est` range.
+   n.hat <- length(lsd1.pop)/diff(quant.est)
+   peak <- new('enve.RecPlot2.Peak', dist=dist, values=as.numeric(), mode=mode1,
+      param.hat=param.hat, n.hat=n.hat, n.total=n.total,
+      merge.logdist=merge.logdist)
+   # 20 break points (19 bins) spanning all the values, and the number of
+   # values per bin expected from the peak (scaled to `n.hat`, since the peak
+   # has no values yet).
+   peak.breaks <- seq(min(lsd1), max(lsd1), length=20)
+   peak.cnt <- enve.recplot2.__peakHist(peak,
+      (peak.breaks[-length(peak.breaks)]+peak.breaks[-1])/2)
+   for(i in 2:length(peak.breaks)){
+      # NOTE(review): bins are open on the right, also the last one, so values
+      # equal to max(lsd1) end up neither in the peak nor in the residual.
+      # Confirm this is intended.
+      values <- lsd1[ (lsd1 >= peak.breaks[i-1]) & (lsd1 < peak.breaks[i]) ]
+      n.exp <- peak.cnt[i-1]
+      if(n.exp==0) n.exp=0.1
+      if(length(values)==0) next
+      # Each value is independently assigned to the peak with probability
+      # (expected count)/(observed count) in its bin.
+      in.peak <- runif(length(values)) <= n.exp/length(values)
+      lsd2 <- c(lsd2, values[!in.peak])
+      lsd.pop <- c(lsd.pop, values[in.peak])
+   }
+   if(length(lsd.pop) < min.points) return(NULL)
+   # Return peak
+   attr(peak, 'values') <- lsd.pop
+   attr(peak, 'values.res') <- lsd2
+   # Residual error: the correlation between the binned counts of the peak
+   # and those of all the input values, mapped from [-1,1] to [1,0].
+   attr(peak, 'err.res') <- 1-(cor(hist(lsd.pop, breaks=peak.breaks,
+      plot=FALSE)$counts, hist(lsd1, breaks=peak.breaks,
+      plot=FALSE)$counts)+1)/2
+   if(verbose) cat(' Extracted peak with n =',length(lsd.pop),
+	 'with expected n =',n.hat,'\n')
+   return(peak)
+}
+enve.recplot2.__findPeaks <- function
+   ### Internal ancillary function (see `enve.recplot2.findPeaks`). Extracts
+   ### peaks one at a time, feeding the values left unexplained by each peak
+   ### to the next search. Returns the (possibly empty) list of peaks.
+      (peaks.opts){
+   found <- list()
+   repeat{
+      # Stop once there are too few values left to estimate another peak...
+      if(length(peaks.opts$lsd1) <= peaks.opts$min.points) break
+      nxt <- do.call(enve.recplot2.__findPeak, peaks.opts)
+      # ...or when no further peak can be extracted.
+      if(is.null(nxt)) break
+      found <- c(found, list(nxt))
+      peaks.opts$lsd1 <- nxt$values.res
+   }
+   return(found)
+}
+enve.recplot2.__whichClosestPeak <- function
+   ### Internal ancillary function (see `enve.recplot2.findPeaks`). Returns the
+   ### index in `peaks` of the peak with the location parameter closest (in
+   ### absolute log-ratio) to that of `peak`.
+      (peak, peaks){
+   # The location parameter is always the last element of `param.hat`.
+   centre  <- function(pk) pk$param.hat[[ length(pk$param.hat) ]]
+   ref     <- centre(peak)
+   centres <- as.numeric(lapply(peaks, centre))
+   gaps    <- abs(log(centres/ref))
+   # A distance of zero is `peak` itself (or an identical location): exclude.
+   gaps[ gaps==0 ] <- Inf
+   return(which.min(gaps))
+}