RubyGems - miga-base - Versions diffs - 1.2.17.0 → 1.2.17.1 - Mend

miga-base 1.2.17.0 → 1.2.17.1

Files changed (299) hide show

checksums.yaml +4 -4
data/lib/miga/version.rb +1 -1
data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Archaea_SCG.hmm +41964 -0
data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Bacteria_SCG.hmm +32439 -0
data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Complete_SCG_DB.hmm +62056 -0
data/utils/FastAAI/FastAAI +3659 -0
data/utils/FastAAI/FastAAI-legacy/FastAAI +1336 -0
data/utils/FastAAI/FastAAI-legacy/kAAI_v1.0_virus.py +1296 -0
data/utils/FastAAI/README.md +84 -0
data/utils/enveomics/Docs/recplot2.md +244 -0
data/utils/enveomics/Examples/aai-matrix.bash +66 -0
data/utils/enveomics/Examples/ani-matrix.bash +66 -0
data/utils/enveomics/Examples/essential-phylogeny.bash +105 -0
data/utils/enveomics/Examples/unus-genome-phylogeny.bash +100 -0
data/utils/enveomics/LICENSE.txt +73 -0
data/utils/enveomics/Makefile +52 -0
data/utils/enveomics/Manifest/Tasks/aasubs.json +103 -0
data/utils/enveomics/Manifest/Tasks/blasttab.json +790 -0
data/utils/enveomics/Manifest/Tasks/distances.json +161 -0
data/utils/enveomics/Manifest/Tasks/fasta.json +802 -0
data/utils/enveomics/Manifest/Tasks/fastq.json +291 -0
data/utils/enveomics/Manifest/Tasks/graphics.json +126 -0
data/utils/enveomics/Manifest/Tasks/mapping.json +137 -0
data/utils/enveomics/Manifest/Tasks/ogs.json +382 -0
data/utils/enveomics/Manifest/Tasks/other.json +906 -0
data/utils/enveomics/Manifest/Tasks/remote.json +355 -0
data/utils/enveomics/Manifest/Tasks/sequence-identity.json +650 -0
data/utils/enveomics/Manifest/Tasks/tables.json +308 -0
data/utils/enveomics/Manifest/Tasks/trees.json +68 -0
data/utils/enveomics/Manifest/Tasks/variants.json +111 -0
data/utils/enveomics/Manifest/categories.json +165 -0
data/utils/enveomics/Manifest/examples.json +162 -0
data/utils/enveomics/Manifest/tasks.json +4 -0
data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +69 -0
data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +1 -0
data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +1 -0
data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +1 -0
data/utils/enveomics/Pipelines/assembly.pbs/README.md +189 -0
data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +112 -0
data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +23 -0
data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +44 -0
data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +50 -0
data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +37 -0
data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +68 -0
data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +49 -0
data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +80 -0
data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +57 -0
data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +63 -0
data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +38 -0
data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +73 -0
data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +21 -0
data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +72 -0
data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +98 -0
data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +1 -0
data/utils/enveomics/Pipelines/blast.pbs/README.md +127 -0
data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +109 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +128 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +16 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +22 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +26 -0
data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +89 -0
data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +29 -0
data/utils/enveomics/Pipelines/idba.pbs/README.md +49 -0
data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +95 -0
data/utils/enveomics/Pipelines/idba.pbs/run.pbs +56 -0
data/utils/enveomics/Pipelines/trim.pbs/README.md +54 -0
data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +70 -0
data/utils/enveomics/Pipelines/trim.pbs/run.pbs +130 -0
data/utils/enveomics/README.md +42 -0
data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +171 -0
data/utils/enveomics/Scripts/Aln.cat.rb +221 -0
data/utils/enveomics/Scripts/Aln.convert.pl +35 -0
data/utils/enveomics/Scripts/AlphaDiversity.pl +152 -0
data/utils/enveomics/Scripts/BedGraph.tad.rb +93 -0
data/utils/enveomics/Scripts/BedGraph.window.rb +71 -0
data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +102 -0
data/utils/enveomics/Scripts/BlastTab.addlen.rb +63 -0
data/utils/enveomics/Scripts/BlastTab.advance.bash +48 -0
data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +55 -0
data/utils/enveomics/Scripts/BlastTab.catsbj.pl +104 -0
data/utils/enveomics/Scripts/BlastTab.cogCat.rb +76 -0
data/utils/enveomics/Scripts/BlastTab.filter.pl +47 -0
data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +194 -0
data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +104 -0
data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +157 -0
data/utils/enveomics/Scripts/BlastTab.recplot2.R +48 -0
data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +86 -0
data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +119 -0
data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +86 -0
data/utils/enveomics/Scripts/BlastTab.subsample.pl +47 -0
data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +114 -0
data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +90 -0
data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +123 -0
data/utils/enveomics/Scripts/Chao1.pl +97 -0
data/utils/enveomics/Scripts/CharTable.classify.rb +234 -0
data/utils/enveomics/Scripts/EBIseq2tax.rb +83 -0
data/utils/enveomics/Scripts/FastA.N50.pl +60 -0
data/utils/enveomics/Scripts/FastA.extract.rb +152 -0
data/utils/enveomics/Scripts/FastA.filter.pl +52 -0
data/utils/enveomics/Scripts/FastA.filterLen.pl +28 -0
data/utils/enveomics/Scripts/FastA.filterN.pl +60 -0
data/utils/enveomics/Scripts/FastA.fragment.rb +100 -0
data/utils/enveomics/Scripts/FastA.gc.pl +42 -0
data/utils/enveomics/Scripts/FastA.interpose.pl +93 -0
data/utils/enveomics/Scripts/FastA.length.pl +38 -0
data/utils/enveomics/Scripts/FastA.mask.rb +89 -0
data/utils/enveomics/Scripts/FastA.per_file.pl +36 -0
data/utils/enveomics/Scripts/FastA.qlen.pl +57 -0
data/utils/enveomics/Scripts/FastA.rename.pl +65 -0
data/utils/enveomics/Scripts/FastA.revcom.pl +23 -0
data/utils/enveomics/Scripts/FastA.sample.rb +98 -0
data/utils/enveomics/Scripts/FastA.slider.pl +85 -0
data/utils/enveomics/Scripts/FastA.split.pl +55 -0
data/utils/enveomics/Scripts/FastA.split.rb +79 -0
data/utils/enveomics/Scripts/FastA.subsample.pl +131 -0
data/utils/enveomics/Scripts/FastA.tag.rb +65 -0
data/utils/enveomics/Scripts/FastA.toFastQ.rb +69 -0
data/utils/enveomics/Scripts/FastA.wrap.rb +48 -0
data/utils/enveomics/Scripts/FastQ.filter.pl +54 -0
data/utils/enveomics/Scripts/FastQ.interpose.pl +90 -0
data/utils/enveomics/Scripts/FastQ.maskQual.rb +89 -0
data/utils/enveomics/Scripts/FastQ.offset.pl +90 -0
data/utils/enveomics/Scripts/FastQ.split.pl +53 -0
data/utils/enveomics/Scripts/FastQ.tag.rb +70 -0
data/utils/enveomics/Scripts/FastQ.test-error.rb +81 -0
data/utils/enveomics/Scripts/FastQ.toFastA.awk +24 -0
data/utils/enveomics/Scripts/GFF.catsbj.pl +127 -0
data/utils/enveomics/Scripts/GenBank.add_fields.rb +84 -0
data/utils/enveomics/Scripts/HMM.essential.rb +351 -0
data/utils/enveomics/Scripts/HMM.haai.rb +168 -0
data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +83 -0
data/utils/enveomics/Scripts/JPlace.distances.rb +88 -0
data/utils/enveomics/Scripts/JPlace.to_iToL.rb +320 -0
data/utils/enveomics/Scripts/M5nr.getSequences.rb +81 -0
data/utils/enveomics/Scripts/MeTaxa.distribution.pl +198 -0
data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +35 -0
data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +49 -0
data/utils/enveomics/Scripts/NCBIacc2tax.rb +92 -0
data/utils/enveomics/Scripts/Newick.autoprune.R +27 -0
data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +228 -0
data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +32 -0
data/utils/enveomics/Scripts/RefSeq.download.bash +48 -0
data/utils/enveomics/Scripts/SRA.download.bash +55 -0
data/utils/enveomics/Scripts/TRIBS.plot-test.R +36 -0
data/utils/enveomics/Scripts/TRIBS.test.R +39 -0
data/utils/enveomics/Scripts/Table.barplot.R +31 -0
data/utils/enveomics/Scripts/Table.df2dist.R +30 -0
data/utils/enveomics/Scripts/Table.filter.pl +61 -0
data/utils/enveomics/Scripts/Table.merge.pl +77 -0
data/utils/enveomics/Scripts/Table.prefScore.R +60 -0
data/utils/enveomics/Scripts/Table.replace.rb +69 -0
data/utils/enveomics/Scripts/Table.round.rb +63 -0
data/utils/enveomics/Scripts/Table.split.pl +57 -0
data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +227 -0
data/utils/enveomics/Scripts/VCF.KaKs.rb +147 -0
data/utils/enveomics/Scripts/VCF.SNPs.rb +88 -0
data/utils/enveomics/Scripts/aai.rb +421 -0
data/utils/enveomics/Scripts/ani.rb +362 -0
data/utils/enveomics/Scripts/anir.rb +137 -0
data/utils/enveomics/Scripts/clust.rand.rb +102 -0
data/utils/enveomics/Scripts/gi2tax.rb +103 -0
data/utils/enveomics/Scripts/in_silico_GA_GI.pl +96 -0
data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
data/utils/enveomics/Scripts/lib/enveomics.R +1 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/anir.rb +293 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/bm_set.rb +175 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +24 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/errors.rb +17 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/gmm_em.rb +30 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +253 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/match.rb +88 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +182 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/rbm.rb +49 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +74 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +237 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/stats/rand.rb +31 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/stats/sample.rb +152 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/stats.rb +3 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/utils.rb +74 -0
data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +135 -0
data/utils/enveomics/Scripts/ogs.annotate.rb +88 -0
data/utils/enveomics/Scripts/ogs.core-pan.rb +160 -0
data/utils/enveomics/Scripts/ogs.extract.rb +125 -0
data/utils/enveomics/Scripts/ogs.mcl.rb +186 -0
data/utils/enveomics/Scripts/ogs.rb +104 -0
data/utils/enveomics/Scripts/ogs.stats.rb +131 -0
data/utils/enveomics/Scripts/rbm-legacy.rb +172 -0
data/utils/enveomics/Scripts/rbm.rb +108 -0
data/utils/enveomics/Scripts/sam.filter.rb +148 -0
data/utils/enveomics/Tests/Makefile +10 -0
data/utils/enveomics/Tests/Mgen_M2288.faa +3189 -0
data/utils/enveomics/Tests/Mgen_M2288.fna +8282 -0
data/utils/enveomics/Tests/Mgen_M2321.fna +8288 -0
data/utils/enveomics/Tests/Nequ_Kin4M.faa +2970 -0
data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +7 -0
data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +17 -0
data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +137 -0
data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +123 -0
data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +200 -0
data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +55 -0
data/utils/enveomics/Tests/alkB.nwk +1 -0
data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +13 -0
data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +17 -0
data/utils/enveomics/Tests/hiv1.faa +59 -0
data/utils/enveomics/Tests/hiv1.fna +134 -0
data/utils/enveomics/Tests/hiv2.faa +70 -0
data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +233 -0
data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +1 -0
data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +233 -0
data/utils/enveomics/Tests/phyla_counts.tsv +10 -0
data/utils/enveomics/Tests/primate_lentivirus.ogs +11 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +9 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +8 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +6 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +9 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +6 -0
data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +6 -0
data/utils/enveomics/build_enveomics_r.bash +45 -0
data/utils/enveomics/enveomics.R/DESCRIPTION +31 -0
data/utils/enveomics/enveomics.R/NAMESPACE +39 -0
data/utils/enveomics/enveomics.R/R/autoprune.R +155 -0
data/utils/enveomics/enveomics.R/R/barplot.R +184 -0
data/utils/enveomics/enveomics.R/R/cliopts.R +135 -0
data/utils/enveomics/enveomics.R/R/df2dist.R +154 -0
data/utils/enveomics/enveomics.R/R/growthcurve.R +331 -0
data/utils/enveomics/enveomics.R/R/prefscore.R +79 -0
data/utils/enveomics/enveomics.R/R/recplot.R +354 -0
data/utils/enveomics/enveomics.R/R/recplot2.R +1631 -0
data/utils/enveomics/enveomics.R/R/tribs.R +583 -0
data/utils/enveomics/enveomics.R/R/utils.R +80 -0
data/utils/enveomics/enveomics.R/README.md +81 -0
data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +16 -0
data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +16 -0
data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +16 -0
data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +25 -0
data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +46 -0
data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +23 -0
data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +47 -0
data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +23 -0
data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +23 -0
data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +40 -0
data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +103 -0
data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +67 -0
data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +24 -0
data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +19 -0
data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +45 -0
data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +44 -0
data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +47 -0
data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +75 -0
data/utils/enveomics/enveomics.R/man/enve.prefscore.Rd +50 -0
data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +44 -0
data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +139 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +45 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +24 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +77 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +25 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +21 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +19 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +19 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +47 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +29 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +18 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +45 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +36 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +19 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +19 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +27 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +52 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +17 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +51 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +43 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +82 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +59 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +27 -0
data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +36 -0
data/utils/enveomics/enveomics.R/man/enve.selvector.Rd +23 -0
data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +68 -0
data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +28 -0
data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +27 -0
data/utils/enveomics/enveomics.R/man/growth.curves.Rd +14 -0
data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +13 -0
data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +78 -0
data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +46 -0
data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +45 -0
data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +125 -0
data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +19 -0
data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +19 -0
data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +19 -0
data/utils/enveomics/globals.mk +8 -0
data/utils/enveomics/manifest.json +9 -0
data/utils/multitrim/Multitrim How-To.pdf +0 -0
data/utils/multitrim/README.md +67 -0
data/utils/multitrim/multitrim.py +1555 -0
data/utils/multitrim/multitrim.yml +13 -0
metadata +301 -5

data/utils/enveomics/Manifest/Tasks/blasttab.json ADDED Viewed

@@ -0,0 +1,790 @@
+{
+  "tasks": [
+    {
+      "task": "BlastTab.addlen.rb",
+      "description": ["Appends an extra column to a tabular BLAST with the",
+        "length of the query or the subject sequence."],
+      "help_arg": "--help",
+      "options": [
+        {
+          "opt": "--fasta",
+          "arg": "in_file",
+          "description": "FastA file of the query or the subject.",
+          "mandatory": true
+        },
+        {
+          "opt": "--subject",
+          "description": ["Use the subject column of the BLAST, by default the",
+            "query column is used."],
+          "note": "If used, the input FastA must contain subject sequences."
+        },
+        {
+          "opt": "--quiet",
+          "description": "Run quietly (no STDERR output)."
+        },
+        "<",
+        {
+          "arg": "in_file",
+          "description": "Input tabular BLAST file.",
+          "mandatory": true
+        },
+        ">",
+        {
+          "arg": "out_file",
+          "description": "Output tabular BLAST file with additional column.",
+          "mandatory": true
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.advance.bash",
+      "description": ["Calculates the percentage of a partial BLAST result.",
+        "The value produced slightly underestimates the actual advance, due to",
+        "un-flushed output and trailing queries that could be processed but",
+        "generate no results."],
+      "help_arg": "",
+      "requires": [ { "interpreter": "awk" } ],
+      "options": [
+        {
+          "name": "Blast",
+          "arg": "in_file",
+          "description": "Incomplete Tabular BLAST output.",
+          "mandatory": true
+        },
+        {
+          "name": "Query FastA",
+          "arg": "in_file",
+          "description": "FastA file with query sequences.",
+          "mandatory": true
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.best_hit_sorted.pl",
+      "description": "Filters a tabular BLAST to retain only the best matches.",
+      "help_arg": "--help",
+      "see_also": ["BlastTab.topHits_sorted.rb"],
+      "options": [
+        {
+          "name": "Sort",
+          "arg": "select",
+          "values": ["sort","cat"],
+          "mandatory": true,
+          "description": ["Use 'sort' if your BLAST is not pre-sorted by the",
+            "first column (or if you're not sure). Use 'cat' otherwise."]
+        },
+        {
+          "name": "Input BLAST",
+          "arg": "in_file",
+          "multiple_sep": " ",
+          "mandatory": true,
+          "description": "Tabular BLAST file to filter."
+        },
+        "|",
+        { "arg": "task" },
+        ">",
+        {
+          "name": "Output BLAST",
+          "arg": "out_file",
+          "mandatory": true,
+          "description": "Filtered tabular BLAST output."
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.catsbj.pl",
+      "description": ["Generates a list of hits from a BLAST result",
+        "concatenating the subject sequences. This can be used, e.g., to",
+        "analyze BLAST results against draft genomes. This script creates two",
+        "files using <map.bls> as prefix with extensions .rec (for the",
+        "recruitment plot) and .lim (for the limits of the different sequences",
+        "in <seq.fa>)."],
+      "see_also": ["BlastTab.recplot2.R", "GFF.catsbj.pl"],
+      "help_arg": "-h",
+      "options": [
+         {
+           "opt": "-i",
+           "name": "Identity",
+           "description": "Minimum identity (in %) to report a result.",
+           "arg": "float",
+           "default": 70.0
+         },
+         {
+           "opt": "-l",
+           "name": "Length",
+           "description": "Minimum alignment length to report a result.",
+           "default": 60.0,
+           "arg": "float"
+         },
+         {
+           "opt": "-s",
+           "name": "Subset",
+           "description": ["The FastA provided is to be treated as a subset of",
+             "the subject. By default, it expects all the BLAST subjects to be",
+             "present in the FastA."]
+         },
+         {
+           "opt": "-q",
+           "name": "Quiet",
+           "description": "Run quietly."
+         },
+         {
+           "name": "seq.fa",
+           "description": "Subject sequences (ref) in FastA format.",
+           "mandatory": true,
+           "arg": "in_file"
+         },
+         {
+           "name": "map.bls",
+           "description": ["Mapping of the reads to the reference in Tabular",
+             "BLAST format."],
+           "mandatory": true,
+           "arg": "in_file"
+         }
+      ]
+    },
+    {
+      "task": "BlastTab.cogCat.rb",
+      "description": ["Replaces the COG gene IDs in a BLAST with the COG",
+        "category."],
+      "help_arg": "--help",
+      "options": [
+        {
+          "opt": "--whog",
+          "arg": "in_file",
+          "mandatory": true,
+          "description": "COG's 'whog' file."
+        },
+        {
+          "opt": "--blast",
+          "arg": "in_file",
+          "mandatory": true,
+          "description": "Tabular BLAST file with COG IDs as subject."
+        },
+        {
+          "opt": "--cog",
+          "description": "If set, returns the COG ID, not the COG category."
+        },
+        {
+          "opt": "--desc",
+          "description": "Includes COG description (requires --cog)."
+        },
+        {
+          "opt": "--noverbose",
+          "description": "Run quietly, but show warnings."
+        },
+        {
+          "opt": "--quiet",
+          "description": "Run quietly."
+        },
+        ">",
+        {
+          "arg": "out_file",
+          "name": "COG Blast",
+          "mandatory": true,
+          "description": "Tabular BLAST with COG IDs or categories as subject."
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.filter.pl",
+      "description": ["Extracts a subset of hits (queries or subjects) from a",
+        "tabular BLAST."],
+      "help_arg": "",
+      "see_also": "BlastTab.subsample.pl",
+      "options": [
+        {
+          "name": "Subject",
+          "opt": "-s",
+          "description": ["If set, assumes that list.txt contains subject IDs.",
+            "By default: assumes query IDs."]
+        },
+        {
+          "name": "Inverse",
+          "opt": "-i",
+          "description": ["If set, reports the inverse of the list (i.e.,",
+            "reports only hits absent in the list)."]
+        },
+        {
+          "name": "list.txt",
+          "arg": "in_file",
+          "mandatory": true,
+          "description": "List of IDs to extract."
+        },
+        {
+          "name": "blast.txt",
+          "arg": "in_file",
+          "mandatory": true,
+          "description": "Tabular BLAST file containing the superset of hits."
+        },
+        ">",
+        {
+          "name": "subset.txt",
+          "arg": "out_file",
+          "mandatory": true,
+          "description": "Tabular BLAST file to be created."
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.pairedHits.rb",
+      "description": "Identifies the best hits of paired-reads.",
+      "help_arg": "--help",
+      "options": [
+        {
+          "opt": "--blast",
+          "arg": "in_file",
+          "mandatory": true,
+          "description": "Input Tabular BLAST file.",
+          "note": ["This script assumes that paired hits are next to each",
+            "other. If this is not the case (e.g., because the blast was",
+            "concatenated), you must sort the input before running this",
+            "script."]
+        },
+        {
+          "name": "Min score",
+          "opt": "--minscore",
+          "arg": "float",
+          "default": 0.0,
+          "description": "Minimum (summed) Bit-Score to consider a pair-match."
+        },
+        {
+          "name": "Best hits",
+          "opt": "--besthits",
+          "arg": "integer",
+          "default": 0,
+          "description": ["Outputs top best-hits only (use 0 to output all the",
+            "paired hits)."]
+        },
+        {
+          "name": "Orientation",
+          "opt": "--orient",
+          "arg": "select",
+          "values": [0,1,2,3,4],
+          "default": 0,
+          "description": ["Checks the orientation of the hit. Values are: 0,",
+            "no checking; 1, same direction; 2, inwards; 3, outwards; 4,",
+            "different direction (i.e., 2 or 3)."]
+        },
+        {
+          "name": "Sister prefix",
+          "opt": "--sisprefix",
+          "arg": "string",
+          "default": "_",
+          "description": ["Sister read number prefix in the name of the reads.",
+            "Escape characters such as dots (\\.), parentheses or brackets (\\(, \\), \\[,",
+            "\\]), and other characters with special meaning in regular",
+            "expressions (\\*, \\+, \\^, \\$, \\|). This prefix allows regular",
+            "expressions (for example, use ':|\\.' to use any of colon or",
+            "dot). Note that the prefix will not be included in the base name",
+            "reported in the output."]
+        },
+        ">",
+        {
+          "arg": "out_file",
+          "mandatory": true,
+          "description": ["Tab-delimited flat file, with the following",
+            "columns: (1) Query ID (without the \"sister\" identifier). (2)",
+            "Subject ID. (3) Bit score (summed from both sister reads). (4/5)",
+            "From/To (subject) coordinates for read 1. (6/7) From/To (subject)",
+            "coordinates for read 2. (8) Reads orientation (1: same direction,",
+            "2: inwards, 3: outwards). (9) Estimated insert size."]
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.seqdepth.pl",
+      "description": "Estimates the sequencing depth of subject sequences.",
+      "help_arg": "",
+      "see_also": ["BlastTab.seqdepth_ZIP.pl", "BlastTab.seqdepth_nomedian.pl",
+        "BedGraph.tad.rb"],
+      "options": [
+        "cat",
+        {
+          "arg": "in_file",
+          "multiple_sep": " ",
+          "mandatory": true,
+          "description": ["One or more Tabular BLAST files of reads vs genes",
+            "(or contigs)."]
+        },
+        "|",
+        { "arg": "task" },
+        {
+          "name": "genes_or_ctgs.fna",
+          "arg": "in_file",
+          "mandatory": true,
+          "description": ["A FastA file containing the genes or the contigs",
+            "(db)."]
+        },
+        ">",
+        {
+          "name": "genes_or_ctgs.cov",
+          "arg": "out_file",
+          "mandatory": true,
+          "description": ["A tab-delimited file with the following columns:",
+            "(1) Subject ID. (2) Average sequencing depth. (3) Median",
+            "sequencing depth. (4) Number of mapped reads. (5) Length of the",
+            "subject sequence."]
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.seqdepth_ZIP.pl",
+      "description": ["Estimates the average sequencing depth of subject",
+        "sequences (genes or contigs) assuming a Zero-Inflated Poisson",
+        "distribution (ZIP) to correct for non-covered positions. It uses the",
+        "corrected method of moments estimators (CMMEs) as described by",
+        "Beckett et al [1]. Note that [1] has a mistake in eq. (2.4), that",
+        "should be: pi-hat-MM = 1 - (X-bar / lambda-hat-MM). Also note that a",
+        "more elaborate mixture distribution can arise from coverage",
+        "histograms (e.g., see [2] for an additional correction called 'tail",
+        "distribution' and mixtures involving negative binomial) so take these",
+        "results cum grano salis.\n [1]",
+        "http://anisette.ucs.louisiana.edu/Academic/Sciences/MATH/stage/stat2012.pdf\n",
+        "[2] Lindner et al, Bioinformatics, 2013."],
+      "help_arg": "",
+      "see_also": ["BlastTab.seqdepth.pl", "BlastTab.seqdepth_nomedian.pl",
+        "BedGraph.tad.rb"],
+      "options": [
+        "cat",
+        {
+          "name": "blast",
+          "arg": "in_file",
+          "multiple_sep": " ",
+          "mandatory": true,
+          "description": ["One or more Tabular BLAST files of reads vs genes",
+            "(or contigs)."]
+        },
+        "|",
+        { "arg": "task" },
+        {
+          "name": "genes_or_ctgs.fna",
+          "arg": "in_file",
+          "mandatory": true,
+          "description": ["A FastA file containing the genes or the contigs",
+            "(db)."]
+        },
+        ">",
+        {
+          "name": "genes_or_ctgs.cov",
+          "arg": "out_file",
+          "mandatory": true,
+          "description": ["Output file with the following columns:",
+            "(1) Subject ID.",
+            "(2) Estimated average sequencing depth (CMME lambda).",
+            "(3) Zero-inflation (CMME pi).",
+            "(4) Observed average sequencing depth.",
+            "(5) Observed median sequencing depth.",
+            "(6) Observed median sequencing depth excluding zeroes.",
+            "(7) Number of mapped reads.",
+            "(8) Length of the subject sequence."]
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.seqdepth_nomedian.pl",
+      "description": ["Estimates the sequencing depth of subject",
+        "sequences. The values reported by this script may differ from those",
+        "of BlastTab.seqdepth.pl, because this script uses the aligned length",
+        "of the read while BlastTab.seqdepth.pl uses the aligned length of the",
+        "subject sequence."],
+      "help_arg": "",
+      "see_also": ["BlastTab.seqdepth.pl", "BlastTab.seqdepth_ZIP.pl"],
+      "options": [
+        "cat",
+        {
+          "arg": "in_file",
+          "multiple_sep": " ",
+          "mandatory": true,
+          "description": ["One or more Tabular BLAST files of reads vs genes",
+            "(or contigs)."]
+        },
+        "|",
+        { "arg": "task" },
+        {
+          "name": "genes_or_ctgs.fna",
+          "arg": "in_file",
+          "mandatory": true,
+          "description": ["A FastA file containing the genes or the contigs",
+            "(db)."]
+        },
+        ">",
+        {
+          "name": "genes_or_ctgs.cov",
+          "arg": "out_file",
+          "mandatory": true,
+          "description": ["A tab-delimited file with the following columns:",
+            "(1) Subject ID. (2) Average sequencing depth. (3) Number of",
+            "mapped reads. (4) Length of the subject sequence."]
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.subsample.pl",
+      "description": ["Filters a BLAST output including only the hits produced",
+        "by any of the given sequences as query."],
+      "help_arg": "",
+      "see_also": "BlastTab.filter.pl",
+      "options": [
+        {
+          "name": "blast.tab",
+          "mandatory": true,
+          "arg": "in_file",
+          "description": "BLAST output to be filtered (tabular format)."
+        },
+        {
+          "name": "sample.fa",
+          "mandatory": true,
+          "arg": "in_file",
+          "description": "Sequences to use as query (FastA format)."
+        },
+        ">",
+        {
+          "arg": "out_file",
+          "mandatory": true,
+          "description": "The filtered BLAST output (tabular format)."
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.sumPerHit.pl",
+      "description": ["Sums the weights of all the queries hitting each",
+        "subject. Often (but not necessarily) the BLAST files contain only",
+        "best matches. The weights can be any number, but a common use of this",
+        "script is to add up counts (weights are integers). For example, in a",
+        "BLAST of predicted genes vs some annotation source, the weights could",
+        "be the number of reads recruited by each gene."],
+      "help_arg": "-h",
+      "options": [
+        {
+          "name": "Weights file",
+          "opt": "-w",
+          "arg": "in_file",
+          "description": ["A two-column tab-delimited file containing the",
+            "name (column 1) and the weight (column 2) of each query."]
+        },
+        {
+          "name": "Minimum score",
+          "opt": "-s",
+          "arg": "float",
+          "default": 0.0
+        },
+        {
+          "name": "Minimum identity (%)",
+          "opt": "-i",
+          "arg": "float",
+          "default": 0.0
+        },
+        {
+          "name": "Queries",
+          "opt": "-m",
+          "arg": "integer",
+          "default": 0,
+          "description": "Maximum number of queries. Set to 0 for all."
+        },
+        {
+          "name": "Normalize",
+          "opt": "-n",
+          "description": "Normalize weights by the number of hits per query."
+        },
+        {
+          "name": "Include zeroes",
+          "opt": "-z",
+          "description": ["Add zero when weight is not found (by default:",
+            "doesn't list them)."]
+        },
+        {
+          "name": "Run quietly",
+          "opt": "-q"
+        },
+        {
+          "name": "blast",
+          "arg": "in_file",
+          "multiple_sep": " ",
+          "mandatory": true,
+          "description": "One or more BLAST files."
+        },
+        ">",
+        {
+          "arg": "out_file",
+          "mandatory": true,
+          "description": ["A two-column tab-delimited file containing the",
+            "summed weights per hit."]
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.taxid2taxrank.pl",
+      "description": ["Takes a BLAST with NCBI Taxonomy IDs as subjects and",
+        "replaces them by names at a given taxonomic rank."],
+      "help_arg": "",
+      "options": [
+        {
+          "name": "tax_blast.txt",
+          "mandatory": true,
+          "arg": "in_file",
+          "description": ["BLAST output, where subject IDs are NCBI Taxonomy",
+            "IDs."]
+        },
+        {
+          "name": "nodes.dmp",
+          "mandatory": true,
+          "arg": "in_file",
+          "description": "Nodes file from NCBI Taxonomy.",
+          "source_url": "ftp://ftp.ncbi.nih.gov/pub/taxonomy/taxdump.tar.gz"
+        },
+        {
+          "name": "names.dmp",
+          "mandatory": true,
+          "arg": "in_file",
+          "description": "Names file from NCBI Taxonomy.",
+          "source_url": "ftp://ftp.ncbi.nih.gov/pub/taxonomy/taxdump.tar.gz"
+        },
+        {
+          "name": "rank",
+          "arg": "string",
+          "mandatory": true,
+          "default": "genus",
+          "description": ["The rank to be reported. All the reported nodes",
+            "will have the same rank. To see supported values, run:\n",
+            "`cut -f 5 nodes.dmp | sort -u`."]
+        },
+        {
+          "name": "Best-hit",
+          "arg": "select",
+          "values": ["yes", "no"],
+          "default": "yes",
+          "description": ["Should it take into account the best hit per query",
+            "only? This is: should it filter by best-hit?"]
+        },
+        ">",
+        {
+          "name": "taxrank_list.txt",
+          "arg": "out_file",
+          "mandatory": true,
+          "description": ["BLAST-like output, where subject IDs are Taxonomy",
+            "names."]
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.topHits_sorted.rb",
+      "description": "Reports the top-N best hits of a BLAST.",
+      "help_arg": "--help",
+      "see_also": "BlastTab.best_hit_sorted.pl",
+      "options": [
+        {
+          "name": "Sort",
+          "arg": "select",
+          "values": ["sort","cat"],
+          "mandatory": true,
+          "description": ["Use 'sort' if your BLAST is not pre-sorted by the",
+            "first column (or if you're not sure). Use 'cat' otherwise."]
+        },
+        {
+          "arg": "in_file",
+          "mandatory": true,
+          "description": "Tabular BLAST file."
+        },
+        "|",
+        { "arg": "task" },
+        "--blast",
+        "-",
+        {
+          "name": "Output",
+          "opt": "--out",
+          "arg": "out_file",
+          "mandatory": true,
+          "description": [
+            "Output filtered BLAST file.",
+            "Supports compression with .gz extension."
+          ]
+        },
+        {
+          "opt": "--top",
+          "arg": "integer",
+          "default": 5,
+          "description": "Maximum number of hits to report for each query."
+        },
+        {
+          "opt": "--sort-by",
+          "arg": "select",
+          "values": ["bitscore", "evalue", "identity", "length", "no"],
+          "default": "bitscore",
+          "description": "Parameter used to detect the 'best' hits."
+        },
+        {
+          "opt": "--quiet",
+          "description": "Run quietly."
+        }
+      ]
+    },
+    {
+      "task": "BlastTab.recplot2.R",
+      "description": ["Produce recruitment plot objects provided that",
+        "BlastTab.catsbj.pl has been previously executed."],
+      "help_arg": "--help",
+      "requires": [
+        { "r_package": "optparse" },
+        { "r_package": "enveomics.R" }
+      ],
+      "see_also": ["BlastTab.catsbj.pl", "GFF.catsbj.pl",
+        "RecPlot2.compareIdentities.R"],
+      "options": [
+        {
+          "opt": "--prefix",
+          "arg": "in_file",
+          "mandatory": true,
+          "description": ["Path to the prefix of the BlastTab.catsbj.pl output",
+            "files. At least the files .rec and .lim must exist with this",
+            "prefix."]
+        },
+        {
+          "opt": "--pos-breaks",
+          "arg": "integer",
+          "default": 1000,
+          "description": "Breaks in the positions histogram."
+        },
+        {
+          "opt": "--pos-breaks-tsv",
+          "arg": "in_file",
+          "description": ["File with (absolute) coordinates of breaks in the",
+            "position histogram."]
+        },
+        {
+          "opt": "--id-breaks",
+          "arg": "integer",
+          "default": 300,
+          "description": ["Breaks in the identity histogram."]
+        },
+        {
+          "opt": "--id-free-range",
+          "description": ["Indicates that the range should be freely set from",
+            "the observed values. Otherwise, 70-100% is included in the",
+            "identity histogram (default)."]
+        },
+        {
+          "opt": "--id-metric",
+          "arg": "select",
+          "values": ["identity", "corrected identity", "bit score"],
+          "default": "identity",
+          "description": ["Metric of identity to be used (Y-axis). Corrected",
+            "identity is only supported if the original BLAST file included",
+            "sequence lengths."]
+        },
+        {
+          "opt": "--id-summary",
+          "arg": "string",
+          "default": "sum",
+          "description": "Function summarizing the identity bins."
+        },
+        {
+          "opt": "--id-cutoff",
+          "arg": "float",
+          "default": 95.0,
+          "description": ["Cutoff of identity metric above which the hits are",
+            "considered 'in-group'. The 95% identity corresponds to the",
+            "expectation of ANI>95% within species."]
+        },
+        {
+          "opt": "--threads",
+          "arg": "integer",
+          "default": 2,
+          "description": "Number of threads to use."
+        },
+        {
+          "opt": "--no-verbose",
+          "description": "Run quietly (do not report the advance)."
+        },
+        {
+          "opt": "--peaks-col",
+          "arg": "string",
+          "default": "NA",
+          "description": ["Color of peaks, mandatory for peak-finding (e.g.,",
+            "darkred)."]
+        },
+        {
+          "opt": "--peaks-method",
+          "arg": "select",
+          "values": ["emauto","em","mower"],
+          "default": "emauto",
+          "description": "Method to detect peaks."
+        },
+        {
+          "name": "R Object Output",
+          "arg": "out_file",
+          "mandatory": true,
+          "description": ["RecPlot2 object that can be re-plotted using",
+            "the R function plot."]
+        },
+        {
+          "name": "Graphical Output",
+          "arg": "out_file",
+          "description": "Recruitment plot in PDF."
+        },
+        {
+          "name": "Width",
+          "arg": "float",
+          "description": "Width of the plot in inches (7 by default)."
+        },
+        {
+          "name": "Height",
+          "arg": "float",
+          "description": "Height of the plot in inches (7 by default)."
+        }
+      ]
+    },
+    {
+      "task": "RecPlot2.compareIdentities.R",
+      "description": ["Calculates the difference between identity",
+        "distributions of two recruitment plots."],
+      "help_arg": "--help",
+      "requires": [
+        { "r_package": "optparse" },
+        { "r_package": "enveomics.R" }
+      ],
+      "see_also": [ "BlastTab.recplot2.R" ],
+      "options": [
+        {
+          "opt": "--method",
+          "arg": "string",
+          "default": "hellinger",
+          "description": ["Distance method to use. This should be (an",
+            "unambiguous abbreviation of) one of:",
+            "'hellinger' (Hellinger, 1909, doi:10.1515/crll.1909.136.210),",
+            "'bhattacharyya' (Bhattacharyya, 1943, Bull. Calcutta Math. Soc.",
+            "35), 'kl' or 'kullback–leibler' (Kullback & Leibler, 1951,",
+            "doi:10.1214/aoms/1177729694), or 'euclidean'."]
+        },
+        {
+          "opt": "--pseudocounts",
+          "arg": "float",
+          "default": 0.0,
+          "description": ["Smoothing parameter for Laplace smoothing. Use 0",
+            "for no smoothing, or 1 for add-one smoothing."]
+        },
+        {
+          "opt": "--max-deviation",
+          "arg": "float",
+          "description": ["Maximum mean deviation between identity breaks",
+            "tolerated (as percent identity). Difference in number of",
+            "id.breaks is never tolerated."]
+        },
+        {
+          "arg": "in_file",
+          "name": "RecPlot A",
+          "mandatory": true,
+          "description": ["File containing the R object `rp` for the first",
+            "recruitment plot."]
+        },
+        {
+          "arg": "in_file",
+          "name": "RecPlot B",
+          "mandatory": true,
+          "description": ["File containing the R object `rp` for the second",
+            "recruitment plot."]
+        }
+      ]
+    }
+  ]
+}