miga-base 1.2.15.2 → 1.2.15.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (306) hide show
  1. checksums.yaml +4 -4
  2. data/lib/miga/cli/action/download/gtdb.rb +4 -1
  3. data/lib/miga/cli/action/gtdb_get.rb +4 -0
  4. data/lib/miga/daemon.rb +4 -1
  5. data/lib/miga/lair.rb +6 -4
  6. data/lib/miga/remote_dataset/download.rb +3 -2
  7. data/lib/miga/remote_dataset.rb +25 -7
  8. data/lib/miga/taxonomy.rb +6 -0
  9. data/lib/miga/version.rb +2 -2
  10. metadata +6 -302
  11. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Archaea_SCG.hmm +0 -41964
  12. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Bacteria_SCG.hmm +0 -32439
  13. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Complete_SCG_DB.hmm +0 -62056
  14. data/utils/FastAAI/FastAAI +0 -3659
  15. data/utils/FastAAI/FastAAI-legacy/FastAAI +0 -1336
  16. data/utils/FastAAI/FastAAI-legacy/kAAI_v1.0_virus.py +0 -1296
  17. data/utils/FastAAI/README.md +0 -84
  18. data/utils/enveomics/Docs/recplot2.md +0 -244
  19. data/utils/enveomics/Examples/aai-matrix.bash +0 -66
  20. data/utils/enveomics/Examples/ani-matrix.bash +0 -66
  21. data/utils/enveomics/Examples/essential-phylogeny.bash +0 -105
  22. data/utils/enveomics/Examples/unus-genome-phylogeny.bash +0 -100
  23. data/utils/enveomics/LICENSE.txt +0 -73
  24. data/utils/enveomics/Makefile +0 -52
  25. data/utils/enveomics/Manifest/Tasks/aasubs.json +0 -103
  26. data/utils/enveomics/Manifest/Tasks/blasttab.json +0 -790
  27. data/utils/enveomics/Manifest/Tasks/distances.json +0 -161
  28. data/utils/enveomics/Manifest/Tasks/fasta.json +0 -802
  29. data/utils/enveomics/Manifest/Tasks/fastq.json +0 -291
  30. data/utils/enveomics/Manifest/Tasks/graphics.json +0 -126
  31. data/utils/enveomics/Manifest/Tasks/mapping.json +0 -137
  32. data/utils/enveomics/Manifest/Tasks/ogs.json +0 -382
  33. data/utils/enveomics/Manifest/Tasks/other.json +0 -906
  34. data/utils/enveomics/Manifest/Tasks/remote.json +0 -355
  35. data/utils/enveomics/Manifest/Tasks/sequence-identity.json +0 -650
  36. data/utils/enveomics/Manifest/Tasks/tables.json +0 -308
  37. data/utils/enveomics/Manifest/Tasks/trees.json +0 -68
  38. data/utils/enveomics/Manifest/Tasks/variants.json +0 -111
  39. data/utils/enveomics/Manifest/categories.json +0 -165
  40. data/utils/enveomics/Manifest/examples.json +0 -162
  41. data/utils/enveomics/Manifest/tasks.json +0 -4
  42. data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +0 -69
  43. data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +0 -1
  44. data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +0 -1
  45. data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +0 -1
  46. data/utils/enveomics/Pipelines/assembly.pbs/README.md +0 -189
  47. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +0 -112
  48. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +0 -23
  49. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +0 -44
  50. data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +0 -50
  51. data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +0 -37
  52. data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +0 -68
  53. data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +0 -49
  54. data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +0 -80
  55. data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +0 -57
  56. data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +0 -63
  57. data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +0 -38
  58. data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +0 -73
  59. data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +0 -21
  60. data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +0 -72
  61. data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +0 -98
  62. data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +0 -1
  63. data/utils/enveomics/Pipelines/blast.pbs/README.md +0 -127
  64. data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +0 -109
  65. data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +0 -128
  66. data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +0 -16
  67. data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +0 -22
  68. data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +0 -26
  69. data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +0 -89
  70. data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +0 -29
  71. data/utils/enveomics/Pipelines/idba.pbs/README.md +0 -49
  72. data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +0 -95
  73. data/utils/enveomics/Pipelines/idba.pbs/run.pbs +0 -56
  74. data/utils/enveomics/Pipelines/trim.pbs/README.md +0 -54
  75. data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +0 -70
  76. data/utils/enveomics/Pipelines/trim.pbs/run.pbs +0 -130
  77. data/utils/enveomics/README.md +0 -42
  78. data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +0 -171
  79. data/utils/enveomics/Scripts/Aln.cat.rb +0 -221
  80. data/utils/enveomics/Scripts/Aln.convert.pl +0 -35
  81. data/utils/enveomics/Scripts/AlphaDiversity.pl +0 -152
  82. data/utils/enveomics/Scripts/BedGraph.tad.rb +0 -93
  83. data/utils/enveomics/Scripts/BedGraph.window.rb +0 -71
  84. data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +0 -102
  85. data/utils/enveomics/Scripts/BlastTab.addlen.rb +0 -63
  86. data/utils/enveomics/Scripts/BlastTab.advance.bash +0 -48
  87. data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +0 -55
  88. data/utils/enveomics/Scripts/BlastTab.catsbj.pl +0 -104
  89. data/utils/enveomics/Scripts/BlastTab.cogCat.rb +0 -76
  90. data/utils/enveomics/Scripts/BlastTab.filter.pl +0 -47
  91. data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +0 -194
  92. data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +0 -104
  93. data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +0 -157
  94. data/utils/enveomics/Scripts/BlastTab.recplot2.R +0 -48
  95. data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +0 -86
  96. data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +0 -119
  97. data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +0 -86
  98. data/utils/enveomics/Scripts/BlastTab.subsample.pl +0 -47
  99. data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +0 -114
  100. data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +0 -90
  101. data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +0 -123
  102. data/utils/enveomics/Scripts/Chao1.pl +0 -97
  103. data/utils/enveomics/Scripts/CharTable.classify.rb +0 -234
  104. data/utils/enveomics/Scripts/EBIseq2tax.rb +0 -83
  105. data/utils/enveomics/Scripts/FastA.N50.pl +0 -60
  106. data/utils/enveomics/Scripts/FastA.extract.rb +0 -152
  107. data/utils/enveomics/Scripts/FastA.filter.pl +0 -52
  108. data/utils/enveomics/Scripts/FastA.filterLen.pl +0 -28
  109. data/utils/enveomics/Scripts/FastA.filterN.pl +0 -60
  110. data/utils/enveomics/Scripts/FastA.fragment.rb +0 -100
  111. data/utils/enveomics/Scripts/FastA.gc.pl +0 -42
  112. data/utils/enveomics/Scripts/FastA.interpose.pl +0 -93
  113. data/utils/enveomics/Scripts/FastA.length.pl +0 -38
  114. data/utils/enveomics/Scripts/FastA.mask.rb +0 -89
  115. data/utils/enveomics/Scripts/FastA.per_file.pl +0 -36
  116. data/utils/enveomics/Scripts/FastA.qlen.pl +0 -57
  117. data/utils/enveomics/Scripts/FastA.rename.pl +0 -65
  118. data/utils/enveomics/Scripts/FastA.revcom.pl +0 -23
  119. data/utils/enveomics/Scripts/FastA.sample.rb +0 -98
  120. data/utils/enveomics/Scripts/FastA.slider.pl +0 -85
  121. data/utils/enveomics/Scripts/FastA.split.pl +0 -55
  122. data/utils/enveomics/Scripts/FastA.split.rb +0 -79
  123. data/utils/enveomics/Scripts/FastA.subsample.pl +0 -131
  124. data/utils/enveomics/Scripts/FastA.tag.rb +0 -65
  125. data/utils/enveomics/Scripts/FastA.toFastQ.rb +0 -69
  126. data/utils/enveomics/Scripts/FastA.wrap.rb +0 -48
  127. data/utils/enveomics/Scripts/FastQ.filter.pl +0 -54
  128. data/utils/enveomics/Scripts/FastQ.interpose.pl +0 -90
  129. data/utils/enveomics/Scripts/FastQ.maskQual.rb +0 -89
  130. data/utils/enveomics/Scripts/FastQ.offset.pl +0 -90
  131. data/utils/enveomics/Scripts/FastQ.split.pl +0 -53
  132. data/utils/enveomics/Scripts/FastQ.tag.rb +0 -70
  133. data/utils/enveomics/Scripts/FastQ.test-error.rb +0 -81
  134. data/utils/enveomics/Scripts/FastQ.toFastA.awk +0 -24
  135. data/utils/enveomics/Scripts/GFF.catsbj.pl +0 -127
  136. data/utils/enveomics/Scripts/GenBank.add_fields.rb +0 -84
  137. data/utils/enveomics/Scripts/HMM.essential.rb +0 -351
  138. data/utils/enveomics/Scripts/HMM.haai.rb +0 -168
  139. data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +0 -83
  140. data/utils/enveomics/Scripts/JPlace.distances.rb +0 -88
  141. data/utils/enveomics/Scripts/JPlace.to_iToL.rb +0 -320
  142. data/utils/enveomics/Scripts/M5nr.getSequences.rb +0 -81
  143. data/utils/enveomics/Scripts/MeTaxa.distribution.pl +0 -198
  144. data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +0 -35
  145. data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +0 -49
  146. data/utils/enveomics/Scripts/NCBIacc2tax.rb +0 -92
  147. data/utils/enveomics/Scripts/Newick.autoprune.R +0 -27
  148. data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +0 -228
  149. data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +0 -32
  150. data/utils/enveomics/Scripts/RefSeq.download.bash +0 -48
  151. data/utils/enveomics/Scripts/SRA.download.bash +0 -55
  152. data/utils/enveomics/Scripts/TRIBS.plot-test.R +0 -36
  153. data/utils/enveomics/Scripts/TRIBS.test.R +0 -39
  154. data/utils/enveomics/Scripts/Table.barplot.R +0 -31
  155. data/utils/enveomics/Scripts/Table.df2dist.R +0 -30
  156. data/utils/enveomics/Scripts/Table.filter.pl +0 -61
  157. data/utils/enveomics/Scripts/Table.merge.pl +0 -77
  158. data/utils/enveomics/Scripts/Table.prefScore.R +0 -60
  159. data/utils/enveomics/Scripts/Table.replace.rb +0 -69
  160. data/utils/enveomics/Scripts/Table.round.rb +0 -63
  161. data/utils/enveomics/Scripts/Table.split.pl +0 -57
  162. data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +0 -227
  163. data/utils/enveomics/Scripts/VCF.KaKs.rb +0 -147
  164. data/utils/enveomics/Scripts/VCF.SNPs.rb +0 -88
  165. data/utils/enveomics/Scripts/aai.rb +0 -421
  166. data/utils/enveomics/Scripts/ani.rb +0 -362
  167. data/utils/enveomics/Scripts/anir.rb +0 -137
  168. data/utils/enveomics/Scripts/clust.rand.rb +0 -102
  169. data/utils/enveomics/Scripts/gi2tax.rb +0 -103
  170. data/utils/enveomics/Scripts/in_silico_GA_GI.pl +0 -96
  171. data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
  172. data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
  173. data/utils/enveomics/Scripts/lib/enveomics.R +0 -1
  174. data/utils/enveomics/Scripts/lib/enveomics_rb/anir.rb +0 -293
  175. data/utils/enveomics/Scripts/lib/enveomics_rb/bm_set.rb +0 -175
  176. data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +0 -24
  177. data/utils/enveomics/Scripts/lib/enveomics_rb/errors.rb +0 -17
  178. data/utils/enveomics/Scripts/lib/enveomics_rb/gmm_em.rb +0 -30
  179. data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +0 -253
  180. data/utils/enveomics/Scripts/lib/enveomics_rb/match.rb +0 -88
  181. data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +0 -182
  182. data/utils/enveomics/Scripts/lib/enveomics_rb/rbm.rb +0 -49
  183. data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +0 -74
  184. data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +0 -237
  185. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/rand.rb +0 -31
  186. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/sample.rb +0 -152
  187. data/utils/enveomics/Scripts/lib/enveomics_rb/stats.rb +0 -3
  188. data/utils/enveomics/Scripts/lib/enveomics_rb/utils.rb +0 -74
  189. data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +0 -135
  190. data/utils/enveomics/Scripts/ogs.annotate.rb +0 -88
  191. data/utils/enveomics/Scripts/ogs.core-pan.rb +0 -160
  192. data/utils/enveomics/Scripts/ogs.extract.rb +0 -125
  193. data/utils/enveomics/Scripts/ogs.mcl.rb +0 -186
  194. data/utils/enveomics/Scripts/ogs.rb +0 -104
  195. data/utils/enveomics/Scripts/ogs.stats.rb +0 -131
  196. data/utils/enveomics/Scripts/rbm-legacy.rb +0 -172
  197. data/utils/enveomics/Scripts/rbm.rb +0 -108
  198. data/utils/enveomics/Scripts/sam.filter.rb +0 -148
  199. data/utils/enveomics/Tests/Makefile +0 -10
  200. data/utils/enveomics/Tests/Mgen_M2288.faa +0 -3189
  201. data/utils/enveomics/Tests/Mgen_M2288.fna +0 -8282
  202. data/utils/enveomics/Tests/Mgen_M2321.fna +0 -8288
  203. data/utils/enveomics/Tests/Nequ_Kin4M.faa +0 -2970
  204. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
  205. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +0 -7
  206. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +0 -17
  207. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +0 -137
  208. data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +0 -123
  209. data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +0 -200
  210. data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +0 -55
  211. data/utils/enveomics/Tests/alkB.nwk +0 -1
  212. data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +0 -13
  213. data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +0 -17
  214. data/utils/enveomics/Tests/hiv1.faa +0 -59
  215. data/utils/enveomics/Tests/hiv1.fna +0 -134
  216. data/utils/enveomics/Tests/hiv2.faa +0 -70
  217. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +0 -233
  218. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +0 -1
  219. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +0 -233
  220. data/utils/enveomics/Tests/phyla_counts.tsv +0 -10
  221. data/utils/enveomics/Tests/primate_lentivirus.ogs +0 -11
  222. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +0 -9
  223. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +0 -8
  224. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +0 -6
  225. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +0 -9
  226. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +0 -6
  227. data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +0 -6
  228. data/utils/enveomics/build_enveomics_r.bash +0 -45
  229. data/utils/enveomics/enveomics.R/DESCRIPTION +0 -31
  230. data/utils/enveomics/enveomics.R/NAMESPACE +0 -39
  231. data/utils/enveomics/enveomics.R/R/autoprune.R +0 -155
  232. data/utils/enveomics/enveomics.R/R/barplot.R +0 -184
  233. data/utils/enveomics/enveomics.R/R/cliopts.R +0 -135
  234. data/utils/enveomics/enveomics.R/R/df2dist.R +0 -154
  235. data/utils/enveomics/enveomics.R/R/growthcurve.R +0 -331
  236. data/utils/enveomics/enveomics.R/R/prefscore.R +0 -79
  237. data/utils/enveomics/enveomics.R/R/recplot.R +0 -354
  238. data/utils/enveomics/enveomics.R/R/recplot2.R +0 -1631
  239. data/utils/enveomics/enveomics.R/R/tribs.R +0 -583
  240. data/utils/enveomics/enveomics.R/R/utils.R +0 -80
  241. data/utils/enveomics/enveomics.R/README.md +0 -81
  242. data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
  243. data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
  244. data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +0 -16
  245. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +0 -16
  246. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +0 -16
  247. data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +0 -25
  248. data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +0 -46
  249. data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +0 -23
  250. data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +0 -47
  251. data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +0 -23
  252. data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +0 -23
  253. data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +0 -40
  254. data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +0 -103
  255. data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +0 -67
  256. data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +0 -24
  257. data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +0 -19
  258. data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +0 -45
  259. data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +0 -44
  260. data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +0 -47
  261. data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +0 -75
  262. data/utils/enveomics/enveomics.R/man/enve.prefscore.Rd +0 -50
  263. data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +0 -44
  264. data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +0 -139
  265. data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +0 -45
  266. data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +0 -24
  267. data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +0 -77
  268. data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +0 -25
  269. data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +0 -21
  270. data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +0 -19
  271. data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +0 -19
  272. data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +0 -47
  273. data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +0 -29
  274. data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +0 -18
  275. data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +0 -45
  276. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +0 -36
  277. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +0 -19
  278. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +0 -19
  279. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +0 -27
  280. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +0 -52
  281. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +0 -17
  282. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +0 -51
  283. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +0 -43
  284. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +0 -82
  285. data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +0 -59
  286. data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +0 -27
  287. data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +0 -36
  288. data/utils/enveomics/enveomics.R/man/enve.selvector.Rd +0 -23
  289. data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +0 -68
  290. data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +0 -28
  291. data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +0 -27
  292. data/utils/enveomics/enveomics.R/man/growth.curves.Rd +0 -14
  293. data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +0 -13
  294. data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +0 -78
  295. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +0 -46
  296. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +0 -45
  297. data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +0 -125
  298. data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +0 -19
  299. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +0 -19
  300. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +0 -19
  301. data/utils/enveomics/globals.mk +0 -8
  302. data/utils/enveomics/manifest.json +0 -9
  303. data/utils/multitrim/Multitrim How-To.pdf +0 -0
  304. data/utils/multitrim/README.md +0 -67
  305. data/utils/multitrim/multitrim.py +0 -1555
  306. data/utils/multitrim/multitrim.yml +0 -13
@@ -1,790 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "BlastTab.addlen.rb",
5
- "description": ["Appends an extra column to a tabular BLAST with the",
6
- "length of the query or the subject sequence."],
7
- "help_arg": "--help",
8
- "options": [
9
- {
10
- "opt": "--fasta",
11
- "arg": "in_file",
12
- "description": "FastA file of the query or the subject.",
13
- "mandatory": true
14
- },
15
- {
16
- "opt": "--subject",
17
- "description": ["Use the subject column of the BLAST, by default the",
18
- "query column is used."],
19
- "note": "If used, the input FastA must contain subject sequences."
20
- },
21
- {
22
- "opt": "--quiet",
23
- "description": "Run quietly (no STDERR output)."
24
- },
25
- "<",
26
- {
27
- "arg": "in_file",
28
- "description": "Input tabular BLAST file.",
29
- "mandatory": true
30
- },
31
- ">",
32
- {
33
- "arg": "out_file",
34
- "description": "Output tabular BLAST file with additional column.",
35
- "mandatory": true
36
- }
37
- ]
38
- },
39
- {
40
- "task": "BlastTab.advance.bash",
41
- "description": ["Calculates the percentage of a partial BLAST result.",
42
- "The value produced slightly subestimates the actual advance, due to",
43
- "un-flushed output and trailing queries that could be processed but",
44
- "generate no results."],
45
- "help_arg": "",
46
- "requires": [ { "interpreter": "awk" } ],
47
- "options": [
48
- {
49
- "name": "Blast",
50
- "arg": "in_file",
51
- "description": "Incomplete Tabular BLAST output.",
52
- "mandatory": true
53
- },
54
- {
55
- "name": "Query FastA",
56
- "arg": "in_file",
57
- "description": "FastA file with query sequences.",
58
- "mandatory": true
59
- }
60
- ]
61
- },
62
- {
63
- "task": "BlastTab.best_hit_sorted.pl",
64
- "description": "Filters a tabular BLAST to retain only the best matches.",
65
- "help_arg": "--help",
66
- "see_also": ["BlastTab.topHits_sorted.rb"],
67
- "options": [
68
- {
69
- "name": "Sort",
70
- "arg": "select",
71
- "values": ["sort","cat"],
72
- "mandatory": true,
73
- "description": ["Use 'sort' if your BLAST is not pre-sorted by the",
74
- "first column (or if you're not sure). Use 'cat' otherwise."]
75
- },
76
- {
77
- "name": "Input BLAST",
78
- "arg": "in_file",
79
- "multiple_sep": " ",
80
- "mandatory": true,
81
- "description": "Tabular BLAST file to filter."
82
- },
83
- "|",
84
- { "arg": "task" },
85
- ">",
86
- {
87
- "name": "Output BLAST",
88
- "arg": "out_file",
89
- "mandatory": true,
90
- "description": "Filetered tabular BLAST output."
91
- }
92
- ]
93
- },
94
- {
95
- "task": "BlastTab.catsbj.pl",
96
- "description": ["Generates a list of hits from a BLAST result",
97
- "concatenating the subject sequences. This can be used, e.g., to",
98
- "analyze BLAST results against draft genomes. This script creates two",
99
- "files using <map.bls> as prefix with extensions .rec (for the",
100
- "recruitment plot) and .lim (for the limits of the different sequences",
101
- "in <seq.fa>)."],
102
- "see_also": ["BlastTab.recplot2.R", "GFF.catsbj.pl"],
103
- "help_arg": "-h",
104
- "options": [
105
- {
106
- "opt": "-i",
107
- "name": "Identity",
108
- "description": "Minimum identity (in %) to report a result.",
109
- "arg": "float",
110
- "default": 70.0
111
- },
112
- {
113
- "opt": "-l",
114
- "name": "Length",
115
- "description": "Minimum alignment length to report a result.",
116
- "default": 60.0,
117
- "arg": "float"
118
- },
119
- {
120
- "opt": "-s",
121
- "name": "Subset",
122
- "description": ["The FastA provided is to be treated as a subset of",
123
- "the subject. By default, it expects all the BLAST subjects to be",
124
- "present in the FastA."]
125
- },
126
- {
127
- "opt": "-q",
128
- "name": "Quiet",
129
- "description": "Run quietly."
130
- },
131
- {
132
- "name": "seq.fa",
133
- "description": "Subject sequences (ref) in FastA format.",
134
- "mandatory": true,
135
- "arg": "in_file"
136
- },
137
- {
138
- "name": "map.bls",
139
- "description": ["Mapping of the reads to the reference in Tabular",
140
- "BLAST format."],
141
- "mandatory": true,
142
- "arg": "in_file"
143
- }
144
- ]
145
- },
146
- {
147
- "task": "BlastTab.cogCat.rb",
148
- "description": ["Replaces the COG gene IDs in a BLAST for the COG",
149
- "category."],
150
- "help_arg": "--help",
151
- "options": [
152
- {
153
- "opt": "--whog",
154
- "arg": "in_file",
155
- "mandatory": true,
156
- "description": "COG's 'whog' file."
157
- },
158
- {
159
- "opt": "--blast",
160
- "arg": "in_file",
161
- "mandatory": true,
162
- "description": "Tabular BLAST file with COG IDs as subject."
163
- },
164
- {
165
- "opt": "--cog",
166
- "description": "If set, returns the COG ID, not the COG category."
167
- },
168
- {
169
- "opt": "--desc",
170
- "description": "Includes COG description (requires --cog)."
171
- },
172
- {
173
- "opt": "--noverbose",
174
- "description": "Run quietly, but show warnings."
175
- },
176
- {
177
- "opt": "--quiet",
178
- "description": "Run quietly."
179
- },
180
- ">",
181
- {
182
- "arg": "out_file",
183
- "name": "COG Blast",
184
- "mandatory": true,
185
- "description": "Tabular BLAST with COG ID's or categories as subject."
186
- }
187
- ]
188
- },
189
- {
190
- "task": "BlastTab.filter.pl",
191
- "description": ["Extracts a subset of hits (queries or subjects) from a",
192
- "tabular BLAST."],
193
- "help_arg": "",
194
- "see_also": "BlastTab.subsample.pl",
195
- "options": [
196
- {
197
- "name": "Subject",
198
- "opt": "-s",
199
- "description": ["If set, assumes that list.txt contains subject IDs.",
200
- "By default: assumes query IDs."]
201
- },
202
- {
203
- "name": "Inverse",
204
- "opt": "-i",
205
- "description": ["If set, reports the inverse of the list (i.e.,",
206
- "reports only hits absent in the list)."]
207
- },
208
- {
209
- "name": "list.txt",
210
- "arg": "in_file",
211
- "mandatory": true,
212
- "description": "List of IDs to extract."
213
- },
214
- {
215
- "name": "blast.txt",
216
- "arg": "in_file",
217
- "mandatory": true,
218
- "description": "Tabular BLAST file containing the superset of hits."
219
- },
220
- ">",
221
- {
222
- "name": "subset.txt",
223
- "arg": "out_file",
224
- "mandatory": true,
225
- "description": "Tabulat BLAST file to be created."
226
- }
227
- ]
228
- },
229
- {
230
- "task": "BlastTab.pairedHits.rb",
231
- "description": "Identifies the best hits of paired-reads.",
232
- "help_arg": "--help",
233
- "options": [
234
- {
235
- "opt": "--blast",
236
- "arg": "in_file",
237
- "mandatory": true,
238
- "description": "Input Tabular BLAST file.",
239
- "note": ["This script assumes that paired hits are next to each",
240
- "other. If this is not the case (e.g., because the blast was",
241
- "concatenated), you must sort the input before running this",
242
- "script."]
243
- },
244
- {
245
- "name": "Min score",
246
- "opt": "--minscore",
247
- "arg": "float",
248
- "default": 0.0,
249
- "description": "Minimum (summed) Bit-Score to consider a pair-match."
250
- },
251
- {
252
- "name": "Best hits",
253
- "opt": "--besthits",
254
- "arg": "integer",
255
- "default": 0,
256
- "description": ["Outputs top best-hits only (use 0 to output all the",
257
- "paired hits)."]
258
- },
259
- {
260
- "name": "Orientation",
261
- "opt": "--orient",
262
- "arg": "select",
263
- "values": [0,1,2,3,4],
264
- "default": 0,
265
- "description": ["Checks the orientation of the hit. Values are: 0,",
266
- "no checking; 1, same direction; 2, inwards; 3, outwards; 4,",
267
- "different direction (i.e., 2 or 3)."]
268
- },
269
- {
270
- "name": "Sister prefix",
271
- "opt": "--sisprefix",
272
- "arg": "string",
273
- "default": "_",
274
- "description": ["Sister read number prefix in the name of the reads.",
275
- "Escape characters as dots (\\.), parenthesis (\\(, \\), \\[,",
276
- "\\]), other characters with special meaning in regular",
277
- "expressions (\\*, \\+, \\^, \\$, \\|). This prefix allows regular",
278
- "expressions (for example, use ':|\\.' to use any of colon or",
279
- "dot). Note that the prefix will not be included in the base name",
280
- "reported in the output."]
281
- },
282
- ">",
283
- {
284
- "arg": "out_file",
285
- "mandatory": true,
286
- "description": ["Tab-delimited flat file, with the following",
287
- "columns: (1) Query ID (without the \"sister\" identifier). (2)",
288
- "Subject ID. (3) Bit score (summed from both sister reads). (4/5)",
289
- "From/To (subject) coordinates for read 1. (6/7) From/To (subject)",
290
- "coordinates for read 2. (8) Reads orientation (1: same direction,",
291
- "2: inwards, 3: outwards). (9) Estimated insert size."]
292
- }
293
- ]
294
- },
295
- {
296
- "task": "BlastTab.seqdepth.pl",
297
- "description": "Estimates the sequencing depth of subject sequences.",
298
- "help_arg": "",
299
- "see_also": ["BlastTab.seqdepth_ZIP.pl", "BlastTab.seqdepth_nomedian.pl",
300
- "BedGraph.tad.rb"],
301
- "options": [
302
- "cat",
303
- {
304
- "arg": "in_file",
305
- "multiple_sep": " ",
306
- "mandatory": true,
307
- "description": ["One or more Tabular BLAST files of reads vs genes",
308
- "(or contigs)."]
309
- },
310
- "|",
311
- { "arg": "task" },
312
- {
313
- "name": "genes_or_ctgs.fna",
314
- "arg": "in_file",
315
- "mandatory": true,
316
- "description": ["A FastA file containing the genes or the contigs",
317
- "(db)."]
318
- },
319
- ">",
320
- {
321
- "name": "genes_or_ctgs.cov",
322
- "arg": "out_file",
323
- "mandatory": true,
324
- "description": ["A tab-delimited file with the following columns:",
325
- "(1) Subject ID. (2) Average sequencing depth. (3) Median",
326
- "sequencing depth. (4) Number of mapped reads. (5) Length of the",
327
- "subject sequence."]
328
- }
329
- ]
330
- },
331
- {
332
- "task": "BlastTab.seqdepth_ZIP.pl",
333
- "description": ["Estimates the average sequencing depth of subject",
334
- "sequences (genes or contigs) assuming a Zero-Inflated Poisson",
335
- "distribution (ZIP) to correct for non-covered positions. It uses the",
336
- "corrected method of moments estimators (CMMEs) as described by",
337
- "Beckett et al [1]. Note that [1] has a mistake in eq. (2.4), that",
338
- "should be: pi-hat-MM = 1 - (X-bar / lambda-hat-MM). Also note that a",
339
- "more elaborated mixture distribution can arise from coverage",
340
- "histograms (e.g., see [2] for an additional correction called 'tail",
341
- "distribution' and mixtures involving negative binomial) so take these",
342
- "results cum grano salis.\n [1]",
343
- "http://anisette.ucs.louisiana.edu/Academic/Sciences/MATH/stage/stat2012.pdf\n",
344
- "[2] Lindner et al, Bioinformatics, 2013."],
345
- "help_arg": "",
346
- "see_also": ["BlastTab.seqdepth.pl", "BlastTab.seqdepth_nomedian.pl",
347
- "BedGraph.tad.rb"],
348
- "options": [
349
- "cat",
350
- {
351
- "name": "blast",
352
- "arg": "in_file",
353
- "multiple_sep": " ",
354
- "mandatory": true,
355
- "description": ["One or more Tabular BLAST files of reads vs genes",
356
- "(or contigs)."]
357
- },
358
- "|",
359
- { "arg": "task" },
360
- {
361
- "name": "genes_or_ctgs.fna",
362
- "arg": "in_file",
363
- "mandatory": true,
364
- "description": ["A FastA file containing the genes or the contigs",
365
- "(db)."]
366
- },
367
- ">",
368
- {
369
- "name": "genes_or_ctgs.cov",
370
- "arg": "out_file",
371
- "mandatory": true,
372
- "description": ["Output file with the following columns:",
373
- "(1) Subject ID.",
374
- "(2) Estimated average sequencing depth (CMME lambda).",
375
- "(3) Zero-inflation (CMME pi).",
376
- "(4) Observed average sequencing depth.",
377
- "(5) Observed median sequencing depth.",
378
- "(6) Observed median sequencing depth excluding zeroes.",
379
- "(7) Number of mapped reads.",
380
- "(8) Length of the subject sequence."]
381
- }
382
- ]
383
- },
384
- {
385
- "task": "BlastTab.seqdepth_nomedian.pl",
386
- "description": ["Estimates the sequencing depth of subject",
387
- "sequences. The values reported by this script may differ from those",
388
- "of BlastTab.seqdepth.pl, because this script uses the aligned length",
389
- "of the read while BlastTab.seqdepth.pl uses the aligned length of the",
390
- "subject sequence."],
391
- "help_arg": "",
392
- "see_also": ["BlastTab.seqdepth.pl", "BlastTab.seqdepth_ZIP.pl"],
393
- "options": [
394
- "cat",
395
- {
396
- "arg": "in_file",
397
- "multiple_sep": " ",
398
- "mandatory": true,
399
- "description": ["One or more Tabular BLAST files of reads vs genes",
400
- "(or contigs)."]
401
- },
402
- "|",
403
- { "arg": "task" },
404
- {
405
- "name": "genes_or_ctgs.fna",
406
- "arg": "in_file",
407
- "mandatory": true,
408
- "description": ["A FastA file containing the genes or the contigs",
409
- "(db)."]
410
- },
411
- ">",
412
- {
413
- "name": "genes_or_ctgs.cov",
414
- "arg": "out_file",
415
- "mandatory": true,
416
- "description": ["A tab-delimited file with the following columns:",
417
- "(1) Subject ID. (2) Average sequencing depth. (3) Number of",
418
- "mapped reads. (4) Length of the subject sequence."]
419
- }
420
- ]
421
- },
422
- {
423
- "task": "BlastTab.subsample.pl",
424
- "description": ["Filters a BLAST output including only the hits produced",
425
- "by any of the given sequences as query."],
426
- "help_arg": "",
427
- "see_also": "BlastTab.filter.pl",
428
- "options": [
429
- {
430
- "name": "blast.tab",
431
- "mandatory": true,
432
- "arg": "in_file",
433
- "description": "BLAST output to be filtered (tabular format)."
434
- },
435
- {
436
- "name": "sample.fa",
437
- "mandatory": true,
438
- "arg": "in_file",
439
- "description": "Sequences to use as query (FastA format)."
440
- },
441
- ">",
442
- {
443
- "arg": "out_file",
444
- "mandatory": true,
445
- "description": "The filtered BLAST output (tabular format)."
446
- }
447
- ]
448
- },
449
- {
450
- "task": "BlastTab.sumPerHit.pl",
451
- "description": ["Sums the weights of all the queries hitting each",
452
- "subject. Often (but not necessarily) the BLAST files contain only",
453
- "best matches. The weights can be any number, but a common use of this",
454
- "Script is to add up counts (weights are integers). For example, in a",
455
- "BLAST of predicted genes vs some annotation source, the weights could",
456
- "be the number of reads recruited by each gene."],
457
- "help_arg": "-h",
458
- "options": [
459
- {
460
- "name": "Weights file",
461
- "opt": "-w",
462
- "arg": "in_file",
463
- "description": ["A two-columns tab-delimited file containing the",
464
- "the name (column 1) and the weight (column 2) of each query."]
465
- },
466
- {
467
- "name": "Minimum score",
468
- "opt": "-s",
469
- "arg": "float",
470
- "default": 0.0
471
- },
472
- {
473
- "name": "Minimum identity (%)",
474
- "opt": "-i",
475
- "arg": "float",
476
- "default": 0.0
477
- },
478
- {
479
- "name": "Queries",
480
- "opt": "-m",
481
- "arg": "integer",
482
- "default": 0,
483
- "description": "Maximum number of queries. Set to 0 for all."
484
- },
485
- {
486
- "name": "Normalize",
487
- "opt": "-n",
488
- "description": "Normalize weights by the number of hits per query."
489
- },
490
- {
491
- "name": "Include zeroes",
492
- "opt": "-z",
493
- "description": ["Add zero when weight is not found (by default:",
494
- "doesn't list them)."]
495
- },
496
- {
497
- "name": "Run quietly",
498
- "opt": "-q"
499
- },
500
- {
501
- "name": "blast",
502
- "arg": "in_file",
503
- "multiple_sep": " ",
504
- "mandatory": true,
505
- "description": "One or more BLAST files."
506
- },
507
- ">",
508
- {
509
- "arg": "out_file",
510
- "mandatory": true,
511
- "description": ["A two-columns tab-delimited file containing the",
512
- "summed weights per hit."]
513
- }
514
- ]
515
- },
516
- {
517
- "task": "BlastTab.taxid2taxrank.pl",
518
- "description": ["Takes a BLAST with NCBI Taxonomy IDs as subjects and",
519
- "replaces them by names at a given taxonomic rank."],
520
- "help_arg": "",
521
- "options": [
522
- {
523
- "name": "tax_blast.txt",
524
- "mandatory": true,
525
- "arg": "in_file",
526
- "description": ["BLAST output, where subject IDs are NCBI Taxonomy",
527
- "IDs."]
528
- },
529
- {
530
- "name": "nodes.dmp",
531
- "mandatory": true,
532
- "arg": "in_file",
533
- "description": "Nodes file from NCBI Taxonomy.",
534
- "source_url": "ftp://ftp.ncbi.nih.gov/pub/taxonomy/taxdump.tar.gz"
535
- },
536
- {
537
- "name": "names.dmp",
538
- "mandatory": true,
539
- "arg": "in_file",
540
- "description": "Names file from NCBI Taxonomy.",
541
- "source_url": "ftp://ftp.ncbi.nih.gov/pub/taxonomy/taxdump.tar.gz"
542
- },
543
- {
544
- "name": "rank",
545
- "arg": "string",
546
- "mandatory": true,
547
- "default": "genus",
548
- "description": ["The rank to be reported. All the reported nodes",
549
- "will have the same rank. To see supported values, run:\n",
550
- "`cut -f 5 nodes.dmp | sort -u`."]
551
- },
552
- {
553
- "name": "Best-hit",
554
- "arg": "select",
555
- "values": ["yes", "no"],
556
- "default": "yes",
557
- "description": ["Should it take into account the best hit per query",
558
- "only? This is: should it filter by best-hit?"]
559
- },
560
- ">",
561
- {
562
- "name": "taxrank_list.txt",
563
- "arg": "out_file",
564
- "mandatory": true,
565
- "description": ["BLAST-like output, where subject IDs are Taxonomy",
566
- "names."]
567
- }
568
- ]
569
- },
570
- {
571
- "task": "BlastTab.topHits_sorted.rb",
572
- "description": "Reports the top-N best hits of a BLAST.",
573
- "help_arg": "--help",
574
- "see_also": "BlastTab.best_hit_sorted.pl",
575
- "options": [
576
- {
577
- "name": "Sort",
578
- "arg": "select",
579
- "values": ["sort","cat"],
580
- "mandatory": true,
581
- "description": ["Use 'sort' if your BLAST is not pre-sorted by the",
582
- "first column (or if you're not sure). Use 'cat' otherwise."]
583
- },
584
- {
585
- "arg": "in_file",
586
- "mandatory": true,
587
- "description": "Tabular BLAST file."
588
- },
589
- "|",
590
- { "arg": "task" },
591
- "--blast",
592
- "-",
593
- {
594
- "name": "Output",
595
- "opt": "--out",
596
- "arg": "out_file",
597
- "mandatory": true,
598
- "description": [
599
- "Output filtered BLAST file.",
600
- "Supports compression with .gz extension."
601
- ]
602
- },
603
- {
604
- "opt": "--top",
605
- "arg": "integer",
606
- "default": 5,
607
- "description": "Maximum number of hits to report for each query."
608
- },
609
- {
610
- "opt": "--sort-by",
611
- "arg": "select",
612
- "values": ["bitscore", "evalue", "identity", "length", "no"],
613
- "default": "bitscore",
614
- "description": "Parameter used to detect the 'best' hits."
615
- },
616
- {
617
- "opt": "--quiet",
618
- "description": "Run quietly."
619
- }
620
- ]
621
- },
622
- {
623
- "task": "BlastTab.recplot2.R",
624
- "description": ["Produce recruitment plot objects provided that",
625
- "BlastTab.catsbj.pl has been previously executed."],
626
- "help_arg": "--help",
627
- "requires": [
628
- { "r_package": "optparse" },
629
- { "r_package": "enveomics.R" }
630
- ],
631
- "see_also": ["BlastTab.catsbj.pl", "GFF.catsbj.pl",
632
- "RecPlot2.compareIdentities.R"],
633
- "options": [
634
- {
635
- "opt": "--prefix",
636
- "arg": "in_file",
637
- "mandatory": true,
638
- "description": ["Path to the prefix of the BlastTab.catsbj.pl output",
639
- "files. At least the files .rec and .lim must exist with this",
640
- "prefix."]
641
- },
642
- {
643
- "opt": "--pos-breaks",
644
- "arg": "integer",
645
- "default": 1000,
646
- "description": "Breaks in the positions histogram."
647
- },
648
- {
649
- "opt": "--pos-breaks-tsv",
650
- "arg": "in_file",
651
- "description": ["File with (absolute) coordinates of breaks in the",
652
- "position histogram."]
653
- },
654
- {
655
- "opt": "--id-breaks",
656
- "arg": "integer",
657
- "default": 300,
658
- "description": ["Breaks in the identity histogram."]
659
- },
660
- {
661
- "opt": "--id-free-range",
662
- "description": ["Indicates that the range should be freely set from",
663
- "the observed values. Otherwise, 70-100% is included in the",
664
- "identity histogram (default)."]
665
- },
666
- {
667
- "opt": "--id-metric",
668
- "arg": "select",
669
- "values": ["identity", "corrected identity", "bit score"],
670
- "default": "identity",
671
- "description": ["Metric of identity to be used (Y-axis). Corrected",
672
- "identity is only supported if the original BLAST file included",
673
- "sequence lengths."]
674
- },
675
- {
676
- "opt": "--id-summary",
677
- "arg": "string",
678
- "default": "sum",
679
- "description": "Function summarizing the identity bins."
680
- },
681
- {
682
- "opt": "--id-cutoff",
683
- "arg": "float",
684
- "default": 95.0,
685
- "description": ["Cutoff of identity metric above which the hits are",
686
- "considered 'in-group'. The 95% identity corresponds to the",
687
- "expectation of ANI<95% within species."]
688
- },
689
- {
690
- "opt": "--threads",
691
- "arg": "integer",
692
- "default": 2,
693
- "description": "Number of threads to use."
694
- },
695
- {
696
- "opt": "--no-verbose",
697
- "description": "Indicates if the function should report the advance."
698
- },
699
- {
700
- "opt": "--peaks-col",
701
- "arg": "string",
702
- "default": "NA",
703
- "description": ["Color of peaks, mandatory for peak-finding (e.g.,",
704
- "darkred)."]
705
- },
706
- {
707
- "opt": "--peaks-method",
708
- "arg": "select",
709
- "values": ["emauto","em","mower"],
710
- "default": "emauto",
711
- "description": "Method to detect peaks."
712
- },
713
- {
714
- "name": "R Object Output",
715
- "arg": "out_file",
716
- "mandatory": true,
717
- "description": ["Recplo2 object that can be re-plotted using",
718
- "R function plot."]
719
- },
720
- {
721
- "name": "Graphical Output",
722
- "arg": "out_file",
723
- "description": "Recruitment plot in PDF."
724
- },
725
- {
726
- "name": "Width",
727
- "arg": "float",
728
- "description": "Width of the plot in inches (7 by default)."
729
- },
730
- {
731
- "name": "Height",
732
- "arg": "float",
733
- "description": "Height of the plot in inches (7 by default)."
734
- }
735
- ]
736
- },
737
- {
738
- "task": "RecPlot2.compareIdentities.R",
739
- "description": ["Calculates the difference between identity",
740
- "distributions of two recruitment plots."],
741
- "help_arg": "--help",
742
- "requires": [
743
- { "r_package": "optparse" },
744
- { "r_package": "enveomics.R" }
745
- ],
746
- "see_also": [ "BlastTab.recplot2.R" ],
747
- "options": [
748
- {
749
- "opt": "--method",
750
- "arg": "string",
751
- "default": "hellinger",
752
- "description": ["Distance method to use. This should be (an",
753
- "unambiguous abbreviation of) one of:",
754
- "'hellinger' (Hellinger, 1090, doi:10.1515/crll.1909.136.210),",
755
- "'bhattacharyya' (Bhattacharyya, 1943, Bull. Calcutta Math. Soc.",
756
- "35), 'kl' or 'kullback–leibler' (Kullback & Leibler, 1951,",
757
- "doi:10.1214/aoms/1177729694), or 'euclidean'."]
758
- },
759
- {
760
- "opt": "--pseudocounts",
761
- "arg": "float",
762
- "default": 0.0,
763
- "description": ["Smoothing parameter for Laplace smoothing. Use 0",
764
- "for no smoothing, or 1 for add-one smoothing."]
765
- },
766
- {
767
- "opt": "--max-deviation",
768
- "arg": "float",
769
- "description": ["Maximum mean deviation between identity breaks",
770
- "tolerated (as percent identity). Difference in number of",
771
- "id.breaks is never tolerated."]
772
- },
773
- {
774
- "arg": "in_file",
775
- "name": "RecPlot A",
776
- "mandatory": true,
777
- "description": ["File containing the R object `rp` for the first",
778
- "recruitment plot."]
779
- },
780
- {
781
- "arg": "in_file",
782
- "name": "RecPlot B",
783
- "mandatory": true,
784
- "description": ["File containing the R object `rp` for the second",
785
- "recruitment plot."]
786
- }
787
- ]
788
- }
789
- ]
790
- }