miga-base 1.2.15.2 → 1.2.15.3

Sign up to get free protection for your applications and to get access to all the features.
Files changed (304) hide show
  1. checksums.yaml +4 -4
  2. data/lib/miga/cli/action/download/gtdb.rb +4 -1
  3. data/lib/miga/cli/action/gtdb_get.rb +4 -0
  4. data/lib/miga/remote_dataset/download.rb +3 -2
  5. data/lib/miga/remote_dataset.rb +25 -7
  6. data/lib/miga/taxonomy.rb +6 -0
  7. data/lib/miga/version.rb +2 -2
  8. metadata +6 -302
  9. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Archaea_SCG.hmm +0 -41964
  10. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Bacteria_SCG.hmm +0 -32439
  11. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Complete_SCG_DB.hmm +0 -62056
  12. data/utils/FastAAI/FastAAI +0 -3659
  13. data/utils/FastAAI/FastAAI-legacy/FastAAI +0 -1336
  14. data/utils/FastAAI/FastAAI-legacy/kAAI_v1.0_virus.py +0 -1296
  15. data/utils/FastAAI/README.md +0 -84
  16. data/utils/enveomics/Docs/recplot2.md +0 -244
  17. data/utils/enveomics/Examples/aai-matrix.bash +0 -66
  18. data/utils/enveomics/Examples/ani-matrix.bash +0 -66
  19. data/utils/enveomics/Examples/essential-phylogeny.bash +0 -105
  20. data/utils/enveomics/Examples/unus-genome-phylogeny.bash +0 -100
  21. data/utils/enveomics/LICENSE.txt +0 -73
  22. data/utils/enveomics/Makefile +0 -52
  23. data/utils/enveomics/Manifest/Tasks/aasubs.json +0 -103
  24. data/utils/enveomics/Manifest/Tasks/blasttab.json +0 -790
  25. data/utils/enveomics/Manifest/Tasks/distances.json +0 -161
  26. data/utils/enveomics/Manifest/Tasks/fasta.json +0 -802
  27. data/utils/enveomics/Manifest/Tasks/fastq.json +0 -291
  28. data/utils/enveomics/Manifest/Tasks/graphics.json +0 -126
  29. data/utils/enveomics/Manifest/Tasks/mapping.json +0 -137
  30. data/utils/enveomics/Manifest/Tasks/ogs.json +0 -382
  31. data/utils/enveomics/Manifest/Tasks/other.json +0 -906
  32. data/utils/enveomics/Manifest/Tasks/remote.json +0 -355
  33. data/utils/enveomics/Manifest/Tasks/sequence-identity.json +0 -650
  34. data/utils/enveomics/Manifest/Tasks/tables.json +0 -308
  35. data/utils/enveomics/Manifest/Tasks/trees.json +0 -68
  36. data/utils/enveomics/Manifest/Tasks/variants.json +0 -111
  37. data/utils/enveomics/Manifest/categories.json +0 -165
  38. data/utils/enveomics/Manifest/examples.json +0 -162
  39. data/utils/enveomics/Manifest/tasks.json +0 -4
  40. data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +0 -69
  41. data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +0 -1
  42. data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +0 -1
  43. data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +0 -1
  44. data/utils/enveomics/Pipelines/assembly.pbs/README.md +0 -189
  45. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +0 -112
  46. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +0 -23
  47. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +0 -44
  48. data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +0 -50
  49. data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +0 -37
  50. data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +0 -68
  51. data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +0 -49
  52. data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +0 -80
  53. data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +0 -57
  54. data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +0 -63
  55. data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +0 -38
  56. data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +0 -73
  57. data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +0 -21
  58. data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +0 -72
  59. data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +0 -98
  60. data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +0 -1
  61. data/utils/enveomics/Pipelines/blast.pbs/README.md +0 -127
  62. data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +0 -109
  63. data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +0 -128
  64. data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +0 -16
  65. data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +0 -22
  66. data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +0 -26
  67. data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +0 -89
  68. data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +0 -29
  69. data/utils/enveomics/Pipelines/idba.pbs/README.md +0 -49
  70. data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +0 -95
  71. data/utils/enveomics/Pipelines/idba.pbs/run.pbs +0 -56
  72. data/utils/enveomics/Pipelines/trim.pbs/README.md +0 -54
  73. data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +0 -70
  74. data/utils/enveomics/Pipelines/trim.pbs/run.pbs +0 -130
  75. data/utils/enveomics/README.md +0 -42
  76. data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +0 -171
  77. data/utils/enveomics/Scripts/Aln.cat.rb +0 -221
  78. data/utils/enveomics/Scripts/Aln.convert.pl +0 -35
  79. data/utils/enveomics/Scripts/AlphaDiversity.pl +0 -152
  80. data/utils/enveomics/Scripts/BedGraph.tad.rb +0 -93
  81. data/utils/enveomics/Scripts/BedGraph.window.rb +0 -71
  82. data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +0 -102
  83. data/utils/enveomics/Scripts/BlastTab.addlen.rb +0 -63
  84. data/utils/enveomics/Scripts/BlastTab.advance.bash +0 -48
  85. data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +0 -55
  86. data/utils/enveomics/Scripts/BlastTab.catsbj.pl +0 -104
  87. data/utils/enveomics/Scripts/BlastTab.cogCat.rb +0 -76
  88. data/utils/enveomics/Scripts/BlastTab.filter.pl +0 -47
  89. data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +0 -194
  90. data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +0 -104
  91. data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +0 -157
  92. data/utils/enveomics/Scripts/BlastTab.recplot2.R +0 -48
  93. data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +0 -86
  94. data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +0 -119
  95. data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +0 -86
  96. data/utils/enveomics/Scripts/BlastTab.subsample.pl +0 -47
  97. data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +0 -114
  98. data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +0 -90
  99. data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +0 -123
  100. data/utils/enveomics/Scripts/Chao1.pl +0 -97
  101. data/utils/enveomics/Scripts/CharTable.classify.rb +0 -234
  102. data/utils/enveomics/Scripts/EBIseq2tax.rb +0 -83
  103. data/utils/enveomics/Scripts/FastA.N50.pl +0 -60
  104. data/utils/enveomics/Scripts/FastA.extract.rb +0 -152
  105. data/utils/enveomics/Scripts/FastA.filter.pl +0 -52
  106. data/utils/enveomics/Scripts/FastA.filterLen.pl +0 -28
  107. data/utils/enveomics/Scripts/FastA.filterN.pl +0 -60
  108. data/utils/enveomics/Scripts/FastA.fragment.rb +0 -100
  109. data/utils/enveomics/Scripts/FastA.gc.pl +0 -42
  110. data/utils/enveomics/Scripts/FastA.interpose.pl +0 -93
  111. data/utils/enveomics/Scripts/FastA.length.pl +0 -38
  112. data/utils/enveomics/Scripts/FastA.mask.rb +0 -89
  113. data/utils/enveomics/Scripts/FastA.per_file.pl +0 -36
  114. data/utils/enveomics/Scripts/FastA.qlen.pl +0 -57
  115. data/utils/enveomics/Scripts/FastA.rename.pl +0 -65
  116. data/utils/enveomics/Scripts/FastA.revcom.pl +0 -23
  117. data/utils/enveomics/Scripts/FastA.sample.rb +0 -98
  118. data/utils/enveomics/Scripts/FastA.slider.pl +0 -85
  119. data/utils/enveomics/Scripts/FastA.split.pl +0 -55
  120. data/utils/enveomics/Scripts/FastA.split.rb +0 -79
  121. data/utils/enveomics/Scripts/FastA.subsample.pl +0 -131
  122. data/utils/enveomics/Scripts/FastA.tag.rb +0 -65
  123. data/utils/enveomics/Scripts/FastA.toFastQ.rb +0 -69
  124. data/utils/enveomics/Scripts/FastA.wrap.rb +0 -48
  125. data/utils/enveomics/Scripts/FastQ.filter.pl +0 -54
  126. data/utils/enveomics/Scripts/FastQ.interpose.pl +0 -90
  127. data/utils/enveomics/Scripts/FastQ.maskQual.rb +0 -89
  128. data/utils/enveomics/Scripts/FastQ.offset.pl +0 -90
  129. data/utils/enveomics/Scripts/FastQ.split.pl +0 -53
  130. data/utils/enveomics/Scripts/FastQ.tag.rb +0 -70
  131. data/utils/enveomics/Scripts/FastQ.test-error.rb +0 -81
  132. data/utils/enveomics/Scripts/FastQ.toFastA.awk +0 -24
  133. data/utils/enveomics/Scripts/GFF.catsbj.pl +0 -127
  134. data/utils/enveomics/Scripts/GenBank.add_fields.rb +0 -84
  135. data/utils/enveomics/Scripts/HMM.essential.rb +0 -351
  136. data/utils/enveomics/Scripts/HMM.haai.rb +0 -168
  137. data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +0 -83
  138. data/utils/enveomics/Scripts/JPlace.distances.rb +0 -88
  139. data/utils/enveomics/Scripts/JPlace.to_iToL.rb +0 -320
  140. data/utils/enveomics/Scripts/M5nr.getSequences.rb +0 -81
  141. data/utils/enveomics/Scripts/MeTaxa.distribution.pl +0 -198
  142. data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +0 -35
  143. data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +0 -49
  144. data/utils/enveomics/Scripts/NCBIacc2tax.rb +0 -92
  145. data/utils/enveomics/Scripts/Newick.autoprune.R +0 -27
  146. data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +0 -228
  147. data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +0 -32
  148. data/utils/enveomics/Scripts/RefSeq.download.bash +0 -48
  149. data/utils/enveomics/Scripts/SRA.download.bash +0 -55
  150. data/utils/enveomics/Scripts/TRIBS.plot-test.R +0 -36
  151. data/utils/enveomics/Scripts/TRIBS.test.R +0 -39
  152. data/utils/enveomics/Scripts/Table.barplot.R +0 -31
  153. data/utils/enveomics/Scripts/Table.df2dist.R +0 -30
  154. data/utils/enveomics/Scripts/Table.filter.pl +0 -61
  155. data/utils/enveomics/Scripts/Table.merge.pl +0 -77
  156. data/utils/enveomics/Scripts/Table.prefScore.R +0 -60
  157. data/utils/enveomics/Scripts/Table.replace.rb +0 -69
  158. data/utils/enveomics/Scripts/Table.round.rb +0 -63
  159. data/utils/enveomics/Scripts/Table.split.pl +0 -57
  160. data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +0 -227
  161. data/utils/enveomics/Scripts/VCF.KaKs.rb +0 -147
  162. data/utils/enveomics/Scripts/VCF.SNPs.rb +0 -88
  163. data/utils/enveomics/Scripts/aai.rb +0 -421
  164. data/utils/enveomics/Scripts/ani.rb +0 -362
  165. data/utils/enveomics/Scripts/anir.rb +0 -137
  166. data/utils/enveomics/Scripts/clust.rand.rb +0 -102
  167. data/utils/enveomics/Scripts/gi2tax.rb +0 -103
  168. data/utils/enveomics/Scripts/in_silico_GA_GI.pl +0 -96
  169. data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
  170. data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
  171. data/utils/enveomics/Scripts/lib/enveomics.R +0 -1
  172. data/utils/enveomics/Scripts/lib/enveomics_rb/anir.rb +0 -293
  173. data/utils/enveomics/Scripts/lib/enveomics_rb/bm_set.rb +0 -175
  174. data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +0 -24
  175. data/utils/enveomics/Scripts/lib/enveomics_rb/errors.rb +0 -17
  176. data/utils/enveomics/Scripts/lib/enveomics_rb/gmm_em.rb +0 -30
  177. data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +0 -253
  178. data/utils/enveomics/Scripts/lib/enveomics_rb/match.rb +0 -88
  179. data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +0 -182
  180. data/utils/enveomics/Scripts/lib/enveomics_rb/rbm.rb +0 -49
  181. data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +0 -74
  182. data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +0 -237
  183. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/rand.rb +0 -31
  184. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/sample.rb +0 -152
  185. data/utils/enveomics/Scripts/lib/enveomics_rb/stats.rb +0 -3
  186. data/utils/enveomics/Scripts/lib/enveomics_rb/utils.rb +0 -74
  187. data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +0 -135
  188. data/utils/enveomics/Scripts/ogs.annotate.rb +0 -88
  189. data/utils/enveomics/Scripts/ogs.core-pan.rb +0 -160
  190. data/utils/enveomics/Scripts/ogs.extract.rb +0 -125
  191. data/utils/enveomics/Scripts/ogs.mcl.rb +0 -186
  192. data/utils/enveomics/Scripts/ogs.rb +0 -104
  193. data/utils/enveomics/Scripts/ogs.stats.rb +0 -131
  194. data/utils/enveomics/Scripts/rbm-legacy.rb +0 -172
  195. data/utils/enveomics/Scripts/rbm.rb +0 -108
  196. data/utils/enveomics/Scripts/sam.filter.rb +0 -148
  197. data/utils/enveomics/Tests/Makefile +0 -10
  198. data/utils/enveomics/Tests/Mgen_M2288.faa +0 -3189
  199. data/utils/enveomics/Tests/Mgen_M2288.fna +0 -8282
  200. data/utils/enveomics/Tests/Mgen_M2321.fna +0 -8288
  201. data/utils/enveomics/Tests/Nequ_Kin4M.faa +0 -2970
  202. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
  203. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +0 -7
  204. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +0 -17
  205. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +0 -137
  206. data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +0 -123
  207. data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +0 -200
  208. data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +0 -55
  209. data/utils/enveomics/Tests/alkB.nwk +0 -1
  210. data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +0 -13
  211. data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +0 -17
  212. data/utils/enveomics/Tests/hiv1.faa +0 -59
  213. data/utils/enveomics/Tests/hiv1.fna +0 -134
  214. data/utils/enveomics/Tests/hiv2.faa +0 -70
  215. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +0 -233
  216. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +0 -1
  217. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +0 -233
  218. data/utils/enveomics/Tests/phyla_counts.tsv +0 -10
  219. data/utils/enveomics/Tests/primate_lentivirus.ogs +0 -11
  220. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +0 -9
  221. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +0 -8
  222. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +0 -6
  223. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +0 -9
  224. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +0 -6
  225. data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +0 -6
  226. data/utils/enveomics/build_enveomics_r.bash +0 -45
  227. data/utils/enveomics/enveomics.R/DESCRIPTION +0 -31
  228. data/utils/enveomics/enveomics.R/NAMESPACE +0 -39
  229. data/utils/enveomics/enveomics.R/R/autoprune.R +0 -155
  230. data/utils/enveomics/enveomics.R/R/barplot.R +0 -184
  231. data/utils/enveomics/enveomics.R/R/cliopts.R +0 -135
  232. data/utils/enveomics/enveomics.R/R/df2dist.R +0 -154
  233. data/utils/enveomics/enveomics.R/R/growthcurve.R +0 -331
  234. data/utils/enveomics/enveomics.R/R/prefscore.R +0 -79
  235. data/utils/enveomics/enveomics.R/R/recplot.R +0 -354
  236. data/utils/enveomics/enveomics.R/R/recplot2.R +0 -1631
  237. data/utils/enveomics/enveomics.R/R/tribs.R +0 -583
  238. data/utils/enveomics/enveomics.R/R/utils.R +0 -80
  239. data/utils/enveomics/enveomics.R/README.md +0 -81
  240. data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
  241. data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
  242. data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +0 -16
  243. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +0 -16
  244. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +0 -16
  245. data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +0 -25
  246. data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +0 -46
  247. data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +0 -23
  248. data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +0 -47
  249. data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +0 -23
  250. data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +0 -23
  251. data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +0 -40
  252. data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +0 -103
  253. data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +0 -67
  254. data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +0 -24
  255. data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +0 -19
  256. data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +0 -45
  257. data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +0 -44
  258. data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +0 -47
  259. data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +0 -75
  260. data/utils/enveomics/enveomics.R/man/enve.prefscore.Rd +0 -50
  261. data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +0 -44
  262. data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +0 -139
  263. data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +0 -45
  264. data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +0 -24
  265. data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +0 -77
  266. data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +0 -25
  267. data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +0 -21
  268. data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +0 -19
  269. data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +0 -19
  270. data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +0 -47
  271. data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +0 -29
  272. data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +0 -18
  273. data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +0 -45
  274. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +0 -36
  275. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +0 -19
  276. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +0 -19
  277. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +0 -27
  278. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +0 -52
  279. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +0 -17
  280. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +0 -51
  281. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +0 -43
  282. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +0 -82
  283. data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +0 -59
  284. data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +0 -27
  285. data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +0 -36
  286. data/utils/enveomics/enveomics.R/man/enve.selvector.Rd +0 -23
  287. data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +0 -68
  288. data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +0 -28
  289. data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +0 -27
  290. data/utils/enveomics/enveomics.R/man/growth.curves.Rd +0 -14
  291. data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +0 -13
  292. data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +0 -78
  293. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +0 -46
  294. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +0 -45
  295. data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +0 -125
  296. data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +0 -19
  297. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +0 -19
  298. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +0 -19
  299. data/utils/enveomics/globals.mk +0 -8
  300. data/utils/enveomics/manifest.json +0 -9
  301. data/utils/multitrim/Multitrim How-To.pdf +0 -0
  302. data/utils/multitrim/README.md +0 -67
  303. data/utils/multitrim/multitrim.py +0 -1555
  304. data/utils/multitrim/multitrim.yml +0 -13
@@ -1,906 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "Aln.cat.rb",
5
- "description": ["Concatenates several multiple alignments in FastA",
6
- "format into a single multiple alignment. The IDs of the sequences",
7
- "(or the ID prefixes, if using --ignore-after) must coincide across",
8
- "files."],
9
- "help_arg": "--help",
10
- "options": [
11
- {
12
- "opt": "--coords",
13
- "arg": "out_file",
14
- "description": "Output file of coordinates in RAxML-compliant format."
15
- },
16
- {
17
- "opt": "--ignore-after",
18
- "arg": "string",
19
- "description": ["Remove everything in the IDs after the specified",
20
- "string."]
21
- },
22
- {
23
- "opt": "--remove-invariable",
24
- "description": "Remove invariable sites.",
25
- "note": ["Invariable sites are defined as columns with only one",
26
- "state and undefined characters. Additional ambiguous characters",
27
- "may exist and should be declared using --undefined."]
28
- },
29
- {
30
- "opt": "--missing-char",
31
- "description": "Character denoting missing data.",
32
- "arg": "character",
33
- "default": "-"
34
- },
35
- {
36
- "opt": "--model",
37
- "description": "Name of the model to use if --coords is used.",
38
- "note": "See RAxML's documentation for additional information.",
39
- "arg": "string",
40
- "default": "AUTO"
41
- },
42
- {
43
- "opt": "--undefined",
44
- "arg": "string",
45
- "description": ["All characters to be regarded as 'undefined'. It",
46
- "should include all ambiguous and missing data chars. Ignored",
47
- "unless --remove-invariable."],
48
- "default": "-.Xx?"
49
- },
50
- {
51
- "opt": "--quiet",
52
- "description": "Run quietly (no STDERR output)."
53
- },
54
- {
55
- "name": "Input alignments",
56
- "arg": "in_file",
57
- "multiple_sep": " ",
58
- "mandatory": true,
59
- "description": "Input alignments in FastA format."
60
- },
61
- ">",
62
- {
63
- "name": "Output alignment",
64
- "arg": "out_file",
65
- "mandatory": true,
66
- "description": "Output concatenated alignment."
67
- }
68
- ]
69
- },
70
- {
71
- "task": "Aln.convert.pl",
72
- "description": "Translates between different alignment formats.",
73
- "help_arg": "",
74
- "requires": [
75
- {
76
- "perl_lib": "Bio::AlignIO"
77
- }
78
- ],
79
- "cite": [["Stajich et al, 2002, GRes",
80
- "http://dx.doi.org/10.1101/gr.361602"]],
81
- "options": [
82
- {
83
- "name": "In-format",
84
- "description": "Input file's format.",
85
- "mandatory": true,
86
- "arg": "select",
87
- "values": ["bl2seq", "clustalw", "emboss", "fasta", "maf", "mase",
88
- "mega", "meme", "metafasta", "msf", "nexus", "pfam", "phylip", "po",
89
- "prodom", "psi", "selex", "stockholm", "XMFA", "arp"]
90
- },
91
- {
92
- "name": "Out-format",
93
- "description": "Output file's format.",
94
- "mandatory": true,
95
- "arg": "select",
96
- "values": ["bl2seq", "clustalw", "emboss", "fasta", "maf", "mase",
97
- "mega", "meme", "metafasta", "msf", "nexus", "pfam", "phylip", "po",
98
- "prodom", "psi", "selex", "stockholm", "XMFA", "arp"]
99
- },
100
- "<",
101
- {
102
- "arg": "in_file",
103
- "mandatory": true
104
- },
105
- ">",
106
- {
107
- "arg": "out_file",
108
- "mandatory": true
109
- }
110
- ]
111
- },
112
- {
113
- "task": "AlphaDiversity.pl",
114
- "description": ["Takes a table of OTU abundance in one or more samples",
115
- "and calculates the Rao (Q_alpha), Rao-Jost (Q_alpha_eqv), Shannon",
116
- "(Hprime), and inverse Simpson (1_lambda) indices of alpha diversity",
117
- "for each sample."],
118
- "help_arg": "--help",
119
- "see_also": ["Chao1.pl"],
120
- "options": [
121
- {
122
- "name": "Input table",
123
- "opt": "-i",
124
- "arg": "in_file",
125
- "description": ["Columns: samples, rows: OTUs, first column: OTU",
126
- "names)."],
127
- "mandatory": true
128
- },
129
- {
130
- "name": "Discard rows",
131
- "opt": "-r",
132
- "arg": "integer",
133
- "description": "Number of rows to ignore.",
134
- "default": 0
135
- },
136
- {
137
- "name": "Discard left columns",
138
- "opt": "-c",
139
- "arg": "integer",
140
- "description": ["Number of columns to ignore after the first column",
141
- "(i.e., between the first column, containing the name of the",
142
- "categories, and the first column of abundance values)."],
143
- "default": 0
144
- },
145
- {
146
- "name": "Discard right columns",
147
- "opt": "-C",
148
- "arg": "integer",
149
- "description": "Number of columns to ignore at the end of each line.",
150
- "default": 0
151
- },
152
- {
153
- "name": "Delimiter",
154
- "opt": "-d",
155
- "arg": "string",
156
- "description": "Character (or string) separating columns.",
157
- "note": ["Supported escaped characters are: '\\t' (tabulation), and",
158
- "'\\0' (null bit)."],
159
- "default": "\\t"
160
- },
161
- {
162
- "name": "Headers",
163
- "opt": "-h",
164
- "description": ["The first row is assumed to have the names of the",
165
- "samples."]
166
- },
167
- {
168
- "name": "Distances file",
169
- "opt": "-D",
170
- "arg": "in_file",
171
- "description": ["A squared matrix (or bottom-left half matrix) with",
172
- "the distances between categories (OTUs or functions). The first",
173
- "column must contain the names of the categories, and it shouldn't",
174
- "have headers. If not set, all distances are assumed to be one."],
175
- "note": "Only used for Rao."
176
- },
177
- {
178
- "name": "Skip Rao",
179
- "opt": "-R",
180
- "description": "Do not calculate Rao indices.",
181
- "note": ["This significantly decreases the total running time. Note",
182
- "that Rao indices are highly susceptible to precision errors, and",
183
- "shouldn't be trusted for very big numbers."]
184
- },
185
- {
186
- "name": "q for qD",
187
- "opt": "-q",
188
- "arg": "integer",
189
- "description": "Estimate the qD index (true diversity order q).",
190
- "default": 0
191
- },
192
- ">",
193
- {
194
- "arg": "out_file",
195
- "mandatory": true
196
- }
197
- ]
198
- },
199
- {
200
- "task": "Chao1.pl",
201
- "description": ["Takes a table of OTU abundance in one or more samples",
202
- "and calculates the chao1 index (with 95% Confidence Interval) for",
203
- "each sample. To use it with Qiime OTU Tables, run it ignoring 1",
204
- "left column and with header."],
205
- "cite": [["Chao, 1984, Scandinavian J Stat",
206
- "http://www.jstor.org/stable/4615964"]],
207
- "see_also": ["AlphaDiversity.pl"],
208
- "help_arg": "--help",
209
- "options": [
210
- {
211
- "name": "Input file",
212
- "opt": "-i",
213
- "arg": "in_file",
214
- "mandatory": true,
215
- "description": "Input table (columns:samples, rows:OTUs)."
216
- },
217
- {
218
- "name": "Rows",
219
- "opt": "-r",
220
- "arg": "integer",
221
- "default": 0,
222
- "description": "Number of rows to ignore."
223
- },
224
- {
225
- "name": "Left columns to ignore",
226
- "opt": "-c",
227
- "arg": "integer",
228
- "default": 0,
229
- "description": "Number of columns to ignore."
230
- },
231
- {
232
- "name": "Right columns to ignore",
233
- "opt": "-C",
234
- "arg": "integer",
235
- "default": 0,
236
- "description": "Number of columns to ignore at the end."
237
- },
238
- {
239
- "name": "Delimiter",
240
- "opt": "-d",
241
- "arg": "string",
242
- "default": "\\t",
243
- "description": "Delimiter between columns.",
244
- "note": ["Supported escaped characters are: \\t (tabulation),",
245
- "and \\0 (null bit)."]
246
- },
247
- {
248
- "name": "Header",
249
- "opt": "-h",
250
- "description": ["If set, the first row is assumed to have the names",
251
- "of the samples."]
252
- },
253
- ">",
254
- {
255
- "arg": "out_file",
256
- "mandatory": true,
257
- "description": ["Chao1 index and 95% CI bounds for each sample, in",
258
- "tab-delimited format."]
259
- }
260
- ]
261
- },
262
- {
263
- "task": "CharTable.classify.rb",
264
- "description": ["Uses a dichotomous key to classify objects parsing a",
265
- "character table."],
266
- "help_arg": "--help",
267
- "options": [
268
- {
269
- "opt": "--table",
270
- "arg": "in_file",
271
- "mandatory": true,
272
- "description": ["Input table containing the states (columns) per",
273
- "object (row). It must be tab-delimited and with row and column",
274
- "names."]
275
- },
276
- {
277
- "opt": "--key",
278
- "arg": "in_file",
279
- "mandatory": true,
280
- "description": ["Input table containing the dychotomous key in",
281
- "linked style, defined in four columns (can contain #-lead comment",
282
- "lines): (1) ID of the step, typically a sequential integer. (2)",
283
- "Name of character to evaluate. Must coincide with the -t headers.",
284
- "(3) First character decision (see below). (4) Second character",
285
- "decision (see below).\nA character decision must be formated as:",
286
- "state (must coincide with the values in -t), colon (:), step to",
287
- "follow. If the state is * (star) any state triggers the decision",
288
- "(this should be the norm in column 4). The step to follow should",
289
- "be a step ID in square brackets, or the name of the",
290
- "classification."]
291
- },
292
- {
293
- "opt": "--classification",
294
- "arg": "out_file",
295
- "description": ["Two-column table with the classification of the",
296
- "input objects."]
297
- },
298
- {
299
- "opt": "--newick",
300
- "arg": "out_file",
301
- "description": ["Tree containing all the classified objects. This",
302
- "only makes sense for synoptic keys."]
303
- },
304
- {
305
- "opt": "--quiet",
306
- "description": "Run quietly (no STDERR output)."
307
- }
308
- ]
309
- },
310
- {
311
- "task": "GenBank.add_fields.rb",
312
- "description": "Adds annotations to GenBank files.",
313
- "help_arg": "--help",
314
- "options": [
315
- {
316
- "opt": "--genbank",
317
- "arg": "in_file",
318
- "mandatory": true,
319
- "description": "Input GenBank file."
320
- },
321
- {
322
- "opt": "--table",
323
- "arg": "in_file",
324
- "mandatory": true,
325
- "description": ["Input file containing the annotations. It must be a",
326
- "tab-delimited raw table including a header row with the names of",
327
- "the fields."]
328
- },
329
- {
330
- "opt": "--out",
331
- "arg": "out_file",
332
- "mandatory": true,
333
- "description": "Output file containing the annotated GenBank."
334
- },
335
- {
336
- "opt": "--key",
337
- "arg": "integer",
338
- "default": 1,
339
- "description": "Key of the column to use as identifier."
340
- },
341
- {
342
- "opt": "--split",
343
- "arg": "string",
344
- "default": "#",
345
- "description": ["String that separates multiple entries in the",
346
- "annotation features."]
347
- },
348
- {
349
- "opt": "--quiet",
350
- "description": "Run quietly (no STDERR output)."
351
- }
352
- ]
353
- },
354
- {
355
- "task": "HMM.essential.rb",
356
- "description": ["Finds and extracts a collection of essential proteins",
357
- "suitable for genome completeness evaluation and phylogenetic",
358
- "analyses in Archaea and Bacteria."],
359
- "warn": ["Most complete bacterial genomes contain only 106/111 genes in",
360
- "this collection, therefore producing a completeness of 95.5%, and",
361
- "most archaeal genomes only contain 26/111 genes, producing a",
362
- "completeness of 23.4%. Use the options --bacteria and/or --archaea to",
363
- "ignore models often missing in one or both domains. Note that even",
364
- "with these options, some complete archaeal genomes result in very low",
365
- "values of completeness (e.g., Nanoarchaeum equitans returns 88.5%)."],
366
- "help_arg": "--help",
367
- "requires": [
368
- {
369
- "description": "HMMer 3.0+",
370
- "test": "hmmsearch -h",
371
- "source_url": "http://hmmer.janelia.org/software"
372
- }
373
- ],
374
- "cite": [
375
- ["Eddy, 2011, PLoS CB",
376
- "http://dx.doi.org/10.1371/journal.pcbi.1002195"],
377
- ["Dupont et al, 2012, ISME J",
378
- "https://doi.org/10.1038/ismej.2011.189"],
379
- ["Rodriguez-R et al, 2014, ISME J",
380
- "https://doi.org/10.1038/ismej.2015.5"],
381
- ["Lee, 2019, Bioinf",
382
- "https://doi.org/10.1093/bioinformatics/btz188"],
383
- ["Eren et al, 2015, PeerJ",
384
- "https://doi.org/10.7717/peerj.1319"]
385
- ],
386
- "options": [
387
- {
388
- "name": "Input file",
389
- "opt": "--in",
390
- "arg": "in_file",
391
- "mandatory": true,
392
- "description": "FastA file containing all the proteins in the genome."
393
- },
394
- {
395
- "opt": "--collection",
396
- "arg": "string",
397
- "default": "dupont_2012",
398
- "description": ["Reference collection of essential proteins to use.",
399
- "One of: dupont_2012 (default, Dupont et al 2012 modified by",
400
- "Rodriguez-R et al 2015), or lee_2019 (Lee 2019 modified by Eren",
401
- "et al 2015)."]
402
- },
403
- {
404
- "name": "Output file",
405
- "opt": "--out",
406
- "arg": "out_file",
407
- "description": ["FastA file with the translated essential genes. By",
408
- "default the file is not produced."]
409
- },
410
- {
411
- "opt": "--per-model",
412
- "arg": "out_file",
413
- "description": ["Prefix of translated genes in independent files",
414
- "with the name of the model appended. By default files are not",
415
- "produced."]
416
- },
417
- {
418
- "opt": "--report",
419
- "arg": "out_file",
420
- "description": ["Path to the report file. By default, the report is",
421
- "sent to the STDOUT."]
422
- },
423
- {
424
- "name": "HMMsearch output",
425
- "opt": "--hmm-out",
426
- "arg": "out_file",
427
- "description": ["Save HMMsearch output in this file. By default,",
428
- "not saved."]
429
- },
430
- {
431
- "opt": "--alignments",
432
- "opt": "out_file",
433
- "description": ["Save the aligned proteins in this file. By default,",
434
- "not saved."]
435
- },
436
- {
437
- "opt": "--bacteria",
438
- "description": "If set, ignores models typically missing in Bacteria."
439
- },
440
- {
441
- "opt": "--archaea",
442
- "description": "If set, ignores models typically missing in Archaea."
443
- },
444
- {
445
- "opt": "--genome-eq",
446
- "description": ["If set, ignores models not suitable for",
447
- "genome-equivalents estimations. See Rodriguez-R et al, 2015, ISME",
448
- "J 9(9):1928-1940."],
449
- "source_url": "http://www.nature.com/ismej/journal/vaop/ncurrent/full/ismej20155a.html"
450
- },
451
- {
452
- "opt": "--rename",
453
- "arg": "string",
454
- "description": ["If set, renames the sequences with the string",
455
- "provided and appends it with pipe (|) and the gene name (except",
456
- "in --per-model files)."]
457
- },
458
- {
459
- "opt": "--no-stats",
460
- "description": ["If set, no statistics are reported on genome",
461
- "evaluation."]
462
- },
463
- {
464
- "opt": "--no-genes",
465
- "description": ["If set, statistics won't include the lists of",
466
- "missing/multi-copy genes."]
467
- },
468
- {
469
- "opt": "--metagenome",
470
- "description": ["If set, it allows for multiple copies of each gene",
471
- "and turns on metagenomic report mode."]
472
- },
473
- {
474
- "opt": "--list-models",
475
- "description": ["If set, it only lists the models and exits.",
476
- "Compatible with 'Archaea', 'Bacteria', 'Genome eq', and 'Quiet';",
477
- "ignores all other parameters."]
478
- },
479
- {
480
- "opt": "--bin",
481
- "arg": "in_dir",
482
- "description": "Directory containing the binaries of HMMer 3.0+."
483
- },
484
- {
485
- "opt": "--model-file",
486
- "arg": "in_file",
487
- "description": "External file containing models to search."
488
- },
489
- {
490
- "opt": "--threads",
491
- "arg": "integer",
492
- "default": 2,
493
- "description": "Number of parallel threads to be used."
494
- },
495
- {
496
- "opt": "--quiet",
497
- "description": "Run quietly (no STDERR output)."
498
- }
499
- ]
500
- },
501
- {
502
- "task": "HMMsearch.extractIds.rb",
503
- "description": ["Extracts the sequence IDs and query model form a",
504
- "(multiple) HMMsearch report (for HMMer 3.0)."],
505
- "help_arg": "--help",
506
- "options": [
507
- {
508
- "opt": "--all-evalue",
509
- "arg": "float",
510
- "description": "Maximum e-value of sequence to report result."
511
- },
512
- {
513
- "opt": "--all-score",
514
- "arg": "float",
515
- "description": "Minimum score of sequence to report result."
516
- },
517
- {
518
- "opt": "--best-evalue",
519
- "arg": "float",
520
- "description": "Maximum e-value of best domain to report result."
521
- },
522
- {
523
- "opt": "--best-score",
524
- "arg": "float",
525
- "description": "Minimum score of best domain to report result."
526
- },
527
- {
528
- "opt": "--no-model",
529
- "description": "Do not include the query model in the output list."
530
- },
531
- {
532
- "opt": "--quiet",
533
- "description": "Run quietly."
534
- },
535
- "<",
536
- {
537
- "arg": "in_file",
538
- "mandatory": true,
539
- "description": "Input HMMsearch text file."
540
- },
541
- ">",
542
- {
543
- "arg": "out_file",
544
- "mandatory": true,
545
- "description": "Output list of IDs."
546
- }
547
- ]
548
- },
549
- {
550
- "task": "JPlace.distances.rb",
551
- "description": ["Extracts the distance (estimated branch length) of each",
552
- "placed read to a given node in a JPlace file."],
553
- "requires": [ { "ruby_gem": "json" } ],
554
- "help_arg": "--help",
555
- "options": [
556
- {
557
- "name": "Input file",
558
- "opt": "--in",
559
- "arg": "in_file",
560
- "mandatory": true,
561
- "description": ".jplace input file containing the read placement."
562
- },
563
- {
564
- "name": "Node",
565
- "opt": "--node",
566
- "arg": "string",
567
- "mandatory": true,
568
- "description": ["Index (number in curly brackets) of the node to",
569
- "which distances should be measured."]
570
- },
571
- {
572
- "name": "Output file",
573
- "opt": "--out",
574
- "arg": "out_file",
575
- "mandatory": true,
576
- "description": "Output file in tabular format."
577
- },
578
- {
579
- "opt": "--in-node",
580
- "arg": "string",
581
- "description": ["Report only reads placed at this node or it's",
582
- "children."]
583
- },
584
- {
585
- "opt": "--quiet",
586
- "description": "Run quietly (no STDERR output)."
587
- }
588
- ]
589
- },
590
- {
591
- "task": "JPlace.to_iToL.rb",
592
- "description": ["Generates iToL-compatible files from a .jplace file",
593
- "(produced by RAxML's EPA or pplacer), that can be used to draw",
594
- "pie-charts in the nodes of the reference tree."],
595
- "requires": [ { "ruby_gem": "json" } ],
596
- "help_arg": "--help",
597
- "options": [
598
- {
599
- "name": "Input file",
600
- "opt": "--in",
601
- "arg": "in_file",
602
- "mandatory": true,
603
- "description": ".jplace input file containing the read placement."
604
- },
605
- {
606
- "name": "Out base",
607
- "opt": "--out",
608
- "arg": "out_file",
609
- "mandatory": true,
610
- "description": "Base of the output files."
611
- },
612
- {
613
- "opt": "--unique",
614
- "arg": "string",
615
- "description": ["Name of the dataset (if only one is used).",
616
- "Conflicts with 'Regex' and 'Separator'."]
617
- },
618
- {
619
- "opt": "--regex",
620
- "arg": "string",
621
- "description": ["Regular expression capturing the sample ID (named",
622
- "dataset) in read names. By default: '^(?<dataset>.+?):.*'.",
623
- "Conflicts with 'Separator'."]
624
- },
625
- {
626
- "opt": "--separator",
627
- "arg": "string",
628
- "description": ["String separating the dataset name and the rest of",
629
- "the read name. It assumes that the read name starts by the",
630
- "dataset name. Conflicts with 'Regex'."]
631
- },
632
- {
633
- "opt": "--metadata",
634
- "arg": "in_file",
635
- "description": ["Datasets metadata in tab-delimited format with a",
636
- "header row. Valid headers: name (required), color (in Hex),",
637
- "size (# reads), norm (any float)."]
638
- },
639
- {
640
- "opt": "--norm",
641
- "arg": "string",
642
- "description": ["Normalization strategy. Must be one of:\n",
643
- "none: Direct read counts are reported without normalization.\n",
644
- "count (default): The counts are normalized (divided) by the total",
645
- "counts per dataset.\n",
646
- "size: The counts are normalized (divided) by the size column in",
647
- "metadata (must be integer).\n",
648
- "norm: The counts are normalized (divided) by the norm column in",
649
- "metadata (can be any float)."]
650
- },
651
- {
652
- "opt": "--old-itol",
653
- "description": ["Generate output file using the old iToL format",
654
- " (pre v3.0)."]
655
- },
656
- {
657
- "opt": "--collapse",
658
- "arg": "in_file",
659
- "description": "Internal nodes to collapse (requires rootted tree)."
660
- },
661
- {
662
- "opt": "--area",
663
- "description": ["If set, the area of the pies is proportional to the",
664
- "placements. Otherwise, the radius is."]
665
- },
666
- {
667
- "opt": "--quiet",
668
- "description": "Run quietly (no STDERR output)."
669
- }
670
- ]
671
- },
672
- {
673
- "task": "MyTaxa.fragsByTax.pl",
674
- "description": "Identifies fragments annotated as a taxon in MyTaxa.",
675
- "help_arg": "",
676
- "options": [
677
- {
678
- "name": "MyTaxa output",
679
- "arg": "in_file",
680
- "mandatory": true,
681
- "description": "Classification file generated by MyTaxa."
682
- },
683
- {
684
- "name": "Taxon",
685
- "arg": "string",
686
- "mandatory": true,
687
- "description": "Taxon to look for."
688
- },
689
- {
690
- "name": "Rank",
691
- "arg": "string",
692
- "description": "Rank of taxon (optional). By default: any rank."
693
- },
694
- ">",
695
- {
696
- "arg": "out_file",
697
- "mandatory": true,
698
- "description": "List of fragment IDs."
699
- }
700
- ]
701
- },
702
- {
703
- "task": "MyTaxa.seq-taxrank.rb",
704
- "description": ["Generates a simple tabular file with the classification",
705
- "of each sequence at a given taxonomic rank from a MyTaxa output."],
706
- "help_arg": "--help",
707
- "options": [
708
- {
709
- "name": "MyTaxa",
710
- "opt": "--mytaxa",
711
- "arg": "in_file",
712
- "mandatory": true,
713
- "description": "Input MyTaxa file."
714
- },
715
- {
716
- "opt": "--rank",
717
- "arg": "string",
718
- "default": "genus",
719
- "description": "Taxonomic rank."
720
- },
721
- {
722
- "opt": "--quiet",
723
- "description": "Run quietly."
724
- }
725
- ]
726
- },
727
- {
728
- "task": "Taxonomy.silva2ncbi.rb",
729
- "description": ["Re-formats Silva taxonomy into NCBI-like taxonomy dump",
730
- "files."],
731
- "help_arg": "--help",
732
- "options": [
733
- {
734
- "opt": "--silvaranks",
735
- "arg": "in_file",
736
- "mandatory": true,
737
- "description": ["Input Silva ranks file (e.g.,",
738
- "tax_ranks_ssu_115.txt)."],
739
- "source_url": "https://www.arb-silva.de/no_cache/download/archive/release_115/Exports/"
740
- },
741
- {
742
- "opt": "--silvaref",
743
- "arg": "in_file",
744
- "mandatory": true,
745
- "description": ["Input Silva ref alignment file (e.g.,",
746
- "SSURef_NR99_115_tax_silva_full_align_trunc.fasta)."],
747
- "source_url": "https://www.arb-silva.de/no_cache/download/archive/release_115/Exports/"
748
- },
749
- {
750
- "opt": "--patch",
751
- "arg": "in_file",
752
- "description": ["If passed, it replaces the paths specified in the",
753
- "patch."],
754
- "source_url": "http://enve-omics.ce.gatech.edu/data/public_misc/patch_Silva_SSU_r115.txt"
755
- },
756
- {
757
- "opt": "--seqinfo",
758
- "arg": "out_file",
759
- "description": ["If passed, it creates a CSV seq-info file",
760
- "compatible with taxtastic."]
761
- },
762
- {
763
- "opt": "--taxfile",
764
- "arg": "out_file",
765
- "description": "If passed, it creates a simple TSV taxonomy file."
766
- },
767
- {
768
- "opt": "--ncbi",
769
- "arg": "out_dir",
770
- "description": ["If passed, output folder for the NCBI dump files",
771
- "(e.g., taxdmp)."]
772
- },
773
- {
774
- "opt": "--warns",
775
- "description": "Verbously display warnings."
776
- }
777
- ]
778
- },
779
- {
780
- "task": "GFF.catsbj.pl",
781
- "description": ["Generates a list of coordinates from a GFF table",
782
- "concatenating the subject sequences."],
783
- "help_arg": "-h",
784
- "see_also": ["BlastTab.recplot2.R", "BlastTab.catsbj.pl"],
785
- "options": [
786
- {
787
- "name": "Lim file",
788
- "opt": "-L",
789
- "arg": "out_file",
790
- "description": ["An output file with the absolute coordinates of the",
791
- "concatenated contigs. This is identical to the .lim file",
792
- "generated by BlastTab.catsbj.pl."]
793
- },
794
- {
795
- "name": "Inter-feature gaps",
796
- "opt": "-i",
797
- "description": ["Preserve exact coordinates and include",
798
- "inter-feature windows as separate bins. By default, the",
799
- "coordinates are set in the midpoint between features when",
800
- "non-contiguous."]
801
- },
802
- {
803
- "name": "Subset",
804
- "opt": "-s",
805
- "description": ["The FastA provided is to be treated as a subset of",
806
- "the subject. By default, it expects all the contigs to be present",
807
- "in the BLAST."]
808
- },
809
- {
810
- "name": "Quiet",
811
- "opt": "-q",
812
- "description": "Run quietly."
813
- },
814
- {
815
- "name": "Subject sequences",
816
- "arg": "in_file",
817
- "mandatory": true,
818
- "description": "Subject sequences (contigs) in FastA format."
819
- },
820
- {
821
- "name": "Features",
822
- "arg": "in_file",
823
- "mandatory": true,
824
- "description": "Features to map in GFF."
825
- }
826
- ]
827
- },
828
- {
829
- "task": "Table.prefScore.R",
830
- "description": ["Estimate preference score of species based on occupancy",
831
- "in biased sample sets."],
832
- "help_arg": "--help",
833
- "requires": [ { "r_package": "optparse" } ],
834
- "options": [
835
- {
836
- "name": "Occupancy matrix",
837
- "opt": "--x",
838
- "arg": "in_file",
839
- "description": ["A tab-delimited table of presence/absence (1/0)",
840
- "with species as rows and samples as columns."],
841
- "mandatory": true
842
- },
843
- {
844
- "name": "Sample set",
845
- "opt": "--set",
846
- "arg": "in_file",
847
- "description": ["A list of sample names that constitute the test",
848
- "set, one per line."],
849
- "mandatory": true
850
- },
851
- {
852
- "opt": "--ignore",
853
- "arg": "in_file",
854
- "description": ["A list of species to exclude from the analysis,",
855
- "one per line."]
856
- },
857
- {
858
- "name": "Significance threshold",
859
- "opt": "--signif-thr",
860
- "arg": "float",
861
- "description": "Absolute value of the significance threshold."
862
- },
863
- {
864
- "opt": "--col-above",
865
- "arg": "string",
866
- "description": "Color for points significantly above zero.",
867
- "default": "#941100"
868
- },
869
- {
870
- "opt": "--col-equal",
871
- "arg": "string",
872
- "description": ["Color for points not significantly different from",
873
- "zero."],
874
- "default": "#BDBDBD"
875
- },
876
- {
877
- "opt": "--col-below",
878
- "arg": "string",
879
- "description": "Color for points significantly below zero.",
880
- "default": "#2F5496"
881
- },
882
- {
883
- "name": "Output preference scores",
884
- "arg": "out_file",
885
- "description": "Output raw-text file with preference scores.",
886
- "mandatory": true
887
- },
888
- {
889
- "name": "Graphical utput",
890
- "arg": "out_file",
891
- "description": "Output PDF file with preference scores plot."
892
- },
893
- {
894
- "name": "Width",
895
- "arg": "float",
896
- "description": "Width of the plot in inches (7 by default)."
897
- },
898
- {
899
- "name": "Height",
900
- "arg": "float",
901
- "description": "Height of the plot in inches (7 by default)."
902
- }
903
- ]
904
- }
905
- ]
906
- }