miga-base 1.2.15.2 → 1.2.15.4

Sign up to get free protection for your applications and to get access to all the features.
Files changed (306) hide show
  1. checksums.yaml +4 -4
  2. data/lib/miga/cli/action/download/gtdb.rb +4 -1
  3. data/lib/miga/cli/action/gtdb_get.rb +4 -0
  4. data/lib/miga/daemon.rb +4 -1
  5. data/lib/miga/lair.rb +6 -4
  6. data/lib/miga/remote_dataset/download.rb +3 -2
  7. data/lib/miga/remote_dataset.rb +25 -7
  8. data/lib/miga/taxonomy.rb +6 -0
  9. data/lib/miga/version.rb +2 -2
  10. metadata +6 -302
  11. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Archaea_SCG.hmm +0 -41964
  12. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Bacteria_SCG.hmm +0 -32439
  13. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Complete_SCG_DB.hmm +0 -62056
  14. data/utils/FastAAI/FastAAI +0 -3659
  15. data/utils/FastAAI/FastAAI-legacy/FastAAI +0 -1336
  16. data/utils/FastAAI/FastAAI-legacy/kAAI_v1.0_virus.py +0 -1296
  17. data/utils/FastAAI/README.md +0 -84
  18. data/utils/enveomics/Docs/recplot2.md +0 -244
  19. data/utils/enveomics/Examples/aai-matrix.bash +0 -66
  20. data/utils/enveomics/Examples/ani-matrix.bash +0 -66
  21. data/utils/enveomics/Examples/essential-phylogeny.bash +0 -105
  22. data/utils/enveomics/Examples/unus-genome-phylogeny.bash +0 -100
  23. data/utils/enveomics/LICENSE.txt +0 -73
  24. data/utils/enveomics/Makefile +0 -52
  25. data/utils/enveomics/Manifest/Tasks/aasubs.json +0 -103
  26. data/utils/enveomics/Manifest/Tasks/blasttab.json +0 -790
  27. data/utils/enveomics/Manifest/Tasks/distances.json +0 -161
  28. data/utils/enveomics/Manifest/Tasks/fasta.json +0 -802
  29. data/utils/enveomics/Manifest/Tasks/fastq.json +0 -291
  30. data/utils/enveomics/Manifest/Tasks/graphics.json +0 -126
  31. data/utils/enveomics/Manifest/Tasks/mapping.json +0 -137
  32. data/utils/enveomics/Manifest/Tasks/ogs.json +0 -382
  33. data/utils/enveomics/Manifest/Tasks/other.json +0 -906
  34. data/utils/enveomics/Manifest/Tasks/remote.json +0 -355
  35. data/utils/enveomics/Manifest/Tasks/sequence-identity.json +0 -650
  36. data/utils/enveomics/Manifest/Tasks/tables.json +0 -308
  37. data/utils/enveomics/Manifest/Tasks/trees.json +0 -68
  38. data/utils/enveomics/Manifest/Tasks/variants.json +0 -111
  39. data/utils/enveomics/Manifest/categories.json +0 -165
  40. data/utils/enveomics/Manifest/examples.json +0 -162
  41. data/utils/enveomics/Manifest/tasks.json +0 -4
  42. data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +0 -69
  43. data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +0 -1
  44. data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +0 -1
  45. data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +0 -1
  46. data/utils/enveomics/Pipelines/assembly.pbs/README.md +0 -189
  47. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +0 -112
  48. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +0 -23
  49. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +0 -44
  50. data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +0 -50
  51. data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +0 -37
  52. data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +0 -68
  53. data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +0 -49
  54. data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +0 -80
  55. data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +0 -57
  56. data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +0 -63
  57. data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +0 -38
  58. data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +0 -73
  59. data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +0 -21
  60. data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +0 -72
  61. data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +0 -98
  62. data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +0 -1
  63. data/utils/enveomics/Pipelines/blast.pbs/README.md +0 -127
  64. data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +0 -109
  65. data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +0 -128
  66. data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +0 -16
  67. data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +0 -22
  68. data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +0 -26
  69. data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +0 -89
  70. data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +0 -29
  71. data/utils/enveomics/Pipelines/idba.pbs/README.md +0 -49
  72. data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +0 -95
  73. data/utils/enveomics/Pipelines/idba.pbs/run.pbs +0 -56
  74. data/utils/enveomics/Pipelines/trim.pbs/README.md +0 -54
  75. data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +0 -70
  76. data/utils/enveomics/Pipelines/trim.pbs/run.pbs +0 -130
  77. data/utils/enveomics/README.md +0 -42
  78. data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +0 -171
  79. data/utils/enveomics/Scripts/Aln.cat.rb +0 -221
  80. data/utils/enveomics/Scripts/Aln.convert.pl +0 -35
  81. data/utils/enveomics/Scripts/AlphaDiversity.pl +0 -152
  82. data/utils/enveomics/Scripts/BedGraph.tad.rb +0 -93
  83. data/utils/enveomics/Scripts/BedGraph.window.rb +0 -71
  84. data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +0 -102
  85. data/utils/enveomics/Scripts/BlastTab.addlen.rb +0 -63
  86. data/utils/enveomics/Scripts/BlastTab.advance.bash +0 -48
  87. data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +0 -55
  88. data/utils/enveomics/Scripts/BlastTab.catsbj.pl +0 -104
  89. data/utils/enveomics/Scripts/BlastTab.cogCat.rb +0 -76
  90. data/utils/enveomics/Scripts/BlastTab.filter.pl +0 -47
  91. data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +0 -194
  92. data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +0 -104
  93. data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +0 -157
  94. data/utils/enveomics/Scripts/BlastTab.recplot2.R +0 -48
  95. data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +0 -86
  96. data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +0 -119
  97. data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +0 -86
  98. data/utils/enveomics/Scripts/BlastTab.subsample.pl +0 -47
  99. data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +0 -114
  100. data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +0 -90
  101. data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +0 -123
  102. data/utils/enveomics/Scripts/Chao1.pl +0 -97
  103. data/utils/enveomics/Scripts/CharTable.classify.rb +0 -234
  104. data/utils/enveomics/Scripts/EBIseq2tax.rb +0 -83
  105. data/utils/enveomics/Scripts/FastA.N50.pl +0 -60
  106. data/utils/enveomics/Scripts/FastA.extract.rb +0 -152
  107. data/utils/enveomics/Scripts/FastA.filter.pl +0 -52
  108. data/utils/enveomics/Scripts/FastA.filterLen.pl +0 -28
  109. data/utils/enveomics/Scripts/FastA.filterN.pl +0 -60
  110. data/utils/enveomics/Scripts/FastA.fragment.rb +0 -100
  111. data/utils/enveomics/Scripts/FastA.gc.pl +0 -42
  112. data/utils/enveomics/Scripts/FastA.interpose.pl +0 -93
  113. data/utils/enveomics/Scripts/FastA.length.pl +0 -38
  114. data/utils/enveomics/Scripts/FastA.mask.rb +0 -89
  115. data/utils/enveomics/Scripts/FastA.per_file.pl +0 -36
  116. data/utils/enveomics/Scripts/FastA.qlen.pl +0 -57
  117. data/utils/enveomics/Scripts/FastA.rename.pl +0 -65
  118. data/utils/enveomics/Scripts/FastA.revcom.pl +0 -23
  119. data/utils/enveomics/Scripts/FastA.sample.rb +0 -98
  120. data/utils/enveomics/Scripts/FastA.slider.pl +0 -85
  121. data/utils/enveomics/Scripts/FastA.split.pl +0 -55
  122. data/utils/enveomics/Scripts/FastA.split.rb +0 -79
  123. data/utils/enveomics/Scripts/FastA.subsample.pl +0 -131
  124. data/utils/enveomics/Scripts/FastA.tag.rb +0 -65
  125. data/utils/enveomics/Scripts/FastA.toFastQ.rb +0 -69
  126. data/utils/enveomics/Scripts/FastA.wrap.rb +0 -48
  127. data/utils/enveomics/Scripts/FastQ.filter.pl +0 -54
  128. data/utils/enveomics/Scripts/FastQ.interpose.pl +0 -90
  129. data/utils/enveomics/Scripts/FastQ.maskQual.rb +0 -89
  130. data/utils/enveomics/Scripts/FastQ.offset.pl +0 -90
  131. data/utils/enveomics/Scripts/FastQ.split.pl +0 -53
  132. data/utils/enveomics/Scripts/FastQ.tag.rb +0 -70
  133. data/utils/enveomics/Scripts/FastQ.test-error.rb +0 -81
  134. data/utils/enveomics/Scripts/FastQ.toFastA.awk +0 -24
  135. data/utils/enveomics/Scripts/GFF.catsbj.pl +0 -127
  136. data/utils/enveomics/Scripts/GenBank.add_fields.rb +0 -84
  137. data/utils/enveomics/Scripts/HMM.essential.rb +0 -351
  138. data/utils/enveomics/Scripts/HMM.haai.rb +0 -168
  139. data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +0 -83
  140. data/utils/enveomics/Scripts/JPlace.distances.rb +0 -88
  141. data/utils/enveomics/Scripts/JPlace.to_iToL.rb +0 -320
  142. data/utils/enveomics/Scripts/M5nr.getSequences.rb +0 -81
  143. data/utils/enveomics/Scripts/MeTaxa.distribution.pl +0 -198
  144. data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +0 -35
  145. data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +0 -49
  146. data/utils/enveomics/Scripts/NCBIacc2tax.rb +0 -92
  147. data/utils/enveomics/Scripts/Newick.autoprune.R +0 -27
  148. data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +0 -228
  149. data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +0 -32
  150. data/utils/enveomics/Scripts/RefSeq.download.bash +0 -48
  151. data/utils/enveomics/Scripts/SRA.download.bash +0 -55
  152. data/utils/enveomics/Scripts/TRIBS.plot-test.R +0 -36
  153. data/utils/enveomics/Scripts/TRIBS.test.R +0 -39
  154. data/utils/enveomics/Scripts/Table.barplot.R +0 -31
  155. data/utils/enveomics/Scripts/Table.df2dist.R +0 -30
  156. data/utils/enveomics/Scripts/Table.filter.pl +0 -61
  157. data/utils/enveomics/Scripts/Table.merge.pl +0 -77
  158. data/utils/enveomics/Scripts/Table.prefScore.R +0 -60
  159. data/utils/enveomics/Scripts/Table.replace.rb +0 -69
  160. data/utils/enveomics/Scripts/Table.round.rb +0 -63
  161. data/utils/enveomics/Scripts/Table.split.pl +0 -57
  162. data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +0 -227
  163. data/utils/enveomics/Scripts/VCF.KaKs.rb +0 -147
  164. data/utils/enveomics/Scripts/VCF.SNPs.rb +0 -88
  165. data/utils/enveomics/Scripts/aai.rb +0 -421
  166. data/utils/enveomics/Scripts/ani.rb +0 -362
  167. data/utils/enveomics/Scripts/anir.rb +0 -137
  168. data/utils/enveomics/Scripts/clust.rand.rb +0 -102
  169. data/utils/enveomics/Scripts/gi2tax.rb +0 -103
  170. data/utils/enveomics/Scripts/in_silico_GA_GI.pl +0 -96
  171. data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
  172. data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
  173. data/utils/enveomics/Scripts/lib/enveomics.R +0 -1
  174. data/utils/enveomics/Scripts/lib/enveomics_rb/anir.rb +0 -293
  175. data/utils/enveomics/Scripts/lib/enveomics_rb/bm_set.rb +0 -175
  176. data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +0 -24
  177. data/utils/enveomics/Scripts/lib/enveomics_rb/errors.rb +0 -17
  178. data/utils/enveomics/Scripts/lib/enveomics_rb/gmm_em.rb +0 -30
  179. data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +0 -253
  180. data/utils/enveomics/Scripts/lib/enveomics_rb/match.rb +0 -88
  181. data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +0 -182
  182. data/utils/enveomics/Scripts/lib/enveomics_rb/rbm.rb +0 -49
  183. data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +0 -74
  184. data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +0 -237
  185. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/rand.rb +0 -31
  186. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/sample.rb +0 -152
  187. data/utils/enveomics/Scripts/lib/enveomics_rb/stats.rb +0 -3
  188. data/utils/enveomics/Scripts/lib/enveomics_rb/utils.rb +0 -74
  189. data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +0 -135
  190. data/utils/enveomics/Scripts/ogs.annotate.rb +0 -88
  191. data/utils/enveomics/Scripts/ogs.core-pan.rb +0 -160
  192. data/utils/enveomics/Scripts/ogs.extract.rb +0 -125
  193. data/utils/enveomics/Scripts/ogs.mcl.rb +0 -186
  194. data/utils/enveomics/Scripts/ogs.rb +0 -104
  195. data/utils/enveomics/Scripts/ogs.stats.rb +0 -131
  196. data/utils/enveomics/Scripts/rbm-legacy.rb +0 -172
  197. data/utils/enveomics/Scripts/rbm.rb +0 -108
  198. data/utils/enveomics/Scripts/sam.filter.rb +0 -148
  199. data/utils/enveomics/Tests/Makefile +0 -10
  200. data/utils/enveomics/Tests/Mgen_M2288.faa +0 -3189
  201. data/utils/enveomics/Tests/Mgen_M2288.fna +0 -8282
  202. data/utils/enveomics/Tests/Mgen_M2321.fna +0 -8288
  203. data/utils/enveomics/Tests/Nequ_Kin4M.faa +0 -2970
  204. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
  205. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +0 -7
  206. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +0 -17
  207. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +0 -137
  208. data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +0 -123
  209. data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +0 -200
  210. data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +0 -55
  211. data/utils/enveomics/Tests/alkB.nwk +0 -1
  212. data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +0 -13
  213. data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +0 -17
  214. data/utils/enveomics/Tests/hiv1.faa +0 -59
  215. data/utils/enveomics/Tests/hiv1.fna +0 -134
  216. data/utils/enveomics/Tests/hiv2.faa +0 -70
  217. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +0 -233
  218. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +0 -1
  219. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +0 -233
  220. data/utils/enveomics/Tests/phyla_counts.tsv +0 -10
  221. data/utils/enveomics/Tests/primate_lentivirus.ogs +0 -11
  222. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +0 -9
  223. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +0 -8
  224. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +0 -6
  225. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +0 -9
  226. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +0 -6
  227. data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +0 -6
  228. data/utils/enveomics/build_enveomics_r.bash +0 -45
  229. data/utils/enveomics/enveomics.R/DESCRIPTION +0 -31
  230. data/utils/enveomics/enveomics.R/NAMESPACE +0 -39
  231. data/utils/enveomics/enveomics.R/R/autoprune.R +0 -155
  232. data/utils/enveomics/enveomics.R/R/barplot.R +0 -184
  233. data/utils/enveomics/enveomics.R/R/cliopts.R +0 -135
  234. data/utils/enveomics/enveomics.R/R/df2dist.R +0 -154
  235. data/utils/enveomics/enveomics.R/R/growthcurve.R +0 -331
  236. data/utils/enveomics/enveomics.R/R/prefscore.R +0 -79
  237. data/utils/enveomics/enveomics.R/R/recplot.R +0 -354
  238. data/utils/enveomics/enveomics.R/R/recplot2.R +0 -1631
  239. data/utils/enveomics/enveomics.R/R/tribs.R +0 -583
  240. data/utils/enveomics/enveomics.R/R/utils.R +0 -80
  241. data/utils/enveomics/enveomics.R/README.md +0 -81
  242. data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
  243. data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
  244. data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +0 -16
  245. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +0 -16
  246. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +0 -16
  247. data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +0 -25
  248. data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +0 -46
  249. data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +0 -23
  250. data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +0 -47
  251. data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +0 -23
  252. data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +0 -23
  253. data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +0 -40
  254. data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +0 -103
  255. data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +0 -67
  256. data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +0 -24
  257. data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +0 -19
  258. data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +0 -45
  259. data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +0 -44
  260. data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +0 -47
  261. data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +0 -75
  262. data/utils/enveomics/enveomics.R/man/enve.prefscore.Rd +0 -50
  263. data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +0 -44
  264. data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +0 -139
  265. data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +0 -45
  266. data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +0 -24
  267. data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +0 -77
  268. data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +0 -25
  269. data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +0 -21
  270. data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +0 -19
  271. data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +0 -19
  272. data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +0 -47
  273. data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +0 -29
  274. data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +0 -18
  275. data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +0 -45
  276. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +0 -36
  277. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +0 -19
  278. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +0 -19
  279. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +0 -27
  280. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +0 -52
  281. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +0 -17
  282. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +0 -51
  283. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +0 -43
  284. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +0 -82
  285. data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +0 -59
  286. data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +0 -27
  287. data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +0 -36
  288. data/utils/enveomics/enveomics.R/man/enve.selvector.Rd +0 -23
  289. data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +0 -68
  290. data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +0 -28
  291. data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +0 -27
  292. data/utils/enveomics/enveomics.R/man/growth.curves.Rd +0 -14
  293. data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +0 -13
  294. data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +0 -78
  295. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +0 -46
  296. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +0 -45
  297. data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +0 -125
  298. data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +0 -19
  299. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +0 -19
  300. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +0 -19
  301. data/utils/enveomics/globals.mk +0 -8
  302. data/utils/enveomics/manifest.json +0 -9
  303. data/utils/multitrim/Multitrim How-To.pdf +0 -0
  304. data/utils/multitrim/README.md +0 -67
  305. data/utils/multitrim/multitrim.py +0 -1555
  306. data/utils/multitrim/multitrim.yml +0 -13
@@ -1,308 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "Table.df2dist.R",
5
- "description": ["Transform a tab-delimited list of distances into a",
6
- "squared matrix."],
7
- "help_arg": "--help",
8
- "requires": [ { "r_package": "optparse" } ],
9
- "options": [
10
- {
11
- "name": "Input list",
12
- "opt": "--x",
13
- "arg": "in_file",
14
- "mandatory": true,
15
- "description": "A tab-delimited table with the distances."
16
- },
17
- {
18
- "opt": "--obj1-index",
19
- "arg": "integer",
20
- "default": 1,
21
- "description": ["Index of the column containing the ID of the object",
22
- "1."]
23
- },
24
- {
25
- "opt": "--obj2-index",
26
- "arg": "integer",
27
- "default": 2,
28
- "description": ["Index of the column containing the ID of the object",
29
- "2."]
30
- },
31
- {
32
- "opt": "--dist-index",
33
- "arg": "integer",
34
- "default": 3,
35
- "description": "Index of the column containing the distance."
36
- },
37
- {
38
- "opt": "--default-d",
39
- "arg": "integer",
40
- "description": "Default value for missing values. NA if empty."
41
- },
42
- {
43
- "opt": "--max-sim",
44
- "arg": "float",
45
- "description": ["If not-empty, assumes that the values are",
46
- "similarity (not distance) and this is the maximum similarity",
47
- "(corresponding to distance 0). Applies transformation:",
48
- "distance = (max.sim - values)/max.sim."]
49
- },
50
- {
51
- "arg": "out_file",
52
- "mandatory": true,
53
- "description": "Output squared matrix in tab-separated values format."
54
- }
55
- ]
56
- },
57
- {
58
- "task": "Table.filter.pl",
59
- "description": ["Extracts (and re-orders) a subset of rows from a raw",
60
- "table."],
61
- "help_arg": "",
62
- "options": [
63
- {
64
- "name": "Key",
65
- "opt": "-k",
66
- "arg": "integer",
67
- "default": 1,
68
- "description": "Column of the table to use as key to filter."
69
- },
70
- {
71
- "name": "Sep",
72
- "opt": "-s",
73
- "arg": "string",
74
- "description": ["String to use as separation between rows. By",
75
- "default, tabulation."]
76
- },
77
- {
78
- "name": "Inverse",
79
- "opt": "-i",
80
- "description": ["If set, reports the inverse of the list (i.e.,",
81
- "reports only rows absent in the list). Implies 'No re-order'."]
82
- },
83
- {
84
- "name": "Header",
85
- "opt": "-h",
86
- "description": "Keep first row of the table (header) untouched."
87
- },
88
- {
89
- "name": "No re-order",
90
- "opt": "-n",
91
- "description": ["The output has the same order of the table. By",
92
- "default, it prints in the order of the list."]
93
- },
94
- {
95
- "name": "List",
96
- "arg": "in_file",
97
- "mandatory": true,
98
- "description": "List of IDs to extract."
99
- },
100
- {
101
- "name": "Table",
102
- "arg": "in_file",
103
- "mandatory": true,
104
- "description": "Table file containing the superset."
105
- },
106
- ">",
107
- {
108
- "name": "Subset",
109
- "arg": "out_file",
110
- "mandatory": true,
111
- "description": "Table file to be created."
112
- }
113
- ]
114
- },
115
- {
116
- "task": "Table.merge.pl",
117
- "description": "Merges multiple (two-column) lists into one table.",
118
- "see_also": ["Table.split.pl"],
119
- "help_arg": "",
120
- "options": [
121
- {
122
- "name": "Strings",
123
- "opt": "-s",
124
- "description": ["Values are read as Strings. By default, values are",
125
- "read as numbers."]
126
- },
127
- {
128
- "name": "Input delimiter",
129
- "opt": "-i",
130
- "arg": "string",
131
- "description": "Input field-delimiter. By default, tabulation."
132
- },
133
- {
134
- "name": "Output delimiter",
135
- "opt": "-o",
136
- "arg": "string",
137
- "description": "Output field-delimiter. By default: tabulation."
138
- },
139
- {
140
- "name": "No header",
141
- "opt": "-n",
142
- "description": ["By default, the header is determined by the file",
143
- "names."]
144
- },
145
- {
146
- "name": "Empty",
147
- "opt": "-e",
148
- "description": ["Default string when no value is found. By default,",
149
- "the 'empty' value is 0 if values are numeric (i.e., unless -s is",
150
- "set) or an empty string otherwise."]
151
- },
152
- {
153
- "name": "Header",
154
- "opt": "-h",
155
- "arg": "string",
156
- "default": "Tag",
157
- "description": "Header of the first column, containing the IDs."
158
- },
159
- {
160
- "name": "Header format",
161
- "opt": "-H",
162
- "arg": "string",
163
- "default": "(?:.*/)?([^\\.]+)",
164
- "description": ["Format of filenames capturing the column header in",
165
- "the first capturing parenthesis. Non-capturing paretheses can be",
166
- "defined as (?:...). By default: '(?:.*/)?([^\\.]+)', which",
167
- "captures the part of the basename of the file before the first",
168
- "dot (if any)."]
169
- },
170
- {
171
- "name": "Rows to ignore",
172
- "opt": "-r",
173
- "arg": "integer",
174
- "default": 0,
175
- "description": "Number of leading rows to ignore in the input files."
176
- },
177
- {
178
- "arg": "in_file",
179
- "mandatory": true,
180
- "multiple_sep": " ",
181
- "description": "Input two-column lists."
182
- },
183
- ">",
184
- {
185
- "arg": "out_file",
186
- "mandatory": true,
187
- "description": "Merged table."
188
- }
189
- ]
190
- },
191
- {
192
- "task": "Table.round.rb",
193
- "description": "Rounds numbers in a table.",
194
- "help_arg": "--help",
195
- "options": [
196
- {
197
- "name": "Input file",
198
- "opt": "--in",
199
- "arg": "in_file",
200
- "mandatory": true,
201
- "description": "Input table."
202
- },
203
- {
204
- "name": "Output file",
205
- "opt": "--out",
206
- "arg": "out_file",
207
- "mandatory": true,
208
- "description": "Output table."
209
- },
210
- {
211
- "name": "Decimals",
212
- "opt": "--ndigits",
213
- "arg": "integer",
214
- "default": 0,
215
- "description": "Number of decimal digits."
216
- },
217
- {
218
- "opt": "--floor",
219
- "description": ["Floors the values instead of rounding them. Ignores",
220
- "'Decimals'."]
221
- },
222
- {
223
- "opt": "--ceil",
224
- "description": ["Ceils the values instead of rounding them. Ignores",
225
- "'Decimals'."]
226
- },
227
- {
228
- "opt": "--delimiter",
229
- "arg": "string",
230
- "description": "String delimiting columns. By default, tabulation."
231
- }
232
- ]
233
- },
234
- {
235
- "task": "Table.split.pl",
236
- "description": ["Split a file with multiple columns into multiple",
237
- "two-columns lists."],
238
- "see_also": ["Table.merge.pl"],
239
- "help_arg": "",
240
- "options": [
241
- {
242
- "name": "Input delimiter",
243
- "opt": "-i",
244
- "arg": "string",
245
- "description": "Input field-delimiter. By default, tabulation."
246
- },
247
- {
248
- "name": "Out prefix",
249
- "opt": "-o",
250
- "arg": "string",
251
- "description": "Prefix of the output files."
252
- },
253
- {
254
- "name": "Output directory",
255
- "opt": "-d",
256
- "arg": "out_dir",
257
- "description": "Output directory."
258
- },
259
- {
260
- "arg": "in_file",
261
- "mandatory": true,
262
- "description": "Input table."
263
- }
264
- ]
265
- },
266
- {
267
- "task": "Table.replace.rb",
268
- "description": "Replace a field in a table using a mapping file.",
269
- "help_arg": "--help",
270
- "options": [
271
- {
272
- "opt": "--map",
273
- "arg": "in_file",
274
- "mandatory": true,
275
- "description": "Mapping file with two columns (key and replacement)."
276
- },
277
- {
278
- "opt": "--in",
279
- "arg": "in_file",
280
- "mandatory": true,
281
- "description": "Input table."
282
- },
283
- {
284
- "opt": "--out",
285
- "arg": "out_file",
286
- "mandatory": true,
287
- "description": "Output table."
288
- },
289
- {
290
- "opt": "--key",
291
- "arg": "integer",
292
- "default": 1,
293
- "description": "Column to replace in Input table."
294
- },
295
- {
296
- "opt": "--unknown",
297
- "arg": "string",
298
- "description": "String to use whenever the key is not found in Map."
299
- },
300
- {
301
- "opt": "--delimiter",
302
- "arg": "string",
303
- "description": "String delimiting columns. By default, tabulation."
304
- }
305
- ]
306
- }
307
- ]
308
- }
@@ -1,68 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "Newick.autoprune.R",
5
- "description": ["Automatically prunes a tree, to keep representatives of",
6
- "each clade."],
7
- "requires": [ { "r_package": "optparse" }, { "r_package": "ape" } ],
8
- "cite": [["Paradis et al, 2004, Bioinf",
9
- "http://dx.doi.org/10.1093/bioinformatics/btg412"]],
10
- "help_arg": "--help",
11
- "options": [
12
- {
13
- "name": "Input tree",
14
- "opt": "--t",
15
- "arg": "in_file",
16
- "mandatory": true,
17
- "description": "A tree to prune in Newick format."
18
- },
19
- {
20
- "opt": "--dist-quantile",
21
- "arg": "float",
22
- "default": 0.25,
23
- "description": "The quantile of edge lengths."
24
- },
25
- {
26
- "opt": "--min_dist",
27
- "arg": "float",
28
- "description": ["The minimum distance to allow between two tips. If",
29
- "not set, dist.quantile is used instead to calculate it."]
30
- },
31
- {
32
- "opt": "--quiet",
33
- "description": ["Boolean indicating if the function must run without",
34
- "output."]
35
- },
36
- {
37
- "opt": "--max_iters",
38
- "arg": "integer",
39
- "default": 1000,
40
- "description": "Maximum number of iterations."
41
- },
42
- {
43
- "opt": "--min_nodes_random",
44
- "arg": "integer",
45
- "default": 40000,
46
- "description": ["Minimum number of nodes to trigger 'tip-pairs'",
47
- "nodes sampling. This sampling is less reproducible and more",
48
- "computationally expensive, but it's the only solution if the",
49
- "cophenetic matrix exceeds 2^31-1 entries; above that, it cannot",
50
- "be represented in R."]
51
- },
52
- {
53
- "opt": "--random_nodes_frx",
54
- "arg": "float",
55
- "default": 1.0,
56
- "description": ["Fraction of the nodes to be sampled if more than",
57
- "'Min nodes random'."]
58
- },
59
- {
60
- "arg": "out_file",
61
- "mandatory": true,
62
- "description": ["Output file in Newick format containing the pruned",
63
- "tree."]
64
- }
65
- ]
66
- }
67
- ]
68
- }
@@ -1,111 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "VCF.SNPs.rb",
5
- "description": ["Counts the number of Single-Nucleotide Polymorphisms",
6
- "(SNPs) in a VCF file."],
7
- "help_arg": "--help",
8
- "options": [
9
- {
10
- "opt": "--input",
11
- "arg": "in_file",
12
- "mandatory": true,
13
- "description": "Input file in Variant Call Format (VCF)."
14
- },
15
- {
16
- "name": "Filtered VCF",
17
- "opt": "--out",
18
- "arg": "out_file",
19
- "description": "Output (filtered) file in Variant Call Format (VCF)."
20
- },
21
- {
22
- "name": "Min DP",
23
- "opt": "--min-dp",
24
- "arg": "integer",
25
- "description": "Minimum number of reads covering the position.",
26
- "default": 4
27
- },
28
- {
29
- "name": "Max DP",
30
- "opt": "--max-dp",
31
- "arg": "integer",
32
- "description": ["Maximum number of reads covering the position. By",
33
- "default no limit."]
34
- },
35
- {
36
- "name": "Min Ref-DP",
37
- "opt": "--min-ref-dp",
38
- "arg": "integer",
39
- "description": "Minimum number of reads supporting the REF allele.",
40
- "default": 2
41
- },
42
- {
43
- "name": "Min Alt-DP",
44
- "opt": "--min-alt-dp",
45
- "arg": "integer",
46
- "description": "Minimum number of reads supporting the ALT allele.",
47
- "default": 2
48
- },
49
- {
50
- "opt": "--min-quality",
51
- "arg": "float",
52
- "description": "Minimum quality of the position mapping.",
53
- "default": 0.0
54
- },
55
- {
56
- "opt": "--min-shannon",
57
- "arg": "integer",
58
- "description": "Minimum information content (in bits, from 0 to 1).",
59
- "default": 0.0
60
- },
61
- {
62
- "opt": "--indels",
63
- "description": "Process indels."
64
- }
65
- ]
66
- },
67
- {
68
- "task": "VCF.KaKs.rb",
69
- "description": ["Estimates the Ka/Ks ratio from the SNPs in a VCF file.",
70
- "Ka and Ks are corrected using pseudo-counts, but no corrections for",
71
- "multiple substitutions are applied."],
72
- "help_arg": "--help",
73
- "see_also": ["VCF.SNPs.rb"],
74
- "options": [
75
- {
76
- "opt": "--input",
77
- "arg": "in_file",
78
- "mandatory": true,
79
- "description": "Input file in Variant Call Format (VCF)."
80
- },
81
- {
82
- "opt": "--seqs",
83
- "arg": "in_file",
84
- "mandatory": true,
85
- "description": "Input gene sequences (nucleotides) in FastA format."
86
- },
87
- {
88
- "name": "Synonymous fraction",
89
- "opt": "--syn-frx",
90
- "arg": "float",
91
- "description": ["Fraction of synonymous substitutions. If passed,",
92
- "the number of sites are estimated (not counted per gene),",
93
- "speeding up the computation ~10X."]
94
- },
95
- {
96
- "name": "Bacterial code synonymous fraction",
97
- "opt": "--syn-bacterial-code",
98
- "description": ["Sets the synonymous fraction to 0.760417,",
99
- "approximately the proportion of synonymous substitutions in the",
100
- "bacterial code."]
101
- },
102
- {
103
- "opt": "--codon-file",
104
- "arg": "out_file",
105
- "description": ["Output file including the codons of substitution",
106
- "variants."]
107
- }
108
- ]
109
- }
110
- ]
111
- }
@@ -1,165 +0,0 @@
1
- {
2
- "categories": {
3
- "Sequence similarity search": {
4
- "Statistics": [
5
- "BedGraph.tad.rb",
6
- "BedGraph.window.rb",
7
- "BlastPairwise.AAsubs.pl",
8
- "BlastTab.advance.bash",
9
- "BlastTab.recplot2.R",
10
- "BlastTab.seqdepth.pl",
11
- "BlastTab.seqdepth_nomedian.pl",
12
- "BlastTab.seqdepth_ZIP.pl",
13
- "BlastTab.sumPerHit.pl",
14
- "FastQ.test-error.rb",
15
- "RecPlot2.compareIdentities.R"
16
- ],
17
- "Manipulation": [
18
- "BlastTab.addlen.rb",
19
- "BlastTab.best_hit_sorted.pl",
20
- "BlastTab.catsbj.pl",
21
- "BlastTab.cogCat.rb",
22
- "BlastTab.filter.pl",
23
- "BlastTab.kegg_pep2path_rest.pl",
24
- "BlastTab.pairedHits.rb",
25
- "BlastTab.subsample.pl",
26
- "BlastTab.taxid2taxrank.pl",
27
- "BlastTab.topHits_sorted.rb",
28
- "sam.filter.rb"
29
- ],
30
- "Execution": [
31
- "aai.rb",
32
- "ani.rb",
33
- "anir.rb",
34
- "HMM.haai.rb",
35
- "rbm.rb"
36
- ]
37
- },
38
- "Sequence analyses": {
39
- "Statistics": [
40
- "FastA.gc.pl",
41
- "FastA.length.pl",
42
- "FastA.N50.pl",
43
- "FastA.qlen.pl",
44
- "FastQ.test-error.rb"
45
- ],
46
- "Manipulation": [
47
- "FastA.extract.rb",
48
- "FastA.filter.pl",
49
- "FastA.filterLen.pl",
50
- "FastA.filterN.pl",
51
- "FastA.fragment.rb",
52
- "FastA.interpose.pl",
53
- "FastA.mask.rb",
54
- "FastA.per_file.pl",
55
- "FastA.rename.pl",
56
- "FastA.revcom.pl",
57
- "FastA.sample.rb",
58
- "FastA.slider.pl",
59
- "FastA.split.pl",
60
- "FastA.split.rb",
61
- "FastA.subsample.pl",
62
- "FastA.tag.rb",
63
- "FastA.toFastQ.rb",
64
- "FastA.wrap.rb",
65
- "FastQ.filter.pl",
66
- "FastQ.interpose.pl",
67
- "FastQ.maskQual.rb",
68
- "FastQ.offset.pl",
69
- "FastQ.split.pl",
70
- "FastQ.tag.rb",
71
- "FastQ.toFastA.awk"
72
- ]
73
- },
74
- "Diversity": {
75
- "Community": [
76
- "AlphaDiversity.pl",
77
- "Chao1.pl",
78
- "Table.barplot.R",
79
- "Table.prefScore.R"
80
- ],
81
- "Population": [
82
- "VCF.SNPs.rb",
83
- "VCF.KaKs.rb",
84
- "Table.prefScore.R"
85
- ]
86
- },
87
- "Annotation": {
88
- "Database mapping": [
89
- "BlastTab.kegg_pep2path_rest.pl",
90
- "BlastTab.taxid2taxrank.pl",
91
- "EBIseq2tax.rb",
92
- "NCBIacc2tax.rb",
93
- "gi2tax.rb",
94
- "M5nr.getSequences.rb",
95
- "RefSeq.download.bash",
96
- "SRA.download.bash"
97
- ],
98
- "Tables": [
99
- "Table.barplot.R",
100
- "GenBank.add_fields.rb",
101
- "MyTaxa.fragsByTax.pl",
102
- "Table.df2dist.R",
103
- "Table.filter.pl",
104
- "Table.merge.pl",
105
- "Table.replace.rb",
106
- "Table.round.rb",
107
- "Table.split.pl"
108
- ],
109
- "Search": [
110
- "HMM.essential.rb",
111
- "HMM.haai.rb",
112
- "HMMsearch.extractIds.rb",
113
- "ogs.annotate.rb",
114
- "ogs.core-pan.rb",
115
- "ogs.extract.rb",
116
- "ogs.mcl.rb",
117
- "ogs.stats.rb",
118
- "ogs.rb"
119
- ]
120
- },
121
- "Other data": {
122
- "Phylogenetic and other distances": [
123
- "CharTable.classify.rb",
124
- "JPlace.distances.rb",
125
- "JPlace.to_iToL.rb",
126
- "Newick.autoprune.R",
127
- "TRIBS.test.R",
128
- "TRIBS.plot-test.R",
129
- "Table.df2dist.R"
130
- ],
131
- "Taxonomic": [
132
- "CharTable.classify.rb",
133
- "EBIseq2tax.rb",
134
- "NCBIacc2tax.rb",
135
- "Table.barplot.R",
136
- "gi2tax.rb",
137
- "MyTaxa.fragsByTax.pl",
138
- "MyTaxa.seq-taxrank.rb",
139
- "Taxonomy.silva2ncbi.rb"
140
- ],
141
- "Alignments": [
142
- "AAsubs.log2ratio.rb",
143
- "Aln.cat.rb",
144
- "Aln.convert.pl",
145
- "BlastPairwise.AAsubs.pl"
146
- ],
147
- "Clustering": [
148
- "ogs.mcl.rb",
149
- "clust.rand.rb"
150
- ],
151
- "Read recruitments": [
152
- "anir.rb",
153
- "BedGraph.tad.rb",
154
- "BedGraph.window.rb",
155
- "BlastTab.catsbj.pl",
156
- "BlastTab.pairedHits.rb",
157
- "BlastTab.recplot2.R",
158
- "FastQ.test-error.rb",
159
- "GFF.catsbj.pl",
160
- "RecPlot2.compareIdentities.R",
161
- "sam.filter.rb"
162
- ]
163
- }
164
- }
165
- }