miga-base 1.2.15.2 → 1.2.15.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (306) hide show
  1. checksums.yaml +4 -4
  2. data/lib/miga/cli/action/download/gtdb.rb +4 -1
  3. data/lib/miga/cli/action/gtdb_get.rb +4 -0
  4. data/lib/miga/daemon.rb +4 -1
  5. data/lib/miga/lair.rb +6 -4
  6. data/lib/miga/remote_dataset/download.rb +3 -2
  7. data/lib/miga/remote_dataset.rb +25 -7
  8. data/lib/miga/taxonomy.rb +6 -0
  9. data/lib/miga/version.rb +2 -2
  10. metadata +6 -302
  11. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Archaea_SCG.hmm +0 -41964
  12. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Bacteria_SCG.hmm +0 -32439
  13. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Complete_SCG_DB.hmm +0 -62056
  14. data/utils/FastAAI/FastAAI +0 -3659
  15. data/utils/FastAAI/FastAAI-legacy/FastAAI +0 -1336
  16. data/utils/FastAAI/FastAAI-legacy/kAAI_v1.0_virus.py +0 -1296
  17. data/utils/FastAAI/README.md +0 -84
  18. data/utils/enveomics/Docs/recplot2.md +0 -244
  19. data/utils/enveomics/Examples/aai-matrix.bash +0 -66
  20. data/utils/enveomics/Examples/ani-matrix.bash +0 -66
  21. data/utils/enveomics/Examples/essential-phylogeny.bash +0 -105
  22. data/utils/enveomics/Examples/unus-genome-phylogeny.bash +0 -100
  23. data/utils/enveomics/LICENSE.txt +0 -73
  24. data/utils/enveomics/Makefile +0 -52
  25. data/utils/enveomics/Manifest/Tasks/aasubs.json +0 -103
  26. data/utils/enveomics/Manifest/Tasks/blasttab.json +0 -790
  27. data/utils/enveomics/Manifest/Tasks/distances.json +0 -161
  28. data/utils/enveomics/Manifest/Tasks/fasta.json +0 -802
  29. data/utils/enveomics/Manifest/Tasks/fastq.json +0 -291
  30. data/utils/enveomics/Manifest/Tasks/graphics.json +0 -126
  31. data/utils/enveomics/Manifest/Tasks/mapping.json +0 -137
  32. data/utils/enveomics/Manifest/Tasks/ogs.json +0 -382
  33. data/utils/enveomics/Manifest/Tasks/other.json +0 -906
  34. data/utils/enveomics/Manifest/Tasks/remote.json +0 -355
  35. data/utils/enveomics/Manifest/Tasks/sequence-identity.json +0 -650
  36. data/utils/enveomics/Manifest/Tasks/tables.json +0 -308
  37. data/utils/enveomics/Manifest/Tasks/trees.json +0 -68
  38. data/utils/enveomics/Manifest/Tasks/variants.json +0 -111
  39. data/utils/enveomics/Manifest/categories.json +0 -165
  40. data/utils/enveomics/Manifest/examples.json +0 -162
  41. data/utils/enveomics/Manifest/tasks.json +0 -4
  42. data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +0 -69
  43. data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +0 -1
  44. data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +0 -1
  45. data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +0 -1
  46. data/utils/enveomics/Pipelines/assembly.pbs/README.md +0 -189
  47. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +0 -112
  48. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +0 -23
  49. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +0 -44
  50. data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +0 -50
  51. data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +0 -37
  52. data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +0 -68
  53. data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +0 -49
  54. data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +0 -80
  55. data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +0 -57
  56. data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +0 -63
  57. data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +0 -38
  58. data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +0 -73
  59. data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +0 -21
  60. data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +0 -72
  61. data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +0 -98
  62. data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +0 -1
  63. data/utils/enveomics/Pipelines/blast.pbs/README.md +0 -127
  64. data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +0 -109
  65. data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +0 -128
  66. data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +0 -16
  67. data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +0 -22
  68. data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +0 -26
  69. data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +0 -89
  70. data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +0 -29
  71. data/utils/enveomics/Pipelines/idba.pbs/README.md +0 -49
  72. data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +0 -95
  73. data/utils/enveomics/Pipelines/idba.pbs/run.pbs +0 -56
  74. data/utils/enveomics/Pipelines/trim.pbs/README.md +0 -54
  75. data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +0 -70
  76. data/utils/enveomics/Pipelines/trim.pbs/run.pbs +0 -130
  77. data/utils/enveomics/README.md +0 -42
  78. data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +0 -171
  79. data/utils/enveomics/Scripts/Aln.cat.rb +0 -221
  80. data/utils/enveomics/Scripts/Aln.convert.pl +0 -35
  81. data/utils/enveomics/Scripts/AlphaDiversity.pl +0 -152
  82. data/utils/enveomics/Scripts/BedGraph.tad.rb +0 -93
  83. data/utils/enveomics/Scripts/BedGraph.window.rb +0 -71
  84. data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +0 -102
  85. data/utils/enveomics/Scripts/BlastTab.addlen.rb +0 -63
  86. data/utils/enveomics/Scripts/BlastTab.advance.bash +0 -48
  87. data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +0 -55
  88. data/utils/enveomics/Scripts/BlastTab.catsbj.pl +0 -104
  89. data/utils/enveomics/Scripts/BlastTab.cogCat.rb +0 -76
  90. data/utils/enveomics/Scripts/BlastTab.filter.pl +0 -47
  91. data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +0 -194
  92. data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +0 -104
  93. data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +0 -157
  94. data/utils/enveomics/Scripts/BlastTab.recplot2.R +0 -48
  95. data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +0 -86
  96. data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +0 -119
  97. data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +0 -86
  98. data/utils/enveomics/Scripts/BlastTab.subsample.pl +0 -47
  99. data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +0 -114
  100. data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +0 -90
  101. data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +0 -123
  102. data/utils/enveomics/Scripts/Chao1.pl +0 -97
  103. data/utils/enveomics/Scripts/CharTable.classify.rb +0 -234
  104. data/utils/enveomics/Scripts/EBIseq2tax.rb +0 -83
  105. data/utils/enveomics/Scripts/FastA.N50.pl +0 -60
  106. data/utils/enveomics/Scripts/FastA.extract.rb +0 -152
  107. data/utils/enveomics/Scripts/FastA.filter.pl +0 -52
  108. data/utils/enveomics/Scripts/FastA.filterLen.pl +0 -28
  109. data/utils/enveomics/Scripts/FastA.filterN.pl +0 -60
  110. data/utils/enveomics/Scripts/FastA.fragment.rb +0 -100
  111. data/utils/enveomics/Scripts/FastA.gc.pl +0 -42
  112. data/utils/enveomics/Scripts/FastA.interpose.pl +0 -93
  113. data/utils/enveomics/Scripts/FastA.length.pl +0 -38
  114. data/utils/enveomics/Scripts/FastA.mask.rb +0 -89
  115. data/utils/enveomics/Scripts/FastA.per_file.pl +0 -36
  116. data/utils/enveomics/Scripts/FastA.qlen.pl +0 -57
  117. data/utils/enveomics/Scripts/FastA.rename.pl +0 -65
  118. data/utils/enveomics/Scripts/FastA.revcom.pl +0 -23
  119. data/utils/enveomics/Scripts/FastA.sample.rb +0 -98
  120. data/utils/enveomics/Scripts/FastA.slider.pl +0 -85
  121. data/utils/enveomics/Scripts/FastA.split.pl +0 -55
  122. data/utils/enveomics/Scripts/FastA.split.rb +0 -79
  123. data/utils/enveomics/Scripts/FastA.subsample.pl +0 -131
  124. data/utils/enveomics/Scripts/FastA.tag.rb +0 -65
  125. data/utils/enveomics/Scripts/FastA.toFastQ.rb +0 -69
  126. data/utils/enveomics/Scripts/FastA.wrap.rb +0 -48
  127. data/utils/enveomics/Scripts/FastQ.filter.pl +0 -54
  128. data/utils/enveomics/Scripts/FastQ.interpose.pl +0 -90
  129. data/utils/enveomics/Scripts/FastQ.maskQual.rb +0 -89
  130. data/utils/enveomics/Scripts/FastQ.offset.pl +0 -90
  131. data/utils/enveomics/Scripts/FastQ.split.pl +0 -53
  132. data/utils/enveomics/Scripts/FastQ.tag.rb +0 -70
  133. data/utils/enveomics/Scripts/FastQ.test-error.rb +0 -81
  134. data/utils/enveomics/Scripts/FastQ.toFastA.awk +0 -24
  135. data/utils/enveomics/Scripts/GFF.catsbj.pl +0 -127
  136. data/utils/enveomics/Scripts/GenBank.add_fields.rb +0 -84
  137. data/utils/enveomics/Scripts/HMM.essential.rb +0 -351
  138. data/utils/enveomics/Scripts/HMM.haai.rb +0 -168
  139. data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +0 -83
  140. data/utils/enveomics/Scripts/JPlace.distances.rb +0 -88
  141. data/utils/enveomics/Scripts/JPlace.to_iToL.rb +0 -320
  142. data/utils/enveomics/Scripts/M5nr.getSequences.rb +0 -81
  143. data/utils/enveomics/Scripts/MeTaxa.distribution.pl +0 -198
  144. data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +0 -35
  145. data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +0 -49
  146. data/utils/enveomics/Scripts/NCBIacc2tax.rb +0 -92
  147. data/utils/enveomics/Scripts/Newick.autoprune.R +0 -27
  148. data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +0 -228
  149. data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +0 -32
  150. data/utils/enveomics/Scripts/RefSeq.download.bash +0 -48
  151. data/utils/enveomics/Scripts/SRA.download.bash +0 -55
  152. data/utils/enveomics/Scripts/TRIBS.plot-test.R +0 -36
  153. data/utils/enveomics/Scripts/TRIBS.test.R +0 -39
  154. data/utils/enveomics/Scripts/Table.barplot.R +0 -31
  155. data/utils/enveomics/Scripts/Table.df2dist.R +0 -30
  156. data/utils/enveomics/Scripts/Table.filter.pl +0 -61
  157. data/utils/enveomics/Scripts/Table.merge.pl +0 -77
  158. data/utils/enveomics/Scripts/Table.prefScore.R +0 -60
  159. data/utils/enveomics/Scripts/Table.replace.rb +0 -69
  160. data/utils/enveomics/Scripts/Table.round.rb +0 -63
  161. data/utils/enveomics/Scripts/Table.split.pl +0 -57
  162. data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +0 -227
  163. data/utils/enveomics/Scripts/VCF.KaKs.rb +0 -147
  164. data/utils/enveomics/Scripts/VCF.SNPs.rb +0 -88
  165. data/utils/enveomics/Scripts/aai.rb +0 -421
  166. data/utils/enveomics/Scripts/ani.rb +0 -362
  167. data/utils/enveomics/Scripts/anir.rb +0 -137
  168. data/utils/enveomics/Scripts/clust.rand.rb +0 -102
  169. data/utils/enveomics/Scripts/gi2tax.rb +0 -103
  170. data/utils/enveomics/Scripts/in_silico_GA_GI.pl +0 -96
  171. data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
  172. data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
  173. data/utils/enveomics/Scripts/lib/enveomics.R +0 -1
  174. data/utils/enveomics/Scripts/lib/enveomics_rb/anir.rb +0 -293
  175. data/utils/enveomics/Scripts/lib/enveomics_rb/bm_set.rb +0 -175
  176. data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +0 -24
  177. data/utils/enveomics/Scripts/lib/enveomics_rb/errors.rb +0 -17
  178. data/utils/enveomics/Scripts/lib/enveomics_rb/gmm_em.rb +0 -30
  179. data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +0 -253
  180. data/utils/enveomics/Scripts/lib/enveomics_rb/match.rb +0 -88
  181. data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +0 -182
  182. data/utils/enveomics/Scripts/lib/enveomics_rb/rbm.rb +0 -49
  183. data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +0 -74
  184. data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +0 -237
  185. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/rand.rb +0 -31
  186. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/sample.rb +0 -152
  187. data/utils/enveomics/Scripts/lib/enveomics_rb/stats.rb +0 -3
  188. data/utils/enveomics/Scripts/lib/enveomics_rb/utils.rb +0 -74
  189. data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +0 -135
  190. data/utils/enveomics/Scripts/ogs.annotate.rb +0 -88
  191. data/utils/enveomics/Scripts/ogs.core-pan.rb +0 -160
  192. data/utils/enveomics/Scripts/ogs.extract.rb +0 -125
  193. data/utils/enveomics/Scripts/ogs.mcl.rb +0 -186
  194. data/utils/enveomics/Scripts/ogs.rb +0 -104
  195. data/utils/enveomics/Scripts/ogs.stats.rb +0 -131
  196. data/utils/enveomics/Scripts/rbm-legacy.rb +0 -172
  197. data/utils/enveomics/Scripts/rbm.rb +0 -108
  198. data/utils/enveomics/Scripts/sam.filter.rb +0 -148
  199. data/utils/enveomics/Tests/Makefile +0 -10
  200. data/utils/enveomics/Tests/Mgen_M2288.faa +0 -3189
  201. data/utils/enveomics/Tests/Mgen_M2288.fna +0 -8282
  202. data/utils/enveomics/Tests/Mgen_M2321.fna +0 -8288
  203. data/utils/enveomics/Tests/Nequ_Kin4M.faa +0 -2970
  204. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
  205. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +0 -7
  206. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +0 -17
  207. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +0 -137
  208. data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +0 -123
  209. data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +0 -200
  210. data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +0 -55
  211. data/utils/enveomics/Tests/alkB.nwk +0 -1
  212. data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +0 -13
  213. data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +0 -17
  214. data/utils/enveomics/Tests/hiv1.faa +0 -59
  215. data/utils/enveomics/Tests/hiv1.fna +0 -134
  216. data/utils/enveomics/Tests/hiv2.faa +0 -70
  217. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +0 -233
  218. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +0 -1
  219. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +0 -233
  220. data/utils/enveomics/Tests/phyla_counts.tsv +0 -10
  221. data/utils/enveomics/Tests/primate_lentivirus.ogs +0 -11
  222. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +0 -9
  223. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +0 -8
  224. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +0 -6
  225. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +0 -9
  226. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +0 -6
  227. data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +0 -6
  228. data/utils/enveomics/build_enveomics_r.bash +0 -45
  229. data/utils/enveomics/enveomics.R/DESCRIPTION +0 -31
  230. data/utils/enveomics/enveomics.R/NAMESPACE +0 -39
  231. data/utils/enveomics/enveomics.R/R/autoprune.R +0 -155
  232. data/utils/enveomics/enveomics.R/R/barplot.R +0 -184
  233. data/utils/enveomics/enveomics.R/R/cliopts.R +0 -135
  234. data/utils/enveomics/enveomics.R/R/df2dist.R +0 -154
  235. data/utils/enveomics/enveomics.R/R/growthcurve.R +0 -331
  236. data/utils/enveomics/enveomics.R/R/prefscore.R +0 -79
  237. data/utils/enveomics/enveomics.R/R/recplot.R +0 -354
  238. data/utils/enveomics/enveomics.R/R/recplot2.R +0 -1631
  239. data/utils/enveomics/enveomics.R/R/tribs.R +0 -583
  240. data/utils/enveomics/enveomics.R/R/utils.R +0 -80
  241. data/utils/enveomics/enveomics.R/README.md +0 -81
  242. data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
  243. data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
  244. data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +0 -16
  245. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +0 -16
  246. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +0 -16
  247. data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +0 -25
  248. data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +0 -46
  249. data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +0 -23
  250. data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +0 -47
  251. data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +0 -23
  252. data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +0 -23
  253. data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +0 -40
  254. data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +0 -103
  255. data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +0 -67
  256. data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +0 -24
  257. data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +0 -19
  258. data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +0 -45
  259. data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +0 -44
  260. data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +0 -47
  261. data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +0 -75
  262. data/utils/enveomics/enveomics.R/man/enve.prefscore.Rd +0 -50
  263. data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +0 -44
  264. data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +0 -139
  265. data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +0 -45
  266. data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +0 -24
  267. data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +0 -77
  268. data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +0 -25
  269. data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +0 -21
  270. data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +0 -19
  271. data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +0 -19
  272. data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +0 -47
  273. data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +0 -29
  274. data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +0 -18
  275. data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +0 -45
  276. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +0 -36
  277. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +0 -19
  278. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +0 -19
  279. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +0 -27
  280. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +0 -52
  281. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +0 -17
  282. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +0 -51
  283. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +0 -43
  284. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +0 -82
  285. data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +0 -59
  286. data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +0 -27
  287. data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +0 -36
  288. data/utils/enveomics/enveomics.R/man/enve.selvector.Rd +0 -23
  289. data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +0 -68
  290. data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +0 -28
  291. data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +0 -27
  292. data/utils/enveomics/enveomics.R/man/growth.curves.Rd +0 -14
  293. data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +0 -13
  294. data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +0 -78
  295. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +0 -46
  296. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +0 -45
  297. data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +0 -125
  298. data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +0 -19
  299. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +0 -19
  300. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +0 -19
  301. data/utils/enveomics/globals.mk +0 -8
  302. data/utils/enveomics/manifest.json +0 -9
  303. data/utils/multitrim/Multitrim How-To.pdf +0 -0
  304. data/utils/multitrim/README.md +0 -67
  305. data/utils/multitrim/multitrim.py +0 -1555
  306. data/utils/multitrim/multitrim.yml +0 -13
@@ -1,308 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "Table.df2dist.R",
5
- "description": ["Transform a tab-delimited list of distances into a",
6
- "squared matrix."],
7
- "help_arg": "--help",
8
- "requires": [ { "r_package": "optparse" } ],
9
- "options": [
10
- {
11
- "name": "Input list",
12
- "opt": "--x",
13
- "arg": "in_file",
14
- "mandatory": true,
15
- "description": "A tab-delimited table with the distances."
16
- },
17
- {
18
- "opt": "--obj1-index",
19
- "arg": "integer",
20
- "default": 1,
21
- "description": ["Index of the column containing the ID of the object",
22
- "1."]
23
- },
24
- {
25
- "opt": "--obj2-index",
26
- "arg": "integer",
27
- "default": 2,
28
- "description": ["Index of the column containing the ID of the object",
29
- "2."]
30
- },
31
- {
32
- "opt": "--dist-index",
33
- "arg": "integer",
34
- "default": 3,
35
- "description": "Index of the column containing the distance."
36
- },
37
- {
38
- "opt": "--default-d",
39
- "arg": "integer",
40
- "description": "Default value for missing values. NA if empty."
41
- },
42
- {
43
- "opt": "--max-sim",
44
- "arg": "float",
45
- "description": ["If not-empty, assumes that the values are",
46
- "similarity (not distance) and this is the maximum similarity",
47
- "(corresponding to distance 0). Applies transformation:",
48
- "distance = (max.sim - values)/max.sim."]
49
- },
50
- {
51
- "arg": "out_file",
52
- "mandatory": true,
53
- "description": "Output squared matrix in tab-separated values format."
54
- }
55
- ]
56
- },
57
- {
58
- "task": "Table.filter.pl",
59
- "description": ["Extracts (and re-orders) a subset of rows from a raw",
60
- "table."],
61
- "help_arg": "",
62
- "options": [
63
- {
64
- "name": "Key",
65
- "opt": "-k",
66
- "arg": "integer",
67
- "default": 1,
68
- "description": "Column of the table to use as key to filter."
69
- },
70
- {
71
- "name": "Sep",
72
- "opt": "-s",
73
- "arg": "string",
74
- "description": ["String to use as separation between rows. By",
75
- "default, tabulation."]
76
- },
77
- {
78
- "name": "Inverse",
79
- "opt": "-i",
80
- "description": ["If set, reports the inverse of the list (i.e.,",
81
- "reports only rows absent in the list). Implies 'No re-order'."]
82
- },
83
- {
84
- "name": "Header",
85
- "opt": "-h",
86
- "description": "Keep first row of the table (header) untouched."
87
- },
88
- {
89
- "name": "No re-order",
90
- "opt": "-n",
91
- "description": ["The output has the same order of the table. By",
92
- "default, it prints in the order of the list."]
93
- },
94
- {
95
- "name": "List",
96
- "arg": "in_file",
97
- "mandatory": true,
98
- "description": "List of IDs to extract."
99
- },
100
- {
101
- "name": "Table",
102
- "arg": "in_file",
103
- "mandatory": true,
104
- "description": "Table file containing the superset."
105
- },
106
- ">",
107
- {
108
- "name": "Subset",
109
- "arg": "out_file",
110
- "mandatory": true,
111
- "description": "Table file to be created."
112
- }
113
- ]
114
- },
115
- {
116
- "task": "Table.merge.pl",
117
- "description": "Merges multiple (two-column) lists into one table.",
118
- "see_also": ["Table.split.pl"],
119
- "help_arg": "",
120
- "options": [
121
- {
122
- "name": "Strings",
123
- "opt": "-s",
124
- "description": ["Values are read as Strings. By default, values are",
125
- "read as numbers."]
126
- },
127
- {
128
- "name": "Input delimiter",
129
- "opt": "-i",
130
- "arg": "string",
131
- "description": "Input field-delimiter. By default, tabulation."
132
- },
133
- {
134
- "name": "Output delimiter",
135
- "opt": "-o",
136
- "arg": "string",
137
- "description": "Output field-delimiter. By default: tabulation."
138
- },
139
- {
140
- "name": "No header",
141
- "opt": "-n",
142
- "description": ["By default, the header is determined by the file",
143
- "names."]
144
- },
145
- {
146
- "name": "Empty",
147
- "opt": "-e",
148
- "description": ["Default string when no value is found. By default,",
149
- "the 'empty' value is 0 if values are numeric (i.e., unless -s is",
150
- "set) or an empty string otherwise."]
151
- },
152
- {
153
- "name": "Header",
154
- "opt": "-h",
155
- "arg": "string",
156
- "default": "Tag",
157
- "description": "Header of the first column, containing the IDs."
158
- },
159
- {
160
- "name": "Header format",
161
- "opt": "-H",
162
- "arg": "string",
163
- "default": "(?:.*/)?([^\\.]+)",
164
- "description": ["Format of filenames capturing the column header in",
165
- "the first capturing parenthesis. Non-capturing paretheses can be",
166
- "defined as (?:...). By default: '(?:.*/)?([^\\.]+)', which",
167
- "captures the part of the basename of the file before the first",
168
- "dot (if any)."]
169
- },
170
- {
171
- "name": "Rows to ignore",
172
- "opt": "-r",
173
- "arg": "integer",
174
- "default": 0,
175
- "description": "Number of leading rows to ignore in the input files."
176
- },
177
- {
178
- "arg": "in_file",
179
- "mandatory": true,
180
- "multiple_sep": " ",
181
- "description": "Input two-column lists."
182
- },
183
- ">",
184
- {
185
- "arg": "out_file",
186
- "mandatory": true,
187
- "description": "Merged table."
188
- }
189
- ]
190
- },
191
- {
192
- "task": "Table.round.rb",
193
- "description": "Rounds numbers in a table.",
194
- "help_arg": "--help",
195
- "options": [
196
- {
197
- "name": "Input file",
198
- "opt": "--in",
199
- "arg": "in_file",
200
- "mandatory": true,
201
- "description": "Input table."
202
- },
203
- {
204
- "name": "Output file",
205
- "opt": "--out",
206
- "arg": "out_file",
207
- "mandatory": true,
208
- "description": "Output table."
209
- },
210
- {
211
- "name": "Decimals",
212
- "opt": "--ndigits",
213
- "arg": "integer",
214
- "default": 0,
215
- "description": "Number of decimal digits."
216
- },
217
- {
218
- "opt": "--floor",
219
- "description": ["Floors the values instead of rounding them. Ignores",
220
- "'Decimals'."]
221
- },
222
- {
223
- "opt": "--ceil",
224
- "description": ["Ceils the values instead of rounding them. Ignores",
225
- "'Decimals'."]
226
- },
227
- {
228
- "opt": "--delimiter",
229
- "arg": "string",
230
- "description": "String delimiting columns. By default, tabulation."
231
- }
232
- ]
233
- },
234
- {
235
- "task": "Table.split.pl",
236
- "description": ["Split a file with multiple columns into multiple",
237
- "two-columns lists."],
238
- "see_also": ["Table.merge.pl"],
239
- "help_arg": "",
240
- "options": [
241
- {
242
- "name": "Input delimiter",
243
- "opt": "-i",
244
- "arg": "string",
245
- "description": "Input field-delimiter. By default, tabulation."
246
- },
247
- {
248
- "name": "Out prefix",
249
- "opt": "-o",
250
- "arg": "string",
251
- "description": "Prefix of the output files."
252
- },
253
- {
254
- "name": "Output directory",
255
- "opt": "-d",
256
- "arg": "out_dir",
257
- "description": "Output directory."
258
- },
259
- {
260
- "arg": "in_file",
261
- "mandatory": true,
262
- "description": "Input table."
263
- }
264
- ]
265
- },
266
- {
267
- "task": "Table.replace.rb",
268
- "description": "Replace a field in a table using a mapping file.",
269
- "help_arg": "--help",
270
- "options": [
271
- {
272
- "opt": "--map",
273
- "arg": "in_file",
274
- "mandatory": true,
275
- "description": "Mapping file with two columns (key and replacement)."
276
- },
277
- {
278
- "opt": "--in",
279
- "arg": "in_file",
280
- "mandatory": true,
281
- "description": "Input table."
282
- },
283
- {
284
- "opt": "--out",
285
- "arg": "out_file",
286
- "mandatory": true,
287
- "description": "Output table."
288
- },
289
- {
290
- "opt": "--key",
291
- "arg": "integer",
292
- "default": 1,
293
- "description": "Column to replace in Input table."
294
- },
295
- {
296
- "opt": "--unknown",
297
- "arg": "string",
298
- "description": "String to use whenever the key is not found in Map."
299
- },
300
- {
301
- "opt": "--delimiter",
302
- "arg": "string",
303
- "description": "String delimiting columns. By default, tabulation."
304
- }
305
- ]
306
- }
307
- ]
308
- }
@@ -1,68 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "Newick.autoprune.R",
5
- "description": ["Automatically prunes a tree, to keep representatives of",
6
- "each clade."],
7
- "requires": [ { "r_package": "optparse" }, { "r_package": "ape" } ],
8
- "cite": [["Paradis et al, 2004, Bioinf",
9
- "http://dx.doi.org/10.1093/bioinformatics/btg412"]],
10
- "help_arg": "--help",
11
- "options": [
12
- {
13
- "name": "Input tree",
14
- "opt": "--t",
15
- "arg": "in_file",
16
- "mandatory": true,
17
- "description": "A tree to prune in Newick format."
18
- },
19
- {
20
- "opt": "--dist-quantile",
21
- "arg": "float",
22
- "default": 0.25,
23
- "description": "The quantile of edge lengths."
24
- },
25
- {
26
- "opt": "--min_dist",
27
- "arg": "float",
28
- "description": ["The minimum distance to allow between two tips. If",
29
- "not set, dist.quantile is used instead to calculate it."]
30
- },
31
- {
32
- "opt": "--quiet",
33
- "description": ["Boolean indicating if the function must run without",
34
- "output."]
35
- },
36
- {
37
- "opt": "--max_iters",
38
- "arg": "integer",
39
- "default": 1000,
40
- "description": "Maximum number of iterations."
41
- },
42
- {
43
- "opt": "--min_nodes_random",
44
- "arg": "integer",
45
- "default": 40000,
46
- "description": ["Minimum number of nodes to trigger 'tip-pairs'",
47
- "nodes sampling. This sampling is less reproducible and more",
48
- "computationally expensive, but it's the only solution if the",
49
- "cophenetic matrix exceeds 2^31-1 entries; above that, it cannot",
50
- "be represented in R."]
51
- },
52
- {
53
- "opt": "--random_nodes_frx",
54
- "arg": "float",
55
- "default": 1.0,
56
- "description": ["Fraction of the nodes to be sampled if more than",
57
- "'Min nodes random'."]
58
- },
59
- {
60
- "arg": "out_file",
61
- "mandatory": true,
62
- "description": ["Output file in Newick format containing the pruned",
63
- "tree."]
64
- }
65
- ]
66
- }
67
- ]
68
- }
@@ -1,111 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "VCF.SNPs.rb",
5
- "description": ["Counts the number of Single-Nucleotide Polymorphisms",
6
- "(SNPs) in a VCF file."],
7
- "help_arg": "--help",
8
- "options": [
9
- {
10
- "opt": "--input",
11
- "arg": "in_file",
12
- "mandatory": true,
13
- "description": "Input file in Variant Call Format (VCF)."
14
- },
15
- {
16
- "name": "Filtered VCF",
17
- "opt": "--out",
18
- "arg": "out_file",
19
- "description": "Output (filtered) file in Variant Call Format (VCF)."
20
- },
21
- {
22
- "name": "Min DP",
23
- "opt": "--min-dp",
24
- "arg": "integer",
25
- "description": "Minimum number of reads covering the position.",
26
- "default": 4
27
- },
28
- {
29
- "name": "Max DP",
30
- "opt": "--max-dp",
31
- "arg": "integer",
32
- "description": ["Maximum number of reads covering the position. By",
33
- "default no limit."]
34
- },
35
- {
36
- "name": "Min Ref-DP",
37
- "opt": "--min-ref-dp",
38
- "arg": "integer",
39
- "description": "Minimum number of reads supporting the REF allele.",
40
- "default": 2
41
- },
42
- {
43
- "name": "Min Alt-DP",
44
- "opt": "--min-alt-dp",
45
- "arg": "integer",
46
- "description": "Minimum number of reads supporting the ALT allele.",
47
- "default": 2
48
- },
49
- {
50
- "opt": "--min-quality",
51
- "arg": "float",
52
- "description": "Minimum quality of the position mapping.",
53
- "default": 0.0
54
- },
55
- {
56
- "opt": "--min-shannon",
57
- "arg": "integer",
58
- "description": "Minimum information content (in bits, from 0 to 1).",
59
- "default": 0.0
60
- },
61
- {
62
- "opt": "--indels",
63
- "description": "Process indels."
64
- }
65
- ]
66
- },
67
- {
68
- "task": "VCF.KaKs.rb",
69
- "description": ["Estimates the Ka/Ks ratio from the SNPs in a VCF file.",
70
- "Ka and Ks are corrected using pseudo-counts, but no corrections for",
71
- "multiple substitutions are applied."],
72
- "help_arg": "--help",
73
- "see_also": ["VCF.SNPs.rb"],
74
- "options": [
75
- {
76
- "opt": "--input",
77
- "arg": "in_file",
78
- "mandatory": true,
79
- "description": "Input file in Variant Call Format (VCF)."
80
- },
81
- {
82
- "opt": "--seqs",
83
- "arg": "in_file",
84
- "mandatory": true,
85
- "description": "Input gene sequences (nucleotides) in FastA format."
86
- },
87
- {
88
- "name": "Synonymous fraction",
89
- "opt": "--syn-frx",
90
- "arg": "float",
91
- "description": ["Fraction of synonymous substitutions. If passed,",
92
- "the number of sites are estimated (not counted per gene),",
93
- "speeding up the computation ~10X."]
94
- },
95
- {
96
- "name": "Bacterial code synonymous fraction",
97
- "opt": "--syn-bacterial-code",
98
- "description": ["Sets the synonymous fraction to 0.760417,",
99
- "approximately the proportion of synonymous substitutions in the",
100
- "bacterial code."]
101
- },
102
- {
103
- "opt": "--codon-file",
104
- "arg": "out_file",
105
- "description": ["Output file including the codons of substitution",
106
- "variants."]
107
- }
108
- ]
109
- }
110
- ]
111
- }
@@ -1,165 +0,0 @@
1
- {
2
- "categories": {
3
- "Sequence similarity search": {
4
- "Statistics": [
5
- "BedGraph.tad.rb",
6
- "BedGraph.window.rb",
7
- "BlastPairwise.AAsubs.pl",
8
- "BlastTab.advance.bash",
9
- "BlastTab.recplot2.R",
10
- "BlastTab.seqdepth.pl",
11
- "BlastTab.seqdepth_nomedian.pl",
12
- "BlastTab.seqdepth_ZIP.pl",
13
- "BlastTab.sumPerHit.pl",
14
- "FastQ.test-error.rb",
15
- "RecPlot2.compareIdentities.R"
16
- ],
17
- "Manipulation": [
18
- "BlastTab.addlen.rb",
19
- "BlastTab.best_hit_sorted.pl",
20
- "BlastTab.catsbj.pl",
21
- "BlastTab.cogCat.rb",
22
- "BlastTab.filter.pl",
23
- "BlastTab.kegg_pep2path_rest.pl",
24
- "BlastTab.pairedHits.rb",
25
- "BlastTab.subsample.pl",
26
- "BlastTab.taxid2taxrank.pl",
27
- "BlastTab.topHits_sorted.rb",
28
- "sam.filter.rb"
29
- ],
30
- "Execution": [
31
- "aai.rb",
32
- "ani.rb",
33
- "anir.rb",
34
- "HMM.haai.rb",
35
- "rbm.rb"
36
- ]
37
- },
38
- "Sequence analyses": {
39
- "Statistics": [
40
- "FastA.gc.pl",
41
- "FastA.length.pl",
42
- "FastA.N50.pl",
43
- "FastA.qlen.pl",
44
- "FastQ.test-error.rb"
45
- ],
46
- "Manipulation": [
47
- "FastA.extract.rb",
48
- "FastA.filter.pl",
49
- "FastA.filterLen.pl",
50
- "FastA.filterN.pl",
51
- "FastA.fragment.rb",
52
- "FastA.interpose.pl",
53
- "FastA.mask.rb",
54
- "FastA.per_file.pl",
55
- "FastA.rename.pl",
56
- "FastA.revcom.pl",
57
- "FastA.sample.rb",
58
- "FastA.slider.pl",
59
- "FastA.split.pl",
60
- "FastA.split.rb",
61
- "FastA.subsample.pl",
62
- "FastA.tag.rb",
63
- "FastA.toFastQ.rb",
64
- "FastA.wrap.rb",
65
- "FastQ.filter.pl",
66
- "FastQ.interpose.pl",
67
- "FastQ.maskQual.rb",
68
- "FastQ.offset.pl",
69
- "FastQ.split.pl",
70
- "FastQ.tag.rb",
71
- "FastQ.toFastA.awk"
72
- ]
73
- },
74
- "Diversity": {
75
- "Community": [
76
- "AlphaDiversity.pl",
77
- "Chao1.pl",
78
- "Table.barplot.R",
79
- "Table.prefScore.R"
80
- ],
81
- "Population": [
82
- "VCF.SNPs.rb",
83
- "VCF.KaKs.rb",
84
- "Table.prefScore.R"
85
- ]
86
- },
87
- "Annotation": {
88
- "Database mapping": [
89
- "BlastTab.kegg_pep2path_rest.pl",
90
- "BlastTab.taxid2taxrank.pl",
91
- "EBIseq2tax.rb",
92
- "NCBIacc2tax.rb",
93
- "gi2tax.rb",
94
- "M5nr.getSequences.rb",
95
- "RefSeq.download.bash",
96
- "SRA.download.bash"
97
- ],
98
- "Tables": [
99
- "Table.barplot.R",
100
- "GenBank.add_fields.rb",
101
- "MyTaxa.fragsByTax.pl",
102
- "Table.df2dist.R",
103
- "Table.filter.pl",
104
- "Table.merge.pl",
105
- "Table.replace.rb",
106
- "Table.round.rb",
107
- "Table.split.pl"
108
- ],
109
- "Search": [
110
- "HMM.essential.rb",
111
- "HMM.haai.rb",
112
- "HMMsearch.extractIds.rb",
113
- "ogs.annotate.rb",
114
- "ogs.core-pan.rb",
115
- "ogs.extract.rb",
116
- "ogs.mcl.rb",
117
- "ogs.stats.rb",
118
- "ogs.rb"
119
- ]
120
- },
121
- "Other data": {
122
- "Phylogenetic and other distances": [
123
- "CharTable.classify.rb",
124
- "JPlace.distances.rb",
125
- "JPlace.to_iToL.rb",
126
- "Newick.autoprune.R",
127
- "TRIBS.test.R",
128
- "TRIBS.plot-test.R",
129
- "Table.df2dist.R"
130
- ],
131
- "Taxonomic": [
132
- "CharTable.classify.rb",
133
- "EBIseq2tax.rb",
134
- "NCBIacc2tax.rb",
135
- "Table.barplot.R",
136
- "gi2tax.rb",
137
- "MyTaxa.fragsByTax.pl",
138
- "MyTaxa.seq-taxrank.rb",
139
- "Taxonomy.silva2ncbi.rb"
140
- ],
141
- "Alignments": [
142
- "AAsubs.log2ratio.rb",
143
- "Aln.cat.rb",
144
- "Aln.convert.pl",
145
- "BlastPairwise.AAsubs.pl"
146
- ],
147
- "Clustering": [
148
- "ogs.mcl.rb",
149
- "clust.rand.rb"
150
- ],
151
- "Read recruitments": [
152
- "anir.rb",
153
- "BedGraph.tad.rb",
154
- "BedGraph.window.rb",
155
- "BlastTab.catsbj.pl",
156
- "BlastTab.pairedHits.rb",
157
- "BlastTab.recplot2.R",
158
- "FastQ.test-error.rb",
159
- "GFF.catsbj.pl",
160
- "RecPlot2.compareIdentities.R",
161
- "sam.filter.rb"
162
- ]
163
- }
164
- }
165
- }