miga-base 0.7.23.0 → 0.7.25.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (320) hide show
  1. checksums.yaml +4 -4
  2. data/Gemfile +3 -0
  3. data/Rakefile +1 -0
  4. data/lib/miga/cli/action/add.rb +10 -8
  5. data/lib/miga/cli/action/classify_wf.rb +12 -11
  6. data/lib/miga/cli/action/derep_wf.rb +3 -9
  7. data/lib/miga/cli/action/edit.rb +0 -1
  8. data/lib/miga/cli/action/find.rb +1 -1
  9. data/lib/miga/cli/action/generic.rb +1 -1
  10. data/lib/miga/cli/action/get.rb +7 -2
  11. data/lib/miga/cli/action/index_wf.rb +4 -2
  12. data/lib/miga/cli/action/init.rb +60 -59
  13. data/lib/miga/cli/action/init/files_helper.rb +2 -1
  14. data/lib/miga/cli/action/ncbi_get.rb +1 -1
  15. data/lib/miga/cli/action/new.rb +15 -9
  16. data/lib/miga/cli/action/option.rb +63 -0
  17. data/lib/miga/cli/action/preproc_wf.rb +7 -5
  18. data/lib/miga/cli/action/quality_wf.rb +3 -3
  19. data/lib/miga/cli/action/tax_dist.rb +1 -1
  20. data/lib/miga/cli/action/tax_test.rb +1 -1
  21. data/lib/miga/cli/action/wf.rb +72 -54
  22. data/lib/miga/cli/base.rb +17 -5
  23. data/lib/miga/cli/objects_helper.rb +23 -18
  24. data/lib/miga/common.rb +1 -1
  25. data/lib/miga/common/with_option.rb +83 -0
  26. data/lib/miga/common/with_result.rb +2 -1
  27. data/lib/miga/dataset/base.rb +20 -2
  28. data/lib/miga/dataset/result.rb +3 -2
  29. data/lib/miga/metadata.rb +25 -13
  30. data/lib/miga/project/base.rb +82 -2
  31. data/lib/miga/project/result.rb +4 -4
  32. data/lib/miga/result.rb +18 -15
  33. data/lib/miga/result/stats.rb +2 -2
  34. data/lib/miga/version.rb +2 -2
  35. data/scripts/essential_genes.bash +18 -3
  36. data/scripts/miga.bash +8 -2
  37. data/scripts/ogs.bash +2 -3
  38. data/test/dataset_test.rb +5 -5
  39. data/test/lair_test.rb +1 -2
  40. data/test/result_test.rb +22 -0
  41. data/test/with_option_test.rb +115 -0
  42. data/utils/cleanup-databases.rb +1 -2
  43. data/utils/distance/base.rb +9 -0
  44. data/utils/distance/commands.rb +183 -81
  45. data/utils/distance/database.rb +69 -10
  46. data/utils/distance/pipeline.rb +15 -21
  47. data/utils/distance/runner.rb +28 -49
  48. data/utils/distance/temporal.rb +4 -2
  49. data/utils/distances.rb +2 -2
  50. data/utils/index_metadata.rb +1 -2
  51. data/utils/requirements.txt +1 -1
  52. data/utils/subclade/runner.rb +9 -10
  53. metadata +9 -273
  54. data/utils/enveomics/Docs/recplot2.md +0 -244
  55. data/utils/enveomics/Examples/aai-matrix.bash +0 -66
  56. data/utils/enveomics/Examples/ani-matrix.bash +0 -66
  57. data/utils/enveomics/Examples/essential-phylogeny.bash +0 -105
  58. data/utils/enveomics/Examples/unus-genome-phylogeny.bash +0 -100
  59. data/utils/enveomics/LICENSE.txt +0 -73
  60. data/utils/enveomics/Makefile +0 -52
  61. data/utils/enveomics/Manifest/Tasks/aasubs.json +0 -103
  62. data/utils/enveomics/Manifest/Tasks/blasttab.json +0 -786
  63. data/utils/enveomics/Manifest/Tasks/distances.json +0 -161
  64. data/utils/enveomics/Manifest/Tasks/fasta.json +0 -766
  65. data/utils/enveomics/Manifest/Tasks/fastq.json +0 -243
  66. data/utils/enveomics/Manifest/Tasks/graphics.json +0 -126
  67. data/utils/enveomics/Manifest/Tasks/mapping.json +0 -67
  68. data/utils/enveomics/Manifest/Tasks/ogs.json +0 -382
  69. data/utils/enveomics/Manifest/Tasks/other.json +0 -829
  70. data/utils/enveomics/Manifest/Tasks/remote.json +0 -355
  71. data/utils/enveomics/Manifest/Tasks/sequence-identity.json +0 -501
  72. data/utils/enveomics/Manifest/Tasks/tables.json +0 -308
  73. data/utils/enveomics/Manifest/Tasks/trees.json +0 -68
  74. data/utils/enveomics/Manifest/Tasks/variants.json +0 -111
  75. data/utils/enveomics/Manifest/categories.json +0 -156
  76. data/utils/enveomics/Manifest/examples.json +0 -154
  77. data/utils/enveomics/Manifest/tasks.json +0 -4
  78. data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +0 -69
  79. data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +0 -1
  80. data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +0 -1
  81. data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +0 -1
  82. data/utils/enveomics/Pipelines/assembly.pbs/README.md +0 -189
  83. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +0 -112
  84. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +0 -23
  85. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +0 -44
  86. data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +0 -50
  87. data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +0 -37
  88. data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +0 -68
  89. data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +0 -49
  90. data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +0 -80
  91. data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +0 -57
  92. data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +0 -63
  93. data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +0 -38
  94. data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +0 -73
  95. data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +0 -21
  96. data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +0 -72
  97. data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +0 -98
  98. data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +0 -1
  99. data/utils/enveomics/Pipelines/blast.pbs/README.md +0 -127
  100. data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +0 -109
  101. data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +0 -128
  102. data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +0 -16
  103. data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +0 -22
  104. data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +0 -26
  105. data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +0 -89
  106. data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +0 -29
  107. data/utils/enveomics/Pipelines/idba.pbs/README.md +0 -49
  108. data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +0 -95
  109. data/utils/enveomics/Pipelines/idba.pbs/run.pbs +0 -56
  110. data/utils/enveomics/Pipelines/trim.pbs/README.md +0 -54
  111. data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +0 -70
  112. data/utils/enveomics/Pipelines/trim.pbs/run.pbs +0 -130
  113. data/utils/enveomics/README.md +0 -42
  114. data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +0 -171
  115. data/utils/enveomics/Scripts/Aln.cat.rb +0 -163
  116. data/utils/enveomics/Scripts/Aln.convert.pl +0 -35
  117. data/utils/enveomics/Scripts/AlphaDiversity.pl +0 -152
  118. data/utils/enveomics/Scripts/BedGraph.tad.rb +0 -93
  119. data/utils/enveomics/Scripts/BedGraph.window.rb +0 -71
  120. data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +0 -102
  121. data/utils/enveomics/Scripts/BlastTab.addlen.rb +0 -63
  122. data/utils/enveomics/Scripts/BlastTab.advance.bash +0 -48
  123. data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +0 -55
  124. data/utils/enveomics/Scripts/BlastTab.catsbj.pl +0 -104
  125. data/utils/enveomics/Scripts/BlastTab.cogCat.rb +0 -76
  126. data/utils/enveomics/Scripts/BlastTab.filter.pl +0 -47
  127. data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +0 -194
  128. data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +0 -104
  129. data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +0 -157
  130. data/utils/enveomics/Scripts/BlastTab.recplot2.R +0 -48
  131. data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +0 -86
  132. data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +0 -119
  133. data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +0 -86
  134. data/utils/enveomics/Scripts/BlastTab.subsample.pl +0 -47
  135. data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +0 -114
  136. data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +0 -90
  137. data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +0 -101
  138. data/utils/enveomics/Scripts/Chao1.pl +0 -97
  139. data/utils/enveomics/Scripts/CharTable.classify.rb +0 -234
  140. data/utils/enveomics/Scripts/EBIseq2tax.rb +0 -83
  141. data/utils/enveomics/Scripts/FastA.N50.pl +0 -56
  142. data/utils/enveomics/Scripts/FastA.extract.rb +0 -152
  143. data/utils/enveomics/Scripts/FastA.filter.pl +0 -52
  144. data/utils/enveomics/Scripts/FastA.filterLen.pl +0 -28
  145. data/utils/enveomics/Scripts/FastA.filterN.pl +0 -60
  146. data/utils/enveomics/Scripts/FastA.fragment.rb +0 -92
  147. data/utils/enveomics/Scripts/FastA.gc.pl +0 -42
  148. data/utils/enveomics/Scripts/FastA.interpose.pl +0 -93
  149. data/utils/enveomics/Scripts/FastA.length.pl +0 -38
  150. data/utils/enveomics/Scripts/FastA.mask.rb +0 -89
  151. data/utils/enveomics/Scripts/FastA.per_file.pl +0 -36
  152. data/utils/enveomics/Scripts/FastA.qlen.pl +0 -57
  153. data/utils/enveomics/Scripts/FastA.rename.pl +0 -65
  154. data/utils/enveomics/Scripts/FastA.revcom.pl +0 -23
  155. data/utils/enveomics/Scripts/FastA.sample.rb +0 -83
  156. data/utils/enveomics/Scripts/FastA.slider.pl +0 -85
  157. data/utils/enveomics/Scripts/FastA.split.pl +0 -55
  158. data/utils/enveomics/Scripts/FastA.split.rb +0 -79
  159. data/utils/enveomics/Scripts/FastA.subsample.pl +0 -131
  160. data/utils/enveomics/Scripts/FastA.tag.rb +0 -65
  161. data/utils/enveomics/Scripts/FastA.wrap.rb +0 -48
  162. data/utils/enveomics/Scripts/FastQ.filter.pl +0 -54
  163. data/utils/enveomics/Scripts/FastQ.interpose.pl +0 -90
  164. data/utils/enveomics/Scripts/FastQ.offset.pl +0 -90
  165. data/utils/enveomics/Scripts/FastQ.split.pl +0 -53
  166. data/utils/enveomics/Scripts/FastQ.tag.rb +0 -63
  167. data/utils/enveomics/Scripts/FastQ.test-error.rb +0 -81
  168. data/utils/enveomics/Scripts/FastQ.toFastA.awk +0 -24
  169. data/utils/enveomics/Scripts/GFF.catsbj.pl +0 -127
  170. data/utils/enveomics/Scripts/GenBank.add_fields.rb +0 -84
  171. data/utils/enveomics/Scripts/HMM.essential.rb +0 -351
  172. data/utils/enveomics/Scripts/HMM.haai.rb +0 -168
  173. data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +0 -83
  174. data/utils/enveomics/Scripts/JPlace.distances.rb +0 -88
  175. data/utils/enveomics/Scripts/JPlace.to_iToL.rb +0 -320
  176. data/utils/enveomics/Scripts/M5nr.getSequences.rb +0 -81
  177. data/utils/enveomics/Scripts/MeTaxa.distribution.pl +0 -198
  178. data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +0 -35
  179. data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +0 -49
  180. data/utils/enveomics/Scripts/NCBIacc2tax.rb +0 -92
  181. data/utils/enveomics/Scripts/Newick.autoprune.R +0 -27
  182. data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +0 -228
  183. data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +0 -32
  184. data/utils/enveomics/Scripts/RefSeq.download.bash +0 -48
  185. data/utils/enveomics/Scripts/SRA.download.bash +0 -57
  186. data/utils/enveomics/Scripts/TRIBS.plot-test.R +0 -36
  187. data/utils/enveomics/Scripts/TRIBS.test.R +0 -39
  188. data/utils/enveomics/Scripts/Table.barplot.R +0 -31
  189. data/utils/enveomics/Scripts/Table.df2dist.R +0 -30
  190. data/utils/enveomics/Scripts/Table.filter.pl +0 -61
  191. data/utils/enveomics/Scripts/Table.merge.pl +0 -77
  192. data/utils/enveomics/Scripts/Table.replace.rb +0 -69
  193. data/utils/enveomics/Scripts/Table.round.rb +0 -63
  194. data/utils/enveomics/Scripts/Table.split.pl +0 -57
  195. data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +0 -227
  196. data/utils/enveomics/Scripts/VCF.KaKs.rb +0 -147
  197. data/utils/enveomics/Scripts/VCF.SNPs.rb +0 -88
  198. data/utils/enveomics/Scripts/aai.rb +0 -418
  199. data/utils/enveomics/Scripts/ani.rb +0 -362
  200. data/utils/enveomics/Scripts/clust.rand.rb +0 -102
  201. data/utils/enveomics/Scripts/gi2tax.rb +0 -103
  202. data/utils/enveomics/Scripts/in_silico_GA_GI.pl +0 -96
  203. data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
  204. data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
  205. data/utils/enveomics/Scripts/lib/enveomics.R +0 -1
  206. data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +0 -24
  207. data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +0 -253
  208. data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +0 -182
  209. data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +0 -74
  210. data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +0 -237
  211. data/utils/enveomics/Scripts/lib/enveomics_rb/stat.rb +0 -30
  212. data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +0 -135
  213. data/utils/enveomics/Scripts/ogs.annotate.rb +0 -88
  214. data/utils/enveomics/Scripts/ogs.core-pan.rb +0 -160
  215. data/utils/enveomics/Scripts/ogs.extract.rb +0 -125
  216. data/utils/enveomics/Scripts/ogs.mcl.rb +0 -186
  217. data/utils/enveomics/Scripts/ogs.rb +0 -104
  218. data/utils/enveomics/Scripts/ogs.stats.rb +0 -131
  219. data/utils/enveomics/Scripts/rbm.rb +0 -146
  220. data/utils/enveomics/Tests/Makefile +0 -10
  221. data/utils/enveomics/Tests/Mgen_M2288.faa +0 -3189
  222. data/utils/enveomics/Tests/Mgen_M2288.fna +0 -8282
  223. data/utils/enveomics/Tests/Mgen_M2321.fna +0 -8288
  224. data/utils/enveomics/Tests/Nequ_Kin4M.faa +0 -2970
  225. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
  226. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +0 -7
  227. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +0 -17
  228. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +0 -137
  229. data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +0 -123
  230. data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +0 -200
  231. data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +0 -55
  232. data/utils/enveomics/Tests/alkB.nwk +0 -1
  233. data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +0 -13
  234. data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +0 -17
  235. data/utils/enveomics/Tests/hiv1.faa +0 -59
  236. data/utils/enveomics/Tests/hiv1.fna +0 -134
  237. data/utils/enveomics/Tests/hiv2.faa +0 -70
  238. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +0 -233
  239. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +0 -1
  240. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +0 -233
  241. data/utils/enveomics/Tests/phyla_counts.tsv +0 -10
  242. data/utils/enveomics/Tests/primate_lentivirus.ogs +0 -11
  243. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +0 -9
  244. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +0 -8
  245. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +0 -6
  246. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +0 -9
  247. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +0 -6
  248. data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +0 -6
  249. data/utils/enveomics/build_enveomics_r.bash +0 -45
  250. data/utils/enveomics/enveomics.R/DESCRIPTION +0 -31
  251. data/utils/enveomics/enveomics.R/NAMESPACE +0 -39
  252. data/utils/enveomics/enveomics.R/R/autoprune.R +0 -155
  253. data/utils/enveomics/enveomics.R/R/barplot.R +0 -184
  254. data/utils/enveomics/enveomics.R/R/cliopts.R +0 -135
  255. data/utils/enveomics/enveomics.R/R/df2dist.R +0 -154
  256. data/utils/enveomics/enveomics.R/R/growthcurve.R +0 -331
  257. data/utils/enveomics/enveomics.R/R/recplot.R +0 -354
  258. data/utils/enveomics/enveomics.R/R/recplot2.R +0 -1631
  259. data/utils/enveomics/enveomics.R/R/tribs.R +0 -583
  260. data/utils/enveomics/enveomics.R/R/utils.R +0 -50
  261. data/utils/enveomics/enveomics.R/README.md +0 -80
  262. data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
  263. data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
  264. data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +0 -17
  265. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +0 -17
  266. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +0 -17
  267. data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +0 -25
  268. data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +0 -46
  269. data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +0 -23
  270. data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +0 -47
  271. data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +0 -23
  272. data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +0 -23
  273. data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +0 -32
  274. data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +0 -91
  275. data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +0 -57
  276. data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +0 -24
  277. data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +0 -19
  278. data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +0 -39
  279. data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +0 -38
  280. data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +0 -40
  281. data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +0 -67
  282. data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +0 -37
  283. data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +0 -122
  284. data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +0 -45
  285. data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +0 -24
  286. data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +0 -68
  287. data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +0 -25
  288. data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +0 -21
  289. data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +0 -19
  290. data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +0 -19
  291. data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +0 -41
  292. data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +0 -29
  293. data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +0 -18
  294. data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +0 -40
  295. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +0 -36
  296. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +0 -19
  297. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +0 -19
  298. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +0 -27
  299. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +0 -41
  300. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +0 -17
  301. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +0 -43
  302. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +0 -37
  303. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +0 -74
  304. data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +0 -59
  305. data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +0 -27
  306. data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +0 -32
  307. data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +0 -59
  308. data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +0 -28
  309. data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +0 -27
  310. data/utils/enveomics/enveomics.R/man/growth.curves.Rd +0 -14
  311. data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +0 -13
  312. data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +0 -63
  313. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +0 -38
  314. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +0 -38
  315. data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +0 -111
  316. data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +0 -19
  317. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +0 -19
  318. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +0 -19
  319. data/utils/enveomics/globals.mk +0 -8
  320. data/utils/enveomics/manifest.json +0 -9
data/test/lair_test.rb CHANGED
@@ -75,10 +75,9 @@ class LairTest < Test::Unit::TestCase
75
75
  assert_predicate(d, :active?)
76
76
  end
77
77
 
78
- out = capture_stderr { lair.terminate_daemons }.string
78
+ out = capture_stderr { lair.terminate_daemons ; sleep(2) }.string
79
79
  assert_match(/Probing MiGA::Daemon/, out)
80
80
  assert_match(/Sending termination message/, out)
81
- sleep(2)
82
81
  assert_not_predicate(d, :active?)
83
82
 
84
83
  out = capture_stderr { assert { lair.daemon_loop } }.string
data/test/result_test.rb CHANGED
@@ -38,6 +38,28 @@ class ResultTest < Test::Unit::TestCase
38
38
  assert_instance_of(MiGA::Result, r)
39
39
  end
40
40
 
41
+ def test_unlink
42
+ r = project.add_result(:clade_finding)
43
+ path = r.path
44
+ done = r.path(:done)
45
+ data = r.file_path(:empty)
46
+ assert(File.exist?(path))
47
+ assert(File.exist?(done))
48
+ assert(File.exist?(data))
49
+ r.unlink
50
+ assert(!File.exist?(path))
51
+ assert(!File.exist?(done))
52
+ assert(File.exist?(data))
53
+ end
54
+
55
+ def test_remove
56
+ r = project.add_result(:clade_finding)
57
+ data = r.file_path(:empty)
58
+ assert(File.exist?(data))
59
+ r.remove!
60
+ assert(!File.exist?(data))
61
+ end
62
+
41
63
  def test_result_source
42
64
  r = dataset.add_result(:trimmed_reads)
43
65
  assert_equal(dataset.name, r.source.name)
@@ -0,0 +1,115 @@
1
+ # frozen_string_literal: true
2
+
3
+ require 'test_helper'
4
+ require 'miga/common/with_option'
5
+
6
+ class WithDaemonTest < Test::Unit::TestCase
7
+ include TestHelper
8
+
9
+ class TestWithOption < MiGA::MiGA
10
+ include MiGA::Common::WithOption
11
+
12
+ attr_reader :metadata, :saved
13
+
14
+ def initialize
15
+ @metadata = { range: 0.9 }
16
+ @saved = false
17
+ end
18
+
19
+ def self.OPTIONS
20
+ {
21
+ empty: {},
22
+ float: { type: Float },
23
+ range: { default: 1.0, in: -5.5..5.5, type: Float },
24
+ default: { default: 9, type: Integer },
25
+ token: { type: Integer, tokens: %w[yes no 0] },
26
+ proc: { default: proc { Date.today } },
27
+ bool: { in: [true, false] }
28
+ }
29
+ end
30
+
31
+ def save
32
+ @saved = true
33
+ end
34
+ end
35
+
36
+ def test_with_option
37
+ o = TestWithOption.new
38
+ assert_respond_to(o, :option)
39
+ assert_equal(1, o.metadata.size)
40
+ end
41
+
42
+ def test_option
43
+ o = TestWithOption.new
44
+ assert_equal(9, o.option(:default))
45
+ assert_nil(o.option(:bool))
46
+ assert_raise { o.option(:not_an_option) }
47
+ assert_nil(o.option(:empty))
48
+ end
49
+
50
+ def test_set_bool
51
+ o = TestWithOption.new
52
+ assert_nil(o.option(:bool))
53
+ assert(!o.saved)
54
+ assert_raise { o.set_option(:bool, 'true') }
55
+ assert_nil(o.option(:bool))
56
+ assert(!o.saved)
57
+ assert_equal(true, o.set_option(:bool, 'true', true))
58
+ assert(o.saved)
59
+ assert_equal(false, o.set_option(:bool, false))
60
+ assert_equal(false, o.set_option(:bool, 'false', true))
61
+ assert_nil(o.set_option(:bool, nil))
62
+ end
63
+
64
+ def test_set_empty
65
+ o = TestWithOption.new
66
+ assert_nil(o.option(:empty))
67
+ assert_equal('a', o.set_option(:empty, 'a'))
68
+ assert_equal('1', o.set_option(:empty, '1', true))
69
+ end
70
+
71
+ def test_all_options
72
+ o = TestWithOption.new
73
+ assert(o.all_options.is_a?(Hash))
74
+ assert_include(o.all_options.keys, :bool)
75
+ assert_nil(o.all_options[:bool])
76
+ end
77
+
78
+ def test_option?
79
+ o = TestWithOption.new
80
+ assert(o.option?(:range))
81
+ assert(!o.option?(:not_an_option))
82
+ end
83
+
84
+ def test_option_metadata
85
+ o = TestWithOption.new
86
+ assert_equal(0.9, o.option(:range))
87
+ assert_equal(1.0, o.set_option(:range, nil))
88
+ assert_equal(2.0, o.set_option(:range, 2.0))
89
+ assert_equal(3.0, o.set_option(:range, '3', true))
90
+ end
91
+
92
+ def test_option_range
93
+ o = TestWithOption.new
94
+ assert_raise { o.set_option(:range, 9.0) }
95
+ assert_raise { o.set_option(:range, 3) }
96
+ assert_raise { o.set_option(:range, true) }
97
+ end
98
+
99
+ def test_option_proc
100
+ o = TestWithOption.new
101
+ assert(o.option(:proc).is_a?(Date))
102
+ assert(o.set_option(:proc, 1).is_a?(Integer))
103
+ assert(o.set_option(:proc, nil).is_a?(Date))
104
+ end
105
+
106
+ def test_token
107
+ o = TestWithOption.new
108
+ assert_nil(o.option(:token))
109
+ assert_equal(1, o.set_option(:token, 1))
110
+ assert_equal(-2, o.set_option(:token, '-2', true))
111
+ assert_equal('yes', o.set_option(:token, 'yes'))
112
+ assert_equal('0', o.set_option(:token, '0', true))
113
+ assert_raise { o.set_option(:token, 'maybe') }
114
+ end
115
+ end
@@ -19,7 +19,7 @@ m.say 'Cleaning Databases'
19
19
  next unless (idx % thr) == t
20
20
 
21
21
  d = p.dataset(i)
22
- next unless d.is_ref? and d.is_active?
22
+ next unless d.ref? && d.active?
23
23
 
24
24
  d.cleanup_distances!
25
25
  end
@@ -28,4 +28,3 @@ end
28
28
  Process.waitall
29
29
  m.advance('Dataset:', dsn.size, dsn.size)
30
30
  m.say
31
-
@@ -2,4 +2,13 @@ require 'miga'
2
2
  require 'miga/tax_dist'
3
3
 
4
4
  class MiGA::DistanceRunner
5
+ require_relative 'temporal.rb'
6
+ require_relative 'database.rb'
7
+ require_relative 'commands.rb'
8
+ require_relative 'pipeline.rb'
9
+
10
+ include MiGA::DistanceRunner::Temporal
11
+ include MiGA::DistanceRunner::Database
12
+ include MiGA::DistanceRunner::Commands
13
+ include MiGA::DistanceRunner::Pipeline
5
14
  end
@@ -1,105 +1,207 @@
1
1
  module MiGA::DistanceRunner::Commands
2
- # Estimates or calculates AAI against +target+
3
- def aai(target)
4
- # Check if the request makes sense
5
- return nil if target.nil? || target.result(:essential_genes).nil?
6
-
7
- # Check if it's been calculated
8
- y = stored_value(target, :aai)
9
- return y unless y.nil? || y.zero?
10
-
11
- # Try hAAI (except in clade projects)
12
- unless @ref_project.is_clade?
13
- y = haai(target)
14
- return y unless y.nil? || y.zero?
2
+ ##
3
+ # Estimates AAI against +targets+ using hAAI
4
+ def haai(targets)
5
+ puts "[#{Time.now}] hAAI: #{dataset.name} vs #{targets.size} targets"
6
+ empty_vals = targets.map { |_i| nil }
7
+ return empty_vals if opts[:haai_p] == 'no'
8
+
9
+ # Launch comparisons
10
+ sbj = pending_targets(targets, :haai)
11
+ unless sbj.empty?
12
+ opts[:haai_p] == 'fastaai' ? fastaai_cmd(sbj) : haai_cmd(sbj)
15
13
  end
16
- # Full AAI
17
- aai_cmd(
18
- tmp_file('proteins.fa'), target.result(:cds).file_path(:proteins),
19
- dataset.name, target.name, tmp_dbs[:aai]
20
- ).tap { checkpoint :aai }
14
+
15
+ # Return AAI estimates from the database
16
+ batch_values_from_db(:aai, targets.map { |i| i&.name })
21
17
  end
22
18
 
23
19
  ##
24
- # Estimates AAI against +target+ using hAAI
25
- def haai(target)
26
- return nil if opts[:haai_p] == 'no'
27
-
28
- haai = aai_cmd(tmp_file('ess_genes.fa'),
29
- target.result(:essential_genes).file_path(:ess_genes),
30
- dataset.name, target.name, tmp_dbs[:haai],
31
- aai_save_rbm: 'no-save-rbm', aai_p: opts[:haai_p])
32
- checkpoint :haai
33
- return nil if haai.nil? || haai.zero? || haai > 90.0
34
-
35
- aai = 100.0 - Math.exp(2.435076 + 0.4275193 * Math.log(100.0 - haai))
36
- SQLite3::Database.new(tmp_dbs[:aai]) do |conn|
37
- conn.execute 'insert into aai values(?, ?, ?, 0, 0, 0)',
38
- [dataset.name, target.name, aai]
20
+ # Estimates or calculates AAI against +targets+
21
+ def aai(targets)
22
+ puts "[#{Time.now}] AAI: #{dataset.name} vs #{targets.size} targets"
23
+
24
+ # Try hAAI first
25
+ haai(targets)
26
+
27
+ # Launch comparisons
28
+ pending_targets(targets, :aai).each do |target|
29
+ # Full AAI
30
+ target_cds = target.result(:cds).file_path(:proteins) or next
31
+ aairb_cmd(
32
+ tmp_file('proteins.fa'), target_cds,
33
+ dataset.name, target.name, tmp_dbs[:aai], checkpoint: :aai
34
+ )
39
35
  end
40
- checkpoint :aai
41
- aai
36
+
37
+ # Return AAI from the database
38
+ batch_values_from_db(:aai, targets.map { |i| i&.name })
42
39
  end
43
40
 
44
41
  ##
45
- # Calculates ANI against +target+
46
- def ani(target)
47
- # Check if the request makes sense
48
- t = tmp_file('largecontigs.fa')
49
- r = target.result(:assembly)
50
- return nil if r.nil? || !File.size?(t)
51
-
52
- # Check if it's been calculated
53
- y = stored_value(target, :ani)
54
- return y unless y.nil? || y.zero?
55
-
56
- # Run it
57
- ani_cmd(
58
- t, r.file_path(:largecontigs),
59
- dataset.name, target.name, tmp_dbs[:ani]
60
- ).tap { checkpoint :ani }
42
+ # Calculates ANI against +targets+
43
+ def ani(targets)
44
+ puts "[#{Time.now}] ANI: #{dataset.name} vs #{targets.size} targets"
45
+ empty_vals = targets.map { |_i| nil }
46
+ return empty_vals unless File.size?(tmp_file('largecontigs.fa'))
47
+
48
+ # Launch comparisons
49
+ sbj = pending_targets(targets, :ani)
50
+ unless sbj.empty?
51
+ opts[:ani_p] == 'fastani' ? fastani_cmd(sbj) : anirb_cmd(sbj)
52
+ end
53
+
54
+ # Return ANI from the database
55
+ batch_values_from_db(:ani, targets.map { |i| i&.name })
61
56
  end
62
57
 
63
58
  ##
64
- # Calculates and returns ANI against +target+ if AAI >= +aai_limit+.
65
- # Returns +nil+ otherwise
66
- def ani_after_aai(target, aai_limit = 85.0)
67
- aai = aai(target)
68
- (aai.nil? || aai < aai_limit) ? nil : ani(target)
59
+ # Calculates and returns ANI against +targets+ if AAI >= +aai_limit+.
60
+ # Note that ANI values may be returned for lower (or failing) AAIs if the
61
+ # value is already stored in the database
62
+ def ani_after_aai(targets, aai_limit = 85.0)
63
+ # Run AAI and select targets with AAI ≥ aai_limit
64
+ aai = aai(targets)
65
+ sbj = aai.each_with_index.map { |i, k| targets[k] if i&.> aai_limit }
66
+ sbj.compact!
67
+
68
+ # Run ANI
69
+ ani(sbj) unless sbj.empty?
70
+
71
+ # Return ANI from the database
72
+ batch_values_from_db(:ani, targets.map { |i| i&.name })
69
73
  end
70
74
 
71
75
  ##
72
76
  # Execute an AAI command
73
- def aai_cmd(f1, f2, n1, n2, db, o = {})
77
+ def aairb_cmd(f1, f2, n1, n2, db, o = {})
74
78
  o = opts.merge(o)
75
- v = `aai.rb -1 "#{f1}" -2 "#{f2}" -S "#{db}" \
76
- --name1 "#{n1}" --name2 "#{n2}" \
77
- -t "#{o[:thr]}" -a --lookup-first "--#{o[:aai_save_rbm]}" \
78
- -p "#{o[:aai_p] || 'blast+'}"`.chomp
79
- (v.nil? || v.empty?) ? 0 : v.to_f
79
+ run_cmd <<~CMD
80
+ aai.rb -1 "#{f1}" -2 "#{f2}" -S "#{db}" \
81
+ --name1 "#{n1}" --name2 "#{n2}" \
82
+ -t "#{o[:thr]}" -a --#{'no-' unless o[:aai_save_rbm]}save-rbm \
83
+ -p "#{o[:aai_p]}"
84
+ CMD
85
+ ensure
86
+ checkpoint(o[:checkpoint]) if o[:checkpoint]
80
87
  end
81
88
 
82
89
  ##
83
- # Execute an ANI command
84
- def ani_cmd(f1, f2, n1, n2, db, o = {})
85
- o = opts.merge(o)
86
- v = nil
87
- if o[:ani_p] == 'fastani'
88
- out = `fastANI -r "#{f1}" -q "#{f2}" \
89
- -o /dev/stdout 2>/dev/null`.chomp.split(/\s+/)
90
- unless out.empty?
91
- SQLite3::Database.new(db) do |conn|
92
- conn.execute 'insert into ani values(?, ?, ?, 0, ?, ?)',
93
- [n1, n2, out[2], out[3], out[4]]
94
- end
90
+ # Execute an ani.rb command
91
+ def anirb_cmd(targets)
92
+ f1 = tmp_file('largecontigs.fa')
93
+ return unless File.size?(f1)
94
+
95
+ targets.each do |target|
96
+ target_asm = target&.result(:assembly)&.file_path(:largecontigs) or next
97
+ run_cmd <<~CMD
98
+ ani.rb -1 "#{f1}" -2 "#{target_asm}" -S "#{tmp_dbs[:ani]}" \
99
+ --name1 "#{dataset.name}" --name2 "#{target.name}" \
100
+ -t "#{opts[:thr]}" -a --no-save-regions --no-save-rbm \
101
+ -p "#{opts[:ani_p]}"
102
+ CMD
103
+ checkpoint(:ani)
104
+ end
105
+ end
106
+
107
+ ##
108
+ # Execute a FastANI command
109
+ def fastani_cmd(targets)
110
+ f1 = tmp_file('largecontigs.fa')
111
+ return unless File.size?(f1)
112
+
113
+ # Run FastANI
114
+ File.open(f2 = tmp_file, 'w') do |fh|
115
+ targets.each do |target|
116
+ target_asm = target&.result(:assembly)&.file_path(:largecontigs)
117
+ fh.puts target_asm if target_asm
118
+ end
119
+ end
120
+ run_cmd <<~CMD
121
+ fastANI -q "#{f1}" --rl "#{f2}" -t #{opts[:thr]} \
122
+ -o "#{f3 = tmp_file}"
123
+ CMD
124
+
125
+ # Retrieve resulting data and save to DB
126
+ data = {}
127
+ File.open(f3, 'r') do |fh|
128
+ fh.each do |ln|
129
+ row = ln.chomp.split("\t")
130
+ n2 = File.basename(row[1], '.gz')
131
+ n2 = File.basename(n2, '.LargeContigs.fna')
132
+ data[n2] = [row[2].to_f, 0.0, row[3].to_i, row[4].to_i]
133
+ end
134
+ end
135
+ batch_data_to_db(:ani, data)
136
+
137
+ # Cleanup
138
+ [f2, f3].each { |i| File.unlink(i) }
139
+ end
140
+
141
+ ##
142
+ # Execute a FastAAI command
143
+ def fastaai_cmd(targets)
144
+ qry_idx = dataset.result(:essential_genes).file_path(:fastaai_index)
145
+ return nil unless qry_idx
146
+
147
+ # Run FastAAI
148
+ File.open(f1 = tmp_file, 'w') { |fh| fh.puts qry_idx }
149
+ File.open(f2 = tmp_file, 'w') do |fh|
150
+ targets.each do |target|
151
+ target_idx = target&.result(:essential_genes)&.file_path(:fastaai_index)
152
+ fh.puts target_idx if target_idx
153
+ end
154
+ end
155
+ run_cmd <<~CMD
156
+ FastAAI --qd "#{f1}" --rd "#{f2}" --output "#{f3 = tmp_file}" \
157
+ --threads #{opts[:thr]}
158
+ CMD
159
+
160
+ # Save values in the databases
161
+ haai_data = {}
162
+ aai_data = {}
163
+ File.open(f3, 'r') do |fh|
164
+ fh.each do |ln|
165
+ out = ln.chomp.split("\t")
166
+ haai_data[out[1]] = [
167
+ out[2].to_f * 100, out[3].to_f * 100, out[4].to_i, out[5].to_i
168
+ ]
169
+ aai_data[out[1]] = [out[6].to_f, 0, 0, 0] if out[6] !~ /^>/
95
170
  end
96
- v = out[2]
97
- else
98
- v = `ani.rb -1 "#{f1}" -2 "#{f2}" -S "#{db}" \
99
- --name1 "#{n1}" --name2 "#{n2}" \
100
- -t "#{opts[:thr]}" -a --no-save-regions --no-save-rbm \
101
- --lookup-first -p "#{o[:ani_p] || 'blast+'}"`.chomp
102
171
  end
103
- v.nil? || v.empty? ? 0 : v.to_f
172
+ batch_data_to_db(:haai, haai_data)
173
+ batch_data_to_db(:aai, aai_data)
174
+
175
+ # Cleanup
176
+ [f1, f2, f3].each { |i| File.unlink(i) }
177
+ end
178
+
179
+ ##
180
+ # Execute an hAAI command
181
+ def haai_cmd(targets)
182
+ aai_data = {}
183
+ targets.each do |target|
184
+ target_ess = target&.result(:essential_genes)&.file_path(:ess_genes)
185
+ next unless target_ess
186
+
187
+ # hAAI
188
+ h = aairb_cmd(
189
+ tmp_file('ess_genes.fa'), target_ess,
190
+ dataset.name, target.name, tmp_dbs[:haai],
191
+ aai_save_rbm: false, aai_p: opts[:haai_p], checkpoint: :haai
192
+ )&.chomp&.to_f
193
+ next if h.nil? || h.zero? || h > 90.0
194
+
195
+ # Estimated AAI
196
+ aai_data[target.name] = [
197
+ 100.0 - Math.exp(2.435076 + 0.4275193 * Math.log(100.0 - h)), 0, 0, 0
198
+ ] unless h&.zero? || h > 90.0
199
+ end
200
+ batch_data_to_db(:aai, aai_data)
201
+ end
202
+
203
+ def run_cmd(cmd)
204
+ puts "CMD: #{cmd}"
205
+ `#{cmd}`
104
206
  end
105
207
  end