miga-base 1.2.15.2 → 1.2.15.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (306) hide show
  1. checksums.yaml +4 -4
  2. data/lib/miga/cli/action/download/gtdb.rb +4 -1
  3. data/lib/miga/cli/action/gtdb_get.rb +4 -0
  4. data/lib/miga/daemon.rb +4 -1
  5. data/lib/miga/lair.rb +6 -4
  6. data/lib/miga/remote_dataset/download.rb +3 -2
  7. data/lib/miga/remote_dataset.rb +25 -7
  8. data/lib/miga/taxonomy.rb +6 -0
  9. data/lib/miga/version.rb +2 -2
  10. metadata +6 -302
  11. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Archaea_SCG.hmm +0 -41964
  12. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Bacteria_SCG.hmm +0 -32439
  13. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Complete_SCG_DB.hmm +0 -62056
  14. data/utils/FastAAI/FastAAI +0 -3659
  15. data/utils/FastAAI/FastAAI-legacy/FastAAI +0 -1336
  16. data/utils/FastAAI/FastAAI-legacy/kAAI_v1.0_virus.py +0 -1296
  17. data/utils/FastAAI/README.md +0 -84
  18. data/utils/enveomics/Docs/recplot2.md +0 -244
  19. data/utils/enveomics/Examples/aai-matrix.bash +0 -66
  20. data/utils/enveomics/Examples/ani-matrix.bash +0 -66
  21. data/utils/enveomics/Examples/essential-phylogeny.bash +0 -105
  22. data/utils/enveomics/Examples/unus-genome-phylogeny.bash +0 -100
  23. data/utils/enveomics/LICENSE.txt +0 -73
  24. data/utils/enveomics/Makefile +0 -52
  25. data/utils/enveomics/Manifest/Tasks/aasubs.json +0 -103
  26. data/utils/enveomics/Manifest/Tasks/blasttab.json +0 -790
  27. data/utils/enveomics/Manifest/Tasks/distances.json +0 -161
  28. data/utils/enveomics/Manifest/Tasks/fasta.json +0 -802
  29. data/utils/enveomics/Manifest/Tasks/fastq.json +0 -291
  30. data/utils/enveomics/Manifest/Tasks/graphics.json +0 -126
  31. data/utils/enveomics/Manifest/Tasks/mapping.json +0 -137
  32. data/utils/enveomics/Manifest/Tasks/ogs.json +0 -382
  33. data/utils/enveomics/Manifest/Tasks/other.json +0 -906
  34. data/utils/enveomics/Manifest/Tasks/remote.json +0 -355
  35. data/utils/enveomics/Manifest/Tasks/sequence-identity.json +0 -650
  36. data/utils/enveomics/Manifest/Tasks/tables.json +0 -308
  37. data/utils/enveomics/Manifest/Tasks/trees.json +0 -68
  38. data/utils/enveomics/Manifest/Tasks/variants.json +0 -111
  39. data/utils/enveomics/Manifest/categories.json +0 -165
  40. data/utils/enveomics/Manifest/examples.json +0 -162
  41. data/utils/enveomics/Manifest/tasks.json +0 -4
  42. data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +0 -69
  43. data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +0 -1
  44. data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +0 -1
  45. data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +0 -1
  46. data/utils/enveomics/Pipelines/assembly.pbs/README.md +0 -189
  47. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +0 -112
  48. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +0 -23
  49. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +0 -44
  50. data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +0 -50
  51. data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +0 -37
  52. data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +0 -68
  53. data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +0 -49
  54. data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +0 -80
  55. data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +0 -57
  56. data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +0 -63
  57. data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +0 -38
  58. data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +0 -73
  59. data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +0 -21
  60. data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +0 -72
  61. data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +0 -98
  62. data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +0 -1
  63. data/utils/enveomics/Pipelines/blast.pbs/README.md +0 -127
  64. data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +0 -109
  65. data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +0 -128
  66. data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +0 -16
  67. data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +0 -22
  68. data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +0 -26
  69. data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +0 -89
  70. data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +0 -29
  71. data/utils/enveomics/Pipelines/idba.pbs/README.md +0 -49
  72. data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +0 -95
  73. data/utils/enveomics/Pipelines/idba.pbs/run.pbs +0 -56
  74. data/utils/enveomics/Pipelines/trim.pbs/README.md +0 -54
  75. data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +0 -70
  76. data/utils/enveomics/Pipelines/trim.pbs/run.pbs +0 -130
  77. data/utils/enveomics/README.md +0 -42
  78. data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +0 -171
  79. data/utils/enveomics/Scripts/Aln.cat.rb +0 -221
  80. data/utils/enveomics/Scripts/Aln.convert.pl +0 -35
  81. data/utils/enveomics/Scripts/AlphaDiversity.pl +0 -152
  82. data/utils/enveomics/Scripts/BedGraph.tad.rb +0 -93
  83. data/utils/enveomics/Scripts/BedGraph.window.rb +0 -71
  84. data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +0 -102
  85. data/utils/enveomics/Scripts/BlastTab.addlen.rb +0 -63
  86. data/utils/enveomics/Scripts/BlastTab.advance.bash +0 -48
  87. data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +0 -55
  88. data/utils/enveomics/Scripts/BlastTab.catsbj.pl +0 -104
  89. data/utils/enveomics/Scripts/BlastTab.cogCat.rb +0 -76
  90. data/utils/enveomics/Scripts/BlastTab.filter.pl +0 -47
  91. data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +0 -194
  92. data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +0 -104
  93. data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +0 -157
  94. data/utils/enveomics/Scripts/BlastTab.recplot2.R +0 -48
  95. data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +0 -86
  96. data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +0 -119
  97. data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +0 -86
  98. data/utils/enveomics/Scripts/BlastTab.subsample.pl +0 -47
  99. data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +0 -114
  100. data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +0 -90
  101. data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +0 -123
  102. data/utils/enveomics/Scripts/Chao1.pl +0 -97
  103. data/utils/enveomics/Scripts/CharTable.classify.rb +0 -234
  104. data/utils/enveomics/Scripts/EBIseq2tax.rb +0 -83
  105. data/utils/enveomics/Scripts/FastA.N50.pl +0 -60
  106. data/utils/enveomics/Scripts/FastA.extract.rb +0 -152
  107. data/utils/enveomics/Scripts/FastA.filter.pl +0 -52
  108. data/utils/enveomics/Scripts/FastA.filterLen.pl +0 -28
  109. data/utils/enveomics/Scripts/FastA.filterN.pl +0 -60
  110. data/utils/enveomics/Scripts/FastA.fragment.rb +0 -100
  111. data/utils/enveomics/Scripts/FastA.gc.pl +0 -42
  112. data/utils/enveomics/Scripts/FastA.interpose.pl +0 -93
  113. data/utils/enveomics/Scripts/FastA.length.pl +0 -38
  114. data/utils/enveomics/Scripts/FastA.mask.rb +0 -89
  115. data/utils/enveomics/Scripts/FastA.per_file.pl +0 -36
  116. data/utils/enveomics/Scripts/FastA.qlen.pl +0 -57
  117. data/utils/enveomics/Scripts/FastA.rename.pl +0 -65
  118. data/utils/enveomics/Scripts/FastA.revcom.pl +0 -23
  119. data/utils/enveomics/Scripts/FastA.sample.rb +0 -98
  120. data/utils/enveomics/Scripts/FastA.slider.pl +0 -85
  121. data/utils/enveomics/Scripts/FastA.split.pl +0 -55
  122. data/utils/enveomics/Scripts/FastA.split.rb +0 -79
  123. data/utils/enveomics/Scripts/FastA.subsample.pl +0 -131
  124. data/utils/enveomics/Scripts/FastA.tag.rb +0 -65
  125. data/utils/enveomics/Scripts/FastA.toFastQ.rb +0 -69
  126. data/utils/enveomics/Scripts/FastA.wrap.rb +0 -48
  127. data/utils/enveomics/Scripts/FastQ.filter.pl +0 -54
  128. data/utils/enveomics/Scripts/FastQ.interpose.pl +0 -90
  129. data/utils/enveomics/Scripts/FastQ.maskQual.rb +0 -89
  130. data/utils/enveomics/Scripts/FastQ.offset.pl +0 -90
  131. data/utils/enveomics/Scripts/FastQ.split.pl +0 -53
  132. data/utils/enveomics/Scripts/FastQ.tag.rb +0 -70
  133. data/utils/enveomics/Scripts/FastQ.test-error.rb +0 -81
  134. data/utils/enveomics/Scripts/FastQ.toFastA.awk +0 -24
  135. data/utils/enveomics/Scripts/GFF.catsbj.pl +0 -127
  136. data/utils/enveomics/Scripts/GenBank.add_fields.rb +0 -84
  137. data/utils/enveomics/Scripts/HMM.essential.rb +0 -351
  138. data/utils/enveomics/Scripts/HMM.haai.rb +0 -168
  139. data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +0 -83
  140. data/utils/enveomics/Scripts/JPlace.distances.rb +0 -88
  141. data/utils/enveomics/Scripts/JPlace.to_iToL.rb +0 -320
  142. data/utils/enveomics/Scripts/M5nr.getSequences.rb +0 -81
  143. data/utils/enveomics/Scripts/MeTaxa.distribution.pl +0 -198
  144. data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +0 -35
  145. data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +0 -49
  146. data/utils/enveomics/Scripts/NCBIacc2tax.rb +0 -92
  147. data/utils/enveomics/Scripts/Newick.autoprune.R +0 -27
  148. data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +0 -228
  149. data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +0 -32
  150. data/utils/enveomics/Scripts/RefSeq.download.bash +0 -48
  151. data/utils/enveomics/Scripts/SRA.download.bash +0 -55
  152. data/utils/enveomics/Scripts/TRIBS.plot-test.R +0 -36
  153. data/utils/enveomics/Scripts/TRIBS.test.R +0 -39
  154. data/utils/enveomics/Scripts/Table.barplot.R +0 -31
  155. data/utils/enveomics/Scripts/Table.df2dist.R +0 -30
  156. data/utils/enveomics/Scripts/Table.filter.pl +0 -61
  157. data/utils/enveomics/Scripts/Table.merge.pl +0 -77
  158. data/utils/enveomics/Scripts/Table.prefScore.R +0 -60
  159. data/utils/enveomics/Scripts/Table.replace.rb +0 -69
  160. data/utils/enveomics/Scripts/Table.round.rb +0 -63
  161. data/utils/enveomics/Scripts/Table.split.pl +0 -57
  162. data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +0 -227
  163. data/utils/enveomics/Scripts/VCF.KaKs.rb +0 -147
  164. data/utils/enveomics/Scripts/VCF.SNPs.rb +0 -88
  165. data/utils/enveomics/Scripts/aai.rb +0 -421
  166. data/utils/enveomics/Scripts/ani.rb +0 -362
  167. data/utils/enveomics/Scripts/anir.rb +0 -137
  168. data/utils/enveomics/Scripts/clust.rand.rb +0 -102
  169. data/utils/enveomics/Scripts/gi2tax.rb +0 -103
  170. data/utils/enveomics/Scripts/in_silico_GA_GI.pl +0 -96
  171. data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
  172. data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
  173. data/utils/enveomics/Scripts/lib/enveomics.R +0 -1
  174. data/utils/enveomics/Scripts/lib/enveomics_rb/anir.rb +0 -293
  175. data/utils/enveomics/Scripts/lib/enveomics_rb/bm_set.rb +0 -175
  176. data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +0 -24
  177. data/utils/enveomics/Scripts/lib/enveomics_rb/errors.rb +0 -17
  178. data/utils/enveomics/Scripts/lib/enveomics_rb/gmm_em.rb +0 -30
  179. data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +0 -253
  180. data/utils/enveomics/Scripts/lib/enveomics_rb/match.rb +0 -88
  181. data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +0 -182
  182. data/utils/enveomics/Scripts/lib/enveomics_rb/rbm.rb +0 -49
  183. data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +0 -74
  184. data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +0 -237
  185. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/rand.rb +0 -31
  186. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/sample.rb +0 -152
  187. data/utils/enveomics/Scripts/lib/enveomics_rb/stats.rb +0 -3
  188. data/utils/enveomics/Scripts/lib/enveomics_rb/utils.rb +0 -74
  189. data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +0 -135
  190. data/utils/enveomics/Scripts/ogs.annotate.rb +0 -88
  191. data/utils/enveomics/Scripts/ogs.core-pan.rb +0 -160
  192. data/utils/enveomics/Scripts/ogs.extract.rb +0 -125
  193. data/utils/enveomics/Scripts/ogs.mcl.rb +0 -186
  194. data/utils/enveomics/Scripts/ogs.rb +0 -104
  195. data/utils/enveomics/Scripts/ogs.stats.rb +0 -131
  196. data/utils/enveomics/Scripts/rbm-legacy.rb +0 -172
  197. data/utils/enveomics/Scripts/rbm.rb +0 -108
  198. data/utils/enveomics/Scripts/sam.filter.rb +0 -148
  199. data/utils/enveomics/Tests/Makefile +0 -10
  200. data/utils/enveomics/Tests/Mgen_M2288.faa +0 -3189
  201. data/utils/enveomics/Tests/Mgen_M2288.fna +0 -8282
  202. data/utils/enveomics/Tests/Mgen_M2321.fna +0 -8288
  203. data/utils/enveomics/Tests/Nequ_Kin4M.faa +0 -2970
  204. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
  205. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +0 -7
  206. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +0 -17
  207. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +0 -137
  208. data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +0 -123
  209. data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +0 -200
  210. data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +0 -55
  211. data/utils/enveomics/Tests/alkB.nwk +0 -1
  212. data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +0 -13
  213. data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +0 -17
  214. data/utils/enveomics/Tests/hiv1.faa +0 -59
  215. data/utils/enveomics/Tests/hiv1.fna +0 -134
  216. data/utils/enveomics/Tests/hiv2.faa +0 -70
  217. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +0 -233
  218. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +0 -1
  219. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +0 -233
  220. data/utils/enveomics/Tests/phyla_counts.tsv +0 -10
  221. data/utils/enveomics/Tests/primate_lentivirus.ogs +0 -11
  222. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +0 -9
  223. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +0 -8
  224. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +0 -6
  225. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +0 -9
  226. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +0 -6
  227. data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +0 -6
  228. data/utils/enveomics/build_enveomics_r.bash +0 -45
  229. data/utils/enveomics/enveomics.R/DESCRIPTION +0 -31
  230. data/utils/enveomics/enveomics.R/NAMESPACE +0 -39
  231. data/utils/enveomics/enveomics.R/R/autoprune.R +0 -155
  232. data/utils/enveomics/enveomics.R/R/barplot.R +0 -184
  233. data/utils/enveomics/enveomics.R/R/cliopts.R +0 -135
  234. data/utils/enveomics/enveomics.R/R/df2dist.R +0 -154
  235. data/utils/enveomics/enveomics.R/R/growthcurve.R +0 -331
  236. data/utils/enveomics/enveomics.R/R/prefscore.R +0 -79
  237. data/utils/enveomics/enveomics.R/R/recplot.R +0 -354
  238. data/utils/enveomics/enveomics.R/R/recplot2.R +0 -1631
  239. data/utils/enveomics/enveomics.R/R/tribs.R +0 -583
  240. data/utils/enveomics/enveomics.R/R/utils.R +0 -80
  241. data/utils/enveomics/enveomics.R/README.md +0 -81
  242. data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
  243. data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
  244. data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +0 -16
  245. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +0 -16
  246. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +0 -16
  247. data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +0 -25
  248. data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +0 -46
  249. data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +0 -23
  250. data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +0 -47
  251. data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +0 -23
  252. data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +0 -23
  253. data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +0 -40
  254. data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +0 -103
  255. data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +0 -67
  256. data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +0 -24
  257. data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +0 -19
  258. data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +0 -45
  259. data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +0 -44
  260. data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +0 -47
  261. data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +0 -75
  262. data/utils/enveomics/enveomics.R/man/enve.prefscore.Rd +0 -50
  263. data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +0 -44
  264. data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +0 -139
  265. data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +0 -45
  266. data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +0 -24
  267. data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +0 -77
  268. data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +0 -25
  269. data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +0 -21
  270. data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +0 -19
  271. data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +0 -19
  272. data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +0 -47
  273. data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +0 -29
  274. data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +0 -18
  275. data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +0 -45
  276. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +0 -36
  277. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +0 -19
  278. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +0 -19
  279. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +0 -27
  280. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +0 -52
  281. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +0 -17
  282. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +0 -51
  283. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +0 -43
  284. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +0 -82
  285. data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +0 -59
  286. data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +0 -27
  287. data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +0 -36
  288. data/utils/enveomics/enveomics.R/man/enve.selvector.Rd +0 -23
  289. data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +0 -68
  290. data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +0 -28
  291. data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +0 -27
  292. data/utils/enveomics/enveomics.R/man/growth.curves.Rd +0 -14
  293. data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +0 -13
  294. data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +0 -78
  295. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +0 -46
  296. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +0 -45
  297. data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +0 -125
  298. data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +0 -19
  299. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +0 -19
  300. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +0 -19
  301. data/utils/enveomics/globals.mk +0 -8
  302. data/utils/enveomics/manifest.json +0 -9
  303. data/utils/multitrim/Multitrim How-To.pdf +0 -0
  304. data/utils/multitrim/README.md +0 -67
  305. data/utils/multitrim/multitrim.py +0 -1555
  306. data/utils/multitrim/multitrim.yml +0 -13
@@ -1,291 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "FastQ.filter.pl",
5
- "description": "Extracts a subset of sequences from a FastQ file.",
6
- "see_also": ["FastA.filter.pl"],
7
- "help_arg": "-h",
8
- "options": [
9
- {
10
- "name": "Reverse list",
11
- "opt": "-r",
12
- "description": "Extracts sequences NOT present in the list."
13
- },
14
- {
15
- "name": "Quiet",
16
- "opt": "-q",
17
- "description": "Runs quietly."
18
- },
19
- {
20
- "name": "List",
21
- "arg": "in_file",
22
- "mandatory": true,
23
- "description": "List of sequences to extract."
24
- },
25
- {
26
- "name": "Seqs.fq",
27
- "arg": "in_file",
28
- "mandatory": true,
29
- "description": "FastQ file containing the superset of sequences."
30
- },
31
- ">",
32
- {
33
- "name": "Subset.fq",
34
- "arg": "out_file",
35
- "mandatory": true,
36
- "description": "FastQ file to be created."
37
- }
38
- ]
39
- },
40
- {
41
- "task": "FastQ.interpose.pl",
42
- "description": ["Interposes sequences in FastQ format from two files",
43
- "into one output file. If more than two files are provided, the script",
44
- "will interpose all the input files."],
45
- "warn": ["Note that this script will check for the consistency of the",
46
- "names (assuming a pair of related reads contains the same name",
47
- "varying only in a trailing slash (/) followed by a digit. If you want",
48
- "to turn this feature off just set the checking period to zero. If you",
49
- "want to decrease the sampling period (to speed the script up) or",
50
- "increase it (to make it more sensitive to errors) just change the",
51
- "checking period accordingly."],
52
- "see_also": ["FastQ.split.pl","FastA.interpose.pl"],
53
- "help_arg": "",
54
- "options": [
55
- {
56
- "name": "Checking period",
57
- "opt": "-T",
58
- "arg": "integer",
59
- "default": 1000,
60
- "description": "Sampling period for names evaluation."
61
- },
62
- {
63
- "arg": "out_file",
64
- "mandatory": true,
65
- "description": "Output FastQ file."
66
- },
67
- {
68
- "arg": "in_file",
69
- "mandatory": true,
70
- "description": "First input FastQ file."
71
- },
72
- {
73
- "arg": "in_file",
74
- "mandatory": true,
75
- "description": "Second input FastQ file."
76
- },
77
- {
78
- "arg": "in_file",
79
- "multiple_sep": " ",
80
- "description": "Any additional input FastQ files."
81
- }
82
- ]
83
- },
84
- {
85
- "task": "FastQ.maskQual.rb",
86
- "description": "Masks low-quality bases in a FastQ file.",
87
- "help_arg": "--help",
88
- "options": [
89
- {
90
- "opt": "--input",
91
- "arg": "in_file",
92
- "mandatory": true,
93
- "description": ["Path to the FastQ file containing the sequences.",
94
- "Supports compression with .gz extension."]
95
- },
96
- {
97
- "opt": "--output",
98
- "arg": "out_file",
99
- "mandatory": true,
100
- "description": ["Path to the output FastQ file.",
101
- "Supports compression with .gz extension."]
102
- },
103
- {
104
- "opt": "--qual",
105
- "arg": "integer",
106
- "default": 15,
107
- "description": "Minimum quality score to allow a base."
108
- },
109
- {
110
- "opt": "--offset",
111
- "arg": "integer",
112
- "default": 33,
113
- "description": "Q-score offset."
114
- },
115
- {
116
- "opt": "--fasta",
117
- "description": "Output sequences in FastA format."
118
- },
119
- {
120
- "opt": "--quiet",
121
- "description": "Run quietly."
122
- }
123
- ]
124
- },
125
- {
126
- "task": "FastQ.offset.pl",
127
- "description": ["There are several FastQ formats. This script takes a",
128
- "FastQ in any of them, identifies the type of FastQ (this is, the",
129
- "offset), and generates a FastQ with the given offset."],
130
- "warn": ["Note that Solexa+64 FastQ can cause problematic values when",
131
- "using the offset 33, since there is no equivalent in Phred+33 for",
132
- "negative values (the range of Solexa+64 is -5 to 40)."],
133
- "help_arg": "",
134
- "options": [
135
- {
136
- "arg": "in_file",
137
- "mandatory": true,
138
- "description": ["Input file in FastQ format (range is automatically",
139
- "detected)."]
140
- },
141
- {
142
- "name": "Offset",
143
- "arg": "integer",
144
- "default": 33,
145
- "mandatory": true,
146
- "description": ["Offset to use for the output. Use 0 (zero) to",
147
- "detect the input format and exit."]
148
- },
149
- {
150
- "opt": "force",
151
- "description": ["If set, turns errors into warnings and continues.",
152
- "Out-of-range values are set to the closest range limit."]
153
- },
154
- ">",
155
- {
156
- "arg": "out_file",
157
- "mandatory": true,
158
- "description": ["Output file in FastQ format with the specified",
159
- "offset."]
160
- }
161
- ]
162
- },
163
- {
164
- "task": "FastQ.split.pl",
165
- "description": ["Splits a FastQ file into several FastQ files. This",
166
- "script can be used to separate interposed sister reads using any even",
167
- "number of output files."],
168
- "help_arg": "",
169
- "see_also": ["FastQ.interpose.pl","FastA.split.pl"],
170
- "options": [
171
- {
172
- "name": "in_file.fq",
173
- "arg": "in_file",
174
- "mandatory": true,
175
- "description": "Input file in FastQ format."
176
- },
177
- {
178
- "name": "out_base",
179
- "arg": "out_file",
180
- "mandatory": true,
181
- "description": ["Prefix for the name of the output files. It will be",
182
- "appended with .<i>.fastq, where <i> is a consecutive number",
183
- "starting in 1."]
184
- },
185
- {
186
- "name": "no_files",
187
- "arg": "integer",
188
- "default": 2,
189
- "description": "Number of files to generate."
190
- }
191
- ]
192
- },
193
- {
194
- "task": "FastQ.tag.rb",
195
- "description": "Generates easy-to-parse tagged reads from FastQ files.",
196
- "see_also": ["FastA.tag.rb"],
197
- "help_arg": "--help",
198
- "options": [
199
- {
200
- "name": "Input file",
201
- "opt": "--in",
202
- "arg": "in_file",
203
- "mandatory": true,
204
- "description": [
205
- "FastQ file containing the sequences.",
206
- "Supports compression with .gz extension."
207
- ]
208
- },
209
- {
210
- "name": "Output file",
211
- "opt": "--out",
212
- "arg": "out_file",
213
- "mandatory": true,
214
- "description": [
215
- "FastQ to create.",
216
- "Supports compression with .gz extension."
217
- ]
218
- },
219
- {
220
- "opt": "--prefix",
221
- "arg": "string",
222
- "description": "Prefix to use in all IDs."
223
- },
224
- {
225
- "opt": "--suffix",
226
- "arg": "string",
227
- "description": "Suffix to use in all IDs."
228
- },
229
- {
230
- "opt": "--quiet",
231
- "description": "Run quietly (no STDERR output)."
232
- }
233
- ]
234
- },
235
- {
236
- "task": "FastQ.toFastA.awk",
237
- "description": "Translates FastQ files into FastA.",
238
- "see_also": "FastA.toFastQ.rb",
239
- "help_arg": "'' --help",
240
- "options": [
241
- "<",
242
- {
243
- "arg": "in_file",
244
- "mandatory": true,
245
- "description": "Input FastQ file."
246
- },
247
- ">",
248
- {
249
- "arg": "out_file",
250
- "mandatory": true,
251
- "description": "Output FastA file."
252
- }
253
- ]
254
- },
255
- {
256
- "task": "FastQ.test-error.rb",
257
- "description": ["Compares the estimated error of sequencing reads",
258
- "(Q-score) with observed mismatches (identity against a know",
259
- "reference sequence)."],
260
- "help_arg": "--help",
261
- "options": [
262
- {
263
- "name": "FastQ",
264
- "opt": "--fastq",
265
- "arg": "in_file",
266
- "mandatory": true,
267
- "description": "FastQ file containing the sequences."
268
- },
269
- {
270
- "name": "Tabular BLAST",
271
- "opt": "--blast",
272
- "arg": "in_file",
273
- "mandatory": true,
274
- "description": ["Tabular BLAST file mapping reads to reference",
275
- "sequences."]
276
- },
277
- {
278
- "name": "Output",
279
- "opt": "--out",
280
- "arg": "out_file",
281
- "mandatory": true,
282
- "description": "Output tab-delimited file to create."
283
- },
284
- {
285
- "opt": "--quiet",
286
- "description": "Run quietly (no STDERR output)."
287
- }
288
- ]
289
- }
290
- ]
291
- }
@@ -1,126 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "Table.barplot.R",
5
- "description": "Creates nice barplots from tab-delimited tables.",
6
- "requires": [ { "r_package": "optparse" } ],
7
- "help_arg": "--help",
8
- "options": [
9
- {
10
- "name": "Input file",
11
- "opt": "--x",
12
- "arg": "in_file",
13
- "mandatory": true,
14
- "description": ["A tab-delimited file containing header (first row)",
15
- "and row names (first column)."]
16
- },
17
- {
18
- "opt": "--sizes",
19
- "arg": "string",
20
- "description": ["A numeric vector containing the real size of the",
21
- "samples (columns) in the same order of the input table. If set,",
22
- "the values are assumed to be 100%, otherwise the sum of the",
23
- "columns is used. Separate values by commas."]
24
- },
25
- {
26
- "opt": "--top",
27
- "arg": "integer",
28
- "default": 25,
29
- "description": ["Maximum number of categories to display. Any",
30
- "additional categories will be listed as 'Others'."]
31
- },
32
- {
33
- "opt": "--colors-per-group",
34
- "arg": "integer",
35
- "default": 9,
36
- "description": ["Number of categories in the first two saturation",
37
- "groups of colors. The third group contains the remaining",
38
- "categories if needed."]
39
- },
40
- {
41
- "opt": "--bars-width",
42
- "arg": "integer",
43
- "default": 4,
44
- "description": "Width of the barplot with respect to the legend."
45
- },
46
- {
47
- "opt": "--legend-ncol",
48
- "arg": "integer",
49
- "default": 1,
50
- "description": "Number of columns in the legend."
51
- },
52
- {
53
- "opt": "--other-col",
54
- "arg": "string",
55
- "default": "#000000",
56
- "description": "Color of the 'Others' category."
57
- },
58
- {
59
- "opt": "--add-trend",
60
- "description": ["Controls if semi-transparent areas are to be",
61
- "plotted between the bars to connect the regions (trend regions)."]
62
- },
63
- {
64
- "opt": "--organic-trend",
65
- "description": ["Controls if the trend regions are to be smoothed",
66
- "(curves). By default, trend regions have straight edges. If TRUE,",
67
- "forces add.trend=TRUE."]
68
- },
69
- {
70
- "opt": "--sort-by",
71
- "arg": "string",
72
- "default": "median",
73
- "description": ["Any function that takes a numeric vector and",
74
- "returns a numeric scalar. This function is applied to each row,",
75
- "and the resulting values are used to sort the rows",
76
- "(decreasingly). Good options include: sd, min, max, mean, median."]
77
- },
78
- {
79
- "opt": "--min-report",
80
- "arg": "integer",
81
- "default": 101,
82
- "description": ["Minimum percentage to report the value in the plot.",
83
- "Any value above 100 indicates that no values are to be reported."]
84
- },
85
- {
86
- "opt": "--order",
87
- "arg": "string",
88
- "description": ["Controls how the rows should be ordered. If empty",
89
- "(default), sort.by is applied per row and the results are sorted",
90
- "decreasingly. If NA, no sorting is performed, i.e., the original",
91
- "order is respected. If a vector is provided, it is assumed to be",
92
- "the custom order to be used (either by numeric index or by row",
93
- "names). Separate values by commas."]
94
- },
95
- {
96
- "opt": "--col",
97
- "arg": "string",
98
- "description": ["Colors to use. If provided, overrides the variables",
99
- "`top` and `colors.per.group`, but `other.col` is still used if",
100
- "the vector is insufficient for all the rows. Separate values by",
101
- "commas. An additional palette is available when using value",
102
- "'coto' (palette contributed by Luis (Coto) Orellana)."]
103
- },
104
- {
105
- "arg": "out_file",
106
- "mandatory": true,
107
- "description": "Output file in PDF format."
108
- },
109
- {
110
- "name": "width",
111
- "arg": "float",
112
- "mandatory": true,
113
- "default": 7,
114
- "description": "Width of the plot (in inches)."
115
- },
116
- {
117
- "name": "height",
118
- "arg": "float",
119
- "mandatory": true,
120
- "default": 7,
121
- "description": "Height of the plot (in inches)."
122
- }
123
- ]
124
- }
125
- ]
126
- }
@@ -1,137 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "BedGraph.tad.rb",
5
- "description": ["Estimates the truncated average sequencing depth (TAD)",
6
- "from a BedGraph file."],
7
- "warn": ["This script doesn't consider zero-coverage positions if",
8
- "missing from the file. If you produce your BedGraph file with",
9
- "bedtools genomecov and want to consider zero-coverage position, be",
10
- "sure to use -bga (not -bg)."],
11
- "see_also": ["BedGraph.window.rb",
12
- "BlastTab.seqdepth.pl", "BlastTab.seqdepth_ZIP.pl"],
13
- "help_arg": "--help",
14
- "options": [
15
- {
16
- "opt": "--input",
17
- "arg": "in_file",
18
- "mandatory": true,
19
- "description": "Input BedGraph file."
20
- },
21
- {
22
- "opt": "--range",
23
- "arg": "float",
24
- "default": 0.5,
25
- "description": ["Central range to consider, between 0 and 1. By",
26
- "default: inter-quartile range (0.5)."]
27
- },
28
- {
29
- "opt": "--per-seq",
30
- "description": ["Calculate averages per reference sequence, not",
31
- "total. Assumes a sorted BedGraph file."]
32
- },
33
- {
34
- "opt": "--length",
35
- "description": "Add sequence length to the output."
36
- }
37
- ]
38
- },
39
- {
40
- "task": "BedGraph.window.rb",
41
- "description": ["Estimates the sequencing depth per windows from a",
42
- "BedGraph file."],
43
- "warn": ["This script doesn't consider zero-coverage positions if",
44
- "missing from the file. If you produce your BedGraph file with",
45
- "bedtools genomecov and want to consider zero-coverage position, be",
46
- "sure to use -bga (not -bg)."],
47
- "see_also": ["BedGraph.tad.rb",
48
- "BlastTab.seqdepth.pl", "BlastTab.seqdepth_ZIP.pl"],
49
- "help_arg": "--help",
50
- "options": [
51
- {
52
- "opt": "--input",
53
- "arg": "in_file",
54
- "mandatory": true,
55
- "description": "Input BedGraph file."
56
- },
57
- {
58
- "name": "Window size",
59
- "opt": "--win",
60
- "arg": "float",
61
- "default": 1000,
62
- "description": "Window size, in base pairs."
63
- }
64
- ]
65
- },
66
- {
67
- "task": "sam.filter.rb",
68
- "description": ["Filters a SAM or BAM file by target sequences and/or",
69
- "identity."],
70
- "see_also": ["anir.rb"],
71
- "help_arg": "--help",
72
- "options": [
73
- {
74
- "opt": "--genome",
75
- "arg": "in_file",
76
- "mandatory": true,
77
- "description": ["Genome assembly.",
78
- "Supports compression with .gz extension."]
79
- },
80
- {
81
- "opt": "--mapping",
82
- "arg": "in_file",
83
- "mandatory": true,
84
- "description": ["Mapping file.",
85
- "Supports compression with .gz extension."]
86
- },
87
- {
88
- "opt": "--out-sam",
89
- "arg": "out_file",
90
- "mandatory": true,
91
- "description": ["Output filtered file in SAM format.",
92
- "Supports compression with .gz extension."]
93
- },
94
- {
95
- "opt": "--g-format",
96
- "arg": "select",
97
- "values": ["fasta", "list"],
98
- "default": "fasta",
99
- "description": ["Genome assembly format."]
100
- },
101
- {
102
- "opt": "--m-format",
103
- "arg": "select",
104
- "values": ["sam", "bam"],
105
- "default": "sam",
106
- "description": ["Mapping file format. SAM supports compression with",
107
- ".gz file extension."]
108
- },
109
- {
110
- "opt": "--identity",
111
- "arg": "float",
112
- "description": "Set a fixed threshold of percent identity.",
113
- "default": 95.0
114
- },
115
- {
116
- "opt": "--no-header",
117
- "description": "Do not include the headers."
118
- },
119
- {
120
- "opt": "--threads",
121
- "arg": "integer",
122
- "description": "Threads to use.",
123
- "default": 2
124
- },
125
- {
126
- "opt": "--log",
127
- "arg": "out_file",
128
- "description": "Log file to save output."
129
- },
130
- {
131
- "opt": "--quiet",
132
- "description": "Run quietly."
133
- }
134
- ]
135
- }
136
- ]
137
- }