miga-base 1.2.15.2 → 1.2.15.4

Sign up to get free protection for your applications and to get access to all the features.
Files changed (306) hide show
  1. checksums.yaml +4 -4
  2. data/lib/miga/cli/action/download/gtdb.rb +4 -1
  3. data/lib/miga/cli/action/gtdb_get.rb +4 -0
  4. data/lib/miga/daemon.rb +4 -1
  5. data/lib/miga/lair.rb +6 -4
  6. data/lib/miga/remote_dataset/download.rb +3 -2
  7. data/lib/miga/remote_dataset.rb +25 -7
  8. data/lib/miga/taxonomy.rb +6 -0
  9. data/lib/miga/version.rb +2 -2
  10. metadata +6 -302
  11. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Archaea_SCG.hmm +0 -41964
  12. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Bacteria_SCG.hmm +0 -32439
  13. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Complete_SCG_DB.hmm +0 -62056
  14. data/utils/FastAAI/FastAAI +0 -3659
  15. data/utils/FastAAI/FastAAI-legacy/FastAAI +0 -1336
  16. data/utils/FastAAI/FastAAI-legacy/kAAI_v1.0_virus.py +0 -1296
  17. data/utils/FastAAI/README.md +0 -84
  18. data/utils/enveomics/Docs/recplot2.md +0 -244
  19. data/utils/enveomics/Examples/aai-matrix.bash +0 -66
  20. data/utils/enveomics/Examples/ani-matrix.bash +0 -66
  21. data/utils/enveomics/Examples/essential-phylogeny.bash +0 -105
  22. data/utils/enveomics/Examples/unus-genome-phylogeny.bash +0 -100
  23. data/utils/enveomics/LICENSE.txt +0 -73
  24. data/utils/enveomics/Makefile +0 -52
  25. data/utils/enveomics/Manifest/Tasks/aasubs.json +0 -103
  26. data/utils/enveomics/Manifest/Tasks/blasttab.json +0 -790
  27. data/utils/enveomics/Manifest/Tasks/distances.json +0 -161
  28. data/utils/enveomics/Manifest/Tasks/fasta.json +0 -802
  29. data/utils/enveomics/Manifest/Tasks/fastq.json +0 -291
  30. data/utils/enveomics/Manifest/Tasks/graphics.json +0 -126
  31. data/utils/enveomics/Manifest/Tasks/mapping.json +0 -137
  32. data/utils/enveomics/Manifest/Tasks/ogs.json +0 -382
  33. data/utils/enveomics/Manifest/Tasks/other.json +0 -906
  34. data/utils/enveomics/Manifest/Tasks/remote.json +0 -355
  35. data/utils/enveomics/Manifest/Tasks/sequence-identity.json +0 -650
  36. data/utils/enveomics/Manifest/Tasks/tables.json +0 -308
  37. data/utils/enveomics/Manifest/Tasks/trees.json +0 -68
  38. data/utils/enveomics/Manifest/Tasks/variants.json +0 -111
  39. data/utils/enveomics/Manifest/categories.json +0 -165
  40. data/utils/enveomics/Manifest/examples.json +0 -162
  41. data/utils/enveomics/Manifest/tasks.json +0 -4
  42. data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +0 -69
  43. data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +0 -1
  44. data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +0 -1
  45. data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +0 -1
  46. data/utils/enveomics/Pipelines/assembly.pbs/README.md +0 -189
  47. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +0 -112
  48. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +0 -23
  49. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +0 -44
  50. data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +0 -50
  51. data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +0 -37
  52. data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +0 -68
  53. data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +0 -49
  54. data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +0 -80
  55. data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +0 -57
  56. data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +0 -63
  57. data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +0 -38
  58. data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +0 -73
  59. data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +0 -21
  60. data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +0 -72
  61. data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +0 -98
  62. data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +0 -1
  63. data/utils/enveomics/Pipelines/blast.pbs/README.md +0 -127
  64. data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +0 -109
  65. data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +0 -128
  66. data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +0 -16
  67. data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +0 -22
  68. data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +0 -26
  69. data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +0 -89
  70. data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +0 -29
  71. data/utils/enveomics/Pipelines/idba.pbs/README.md +0 -49
  72. data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +0 -95
  73. data/utils/enveomics/Pipelines/idba.pbs/run.pbs +0 -56
  74. data/utils/enveomics/Pipelines/trim.pbs/README.md +0 -54
  75. data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +0 -70
  76. data/utils/enveomics/Pipelines/trim.pbs/run.pbs +0 -130
  77. data/utils/enveomics/README.md +0 -42
  78. data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +0 -171
  79. data/utils/enveomics/Scripts/Aln.cat.rb +0 -221
  80. data/utils/enveomics/Scripts/Aln.convert.pl +0 -35
  81. data/utils/enveomics/Scripts/AlphaDiversity.pl +0 -152
  82. data/utils/enveomics/Scripts/BedGraph.tad.rb +0 -93
  83. data/utils/enveomics/Scripts/BedGraph.window.rb +0 -71
  84. data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +0 -102
  85. data/utils/enveomics/Scripts/BlastTab.addlen.rb +0 -63
  86. data/utils/enveomics/Scripts/BlastTab.advance.bash +0 -48
  87. data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +0 -55
  88. data/utils/enveomics/Scripts/BlastTab.catsbj.pl +0 -104
  89. data/utils/enveomics/Scripts/BlastTab.cogCat.rb +0 -76
  90. data/utils/enveomics/Scripts/BlastTab.filter.pl +0 -47
  91. data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +0 -194
  92. data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +0 -104
  93. data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +0 -157
  94. data/utils/enveomics/Scripts/BlastTab.recplot2.R +0 -48
  95. data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +0 -86
  96. data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +0 -119
  97. data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +0 -86
  98. data/utils/enveomics/Scripts/BlastTab.subsample.pl +0 -47
  99. data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +0 -114
  100. data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +0 -90
  101. data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +0 -123
  102. data/utils/enveomics/Scripts/Chao1.pl +0 -97
  103. data/utils/enveomics/Scripts/CharTable.classify.rb +0 -234
  104. data/utils/enveomics/Scripts/EBIseq2tax.rb +0 -83
  105. data/utils/enveomics/Scripts/FastA.N50.pl +0 -60
  106. data/utils/enveomics/Scripts/FastA.extract.rb +0 -152
  107. data/utils/enveomics/Scripts/FastA.filter.pl +0 -52
  108. data/utils/enveomics/Scripts/FastA.filterLen.pl +0 -28
  109. data/utils/enveomics/Scripts/FastA.filterN.pl +0 -60
  110. data/utils/enveomics/Scripts/FastA.fragment.rb +0 -100
  111. data/utils/enveomics/Scripts/FastA.gc.pl +0 -42
  112. data/utils/enveomics/Scripts/FastA.interpose.pl +0 -93
  113. data/utils/enveomics/Scripts/FastA.length.pl +0 -38
  114. data/utils/enveomics/Scripts/FastA.mask.rb +0 -89
  115. data/utils/enveomics/Scripts/FastA.per_file.pl +0 -36
  116. data/utils/enveomics/Scripts/FastA.qlen.pl +0 -57
  117. data/utils/enveomics/Scripts/FastA.rename.pl +0 -65
  118. data/utils/enveomics/Scripts/FastA.revcom.pl +0 -23
  119. data/utils/enveomics/Scripts/FastA.sample.rb +0 -98
  120. data/utils/enveomics/Scripts/FastA.slider.pl +0 -85
  121. data/utils/enveomics/Scripts/FastA.split.pl +0 -55
  122. data/utils/enveomics/Scripts/FastA.split.rb +0 -79
  123. data/utils/enveomics/Scripts/FastA.subsample.pl +0 -131
  124. data/utils/enveomics/Scripts/FastA.tag.rb +0 -65
  125. data/utils/enveomics/Scripts/FastA.toFastQ.rb +0 -69
  126. data/utils/enveomics/Scripts/FastA.wrap.rb +0 -48
  127. data/utils/enveomics/Scripts/FastQ.filter.pl +0 -54
  128. data/utils/enveomics/Scripts/FastQ.interpose.pl +0 -90
  129. data/utils/enveomics/Scripts/FastQ.maskQual.rb +0 -89
  130. data/utils/enveomics/Scripts/FastQ.offset.pl +0 -90
  131. data/utils/enveomics/Scripts/FastQ.split.pl +0 -53
  132. data/utils/enveomics/Scripts/FastQ.tag.rb +0 -70
  133. data/utils/enveomics/Scripts/FastQ.test-error.rb +0 -81
  134. data/utils/enveomics/Scripts/FastQ.toFastA.awk +0 -24
  135. data/utils/enveomics/Scripts/GFF.catsbj.pl +0 -127
  136. data/utils/enveomics/Scripts/GenBank.add_fields.rb +0 -84
  137. data/utils/enveomics/Scripts/HMM.essential.rb +0 -351
  138. data/utils/enveomics/Scripts/HMM.haai.rb +0 -168
  139. data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +0 -83
  140. data/utils/enveomics/Scripts/JPlace.distances.rb +0 -88
  141. data/utils/enveomics/Scripts/JPlace.to_iToL.rb +0 -320
  142. data/utils/enveomics/Scripts/M5nr.getSequences.rb +0 -81
  143. data/utils/enveomics/Scripts/MeTaxa.distribution.pl +0 -198
  144. data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +0 -35
  145. data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +0 -49
  146. data/utils/enveomics/Scripts/NCBIacc2tax.rb +0 -92
  147. data/utils/enveomics/Scripts/Newick.autoprune.R +0 -27
  148. data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +0 -228
  149. data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +0 -32
  150. data/utils/enveomics/Scripts/RefSeq.download.bash +0 -48
  151. data/utils/enveomics/Scripts/SRA.download.bash +0 -55
  152. data/utils/enveomics/Scripts/TRIBS.plot-test.R +0 -36
  153. data/utils/enveomics/Scripts/TRIBS.test.R +0 -39
  154. data/utils/enveomics/Scripts/Table.barplot.R +0 -31
  155. data/utils/enveomics/Scripts/Table.df2dist.R +0 -30
  156. data/utils/enveomics/Scripts/Table.filter.pl +0 -61
  157. data/utils/enveomics/Scripts/Table.merge.pl +0 -77
  158. data/utils/enveomics/Scripts/Table.prefScore.R +0 -60
  159. data/utils/enveomics/Scripts/Table.replace.rb +0 -69
  160. data/utils/enveomics/Scripts/Table.round.rb +0 -63
  161. data/utils/enveomics/Scripts/Table.split.pl +0 -57
  162. data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +0 -227
  163. data/utils/enveomics/Scripts/VCF.KaKs.rb +0 -147
  164. data/utils/enveomics/Scripts/VCF.SNPs.rb +0 -88
  165. data/utils/enveomics/Scripts/aai.rb +0 -421
  166. data/utils/enveomics/Scripts/ani.rb +0 -362
  167. data/utils/enveomics/Scripts/anir.rb +0 -137
  168. data/utils/enveomics/Scripts/clust.rand.rb +0 -102
  169. data/utils/enveomics/Scripts/gi2tax.rb +0 -103
  170. data/utils/enveomics/Scripts/in_silico_GA_GI.pl +0 -96
  171. data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
  172. data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
  173. data/utils/enveomics/Scripts/lib/enveomics.R +0 -1
  174. data/utils/enveomics/Scripts/lib/enveomics_rb/anir.rb +0 -293
  175. data/utils/enveomics/Scripts/lib/enveomics_rb/bm_set.rb +0 -175
  176. data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +0 -24
  177. data/utils/enveomics/Scripts/lib/enveomics_rb/errors.rb +0 -17
  178. data/utils/enveomics/Scripts/lib/enveomics_rb/gmm_em.rb +0 -30
  179. data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +0 -253
  180. data/utils/enveomics/Scripts/lib/enveomics_rb/match.rb +0 -88
  181. data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +0 -182
  182. data/utils/enveomics/Scripts/lib/enveomics_rb/rbm.rb +0 -49
  183. data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +0 -74
  184. data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +0 -237
  185. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/rand.rb +0 -31
  186. data/utils/enveomics/Scripts/lib/enveomics_rb/stats/sample.rb +0 -152
  187. data/utils/enveomics/Scripts/lib/enveomics_rb/stats.rb +0 -3
  188. data/utils/enveomics/Scripts/lib/enveomics_rb/utils.rb +0 -74
  189. data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +0 -135
  190. data/utils/enveomics/Scripts/ogs.annotate.rb +0 -88
  191. data/utils/enveomics/Scripts/ogs.core-pan.rb +0 -160
  192. data/utils/enveomics/Scripts/ogs.extract.rb +0 -125
  193. data/utils/enveomics/Scripts/ogs.mcl.rb +0 -186
  194. data/utils/enveomics/Scripts/ogs.rb +0 -104
  195. data/utils/enveomics/Scripts/ogs.stats.rb +0 -131
  196. data/utils/enveomics/Scripts/rbm-legacy.rb +0 -172
  197. data/utils/enveomics/Scripts/rbm.rb +0 -108
  198. data/utils/enveomics/Scripts/sam.filter.rb +0 -148
  199. data/utils/enveomics/Tests/Makefile +0 -10
  200. data/utils/enveomics/Tests/Mgen_M2288.faa +0 -3189
  201. data/utils/enveomics/Tests/Mgen_M2288.fna +0 -8282
  202. data/utils/enveomics/Tests/Mgen_M2321.fna +0 -8288
  203. data/utils/enveomics/Tests/Nequ_Kin4M.faa +0 -2970
  204. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
  205. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +0 -7
  206. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +0 -17
  207. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +0 -137
  208. data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +0 -123
  209. data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +0 -200
  210. data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +0 -55
  211. data/utils/enveomics/Tests/alkB.nwk +0 -1
  212. data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +0 -13
  213. data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +0 -17
  214. data/utils/enveomics/Tests/hiv1.faa +0 -59
  215. data/utils/enveomics/Tests/hiv1.fna +0 -134
  216. data/utils/enveomics/Tests/hiv2.faa +0 -70
  217. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +0 -233
  218. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +0 -1
  219. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +0 -233
  220. data/utils/enveomics/Tests/phyla_counts.tsv +0 -10
  221. data/utils/enveomics/Tests/primate_lentivirus.ogs +0 -11
  222. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +0 -9
  223. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +0 -8
  224. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +0 -6
  225. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +0 -9
  226. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +0 -6
  227. data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +0 -6
  228. data/utils/enveomics/build_enveomics_r.bash +0 -45
  229. data/utils/enveomics/enveomics.R/DESCRIPTION +0 -31
  230. data/utils/enveomics/enveomics.R/NAMESPACE +0 -39
  231. data/utils/enveomics/enveomics.R/R/autoprune.R +0 -155
  232. data/utils/enveomics/enveomics.R/R/barplot.R +0 -184
  233. data/utils/enveomics/enveomics.R/R/cliopts.R +0 -135
  234. data/utils/enveomics/enveomics.R/R/df2dist.R +0 -154
  235. data/utils/enveomics/enveomics.R/R/growthcurve.R +0 -331
  236. data/utils/enveomics/enveomics.R/R/prefscore.R +0 -79
  237. data/utils/enveomics/enveomics.R/R/recplot.R +0 -354
  238. data/utils/enveomics/enveomics.R/R/recplot2.R +0 -1631
  239. data/utils/enveomics/enveomics.R/R/tribs.R +0 -583
  240. data/utils/enveomics/enveomics.R/R/utils.R +0 -80
  241. data/utils/enveomics/enveomics.R/README.md +0 -81
  242. data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
  243. data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
  244. data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +0 -16
  245. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +0 -16
  246. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +0 -16
  247. data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +0 -25
  248. data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +0 -46
  249. data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +0 -23
  250. data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +0 -47
  251. data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +0 -23
  252. data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +0 -23
  253. data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +0 -40
  254. data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +0 -103
  255. data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +0 -67
  256. data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +0 -24
  257. data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +0 -19
  258. data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +0 -45
  259. data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +0 -44
  260. data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +0 -47
  261. data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +0 -75
  262. data/utils/enveomics/enveomics.R/man/enve.prefscore.Rd +0 -50
  263. data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +0 -44
  264. data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +0 -139
  265. data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +0 -45
  266. data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +0 -24
  267. data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +0 -77
  268. data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +0 -25
  269. data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +0 -21
  270. data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +0 -19
  271. data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +0 -19
  272. data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +0 -47
  273. data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +0 -29
  274. data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +0 -18
  275. data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +0 -45
  276. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +0 -36
  277. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +0 -19
  278. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +0 -19
  279. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +0 -27
  280. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +0 -52
  281. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +0 -17
  282. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +0 -51
  283. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +0 -43
  284. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +0 -82
  285. data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +0 -59
  286. data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +0 -27
  287. data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +0 -36
  288. data/utils/enveomics/enveomics.R/man/enve.selvector.Rd +0 -23
  289. data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +0 -68
  290. data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +0 -28
  291. data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +0 -27
  292. data/utils/enveomics/enveomics.R/man/growth.curves.Rd +0 -14
  293. data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +0 -13
  294. data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +0 -78
  295. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +0 -46
  296. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +0 -45
  297. data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +0 -125
  298. data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +0 -19
  299. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +0 -19
  300. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +0 -19
  301. data/utils/enveomics/globals.mk +0 -8
  302. data/utils/enveomics/manifest.json +0 -9
  303. data/utils/multitrim/Multitrim How-To.pdf +0 -0
  304. data/utils/multitrim/README.md +0 -67
  305. data/utils/multitrim/multitrim.py +0 -1555
  306. data/utils/multitrim/multitrim.yml +0 -13
@@ -1,291 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "FastQ.filter.pl",
5
- "description": "Extracts a subset of sequences from a FastQ file.",
6
- "see_also": ["FastA.filter.pl"],
7
- "help_arg": "-h",
8
- "options": [
9
- {
10
- "name": "Reverse list",
11
- "opt": "-r",
12
- "description": "Extracts sequences NOT present in the list."
13
- },
14
- {
15
- "name": "Quiet",
16
- "opt": "-q",
17
- "description": "Runs quietly."
18
- },
19
- {
20
- "name": "List",
21
- "arg": "in_file",
22
- "mandatory": true,
23
- "description": "List of sequences to extract."
24
- },
25
- {
26
- "name": "Seqs.fq",
27
- "arg": "in_file",
28
- "mandatory": true,
29
- "description": "FastQ file containing the superset of sequences."
30
- },
31
- ">",
32
- {
33
- "name": "Subset.fq",
34
- "arg": "out_file",
35
- "mandatory": true,
36
- "description": "FastQ file to be created."
37
- }
38
- ]
39
- },
40
- {
41
- "task": "FastQ.interpose.pl",
42
- "description": ["Interposes sequences in FastQ format from two files",
43
- "into one output file. If more than two files are provided, the script",
44
- "will interpose all the input files."],
45
- "warn": ["Note that this script will check for the consistency of the",
46
- "names (assuming a pair of related reads contains the same name",
47
- "varying only in a trailing slash (/) followed by a digit. If you want",
48
- "to turn this feature off just set the checking period to zero. If you",
49
- "want to decrease the sampling period (to speed the script up) or",
50
- "increase it (to make it more sensitive to errors) just change the",
51
- "checking period accordingly."],
52
- "see_also": ["FastQ.split.pl","FastA.interpose.pl"],
53
- "help_arg": "",
54
- "options": [
55
- {
56
- "name": "Checking period",
57
- "opt": "-T",
58
- "arg": "integer",
59
- "default": 1000,
60
- "description": "Sampling period for names evaluation."
61
- },
62
- {
63
- "arg": "out_file",
64
- "mandatory": true,
65
- "description": "Output FastQ file."
66
- },
67
- {
68
- "arg": "in_file",
69
- "mandatory": true,
70
- "description": "First input FastQ file."
71
- },
72
- {
73
- "arg": "in_file",
74
- "mandatory": true,
75
- "description": "Second input FastQ file."
76
- },
77
- {
78
- "arg": "in_file",
79
- "multiple_sep": " ",
80
- "description": "Any additional input FastQ files."
81
- }
82
- ]
83
- },
84
- {
85
- "task": "FastQ.maskQual.rb",
86
- "description": "Masks low-quality bases in a FastQ file.",
87
- "help_arg": "--help",
88
- "options": [
89
- {
90
- "opt": "--input",
91
- "arg": "in_file",
92
- "mandatory": true,
93
- "description": ["Path to the FastQ file containing the sequences.",
94
- "Supports compression with .gz extension."]
95
- },
96
- {
97
- "opt": "--output",
98
- "arg": "out_file",
99
- "mandatory": true,
100
- "description": ["Path to the output FastQ file.",
101
- "Supports compression with .gz extension."]
102
- },
103
- {
104
- "opt": "--qual",
105
- "arg": "integer",
106
- "default": 15,
107
- "description": "Minimum quality score to allow a base."
108
- },
109
- {
110
- "opt": "--offset",
111
- "arg": "integer",
112
- "default": 33,
113
- "description": "Q-score offset."
114
- },
115
- {
116
- "opt": "--fasta",
117
- "description": "Output sequences in FastA format."
118
- },
119
- {
120
- "opt": "--quiet",
121
- "description": "Run quietly."
122
- }
123
- ]
124
- },
125
- {
126
- "task": "FastQ.offset.pl",
127
- "description": ["There are several FastQ formats. This script takes a",
128
- "FastQ in any of them, identifies the type of FastQ (this is, the",
129
- "offset), and generates a FastQ with the given offset."],
130
- "warn": ["Note that Solexa+64 FastQ can cause problematic values when",
131
- "using the offset 33, since there is no equivalent in Phred+33 for",
132
- "negative values (the range of Solexa+64 is -5 to 40)."],
133
- "help_arg": "",
134
- "options": [
135
- {
136
- "arg": "in_file",
137
- "mandatory": true,
138
- "description": ["Input file in FastQ format (range is automatically",
139
- "detected)."]
140
- },
141
- {
142
- "name": "Offset",
143
- "arg": "integer",
144
- "default": 33,
145
- "mandatory": true,
146
- "description": ["Offset to use for the output. Use 0 (zero) to",
147
- "detect the input format and exit."]
148
- },
149
- {
150
- "opt": "force",
151
- "description": ["If set, turns errors into warnings and continues.",
152
- "Out-of-range values are set to the closest range limit."]
153
- },
154
- ">",
155
- {
156
- "arg": "out_file",
157
- "mandatory": true,
158
- "description": ["Output file in FastQ format with the specified",
159
- "offset."]
160
- }
161
- ]
162
- },
163
- {
164
- "task": "FastQ.split.pl",
165
- "description": ["Splits a FastQ file into several FastQ files. This",
166
- "script can be used to separate interposed sister reads using any even",
167
- "number of output files."],
168
- "help_arg": "",
169
- "see_also": ["FastQ.interpose.pl","FastA.split.pl"],
170
- "options": [
171
- {
172
- "name": "in_file.fq",
173
- "arg": "in_file",
174
- "mandatory": true,
175
- "description": "Input file in FastQ format."
176
- },
177
- {
178
- "name": "out_base",
179
- "arg": "out_file",
180
- "mandatory": true,
181
- "description": ["Prefix for the name of the output files. It will be",
182
- "appended with .<i>.fastq, where <i> is a consecutive number",
183
- "starting in 1."]
184
- },
185
- {
186
- "name": "no_files",
187
- "arg": "integer",
188
- "default": 2,
189
- "description": "Number of files to generate."
190
- }
191
- ]
192
- },
193
- {
194
- "task": "FastQ.tag.rb",
195
- "description": "Generates easy-to-parse tagged reads from FastQ files.",
196
- "see_also": ["FastA.tag.rb"],
197
- "help_arg": "--help",
198
- "options": [
199
- {
200
- "name": "Input file",
201
- "opt": "--in",
202
- "arg": "in_file",
203
- "mandatory": true,
204
- "description": [
205
- "FastQ file containing the sequences.",
206
- "Supports compression with .gz extension."
207
- ]
208
- },
209
- {
210
- "name": "Output file",
211
- "opt": "--out",
212
- "arg": "out_file",
213
- "mandatory": true,
214
- "description": [
215
- "FastQ to create.",
216
- "Supports compression with .gz extension."
217
- ]
218
- },
219
- {
220
- "opt": "--prefix",
221
- "arg": "string",
222
- "description": "Prefix to use in all IDs."
223
- },
224
- {
225
- "opt": "--suffix",
226
- "arg": "string",
227
- "description": "Suffix to use in all IDs."
228
- },
229
- {
230
- "opt": "--quiet",
231
- "description": "Run quietly (no STDERR output)."
232
- }
233
- ]
234
- },
235
- {
236
- "task": "FastQ.toFastA.awk",
237
- "description": "Translates FastQ files into FastA.",
238
- "see_also": "FastA.toFastQ.rb",
239
- "help_arg": "'' --help",
240
- "options": [
241
- "<",
242
- {
243
- "arg": "in_file",
244
- "mandatory": true,
245
- "description": "Input FastQ file."
246
- },
247
- ">",
248
- {
249
- "arg": "out_file",
250
- "mandatory": true,
251
- "description": "Output FastA file."
252
- }
253
- ]
254
- },
255
- {
256
- "task": "FastQ.test-error.rb",
257
- "description": ["Compares the estimated error of sequencing reads",
258
- "(Q-score) with observed mismatches (identity against a know",
259
- "reference sequence)."],
260
- "help_arg": "--help",
261
- "options": [
262
- {
263
- "name": "FastQ",
264
- "opt": "--fastq",
265
- "arg": "in_file",
266
- "mandatory": true,
267
- "description": "FastQ file containing the sequences."
268
- },
269
- {
270
- "name": "Tabular BLAST",
271
- "opt": "--blast",
272
- "arg": "in_file",
273
- "mandatory": true,
274
- "description": ["Tabular BLAST file mapping reads to reference",
275
- "sequences."]
276
- },
277
- {
278
- "name": "Output",
279
- "opt": "--out",
280
- "arg": "out_file",
281
- "mandatory": true,
282
- "description": "Output tab-delimited file to create."
283
- },
284
- {
285
- "opt": "--quiet",
286
- "description": "Run quietly (no STDERR output)."
287
- }
288
- ]
289
- }
290
- ]
291
- }
@@ -1,126 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "Table.barplot.R",
5
- "description": "Creates nice barplots from tab-delimited tables.",
6
- "requires": [ { "r_package": "optparse" } ],
7
- "help_arg": "--help",
8
- "options": [
9
- {
10
- "name": "Input file",
11
- "opt": "--x",
12
- "arg": "in_file",
13
- "mandatory": true,
14
- "description": ["A tab-delimited file containing header (first row)",
15
- "and row names (first column)."]
16
- },
17
- {
18
- "opt": "--sizes",
19
- "arg": "string",
20
- "description": ["A numeric vector containing the real size of the",
21
- "samples (columns) in the same order of the input table. If set,",
22
- "the values are assumed to be 100%, otherwise the sum of the",
23
- "columns is used. Separate values by commas."]
24
- },
25
- {
26
- "opt": "--top",
27
- "arg": "integer",
28
- "default": 25,
29
- "description": ["Maximum number of categories to display. Any",
30
- "additional categories will be listed as 'Others'."]
31
- },
32
- {
33
- "opt": "--colors-per-group",
34
- "arg": "integer",
35
- "default": 9,
36
- "description": ["Number of categories in the first two saturation",
37
- "groups of colors. The third group contains the remaining",
38
- "categories if needed."]
39
- },
40
- {
41
- "opt": "--bars-width",
42
- "arg": "integer",
43
- "default": 4,
44
- "description": "Width of the barplot with respect to the legend."
45
- },
46
- {
47
- "opt": "--legend-ncol",
48
- "arg": "integer",
49
- "default": 1,
50
- "description": "Number of columns in the legend."
51
- },
52
- {
53
- "opt": "--other-col",
54
- "arg": "string",
55
- "default": "#000000",
56
- "description": "Color of the 'Others' category."
57
- },
58
- {
59
- "opt": "--add-trend",
60
- "description": ["Controls if semi-transparent areas are to be",
61
- "plotted between the bars to connect the regions (trend regions)."]
62
- },
63
- {
64
- "opt": "--organic-trend",
65
- "description": ["Controls if the trend regions are to be smoothed",
66
- "(curves). By default, trend regions have straight edges. If TRUE,",
67
- "forces add.trend=TRUE."]
68
- },
69
- {
70
- "opt": "--sort-by",
71
- "arg": "string",
72
- "default": "median",
73
- "description": ["Any function that takes a numeric vector and",
74
- "returns a numeric scalar. This function is applied to each row,",
75
- "and the resulting values are used to sort the rows",
76
- "(decreasingly). Good options include: sd, min, max, mean, median."]
77
- },
78
- {
79
- "opt": "--min-report",
80
- "arg": "integer",
81
- "default": 101,
82
- "description": ["Minimum percentage to report the value in the plot.",
83
- "Any value above 100 indicates that no values are to be reported."]
84
- },
85
- {
86
- "opt": "--order",
87
- "arg": "string",
88
- "description": ["Controls how the rows should be ordered. If empty",
89
- "(default), sort.by is applied per row and the results are sorted",
90
- "decreasingly. If NA, no sorting is performed, i.e., the original",
91
- "order is respected. If a vector is provided, it is assumed to be",
92
- "the custom order to be used (either by numeric index or by row",
93
- "names). Separate values by commas."]
94
- },
95
- {
96
- "opt": "--col",
97
- "arg": "string",
98
- "description": ["Colors to use. If provided, overrides the variables",
99
- "`top` and `colors.per.group`, but `other.col` is still used if",
100
- "the vector is insufficient for all the rows. Separate values by",
101
- "commas. An additional palette is available when using value",
102
- "'coto' (palette contributed by Luis (Coto) Orellana)."]
103
- },
104
- {
105
- "arg": "out_file",
106
- "mandatory": true,
107
- "description": "Output file in PDF format."
108
- },
109
- {
110
- "name": "width",
111
- "arg": "float",
112
- "mandatory": true,
113
- "default": 7,
114
- "description": "Width of the plot (in inches)."
115
- },
116
- {
117
- "name": "height",
118
- "arg": "float",
119
- "mandatory": true,
120
- "default": 7,
121
- "description": "Height of the plot (in inches)."
122
- }
123
- ]
124
- }
125
- ]
126
- }
@@ -1,137 +0,0 @@
1
- {
2
- "tasks": [
3
- {
4
- "task": "BedGraph.tad.rb",
5
- "description": ["Estimates the truncated average sequencing depth (TAD)",
6
- "from a BedGraph file."],
7
- "warn": ["This script doesn't consider zero-coverage positions if",
8
- "missing from the file. If you produce your BedGraph file with",
9
- "bedtools genomecov and want to consider zero-coverage position, be",
10
- "sure to use -bga (not -bg)."],
11
- "see_also": ["BedGraph.window.rb",
12
- "BlastTab.seqdepth.pl", "BlastTab.seqdepth_ZIP.pl"],
13
- "help_arg": "--help",
14
- "options": [
15
- {
16
- "opt": "--input",
17
- "arg": "in_file",
18
- "mandatory": true,
19
- "description": "Input BedGraph file."
20
- },
21
- {
22
- "opt": "--range",
23
- "arg": "float",
24
- "default": 0.5,
25
- "description": ["Central range to consider, between 0 and 1. By",
26
- "default: inter-quartile range (0.5)."]
27
- },
28
- {
29
- "opt": "--per-seq",
30
- "description": ["Calculate averages per reference sequence, not",
31
- "total. Assumes a sorted BedGraph file."]
32
- },
33
- {
34
- "opt": "--length",
35
- "description": "Add sequence length to the output."
36
- }
37
- ]
38
- },
39
- {
40
- "task": "BedGraph.window.rb",
41
- "description": ["Estimates the sequencing depth per windows from a",
42
- "BedGraph file."],
43
- "warn": ["This script doesn't consider zero-coverage positions if",
44
- "missing from the file. If you produce your BedGraph file with",
45
- "bedtools genomecov and want to consider zero-coverage position, be",
46
- "sure to use -bga (not -bg)."],
47
- "see_also": ["BedGraph.tad.rb",
48
- "BlastTab.seqdepth.pl", "BlastTab.seqdepth_ZIP.pl"],
49
- "help_arg": "--help",
50
- "options": [
51
- {
52
- "opt": "--input",
53
- "arg": "in_file",
54
- "mandatory": true,
55
- "description": "Input BedGraph file."
56
- },
57
- {
58
- "name": "Window size",
59
- "opt": "--win",
60
- "arg": "float",
61
- "default": 1000,
62
- "description": "Window size, in base pairs."
63
- }
64
- ]
65
- },
66
- {
67
- "task": "sam.filter.rb",
68
- "description": ["Filters a SAM or BAM file by target sequences and/or",
69
- "identity."],
70
- "see_also": ["anir.rb"],
71
- "help_arg": "--help",
72
- "options": [
73
- {
74
- "opt": "--genome",
75
- "arg": "in_file",
76
- "mandatory": true,
77
- "description": ["Genome assembly.",
78
- "Supports compression with .gz extension."]
79
- },
80
- {
81
- "opt": "--mapping",
82
- "arg": "in_file",
83
- "mandatory": true,
84
- "description": ["Mapping file.",
85
- "Supports compression with .gz extension."]
86
- },
87
- {
88
- "opt": "--out-sam",
89
- "arg": "out_file",
90
- "mandatory": true,
91
- "description": ["Output filtered file in SAM format.",
92
- "Supports compression with .gz extension."]
93
- },
94
- {
95
- "opt": "--g-format",
96
- "arg": "select",
97
- "values": ["fasta", "list"],
98
- "default": "fasta",
99
- "description": ["Genome assembly format."]
100
- },
101
- {
102
- "opt": "--m-format",
103
- "arg": "select",
104
- "values": ["sam", "bam"],
105
- "default": "sam",
106
- "description": ["Mapping file format. SAM supports compression with",
107
- ".gz file extension."]
108
- },
109
- {
110
- "opt": "--identity",
111
- "arg": "float",
112
- "description": "Set a fixed threshold of percent identity.",
113
- "default": 95.0
114
- },
115
- {
116
- "opt": "--no-header",
117
- "description": "Do not include the headers."
118
- },
119
- {
120
- "opt": "--threads",
121
- "arg": "integer",
122
- "description": "Threads to use.",
123
- "default": 2
124
- },
125
- {
126
- "opt": "--log",
127
- "arg": "out_file",
128
- "description": "Log file to save output."
129
- },
130
- {
131
- "opt": "--quiet",
132
- "description": "Run quietly."
133
- }
134
- ]
135
- }
136
- ]
137
- }