miga-base 0.7.26.0 → 0.7.26.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (276) hide show
  1. checksums.yaml +4 -4
  2. data/lib/miga/version.rb +1 -1
  3. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Archaea_SCG.hmm +41964 -0
  4. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Bacteria_SCG.hmm +32439 -0
  5. data/utils/FastAAI/00.Libraries/01.SCG_HMMs/Complete_SCG_DB.hmm +62056 -0
  6. data/utils/FastAAI/FastAAI/FastAAI +1336 -0
  7. data/utils/FastAAI/README.md +84 -0
  8. data/utils/FastAAI/kAAI_v1.0_virus.py +1296 -0
  9. data/utils/enveomics/Docs/recplot2.md +244 -0
  10. data/utils/enveomics/Examples/aai-matrix.bash +66 -0
  11. data/utils/enveomics/Examples/ani-matrix.bash +66 -0
  12. data/utils/enveomics/Examples/essential-phylogeny.bash +105 -0
  13. data/utils/enveomics/Examples/unus-genome-phylogeny.bash +100 -0
  14. data/utils/enveomics/LICENSE.txt +73 -0
  15. data/utils/enveomics/Makefile +52 -0
  16. data/utils/enveomics/Manifest/Tasks/aasubs.json +103 -0
  17. data/utils/enveomics/Manifest/Tasks/blasttab.json +786 -0
  18. data/utils/enveomics/Manifest/Tasks/distances.json +161 -0
  19. data/utils/enveomics/Manifest/Tasks/fasta.json +766 -0
  20. data/utils/enveomics/Manifest/Tasks/fastq.json +243 -0
  21. data/utils/enveomics/Manifest/Tasks/graphics.json +126 -0
  22. data/utils/enveomics/Manifest/Tasks/mapping.json +67 -0
  23. data/utils/enveomics/Manifest/Tasks/ogs.json +382 -0
  24. data/utils/enveomics/Manifest/Tasks/other.json +829 -0
  25. data/utils/enveomics/Manifest/Tasks/remote.json +355 -0
  26. data/utils/enveomics/Manifest/Tasks/sequence-identity.json +501 -0
  27. data/utils/enveomics/Manifest/Tasks/tables.json +308 -0
  28. data/utils/enveomics/Manifest/Tasks/trees.json +68 -0
  29. data/utils/enveomics/Manifest/Tasks/variants.json +111 -0
  30. data/utils/enveomics/Manifest/categories.json +156 -0
  31. data/utils/enveomics/Manifest/examples.json +154 -0
  32. data/utils/enveomics/Manifest/tasks.json +4 -0
  33. data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +69 -0
  34. data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +1 -0
  35. data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +1 -0
  36. data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +1 -0
  37. data/utils/enveomics/Pipelines/assembly.pbs/README.md +189 -0
  38. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +112 -0
  39. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +23 -0
  40. data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +44 -0
  41. data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +50 -0
  42. data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +37 -0
  43. data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +68 -0
  44. data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +49 -0
  45. data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +80 -0
  46. data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +57 -0
  47. data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +63 -0
  48. data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +38 -0
  49. data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +73 -0
  50. data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +21 -0
  51. data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +72 -0
  52. data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +98 -0
  53. data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +1 -0
  54. data/utils/enveomics/Pipelines/blast.pbs/README.md +127 -0
  55. data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +109 -0
  56. data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +128 -0
  57. data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +16 -0
  58. data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +22 -0
  59. data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +26 -0
  60. data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +89 -0
  61. data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +29 -0
  62. data/utils/enveomics/Pipelines/idba.pbs/README.md +49 -0
  63. data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +95 -0
  64. data/utils/enveomics/Pipelines/idba.pbs/run.pbs +56 -0
  65. data/utils/enveomics/Pipelines/trim.pbs/README.md +54 -0
  66. data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +70 -0
  67. data/utils/enveomics/Pipelines/trim.pbs/run.pbs +130 -0
  68. data/utils/enveomics/README.md +42 -0
  69. data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +171 -0
  70. data/utils/enveomics/Scripts/Aln.cat.rb +163 -0
  71. data/utils/enveomics/Scripts/Aln.convert.pl +35 -0
  72. data/utils/enveomics/Scripts/AlphaDiversity.pl +152 -0
  73. data/utils/enveomics/Scripts/BedGraph.tad.rb +93 -0
  74. data/utils/enveomics/Scripts/BedGraph.window.rb +71 -0
  75. data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +102 -0
  76. data/utils/enveomics/Scripts/BlastTab.addlen.rb +63 -0
  77. data/utils/enveomics/Scripts/BlastTab.advance.bash +48 -0
  78. data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +55 -0
  79. data/utils/enveomics/Scripts/BlastTab.catsbj.pl +104 -0
  80. data/utils/enveomics/Scripts/BlastTab.cogCat.rb +76 -0
  81. data/utils/enveomics/Scripts/BlastTab.filter.pl +47 -0
  82. data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +194 -0
  83. data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +104 -0
  84. data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +157 -0
  85. data/utils/enveomics/Scripts/BlastTab.recplot2.R +48 -0
  86. data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +86 -0
  87. data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +119 -0
  88. data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +86 -0
  89. data/utils/enveomics/Scripts/BlastTab.subsample.pl +47 -0
  90. data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +114 -0
  91. data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +90 -0
  92. data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +101 -0
  93. data/utils/enveomics/Scripts/Chao1.pl +97 -0
  94. data/utils/enveomics/Scripts/CharTable.classify.rb +234 -0
  95. data/utils/enveomics/Scripts/EBIseq2tax.rb +83 -0
  96. data/utils/enveomics/Scripts/FastA.N50.pl +56 -0
  97. data/utils/enveomics/Scripts/FastA.extract.rb +152 -0
  98. data/utils/enveomics/Scripts/FastA.filter.pl +52 -0
  99. data/utils/enveomics/Scripts/FastA.filterLen.pl +28 -0
  100. data/utils/enveomics/Scripts/FastA.filterN.pl +60 -0
  101. data/utils/enveomics/Scripts/FastA.fragment.rb +92 -0
  102. data/utils/enveomics/Scripts/FastA.gc.pl +42 -0
  103. data/utils/enveomics/Scripts/FastA.interpose.pl +93 -0
  104. data/utils/enveomics/Scripts/FastA.length.pl +38 -0
  105. data/utils/enveomics/Scripts/FastA.mask.rb +89 -0
  106. data/utils/enveomics/Scripts/FastA.per_file.pl +36 -0
  107. data/utils/enveomics/Scripts/FastA.qlen.pl +57 -0
  108. data/utils/enveomics/Scripts/FastA.rename.pl +65 -0
  109. data/utils/enveomics/Scripts/FastA.revcom.pl +23 -0
  110. data/utils/enveomics/Scripts/FastA.sample.rb +83 -0
  111. data/utils/enveomics/Scripts/FastA.slider.pl +85 -0
  112. data/utils/enveomics/Scripts/FastA.split.pl +55 -0
  113. data/utils/enveomics/Scripts/FastA.split.rb +79 -0
  114. data/utils/enveomics/Scripts/FastA.subsample.pl +131 -0
  115. data/utils/enveomics/Scripts/FastA.tag.rb +65 -0
  116. data/utils/enveomics/Scripts/FastA.wrap.rb +48 -0
  117. data/utils/enveomics/Scripts/FastQ.filter.pl +54 -0
  118. data/utils/enveomics/Scripts/FastQ.interpose.pl +90 -0
  119. data/utils/enveomics/Scripts/FastQ.offset.pl +90 -0
  120. data/utils/enveomics/Scripts/FastQ.split.pl +53 -0
  121. data/utils/enveomics/Scripts/FastQ.tag.rb +63 -0
  122. data/utils/enveomics/Scripts/FastQ.test-error.rb +81 -0
  123. data/utils/enveomics/Scripts/FastQ.toFastA.awk +24 -0
  124. data/utils/enveomics/Scripts/GFF.catsbj.pl +127 -0
  125. data/utils/enveomics/Scripts/GenBank.add_fields.rb +84 -0
  126. data/utils/enveomics/Scripts/HMM.essential.rb +351 -0
  127. data/utils/enveomics/Scripts/HMM.haai.rb +168 -0
  128. data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +83 -0
  129. data/utils/enveomics/Scripts/JPlace.distances.rb +88 -0
  130. data/utils/enveomics/Scripts/JPlace.to_iToL.rb +320 -0
  131. data/utils/enveomics/Scripts/M5nr.getSequences.rb +81 -0
  132. data/utils/enveomics/Scripts/MeTaxa.distribution.pl +198 -0
  133. data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +35 -0
  134. data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +49 -0
  135. data/utils/enveomics/Scripts/NCBIacc2tax.rb +92 -0
  136. data/utils/enveomics/Scripts/Newick.autoprune.R +27 -0
  137. data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +228 -0
  138. data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +32 -0
  139. data/utils/enveomics/Scripts/RefSeq.download.bash +48 -0
  140. data/utils/enveomics/Scripts/SRA.download.bash +57 -0
  141. data/utils/enveomics/Scripts/TRIBS.plot-test.R +36 -0
  142. data/utils/enveomics/Scripts/TRIBS.test.R +39 -0
  143. data/utils/enveomics/Scripts/Table.barplot.R +31 -0
  144. data/utils/enveomics/Scripts/Table.df2dist.R +30 -0
  145. data/utils/enveomics/Scripts/Table.filter.pl +61 -0
  146. data/utils/enveomics/Scripts/Table.merge.pl +77 -0
  147. data/utils/enveomics/Scripts/Table.replace.rb +69 -0
  148. data/utils/enveomics/Scripts/Table.round.rb +63 -0
  149. data/utils/enveomics/Scripts/Table.split.pl +57 -0
  150. data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +227 -0
  151. data/utils/enveomics/Scripts/VCF.KaKs.rb +147 -0
  152. data/utils/enveomics/Scripts/VCF.SNPs.rb +88 -0
  153. data/utils/enveomics/Scripts/aai.rb +418 -0
  154. data/utils/enveomics/Scripts/ani.rb +362 -0
  155. data/utils/enveomics/Scripts/clust.rand.rb +102 -0
  156. data/utils/enveomics/Scripts/gi2tax.rb +103 -0
  157. data/utils/enveomics/Scripts/in_silico_GA_GI.pl +96 -0
  158. data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
  159. data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
  160. data/utils/enveomics/Scripts/lib/enveomics.R +1 -0
  161. data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +24 -0
  162. data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +253 -0
  163. data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +182 -0
  164. data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +74 -0
  165. data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +237 -0
  166. data/utils/enveomics/Scripts/lib/enveomics_rb/stat.rb +30 -0
  167. data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +135 -0
  168. data/utils/enveomics/Scripts/ogs.annotate.rb +88 -0
  169. data/utils/enveomics/Scripts/ogs.core-pan.rb +160 -0
  170. data/utils/enveomics/Scripts/ogs.extract.rb +125 -0
  171. data/utils/enveomics/Scripts/ogs.mcl.rb +186 -0
  172. data/utils/enveomics/Scripts/ogs.rb +104 -0
  173. data/utils/enveomics/Scripts/ogs.stats.rb +131 -0
  174. data/utils/enveomics/Scripts/rbm.rb +146 -0
  175. data/utils/enveomics/Tests/Makefile +10 -0
  176. data/utils/enveomics/Tests/Mgen_M2288.faa +3189 -0
  177. data/utils/enveomics/Tests/Mgen_M2288.fna +8282 -0
  178. data/utils/enveomics/Tests/Mgen_M2321.fna +8288 -0
  179. data/utils/enveomics/Tests/Nequ_Kin4M.faa +2970 -0
  180. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
  181. data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +7 -0
  182. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +17 -0
  183. data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +137 -0
  184. data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +123 -0
  185. data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +200 -0
  186. data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +55 -0
  187. data/utils/enveomics/Tests/alkB.nwk +1 -0
  188. data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +13 -0
  189. data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +17 -0
  190. data/utils/enveomics/Tests/hiv1.faa +59 -0
  191. data/utils/enveomics/Tests/hiv1.fna +134 -0
  192. data/utils/enveomics/Tests/hiv2.faa +70 -0
  193. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +233 -0
  194. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +1 -0
  195. data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +233 -0
  196. data/utils/enveomics/Tests/phyla_counts.tsv +10 -0
  197. data/utils/enveomics/Tests/primate_lentivirus.ogs +11 -0
  198. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +9 -0
  199. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +8 -0
  200. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +6 -0
  201. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +9 -0
  202. data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +6 -0
  203. data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +6 -0
  204. data/utils/enveomics/build_enveomics_r.bash +45 -0
  205. data/utils/enveomics/enveomics.R/DESCRIPTION +31 -0
  206. data/utils/enveomics/enveomics.R/NAMESPACE +39 -0
  207. data/utils/enveomics/enveomics.R/R/autoprune.R +155 -0
  208. data/utils/enveomics/enveomics.R/R/barplot.R +184 -0
  209. data/utils/enveomics/enveomics.R/R/cliopts.R +135 -0
  210. data/utils/enveomics/enveomics.R/R/df2dist.R +154 -0
  211. data/utils/enveomics/enveomics.R/R/growthcurve.R +331 -0
  212. data/utils/enveomics/enveomics.R/R/recplot.R +354 -0
  213. data/utils/enveomics/enveomics.R/R/recplot2.R +1631 -0
  214. data/utils/enveomics/enveomics.R/R/tribs.R +583 -0
  215. data/utils/enveomics/enveomics.R/R/utils.R +50 -0
  216. data/utils/enveomics/enveomics.R/README.md +80 -0
  217. data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
  218. data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
  219. data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +17 -0
  220. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +17 -0
  221. data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +17 -0
  222. data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +25 -0
  223. data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +46 -0
  224. data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +23 -0
  225. data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +47 -0
  226. data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +23 -0
  227. data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +23 -0
  228. data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +32 -0
  229. data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +91 -0
  230. data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +57 -0
  231. data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +24 -0
  232. data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +19 -0
  233. data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +39 -0
  234. data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +38 -0
  235. data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +40 -0
  236. data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +67 -0
  237. data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +37 -0
  238. data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +122 -0
  239. data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +45 -0
  240. data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +24 -0
  241. data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +68 -0
  242. data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +25 -0
  243. data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +21 -0
  244. data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +19 -0
  245. data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +19 -0
  246. data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +41 -0
  247. data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +29 -0
  248. data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +18 -0
  249. data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +40 -0
  250. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +36 -0
  251. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +19 -0
  252. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +19 -0
  253. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +27 -0
  254. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +41 -0
  255. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +17 -0
  256. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +43 -0
  257. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +37 -0
  258. data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +74 -0
  259. data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +59 -0
  260. data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +27 -0
  261. data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +32 -0
  262. data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +59 -0
  263. data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +28 -0
  264. data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +27 -0
  265. data/utils/enveomics/enveomics.R/man/growth.curves.Rd +14 -0
  266. data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +13 -0
  267. data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +63 -0
  268. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +38 -0
  269. data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +38 -0
  270. data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +111 -0
  271. data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +19 -0
  272. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +19 -0
  273. data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +19 -0
  274. data/utils/enveomics/globals.mk +8 -0
  275. data/utils/enveomics/manifest.json +9 -0
  276. metadata +277 -4
@@ -0,0 +1,57 @@
1
+ % Generated by roxygen2: do not edit by hand
2
+ % Please edit documentation in R/cliopts.R
3
+ \name{enve.cliopts}
4
+ \alias{enve.cliopts}
5
+ \title{Enveomics: Cliopts}
6
+ \usage{
7
+ enve.cliopts(fx, rd_file, positional_arguments, usage, mandatory = c(),
8
+ vectorize = c(), ignore = c(), number = c(), defaults = list(),
9
+ o_desc = list(), p_desc = "")
10
+ }
11
+ \arguments{
12
+ \item{fx}{Function for which the interface should be generated.}
13
+
14
+ \item{rd_file}{(Optional) .Rd file with the standard documentation of
15
+ the function.}
16
+
17
+ \item{positional_arguments}{(Optional) Number of \strong{positional}
18
+ arguments passed to \code{\link[optparse]{parse_args}}
19
+ (package: \pkg{optparse}).}
20
+
21
+ \item{usage}{(Optional) Usage passed to \code{\link[optparse]{OptionParser}}
22
+ (package: \pkg{optparse}).}
23
+
24
+ \item{mandatory}{Mandatory arguments.}
25
+
26
+ \item{vectorize}{Arguments of the function to vectorize (comma-delimited).
27
+ If numeric, use also \code{number}.}
28
+
29
+ \item{ignore}{Arguments of the function to ignore.}
30
+
31
+ \item{number}{Force these arguments as numerics. Useful for numeric
32
+ vectors (see \code{vectorize}) or arguments with no defaults.}
33
+
34
+ \item{defaults}{Defaults to use instead of the ones provided by the
35
+ formals.}
36
+
37
+ \item{o_desc}{Descriptions of the options. Help from \code{rd} is ignored
38
+ for arguments present in this list.}
39
+
40
+ \item{p_desc}{Description Description of the function. Help from \code{rd}
41
+ is ignored for the function description unless this value is an empty string.}
42
+ }
43
+ \value{
44
+ Returns a list with keys:
45
+ \itemize{
46
+ \item{\code{options}, a named list with the values for the function's
47
+ arguments}
48
+ \item{\code{args}, a vector with zero or more strings containing the
49
+ positional arguments}}
50
+ }
51
+ \description{
52
+ Generates nicely formatted command-line interfaces for functions
53
+ (\strong{closures} only).
54
+ }
55
+ \author{
56
+ Luis M. Rodriguez-R [aut, cre]
57
+ }
@@ -0,0 +1,24 @@
1
+ % Generated by roxygen2: do not edit by hand
2
+ % Please edit documentation in R/utils.R
3
+ \name{enve.col.alpha}
4
+ \alias{enve.col.alpha}
5
+ \title{Enveomics: Color Alpha}
6
+ \usage{
7
+ enve.col.alpha(col, alpha = 1/2)
8
+ }
9
+ \arguments{
10
+ \item{col}{Color or vector of colors. It can be any value supported by
11
+ \code{\link[grDevices]{col2rgb}}, such as \code{darkred} or \code{#009988}.}
12
+
13
+ \item{alpha}{Alpha value to add to the color, from 0 to 1.}
14
+ }
15
+ \value{
16
+ Returns a color or a vector of colors in \emph{hex} notation,
17
+ including \code{alpha}.
18
+ }
19
+ \description{
20
+ Modify alpha in a color (or vector of colors).
21
+ }
22
+ \author{
23
+ Luis M. Rodriguez-R [aut, cre]
24
+ }
@@ -0,0 +1,19 @@
1
+ % Generated by roxygen2: do not edit by hand
2
+ % Please edit documentation in R/growthcurve.R
3
+ \name{enve.col2alpha}
4
+ \alias{enve.col2alpha}
5
+ \title{Enveomics: Color to Alpha}
6
+ \usage{
7
+ enve.col2alpha(x, alpha)
8
+ }
9
+ \arguments{
10
+ \item{x}{A vector of any value base colors.}
11
+
12
+ \item{alpha}{Alpha level to set (in the 0-1 range).}
13
+ }
14
+ \description{
15
+ Takes a vector of colors and sets the alpha.
16
+ }
17
+ \author{
18
+ Luis M. Rodriguez-R [aut, cre]
19
+ }
@@ -0,0 +1,39 @@
1
+ % Generated by roxygen2: do not edit by hand
2
+ % Please edit documentation in R/df2dist.R
3
+ \name{enve.df2dist}
4
+ \alias{enve.df2dist}
5
+ \title{Enveomics: Data Frame to Dist}
6
+ \usage{
7
+ enve.df2dist(x, obj1.index = 1, obj2.index = 2, dist.index = 3,
8
+ default.d = NA, max.sim = 0)
9
+ }
10
+ \arguments{
11
+ \item{x}{A dataframe (or coercible object) with at least three columns:
12
+ \enumerate{
13
+ \item ID of the object 1,
14
+ \item ID of the object 2, and
15
+ \item distance between the two objects.}}
16
+
17
+ \item{obj1.index}{Index of the column containing the ID of the object 1.}
18
+
19
+ \item{obj2.index}{Index of the column containing the ID of the object 2.}
20
+
21
+ \item{dist.index}{Index of the column containing the distance.}
22
+
23
+ \item{default.d}{Default value (for missing values).}
24
+
25
+ \item{max.sim}{If not zero, assumes that the values are similarity
26
+ (not distance) and this is the maximum similarity (corresponding to
27
+ distance 0). Applies transformation:
28
+ \eqn{distance = (max.sim - values)/max.sim.}}
29
+ }
30
+ \value{
31
+ Returns a \strong{dist} object.
32
+ }
33
+ \description{
34
+ Transform a dataframe (or coercible object, like a table) into a
35
+ \strong{dist} object.
36
+ }
37
+ \author{
38
+ Luis M. Rodriguez-R [aut, cre]
39
+ }
@@ -0,0 +1,38 @@
1
+ % Generated by roxygen2: do not edit by hand
2
+ % Please edit documentation in R/df2dist.R
3
+ \name{enve.df2dist.group}
4
+ \alias{enve.df2dist.group}
5
+ \title{Enveomics: Data Frame to Dist (Group)}
6
+ \usage{
7
+ enve.df2dist.group(x, obj1.index = 1, obj2.index = 2, dist.index = 3,
8
+ summary = median, empty.rm = TRUE)
9
+ }
10
+ \arguments{
11
+ \item{x}{A dataframe (or coercible object) with at least three columns:
12
+ \enumerate{
13
+ \item ID of the object 1,
14
+ \item ID of the object 2, and
15
+ \item distance between the two objects.}}
16
+
17
+ \item{obj1.index}{Index of the column containing the ID of the object 1.}
18
+
19
+ \item{obj2.index}{Index of the column containing the ID of the object 2.}
20
+
21
+ \item{dist.index}{Index of the column containing the distance.}
22
+
23
+ \item{summary}{Function summarizing the different distances between the
24
+ two objects.}
25
+
26
+ \item{empty.rm}{Remove rows with empty or \code{NA} groups.}
27
+ }
28
+ \value{
29
+ Returns a \strong{dist} object.
30
+ }
31
+ \description{
32
+ Transform a dataframe (or coercible object, like a table) into a
33
+ \strong{dist} object, where there are 1 or more distances between each pair
34
+ of objects.
35
+ }
36
+ \author{
37
+ Luis M. Rodriguez-R [aut, cre]
38
+ }
@@ -0,0 +1,40 @@
1
+ % Generated by roxygen2: do not edit by hand
2
+ % Please edit documentation in R/df2dist.R
3
+ \name{enve.df2dist.list}
4
+ \alias{enve.df2dist.list}
5
+ \title{Enveomics: Data Frame to Dist (List)}
6
+ \usage{
7
+ enve.df2dist.list(x, groups, obj1.index = 1, obj2.index = 2,
8
+ dist.index = 3, empty.rm = TRUE, ...)
9
+ }
10
+ \arguments{
11
+ \item{x}{A dataframe (or coercible object) with at least three columns:
12
+ \enumerate{
13
+ \item ID of the object 1,
14
+ \item ID of the object 2, and
15
+ \item distance between the two objects.}}
16
+
17
+ \item{groups}{Named array where the IDs correspond to the object IDs,
18
+ and the values correspond to the group.}
19
+
20
+ \item{obj1.index}{Index of the column containing the ID of the object 1.}
21
+
22
+ \item{obj2.index}{Index of the column containing the ID of the object 2.}
23
+
24
+ \item{dist.index}{Index of the column containing the distance.}
25
+
26
+ \item{empty.rm}{Remove incomplete matrices.}
27
+
28
+ \item{...}{Any other parameters supported by
29
+ \code{\link{enve.df2dist.group}}.}
30
+ }
31
+ \value{
32
+ Returns a \strong{list} of \strong{dist} objects.
33
+ }
34
+ \description{
35
+ Transform a dataframe (or coercible object, like a table)
36
+ into a \strong{dist} object.
37
+ }
38
+ \author{
39
+ Luis M. Rodriguez-R [aut, cre]
40
+ }
@@ -0,0 +1,67 @@
1
+ % Generated by roxygen2: do not edit by hand
2
+ % Please edit documentation in R/growthcurve.R
3
+ \name{enve.growthcurve}
4
+ \alias{enve.growthcurve}
5
+ \title{Enveomics: Growth Curve}
6
+ \usage{
7
+ enve.growthcurve(x, times = 1:nrow(x), triplicates = FALSE, design,
8
+ new.times = seq(min(times), max(times), length.out = length(times) *
9
+ 10), level = 0.95, interval = c("confidence", "prediction"),
10
+ plot = TRUE, FUN = function(t, K, r, P0) K * P0 * exp(r * t)/(K + P0
11
+ * (exp(r * t) - 1)), nls.opt = list(), ...)
12
+ }
13
+ \arguments{
14
+ \item{x}{Data frame (or coercible) containing the observed growth data
15
+ (e.g., O.D. values). Each column is an independent growth curve and each
16
+ row is a time point. \code{NA}'s are allowed.}
17
+
18
+ \item{times}{Vector with the times at which each row was taken. By default,
19
+ all rows are assumed to be part of constantly periodic measurements.}
20
+
21
+ \item{triplicates}{If \code{TRUE}, the columns are assumed to be sorted by
22
+ sample with three replicates by sample. It requires a number of columns
23
+ multiple of 3.}
24
+
25
+ \item{design}{Experimental design of the data. An \strong{array} of mode list
26
+ with sample names as index and the list of column names in each sample as
27
+ the values. By default, each column is assumed to be an independent sample
28
+ if \code{triplicates} is \code{FALSE}, or every three columns are assumed
29
+ to be a sample if \code{triplicates} is \code{TRUE}. In the latter case,
30
+ samples are simply numbered.}
31
+
32
+ \item{new.times}{Values of time for the fitted curve.}
33
+
34
+ \item{level}{Confidence (or prediction) interval in the fitted curve.}
35
+
36
+ \item{interval}{Type of interval to be calculated for the fitted curve.}
37
+
38
+ \item{plot}{Should the growth curve be plotted?}
39
+
40
+ \item{FUN}{Function to fit. By default: logistic growth with paramenters
41
+ \code{K}: carrying capacity,
42
+ \code{r}: intrinsic growth rate, and
43
+ \code{P0}: Initial population.}
44
+
45
+ \item{nls.opt}{Any additional options passed to \code{nls}.}
46
+
47
+ \item{...}{Any additional parameters to be passed to
48
+ \code{plot.enve.GrowthCurve}.}
49
+ }
50
+ \value{
51
+ Returns an \code{\link{enve.GrowthCurve}} object.
52
+ }
53
+ \description{
54
+ Calculates growth curves using the logistic growth function.
55
+ }
56
+ \examples{
57
+ # Load data
58
+ data("growth.curves", package="enveomics.R", envir=environment())
59
+ # Generate growth curves with different colors
60
+ g <- enve.growthcurve(growth.curves[,-1], growth.curves[,1], triplicates=TRUE)
61
+ # Generate black-and-white growth curves with different symbols
62
+ plot(g, pch=15:17, col="black", band.density=45, band.angle=c(-45,45,0))
63
+
64
+ }
65
+ \author{
66
+ Luis M. Rodriguez-R [aut, cre]
67
+ }
@@ -0,0 +1,37 @@
1
+ % Generated by roxygen2: do not edit by hand
2
+ % Please edit documentation in R/autoprune.R
3
+ \name{enve.prune.dist}
4
+ \alias{enve.prune.dist}
5
+ \title{Enveomics: Prune Dist}
6
+ \usage{
7
+ enve.prune.dist(t, dist.quantile = 0.25, min_dist, quiet = FALSE,
8
+ max_iters = 100, min_nodes_random = 40000, random_nodes_frx = 1)
9
+ }
10
+ \arguments{
11
+ \item{t}{A \strong{phylo} object or a path to the Newick file.}
12
+
13
+ \item{dist.quantile}{The quantile of edge lengths.}
14
+
15
+ \item{min_dist}{The minimum distance to allow between two tips.
16
+ If not set, \code{dist.quantile} is used instead to calculate it.}
17
+
18
+ \item{quiet}{Boolean indicating if the function must run without output.}
19
+
20
+ \item{max_iters}{Maximum number of iterations.}
21
+
22
+ \item{min_nodes_random}{Minimum number of nodes to trigger \emph{tip-pairs} nodes sampling.
23
+ This sampling is less reproducible and more computationally expensive,
24
+ but it's the only solution if the cophenetic matrix exceeds \code{2^31-1}
25
+ entries; above that, it cannot be represented in R.}
26
+
27
+ \item{random_nodes_frx}{Fraction of the nodes to be sampled if more than \code{min_nodes_random}.}
28
+ }
29
+ \value{
30
+ Returns a pruned \strong{phylo} object.
31
+ }
32
+ \description{
33
+ Automatically prunes a tree, to keep representatives of each clade.
34
+ }
35
+ \author{
36
+ Luis M. Rodriguez-R [aut, cre]
37
+ }
@@ -0,0 +1,122 @@
1
+ % Generated by roxygen2: do not edit by hand
2
+ % Please edit documentation in R/recplot.R
3
+ \name{enve.recplot}
4
+ \alias{enve.recplot}
5
+ \title{Enveomics: Recruitment Plots}
6
+ \usage{
7
+ enve.recplot(prefix, id.min = NULL, id.max = NULL, id.binsize = NULL,
8
+ id.splines = 0, id.metric = "id", id.summary = "sum",
9
+ pos.min = 1, pos.max = NULL, pos.binsize = 1000, pos.splines = 0,
10
+ rec.col1 = "white", rec.col2 = "black", main = NULL,
11
+ contig.col = grey(0.85), ret.recplot = FALSE, ret.hist = FALSE,
12
+ ret.mode = FALSE, id.cutoff = NULL, verbose = TRUE, ...)
13
+ }
14
+ \arguments{
15
+ \item{prefix}{Path to the prefix of the BlastTab.catsbj.pl output files. At
16
+ least the files \strong{.rec} and \strong{.lim} must exist with this prefix.}
17
+
18
+ \item{id.min}{Minimum identity to be considered. By default, the minimum detected
19
+ identity. This value is a percentage.}
20
+
21
+ \item{id.max}{Maximum identity to be considered. By default, 100\%.}
22
+
23
+ \item{id.binsize}{Size of the identity bins (vertical histograms). By default, 0.1 for
24
+ identity metrics and 5 for bit score.}
25
+
26
+ \item{id.splines}{Smoothing parameter for the splines in the identity histogram. Zero (0) for no
27
+ splines. A generally good value is 1/2. If non-zero, requires the \pkg{stats} package.}
28
+
29
+ \item{id.metric}{Metric of identity to be used (Y-axis).
30
+ It can be any unambiguous prefix of:
31
+ \itemize{
32
+ \item "identity"
33
+ \item "corrected identity"
34
+ \item "bit score"}}
35
+
36
+ \item{id.summary}{Method used to build the identity histogram (Horizontal axis of the right panel).
37
+ It can be any unambiguous prefix of:
38
+ \itemize{
39
+ \item "sum"
40
+ \item "average"
41
+ \item "median"
42
+ \item "90\% lower bound"
43
+ \item "90\% upper bound"
44
+ \item "95\% lower bound"
45
+ \item "95\% upper bound" }
46
+ The last four options
47
+ correspond to the upper and lower boundaries of the 90\% and 95\% empirical confidence
48
+ intervals.}
49
+
50
+ \item{pos.min}{Minimum (leftmost) position in the reference (concatenated) genome (in bp).}
51
+
52
+ \item{pos.max}{Maximum (rightmost) position in the reference (concatenated) genome (in bp).
53
+ By default: Length of the genome.}
54
+
55
+ \item{pos.binsize}{Size of the position bins (horizontal histograms) in bp.}
56
+
57
+ \item{pos.splines}{Smoothing parameter for the splines in the position histogram. Zero (0) for no splines.
58
+ If non-zero, requires the stats package.}
59
+
60
+ \item{rec.col1}{Lightest color in the recruitment plot.}
61
+
62
+ \item{rec.col2}{Darkest color in the recruitment plot.}
63
+
64
+ \item{main}{Title of the plot.}
65
+
66
+ \item{contig.col}{Color of the Contig boundaries. Set to \code{NA} to ignore Contig boundaries.}
67
+
68
+ \item{ret.recplot}{Indicates if the matrix of the recruitment plot is to be returned.}
69
+
70
+ \item{ret.hist}{Ignored, for backwards compatibility.}
71
+
72
+ \item{ret.mode}{Indicates if the mode of the identity is to be computed. It requires the
73
+ \pkg{modeest} package.}
74
+
75
+ \item{id.cutoff}{Minimum identity to consider an alignment as "top". By default, it is 0.95 for the
76
+ identity metrics and 95\% of the best scoring alignment for bit score.}
77
+
78
+ \item{verbose}{Indicates if the function should report the advance.}
79
+
80
+ \item{...}{Any additional graphic parameters to be passed to plot for all panels except the
81
+ recruitment plot (lower-left).}
82
+ }
83
+ \value{
84
+ Returns a list with the following elements:
85
+
86
+ \describe{
87
+ \item{\code{pos.marks}}{Midpoints of the position histogram.}
88
+ \item{\code{id.matrix}}{Midpoints of the identity histogram.}
89
+ \item{\code{recplot}}{Matrix containing the recruitment plot values
90
+ (if \code{ret.recplot=TRUE}).}
91
+ \item{\code{id.mean}}{Mean identity.}
92
+ \item{\code{id.median}}{Median identity.}
93
+ \item{\code{id.mode}}{Mode of the identity (if \code{ret.mode=TRUE}). Deprecated.}
94
+ \item{\code{id.hist}}{Values of the identity histogram (if \code{ret.hist=TRUE}).}
95
+ \item{\code{pos.hist.low}}{Values of the position histogram (depth) with "low"
96
+ identity (i.e., below id.cutoff) (if \code{ret.hist=TRUE}).}
97
+ \item{\code{pos.hist.top}}{Values of the position histogram (depth) with "top"
98
+ identity (i.e., above id.cutoff) (if \code{ret.hist=TRUE}).}
99
+ \item{\code{id.max}}{Value of \code{id.max}. This is returned because
100
+ \code{id.max=NULL} may vary.}
101
+ \item{\code{id.cutoff}}{Value of \code{id.cutoff}.
102
+ This is returned because \code{id.cutoff=NULL} may vary.}
103
+ \item{\code{seqdepth.mean.top}}{Average sequencing depth with identity above
104
+ \code{id.cutoff}.}
105
+ \item{\code{seqdepth.mean.low}}{Average sequencing depth with identity below
106
+ \code{id.cutoff}.}
107
+ \item{\code{seqdepth.mean.all}}{Average sequencing depth without identity filtering.}
108
+ \item{\code{seqdepth.median.top}}{Median sequencing depth with identity above
109
+ \code{id.cutoff}.}
110
+ \item{\code{seqdepth.median.low}}{Median sequencing depth with identity below
111
+ \code{id.cutoff}.}
112
+ \item{\code{seqdepth.median.all}}{Median sequencing depth without identity filtering.}
113
+ \item{\code{id.metric}}{Full name of the used identity metric.}
114
+ \item{\code{id.summary}}{Full name of the summary method used to build the identity plot.}}
115
+ }
116
+ \description{
117
+ Produces recruitment plots provided that BlastTab.catsbj.pl has
118
+ been previously executed. Requires the \pkg{gplots} library.
119
+ }
120
+ \author{
121
+ Luis M. Rodriguez-R [aut, cre]
122
+ }