miga-base 0.7.24.0 → 0.7.26.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/miga/cli/action/add.rb +9 -6
- data/lib/miga/cli/action/derep_wf.rb +1 -1
- data/lib/miga/cli/action/index_wf.rb +4 -2
- data/lib/miga/cli/action/init.rb +83 -68
- data/lib/miga/cli/action/init/files_helper.rb +2 -1
- data/lib/miga/cli/action/option.rb +21 -2
- data/lib/miga/cli/action/preproc_wf.rb +7 -5
- data/lib/miga/cli/action/wf.rb +40 -24
- data/lib/miga/cli/base.rb +16 -5
- data/lib/miga/common/with_option.rb +1 -1
- data/lib/miga/dataset/result.rb +2 -1
- data/lib/miga/project/base.rb +1 -1
- data/lib/miga/result.rb +18 -15
- data/lib/miga/version.rb +2 -2
- data/scripts/essential_genes.bash +17 -1
- data/scripts/miga.bash +8 -2
- data/test/lair_test.rb +1 -2
- data/test/result_test.rb +22 -0
- data/utils/distance/base.rb +9 -0
- data/utils/distance/commands.rb +183 -81
- data/utils/distance/database.rb +68 -9
- data/utils/distance/pipeline.rb +14 -18
- data/utils/distance/runner.rb +17 -30
- data/utils/distance/temporal.rb +4 -2
- data/utils/distances.rb +2 -2
- data/utils/requirements.txt +5 -5
- metadata +5 -272
- data/utils/enveomics/Docs/recplot2.md +0 -244
- data/utils/enveomics/Examples/aai-matrix.bash +0 -66
- data/utils/enveomics/Examples/ani-matrix.bash +0 -66
- data/utils/enveomics/Examples/essential-phylogeny.bash +0 -105
- data/utils/enveomics/Examples/unus-genome-phylogeny.bash +0 -100
- data/utils/enveomics/LICENSE.txt +0 -73
- data/utils/enveomics/Makefile +0 -52
- data/utils/enveomics/Manifest/Tasks/aasubs.json +0 -103
- data/utils/enveomics/Manifest/Tasks/blasttab.json +0 -786
- data/utils/enveomics/Manifest/Tasks/distances.json +0 -161
- data/utils/enveomics/Manifest/Tasks/fasta.json +0 -766
- data/utils/enveomics/Manifest/Tasks/fastq.json +0 -243
- data/utils/enveomics/Manifest/Tasks/graphics.json +0 -126
- data/utils/enveomics/Manifest/Tasks/mapping.json +0 -67
- data/utils/enveomics/Manifest/Tasks/ogs.json +0 -382
- data/utils/enveomics/Manifest/Tasks/other.json +0 -829
- data/utils/enveomics/Manifest/Tasks/remote.json +0 -355
- data/utils/enveomics/Manifest/Tasks/sequence-identity.json +0 -501
- data/utils/enveomics/Manifest/Tasks/tables.json +0 -308
- data/utils/enveomics/Manifest/Tasks/trees.json +0 -68
- data/utils/enveomics/Manifest/Tasks/variants.json +0 -111
- data/utils/enveomics/Manifest/categories.json +0 -156
- data/utils/enveomics/Manifest/examples.json +0 -154
- data/utils/enveomics/Manifest/tasks.json +0 -4
- data/utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash +0 -69
- data/utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl +0 -1
- data/utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl +0 -1
- data/utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl +0 -1
- data/utils/enveomics/Pipelines/assembly.pbs/README.md +0 -189
- data/utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash +0 -112
- data/utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash +0 -23
- data/utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash +0 -44
- data/utils/enveomics/Pipelines/assembly.pbs/RUNME.bash +0 -50
- data/utils/enveomics/Pipelines/assembly.pbs/kSelector.R +0 -37
- data/utils/enveomics/Pipelines/assembly.pbs/newbler.pbs +0 -68
- data/utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl +0 -49
- data/utils/enveomics/Pipelines/assembly.pbs/soap.pbs +0 -80
- data/utils/enveomics/Pipelines/assembly.pbs/stats.pbs +0 -57
- data/utils/enveomics/Pipelines/assembly.pbs/velvet.pbs +0 -63
- data/utils/enveomics/Pipelines/blast.pbs/01.pbs.bash +0 -38
- data/utils/enveomics/Pipelines/blast.pbs/02.pbs.bash +0 -73
- data/utils/enveomics/Pipelines/blast.pbs/03.pbs.bash +0 -21
- data/utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl +0 -72
- data/utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash +0 -98
- data/utils/enveomics/Pipelines/blast.pbs/FastA.split.pl +0 -1
- data/utils/enveomics/Pipelines/blast.pbs/README.md +0 -127
- data/utils/enveomics/Pipelines/blast.pbs/RUNME.bash +0 -109
- data/utils/enveomics/Pipelines/blast.pbs/TASK.check.bash +0 -128
- data/utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash +0 -16
- data/utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash +0 -22
- data/utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash +0 -26
- data/utils/enveomics/Pipelines/blast.pbs/TASK.run.bash +0 -89
- data/utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash +0 -29
- data/utils/enveomics/Pipelines/idba.pbs/README.md +0 -49
- data/utils/enveomics/Pipelines/idba.pbs/RUNME.bash +0 -95
- data/utils/enveomics/Pipelines/idba.pbs/run.pbs +0 -56
- data/utils/enveomics/Pipelines/trim.pbs/README.md +0 -54
- data/utils/enveomics/Pipelines/trim.pbs/RUNME.bash +0 -70
- data/utils/enveomics/Pipelines/trim.pbs/run.pbs +0 -130
- data/utils/enveomics/README.md +0 -42
- data/utils/enveomics/Scripts/AAsubs.log2ratio.rb +0 -171
- data/utils/enveomics/Scripts/Aln.cat.rb +0 -163
- data/utils/enveomics/Scripts/Aln.convert.pl +0 -35
- data/utils/enveomics/Scripts/AlphaDiversity.pl +0 -152
- data/utils/enveomics/Scripts/BedGraph.tad.rb +0 -93
- data/utils/enveomics/Scripts/BedGraph.window.rb +0 -71
- data/utils/enveomics/Scripts/BlastPairwise.AAsubs.pl +0 -102
- data/utils/enveomics/Scripts/BlastTab.addlen.rb +0 -63
- data/utils/enveomics/Scripts/BlastTab.advance.bash +0 -48
- data/utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl +0 -55
- data/utils/enveomics/Scripts/BlastTab.catsbj.pl +0 -104
- data/utils/enveomics/Scripts/BlastTab.cogCat.rb +0 -76
- data/utils/enveomics/Scripts/BlastTab.filter.pl +0 -47
- data/utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl +0 -194
- data/utils/enveomics/Scripts/BlastTab.metaxaPrep.pl +0 -104
- data/utils/enveomics/Scripts/BlastTab.pairedHits.rb +0 -157
- data/utils/enveomics/Scripts/BlastTab.recplot2.R +0 -48
- data/utils/enveomics/Scripts/BlastTab.seqdepth.pl +0 -86
- data/utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl +0 -119
- data/utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl +0 -86
- data/utils/enveomics/Scripts/BlastTab.subsample.pl +0 -47
- data/utils/enveomics/Scripts/BlastTab.sumPerHit.pl +0 -114
- data/utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl +0 -90
- data/utils/enveomics/Scripts/BlastTab.topHits_sorted.rb +0 -101
- data/utils/enveomics/Scripts/Chao1.pl +0 -97
- data/utils/enveomics/Scripts/CharTable.classify.rb +0 -234
- data/utils/enveomics/Scripts/EBIseq2tax.rb +0 -83
- data/utils/enveomics/Scripts/FastA.N50.pl +0 -56
- data/utils/enveomics/Scripts/FastA.extract.rb +0 -152
- data/utils/enveomics/Scripts/FastA.filter.pl +0 -52
- data/utils/enveomics/Scripts/FastA.filterLen.pl +0 -28
- data/utils/enveomics/Scripts/FastA.filterN.pl +0 -60
- data/utils/enveomics/Scripts/FastA.fragment.rb +0 -92
- data/utils/enveomics/Scripts/FastA.gc.pl +0 -42
- data/utils/enveomics/Scripts/FastA.interpose.pl +0 -93
- data/utils/enveomics/Scripts/FastA.length.pl +0 -38
- data/utils/enveomics/Scripts/FastA.mask.rb +0 -89
- data/utils/enveomics/Scripts/FastA.per_file.pl +0 -36
- data/utils/enveomics/Scripts/FastA.qlen.pl +0 -57
- data/utils/enveomics/Scripts/FastA.rename.pl +0 -65
- data/utils/enveomics/Scripts/FastA.revcom.pl +0 -23
- data/utils/enveomics/Scripts/FastA.sample.rb +0 -83
- data/utils/enveomics/Scripts/FastA.slider.pl +0 -85
- data/utils/enveomics/Scripts/FastA.split.pl +0 -55
- data/utils/enveomics/Scripts/FastA.split.rb +0 -79
- data/utils/enveomics/Scripts/FastA.subsample.pl +0 -131
- data/utils/enveomics/Scripts/FastA.tag.rb +0 -65
- data/utils/enveomics/Scripts/FastA.wrap.rb +0 -48
- data/utils/enveomics/Scripts/FastQ.filter.pl +0 -54
- data/utils/enveomics/Scripts/FastQ.interpose.pl +0 -90
- data/utils/enveomics/Scripts/FastQ.offset.pl +0 -90
- data/utils/enveomics/Scripts/FastQ.split.pl +0 -53
- data/utils/enveomics/Scripts/FastQ.tag.rb +0 -63
- data/utils/enveomics/Scripts/FastQ.test-error.rb +0 -81
- data/utils/enveomics/Scripts/FastQ.toFastA.awk +0 -24
- data/utils/enveomics/Scripts/GFF.catsbj.pl +0 -127
- data/utils/enveomics/Scripts/GenBank.add_fields.rb +0 -84
- data/utils/enveomics/Scripts/HMM.essential.rb +0 -351
- data/utils/enveomics/Scripts/HMM.haai.rb +0 -168
- data/utils/enveomics/Scripts/HMMsearch.extractIds.rb +0 -83
- data/utils/enveomics/Scripts/JPlace.distances.rb +0 -88
- data/utils/enveomics/Scripts/JPlace.to_iToL.rb +0 -320
- data/utils/enveomics/Scripts/M5nr.getSequences.rb +0 -81
- data/utils/enveomics/Scripts/MeTaxa.distribution.pl +0 -198
- data/utils/enveomics/Scripts/MyTaxa.fragsByTax.pl +0 -35
- data/utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb +0 -49
- data/utils/enveomics/Scripts/NCBIacc2tax.rb +0 -92
- data/utils/enveomics/Scripts/Newick.autoprune.R +0 -27
- data/utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl +0 -228
- data/utils/enveomics/Scripts/RecPlot2.compareIdentities.R +0 -32
- data/utils/enveomics/Scripts/RefSeq.download.bash +0 -48
- data/utils/enveomics/Scripts/SRA.download.bash +0 -57
- data/utils/enveomics/Scripts/TRIBS.plot-test.R +0 -36
- data/utils/enveomics/Scripts/TRIBS.test.R +0 -39
- data/utils/enveomics/Scripts/Table.barplot.R +0 -31
- data/utils/enveomics/Scripts/Table.df2dist.R +0 -30
- data/utils/enveomics/Scripts/Table.filter.pl +0 -61
- data/utils/enveomics/Scripts/Table.merge.pl +0 -77
- data/utils/enveomics/Scripts/Table.replace.rb +0 -69
- data/utils/enveomics/Scripts/Table.round.rb +0 -63
- data/utils/enveomics/Scripts/Table.split.pl +0 -57
- data/utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb +0 -227
- data/utils/enveomics/Scripts/VCF.KaKs.rb +0 -147
- data/utils/enveomics/Scripts/VCF.SNPs.rb +0 -88
- data/utils/enveomics/Scripts/aai.rb +0 -418
- data/utils/enveomics/Scripts/ani.rb +0 -362
- data/utils/enveomics/Scripts/clust.rand.rb +0 -102
- data/utils/enveomics/Scripts/gi2tax.rb +0 -103
- data/utils/enveomics/Scripts/in_silico_GA_GI.pl +0 -96
- data/utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz +0 -0
- data/utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz +0 -0
- data/utils/enveomics/Scripts/lib/enveomics.R +0 -1
- data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +0 -24
- data/utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb +0 -253
- data/utils/enveomics/Scripts/lib/enveomics_rb/og.rb +0 -182
- data/utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb +0 -74
- data/utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb +0 -237
- data/utils/enveomics/Scripts/lib/enveomics_rb/stat.rb +0 -30
- data/utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb +0 -135
- data/utils/enveomics/Scripts/ogs.annotate.rb +0 -88
- data/utils/enveomics/Scripts/ogs.core-pan.rb +0 -160
- data/utils/enveomics/Scripts/ogs.extract.rb +0 -125
- data/utils/enveomics/Scripts/ogs.mcl.rb +0 -186
- data/utils/enveomics/Scripts/ogs.rb +0 -104
- data/utils/enveomics/Scripts/ogs.stats.rb +0 -131
- data/utils/enveomics/Scripts/rbm.rb +0 -146
- data/utils/enveomics/Tests/Makefile +0 -10
- data/utils/enveomics/Tests/Mgen_M2288.faa +0 -3189
- data/utils/enveomics/Tests/Mgen_M2288.fna +0 -8282
- data/utils/enveomics/Tests/Mgen_M2321.fna +0 -8288
- data/utils/enveomics/Tests/Nequ_Kin4M.faa +0 -2970
- data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata +0 -0
- data/utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt +0 -7
- data/utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv +0 -17
- data/utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv +0 -137
- data/utils/enveomics/Tests/a_mg.cds-go.blast.tsv +0 -123
- data/utils/enveomics/Tests/a_mg.reads-cds.blast.tsv +0 -200
- data/utils/enveomics/Tests/a_mg.reads-cds.counts.tsv +0 -55
- data/utils/enveomics/Tests/alkB.nwk +0 -1
- data/utils/enveomics/Tests/anthrax-cansnp-data.tsv +0 -13
- data/utils/enveomics/Tests/anthrax-cansnp-key.tsv +0 -17
- data/utils/enveomics/Tests/hiv1.faa +0 -59
- data/utils/enveomics/Tests/hiv1.fna +0 -134
- data/utils/enveomics/Tests/hiv2.faa +0 -70
- data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv +0 -233
- data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim +0 -1
- data/utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec +0 -233
- data/utils/enveomics/Tests/phyla_counts.tsv +0 -10
- data/utils/enveomics/Tests/primate_lentivirus.ogs +0 -11
- data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm +0 -9
- data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm +0 -8
- data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm +0 -6
- data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm +0 -9
- data/utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm +0 -6
- data/utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm +0 -6
- data/utils/enveomics/build_enveomics_r.bash +0 -45
- data/utils/enveomics/enveomics.R/DESCRIPTION +0 -31
- data/utils/enveomics/enveomics.R/NAMESPACE +0 -39
- data/utils/enveomics/enveomics.R/R/autoprune.R +0 -155
- data/utils/enveomics/enveomics.R/R/barplot.R +0 -184
- data/utils/enveomics/enveomics.R/R/cliopts.R +0 -135
- data/utils/enveomics/enveomics.R/R/df2dist.R +0 -154
- data/utils/enveomics/enveomics.R/R/growthcurve.R +0 -331
- data/utils/enveomics/enveomics.R/R/recplot.R +0 -354
- data/utils/enveomics/enveomics.R/R/recplot2.R +0 -1631
- data/utils/enveomics/enveomics.R/R/tribs.R +0 -583
- data/utils/enveomics/enveomics.R/R/utils.R +0 -50
- data/utils/enveomics/enveomics.R/README.md +0 -80
- data/utils/enveomics/enveomics.R/data/growth.curves.rda +0 -0
- data/utils/enveomics/enveomics.R/data/phyla.counts.rda +0 -0
- data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +0 -17
- data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +0 -17
- data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +0 -17
- data/utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd +0 -25
- data/utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd +0 -46
- data/utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd +0 -23
- data/utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd +0 -47
- data/utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd +0 -23
- data/utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd +0 -23
- data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +0 -32
- data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +0 -91
- data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +0 -57
- data/utils/enveomics/enveomics.R/man/enve.col.alpha.Rd +0 -24
- data/utils/enveomics/enveomics.R/man/enve.col2alpha.Rd +0 -19
- data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +0 -39
- data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +0 -38
- data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +0 -40
- data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +0 -67
- data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +0 -37
- data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +0 -122
- data/utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd +0 -45
- data/utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd +0 -24
- data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +0 -68
- data/utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd +0 -25
- data/utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd +0 -21
- data/utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd +0 -19
- data/utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd +0 -19
- data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +0 -41
- data/utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd +0 -29
- data/utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd +0 -18
- data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +0 -40
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd +0 -36
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd +0 -19
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd +0 -19
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd +0 -27
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +0 -41
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd +0 -17
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +0 -43
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +0 -37
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +0 -74
- data/utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd +0 -59
- data/utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd +0 -27
- data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +0 -32
- data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +0 -59
- data/utils/enveomics/enveomics.R/man/enve.tribs.test.Rd +0 -28
- data/utils/enveomics/enveomics.R/man/enve.truncate.Rd +0 -27
- data/utils/enveomics/enveomics.R/man/growth.curves.Rd +0 -14
- data/utils/enveomics/enveomics.R/man/phyla.counts.Rd +0 -13
- data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +0 -63
- data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +0 -38
- data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +0 -38
- data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +0 -111
- data/utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd +0 -19
- data/utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd +0 -19
- data/utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd +0 -19
- data/utils/enveomics/globals.mk +0 -8
- data/utils/enveomics/manifest.json +0 -9
data/utils/distance/database.rb
CHANGED
|
@@ -22,12 +22,16 @@ module MiGA::DistanceRunner::Database
|
|
|
22
22
|
end
|
|
23
23
|
end
|
|
24
24
|
# Initialize if it doesn't exist
|
|
25
|
-
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
|
|
25
|
+
unless File.size? dbs[m]
|
|
26
|
+
SQLite3::Database.new(dbs[m]) do |conn|
|
|
27
|
+
conn.execute <<~SQL
|
|
28
|
+
create table if not exists #{t}(
|
|
29
|
+
seq1 varchar(256), seq2 varchar(256),
|
|
30
|
+
#{t} float, sd float, n int, omega int
|
|
31
|
+
)
|
|
32
|
+
SQL
|
|
33
|
+
end
|
|
34
|
+
end
|
|
31
35
|
# Copy over to (local) temporals
|
|
32
36
|
@tmp_dbs[m] = tmp_file("#{m}.db")
|
|
33
37
|
FileUtils.cp(dbs[m], tmp_dbs[m])
|
|
@@ -92,27 +96,72 @@ module MiGA::DistanceRunner::Database
|
|
|
92
96
|
# possible number of matches
|
|
93
97
|
def data_from_db(n1, n2, db, metric)
|
|
94
98
|
y = nil
|
|
99
|
+
table = metric == :haai ? :aai : metric
|
|
95
100
|
SQLite3::Database.new(db) do |conn|
|
|
96
101
|
y = conn.execute(
|
|
97
|
-
"select #{
|
|
102
|
+
"select #{table}, sd, n, omega from #{table} where seq1=? and seq2=?",
|
|
98
103
|
[n1, n2]
|
|
99
104
|
).first
|
|
100
|
-
end if File.size?
|
|
105
|
+
end if File.size?(db)
|
|
101
106
|
y
|
|
102
107
|
end
|
|
103
108
|
|
|
104
109
|
##
|
|
105
110
|
# Save +data+ of +metric+ between +n1+ and +n2+ in the +db+ database.
|
|
106
111
|
def data_to_db(n1, n2, db, metric, data)
|
|
112
|
+
table = metric == :haai ? :aai : metric
|
|
107
113
|
SQLite3::Database.new(db) do |conn|
|
|
108
114
|
conn.execute(
|
|
109
|
-
"insert into #{
|
|
115
|
+
"insert into #{table} (seq1, seq2, #{table}, sd, n, omega) " +
|
|
110
116
|
"values (?, ?, ?, ?, ?, ?)", [n1, n2] + data
|
|
111
117
|
)
|
|
112
118
|
end
|
|
113
119
|
checkpoint metric
|
|
114
120
|
end
|
|
115
121
|
|
|
122
|
+
##
|
|
123
|
+
# Saves +data+ of +metric+ in batch to the temporary database,
|
|
124
|
+
# and assumes query is +#dataset+. +data+ must be a hash with target names
|
|
125
|
+
# as key and arrays as values with: [val, sd, n, omega]
|
|
126
|
+
def batch_data_to_db(metric, data)
|
|
127
|
+
db = tmp_dbs[metric]
|
|
128
|
+
table = metric == :haai ? :aai : metric
|
|
129
|
+
`cp #{db} ~/here.db`
|
|
130
|
+
SQLite3::Database.new(db) do |conn|
|
|
131
|
+
data.each do |k, v|
|
|
132
|
+
sql = <<~SQL
|
|
133
|
+
insert into #{table} (
|
|
134
|
+
seq1, seq2, #{table}, sd, n, omega
|
|
135
|
+
) values (?, ?, ?, ?, ?, ?)
|
|
136
|
+
SQL
|
|
137
|
+
conn.execute(sql, [dataset.name, k] + v)
|
|
138
|
+
end
|
|
139
|
+
end
|
|
140
|
+
checkpoint(metric)
|
|
141
|
+
end
|
|
142
|
+
|
|
143
|
+
##
|
|
144
|
+
# Retrieves data of +metric+ in batch from the temporary database,
|
|
145
|
+
# and assumes query is +#dataset+. The output data is a hash with the same
|
|
146
|
+
# structure described for +#batch_data_to_db+
|
|
147
|
+
def batch_data_from_db(metric)
|
|
148
|
+
db = tmp_dbs[metric]
|
|
149
|
+
table = metric == :haai ? :aai : metric
|
|
150
|
+
data = {}
|
|
151
|
+
SQLite3::Database.new(db) do |conn|
|
|
152
|
+
sql = "select seq2, #{table}, sd, n, omega from #{table}"
|
|
153
|
+
conn.execute(sql).each { |row| data[row.shift] = row }
|
|
154
|
+
end
|
|
155
|
+
data
|
|
156
|
+
end
|
|
157
|
+
|
|
158
|
+
##
|
|
159
|
+
# Retrieve only +metric+ values against +names+
|
|
160
|
+
def batch_values_from_db(metric, names)
|
|
161
|
+
data = batch_data_from_db(metric)
|
|
162
|
+
names.map { |i| data[i]&.first }
|
|
163
|
+
end
|
|
164
|
+
|
|
116
165
|
##
|
|
117
166
|
# Iterates for each entry in +db+
|
|
118
167
|
def foreach_in_db(db, metric, &blk)
|
|
@@ -120,4 +169,14 @@ module MiGA::DistanceRunner::Database
|
|
|
120
169
|
conn.execute("select * from #{metric}").each { |r| blk[r] }
|
|
121
170
|
end
|
|
122
171
|
end
|
|
172
|
+
|
|
173
|
+
##
|
|
174
|
+
# Select only those targets that are not yet stored in either direction
|
|
175
|
+
def pending_targets(targets, metric)
|
|
176
|
+
saved = batch_data_from_db(metric).keys
|
|
177
|
+
targets
|
|
178
|
+
.compact
|
|
179
|
+
.select { |i| !saved.include?(i.name) }
|
|
180
|
+
.select { |i| !stored_value(i, metric)&.> 0.0 }
|
|
181
|
+
end
|
|
123
182
|
end
|
data/utils/distance/pipeline.rb
CHANGED
|
@@ -11,19 +11,14 @@ module MiGA::DistanceRunner::Pipeline
|
|
|
11
11
|
val_med = ''
|
|
12
12
|
val_cls = nil
|
|
13
13
|
i_n = 0
|
|
14
|
-
File.
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
val_cls = i_n
|
|
23
|
-
puts "[#{classif}] New max: #{val_med} (#{val_cls}): #{max_val}"
|
|
24
|
-
end
|
|
25
|
-
end
|
|
26
|
-
end
|
|
14
|
+
sbj_datasets = File.foreach(med).map { |i| ref_project.dataset(i.chomp) }
|
|
15
|
+
values = send(metric, sbj_datasets)
|
|
16
|
+
max_idx = values.map(&:to_f).each_with_index.max[1]
|
|
17
|
+
max_val = values[max_idx]
|
|
18
|
+
val_med = sbj_datasets[max_idx].name
|
|
19
|
+
val_cls = max_idx + 1
|
|
20
|
+
puts "[#{classif}] New max: #{val_med} (#{val_cls}): #{max_val}"
|
|
21
|
+
|
|
27
22
|
classif = "#{classif}/miga-project.sc-#{val_cls}"
|
|
28
23
|
result_fh.puts [val_cls, val_med, max_val, classif].join("\t")
|
|
29
24
|
classify(clades, classif, metric, result_fh, val_cls)
|
|
@@ -32,9 +27,8 @@ module MiGA::DistanceRunner::Pipeline
|
|
|
32
27
|
# Run distances against datasets listed in metadata's +:dist_req+
|
|
33
28
|
def distances_by_request(metric)
|
|
34
29
|
$stderr.puts 'Running distances by request'
|
|
35
|
-
dataset.option(:dist_req).
|
|
36
|
-
|
|
37
|
-
end
|
|
30
|
+
sbj_datasets = dataset.option(:dist_req).map { |i| ref_project.dataset(i) }
|
|
31
|
+
send(metric, sbj_datasets)
|
|
38
32
|
end
|
|
39
33
|
|
|
40
34
|
# Builds a tree with all visited medoids from any classification level
|
|
@@ -74,8 +68,10 @@ module MiGA::DistanceRunner::Pipeline
|
|
|
74
68
|
$stderr.puts "Testing taxonomy | opts = #{opts}"
|
|
75
69
|
# Get taxonomy of closest relative
|
|
76
70
|
from_ref_project = (project != ref_project)
|
|
77
|
-
res_dir =
|
|
78
|
-
|
|
71
|
+
res_dir =
|
|
72
|
+
from_ref_project ?
|
|
73
|
+
File.expand_path('data/09.distances/05.taxonomy', project.path) :
|
|
74
|
+
home
|
|
79
75
|
Dir.mkdir res_dir unless Dir.exist? res_dir
|
|
80
76
|
File.open(File.expand_path("#{dataset.name}.done", res_dir), 'w') do |fh|
|
|
81
77
|
fh.puts Time.now.to_s
|
data/utils/distance/runner.rb
CHANGED
|
@@ -1,29 +1,17 @@
|
|
|
1
1
|
require_relative 'base.rb'
|
|
2
|
-
require_relative 'temporal.rb'
|
|
3
|
-
require_relative 'database.rb'
|
|
4
|
-
require_relative 'commands.rb'
|
|
5
|
-
require_relative 'pipeline.rb'
|
|
6
2
|
|
|
7
3
|
class MiGA::DistanceRunner
|
|
8
|
-
include MiGA::DistanceRunner::Temporal
|
|
9
|
-
include MiGA::DistanceRunner::Database
|
|
10
|
-
include MiGA::DistanceRunner::Commands
|
|
11
|
-
include MiGA::DistanceRunner::Pipeline
|
|
12
|
-
|
|
13
4
|
attr_reader :project, :ref_project, :dataset, :opts, :home
|
|
14
5
|
attr_reader :tmp, :tmp_dbs, :dbs, :db_counts
|
|
15
6
|
|
|
16
7
|
def initialize(project_path, dataset_name, opts_hash = {})
|
|
17
8
|
@opts = opts_hash
|
|
18
|
-
@project = MiGA::Project.load(project_path)
|
|
19
|
-
|
|
9
|
+
@project = MiGA::Project.load(project_path)
|
|
10
|
+
@project or raise "No project at #{project_path}"
|
|
20
11
|
@dataset = project.dataset(dataset_name)
|
|
21
12
|
@home = File.expand_path('data/09.distances', project.path)
|
|
22
13
|
|
|
23
14
|
# Default opts
|
|
24
|
-
@opts[:aai_save_rbm] =
|
|
25
|
-
project.option(:aai_save_rbm) ? 'save-rbm' : 'no-save-rbm'
|
|
26
|
-
@opts[:thr] ||= ENV.fetch('CORES') { 2 }.to_i
|
|
27
15
|
if opts[:run_taxonomy] && project.option(:ref_project)
|
|
28
16
|
ref_path = project.option(:ref_project)
|
|
29
17
|
@home = File.expand_path('05.taxonomy', @home)
|
|
@@ -39,7 +27,8 @@ class MiGA::DistanceRunner
|
|
|
39
27
|
else
|
|
40
28
|
@ref_project = project
|
|
41
29
|
end
|
|
42
|
-
|
|
30
|
+
@opts[:thr] ||= ENV.fetch('CORES') { 1 }.to_i
|
|
31
|
+
%i[haai_p aai_p ani_p distances_checkpoint aai_save_rbm].each do |m|
|
|
43
32
|
@opts[m] ||= ref_project.option(m)
|
|
44
33
|
end
|
|
45
34
|
$stderr.puts "Options: #{opts}"
|
|
@@ -64,12 +53,11 @@ class MiGA::DistanceRunner
|
|
|
64
53
|
initialize_dbs! true
|
|
65
54
|
|
|
66
55
|
# first-come-first-serve traverse
|
|
56
|
+
sbj = []
|
|
67
57
|
ref_project.each_dataset do |ds|
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
puts "[ #{Time.now} ] #{ds.name}"
|
|
71
|
-
ani_after_aai(ds)
|
|
58
|
+
sbj << ds if ds.ref? && !ds.multi? && ds.result(:essential_genes)
|
|
72
59
|
end
|
|
60
|
+
ani_after_aai(sbj)
|
|
73
61
|
|
|
74
62
|
# Finalize
|
|
75
63
|
%i[haai aai ani].each { |m| checkpoint! m if db_counts[m] > 0 }
|
|
@@ -97,27 +85,26 @@ class MiGA::DistanceRunner
|
|
|
97
85
|
par_dir = File.dirname(File.expand_path(classif, res.dir))
|
|
98
86
|
par = File.expand_path('miga-project.classif', par_dir)
|
|
99
87
|
closest = { dataset: nil, ani: 0.0 }
|
|
88
|
+
sbj_datasets = []
|
|
100
89
|
if File.size? par
|
|
101
90
|
File.open(par, 'r') do |fh|
|
|
102
91
|
fh.each_line do |ln|
|
|
103
92
|
r = ln.chomp.split("\t")
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
ani = ani_after_aai(ref_project.dataset(r[0]), 80.0)
|
|
107
|
-
unless ani.nil? || ani < closest[:ani]
|
|
108
|
-
closest = { ds: r[0], ani: ani }
|
|
109
|
-
end
|
|
93
|
+
sbj_datasets << ref_project.dataset(r[0]) if r[1].to_i == val_cls
|
|
110
94
|
end
|
|
111
95
|
end
|
|
96
|
+
ani = ani_after_aai(sbj_datasets, 80.0)
|
|
97
|
+
ani_max = ani.map(&:to_f).each_with_index.max
|
|
98
|
+
closest = { ds: sbj_datasets[ani_max[1]].name, ani: ani_max[0] }
|
|
112
99
|
end
|
|
113
100
|
|
|
114
101
|
# Calculate all the AAIs/ANIs against the closest ANI95-clade (if AAI > 80%)
|
|
115
102
|
cl_path = res.file_path :clades_ani95
|
|
116
|
-
if !cl_path.nil?
|
|
117
|
-
File.foreach(cl_path)
|
|
118
|
-
|
|
119
|
-
|
|
120
|
-
|
|
103
|
+
if !cl_path.nil? && File.size?(cl_path) && tsk[0] == :clade_finding
|
|
104
|
+
clades = File.foreach(cl_path).map { |i| i.chomp.split(',') }
|
|
105
|
+
sbj_dataset_names = clades.find { |i| i.include?(closest[:ds]) }
|
|
106
|
+
sbj_datasets = sbj_dataset_names&.map { |i| ref_project.dataset(i) }
|
|
107
|
+
ani_after_aai(sbj_datasets, 80.0) if sbj_datasets
|
|
121
108
|
end
|
|
122
109
|
|
|
123
110
|
# Finalize
|
data/utils/distance/temporal.rb
CHANGED
|
@@ -24,8 +24,10 @@ module MiGA::DistanceRunner::Temporal
|
|
|
24
24
|
end
|
|
25
25
|
end
|
|
26
26
|
|
|
27
|
-
# Temporal file with extension +ext+
|
|
28
|
-
def tmp_file(ext)
|
|
27
|
+
# Temporal file with extension +ext+, or a unique ID if +ext+ is +nil+
|
|
28
|
+
def tmp_file(ext = nil)
|
|
29
|
+
@_tmp_count ||= 0
|
|
30
|
+
ext ||= "#{@_tmp_count += 1}.tmp"
|
|
29
31
|
File.expand_path("#{dataset.name}.#{ext}", tmp)
|
|
30
32
|
end
|
|
31
33
|
|
data/utils/distances.rb
CHANGED
|
@@ -2,8 +2,8 @@
|
|
|
2
2
|
|
|
3
3
|
require_relative 'distance/runner.rb'
|
|
4
4
|
|
|
5
|
-
dataset = ARGV.shift
|
|
6
5
|
project = ARGV.shift
|
|
6
|
+
dataset = ARGV.shift
|
|
7
7
|
opts = Hash[ARGV.map { |i| i.split("=", 2).tap { |j| j[0] = j[0].to_sym } }]
|
|
8
|
-
runner = MiGA::DistanceRunner.new(
|
|
8
|
+
runner = MiGA::DistanceRunner.new(project, dataset, opts)
|
|
9
9
|
runner.go!
|
data/utils/requirements.txt
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
Software Test exec Website Notes
|
|
2
2
|
-------- --------- ------- -----
|
|
3
3
|
Ruby ruby https://www.ruby-lang.org/ Required version: 2.3+
|
|
4
|
-
Python
|
|
4
|
+
Python python3 https://www.python.org/ Required version: 3+
|
|
5
5
|
R R http://www.r-project.org/
|
|
6
6
|
SQLite3 sqlite3 https://www.sqlite.org/
|
|
7
7
|
NCBI BLAST+ blastp ftp://ftp.ncbi.nlm.nih.gov/blast/executables/blast+/LATEST
|
|
@@ -10,12 +10,12 @@ FastANI fastANI https://github.com/ParBLiSS/FastANI Required version: 1.1+
|
|
|
10
10
|
HMMer 3.0+ hmmsearch http://hmmer.janelia.org/software
|
|
11
11
|
Bedtools bedtools http://bedtools.readthedocs.org/en/latest/
|
|
12
12
|
Prodigal prodigal http://prodigal.ornl.gov
|
|
13
|
-
IDBA idba_ud http://i.cs.hku.hk/~alse/hkubrg/projects/idba
|
|
14
13
|
MCL mcl http://micans.org/mcl/
|
|
15
14
|
Barrnap barrnap http://www.vicbioinformatics.com/software.barrnap.shtml
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
15
|
+
IDBA (reads) idba_ud http://i.cs.hku.hk/~alse/hkubrg/projects/idba
|
|
16
|
+
Scythe (reads) scythe https://github.com/vsbuffalo/scythe Required version: 0.991+
|
|
17
|
+
FastQC (reads) fastqc http://www.bioinformatics.babraham.ac.uk/projects/fastqc
|
|
18
|
+
SolexaQA++ (reads) SolexaQA++ http://solexaqa.sourceforge.net Required version: v3.1.3+
|
|
19
19
|
OpenJDK (rdp) java https://adoptopenjdk.net/ Any Java VM would work
|
|
20
20
|
MyTaxa (mytaxa) MyTaxa http://enve-omics.ce.gatech.edu/mytaxa
|
|
21
21
|
Krona (mytaxa) ktImportText https://github.com/marbl/Krona/wiki
|
metadata
CHANGED
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: miga-base
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 0.7.
|
|
4
|
+
version: 0.7.26.0
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Luis M. Rodriguez-R
|
|
8
|
-
autorequire:
|
|
8
|
+
autorequire:
|
|
9
9
|
bindir: bin
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date: 2021-
|
|
11
|
+
date: 2021-03-01 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: daemons
|
|
@@ -261,273 +261,6 @@ files:
|
|
|
261
261
|
- utils/distance/temporal.rb
|
|
262
262
|
- utils/distances.rb
|
|
263
263
|
- utils/domain-ess-genes.rb
|
|
264
|
-
- utils/enveomics/Docs/recplot2.md
|
|
265
|
-
- utils/enveomics/Examples/aai-matrix.bash
|
|
266
|
-
- utils/enveomics/Examples/ani-matrix.bash
|
|
267
|
-
- utils/enveomics/Examples/essential-phylogeny.bash
|
|
268
|
-
- utils/enveomics/Examples/unus-genome-phylogeny.bash
|
|
269
|
-
- utils/enveomics/LICENSE.txt
|
|
270
|
-
- utils/enveomics/Makefile
|
|
271
|
-
- utils/enveomics/Manifest/Tasks/aasubs.json
|
|
272
|
-
- utils/enveomics/Manifest/Tasks/blasttab.json
|
|
273
|
-
- utils/enveomics/Manifest/Tasks/distances.json
|
|
274
|
-
- utils/enveomics/Manifest/Tasks/fasta.json
|
|
275
|
-
- utils/enveomics/Manifest/Tasks/fastq.json
|
|
276
|
-
- utils/enveomics/Manifest/Tasks/graphics.json
|
|
277
|
-
- utils/enveomics/Manifest/Tasks/mapping.json
|
|
278
|
-
- utils/enveomics/Manifest/Tasks/ogs.json
|
|
279
|
-
- utils/enveomics/Manifest/Tasks/other.json
|
|
280
|
-
- utils/enveomics/Manifest/Tasks/remote.json
|
|
281
|
-
- utils/enveomics/Manifest/Tasks/sequence-identity.json
|
|
282
|
-
- utils/enveomics/Manifest/Tasks/tables.json
|
|
283
|
-
- utils/enveomics/Manifest/Tasks/trees.json
|
|
284
|
-
- utils/enveomics/Manifest/Tasks/variants.json
|
|
285
|
-
- utils/enveomics/Manifest/categories.json
|
|
286
|
-
- utils/enveomics/Manifest/examples.json
|
|
287
|
-
- utils/enveomics/Manifest/tasks.json
|
|
288
|
-
- utils/enveomics/Pipelines/assembly.pbs/CONFIG.mock.bash
|
|
289
|
-
- utils/enveomics/Pipelines/assembly.pbs/FastA.N50.pl
|
|
290
|
-
- utils/enveomics/Pipelines/assembly.pbs/FastA.filterN.pl
|
|
291
|
-
- utils/enveomics/Pipelines/assembly.pbs/FastA.length.pl
|
|
292
|
-
- utils/enveomics/Pipelines/assembly.pbs/README.md
|
|
293
|
-
- utils/enveomics/Pipelines/assembly.pbs/RUNME-2.bash
|
|
294
|
-
- utils/enveomics/Pipelines/assembly.pbs/RUNME-3.bash
|
|
295
|
-
- utils/enveomics/Pipelines/assembly.pbs/RUNME-4.bash
|
|
296
|
-
- utils/enveomics/Pipelines/assembly.pbs/RUNME.bash
|
|
297
|
-
- utils/enveomics/Pipelines/assembly.pbs/kSelector.R
|
|
298
|
-
- utils/enveomics/Pipelines/assembly.pbs/newbler.pbs
|
|
299
|
-
- utils/enveomics/Pipelines/assembly.pbs/newbler_preparator.pl
|
|
300
|
-
- utils/enveomics/Pipelines/assembly.pbs/soap.pbs
|
|
301
|
-
- utils/enveomics/Pipelines/assembly.pbs/stats.pbs
|
|
302
|
-
- utils/enveomics/Pipelines/assembly.pbs/velvet.pbs
|
|
303
|
-
- utils/enveomics/Pipelines/blast.pbs/01.pbs.bash
|
|
304
|
-
- utils/enveomics/Pipelines/blast.pbs/02.pbs.bash
|
|
305
|
-
- utils/enveomics/Pipelines/blast.pbs/03.pbs.bash
|
|
306
|
-
- utils/enveomics/Pipelines/blast.pbs/BlastTab.recover_job.pl
|
|
307
|
-
- utils/enveomics/Pipelines/blast.pbs/CONFIG.mock.bash
|
|
308
|
-
- utils/enveomics/Pipelines/blast.pbs/FastA.split.pl
|
|
309
|
-
- utils/enveomics/Pipelines/blast.pbs/README.md
|
|
310
|
-
- utils/enveomics/Pipelines/blast.pbs/RUNME.bash
|
|
311
|
-
- utils/enveomics/Pipelines/blast.pbs/TASK.check.bash
|
|
312
|
-
- utils/enveomics/Pipelines/blast.pbs/TASK.dry.bash
|
|
313
|
-
- utils/enveomics/Pipelines/blast.pbs/TASK.eo.bash
|
|
314
|
-
- utils/enveomics/Pipelines/blast.pbs/TASK.pause.bash
|
|
315
|
-
- utils/enveomics/Pipelines/blast.pbs/TASK.run.bash
|
|
316
|
-
- utils/enveomics/Pipelines/blast.pbs/sentinel.pbs.bash
|
|
317
|
-
- utils/enveomics/Pipelines/idba.pbs/README.md
|
|
318
|
-
- utils/enveomics/Pipelines/idba.pbs/RUNME.bash
|
|
319
|
-
- utils/enveomics/Pipelines/idba.pbs/run.pbs
|
|
320
|
-
- utils/enveomics/Pipelines/trim.pbs/README.md
|
|
321
|
-
- utils/enveomics/Pipelines/trim.pbs/RUNME.bash
|
|
322
|
-
- utils/enveomics/Pipelines/trim.pbs/run.pbs
|
|
323
|
-
- utils/enveomics/README.md
|
|
324
|
-
- utils/enveomics/Scripts/AAsubs.log2ratio.rb
|
|
325
|
-
- utils/enveomics/Scripts/Aln.cat.rb
|
|
326
|
-
- utils/enveomics/Scripts/Aln.convert.pl
|
|
327
|
-
- utils/enveomics/Scripts/AlphaDiversity.pl
|
|
328
|
-
- utils/enveomics/Scripts/BedGraph.tad.rb
|
|
329
|
-
- utils/enveomics/Scripts/BedGraph.window.rb
|
|
330
|
-
- utils/enveomics/Scripts/BlastPairwise.AAsubs.pl
|
|
331
|
-
- utils/enveomics/Scripts/BlastTab.addlen.rb
|
|
332
|
-
- utils/enveomics/Scripts/BlastTab.advance.bash
|
|
333
|
-
- utils/enveomics/Scripts/BlastTab.best_hit_sorted.pl
|
|
334
|
-
- utils/enveomics/Scripts/BlastTab.catsbj.pl
|
|
335
|
-
- utils/enveomics/Scripts/BlastTab.cogCat.rb
|
|
336
|
-
- utils/enveomics/Scripts/BlastTab.filter.pl
|
|
337
|
-
- utils/enveomics/Scripts/BlastTab.kegg_pep2path_rest.pl
|
|
338
|
-
- utils/enveomics/Scripts/BlastTab.metaxaPrep.pl
|
|
339
|
-
- utils/enveomics/Scripts/BlastTab.pairedHits.rb
|
|
340
|
-
- utils/enveomics/Scripts/BlastTab.recplot2.R
|
|
341
|
-
- utils/enveomics/Scripts/BlastTab.seqdepth.pl
|
|
342
|
-
- utils/enveomics/Scripts/BlastTab.seqdepth_ZIP.pl
|
|
343
|
-
- utils/enveomics/Scripts/BlastTab.seqdepth_nomedian.pl
|
|
344
|
-
- utils/enveomics/Scripts/BlastTab.subsample.pl
|
|
345
|
-
- utils/enveomics/Scripts/BlastTab.sumPerHit.pl
|
|
346
|
-
- utils/enveomics/Scripts/BlastTab.taxid2taxrank.pl
|
|
347
|
-
- utils/enveomics/Scripts/BlastTab.topHits_sorted.rb
|
|
348
|
-
- utils/enveomics/Scripts/Chao1.pl
|
|
349
|
-
- utils/enveomics/Scripts/CharTable.classify.rb
|
|
350
|
-
- utils/enveomics/Scripts/EBIseq2tax.rb
|
|
351
|
-
- utils/enveomics/Scripts/FastA.N50.pl
|
|
352
|
-
- utils/enveomics/Scripts/FastA.extract.rb
|
|
353
|
-
- utils/enveomics/Scripts/FastA.filter.pl
|
|
354
|
-
- utils/enveomics/Scripts/FastA.filterLen.pl
|
|
355
|
-
- utils/enveomics/Scripts/FastA.filterN.pl
|
|
356
|
-
- utils/enveomics/Scripts/FastA.fragment.rb
|
|
357
|
-
- utils/enveomics/Scripts/FastA.gc.pl
|
|
358
|
-
- utils/enveomics/Scripts/FastA.interpose.pl
|
|
359
|
-
- utils/enveomics/Scripts/FastA.length.pl
|
|
360
|
-
- utils/enveomics/Scripts/FastA.mask.rb
|
|
361
|
-
- utils/enveomics/Scripts/FastA.per_file.pl
|
|
362
|
-
- utils/enveomics/Scripts/FastA.qlen.pl
|
|
363
|
-
- utils/enveomics/Scripts/FastA.rename.pl
|
|
364
|
-
- utils/enveomics/Scripts/FastA.revcom.pl
|
|
365
|
-
- utils/enveomics/Scripts/FastA.sample.rb
|
|
366
|
-
- utils/enveomics/Scripts/FastA.slider.pl
|
|
367
|
-
- utils/enveomics/Scripts/FastA.split.pl
|
|
368
|
-
- utils/enveomics/Scripts/FastA.split.rb
|
|
369
|
-
- utils/enveomics/Scripts/FastA.subsample.pl
|
|
370
|
-
- utils/enveomics/Scripts/FastA.tag.rb
|
|
371
|
-
- utils/enveomics/Scripts/FastA.wrap.rb
|
|
372
|
-
- utils/enveomics/Scripts/FastQ.filter.pl
|
|
373
|
-
- utils/enveomics/Scripts/FastQ.interpose.pl
|
|
374
|
-
- utils/enveomics/Scripts/FastQ.offset.pl
|
|
375
|
-
- utils/enveomics/Scripts/FastQ.split.pl
|
|
376
|
-
- utils/enveomics/Scripts/FastQ.tag.rb
|
|
377
|
-
- utils/enveomics/Scripts/FastQ.test-error.rb
|
|
378
|
-
- utils/enveomics/Scripts/FastQ.toFastA.awk
|
|
379
|
-
- utils/enveomics/Scripts/GFF.catsbj.pl
|
|
380
|
-
- utils/enveomics/Scripts/GenBank.add_fields.rb
|
|
381
|
-
- utils/enveomics/Scripts/HMM.essential.rb
|
|
382
|
-
- utils/enveomics/Scripts/HMM.haai.rb
|
|
383
|
-
- utils/enveomics/Scripts/HMMsearch.extractIds.rb
|
|
384
|
-
- utils/enveomics/Scripts/JPlace.distances.rb
|
|
385
|
-
- utils/enveomics/Scripts/JPlace.to_iToL.rb
|
|
386
|
-
- utils/enveomics/Scripts/M5nr.getSequences.rb
|
|
387
|
-
- utils/enveomics/Scripts/MeTaxa.distribution.pl
|
|
388
|
-
- utils/enveomics/Scripts/MyTaxa.fragsByTax.pl
|
|
389
|
-
- utils/enveomics/Scripts/MyTaxa.seq-taxrank.rb
|
|
390
|
-
- utils/enveomics/Scripts/NCBIacc2tax.rb
|
|
391
|
-
- utils/enveomics/Scripts/Newick.autoprune.R
|
|
392
|
-
- utils/enveomics/Scripts/RAxML-EPA.to_iToL.pl
|
|
393
|
-
- utils/enveomics/Scripts/RecPlot2.compareIdentities.R
|
|
394
|
-
- utils/enveomics/Scripts/RefSeq.download.bash
|
|
395
|
-
- utils/enveomics/Scripts/SRA.download.bash
|
|
396
|
-
- utils/enveomics/Scripts/TRIBS.plot-test.R
|
|
397
|
-
- utils/enveomics/Scripts/TRIBS.test.R
|
|
398
|
-
- utils/enveomics/Scripts/Table.barplot.R
|
|
399
|
-
- utils/enveomics/Scripts/Table.df2dist.R
|
|
400
|
-
- utils/enveomics/Scripts/Table.filter.pl
|
|
401
|
-
- utils/enveomics/Scripts/Table.merge.pl
|
|
402
|
-
- utils/enveomics/Scripts/Table.replace.rb
|
|
403
|
-
- utils/enveomics/Scripts/Table.round.rb
|
|
404
|
-
- utils/enveomics/Scripts/Table.split.pl
|
|
405
|
-
- utils/enveomics/Scripts/Taxonomy.silva2ncbi.rb
|
|
406
|
-
- utils/enveomics/Scripts/VCF.KaKs.rb
|
|
407
|
-
- utils/enveomics/Scripts/VCF.SNPs.rb
|
|
408
|
-
- utils/enveomics/Scripts/aai.rb
|
|
409
|
-
- utils/enveomics/Scripts/ani.rb
|
|
410
|
-
- utils/enveomics/Scripts/clust.rand.rb
|
|
411
|
-
- utils/enveomics/Scripts/gi2tax.rb
|
|
412
|
-
- utils/enveomics/Scripts/in_silico_GA_GI.pl
|
|
413
|
-
- utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz
|
|
414
|
-
- utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz
|
|
415
|
-
- utils/enveomics/Scripts/lib/enveomics.R
|
|
416
|
-
- utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb
|
|
417
|
-
- utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb
|
|
418
|
-
- utils/enveomics/Scripts/lib/enveomics_rb/og.rb
|
|
419
|
-
- utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb
|
|
420
|
-
- utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb
|
|
421
|
-
- utils/enveomics/Scripts/lib/enveomics_rb/stat.rb
|
|
422
|
-
- utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb
|
|
423
|
-
- utils/enveomics/Scripts/ogs.annotate.rb
|
|
424
|
-
- utils/enveomics/Scripts/ogs.core-pan.rb
|
|
425
|
-
- utils/enveomics/Scripts/ogs.extract.rb
|
|
426
|
-
- utils/enveomics/Scripts/ogs.mcl.rb
|
|
427
|
-
- utils/enveomics/Scripts/ogs.rb
|
|
428
|
-
- utils/enveomics/Scripts/ogs.stats.rb
|
|
429
|
-
- utils/enveomics/Scripts/rbm.rb
|
|
430
|
-
- utils/enveomics/Tests/Makefile
|
|
431
|
-
- utils/enveomics/Tests/Mgen_M2288.faa
|
|
432
|
-
- utils/enveomics/Tests/Mgen_M2288.fna
|
|
433
|
-
- utils/enveomics/Tests/Mgen_M2321.fna
|
|
434
|
-
- utils/enveomics/Tests/Nequ_Kin4M.faa
|
|
435
|
-
- utils/enveomics/Tests/Xanthomonas_oryzae-PilA.tribs.Rdata
|
|
436
|
-
- utils/enveomics/Tests/Xanthomonas_oryzae-PilA.txt
|
|
437
|
-
- utils/enveomics/Tests/Xanthomonas_oryzae.aai-mat.tsv
|
|
438
|
-
- utils/enveomics/Tests/Xanthomonas_oryzae.aai.tsv
|
|
439
|
-
- utils/enveomics/Tests/a_mg.cds-go.blast.tsv
|
|
440
|
-
- utils/enveomics/Tests/a_mg.reads-cds.blast.tsv
|
|
441
|
-
- utils/enveomics/Tests/a_mg.reads-cds.counts.tsv
|
|
442
|
-
- utils/enveomics/Tests/alkB.nwk
|
|
443
|
-
- utils/enveomics/Tests/anthrax-cansnp-data.tsv
|
|
444
|
-
- utils/enveomics/Tests/anthrax-cansnp-key.tsv
|
|
445
|
-
- utils/enveomics/Tests/hiv1.faa
|
|
446
|
-
- utils/enveomics/Tests/hiv1.fna
|
|
447
|
-
- utils/enveomics/Tests/hiv2.faa
|
|
448
|
-
- utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv
|
|
449
|
-
- utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.lim
|
|
450
|
-
- utils/enveomics/Tests/hiv_mix-hiv1.blast.tsv.rec
|
|
451
|
-
- utils/enveomics/Tests/phyla_counts.tsv
|
|
452
|
-
- utils/enveomics/Tests/primate_lentivirus.ogs
|
|
453
|
-
- utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv1.rbm
|
|
454
|
-
- utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-hiv2.rbm
|
|
455
|
-
- utils/enveomics/Tests/primate_lentivirus.rbm/hiv1-siv.rbm
|
|
456
|
-
- utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-hiv2.rbm
|
|
457
|
-
- utils/enveomics/Tests/primate_lentivirus.rbm/hiv2-siv.rbm
|
|
458
|
-
- utils/enveomics/Tests/primate_lentivirus.rbm/siv-siv.rbm
|
|
459
|
-
- utils/enveomics/build_enveomics_r.bash
|
|
460
|
-
- utils/enveomics/enveomics.R/DESCRIPTION
|
|
461
|
-
- utils/enveomics/enveomics.R/NAMESPACE
|
|
462
|
-
- utils/enveomics/enveomics.R/R/autoprune.R
|
|
463
|
-
- utils/enveomics/enveomics.R/R/barplot.R
|
|
464
|
-
- utils/enveomics/enveomics.R/R/cliopts.R
|
|
465
|
-
- utils/enveomics/enveomics.R/R/df2dist.R
|
|
466
|
-
- utils/enveomics/enveomics.R/R/growthcurve.R
|
|
467
|
-
- utils/enveomics/enveomics.R/R/recplot.R
|
|
468
|
-
- utils/enveomics/enveomics.R/R/recplot2.R
|
|
469
|
-
- utils/enveomics/enveomics.R/R/tribs.R
|
|
470
|
-
- utils/enveomics/enveomics.R/R/utils.R
|
|
471
|
-
- utils/enveomics/enveomics.R/README.md
|
|
472
|
-
- utils/enveomics/enveomics.R/data/growth.curves.rda
|
|
473
|
-
- utils/enveomics/enveomics.R/data/phyla.counts.rda
|
|
474
|
-
- utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd
|
|
475
|
-
- utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd
|
|
476
|
-
- utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd
|
|
477
|
-
- utils/enveomics/enveomics.R/man/enve.GrowthCurve-class.Rd
|
|
478
|
-
- utils/enveomics/enveomics.R/man/enve.TRIBS-class.Rd
|
|
479
|
-
- utils/enveomics/enveomics.R/man/enve.TRIBS.merge.Rd
|
|
480
|
-
- utils/enveomics/enveomics.R/man/enve.TRIBStest-class.Rd
|
|
481
|
-
- utils/enveomics/enveomics.R/man/enve.__prune.iter.Rd
|
|
482
|
-
- utils/enveomics/enveomics.R/man/enve.__prune.reduce.Rd
|
|
483
|
-
- utils/enveomics/enveomics.R/man/enve.__tribs.Rd
|
|
484
|
-
- utils/enveomics/enveomics.R/man/enve.barplot.Rd
|
|
485
|
-
- utils/enveomics/enveomics.R/man/enve.cliopts.Rd
|
|
486
|
-
- utils/enveomics/enveomics.R/man/enve.col.alpha.Rd
|
|
487
|
-
- utils/enveomics/enveomics.R/man/enve.col2alpha.Rd
|
|
488
|
-
- utils/enveomics/enveomics.R/man/enve.df2dist.Rd
|
|
489
|
-
- utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd
|
|
490
|
-
- utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd
|
|
491
|
-
- utils/enveomics/enveomics.R/man/enve.growthcurve.Rd
|
|
492
|
-
- utils/enveomics/enveomics.R/man/enve.prune.dist.Rd
|
|
493
|
-
- utils/enveomics/enveomics.R/man/enve.recplot.Rd
|
|
494
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd
|
|
495
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.ANIr.Rd
|
|
496
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.Rd
|
|
497
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.__counts.Rd
|
|
498
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.__peakHist.Rd
|
|
499
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.__whichClosestPeak.Rd
|
|
500
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.changeCutoff.Rd
|
|
501
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd
|
|
502
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.coordinates.Rd
|
|
503
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.corePeak.Rd
|
|
504
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd
|
|
505
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.Rd
|
|
506
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_e.Rd
|
|
507
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__em_m.Rd
|
|
508
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__emauto_one.Rd
|
|
509
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd
|
|
510
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mower.Rd
|
|
511
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd
|
|
512
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd
|
|
513
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd
|
|
514
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd
|
|
515
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd
|
|
516
|
-
- utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd
|
|
517
|
-
- utils/enveomics/enveomics.R/man/enve.tribs.Rd
|
|
518
|
-
- utils/enveomics/enveomics.R/man/enve.tribs.test.Rd
|
|
519
|
-
- utils/enveomics/enveomics.R/man/enve.truncate.Rd
|
|
520
|
-
- utils/enveomics/enveomics.R/man/growth.curves.Rd
|
|
521
|
-
- utils/enveomics/enveomics.R/man/phyla.counts.Rd
|
|
522
|
-
- utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd
|
|
523
|
-
- utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd
|
|
524
|
-
- utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd
|
|
525
|
-
- utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd
|
|
526
|
-
- utils/enveomics/enveomics.R/man/summary.enve.GrowthCurve.Rd
|
|
527
|
-
- utils/enveomics/enveomics.R/man/summary.enve.TRIBS.Rd
|
|
528
|
-
- utils/enveomics/enveomics.R/man/summary.enve.TRIBStest.Rd
|
|
529
|
-
- utils/enveomics/globals.mk
|
|
530
|
-
- utils/enveomics/manifest.json
|
|
531
264
|
- utils/find-medoid.R
|
|
532
265
|
- utils/index_metadata.rb
|
|
533
266
|
- utils/mytaxa_scan.R
|
|
@@ -548,7 +281,7 @@ homepage: http://enve-omics.ce.gatech.edu/miga
|
|
|
548
281
|
licenses:
|
|
549
282
|
- Artistic-2.0
|
|
550
283
|
metadata: {}
|
|
551
|
-
post_install_message:
|
|
284
|
+
post_install_message:
|
|
552
285
|
rdoc_options:
|
|
553
286
|
- lib
|
|
554
287
|
- README.md
|
|
@@ -570,7 +303,7 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
|
570
303
|
version: '0'
|
|
571
304
|
requirements: []
|
|
572
305
|
rubygems_version: 3.1.4
|
|
573
|
-
signing_key:
|
|
306
|
+
signing_key:
|
|
574
307
|
specification_version: 4
|
|
575
308
|
summary: MiGA
|
|
576
309
|
test_files: []
|