miga-base 0.7.26.1 → 1.0.2.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/miga/_data/aai-intax.blast.tsv.gz +0 -0
- data/lib/miga/_data/aai-intax.diamond.tsv.gz +0 -0
- data/lib/miga/_data/aai-novel.blast.tsv.gz +0 -0
- data/lib/miga/_data/aai-novel.diamond.tsv.gz +0 -0
- data/lib/miga/cli/action/classify_wf.rb +2 -2
- data/lib/miga/cli/action/derep_wf.rb +1 -1
- data/lib/miga/cli/action/doctor.rb +57 -14
- data/lib/miga/cli/action/doctor/base.rb +47 -23
- data/lib/miga/cli/action/init.rb +11 -7
- data/lib/miga/cli/action/init/files_helper.rb +1 -0
- data/lib/miga/cli/action/ncbi_get.rb +3 -3
- data/lib/miga/cli/action/tax_dist.rb +2 -2
- data/lib/miga/cli/action/wf.rb +5 -4
- data/lib/miga/common.rb +1 -0
- data/lib/miga/daemon.rb +11 -4
- data/lib/miga/dataset/result.rb +10 -6
- data/lib/miga/json.rb +5 -4
- data/lib/miga/metadata.rb +5 -1
- data/lib/miga/parallel.rb +36 -0
- data/lib/miga/project.rb +8 -8
- data/lib/miga/project/base.rb +4 -4
- data/lib/miga/project/result.rb +2 -2
- data/lib/miga/sqlite.rb +10 -2
- data/lib/miga/version.rb +23 -9
- data/scripts/aai_distances.bash +16 -18
- data/scripts/ani_distances.bash +16 -17
- data/scripts/assembly.bash +31 -16
- data/scripts/haai_distances.bash +3 -27
- data/scripts/miga.bash +6 -4
- data/scripts/p.bash +1 -1
- data/scripts/read_quality.bash +9 -18
- data/scripts/trimmed_fasta.bash +14 -30
- data/scripts/trimmed_reads.bash +36 -36
- data/test/parallel_test.rb +31 -0
- data/test/project_test.rb +2 -1
- data/test/remote_dataset_test.rb +1 -1
- data/utils/distance/commands.rb +1 -0
- data/utils/distance/database.rb +0 -1
- data/utils/distance/runner.rb +2 -4
- data/utils/enveomics/Manifest/Tasks/fasta.json +39 -3
- data/utils/enveomics/Manifest/Tasks/fastq.json +50 -2
- data/utils/enveomics/Manifest/Tasks/mapping.json +70 -0
- data/utils/enveomics/Manifest/Tasks/other.json +77 -0
- data/utils/enveomics/Manifest/Tasks/sequence-identity.json +138 -1
- data/utils/enveomics/Manifest/categories.json +13 -4
- data/utils/enveomics/Scripts/Aln.cat.rb +206 -148
- data/utils/enveomics/Scripts/FastA.N50.pl +33 -29
- data/utils/enveomics/Scripts/FastA.fragment.rb +69 -61
- data/utils/enveomics/Scripts/FastA.sample.rb +61 -46
- data/utils/enveomics/Scripts/FastA.toFastQ.rb +69 -0
- data/utils/enveomics/Scripts/FastQ.maskQual.rb +89 -0
- data/utils/enveomics/Scripts/FastQ.tag.rb +59 -52
- data/utils/enveomics/Scripts/SRA.download.bash +6 -8
- data/utils/enveomics/Scripts/Table.prefScore.R +60 -0
- data/utils/enveomics/Scripts/aai.rb +3 -2
- data/utils/enveomics/Scripts/anir.rb +137 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/anir.rb +293 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/bm_set.rb +175 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb +17 -17
- data/utils/enveomics/Scripts/lib/enveomics_rb/errors.rb +17 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/gmm_em.rb +30 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/match.rb +63 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/rbm.rb +49 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/stats.rb +3 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/stats/rand.rb +31 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/stats/sample.rb +152 -0
- data/utils/enveomics/Scripts/lib/enveomics_rb/utils.rb +73 -0
- data/utils/enveomics/Scripts/rbm-legacy.rb +172 -0
- data/utils/enveomics/Scripts/rbm.rb +87 -133
- data/utils/enveomics/Scripts/sam.filter.rb +148 -0
- data/utils/enveomics/enveomics.R/DESCRIPTION +2 -2
- data/utils/enveomics/enveomics.R/NAMESPACE +1 -1
- data/utils/enveomics/enveomics.R/R/prefscore.R +79 -0
- data/utils/enveomics/enveomics.R/R/utils.R +30 -0
- data/utils/enveomics/enveomics.R/README.md +1 -0
- data/utils/enveomics/enveomics.R/man/cash-enve.GrowthCurve-method.Rd +0 -1
- data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2-method.Rd +0 -1
- data/utils/enveomics/enveomics.R/man/cash-enve.RecPlot2.Peak-method.Rd +0 -1
- data/utils/enveomics/enveomics.R/man/enve.__tribs.Rd +10 -2
- data/utils/enveomics/enveomics.R/man/enve.barplot.Rd +16 -4
- data/utils/enveomics/enveomics.R/man/enve.cliopts.Rd +13 -3
- data/utils/enveomics/enveomics.R/man/enve.df2dist.Rd +8 -2
- data/utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd +8 -2
- data/utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd +9 -2
- data/utils/enveomics/enveomics.R/man/enve.growthcurve.Rd +13 -5
- data/utils/enveomics/enveomics.R/man/enve.prefscore.Rd +50 -0
- data/utils/enveomics/enveomics.R/man/enve.prune.dist.Rd +9 -2
- data/utils/enveomics/enveomics.R/man/enve.recplot.Rd +23 -6
- data/utils/enveomics/enveomics.R/man/enve.recplot2.Rd +13 -4
- data/utils/enveomics/enveomics.R/man/enve.recplot2.compareIdentities.Rd +8 -2
- data/utils/enveomics/enveomics.R/man/enve.recplot2.extractWindows.Rd +7 -2
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.__mow_one.Rd +14 -3
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.em.Rd +10 -2
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.emauto.Rd +8 -2
- data/utils/enveomics/enveomics.R/man/enve.recplot2.findPeaks.mower.Rd +17 -9
- data/utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd +6 -2
- data/utils/enveomics/enveomics.R/man/enve.selvector.Rd +23 -0
- data/utils/enveomics/enveomics.R/man/enve.tribs.Rd +14 -5
- data/utils/enveomics/enveomics.R/man/plot.enve.GrowthCurve.Rd +19 -4
- data/utils/enveomics/enveomics.R/man/plot.enve.TRIBS.Rd +11 -3
- data/utils/enveomics/enveomics.R/man/plot.enve.TRIBStest.Rd +11 -4
- data/utils/enveomics/enveomics.R/man/plot.enve.recplot2.Rd +26 -12
- data/utils/multitrim/Multitrim How-To.pdf +0 -0
- data/utils/multitrim/README.md +67 -0
- data/utils/multitrim/multitrim.py +1555 -0
- data/utils/multitrim/multitrim.yml +13 -0
- data/utils/requirements.txt +4 -3
- data/utils/subclade/pipeline.rb +2 -2
- metadata +35 -7
- data/utils/enveomics/Scripts/lib/enveomics_rb/stat.rb +0 -30
data/utils/requirements.txt
CHANGED
@@ -13,9 +13,10 @@ Prodigal prodigal http://prodigal.ornl.gov
|
|
13
13
|
MCL mcl http://micans.org/mcl/
|
14
14
|
Barrnap barrnap http://www.vicbioinformatics.com/software.barrnap.shtml
|
15
15
|
IDBA (reads) idba_ud http://i.cs.hku.hk/~alse/hkubrg/projects/idba
|
16
|
-
|
17
|
-
|
18
|
-
|
16
|
+
FaQCs (reads) FaQCs https://github.com/LANL-Bioinformatics/FaQCs
|
17
|
+
Falco (reads) falco https://github.com/smithlabcode/falco
|
18
|
+
Seqtk (reads) seqtk https://github.com/lh3/seqtk
|
19
|
+
Fastp (reads) fastp https://github.com/OpenGene/fastp
|
19
20
|
OpenJDK (rdp) java https://adoptopenjdk.net/ Any Java VM would work
|
20
21
|
MyTaxa (mytaxa) MyTaxa http://enve-omics.ce.gatech.edu/mytaxa
|
21
22
|
Krona (mytaxa) ktImportText https://github.com/marbl/Krona/wiki
|
data/utils/subclade/pipeline.rb
CHANGED
@@ -17,10 +17,10 @@ module MiGA::SubcladeRunner::Pipeline
|
|
17
17
|
metric_res = project.result(par[0]) or raise "Incomplete step #{par[0]}"
|
18
18
|
Zlib::GzipReader.open(metric_res.file_path(:matrix)) do |ifh|
|
19
19
|
ifh.each_line do |ln|
|
20
|
-
next if ln =~ /^
|
20
|
+
next if ln =~ /^a\tb\tvalue\t/
|
21
21
|
|
22
22
|
r = ln.chomp.split("\t")
|
23
|
-
ofh.puts "G>#{r[
|
23
|
+
ofh.puts "G>#{r[0]}\tG>#{r[1]}\t#{r[2]}" if r[2].to_f >= par[1]
|
24
24
|
end
|
25
25
|
end
|
26
26
|
ofh.close
|
metadata
CHANGED
@@ -1,14 +1,14 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: miga-base
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.7.26.1
|
4
|
+
version: 1.0.2.0
|
5
5
|
platform: ruby
|
6
6
|
authors:
|
7
7
|
- Luis M. Rodriguez-R
|
8
|
-
autorequire:
|
8
|
+
autorequire:
|
9
9
|
bindir: bin
|
10
10
|
cert_chain: []
|
11
|
-
date: 2021-
|
11
|
+
date: 2021-04-13 00:00:00.000000000 Z
|
12
12
|
dependencies:
|
13
13
|
- !ruby/object:Gem::Dependency
|
14
14
|
name: daemons
|
@@ -110,8 +110,12 @@ files:
|
|
110
110
|
- lib/miga.rb
|
111
111
|
- lib/miga/_data/aai-intax-blast.tsv.gz
|
112
112
|
- lib/miga/_data/aai-intax-diamond.tsv.gz
|
113
|
+
- lib/miga/_data/aai-intax.blast.tsv.gz
|
114
|
+
- lib/miga/_data/aai-intax.diamond.tsv.gz
|
113
115
|
- lib/miga/_data/aai-novel-blast.tsv.gz
|
114
116
|
- lib/miga/_data/aai-novel-diamond.tsv.gz
|
117
|
+
- lib/miga/_data/aai-novel.blast.tsv.gz
|
118
|
+
- lib/miga/_data/aai-novel.diamond.tsv.gz
|
115
119
|
- lib/miga/cli.rb
|
116
120
|
- lib/miga/cli/action.rb
|
117
121
|
- lib/miga/cli/action/about.rb
|
@@ -187,6 +191,7 @@ files:
|
|
187
191
|
- lib/miga/json.rb
|
188
192
|
- lib/miga/lair.rb
|
189
193
|
- lib/miga/metadata.rb
|
194
|
+
- lib/miga/parallel.rb
|
190
195
|
- lib/miga/project.rb
|
191
196
|
- lib/miga/project/base.rb
|
192
197
|
- lib/miga/project/dataset.rb
|
@@ -240,6 +245,7 @@ files:
|
|
240
245
|
- test/lair_test.rb
|
241
246
|
- test/metadata_test.rb
|
242
247
|
- test/net_test.rb
|
248
|
+
- test/parallel_test.rb
|
243
249
|
- test/project_test.rb
|
244
250
|
- test/remote_dataset_test.rb
|
245
251
|
- test/result_stats_test.rb
|
@@ -374,9 +380,11 @@ files:
|
|
374
380
|
- utils/enveomics/Scripts/FastA.split.rb
|
375
381
|
- utils/enveomics/Scripts/FastA.subsample.pl
|
376
382
|
- utils/enveomics/Scripts/FastA.tag.rb
|
383
|
+
- utils/enveomics/Scripts/FastA.toFastQ.rb
|
377
384
|
- utils/enveomics/Scripts/FastA.wrap.rb
|
378
385
|
- utils/enveomics/Scripts/FastQ.filter.pl
|
379
386
|
- utils/enveomics/Scripts/FastQ.interpose.pl
|
387
|
+
- utils/enveomics/Scripts/FastQ.maskQual.rb
|
380
388
|
- utils/enveomics/Scripts/FastQ.offset.pl
|
381
389
|
- utils/enveomics/Scripts/FastQ.split.pl
|
382
390
|
- utils/enveomics/Scripts/FastQ.tag.rb
|
@@ -405,6 +413,7 @@ files:
|
|
405
413
|
- utils/enveomics/Scripts/Table.df2dist.R
|
406
414
|
- utils/enveomics/Scripts/Table.filter.pl
|
407
415
|
- utils/enveomics/Scripts/Table.merge.pl
|
416
|
+
- utils/enveomics/Scripts/Table.prefScore.R
|
408
417
|
- utils/enveomics/Scripts/Table.replace.rb
|
409
418
|
- utils/enveomics/Scripts/Table.round.rb
|
410
419
|
- utils/enveomics/Scripts/Table.split.pl
|
@@ -413,18 +422,28 @@ files:
|
|
413
422
|
- utils/enveomics/Scripts/VCF.SNPs.rb
|
414
423
|
- utils/enveomics/Scripts/aai.rb
|
415
424
|
- utils/enveomics/Scripts/ani.rb
|
425
|
+
- utils/enveomics/Scripts/anir.rb
|
416
426
|
- utils/enveomics/Scripts/clust.rand.rb
|
417
427
|
- utils/enveomics/Scripts/gi2tax.rb
|
418
428
|
- utils/enveomics/Scripts/in_silico_GA_GI.pl
|
419
429
|
- utils/enveomics/Scripts/lib/data/dupont_2012_essential.hmm.gz
|
420
430
|
- utils/enveomics/Scripts/lib/data/lee_2019_essential.hmm.gz
|
421
431
|
- utils/enveomics/Scripts/lib/enveomics.R
|
432
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/anir.rb
|
433
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/bm_set.rb
|
422
434
|
- utils/enveomics/Scripts/lib/enveomics_rb/enveomics.rb
|
435
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/errors.rb
|
436
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/gmm_em.rb
|
423
437
|
- utils/enveomics/Scripts/lib/enveomics_rb/jplace.rb
|
438
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/match.rb
|
424
439
|
- utils/enveomics/Scripts/lib/enveomics_rb/og.rb
|
440
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/rbm.rb
|
425
441
|
- utils/enveomics/Scripts/lib/enveomics_rb/remote_data.rb
|
426
442
|
- utils/enveomics/Scripts/lib/enveomics_rb/seq_range.rb
|
427
|
-
- utils/enveomics/Scripts/lib/enveomics_rb/stat.rb
|
443
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/stats.rb
|
444
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/stats/rand.rb
|
445
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/stats/sample.rb
|
446
|
+
- utils/enveomics/Scripts/lib/enveomics_rb/utils.rb
|
428
447
|
- utils/enveomics/Scripts/lib/enveomics_rb/vcf.rb
|
429
448
|
- utils/enveomics/Scripts/ogs.annotate.rb
|
430
449
|
- utils/enveomics/Scripts/ogs.core-pan.rb
|
@@ -432,7 +451,9 @@ files:
|
|
432
451
|
- utils/enveomics/Scripts/ogs.mcl.rb
|
433
452
|
- utils/enveomics/Scripts/ogs.rb
|
434
453
|
- utils/enveomics/Scripts/ogs.stats.rb
|
454
|
+
- utils/enveomics/Scripts/rbm-legacy.rb
|
435
455
|
- utils/enveomics/Scripts/rbm.rb
|
456
|
+
- utils/enveomics/Scripts/sam.filter.rb
|
436
457
|
- utils/enveomics/Tests/Makefile
|
437
458
|
- utils/enveomics/Tests/Mgen_M2288.faa
|
438
459
|
- utils/enveomics/Tests/Mgen_M2288.fna
|
@@ -470,6 +491,7 @@ files:
|
|
470
491
|
- utils/enveomics/enveomics.R/R/cliopts.R
|
471
492
|
- utils/enveomics/enveomics.R/R/df2dist.R
|
472
493
|
- utils/enveomics/enveomics.R/R/growthcurve.R
|
494
|
+
- utils/enveomics/enveomics.R/R/prefscore.R
|
473
495
|
- utils/enveomics/enveomics.R/R/recplot.R
|
474
496
|
- utils/enveomics/enveomics.R/R/recplot2.R
|
475
497
|
- utils/enveomics/enveomics.R/R/tribs.R
|
@@ -495,6 +517,7 @@ files:
|
|
495
517
|
- utils/enveomics/enveomics.R/man/enve.df2dist.group.Rd
|
496
518
|
- utils/enveomics/enveomics.R/man/enve.df2dist.list.Rd
|
497
519
|
- utils/enveomics/enveomics.R/man/enve.growthcurve.Rd
|
520
|
+
- utils/enveomics/enveomics.R/man/enve.prefscore.Rd
|
498
521
|
- utils/enveomics/enveomics.R/man/enve.prune.dist.Rd
|
499
522
|
- utils/enveomics/enveomics.R/man/enve.recplot.Rd
|
500
523
|
- utils/enveomics/enveomics.R/man/enve.recplot2-class.Rd
|
@@ -520,6 +543,7 @@ files:
|
|
520
543
|
- utils/enveomics/enveomics.R/man/enve.recplot2.peak-class.Rd
|
521
544
|
- utils/enveomics/enveomics.R/man/enve.recplot2.seqdepth.Rd
|
522
545
|
- utils/enveomics/enveomics.R/man/enve.recplot2.windowDepthThreshold.Rd
|
546
|
+
- utils/enveomics/enveomics.R/man/enve.selvector.Rd
|
523
547
|
- utils/enveomics/enveomics.R/man/enve.tribs.Rd
|
524
548
|
- utils/enveomics/enveomics.R/man/enve.tribs.test.Rd
|
525
549
|
- utils/enveomics/enveomics.R/man/enve.truncate.Rd
|
@@ -536,6 +560,10 @@ files:
|
|
536
560
|
- utils/enveomics/manifest.json
|
537
561
|
- utils/find-medoid.R
|
538
562
|
- utils/index_metadata.rb
|
563
|
+
- utils/multitrim/Multitrim How-To.pdf
|
564
|
+
- utils/multitrim/README.md
|
565
|
+
- utils/multitrim/multitrim.py
|
566
|
+
- utils/multitrim/multitrim.yml
|
539
567
|
- utils/mytaxa_scan.R
|
540
568
|
- utils/mytaxa_scan.rb
|
541
569
|
- utils/plot-taxdist.R
|
@@ -554,7 +582,7 @@ homepage: http://enve-omics.ce.gatech.edu/miga
|
|
554
582
|
licenses:
|
555
583
|
- Artistic-2.0
|
556
584
|
metadata: {}
|
557
|
-
post_install_message:
|
585
|
+
post_install_message:
|
558
586
|
rdoc_options:
|
559
587
|
- lib
|
560
588
|
- README.md
|
@@ -575,8 +603,8 @@ required_rubygems_version: !ruby/object:Gem::Requirement
|
|
575
603
|
- !ruby/object:Gem::Version
|
576
604
|
version: '0'
|
577
605
|
requirements: []
|
578
|
-
rubygems_version: 3.1.
|
579
|
-
signing_key:
|
606
|
+
rubygems_version: 3.1.6
|
607
|
+
signing_key:
|
580
608
|
specification_version: 4
|
581
609
|
summary: MiGA
|
582
610
|
test_files: []
|
@@ -1,30 +0,0 @@
|
|
1
|
-
|
2
|
-
module Enve
|
3
|
-
class Stat
|
4
|
-
# Generates a random number from the +dist+ distribution with +params+
|
5
|
-
# parameters. This is simply a wrapper to the r_* functions below.
|
6
|
-
def self.rand(dist=:unif, *params)
|
7
|
-
send("r_#{dist}", *params)
|
8
|
-
end
|
9
|
-
|
10
|
-
# Generates a random number from the uniform distribution between +min+ and
|
11
|
-
# +max+. By default generates random numbers between 0.0 and 1.0.
|
12
|
-
def self.r_unif(min=0.0, max=1.0)
|
13
|
-
min + (max-min)*Random::rand
|
14
|
-
end
|
15
|
-
|
16
|
-
# Generates a random number from the geometric distribution with support
|
17
|
-
# {0, 1, 2, ...} and probability of success +p+.
|
18
|
-
def self.r_geom(p)
|
19
|
-
(Math::log(1.0 - rand)/Math::log(1.0-p) - 1.0).ceil
|
20
|
-
end
|
21
|
-
|
22
|
-
# Generates a random number from the shifted geometric distribution with
|
23
|
-
# support {1, 2, 3, ...} and probability of success +p+.
|
24
|
-
def self.r_sgeom(p)
|
25
|
-
(Math::log(1.0 - rand)/Math::log(1.0-p)).ceil
|
26
|
-
end
|
27
|
-
|
28
|
-
end
|
29
|
-
end
|
30
|
-
|