bio 1.6.0.pre.20181210 → 2.0.3
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/.travis.yml +32 -34
- data/ChangeLog +1462 -8
- data/Gemfile +0 -2
- data/KNOWN_ISSUES.rdoc +4 -10
- data/LEGAL +0 -10
- data/README.rdoc +31 -80
- data/README_DEV.rdoc +5 -5
- data/RELEASE_NOTES.rdoc +171 -18
- data/Rakefile +0 -34
- data/appveyor.yml +15 -7
- data/bioruby.gemspec +13 -4
- data/bioruby.gemspec.erb +0 -1
- data/gemfiles/Gemfile.travis-rbx +0 -2
- data/gemfiles/Gemfile.travis-ruby1.8 +0 -2
- data/gemfiles/Gemfile.travis-ruby1.9 +0 -2
- data/gemfiles/Gemfile.windows +6 -0
- data/lib/bio/appl/blast/report.rb +40 -8
- data/lib/bio/appl/iprscan/report.rb +3 -3
- data/lib/bio/appl/sosui/report.rb +1 -1
- data/lib/bio/db/embl/uniprotkb.rb +1 -1
- data/lib/bio/db/gff.rb +3 -1
- data/lib/bio/db/go.rb +2 -2
- data/lib/bio/db/kegg/common.rb +14 -0
- data/lib/bio/db/kegg/genes.rb +26 -0
- data/lib/bio/db/kegg/pathway.rb +5 -11
- data/lib/bio/sequence/common.rb +112 -0
- data/lib/bio/sequence/format.rb +1 -0
- data/lib/bio/tree.rb +1 -1
- data/lib/bio/version.rb +3 -3
- data/sample/color_scheme_aa.rb +82 -0
- data/sample/color_scheme_na.rb +5 -6
- data/sample/fastq2html.cwl +23 -0
- data/sample/fastq2html.rb +94 -0
- data/sample/fastq2html.testdata.yaml +5 -0
- data/sample/na2aa.cwl +23 -0
- data/sample/na2aa.rb +11 -25
- data/sample/na2aa.testdata.yaml +7 -0
- data/sample/rev_comp.cwl +23 -0
- data/sample/rev_comp.rb +20 -0
- data/sample/rev_comp.testdata.yaml +7 -0
- data/test/network/bio/db/kegg/test_genes_hsa7422.rb +91 -0
- data/test/unit/bio/appl/blast/test_report.rb +4 -4
- data/test/unit/bio/db/test_gff.rb +5 -0
- data/test/unit/bio/sequence/test_ruby3.rb +462 -0
- metadata +17 -8
- data/lib/bio/appl/blast/xmlparser.rb +0 -236
- data/setup.rb +0 -1600
data/sample/na2aa.cwl
ADDED
@@ -0,0 +1,23 @@
|
|
1
|
+
#!/usr/bin/env cwl-runner
|
2
|
+
|
3
|
+
cwlVersion: v1.0
|
4
|
+
class: CommandLineTool
|
5
|
+
baseCommand: [ruby]
|
6
|
+
|
7
|
+
inputs:
|
8
|
+
- id: script
|
9
|
+
type: File
|
10
|
+
default:
|
11
|
+
class: File
|
12
|
+
location: na2aa.rb
|
13
|
+
inputBinding:
|
14
|
+
position: -1
|
15
|
+
- id: seqFile
|
16
|
+
type: File[]
|
17
|
+
inputBinding:
|
18
|
+
position: 1
|
19
|
+
|
20
|
+
outputs:
|
21
|
+
- id: out
|
22
|
+
type: stdout
|
23
|
+
stdout: $(inputs.script.nameroot)-$(inputs.seqFile[0].nameroot).fst
|
data/sample/na2aa.rb
CHANGED
@@ -1,34 +1,20 @@
|
|
1
1
|
#!/usr/bin/env ruby
|
2
2
|
#
|
3
|
-
#
|
3
|
+
# na2aa.rb - translate any NA input into AA FASTA format
|
4
4
|
#
|
5
|
-
# Copyright (C)
|
6
|
-
#
|
7
|
-
# This program is free software; you can redistribute it and/or modify
|
8
|
-
# it under the terms of the GNU General Public License as published by
|
9
|
-
# the Free Software Foundation; either version 2 of the License, or
|
10
|
-
# (at your option) any later version.
|
11
|
-
#
|
12
|
-
# This program is distributed in the hope that it will be useful,
|
13
|
-
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
14
|
-
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
15
|
-
# GNU General Public License for more details.
|
16
|
-
#
|
17
|
-
# $Id: na2aa.rb,v 1.1 2008/02/06 16:25:53 pjotr Exp $
|
5
|
+
# Copyright:: Copyright (C) 2019 BioRuby Project
|
6
|
+
# License:: The Ruby License
|
18
7
|
#
|
19
8
|
|
20
9
|
require 'bio'
|
21
|
-
require 'pp'
|
22
10
|
|
23
|
-
|
24
|
-
|
25
|
-
|
26
|
-
|
27
|
-
|
28
|
-
|
29
|
-
|
30
|
-
|
31
|
-
print rec
|
11
|
+
ARGV.each do |fn|
|
12
|
+
Bio::FlatFile.open(fn) do |ff|
|
13
|
+
ff.each do |entry|
|
14
|
+
next if /\A\s*\z/ =~ ff.entry_raw.to_s
|
15
|
+
na = entry.naseq
|
16
|
+
aa = na.translate
|
17
|
+
print aa.to_fasta(entry.definition, 70)
|
18
|
+
end
|
32
19
|
end
|
33
20
|
end
|
34
|
-
|
data/sample/rev_comp.cwl
ADDED
@@ -0,0 +1,23 @@
|
|
1
|
+
#!/usr/bin/env cwl-runner
|
2
|
+
|
3
|
+
cwlVersion: v1.0
|
4
|
+
class: CommandLineTool
|
5
|
+
baseCommand: [ruby]
|
6
|
+
|
7
|
+
inputs:
|
8
|
+
- id: script
|
9
|
+
type: File
|
10
|
+
default:
|
11
|
+
class: File
|
12
|
+
location: rev_comp.rb
|
13
|
+
inputBinding:
|
14
|
+
position: -1
|
15
|
+
- id: seqFile
|
16
|
+
type: File[]
|
17
|
+
inputBinding:
|
18
|
+
position: 1
|
19
|
+
|
20
|
+
outputs:
|
21
|
+
- id: out
|
22
|
+
type: stdout
|
23
|
+
stdout: $(inputs.script.nameroot)-$(inputs.seqFile[0].nameroot).fst
|
data/sample/rev_comp.rb
ADDED
@@ -0,0 +1,20 @@
|
|
1
|
+
#!/usr/bin/env ruby
|
2
|
+
#
|
3
|
+
# rev_comp.rb - Reverse complement DNA sequences
|
4
|
+
#
|
5
|
+
# Copyright:: Copyright (C) 2019 BioRuby Project
|
6
|
+
# License:: The Ruby License
|
7
|
+
#
|
8
|
+
|
9
|
+
require 'bio'
|
10
|
+
|
11
|
+
ARGV.each do |fn|
|
12
|
+
Bio::FlatFile.open(fn) do |ff|
|
13
|
+
ff.each do |entry|
|
14
|
+
next if /\A\s*\z/ =~ ff.entry_raw.to_s
|
15
|
+
na = entry.naseq
|
16
|
+
revcomp = na.reverse_complement
|
17
|
+
print revcomp.to_fasta("complement(#{entry.entry_id}) " + entry.definition, 70)
|
18
|
+
end
|
19
|
+
end
|
20
|
+
end
|
@@ -0,0 +1,91 @@
|
|
1
|
+
#
|
2
|
+
# test/network/bio/db/kegg/test_genes_hsa7422.rb - Unit test for Bio::KEGG::GENES
|
3
|
+
#
|
4
|
+
# Copyright:: Copyright (C) 2019 BioRuby Project <staff@bioruby.org>
|
5
|
+
# License:: The Ruby License
|
6
|
+
# Contributor:: kojix2 <2xijok@gmail.com>
|
7
|
+
#
|
8
|
+
|
9
|
+
# loading helper routine for testing bioruby
|
10
|
+
require 'pathname'
|
11
|
+
load Pathname.new(File.join(File.dirname(__FILE__), ['..'] * 4,
|
12
|
+
'bioruby_test_helper.rb')).cleanpath.to_s
|
13
|
+
|
14
|
+
# libraries needed for the tests
|
15
|
+
require 'test/unit'
|
16
|
+
require 'bio/db/kegg/genes'
|
17
|
+
require 'bio/io/togows'
|
18
|
+
|
19
|
+
module Bio
|
20
|
+
|
21
|
+
# This test is moved from test/unit/bio/db/kegg/test_genes.rb
|
22
|
+
# and modified to get sample data from the internet
|
23
|
+
# because of KEGG data license issue.
|
24
|
+
#
|
25
|
+
# Note that this test may fail due to the data entry updates in KEGG.
|
26
|
+
class TestBioKEGGGENES_hsa7422 < Test::Unit::TestCase
|
27
|
+
|
28
|
+
str = Bio::TogoWS::REST.entry("kegg-genes", "hsa:7422")
|
29
|
+
DATA = str.freeze
|
30
|
+
|
31
|
+
def setup
|
32
|
+
#filename = File.join(BioRubyTestDataPath, 'KEGG/hsa7422.gene')
|
33
|
+
@obj = Bio::KEGG::GENES.new(DATA)
|
34
|
+
end
|
35
|
+
|
36
|
+
def test_diseases_as_strings
|
37
|
+
expected = ["H01456 Diabetic nephropathy",
|
38
|
+
"H01457 Diabetic retinopathy",
|
39
|
+
"H01459 Diabetic neuropathy",
|
40
|
+
"H01529 Avascular necrosis of femoral head",
|
41
|
+
"H01709 Glucocorticoid-induced osteonecrosis"]
|
42
|
+
|
43
|
+
assert_equal(expected, @obj.diseases_as_strings)
|
44
|
+
end
|
45
|
+
|
46
|
+
def test_diseases_as_hash
|
47
|
+
expected = {"H01456"=>"Diabetic nephropathy",
|
48
|
+
"H01457"=>"Diabetic retinopathy",
|
49
|
+
"H01459"=>"Diabetic neuropathy",
|
50
|
+
"H01529"=>"Avascular necrosis of femoral head",
|
51
|
+
"H01709"=>"Glucocorticoid-induced osteonecrosis"}
|
52
|
+
assert_equal(expected, @obj.diseases_as_hash)
|
53
|
+
end
|
54
|
+
|
55
|
+
def test_drug_targets_as_strings
|
56
|
+
expected = ["Abicipar pegol: D11517",
|
57
|
+
"Aflibercept: D09574",
|
58
|
+
"Aflibercept beta: D10819",
|
59
|
+
"Bevacizumab: D06409",
|
60
|
+
"Bevasiranib sodium: D08874",
|
61
|
+
"Brolucizumab: D11083",
|
62
|
+
"Faricimab: D11516",
|
63
|
+
"Navicixizumab: D11126",
|
64
|
+
"Pegaptanib: D05386",
|
65
|
+
"Ranibizumab: D05697",
|
66
|
+
"Vanucizumab: D11244"]
|
67
|
+
assert_equal(expected, @obj.drug_targets_as_strings)
|
68
|
+
end
|
69
|
+
|
70
|
+
def test_networks_as_strings
|
71
|
+
expected = ["nt06114 PI3K signaling (virus)",
|
72
|
+
"nt06124 Chemokine signaling (virus)",
|
73
|
+
"nt06164 Kaposi sarcoma-associated herpesvirus (KSHV)",
|
74
|
+
"nt06214 PI3K signaling",
|
75
|
+
"nt06219 JAK-STAT signaling",
|
76
|
+
"nt06224 CXCR signaling",
|
77
|
+
"nt06225 HIF-1 signaling",
|
78
|
+
"nt06262 Pancreatic cancer",
|
79
|
+
"nt06264 Renal cell carcinoma",
|
80
|
+
"N00079 HIF-1 signaling pathway",
|
81
|
+
"N00080 Loss of VHL to HIF-1 signaling pathway",
|
82
|
+
"N00081 Mutation-inactivated VHL to HIF-1 signaling pathway",
|
83
|
+
"N00095 ERBB2-overexpression to EGF-Jak-STAT signaling pathway",
|
84
|
+
"N00157 KSHV vGPCR to GNB/G-ERK signaling pathway",
|
85
|
+
"N00179 KSHV K1 to PI3K-NFKB signaling pathway"]
|
86
|
+
assert_equal(expected, @obj.networks_as_strings)
|
87
|
+
end
|
88
|
+
|
89
|
+
end #class TestBioKEGGGENES_hsa7422
|
90
|
+
|
91
|
+
end #module Bio
|
@@ -479,7 +479,7 @@ module Bio
|
|
479
479
|
include TemplateTestBlastReportHsp
|
480
480
|
end
|
481
481
|
|
482
|
-
if
|
482
|
+
if Bio::Blast::Report.private_method_defined? :xmlparser_parse then
|
483
483
|
|
484
484
|
class TestBlastReportXMLParser < Test::Unit::TestCase
|
485
485
|
include TemplateTestBlastReport
|
@@ -497,7 +497,7 @@ module Bio
|
|
497
497
|
include TemplateTestBlastReportHsp
|
498
498
|
end
|
499
499
|
|
500
|
-
end #if
|
500
|
+
end #if
|
501
501
|
|
502
502
|
class TestBlastReportDefault < Test::Unit::TestCase
|
503
503
|
include TemplateTestBlastReport
|
@@ -1294,7 +1294,7 @@ module Bio
|
|
1294
1294
|
end
|
1295
1295
|
|
1296
1296
|
# Tests for XMLParser version
|
1297
|
-
if
|
1297
|
+
if Bio::Blast::Report.private_method_defined? :xmlparser_parse then
|
1298
1298
|
|
1299
1299
|
class TestBlastReportMultiXMLParser < Test::Unit::TestCase
|
1300
1300
|
include TemplateTestBlastReportMulti
|
@@ -1312,6 +1312,6 @@ module Bio
|
|
1312
1312
|
include TemplateTestBlastReportHspMulti
|
1313
1313
|
end
|
1314
1314
|
|
1315
|
-
end #if
|
1315
|
+
end #if
|
1316
1316
|
|
1317
1317
|
end # module Bio
|
@@ -182,6 +182,11 @@ END_OF_DATA
|
|
182
182
|
assert_equal(str, @obj.to_s)
|
183
183
|
end
|
184
184
|
|
185
|
+
def test_self_parse
|
186
|
+
obj2 = Bio::GFF::GFF2::Record.parse(@obj.to_s)
|
187
|
+
assert_equal(@obj, obj2)
|
188
|
+
end
|
189
|
+
|
185
190
|
def test_eqeq
|
186
191
|
obj2 = Bio::GFF::GFF2::Record.new(@obj.to_s)
|
187
192
|
assert_equal(true, @obj == obj2)
|