bio-bigbio 0.1.5 → 0.1.6
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/Gemfile +4 -8
- data/Gemfile.lock +60 -22
- data/LICENSE.txt +1 -1
- data/README.md +22 -3
- data/Rakefile +1 -1
- data/VERSION +1 -1
- data/bin/fasta_filter.rb +2 -0
- data/bin/getorf +1 -1
- data/bin/nt2aa.rb +1 -1
- data/bio-bigbio.gemspec +15 -28
- data/lib/bigbio.rb +1 -1
- data/spec/emitter_spec.rb +24 -24
- data/test/performance/translate_with_biolib.rb +1 -1
- data/test/performance/translate_with_bioruby.rb +1 -1
- metadata +45 -53
checksums.yaml
ADDED
@@ -0,0 +1,7 @@
|
|
1
|
+
---
|
2
|
+
SHA1:
|
3
|
+
metadata.gz: 358cea2b69da2db20774ab98b4c0dfaa561b32c6
|
4
|
+
data.tar.gz: 1e1baca80f0aa0fd26d579e158aa88e0361493e9
|
5
|
+
SHA512:
|
6
|
+
metadata.gz: ac532f773fd025ee927bfff89a96d142b2d9b9ca28f14a2bd368553a164026bd2530d4f4f95e2addcc30ae323d6b58ed5c30111335927c2e66630933ee16f75c
|
7
|
+
data.tar.gz: b228c3d346a4cf87f9fec71392336d9e66be1c721f8dae167553ecac5a92b689cd9420a0206ef31fee4dd4e9df43ea5a97472474a07cb4ed1da0bd553a013473
|
data/Gemfile
CHANGED
@@ -1,15 +1,11 @@
|
|
1
1
|
source "http://rubygems.org"
|
2
|
-
# Add dependencies required to use your gem here.
|
3
|
-
# Example:
|
4
|
-
# gem "activesupport", ">= 2.3.5"
|
5
2
|
gem "bio", ">= 1.4.1"
|
6
|
-
gem "bio-logger"
|
3
|
+
gem "bio-logger"
|
7
4
|
|
8
5
|
# Add dependencies to develop your gem here.
|
9
6
|
# Include everything needed to run rake, tests, features, etc.
|
10
7
|
group :development do
|
11
|
-
gem "rspec"
|
12
|
-
gem "bundler"
|
13
|
-
gem "jeweler"
|
14
|
-
gem "rcov", ">= 0"
|
8
|
+
gem "rspec"
|
9
|
+
gem "bundler"
|
10
|
+
gem "jeweler"
|
15
11
|
end
|
data/Gemfile.lock
CHANGED
@@ -1,34 +1,72 @@
|
|
1
1
|
GEM
|
2
2
|
remote: http://rubygems.org/
|
3
3
|
specs:
|
4
|
-
|
5
|
-
bio
|
4
|
+
addressable (2.3.6)
|
5
|
+
bio (1.4.3)
|
6
|
+
bio-logger (1.0.1)
|
6
7
|
log4r (>= 1.1.9)
|
7
|
-
|
8
|
-
|
9
|
-
|
10
|
-
|
8
|
+
builder (3.2.2)
|
9
|
+
descendants_tracker (0.0.4)
|
10
|
+
thread_safe (~> 0.3, >= 0.3.1)
|
11
|
+
diff-lcs (1.1.3)
|
12
|
+
faraday (0.9.0)
|
13
|
+
multipart-post (>= 1.2, < 3)
|
14
|
+
git (1.2.6)
|
15
|
+
github_api (0.11.3)
|
16
|
+
addressable (~> 2.3)
|
17
|
+
descendants_tracker (~> 0.0.1)
|
18
|
+
faraday (~> 0.8, < 0.10)
|
19
|
+
hashie (>= 1.2)
|
20
|
+
multi_json (>= 1.7.5, < 2.0)
|
21
|
+
nokogiri (~> 1.6.0)
|
22
|
+
oauth2
|
23
|
+
hashie (2.1.1)
|
24
|
+
highline (1.6.21)
|
25
|
+
jeweler (2.0.1)
|
26
|
+
builder
|
27
|
+
bundler (>= 1.0)
|
11
28
|
git (>= 1.2.5)
|
29
|
+
github_api
|
30
|
+
highline (>= 1.6.15)
|
31
|
+
nokogiri (>= 1.5.10)
|
12
32
|
rake
|
13
|
-
|
14
|
-
|
15
|
-
|
16
|
-
|
17
|
-
|
18
|
-
|
19
|
-
|
20
|
-
|
21
|
-
|
22
|
-
|
23
|
-
|
33
|
+
rdoc
|
34
|
+
json (1.8.1)
|
35
|
+
jwt (0.1.11)
|
36
|
+
multi_json (>= 1.5)
|
37
|
+
log4r (1.1.10)
|
38
|
+
mini_portile (0.5.3)
|
39
|
+
multi_json (1.9.3)
|
40
|
+
multi_xml (0.5.5)
|
41
|
+
multipart-post (2.0.0)
|
42
|
+
nokogiri (1.6.1)
|
43
|
+
mini_portile (~> 0.5.0)
|
44
|
+
oauth2 (0.9.3)
|
45
|
+
faraday (>= 0.8, < 0.10)
|
46
|
+
jwt (~> 0.1.8)
|
47
|
+
multi_json (~> 1.3)
|
48
|
+
multi_xml (~> 0.5)
|
49
|
+
rack (~> 1.2)
|
50
|
+
rack (1.5.2)
|
51
|
+
rake (10.3.1)
|
52
|
+
rdoc (4.1.1)
|
53
|
+
json (~> 1.4)
|
54
|
+
rspec (2.10.0)
|
55
|
+
rspec-core (~> 2.10.0)
|
56
|
+
rspec-expectations (~> 2.10.0)
|
57
|
+
rspec-mocks (~> 2.10.0)
|
58
|
+
rspec-core (2.10.1)
|
59
|
+
rspec-expectations (2.10.0)
|
60
|
+
diff-lcs (~> 1.1.3)
|
61
|
+
rspec-mocks (2.10.1)
|
62
|
+
thread_safe (0.3.3)
|
24
63
|
|
25
64
|
PLATFORMS
|
26
65
|
ruby
|
27
66
|
|
28
67
|
DEPENDENCIES
|
29
68
|
bio (>= 1.4.1)
|
30
|
-
bio-logger
|
31
|
-
bundler
|
32
|
-
jeweler
|
33
|
-
|
34
|
-
rspec (~> 2.3.0)
|
69
|
+
bio-logger
|
70
|
+
bundler
|
71
|
+
jeweler
|
72
|
+
rspec
|
data/LICENSE.txt
CHANGED
data/README.md
CHANGED
@@ -79,6 +79,12 @@ so to skip every other record
|
|
79
79
|
fasta_filter.rb --filter "num % 2 == 0"
|
80
80
|
```
|
81
81
|
|
82
|
+
Find all sequences that contain a stop codon in the sequence
|
83
|
+
|
84
|
+
```sh
|
85
|
+
fasta_filter.rb --filter 'rec.seq =~ /\*./' aa.fa
|
86
|
+
```
|
87
|
+
|
82
88
|
Rewrite all sequences to lower case, you can use the useful rewrite
|
83
89
|
option
|
84
90
|
|
@@ -86,7 +92,20 @@ option
|
|
86
92
|
fasta_filter.rb --rewrite 'rec.seq = rec.seq.downcase'
|
87
93
|
```
|
88
94
|
|
89
|
-
|
95
|
+
Rewrite the FASTA descriptors
|
96
|
+
|
97
|
+
```sh
|
98
|
+
fasta_filter.rb --rewrite 'rec.descr =~ /gene=(\S+)/; rec.descr = $1' test.fa
|
99
|
+
```
|
100
|
+
|
101
|
+
Filters and rewrites can be combined. The rest is up to your
|
102
|
+
imagination! One final example to remove low quality sequences from an
|
103
|
+
amino acid file (one amino acid dominates):
|
104
|
+
|
105
|
+
```sh
|
106
|
+
fasta_filter.rb --filter "count = {} ; rec.seq.each_char { |c| count[c] ||= 1 ; count[c] += 1 }; count.values.max.to_f/rec.seq.size < 0.30" < aa.fa > aa1.fa
|
107
|
+
```
|
108
|
+
|
90
109
|
|
91
110
|
# API Examples
|
92
111
|
|
@@ -227,9 +246,9 @@ If you use this software, please cite one of
|
|
227
246
|
|
228
247
|
# Biogems.info
|
229
248
|
|
230
|
-
This Biogem is published
|
249
|
+
This Biogem is published on [biogems.info](http://biogems.info/index.html#bigbio)
|
231
250
|
|
232
251
|
# Copyright
|
233
252
|
|
234
|
-
Copyright (c) 2011-
|
253
|
+
Copyright (c) 2011-2014 Pjotr Prins. See LICENSE for further details.
|
235
254
|
|
data/Rakefile
CHANGED
data/VERSION
CHANGED
@@ -1 +1 @@
|
|
1
|
-
0.1.
|
1
|
+
0.1.6
|
data/bin/fasta_filter.rb
CHANGED
@@ -60,6 +60,8 @@ class OptParser
|
|
60
60
|
opts.separator " fasta_filter.rb --filter \"rec.descr =~ /C. elegans/\" test/data/fasta/nt.fa"
|
61
61
|
opts.separator " fasta_filter.rb --filter \"num % 2 == 0\" test/data/fasta/nt.fa"
|
62
62
|
opts.separator " fasta_filter.rb test/data/fasta/nt.fa --rewrite 'rec.seq.downcase!'"
|
63
|
+
opts.separator " fasta_filter.rb --rewrite 'rec.descr =~ /gene=(\S+)/; rec.descr = $1' test.fa"
|
64
|
+
opts.separator " fasta_filter.rb --filter 'rec.seq =~ /\*./' aa.fa"
|
63
65
|
opts.separator ""
|
64
66
|
opts.separator "Other options:"
|
65
67
|
opts.separator ""
|
data/bin/getorf
CHANGED
data/bin/nt2aa.rb
CHANGED
data/bio-bigbio.gemspec
CHANGED
@@ -5,11 +5,11 @@
|
|
5
5
|
|
6
6
|
Gem::Specification.new do |s|
|
7
7
|
s.name = "bio-bigbio"
|
8
|
-
s.version = "0.1.
|
8
|
+
s.version = "0.1.6"
|
9
9
|
|
10
10
|
s.required_rubygems_version = Gem::Requirement.new(">= 0") if s.respond_to? :required_rubygems_version=
|
11
11
|
s.authors = ["Pjotr Prins"]
|
12
|
-
s.date = "
|
12
|
+
s.date = "2014-05-16"
|
13
13
|
s.description = "Fasta reader, ORF emitter, sequence translation"
|
14
14
|
s.email = "pjotr.public01@thebird.nl"
|
15
15
|
s.executables = ["fasta_filter.rb", "fasta_sort.rb", "getorf", "nt2aa.rb"]
|
@@ -63,44 +63,31 @@ Gem::Specification.new do |s|
|
|
63
63
|
s.homepage = "http://github.com/pjotrp/bigbio"
|
64
64
|
s.licenses = ["MIT"]
|
65
65
|
s.require_paths = ["lib"]
|
66
|
-
s.rubygems_version = "1.8.
|
66
|
+
s.rubygems_version = "1.8.23"
|
67
67
|
s.summary = "Low memory sequence emitters"
|
68
|
-
s.test_files = [
|
69
|
-
"spec/emitter_spec.rb",
|
70
|
-
"spec/predictorf_spec.rb",
|
71
|
-
"test/doctest/test_fasta.rb",
|
72
|
-
"test/doctest/test_frames.rb",
|
73
|
-
"test/doctest/test_getorf.rb",
|
74
|
-
"test/doctest/test_paired.rb",
|
75
|
-
"test/performance/translate_with_biolib.rb",
|
76
|
-
"test/performance/translate_with_bioruby.rb"
|
77
|
-
]
|
78
68
|
|
79
69
|
if s.respond_to? :specification_version then
|
80
70
|
s.specification_version = 3
|
81
71
|
|
82
72
|
if Gem::Version.new(Gem::VERSION) >= Gem::Version.new('1.2.0') then
|
83
73
|
s.add_runtime_dependency(%q<bio>, [">= 1.4.1"])
|
84
|
-
s.add_runtime_dependency(%q<bio-logger>, [">= 0
|
85
|
-
s.add_development_dependency(%q<rspec>, ["
|
86
|
-
s.add_development_dependency(%q<bundler>, ["
|
87
|
-
s.add_development_dependency(%q<jeweler>, ["
|
88
|
-
s.add_development_dependency(%q<rcov>, [">= 0"])
|
74
|
+
s.add_runtime_dependency(%q<bio-logger>, [">= 0"])
|
75
|
+
s.add_development_dependency(%q<rspec>, [">= 0"])
|
76
|
+
s.add_development_dependency(%q<bundler>, [">= 0"])
|
77
|
+
s.add_development_dependency(%q<jeweler>, [">= 0"])
|
89
78
|
else
|
90
79
|
s.add_dependency(%q<bio>, [">= 1.4.1"])
|
91
|
-
s.add_dependency(%q<bio-logger>, [">= 0
|
92
|
-
s.add_dependency(%q<rspec>, ["
|
93
|
-
s.add_dependency(%q<bundler>, ["
|
94
|
-
s.add_dependency(%q<jeweler>, ["
|
95
|
-
s.add_dependency(%q<rcov>, [">= 0"])
|
80
|
+
s.add_dependency(%q<bio-logger>, [">= 0"])
|
81
|
+
s.add_dependency(%q<rspec>, [">= 0"])
|
82
|
+
s.add_dependency(%q<bundler>, [">= 0"])
|
83
|
+
s.add_dependency(%q<jeweler>, [">= 0"])
|
96
84
|
end
|
97
85
|
else
|
98
86
|
s.add_dependency(%q<bio>, [">= 1.4.1"])
|
99
|
-
s.add_dependency(%q<bio-logger>, [">= 0
|
100
|
-
s.add_dependency(%q<rspec>, ["
|
101
|
-
s.add_dependency(%q<bundler>, ["
|
102
|
-
s.add_dependency(%q<jeweler>, ["
|
103
|
-
s.add_dependency(%q<rcov>, [">= 0"])
|
87
|
+
s.add_dependency(%q<bio-logger>, [">= 0"])
|
88
|
+
s.add_dependency(%q<rspec>, [">= 0"])
|
89
|
+
s.add_dependency(%q<bundler>, [">= 0"])
|
90
|
+
s.add_dependency(%q<jeweler>, [">= 0"])
|
104
91
|
end
|
105
92
|
end
|
106
93
|
|
data/lib/bigbio.rb
CHANGED
data/spec/emitter_spec.rb
CHANGED
@@ -10,7 +10,7 @@ describe Bio::Big::FastaEmitter, "when using the emitter" do
|
|
10
10
|
|
11
11
|
it "should emit small parts" do
|
12
12
|
s = ""
|
13
|
-
FastaEmitter.new("test/data/fasta/nt.fa",10).emit_seq do | part, index, tag, seq |
|
13
|
+
Bio::Big::FastaEmitter.new("test/data/fasta/nt.fa",10).emit_seq do | part, index, tag, seq |
|
14
14
|
# p [index, part, tag, seq]
|
15
15
|
s += seq
|
16
16
|
if index == 95 and part == :tail
|
@@ -38,7 +38,7 @@ describe Bio::Big::FastaEmitter, "when using the emitter" do
|
|
38
38
|
end
|
39
39
|
|
40
40
|
it "should emit large parts" do
|
41
|
-
FastaEmitter.new("test/data/fasta/nt.fa").emit_seq do | part, index, tag, seq |
|
41
|
+
Bio::Big::FastaEmitter.new("test/data/fasta/nt.fa").emit_seq do | part, index, tag, seq |
|
42
42
|
# p [index, part, tag, seq]
|
43
43
|
if index == 95
|
44
44
|
seq.should == "ATCATTAGCAACACCAGCTTCCTCTCTCTCGCTTCAAAGTTCACTACTCGTGGATCTCGTCTTCAGTGTACAGTATCAAGGGCTCGATCTGCGGTGGATGAGACATCAGATTCAGGAGCTTTTCAAAGAACTGCATCGACATCCGTAACTTCGTTTCAAAAGATTCCAATTCTCAGTTTCAGCTGAATCTGGTAGATACCATCTTTACATATCGTATGCTTGTCATGGGCTTCTAGATGCCTTTCATACTTAAAGATCAAAGGACTTGACGATGCAATAAGCTTCTCGTCTGTAAAACCC"
|
@@ -47,12 +47,12 @@ describe Bio::Big::FastaEmitter, "when using the emitter" do
|
|
47
47
|
end
|
48
48
|
end
|
49
49
|
|
50
|
-
describe Bio::Big::ShortFrameState, "when using the ShortFrameState" do
|
50
|
+
describe Bio::Big::ShortFrameState, "when using the Bio::Big::ShortFrameState" do
|
51
51
|
|
52
52
|
include Bio::Big
|
53
53
|
|
54
54
|
it "should find an ORF" do
|
55
|
-
fr = ShortFrameState.new "atggattaaatgtaatggatttaatgtaaa",0,0
|
55
|
+
fr = Bio::Big::ShortFrameState.new "atggattaaatgtaatggatttaatgtaaa",0,0
|
56
56
|
orfs = fr.get_stopstop_orfs
|
57
57
|
orfs.map{ | orf | orf.pos }.should == [ 3, 5 ]
|
58
58
|
orfs.map{ | orf | orf.to_seq }.should == ["ATGTAA", "TGGATTTAA"]
|
@@ -61,14 +61,14 @@ describe Bio::Big::ShortFrameState, "when using the ShortFrameState" do
|
|
61
61
|
orfs.map{ | orf | orf.to_seq }.should == ["ATGGATTAA","ATGTAA"]
|
62
62
|
end
|
63
63
|
it "should handle min_size" do
|
64
|
-
fr = ShortFrameState.new "atggattaaatgtaatggatttaatgtaaa",0,9
|
64
|
+
fr = Bio::Big::ShortFrameState.new "atggattaaatgtaatggatttaatgtaaa",0,9
|
65
65
|
orfs = fr.get_stopstop_orfs
|
66
66
|
orfs.map{ | orf | orf.to_seq }.should == [ "TGGATTTAA"]
|
67
67
|
orfs.map{ | orf | orf.pos }.should == [ 5 ]
|
68
68
|
fr.get_startstop_orfs.should == []
|
69
69
|
end
|
70
70
|
it "should find ORFs in" do
|
71
|
-
fr = ShortFrameState.new "atgttttaaatgtaatgttgttaaatgttttaaatgtaatgttgttaa",0,0
|
71
|
+
fr = Bio::Big::ShortFrameState.new "atgttttaaatgtaatgttgttaaatgttttaaatgtaatgttgttaa",0,0
|
72
72
|
orfs = fr.get_stopstop_orfs
|
73
73
|
orfs.map{ | orf | orf.to_seq }.should == ["ATGTAA", "TGTTGTTAA", "ATGTTTTAA", "ATGTAA", "TGTTGTTAA"]
|
74
74
|
orfs.map{ | orf | orf.pos }.should == [3, 5, 8, 11, 13]
|
@@ -108,17 +108,17 @@ describe Bio::Big::ShortFrameState, "when using the ShortFrameState" do
|
|
108
108
|
|
109
109
|
# Frame 0
|
110
110
|
minsize = 0
|
111
|
-
fr = ShortFrameState.new s,0,minsize
|
111
|
+
fr = Bio::Big::ShortFrameState.new s,0,minsize
|
112
112
|
orfs = fr.get_stopstop_orfs
|
113
113
|
orfs.map{ | orf | orf.to_seq }.should == []
|
114
114
|
|
115
115
|
# Frame 1
|
116
|
-
fr = ShortFrameState.new s[1..-1],0,minsize
|
116
|
+
fr = Bio::Big::ShortFrameState.new s[1..-1],0,minsize
|
117
117
|
os = fr.get_stopstop_orfs
|
118
118
|
os.map{ | orf | orf.to_seq }.should == ["TTNCGCGTGCCGCCTTCTTTCTCCTTTTTCTCTTTTACTTCTTCATCATCATCTTCTTCTTCTTCCTCTTCGATATTCGTCAGTGTGTGTATTTTGGGGAAAACTTTGTGA"]
|
119
119
|
orfs += os
|
120
120
|
# Frame 2
|
121
|
-
fr = ShortFrameState.new s[2..-1],0,minsize
|
121
|
+
fr = Bio::Big::ShortFrameState.new s[2..-1],0,minsize
|
122
122
|
os = fr.get_stopstop_orfs
|
123
123
|
os.map{ | orf | orf.to_seq }.should == ["GCGGANCGGTAA", "GAAAATCGCGGATGTGGCTTTCAAAGCTTCAAGGACTATCGATTGGGATGGTATGGCTAA", "GGTCCTTGTCACAGATGA", "GGCTCGTAG"]
|
124
124
|
orfs += os
|
@@ -132,14 +132,14 @@ describe Bio::Big::ShortFrameState, "when using the ShortFrameState" do
|
|
132
132
|
|
133
133
|
# Frame 0
|
134
134
|
minsize = 0
|
135
|
-
fr = ShortFrameState.new s,0,minsize
|
135
|
+
fr = Bio::Big::ShortFrameState.new s,0,minsize
|
136
136
|
orfs = fr.get_startstop_orfs
|
137
137
|
|
138
138
|
# Frame 1
|
139
|
-
fr = ShortFrameState.new s[1..-1],0,minsize
|
139
|
+
fr = Bio::Big::ShortFrameState.new s[1..-1],0,minsize
|
140
140
|
orfs += fr.get_startstop_orfs
|
141
141
|
# Frame 2
|
142
|
-
fr = ShortFrameState.new s[2..-1],0,minsize
|
142
|
+
fr = Bio::Big::ShortFrameState.new s[2..-1],0,minsize
|
143
143
|
orfs += fr.get_startstop_orfs
|
144
144
|
orfs.map{ | orf | orf.to_seq }.should == []
|
145
145
|
orfs.size.should == 0
|
@@ -151,11 +151,11 @@ describe Bio::Big::ShortFrameState, "when combining frames" do
|
|
151
151
|
it "should combine a forward frame" do
|
152
152
|
s1 = "atggattaaatgtaata"
|
153
153
|
s2 = "atggatttaatgtaaa"
|
154
|
-
fr = ShortFrameState.new s1,0,0
|
154
|
+
fr = Bio::Big::ShortFrameState.new s1,0,0
|
155
155
|
fr.ntseq_pos.should == 0
|
156
156
|
orfs = fr.get_stopstop_orfs
|
157
157
|
orfs.size == 1 # in codons
|
158
|
-
fr3 = FrameCodonHelpers::CreateShortFrame.create_right(fr,orfs,s2)
|
158
|
+
fr3 = Bio::Big::FrameCodonHelpers::CreateShortFrame.create_right(fr,orfs,s2)
|
159
159
|
fr3.ntseq_pos.should == 15
|
160
160
|
fr3.codons.to_seq.should == "TAATGGATTTAATGTAAA"
|
161
161
|
norfs = fr3.get_stopstop_orfs
|
@@ -169,11 +169,11 @@ describe Bio::Big::ShortFrameState, "when combining frames" do
|
|
169
169
|
# ......---===xx
|
170
170
|
s2 = "atggatttaattattataaa"
|
171
171
|
# x======xxx======xxx.
|
172
|
-
fr = ShortFrameState.new s1,0,0
|
172
|
+
fr = Bio::Big::ShortFrameState.new s1,0,0
|
173
173
|
fr.ntseq_pos.should == 0
|
174
174
|
orfs = fr.get_stopstop_orfs
|
175
175
|
orfs.size == 0 # in codons
|
176
|
-
fr3 = FrameCodonHelpers::CreateShortFrame.create_right(fr,orfs,s2)
|
176
|
+
fr3 = Bio::Big::FrameCodonHelpers::CreateShortFrame.create_right(fr,orfs,s2)
|
177
177
|
fr3.ntseq_pos.should == 0
|
178
178
|
fr3.codons.to_seq.should == "ATGGATTAAATGTAATGGATTTAATTATTATAA"
|
179
179
|
norfs = fr3.get_stopstop_orfs
|
@@ -187,11 +187,11 @@ describe Bio::Big::ShortFrameState, "when combining frames" do
|
|
187
187
|
# ......---===xx
|
188
188
|
s2 = "atggatttaatgtaaa"
|
189
189
|
# x======xxx
|
190
|
-
fr = ShortFrameState.new s1,0,0
|
190
|
+
fr = Bio::Big::ShortFrameState.new s1,0,0
|
191
191
|
fr.ntseq_pos.should == 0
|
192
192
|
orfs = fr.get_stopstop_orfs
|
193
193
|
orfs.size == 0 # in codons
|
194
|
-
fr3 = FrameCodonHelpers::CreateShortFrame.create_right(fr,orfs,s2)
|
194
|
+
fr3 = Bio::Big::FrameCodonHelpers::CreateShortFrame.create_right(fr,orfs,s2)
|
195
195
|
# p fr3
|
196
196
|
fr3.ntseq_pos.should == 0 # on the combined sequences
|
197
197
|
fr3.codons.to_seq.should == "ATGGATTAAATGTAATGGATTTAATGTAAA"
|
@@ -221,14 +221,14 @@ describe Bio::Big::ShortFrameState, "when combining frames" do
|
|
221
221
|
s1 = "atggattaaatgta"
|
222
222
|
# ......xxx=====
|
223
223
|
# now move the other way, as sequences get emitted on the left
|
224
|
-
fr = ShortReversedFrameState.new s2,0,0
|
224
|
+
fr = Bio::Big::ShortReversedFrameState.new s2,0,0
|
225
225
|
# p fr
|
226
226
|
fr.codons.to_seq.should == "ATTTAAATGGATTTAATGTAAATT"
|
227
227
|
fr.ntseq_pos.should == 0
|
228
228
|
orfs = fr.get_stopstop_orfs
|
229
229
|
orfs.map{ | orf | orf.to_seq }.should == ["ATGGATTTAATGTAA"]
|
230
230
|
orfs.first.pos.should == 2 # in codons
|
231
|
-
fr3 = FrameCodonHelpers::CreateShortFrame.create_left(fr,orfs,s1)
|
231
|
+
fr3 = Bio::Big::FrameCodonHelpers::CreateShortFrame.create_left(fr,orfs,s1)
|
232
232
|
fr3.ntseq_pos.should == 18 # 6 codons
|
233
233
|
fr3.codons.to_seq.should == "ATGGATTAAATGTATATTTAA"
|
234
234
|
norfs = fr3.get_stopstop_orfs
|
@@ -244,9 +244,9 @@ describe Bio::Big::OrfEmitter, "when using the ORF emitter" do
|
|
244
244
|
include Bio::Big
|
245
245
|
|
246
246
|
it "should emit STOP-STOP ORFs in all frames" do
|
247
|
-
f = FastaEmitter.new("test/data/fasta/nt.fa")
|
247
|
+
f = Bio::Big::FastaEmitter.new("test/data/fasta/nt.fa")
|
248
248
|
seqs = []
|
249
|
-
OrfEmitter.new(f,:stopstop)::emit_seq do | frame, index, tag, pos, seq |
|
249
|
+
Bio::Big::OrfEmitter.new(f,:stopstop)::emit_seq do | frame, index, tag, pos, seq |
|
250
250
|
break if index != 0
|
251
251
|
if frame == 0 and index == 0 and pos == 39
|
252
252
|
seq.should == "TTNCGCGTGCCGCCTTCTTTCTCCTTTTTCTCTTTTACTTCTTCATCATCATCTTCTTCTTCTTCCTCTTCGATATTCGTCAGTGTGTGTATTTTGGGGAAAACTTTGTGA"
|
@@ -259,9 +259,9 @@ describe Bio::Big::OrfEmitter, "when using the ORF emitter" do
|
|
259
259
|
seqs.join(';')[50..350].should == "TNCGCGTGCCGCCTTCTTTCTCCTTTTTCTCTTTTACTTCTTCATCATCATCTTCTTCTTCTTCCTCTTCGATATTCGTCAGTGTGTGTATTTTGGGGAAAACTTTGTGA;GCAAAGAGCGAGAAAATGAGCGGANCGGTAAGAAAATCGCGGATGTGGCTTTCAAAGCTTCAAGGACTATCGATTGGGATGGTATGGCTAAGGTCCTTGTCACAGATGAGGCTCGTAGAGAGTTCTCTAACCTTCGTCGTGCTTTCGATGAGGTTAACACACAGCTCCAGACCAAATTTAGTCAGGACCT"
|
260
260
|
end
|
261
261
|
it "should emit STOP-STOP ORFs in all frames using a shorter emitter" do
|
262
|
-
f = FastaEmitter.new("test/data/fasta/nt.fa",150)
|
262
|
+
f = Bio::Big::FastaEmitter.new("test/data/fasta/nt.fa",150)
|
263
263
|
seqs = []
|
264
|
-
OrfEmitter.new(f,:stopstop)::emit_seq do | frame, index, tag, pos, seq |
|
264
|
+
Bio::Big::OrfEmitter.new(f,:stopstop)::emit_seq do | frame, index, tag, pos, seq |
|
265
265
|
break if index != 0
|
266
266
|
if frame == 0 and index == 0 and pos == 39
|
267
267
|
seq.should == "TTNCGCGTGCCGCCTTCTTTCTCCTTTTTCTCTTTTACTTCTTCATCATCATCTTCTTCTTCTTCCTCTTCGATATTCGTCAGTGTGTGTATTTTGGGGAAAACTTTGTGA"
|
metadata
CHANGED
@@ -1,82 +1,85 @@
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
2
2
|
name: bio-bigbio
|
3
3
|
version: !ruby/object:Gem::Version
|
4
|
-
version: 0.1.
|
5
|
-
prerelease:
|
4
|
+
version: 0.1.6
|
6
5
|
platform: ruby
|
7
6
|
authors:
|
8
7
|
- Pjotr Prins
|
9
8
|
autorequire:
|
10
9
|
bindir: bin
|
11
10
|
cert_chain: []
|
12
|
-
date:
|
11
|
+
date: 2014-05-16 00:00:00.000000000 Z
|
13
12
|
dependencies:
|
14
13
|
- !ruby/object:Gem::Dependency
|
15
14
|
name: bio
|
16
|
-
requirement:
|
17
|
-
none: false
|
15
|
+
requirement: !ruby/object:Gem::Requirement
|
18
16
|
requirements:
|
19
|
-
- -
|
17
|
+
- - ">="
|
20
18
|
- !ruby/object:Gem::Version
|
21
19
|
version: 1.4.1
|
22
20
|
type: :runtime
|
23
21
|
prerelease: false
|
24
|
-
version_requirements:
|
22
|
+
version_requirements: !ruby/object:Gem::Requirement
|
23
|
+
requirements:
|
24
|
+
- - ">="
|
25
|
+
- !ruby/object:Gem::Version
|
26
|
+
version: 1.4.1
|
25
27
|
- !ruby/object:Gem::Dependency
|
26
28
|
name: bio-logger
|
27
|
-
requirement:
|
28
|
-
none: false
|
29
|
+
requirement: !ruby/object:Gem::Requirement
|
29
30
|
requirements:
|
30
|
-
- -
|
31
|
+
- - ">="
|
31
32
|
- !ruby/object:Gem::Version
|
32
|
-
version: 0
|
33
|
+
version: '0'
|
33
34
|
type: :runtime
|
34
35
|
prerelease: false
|
35
|
-
version_requirements:
|
36
|
+
version_requirements: !ruby/object:Gem::Requirement
|
37
|
+
requirements:
|
38
|
+
- - ">="
|
39
|
+
- !ruby/object:Gem::Version
|
40
|
+
version: '0'
|
36
41
|
- !ruby/object:Gem::Dependency
|
37
42
|
name: rspec
|
38
|
-
requirement:
|
39
|
-
none: false
|
43
|
+
requirement: !ruby/object:Gem::Requirement
|
40
44
|
requirements:
|
41
|
-
- -
|
45
|
+
- - ">="
|
42
46
|
- !ruby/object:Gem::Version
|
43
|
-
version:
|
47
|
+
version: '0'
|
44
48
|
type: :development
|
45
49
|
prerelease: false
|
46
|
-
version_requirements:
|
50
|
+
version_requirements: !ruby/object:Gem::Requirement
|
51
|
+
requirements:
|
52
|
+
- - ">="
|
53
|
+
- !ruby/object:Gem::Version
|
54
|
+
version: '0'
|
47
55
|
- !ruby/object:Gem::Dependency
|
48
56
|
name: bundler
|
49
|
-
requirement:
|
50
|
-
none: false
|
57
|
+
requirement: !ruby/object:Gem::Requirement
|
51
58
|
requirements:
|
52
|
-
- -
|
59
|
+
- - ">="
|
53
60
|
- !ruby/object:Gem::Version
|
54
|
-
version:
|
61
|
+
version: '0'
|
55
62
|
type: :development
|
56
63
|
prerelease: false
|
57
|
-
version_requirements:
|
64
|
+
version_requirements: !ruby/object:Gem::Requirement
|
65
|
+
requirements:
|
66
|
+
- - ">="
|
67
|
+
- !ruby/object:Gem::Version
|
68
|
+
version: '0'
|
58
69
|
- !ruby/object:Gem::Dependency
|
59
70
|
name: jeweler
|
60
|
-
requirement:
|
61
|
-
none: false
|
71
|
+
requirement: !ruby/object:Gem::Requirement
|
62
72
|
requirements:
|
63
|
-
- -
|
73
|
+
- - ">="
|
64
74
|
- !ruby/object:Gem::Version
|
65
|
-
version:
|
75
|
+
version: '0'
|
66
76
|
type: :development
|
67
77
|
prerelease: false
|
68
|
-
version_requirements:
|
69
|
-
- !ruby/object:Gem::Dependency
|
70
|
-
name: rcov
|
71
|
-
requirement: &27199840 !ruby/object:Gem::Requirement
|
72
|
-
none: false
|
78
|
+
version_requirements: !ruby/object:Gem::Requirement
|
73
79
|
requirements:
|
74
|
-
- -
|
80
|
+
- - ">="
|
75
81
|
- !ruby/object:Gem::Version
|
76
82
|
version: '0'
|
77
|
-
type: :development
|
78
|
-
prerelease: false
|
79
|
-
version_requirements: *27199840
|
80
83
|
description: Fasta reader, ORF emitter, sequence translation
|
81
84
|
email: pjotr.public01@thebird.nl
|
82
85
|
executables:
|
@@ -89,7 +92,7 @@ extra_rdoc_files:
|
|
89
92
|
- LICENSE.txt
|
90
93
|
- README.md
|
91
94
|
files:
|
92
|
-
- .travis.yml
|
95
|
+
- ".travis.yml"
|
93
96
|
- Gemfile
|
94
97
|
- Gemfile.lock
|
95
98
|
- LICENSE.txt
|
@@ -133,37 +136,26 @@ files:
|
|
133
136
|
homepage: http://github.com/pjotrp/bigbio
|
134
137
|
licenses:
|
135
138
|
- MIT
|
139
|
+
metadata: {}
|
136
140
|
post_install_message:
|
137
141
|
rdoc_options: []
|
138
142
|
require_paths:
|
139
143
|
- lib
|
140
144
|
required_ruby_version: !ruby/object:Gem::Requirement
|
141
|
-
none: false
|
142
145
|
requirements:
|
143
|
-
- -
|
146
|
+
- - ">="
|
144
147
|
- !ruby/object:Gem::Version
|
145
148
|
version: '0'
|
146
|
-
segments:
|
147
|
-
- 0
|
148
|
-
hash: 2941883289909211187
|
149
149
|
required_rubygems_version: !ruby/object:Gem::Requirement
|
150
|
-
none: false
|
151
150
|
requirements:
|
152
|
-
- -
|
151
|
+
- - ">="
|
153
152
|
- !ruby/object:Gem::Version
|
154
153
|
version: '0'
|
155
154
|
requirements: []
|
156
155
|
rubyforge_project:
|
157
|
-
rubygems_version:
|
156
|
+
rubygems_version: 2.0.3
|
158
157
|
signing_key:
|
159
158
|
specification_version: 3
|
160
159
|
summary: Low memory sequence emitters
|
161
|
-
test_files:
|
162
|
-
|
163
|
-
- spec/predictorf_spec.rb
|
164
|
-
- test/doctest/test_fasta.rb
|
165
|
-
- test/doctest/test_frames.rb
|
166
|
-
- test/doctest/test_getorf.rb
|
167
|
-
- test/doctest/test_paired.rb
|
168
|
-
- test/performance/translate_with_biolib.rb
|
169
|
-
- test/performance/translate_with_bioruby.rb
|
160
|
+
test_files: []
|
161
|
+
has_rdoc:
|