bio 0.7.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/bin/bioruby +107 -0
- data/bin/br_biofetch.rb +59 -0
- data/bin/br_bioflat.rb +294 -0
- data/bin/br_biogetseq.rb +57 -0
- data/bin/br_pmfetch.rb +431 -0
- data/doc/BioRuby.rd.ja +225 -0
- data/doc/Changes-0.7.rd +236 -0
- data/doc/Design.rd.ja +341 -0
- data/doc/KEGG_API.rd +1437 -0
- data/doc/KEGG_API.rd.ja +1399 -0
- data/doc/TODO.rd.ja +138 -0
- data/doc/Tutorial.rd +1138 -0
- data/doc/Tutorial.rd.ja +2110 -0
- data/etc/bioinformatics/seqdatabase.ini +210 -0
- data/lib/bio.rb +256 -0
- data/lib/bio/alignment.rb +1906 -0
- data/lib/bio/appl/bl2seq/report.rb +350 -0
- data/lib/bio/appl/blast.rb +269 -0
- data/lib/bio/appl/blast/format0.rb +1402 -0
- data/lib/bio/appl/blast/format8.rb +95 -0
- data/lib/bio/appl/blast/report.rb +652 -0
- data/lib/bio/appl/blast/rexml.rb +151 -0
- data/lib/bio/appl/blast/wublast.rb +553 -0
- data/lib/bio/appl/blast/xmlparser.rb +222 -0
- data/lib/bio/appl/blat/report.rb +392 -0
- data/lib/bio/appl/clustalw.rb +191 -0
- data/lib/bio/appl/clustalw/report.rb +154 -0
- data/lib/bio/appl/emboss.rb +68 -0
- data/lib/bio/appl/fasta.rb +262 -0
- data/lib/bio/appl/fasta/format10.rb +428 -0
- data/lib/bio/appl/fasta/format6.rb +37 -0
- data/lib/bio/appl/genscan/report.rb +570 -0
- data/lib/bio/appl/hmmer.rb +129 -0
- data/lib/bio/appl/hmmer/report.rb +556 -0
- data/lib/bio/appl/mafft.rb +222 -0
- data/lib/bio/appl/mafft/report.rb +119 -0
- data/lib/bio/appl/psort.rb +555 -0
- data/lib/bio/appl/psort/report.rb +473 -0
- data/lib/bio/appl/sim4.rb +134 -0
- data/lib/bio/appl/sim4/report.rb +501 -0
- data/lib/bio/appl/sosui/report.rb +166 -0
- data/lib/bio/appl/spidey/report.rb +604 -0
- data/lib/bio/appl/targetp/report.rb +283 -0
- data/lib/bio/appl/tmhmm/report.rb +238 -0
- data/lib/bio/command.rb +166 -0
- data/lib/bio/data/aa.rb +354 -0
- data/lib/bio/data/codontable.rb +740 -0
- data/lib/bio/data/na.rb +226 -0
- data/lib/bio/db.rb +340 -0
- data/lib/bio/db/aaindex.rb +280 -0
- data/lib/bio/db/embl/common.rb +332 -0
- data/lib/bio/db/embl/embl.rb +446 -0
- data/lib/bio/db/embl/sptr.rb +954 -0
- data/lib/bio/db/embl/swissprot.rb +32 -0
- data/lib/bio/db/embl/trembl.rb +31 -0
- data/lib/bio/db/embl/uniprot.rb +32 -0
- data/lib/bio/db/fantom.rb +604 -0
- data/lib/bio/db/fasta.rb +869 -0
- data/lib/bio/db/genbank/common.rb +299 -0
- data/lib/bio/db/genbank/ddbj.rb +34 -0
- data/lib/bio/db/genbank/genbank.rb +354 -0
- data/lib/bio/db/genbank/genpept.rb +73 -0
- data/lib/bio/db/genbank/refseq.rb +31 -0
- data/lib/bio/db/gff.rb +106 -0
- data/lib/bio/db/go.rb +497 -0
- data/lib/bio/db/kegg/brite.rb +51 -0
- data/lib/bio/db/kegg/cell.rb +88 -0
- data/lib/bio/db/kegg/compound.rb +130 -0
- data/lib/bio/db/kegg/enzyme.rb +125 -0
- data/lib/bio/db/kegg/expression.rb +173 -0
- data/lib/bio/db/kegg/genes.rb +293 -0
- data/lib/bio/db/kegg/genome.rb +362 -0
- data/lib/bio/db/kegg/glycan.rb +213 -0
- data/lib/bio/db/kegg/keggtab.rb +418 -0
- data/lib/bio/db/kegg/kgml.rb +299 -0
- data/lib/bio/db/kegg/ko.rb +178 -0
- data/lib/bio/db/kegg/reaction.rb +97 -0
- data/lib/bio/db/litdb.rb +131 -0
- data/lib/bio/db/medline.rb +317 -0
- data/lib/bio/db/nbrf.rb +199 -0
- data/lib/bio/db/pdb.rb +38 -0
- data/lib/bio/db/pdb/atom.rb +60 -0
- data/lib/bio/db/pdb/chain.rb +117 -0
- data/lib/bio/db/pdb/model.rb +106 -0
- data/lib/bio/db/pdb/pdb.rb +1682 -0
- data/lib/bio/db/pdb/residue.rb +122 -0
- data/lib/bio/db/pdb/utils.rb +234 -0
- data/lib/bio/db/prosite.rb +616 -0
- data/lib/bio/db/rebase.rb +417 -0
- data/lib/bio/db/transfac.rb +387 -0
- data/lib/bio/feature.rb +201 -0
- data/lib/bio/io/brdb.rb +103 -0
- data/lib/bio/io/das.rb +471 -0
- data/lib/bio/io/dbget.rb +212 -0
- data/lib/bio/io/ddbjxml.rb +614 -0
- data/lib/bio/io/fastacmd.rb +123 -0
- data/lib/bio/io/fetch.rb +114 -0
- data/lib/bio/io/flatfile.rb +496 -0
- data/lib/bio/io/flatfile/bdb.rb +266 -0
- data/lib/bio/io/flatfile/index.rb +1308 -0
- data/lib/bio/io/flatfile/indexer.rb +778 -0
- data/lib/bio/io/higet.rb +92 -0
- data/lib/bio/io/keggapi.rb +863 -0
- data/lib/bio/io/pubmed.rb +189 -0
- data/lib/bio/io/registry.rb +308 -0
- data/lib/bio/io/soapwsdl.rb +114 -0
- data/lib/bio/io/sql.rb +428 -0
- data/lib/bio/location.rb +650 -0
- data/lib/bio/pathway.rb +991 -0
- data/lib/bio/reference.rb +308 -0
- data/lib/bio/sequence.rb +593 -0
- data/lib/bio/shell.rb +51 -0
- data/lib/bio/shell/core.rb +512 -0
- data/lib/bio/shell/plugin/codon.rb +228 -0
- data/lib/bio/shell/plugin/entry.rb +85 -0
- data/lib/bio/shell/plugin/flatfile.rb +119 -0
- data/lib/bio/shell/plugin/keggapi.rb +187 -0
- data/lib/bio/shell/plugin/midi.rb +448 -0
- data/lib/bio/shell/plugin/obda.rb +63 -0
- data/lib/bio/shell/plugin/seq.rb +238 -0
- data/lib/bio/shell/session.rb +214 -0
- data/lib/bio/util/color_scheme.rb +214 -0
- data/lib/bio/util/color_scheme/buried.rb +78 -0
- data/lib/bio/util/color_scheme/helix.rb +78 -0
- data/lib/bio/util/color_scheme/hydropathy.rb +83 -0
- data/lib/bio/util/color_scheme/nucleotide.rb +50 -0
- data/lib/bio/util/color_scheme/strand.rb +78 -0
- data/lib/bio/util/color_scheme/taylor.rb +69 -0
- data/lib/bio/util/color_scheme/turn.rb +78 -0
- data/lib/bio/util/color_scheme/zappo.rb +69 -0
- data/lib/bio/util/contingency_table.rb +337 -0
- data/lib/bio/util/sirna.rb +306 -0
- data/lib/bioruby.rb +34 -0
- data/sample/biofetch.rb +475 -0
- data/sample/color_scheme_na.rb +99 -0
- data/sample/dbget +37 -0
- data/sample/fasta2tab.rb +99 -0
- data/sample/fsplit.rb +51 -0
- data/sample/gb2fasta.rb +31 -0
- data/sample/gb2tab.rb +325 -0
- data/sample/gbtab2mysql.rb +161 -0
- data/sample/genes2nuc.rb +33 -0
- data/sample/genes2pep.rb +33 -0
- data/sample/genes2tab.rb +81 -0
- data/sample/genome2rb.rb +29 -0
- data/sample/genome2tab.rb +76 -0
- data/sample/goslim.rb +311 -0
- data/sample/gt2fasta.rb +47 -0
- data/sample/pmfetch.rb +42 -0
- data/sample/pmsearch.rb +42 -0
- data/sample/psortplot_html.rb +222 -0
- data/sample/ssearch2tab.rb +96 -0
- data/sample/tdiary.rb +158 -0
- data/sample/tfastx2tab.rb +100 -0
- data/sample/vs-genes.rb +212 -0
- data/test/data/SOSUI/sample.report +11 -0
- data/test/data/TMHMM/sample.report +21 -0
- data/test/data/blast/eco:b0002.faa +15 -0
- data/test/data/blast/eco:b0002.faa.m0 +128 -0
- data/test/data/blast/eco:b0002.faa.m7 +65 -0
- data/test/data/blast/eco:b0002.faa.m8 +1 -0
- data/test/data/embl/AB090716.embl +65 -0
- data/test/data/genscan/sample.report +63 -0
- data/test/data/prosite/prosite.dat +2233 -0
- data/test/data/refseq/nm_126355.entret +64 -0
- data/test/data/uniprot/p53_human.uniprot +1456 -0
- data/test/runner.rb +10 -0
- data/test/unit/bio/appl/blast/test_report.rb +427 -0
- data/test/unit/bio/appl/blast/test_xmlparser.rb +400 -0
- data/test/unit/bio/appl/genscan/test_report.rb +195 -0
- data/test/unit/bio/appl/sosui/test_report.rb +94 -0
- data/test/unit/bio/appl/targetp/test_report.rb +159 -0
- data/test/unit/bio/appl/test_blast.rb +159 -0
- data/test/unit/bio/appl/test_fasta.rb +142 -0
- data/test/unit/bio/appl/tmhmm/test_report.rb +139 -0
- data/test/unit/bio/data/test_aa.rb +103 -0
- data/test/unit/bio/data/test_codontable.rb +120 -0
- data/test/unit/bio/data/test_na.rb +89 -0
- data/test/unit/bio/db/embl/test_common.rb +130 -0
- data/test/unit/bio/db/embl/test_embl.rb +227 -0
- data/test/unit/bio/db/embl/test_sptr.rb +268 -0
- data/test/unit/bio/db/embl/test_uniprot.rb +44 -0
- data/test/unit/bio/db/kegg/test_genes.rb +58 -0
- data/test/unit/bio/db/test_fasta.rb +263 -0
- data/test/unit/bio/db/test_gff.rb +140 -0
- data/test/unit/bio/db/test_prosite.rb +1450 -0
- data/test/unit/bio/io/test_ddbjxml.rb +87 -0
- data/test/unit/bio/io/test_soapwsdl.rb +45 -0
- data/test/unit/bio/shell/plugin/test_seq.rb +175 -0
- data/test/unit/bio/test_alignment.rb +1028 -0
- data/test/unit/bio/test_command.rb +71 -0
- data/test/unit/bio/test_db.rb +109 -0
- data/test/unit/bio/test_feature.rb +128 -0
- data/test/unit/bio/test_location.rb +51 -0
- data/test/unit/bio/test_pathway.rb +485 -0
- data/test/unit/bio/test_sequence.rb +386 -0
- data/test/unit/bio/test_shell.rb +31 -0
- data/test/unit/bio/util/test_color_scheme.rb +45 -0
- data/test/unit/bio/util/test_contingency_table.rb +106 -0
- data/test/unit/bio/util/test_sirna.rb +258 -0
- metadata +295 -0
|
@@ -0,0 +1,428 @@
|
|
|
1
|
+
#
|
|
2
|
+
# bio/appl/fasta/format10.rb - FASTA output (-m 10) parser
|
|
3
|
+
#
|
|
4
|
+
# Copyright (C) 2002 KATAYAMA Toshiaki <k@bioruby.org>
|
|
5
|
+
#
|
|
6
|
+
# This library is free software; you can redistribute it and/or
|
|
7
|
+
# modify it under the terms of the GNU Lesser General Public
|
|
8
|
+
# License as published by the Free Software Foundation; either
|
|
9
|
+
# version 2 of the License, or (at your option) any later version.
|
|
10
|
+
#
|
|
11
|
+
# This library is distributed in the hope that it will be useful,
|
|
12
|
+
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
13
|
+
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
14
|
+
# Lesser General Public License for more details.
|
|
15
|
+
#
|
|
16
|
+
# You should have received a copy of the GNU Lesser General Public
|
|
17
|
+
# License along with this library; if not, write to the Free Software
|
|
18
|
+
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
19
|
+
#
|
|
20
|
+
# $Id: format10.rb,v 1.6 2005/09/26 13:00:05 k Exp $
|
|
21
|
+
#
|
|
22
|
+
|
|
23
|
+
require 'bio/appl/fasta'
|
|
24
|
+
|
|
25
|
+
module Bio
|
|
26
|
+
class Fasta
|
|
27
|
+
|
|
28
|
+
class Report
|
|
29
|
+
|
|
30
|
+
def initialize(data)
|
|
31
|
+
# header lines - brief list of the hits
|
|
32
|
+
if data.sub!(/.*\nThe best scores are/m, '')
|
|
33
|
+
data.sub!(/(.*)\n\n>>>/m, '')
|
|
34
|
+
@list = "The best scores are" + $1
|
|
35
|
+
else
|
|
36
|
+
data.sub!(/.*\n!!\s+/m, '')
|
|
37
|
+
data.sub!(/.*/) { |x| @list = x; '' }
|
|
38
|
+
end
|
|
39
|
+
|
|
40
|
+
# body lines - fasta execution result
|
|
41
|
+
program, *hits = data.split(/\n>>/)
|
|
42
|
+
|
|
43
|
+
# trailing lines - log messages of the execution
|
|
44
|
+
@log = hits.pop
|
|
45
|
+
@log.sub!(/.*<\n/m, '')
|
|
46
|
+
@log.strip!
|
|
47
|
+
|
|
48
|
+
# parse results
|
|
49
|
+
@program = Program.new(program)
|
|
50
|
+
@hits = []
|
|
51
|
+
|
|
52
|
+
hits.each do |x|
|
|
53
|
+
@hits.push(Hit.new(x))
|
|
54
|
+
end
|
|
55
|
+
end
|
|
56
|
+
attr_reader :list, :log, :program, :hits
|
|
57
|
+
|
|
58
|
+
def each
|
|
59
|
+
@hits.each do |x|
|
|
60
|
+
yield x
|
|
61
|
+
end
|
|
62
|
+
end
|
|
63
|
+
|
|
64
|
+
def threshold(evalue_max = 0.1)
|
|
65
|
+
list = []
|
|
66
|
+
@hits.each do |x|
|
|
67
|
+
list.push(x) if x.evalue < evalue_max
|
|
68
|
+
end
|
|
69
|
+
return list
|
|
70
|
+
end
|
|
71
|
+
|
|
72
|
+
def lap_over(length_min = 0)
|
|
73
|
+
list = []
|
|
74
|
+
@hits.each do |x|
|
|
75
|
+
list.push(x) if x.overlap > length_min
|
|
76
|
+
end
|
|
77
|
+
return list
|
|
78
|
+
end
|
|
79
|
+
|
|
80
|
+
|
|
81
|
+
class Program
|
|
82
|
+
def initialize(data)
|
|
83
|
+
@definition, *program = data.split(/\n/)
|
|
84
|
+
@program = {}
|
|
85
|
+
|
|
86
|
+
pat = /;\s+([^:]+):\s+(.*)/
|
|
87
|
+
|
|
88
|
+
program.each do |x|
|
|
89
|
+
if pat.match(x)
|
|
90
|
+
@program[$1] = $2
|
|
91
|
+
end
|
|
92
|
+
end
|
|
93
|
+
end
|
|
94
|
+
attr_reader :definition, :program
|
|
95
|
+
end
|
|
96
|
+
|
|
97
|
+
|
|
98
|
+
class Hit
|
|
99
|
+
def initialize(data)
|
|
100
|
+
score, query, target = data.split(/\n>/)
|
|
101
|
+
|
|
102
|
+
@definition, *score = score.split(/\n/)
|
|
103
|
+
@score = {}
|
|
104
|
+
|
|
105
|
+
pat = /;\s+([^:]+):\s+(.*)/
|
|
106
|
+
|
|
107
|
+
score.each do |x|
|
|
108
|
+
if pat.match(x)
|
|
109
|
+
@score[$1] = $2
|
|
110
|
+
end
|
|
111
|
+
end
|
|
112
|
+
|
|
113
|
+
@query = Query.new(query)
|
|
114
|
+
@target = Target.new(target)
|
|
115
|
+
end
|
|
116
|
+
attr_reader :definition, :score, :query, :target
|
|
117
|
+
|
|
118
|
+
def evalue
|
|
119
|
+
if @score['fa_expect']
|
|
120
|
+
@score['fa_expect'].to_f
|
|
121
|
+
elsif @score['sw_expect']
|
|
122
|
+
@score['sw_expect'].to_f
|
|
123
|
+
elsif @score['fx_expect']
|
|
124
|
+
@score['fx_expect'].to_f
|
|
125
|
+
elsif @score['tx_expect']
|
|
126
|
+
@score['tx_expect'].to_f
|
|
127
|
+
end
|
|
128
|
+
end
|
|
129
|
+
|
|
130
|
+
def bit_score
|
|
131
|
+
if @score['fa_bits']
|
|
132
|
+
@score['fa_bits'].to_f
|
|
133
|
+
elsif @score['sw_bits']
|
|
134
|
+
@score['sw_bits'].to_f
|
|
135
|
+
elsif @score['fx_bits']
|
|
136
|
+
@score['fx_bits'].to_f
|
|
137
|
+
elsif @score['tx_bits']
|
|
138
|
+
@score['tx_bits'].to_f
|
|
139
|
+
end
|
|
140
|
+
end
|
|
141
|
+
|
|
142
|
+
def direction
|
|
143
|
+
@score['fa_frame'] || @score['sw_frame'] || @score['fx_frame'] || @score['tx_frame']
|
|
144
|
+
end
|
|
145
|
+
|
|
146
|
+
def sw
|
|
147
|
+
@score['sw_score'].to_i
|
|
148
|
+
end
|
|
149
|
+
|
|
150
|
+
def identity
|
|
151
|
+
@score['sw_ident'].to_f
|
|
152
|
+
end
|
|
153
|
+
|
|
154
|
+
def overlap
|
|
155
|
+
@score['sw_overlap'].to_i
|
|
156
|
+
end
|
|
157
|
+
|
|
158
|
+
def query_id
|
|
159
|
+
@query.entry_id
|
|
160
|
+
end
|
|
161
|
+
|
|
162
|
+
def target_id
|
|
163
|
+
@target.entry_id
|
|
164
|
+
end
|
|
165
|
+
|
|
166
|
+
def query_def
|
|
167
|
+
@query.definition
|
|
168
|
+
end
|
|
169
|
+
|
|
170
|
+
def target_def
|
|
171
|
+
@target.definition
|
|
172
|
+
end
|
|
173
|
+
|
|
174
|
+
def query_len
|
|
175
|
+
@query.length
|
|
176
|
+
end
|
|
177
|
+
|
|
178
|
+
def target_len
|
|
179
|
+
@target.length
|
|
180
|
+
end
|
|
181
|
+
|
|
182
|
+
def query_seq
|
|
183
|
+
@query.sequence
|
|
184
|
+
end
|
|
185
|
+
|
|
186
|
+
def target_seq
|
|
187
|
+
@target.sequence
|
|
188
|
+
end
|
|
189
|
+
|
|
190
|
+
def query_type
|
|
191
|
+
@query.moltype
|
|
192
|
+
end
|
|
193
|
+
|
|
194
|
+
def target_type
|
|
195
|
+
@target.moltype
|
|
196
|
+
end
|
|
197
|
+
|
|
198
|
+
def query_start
|
|
199
|
+
@query.start
|
|
200
|
+
end
|
|
201
|
+
|
|
202
|
+
def query_end
|
|
203
|
+
@query.stop
|
|
204
|
+
end
|
|
205
|
+
|
|
206
|
+
def target_start
|
|
207
|
+
@target.start
|
|
208
|
+
end
|
|
209
|
+
|
|
210
|
+
def target_end
|
|
211
|
+
@target.stop
|
|
212
|
+
end
|
|
213
|
+
|
|
214
|
+
def lap_at
|
|
215
|
+
[ query_start, query_end, target_start, target_end ]
|
|
216
|
+
end
|
|
217
|
+
|
|
218
|
+
|
|
219
|
+
class Query
|
|
220
|
+
def initialize(data)
|
|
221
|
+
@definition, *data = data.split(/\n/)
|
|
222
|
+
@data = {}
|
|
223
|
+
@sequence = ''
|
|
224
|
+
|
|
225
|
+
pat = /;\s+([^:]+):\s+(.*)/
|
|
226
|
+
|
|
227
|
+
data.each do |x|
|
|
228
|
+
if pat.match(x)
|
|
229
|
+
@data[$1] = $2
|
|
230
|
+
else
|
|
231
|
+
@sequence += x
|
|
232
|
+
end
|
|
233
|
+
end
|
|
234
|
+
end
|
|
235
|
+
attr_reader :definition, :data, :sequence
|
|
236
|
+
|
|
237
|
+
def entry_id
|
|
238
|
+
@definition[/\S+/]
|
|
239
|
+
end
|
|
240
|
+
|
|
241
|
+
def length
|
|
242
|
+
@data['sq_len'].to_i
|
|
243
|
+
end
|
|
244
|
+
|
|
245
|
+
def moltype
|
|
246
|
+
@data['sq_type']
|
|
247
|
+
end
|
|
248
|
+
|
|
249
|
+
def start
|
|
250
|
+
@data['al_start'].to_i
|
|
251
|
+
end
|
|
252
|
+
|
|
253
|
+
def stop
|
|
254
|
+
@data['al_stop'].to_i
|
|
255
|
+
end
|
|
256
|
+
|
|
257
|
+
end
|
|
258
|
+
|
|
259
|
+
class Target < Query; end
|
|
260
|
+
end
|
|
261
|
+
|
|
262
|
+
end
|
|
263
|
+
|
|
264
|
+
end
|
|
265
|
+
end
|
|
266
|
+
|
|
267
|
+
|
|
268
|
+
if __FILE__ == $0
|
|
269
|
+
begin
|
|
270
|
+
require 'pp'
|
|
271
|
+
alias p pp
|
|
272
|
+
rescue
|
|
273
|
+
end
|
|
274
|
+
|
|
275
|
+
rep = Bio::Fasta::Report.new(ARGF.read)
|
|
276
|
+
p rep
|
|
277
|
+
|
|
278
|
+
end
|
|
279
|
+
|
|
280
|
+
|
|
281
|
+
=begin
|
|
282
|
+
|
|
283
|
+
= Bio::Fasta::Report
|
|
284
|
+
|
|
285
|
+
Summarized results of the fasta execution hits.
|
|
286
|
+
|
|
287
|
+
--- Bio::Fasta::Report.new(data)
|
|
288
|
+
--- Bio::Fasta::Report#each
|
|
289
|
+
|
|
290
|
+
Iterates on each Bio::Fasta::Report::Hit object.
|
|
291
|
+
|
|
292
|
+
--- Bio::Fasta::Report#hits
|
|
293
|
+
|
|
294
|
+
Returns an Array of Bio::Fasta::Report::Hit objects.
|
|
295
|
+
|
|
296
|
+
--- Bio::Fasta::Report#threshold(evalue_max = 0.1)
|
|
297
|
+
|
|
298
|
+
Returns an Array of Bio::Fasta::Report::Hit objects having
|
|
299
|
+
better evalue than 'evalue_max'.
|
|
300
|
+
|
|
301
|
+
--- Bio::Fasta::Report#lap_over(length_min = 0)
|
|
302
|
+
|
|
303
|
+
Returns an Array of Bio::Fasta::Report::Hit objects having
|
|
304
|
+
longer overlap length than 'length_min'.
|
|
305
|
+
|
|
306
|
+
--- Bio::Fasta::Report#program
|
|
307
|
+
|
|
308
|
+
Returns a Bio::Fasta::Report::Program object.
|
|
309
|
+
|
|
310
|
+
--- Bio::Fasta::Report#list
|
|
311
|
+
|
|
312
|
+
Returns the 'The best scores are' lines as a String.
|
|
313
|
+
|
|
314
|
+
--- Bio::Fasta::Report#log
|
|
315
|
+
|
|
316
|
+
Returns the trailing lines including library size, execution date,
|
|
317
|
+
fasta function used, and fasta versions as a String.
|
|
318
|
+
|
|
319
|
+
|
|
320
|
+
== Bio::Fasta::Report::Program
|
|
321
|
+
|
|
322
|
+
Log of the fasta execution environments.
|
|
323
|
+
|
|
324
|
+
--- Bio::Fasta::Report::Program#definition
|
|
325
|
+
|
|
326
|
+
Returns a String containing query and library filenames.
|
|
327
|
+
|
|
328
|
+
--- Bio::Fasta::Report::Program#program
|
|
329
|
+
|
|
330
|
+
Accessor for a Hash containing 'mp_name', 'mp_ver', 'mp_argv',
|
|
331
|
+
'pg_name', 'pg_ver, 'pg_matrix', 'pg_gap-pen', 'pg_ktup',
|
|
332
|
+
'pg_optcut', 'pg_cgap', 'mp_extrap', 'mp_stats', and 'mp_KS' values.
|
|
333
|
+
|
|
334
|
+
|
|
335
|
+
== Bio::Fasta::Report::Hit
|
|
336
|
+
|
|
337
|
+
--- Bio::Fasta::Report::Hit#definition
|
|
338
|
+
--- Bio::Fasta::Report::Hit#score
|
|
339
|
+
--- Bio::Fasta::Report::Hit#query
|
|
340
|
+
--- Bio::Fasta::Report::Hit#target
|
|
341
|
+
|
|
342
|
+
Accessors for the internal structures.
|
|
343
|
+
|
|
344
|
+
--- Bio::Fasta::Report::Hit#evalue
|
|
345
|
+
--- Bio::Fasta::Report::Hit#bit_score
|
|
346
|
+
--- Bio::Fasta::Report::Hit#sw
|
|
347
|
+
--- Bio::Fasta::Report::Hit#identity
|
|
348
|
+
|
|
349
|
+
Matching scores.
|
|
350
|
+
|
|
351
|
+
--- Bio::Fasta::Report::Hit#query_id
|
|
352
|
+
--- Bio::Fasta::Report::Hit#query_def
|
|
353
|
+
--- Bio::Fasta::Report::Hit#query_len
|
|
354
|
+
--- Bio::Fasta::Report::Hit#query_seq
|
|
355
|
+
--- Bio::Fasta::Report::Hit#query_type
|
|
356
|
+
--- Bio::Fasta::Report::Hit#target_id
|
|
357
|
+
--- Bio::Fasta::Report::Hit#target_def
|
|
358
|
+
--- Bio::Fasta::Report::Hit#target_len
|
|
359
|
+
--- Bio::Fasta::Report::Hit#target_seq
|
|
360
|
+
--- Bio::Fasta::Report::Hit#target_type
|
|
361
|
+
|
|
362
|
+
Matching subjects.
|
|
363
|
+
Shortcuts for the methods of Hit::Query and the Hit::Target.
|
|
364
|
+
|
|
365
|
+
--- Bio::Fasta::Report::Hit#query_start
|
|
366
|
+
--- Bio::Fasta::Report::Hit#query_end
|
|
367
|
+
--- Bio::Fasta::Report::Hit#target_start
|
|
368
|
+
--- Bio::Fasta::Report::Hit#target_end
|
|
369
|
+
--- Bio::Fasta::Report::Hit#overlap
|
|
370
|
+
--- Bio::Fasta::Report::Hit#lap_at
|
|
371
|
+
--- Bio::Fasta::Report::Hit#direction
|
|
372
|
+
|
|
373
|
+
Matching regions.
|
|
374
|
+
|
|
375
|
+
|
|
376
|
+
== Bio::Fasta::Report::Hit::Query
|
|
377
|
+
|
|
378
|
+
--- Bio::Fasta::Report::Hit::Query#entry_id
|
|
379
|
+
|
|
380
|
+
Returns the first word in the definition as a String.
|
|
381
|
+
You can get this value by Report::Hit#query_id method.
|
|
382
|
+
|
|
383
|
+
--- Bio::Fasta::Report::Hit::Query#definition
|
|
384
|
+
|
|
385
|
+
Returns the definition of the entry as a String.
|
|
386
|
+
You can access this value by Report::Hit#query_def method.
|
|
387
|
+
|
|
388
|
+
--- Bio::Fasta::Report::Hit::Query#sequence
|
|
389
|
+
|
|
390
|
+
Returns the sequence (with gaps) as a String.
|
|
391
|
+
You can access this value by the Report::Hit#query_seq method.
|
|
392
|
+
|
|
393
|
+
--- Bio::Fasta::Report::Hit::Query#length
|
|
394
|
+
|
|
395
|
+
Returns the sequence length.
|
|
396
|
+
You can access this value by the Report::Hit#query_len method.
|
|
397
|
+
|
|
398
|
+
--- Bio::Fasta::Report::Hit::Query#moltype
|
|
399
|
+
|
|
400
|
+
Returns 'p' for protein sequence, 'D' for nucleotide sequence.
|
|
401
|
+
|
|
402
|
+
--- Bio::Fasta::Report::Hit::Query#start
|
|
403
|
+
--- Bio::Fasta::Report::Hit::Query#stop
|
|
404
|
+
|
|
405
|
+
Returns alignment start and stop position.
|
|
406
|
+
You can access these values by Report::Hit#query_start and
|
|
407
|
+
Report::Hit#query_end methods.
|
|
408
|
+
|
|
409
|
+
--- Bio::Fasta::Report::Hit::Query#data
|
|
410
|
+
|
|
411
|
+
Returns a Hash containing 'sq_len', 'sq_offset', 'sq_type',
|
|
412
|
+
'al_start', 'al_stop', and 'al_display_start' values.
|
|
413
|
+
You can access most of these values by Report::Hit#query_* methods.
|
|
414
|
+
|
|
415
|
+
|
|
416
|
+
== Bio::Fasta::Report::Hit::Target
|
|
417
|
+
|
|
418
|
+
--- Bio::Fasta::Report::Hit::Target#entry_id
|
|
419
|
+
--- Bio::Fasta::Report::Hit::Target#definition
|
|
420
|
+
--- Bio::Fasta::Report::Hit::Target#data
|
|
421
|
+
--- Bio::Fasta::Report::Hit::Target#sequence
|
|
422
|
+
--- Bio::Fasta::Report::Hit::Target#length
|
|
423
|
+
--- Bio::Fasta::Report::Hit::Target#start
|
|
424
|
+
--- Bio::Fasta::Report::Hit::Target#stop
|
|
425
|
+
|
|
426
|
+
Same as Bio::Fasta::Report::Hit::Query but for Target.
|
|
427
|
+
|
|
428
|
+
=end
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
#
|
|
2
|
+
# bio/appl/fasta/format6.rb - FASTA output (-m 6) parser
|
|
3
|
+
#
|
|
4
|
+
# Copyright (C) 2002 KATAYAMA Toshiaki <k@bioruby.org>
|
|
5
|
+
#
|
|
6
|
+
# This library is free software; you can redistribute it and/or
|
|
7
|
+
# modify it under the terms of the GNU Lesser General Public
|
|
8
|
+
# License as published by the Free Software Foundation; either
|
|
9
|
+
# version 2 of the License, or (at your option) any later version.
|
|
10
|
+
#
|
|
11
|
+
# This library is distributed in the hope that it will be useful,
|
|
12
|
+
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
13
|
+
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
14
|
+
# Lesser General Public License for more details.
|
|
15
|
+
#
|
|
16
|
+
# You should have received a copy of the GNU Lesser General Public
|
|
17
|
+
# License along with this library; if not, write to the Free Software
|
|
18
|
+
# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
19
|
+
#
|
|
20
|
+
# $Id: format6.rb,v 1.2 2005/09/08 01:22:09 k Exp $
|
|
21
|
+
#
|
|
22
|
+
|
|
23
|
+
module Bio
|
|
24
|
+
class Fasta
|
|
25
|
+
|
|
26
|
+
class Report
|
|
27
|
+
|
|
28
|
+
# will be ported from sample/{fasta2tab,ssearch2tab,tfastx2tab}.rb
|
|
29
|
+
|
|
30
|
+
def initialize
|
|
31
|
+
raise NotImplementedError
|
|
32
|
+
end
|
|
33
|
+
end
|
|
34
|
+
|
|
35
|
+
end
|
|
36
|
+
end
|
|
37
|
+
|