bio 0.7.1 → 1.0.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (142) hide show
  1. data/bin/bioruby +71 -27
  2. data/bin/br_biofetch.rb +5 -17
  3. data/bin/br_bioflat.rb +14 -26
  4. data/bin/br_biogetseq.rb +6 -18
  5. data/bin/br_pmfetch.rb +6 -16
  6. data/doc/Changes-0.7.rd +35 -0
  7. data/doc/KEGG_API.rd +287 -172
  8. data/doc/KEGG_API.rd.ja +273 -160
  9. data/doc/Tutorial.rd +18 -9
  10. data/doc/Tutorial.rd.ja +656 -138
  11. data/lib/bio.rb +6 -24
  12. data/lib/bio/alignment.rb +5 -5
  13. data/lib/bio/appl/blast.rb +132 -98
  14. data/lib/bio/appl/blast/format0.rb +9 -19
  15. data/lib/bio/appl/blast/wublast.rb +5 -18
  16. data/lib/bio/appl/emboss.rb +40 -47
  17. data/lib/bio/appl/hmmer.rb +116 -82
  18. data/lib/bio/appl/hmmer/report.rb +509 -364
  19. data/lib/bio/appl/spidey/report.rb +7 -18
  20. data/lib/bio/data/na.rb +3 -21
  21. data/lib/bio/db.rb +3 -21
  22. data/lib/bio/db/aaindex.rb +147 -52
  23. data/lib/bio/db/embl/common.rb +27 -6
  24. data/lib/bio/db/embl/embl.rb +18 -10
  25. data/lib/bio/db/embl/sptr.rb +87 -67
  26. data/lib/bio/db/embl/swissprot.rb +32 -3
  27. data/lib/bio/db/embl/trembl.rb +32 -3
  28. data/lib/bio/db/embl/uniprot.rb +32 -3
  29. data/lib/bio/db/fasta.rb +327 -289
  30. data/lib/bio/db/medline.rb +25 -4
  31. data/lib/bio/db/nbrf.rb +12 -20
  32. data/lib/bio/db/pdb.rb +4 -1
  33. data/lib/bio/db/pdb/chemicalcomponent.rb +240 -0
  34. data/lib/bio/db/pdb/pdb.rb +13 -8
  35. data/lib/bio/db/rebase.rb +93 -97
  36. data/lib/bio/feature.rb +2 -31
  37. data/lib/bio/io/ddbjxml.rb +167 -139
  38. data/lib/bio/io/fastacmd.rb +89 -56
  39. data/lib/bio/io/flatfile.rb +994 -278
  40. data/lib/bio/io/flatfile/index.rb +257 -194
  41. data/lib/bio/io/flatfile/indexer.rb +37 -29
  42. data/lib/bio/reference.rb +147 -64
  43. data/lib/bio/sequence.rb +57 -417
  44. data/lib/bio/sequence/aa.rb +64 -0
  45. data/lib/bio/sequence/common.rb +175 -0
  46. data/lib/bio/sequence/compat.rb +68 -0
  47. data/lib/bio/sequence/format.rb +134 -0
  48. data/lib/bio/sequence/generic.rb +24 -0
  49. data/lib/bio/sequence/na.rb +189 -0
  50. data/lib/bio/shell.rb +9 -23
  51. data/lib/bio/shell/core.rb +130 -125
  52. data/lib/bio/shell/demo.rb +143 -0
  53. data/lib/bio/shell/{session.rb → interface.rb} +42 -40
  54. data/lib/bio/shell/object.rb +52 -0
  55. data/lib/bio/shell/plugin/codon.rb +4 -22
  56. data/lib/bio/shell/plugin/emboss.rb +23 -0
  57. data/lib/bio/shell/plugin/entry.rb +34 -25
  58. data/lib/bio/shell/plugin/flatfile.rb +5 -23
  59. data/lib/bio/shell/plugin/keggapi.rb +11 -24
  60. data/lib/bio/shell/plugin/midi.rb +5 -23
  61. data/lib/bio/shell/plugin/obda.rb +4 -22
  62. data/lib/bio/shell/plugin/seq.rb +6 -24
  63. data/lib/bio/shell/rails/Rakefile +10 -0
  64. data/lib/bio/shell/rails/app/controllers/application.rb +4 -0
  65. data/lib/bio/shell/rails/app/controllers/shell_controller.rb +94 -0
  66. data/lib/bio/shell/rails/app/helpers/application_helper.rb +3 -0
  67. data/lib/bio/shell/rails/app/models/shell_connection.rb +30 -0
  68. data/lib/bio/shell/rails/app/views/layouts/shell.rhtml +37 -0
  69. data/lib/bio/shell/rails/app/views/shell/history.rhtml +5 -0
  70. data/lib/bio/shell/rails/app/views/shell/index.rhtml +2 -0
  71. data/lib/bio/shell/rails/app/views/shell/show.rhtml +13 -0
  72. data/lib/bio/shell/rails/config/boot.rb +19 -0
  73. data/lib/bio/shell/rails/config/database.yml +85 -0
  74. data/lib/bio/shell/rails/config/environment.rb +53 -0
  75. data/lib/bio/shell/rails/config/environments/development.rb +19 -0
  76. data/lib/bio/shell/rails/config/environments/production.rb +19 -0
  77. data/lib/bio/shell/rails/config/environments/test.rb +19 -0
  78. data/lib/bio/shell/rails/config/routes.rb +19 -0
  79. data/lib/bio/shell/rails/doc/README_FOR_APP +2 -0
  80. data/lib/bio/shell/rails/public/404.html +8 -0
  81. data/lib/bio/shell/rails/public/500.html +8 -0
  82. data/lib/bio/shell/rails/public/dispatch.cgi +10 -0
  83. data/lib/bio/shell/rails/public/dispatch.fcgi +24 -0
  84. data/lib/bio/shell/rails/public/dispatch.rb +10 -0
  85. data/lib/bio/shell/rails/public/favicon.ico +0 -0
  86. data/lib/bio/shell/rails/public/images/icon.png +0 -0
  87. data/lib/bio/shell/rails/public/images/rails.png +0 -0
  88. data/lib/bio/shell/rails/public/index.html +277 -0
  89. data/lib/bio/shell/rails/public/javascripts/controls.js +750 -0
  90. data/lib/bio/shell/rails/public/javascripts/dragdrop.js +584 -0
  91. data/lib/bio/shell/rails/public/javascripts/effects.js +854 -0
  92. data/lib/bio/shell/rails/public/javascripts/prototype.js +1785 -0
  93. data/lib/bio/shell/rails/public/robots.txt +1 -0
  94. data/lib/bio/shell/rails/public/stylesheets/main.css +187 -0
  95. data/lib/bio/shell/rails/script/about +3 -0
  96. data/lib/bio/shell/rails/script/breakpointer +3 -0
  97. data/lib/bio/shell/rails/script/console +3 -0
  98. data/lib/bio/shell/rails/script/destroy +3 -0
  99. data/lib/bio/shell/rails/script/generate +3 -0
  100. data/lib/bio/shell/rails/script/performance/benchmarker +3 -0
  101. data/lib/bio/shell/rails/script/performance/profiler +3 -0
  102. data/lib/bio/shell/rails/script/plugin +3 -0
  103. data/lib/bio/shell/rails/script/process/reaper +3 -0
  104. data/lib/bio/shell/rails/script/process/spawner +3 -0
  105. data/lib/bio/shell/rails/script/process/spinner +3 -0
  106. data/lib/bio/shell/rails/script/runner +3 -0
  107. data/lib/bio/shell/rails/script/server +42 -0
  108. data/lib/bio/shell/rails/test/test_helper.rb +28 -0
  109. data/lib/bio/shell/web.rb +90 -0
  110. data/lib/bio/util/contingency_table.rb +231 -225
  111. data/sample/any2fasta.rb +59 -0
  112. data/test/data/HMMER/hmmpfam.out +64 -0
  113. data/test/data/HMMER/hmmsearch.out +88 -0
  114. data/test/data/aaindex/DAYM780301 +30 -0
  115. data/test/data/aaindex/PRAM900102 +20 -0
  116. data/test/data/bl2seq/cd8a_cd8b_blastp.bl2seq +53 -0
  117. data/test/data/bl2seq/cd8a_p53_e-5blastp.bl2seq +37 -0
  118. data/test/data/blast/{eco:b0002.faa → b0002.faa} +0 -0
  119. data/test/data/blast/{eco:b0002.faa.m0 → b0002.faa.m0} +2 -2
  120. data/test/data/blast/{eco:b0002.faa.m7 → b0002.faa.m7} +1 -1
  121. data/test/data/blast/{eco:b0002.faa.m8 → b0002.faa.m8} +0 -0
  122. data/test/unit/bio/appl/bl2seq/test_report.rb +134 -0
  123. data/test/unit/bio/appl/blast/test_report.rb +15 -12
  124. data/test/unit/bio/appl/blast/test_xmlparser.rb +4 -4
  125. data/test/unit/bio/appl/hmmer/test_report.rb +355 -0
  126. data/test/unit/bio/appl/test_blast.rb +5 -5
  127. data/test/unit/bio/data/test_na.rb +9 -18
  128. data/test/unit/bio/db/pdb/test_pdb.rb +169 -0
  129. data/test/unit/bio/db/test_aaindex.rb +197 -0
  130. data/test/unit/bio/io/test_fastacmd.rb +55 -0
  131. data/test/unit/bio/sequence/test_aa.rb +102 -0
  132. data/test/unit/bio/sequence/test_common.rb +178 -0
  133. data/test/unit/bio/sequence/test_compat.rb +82 -0
  134. data/test/unit/bio/sequence/test_na.rb +242 -0
  135. data/test/unit/bio/shell/plugin/test_seq.rb +29 -19
  136. data/test/unit/bio/test_alignment.rb +15 -7
  137. data/test/unit/bio/test_reference.rb +198 -0
  138. data/test/unit/bio/test_sequence.rb +4 -49
  139. data/test/unit/bio/test_shell.rb +2 -2
  140. metadata +118 -15
  141. data/lib/bio/io/brdb.rb +0 -103
  142. data/lib/bioruby.rb +0 -34
@@ -1,7 +1,26 @@
1
1
  #
2
- # bio/db/medline.rb - NCBI PubMed/MEDLINE database class
2
+ # = bio/db/medline.rb - NCBI PubMed/MEDLINE database class
3
3
  #
4
- # Copyright (C) 2001, 2005 KATAYAMA Toshiaki <k@bioruby.org>
4
+ # Copyright:: Copyright (C) 2001, 2005
5
+ # KATAYAMA Toshiaki <k@bioruby.org>
6
+ # License:: LGPL
7
+ #
8
+ # == Description
9
+ #
10
+ # NCBI PubMed/MEDLINE database class.
11
+ #
12
+ # == Examples
13
+ #
14
+ # medline = Bio::MEDLINE.new(txt)
15
+ # medline.reference
16
+ # medline.pmid == medline.entry_id
17
+ # medilne.mesh
18
+ #
19
+ # == References
20
+ #
21
+ # $Id: medline.rb,v 1.13 2006/02/18 15:03:47 nakao Exp $
22
+ #
23
+ #++
5
24
  #
6
25
  # This library is free software; you can redistribute it and/or
7
26
  # modify it under the terms of the GNU Lesser General Public
@@ -17,15 +36,17 @@
17
36
  # License along with this library; if not, write to the Free Software
18
37
  # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19
38
  #
20
- # $Id: medline.rb,v 1.12 2005/09/08 01:22:11 k Exp $
39
+ #--
21
40
  #
22
41
 
23
42
  require 'bio/db'
24
43
 
25
44
  module Bio
26
45
 
46
+ # NCBI PubMed/MEDLINE database class.
27
47
  class MEDLINE < NCBIDB
28
48
 
49
+ #
29
50
  def initialize(entry)
30
51
  @pubmed = Hash.new('')
31
52
 
@@ -39,7 +60,7 @@ module Bio
39
60
  end
40
61
 
41
62
 
42
- # Reference object
63
+ # returns a Reference object.
43
64
  def reference
44
65
  hash = Hash.new('')
45
66
 
@@ -1,27 +1,11 @@
1
1
  #
2
2
  # = bio/db/nbrf.rb - NBRF/PIR format sequence data class
3
3
  #
4
- # Copyright:: Copyright (C) 2001-2003 GOTO Naohisa <ngoto@gen-info.osaka-u.ac.jp>
4
+ # Copyright:: Copyright (C) 2001-2003,2006 Naohisa Goto <ng@bioruby.org>
5
5
  # Copyright (C) 2001-2002 KATAYAMA Toshiaki <k@bioruby.org>
6
- # License:: LGPL
6
+ # License:: Ruby's
7
7
  #
8
- #--
9
- # This library is free software; you can redistribute it and/or
10
- # modify it under the terms of the GNU Lesser General Public
11
- # License as published by the Free Software Foundation; either
12
- # version 2 of the License, or (at your option) any later version.
13
- #
14
- # This library is distributed in the hope that it will be useful,
15
- # but WITHOUT ANY WARRANTY; without even the implied warranty of
16
- # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
17
- # Lesser General Public License for more details.
18
- #
19
- # You should have received a copy of the GNU Lesser General Public
20
- # License along with this library; if not, write to the Free Software
21
- # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
22
- #++
23
- #
24
- # $Id: nbrf.rb,v 1.7 2005/12/18 15:58:41 k Exp $
8
+ # $Id: nbrf.rb,v 1.8 2006/02/22 08:43:15 ngoto Exp $
25
9
  #
26
10
  # Sequence data class for NBRF/PIR flatfile format.
27
11
  #
@@ -44,7 +28,15 @@ module Bio
44
28
  #++
45
29
 
46
30
  # Delimiter of each entry. Bio::FlatFile uses it.
47
- DELIMITER = RS = "*\n"
31
+ DELIMITER = RS = "\n>"
32
+
33
+ # (Integer) excess read size included in DELIMITER.
34
+ DELIMITER_OVERRUN = 1 # '>'
35
+
36
+ #--
37
+ # Note: DELIMITER is changed due to the change of Bio::FlatFile.
38
+ # DELIMITER = RS = "*\n"
39
+ #++
48
40
 
49
41
  # Creates a new NBRF object. It stores the comment and sequence
50
42
  # information from one entry of the NBRF/PIR format string.
@@ -17,7 +17,7 @@
17
17
  # License along with this library; if not, write to the Free Software
18
18
  # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
19
19
  #
20
- # $Id: pdb.rb,v 1.5 2005/12/16 19:23:03 ngoto Exp $
20
+ # $Id: pdb.rb,v 1.6 2006/01/29 06:54:13 ngoto Exp $
21
21
  #
22
22
 
23
23
  require 'bio/db'
@@ -25,6 +25,9 @@ require 'bio/db'
25
25
  # definition of the PDB class
26
26
  module Bio
27
27
  class PDB #< DB
28
+
29
+ autoload :ChemicalComponent, 'bio/db/pdb/chemicalcomponent'
30
+
28
31
  end #class PDB
29
32
  end #module Bio
30
33
 
@@ -0,0 +1,240 @@
1
+ #
2
+ # = bio/db/pdb/chemicalcomponent.rb - PDB Chemical Component Dictionary parser
3
+ #
4
+ # Copyright:: Copyright (C) 2006
5
+ # GOTO Naohisa <ngoto@gen-info.osaka-u.ac.jp>
6
+ # License:: LGPL
7
+ #
8
+ # $Id: chemicalcomponent.rb,v 1.1 2006/01/29 06:54:13 ngoto Exp $
9
+ #
10
+ #--
11
+ # This library is free software; you can redistribute it and/or
12
+ # modify it under the terms of the GNU Lesser General Public
13
+ # License as published by the Free Software Foundation; either
14
+ # version 2 of the License, or (at your option) any later version.
15
+ #
16
+ # This library is distributed in the hope that it will be useful,
17
+ # but WITHOUT ANY WARRANTY; without even the implied warranty of
18
+ # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
19
+ # Lesser General Public License for more details.
20
+ #
21
+ # You should have received a copy of the GNU Lesser General Public
22
+ # License along with this library; if not, write to the Free Software
23
+ # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
24
+ #++
25
+ #
26
+ # = About Bio::PDB::ChemicalComponent
27
+ #
28
+ # Please refer Bio::PDB::ChemicalComponent.
29
+ #
30
+ # = References
31
+ #
32
+ # * ((<URL:http://deposit.pdb.org/cc_dict_tut.html>))
33
+ # * http://deposit.pdb.org/het_dictionary.txt
34
+ #
35
+
36
+ require 'bio/db/pdb/pdb'
37
+
38
+ module Bio
39
+ class PDB
40
+
41
+ # Bio::PDB::ChemicalComponet is a parser for a entry of
42
+ # the PDB Chemical Component Dictionary.
43
+ #
44
+ # The PDB Chemical Component Dictionary is available in
45
+ # http://deposit.pdb.org/het_dictionary.txt
46
+ class ChemicalComponent
47
+
48
+ # delimiter for reading via Bio::FlatFile
49
+ DELIMITER = RS = "\n\n"
50
+
51
+ # Single field (normally single line) of a entry
52
+ class Record < Bio::PDB::Record
53
+
54
+ # fetches record name
55
+ def fetch_record_name(str)
56
+ str[0..6].strip
57
+ end
58
+ private :fetch_record_name
59
+
60
+ # fetches record name
61
+ def self.fetch_record_name(str)
62
+ str[0..6].strip
63
+ end
64
+ private_class_method :fetch_record_name
65
+
66
+ # RESIDUE field.
67
+ # It would be wrong because the definition described in documents
68
+ # seems ambiguous.
69
+ RESIDUE =
70
+ def_rec([ 11, 13, Pdb_LString[3], :hetID ],
71
+ [ 16, 20, Pdb_Integer, :numHetAtoms ]
72
+ )
73
+
74
+ # CONECT field
75
+ # It would be wrong because the definition described in documents
76
+ # seems ambiguous.
77
+ CONECT =
78
+ def_rec([ 12, 15, Pdb_Atom, :name ],
79
+ [ 19, 20, Pdb_Integer, :num ],
80
+ [ 21, 24, Pdb_Atom, :other_atoms ],
81
+ [ 26, 29, Pdb_Atom, :other_atoms ],
82
+ [ 31, 34, Pdb_Atom, :other_atoms ],
83
+ [ 36, 39, Pdb_Atom, :other_atoms ],
84
+ [ 41, 44, Pdb_Atom, :other_atoms ],
85
+ [ 46, 49, Pdb_Atom, :other_atoms ],
86
+ [ 51, 54, Pdb_Atom, :other_atoms ],
87
+ [ 56, 59, Pdb_Atom, :other_atoms ],
88
+ [ 61, 64, Pdb_Atom, :other_atoms ],
89
+ [ 66, 69, Pdb_Atom, :other_atoms ],
90
+ [ 71, 74, Pdb_Atom, :other_atoms ],
91
+ [ 76, 79, Pdb_Atom, :other_atoms ]
92
+ )
93
+
94
+ # HET field.
95
+ # It is the same as Bio::PDB::Record::HET.
96
+ HET = Bio::PDB::Record::HET
97
+
98
+ #--
99
+ #HETSYN = Bio::PDB::Record::HETSYN
100
+ #++
101
+
102
+ # HETSYN field.
103
+ # It is very similar to Bio::PDB::Record::HETSYN.
104
+ HETSYN =
105
+ def_rec([ 9, 10, Pdb_Continuation, nil ],
106
+ [ 12, 14, Pdb_LString(3), :hetID ],
107
+ [ 16, 70, Pdb_String, :hetSynonyms ]
108
+ )
109
+
110
+ # HETNAM field.
111
+ # It is the same as Bio::PDB::Record::HETNAM.
112
+ HETNAM = Bio::PDB::Record::HETNAM
113
+
114
+ # FORMUL field.
115
+ # It is the same as Bio::PDB::Record::FORMUL.
116
+ FORMUL = Bio::PDB::Record::FORMUL
117
+
118
+ # default definition for unknown fields.
119
+ Default = Bio::PDB::Record::Default
120
+
121
+ # Hash to store allowed definitions.
122
+ Definition = create_definition_hash
123
+
124
+ # END record class.
125
+ #
126
+ # Because END is a reserved word of Ruby, it is separately
127
+ # added to the hash
128
+ End = Bio::PDB::Record::End
129
+ Definition['END'] = End
130
+
131
+ # Look up the class in Definition hash
132
+ def self.get_record_class(str)
133
+ t = fetch_record_name(str)
134
+ return Definition[t]
135
+ end
136
+ end #class Record
137
+
138
+ # Creates a new object.
139
+ def initialize(str)
140
+ @data = str.split(/[\r\n]+/)
141
+ @hash = {}
142
+
143
+ #Flag to say whether the current line is part of a continuation
144
+ cont = false
145
+
146
+ #Goes through each line and replace that line with a PDB::Record
147
+ @data.collect! do |line|
148
+ #Go to next if the previous line was contiunation able, and
149
+ #add_continuation returns true. Line is added by add_continuation
150
+ next if cont and cont = cont.add_continuation(line)
151
+
152
+ #Make the new record
153
+ f = Record.get_record_class(line).new.initialize_from_string(line)
154
+ #p f
155
+ #Set cont
156
+ cont = f if f.continue?
157
+ #Set the hash to point to this record either by adding to an
158
+ #array, or on it's own
159
+ key = f.record_name
160
+ if a = @hash[key] then
161
+ a << f
162
+ else
163
+ @hash[key] = [ f ]
164
+ end
165
+ f
166
+ end #each
167
+ #At the end we need to add the final model
168
+ @data.compact!
169
+ end
170
+
171
+ # all records in this entry as an array.
172
+ attr_reader :data
173
+
174
+ # all records in this entry as an hash accessed by record names.
175
+ attr_reader :hash
176
+
177
+ # Identifier written in the first line "RESIDUE" record. (e.g. CMP)
178
+ def entry_id
179
+ @data[0].hetID
180
+ end
181
+
182
+ # Synonyms for the comical component. Returns an array of strings.
183
+ def hetsyn
184
+ unless defined? @hetsyn
185
+ if r = @hash["HETSYN"]
186
+ @hetsyn = r[0].hetSynonyms.to_s.split(/\;\s*/)
187
+ else
188
+ return []
189
+ end
190
+ end
191
+ @hetsyn
192
+ end
193
+
194
+ # The name of the chemical component.
195
+ # Returns a string (or nil, if the entry is something wrong).
196
+ def hetnam
197
+ @hash["HETNAM"][0].text
198
+ end
199
+
200
+ # The chemical formula of the chemical component.
201
+ # Returns a string (or nil, if the entry is something wrong).
202
+ def formul
203
+ @hash["FORMUL"][0].text
204
+ end
205
+
206
+ # Returns an hash of bindings of atoms.
207
+ # Note that each white spaces are stripped for atom symbols.
208
+ def conect
209
+ unless defined? @conect
210
+ c = {}
211
+ @hash["CONECT"].each do |e|
212
+ key = e.name.to_s.strip
213
+ unless key.empty?
214
+ val = e.other_atoms.collect { |x| x.strip }
215
+ #warn "Warning: #{key}: atom name conflict?" if c[key]
216
+ c[key] = val
217
+ end
218
+ end
219
+ @conect = c
220
+ end
221
+ @conect
222
+ end
223
+
224
+ # Gets all records whose record type is _name_.
225
+ # Returns an array of <code>Bio::PDB::Record::*</code> objects.
226
+ #
227
+ # if _name_ is nil, returns hash storing all record data.
228
+ #
229
+ # Example:
230
+ # p pdb.record('CONECT')
231
+ # p pdb.record['CONECT']
232
+ #
233
+ def record(name = nil)
234
+ name ? @hash[name] : @hash
235
+ end
236
+
237
+ end #class ChemicalComponent
238
+ end #class PDB
239
+ end #module Bio
240
+
@@ -6,7 +6,7 @@
6
6
  # Alex Gutteridge <alexg@ebi.ac.uk>
7
7
  # License:: LGPL
8
8
  #
9
- # $Id: pdb.rb,v 1.13 2006/01/20 13:54:08 ngoto Exp $
9
+ # $Id: pdb.rb,v 1.15 2006/02/20 13:00:43 ngoto Exp $
10
10
  #
11
11
  #--
12
12
  # This library is free software; you can redistribute it and/or
@@ -86,19 +86,19 @@ module Bio
86
86
 
87
87
  module Pdb_SList
88
88
  def self.new(str)
89
- str.strip.split(/\;\s*/)
89
+ str.to_s.strip.split(/\;\s*/)
90
90
  end
91
91
  end
92
92
 
93
93
  module Pdb_List
94
94
  def self.new(str)
95
- str.strip.split(/\,\s*/)
95
+ str.to_s.strip.split(/\,\s*/)
96
96
  end
97
97
  end
98
98
 
99
99
  module Pdb_Specification_list
100
100
  def self.new(str)
101
- a = str.strip.split(/\;\s*/)
101
+ a = str.to_s.strip.split(/\;\s*/)
102
102
  a.collect! { |x| x.split(/\:\s*/, 2) }
103
103
  a
104
104
  end
@@ -106,7 +106,7 @@ module Bio
106
106
 
107
107
  module Pdb_String
108
108
  def self.new(str)
109
- str.gsub(/\s+\z/, '')
109
+ str.to_s.gsub(/\s+\z/, '')
110
110
  end
111
111
 
112
112
  #Creates a new module with a string left justified to the
@@ -116,7 +116,7 @@ module Bio
116
116
  m.module_eval %Q{
117
117
  @@nn = nn
118
118
  def self.new(str)
119
- str.gsub(/\s+\z/, '').ljust(@@nn)[0, @@nn]
119
+ str.to_s.gsub(/\s+\z/, '').ljust(@@nn)[0, @@nn]
120
120
  end
121
121
  }
122
122
  m
@@ -129,7 +129,7 @@ module Bio
129
129
  m.module_eval %Q{
130
130
  @@nn = nn
131
131
  def self.new(str)
132
- str.ljust(@@nn)[0, @@nn]
132
+ str.to_s.ljust(@@nn)[0, @@nn]
133
133
  end
134
134
  }
135
135
  m
@@ -157,7 +157,7 @@ module Bio
157
157
 
158
158
  module Pdb_StringRJ
159
159
  def self.new(str)
160
- str.gsub(/\A\s+/, '')
160
+ str.to_s.gsub(/\A\s+/, '')
161
161
  end
162
162
  end
163
163
 
@@ -1807,6 +1807,11 @@ module Bio
1807
1807
  self.record('HEADER').first.classification
1808
1808
  end
1809
1809
 
1810
+ # Get authors in "AUTHOR".
1811
+ def authors
1812
+ self.record('AUTHOR').first.authorList
1813
+ end
1814
+
1810
1815
  #--
1811
1816
  # Bio::DB methods
1812
1817
  #++
@@ -1,15 +1,99 @@
1
- require 'bio/reference'
2
- module Bio
3
-
4
1
  #
5
- # bio/db/rebase.rb - Interface for EMBOSS formatted REBASE files
2
+ # = bio/db/rebase.rb - Interface for EMBOSS formatted REBASE files
6
3
  #
7
4
  # Copyright:: Copyright (C) 2005 Trevor Wennblom <trevor@corevx.com>
8
5
  # License:: LGPL
9
6
  #
10
- # $Id: rebase.rb,v 1.2 2005/12/13 15:02:41 trevor Exp $
7
+ # $Id: rebase.rb,v 1.3 2006/02/27 13:22:05 k Exp $
11
8
  #
12
9
  #
10
+ # == Synopsis
11
+ #
12
+ # Bio::REBASE provides utilties for interacting with REBASE data in EMBOSS
13
+ # format. REBASE is the Restriction Enzyme Database, more information
14
+ # can be found here:
15
+ #
16
+
17
+ # * http://rebase.neb.com
18
+ #
19
+ # EMBOSS formatted files located at:
20
+ #
21
+ # * http://rebase.neb.com/rebase/rebase.f37.html
22
+ #
23
+ # These files are the same as the "emboss_?.???" files located at:
24
+ #
25
+ # * ftp://ftp.neb.com/pub/rebase/
26
+ #
27
+ # To easily get started with the data you can simply type this command
28
+ # at your shell prompt:
29
+ #
30
+ # % wget ftp://ftp.neb.com/pub/rebase/emboss*
31
+ #
32
+ #
33
+ # == Usage
34
+ #
35
+ # require 'bio/db/rebase'
36
+ # require 'pp'
37
+ #
38
+ # enz = File.read('emboss_e')
39
+ # ref = File.read('emboss_r')
40
+ # sup = File.read('emboss_s')
41
+ #
42
+ # # When creating a new instance of Bio::REBASE
43
+ # # the contents of the enzyme file must be passed.
44
+ # # The references and suppiers file contents
45
+ # # may also be passed.
46
+ # rebase = Bio::REBASE.new( enz )
47
+ # rebase = Bio::REBASE.new( enz, ref )
48
+ # rebase = Bio::REBASE.new( enz, ref, sup )
49
+ #
50
+ # # The 'read' class method allows you to read in files
51
+ # # that are REBASE EMBOSS formatted
52
+ # rebase = Bio::REBASE.read( 'emboss_e' )
53
+ # rebase = Bio::REBASE.read( 'emboss_e', 'emboss_r' )
54
+ # rebase = Bio::REBASE.read( 'emboss_e', 'emboss_r', 'emboss_s' )
55
+ #
56
+ # # The data loaded may be saved in YAML format
57
+ # rebase.save_yaml( 'enz.yaml' )
58
+ # rebase.save_yaml( 'enz.yaml', 'ref.yaml' )
59
+ # rebase.save_yaml( 'enz.yaml', 'ref.yaml', 'sup.yaml' )
60
+ #
61
+ # # YAML formatted files can also be read with the
62
+ # # class method 'load_yaml'
63
+ # rebase = Bio::REBASE.load_yaml( 'enz.yaml' )
64
+ # rebase = Bio::REBASE.load_yaml( 'enz.yaml', 'ref.yaml' )
65
+ # rebase = Bio::REBASE.load_yaml( 'enz.yaml', 'ref.yaml', 'sup.yaml' )
66
+ #
67
+ # pp rebase.enzymes[0..4] # ["AarI", "AasI", "AatI", "AatII", "Acc16I"]
68
+ # pp rebase['AarI'].pattern # "CACCTGC"
69
+ # pp rebase['AarI'].blunt? # false
70
+ # pp rebase['AarI'].organism # "Arthrobacter aurescens SS2-322"
71
+ # pp rebase['AarI'].source # "A. Janulaitis"
72
+ # pp rebase['AarI'].primary_strand_cut1 # 11
73
+ # pp rebase['AarI'].primary_strand_cut2 # 0
74
+ # pp rebase['AarI'].complementary_strand_cut1 # 15
75
+ # pp rebase['AarI'].complementary_strand_cut2 # 0
76
+ # pp rebase['AarI'].suppliers # ["F"]
77
+ # pp rebase['AarI'].supplier_names # ["Fermentas International Inc."]
78
+ #
79
+ # pp rebase['AarI'].isoschizomers # Currently none stored in the references file
80
+ # pp rebase['AarI'].methylation # ""
81
+ #
82
+ # pp rebase['EcoRII'].methylation # "2(5)"
83
+ # pp rebase['EcoRII'].suppliers # ["F", "J", "M", "O", "S"]
84
+ # pp rebase['EcoRII'].supplier_names # ["Fermentas International Inc.", "Nippon Gene Co., Ltd.",
85
+ # # "Roche Applied Science", "Toyobo Biochemicals",
86
+ # # "Sigma Chemical Corporation"]
87
+ #
88
+ # # Number of enzymes in the database
89
+ # pp rebase.size # 673
90
+ # pp rebase.enzymes.size # 673
91
+ #
92
+ # rebase.each do |name, info|
93
+ # pp "#{name}: #{info.methylation}" unless info.methylation.empty?
94
+ # end
95
+ #
96
+ #
13
97
  #--
14
98
  #
15
99
  # This library is free software; you can redistribute it and/or
@@ -28,104 +112,15 @@ module Bio
28
112
  #
29
113
  #++
30
114
  #
31
- #
32
-
33
- =begin rdoc
34
- bio/db/rebase.rb - Interface for EMBOSS formatted REBASE files
35
-
36
- == Synopsis
37
-
38
- Bio::REBASE provides utilties for interacting with REBASE data in EMBOSS
39
- format. REBASE is the Restriction Enzyme Database, more information
40
- can be found here:
41
- * http://rebase.neb.com
42
-
43
- EMBOSS formatted files located at:
44
- * http://rebase.neb.com/rebase/rebase.f37.html
45
-
46
- These files are the same as the "emboss_?.???" files located at:
47
- * ftp://ftp.neb.com/pub/rebase/
48
-
49
- To easily get started with the data you can simply type this command at your shell prompt:
50
- wget ftp://ftp.neb.com/pub/rebase/emboss*
51
-
52
-
53
- == Usage
54
-
55
- require 'bio/db/rebase'
56
- require 'pp'
57
-
58
- enz = File.read('emboss_e')
59
- ref = File.read('emboss_r')
60
- sup = File.read('emboss_s')
61
-
62
- # When creating a new instance of Bio::REBASE
63
- # the contents of the enzyme file must be passed.
64
- # The references and suppiers file contents
65
- # may also be passed.
66
- rebase = Bio::REBASE.new( enz )
67
- rebase = Bio::REBASE.new( enz, ref )
68
- rebase = Bio::REBASE.new( enz, ref, sup )
69
-
70
- # The 'read' class method allows you to read in files
71
- # that are REBASE EMBOSS formatted
72
- rebase = Bio::REBASE.read( 'emboss_e' )
73
- rebase = Bio::REBASE.read( 'emboss_e', 'emboss_r' )
74
- rebase = Bio::REBASE.read( 'emboss_e', 'emboss_r', 'emboss_s' )
75
-
76
- # The data loaded may be saved in YAML format
77
- rebase.save_yaml( 'enz.yaml' )
78
- rebase.save_yaml( 'enz.yaml', 'ref.yaml' )
79
- rebase.save_yaml( 'enz.yaml', 'ref.yaml', 'sup.yaml' )
80
-
81
- # YAML formatted files can also be read with the
82
- # class method 'load_yaml'
83
- rebase = Bio::REBASE.load_yaml( 'enz.yaml' )
84
- rebase = Bio::REBASE.load_yaml( 'enz.yaml', 'ref.yaml' )
85
- rebase = Bio::REBASE.load_yaml( 'enz.yaml', 'ref.yaml', 'sup.yaml' )
86
-
87
- pp rebase.enzymes[0..4] # ["AarI", "AasI", "AatI", "AatII", "Acc16I"]
88
- pp rebase['AarI'].pattern # "CACCTGC"
89
- pp rebase['AarI'].blunt? # false
90
- pp rebase['AarI'].organism # "Arthrobacter aurescens SS2-322"
91
- pp rebase['AarI'].source # "A. Janulaitis"
92
- pp rebase['AarI'].primary_strand_cut1 # 11
93
- pp rebase['AarI'].primary_strand_cut2 # 0
94
- pp rebase['AarI'].complementary_strand_cut1 # 15
95
- pp rebase['AarI'].complementary_strand_cut2 # 0
96
- pp rebase['AarI'].suppliers # ["F"]
97
- pp rebase['AarI'].supplier_names # ["Fermentas International Inc."]
98
-
99
- pp rebase['AarI'].isoschizomers # Currently none stored in the references file
100
- pp rebase['AarI'].methylation # ""
101
-
102
- pp rebase['EcoRII'].methylation # "2(5)"
103
- pp rebase['EcoRII'].suppliers # ["F", "J", "M", "O", "S"]
104
- pp rebase['EcoRII'].supplier_names # ["Fermentas International Inc.", "Nippon Gene Co., Ltd.",
105
- # "Roche Applied Science", "Toyobo Biochemicals",
106
- # "Sigma Chemical Corporation"]
107
-
108
- # Number of enzymes in the database
109
- pp rebase.size # 673
110
- pp rebase.enzymes.size # 673
111
-
112
- rebase.each do |name, info|
113
- pp "#{name}: #{info.methylation}" unless info.methylation.empty?
114
- end
115
-
116
115
 
117
- == Author
118
- Trevor Wennblom <trevor@corevx.com>
116
+ autoload :YAML, 'yaml'
119
117
 
118
+ module Bio
120
119
 
121
- == Copyright
122
- Copyright (C) 2005 Trevor Wennblom
123
- Licensed under the same terms as BioRuby.
120
+ autoload :Reference, 'reference'
124
121
 
125
- =end
126
122
 
127
123
  class REBASE
128
- autoload(:YAML, 'yaml')
129
124
 
130
125
  class DynamicMethod_Hash < Hash
131
126
  # Define a writer or reader
@@ -414,4 +409,5 @@ class REBASE
414
409
  end
415
410
 
416
411
  end # REBASE
412
+
417
413
  end # Bio