RubyGems - bio - Versions diffs - 1.3.0 → 1.3.1 - Mend

bio 1.3.0 → 1.3.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (75) hide show

data/COPYING +56 -0
data/COPYING.ja +51 -0
data/ChangeLog +540 -0
data/GPL +340 -0
data/LEGAL +141 -0
data/LGPL +504 -0
data/README.rdoc +4 -2
data/Rakefile +2 -2
data/bioruby.gemspec +17 -29
data/doc/Tutorial.rd +118 -90
data/doc/Tutorial.rd.html +124 -87
data/lib/bio/appl/blast.rb +2 -2
data/lib/bio/appl/blast/format0.rb +1 -1
data/lib/bio/appl/fasta.rb +5 -12
data/lib/bio/appl/fasta/format10.rb +96 -6
data/lib/bio/appl/gcg/msf.rb +11 -14
data/lib/bio/appl/pts1.rb +0 -4
data/lib/bio/appl/sim4/report.rb +50 -17
data/lib/bio/db/biosql/biosql_to_biosequence.rb +10 -0
data/lib/bio/db/biosql/sequence.rb +234 -298
data/lib/bio/db/embl/embl.rb +0 -3
data/lib/bio/db/genbank/common.rb +3 -1
data/lib/bio/io/biosql/ar-biosql.rb +257 -0
data/lib/bio/io/biosql/biosql.rb +39 -0
data/lib/bio/io/biosql/config/database.yml +5 -4
data/lib/bio/io/ncbirest.rb +12 -5
data/lib/bio/io/pubmed.rb +5 -1
data/lib/bio/io/sql.rb +43 -150
data/lib/bio/sequence/compat.rb +5 -1
data/lib/bio/util/restriction_enzyme/range/sequence_range/calculated_cuts.rb +6 -4
data/lib/bio/version.rb +1 -1
data/test/data/gcg/pileup-aa.msf +67 -0
data/test/data/sim4/complement-A4.sim4 +43 -0
data/test/data/sim4/simple-A4.sim4 +25 -0
data/test/data/sim4/simple2-A4.sim4 +25 -0
data/test/functional/bio/io/test_pubmed.rb +129 -0
data/test/unit/bio/appl/bl2seq/test_report.rb +5 -5
data/test/unit/bio/appl/gcg/test_msf.rb +154 -0
data/test/unit/bio/appl/hmmer/test_report.rb +2 -2
data/test/unit/bio/appl/sim4/test_report.rb +869 -0
data/test/unit/bio/appl/test_blast.rb +1 -1
data/test/unit/bio/db/biosql/tc_biosql.rb +110 -0
data/test/unit/bio/db/biosql/ts_suite_biosql.rb +8 -0
data/test/unit/bio/test_feature.rb +18 -17
data/test/unit/bio/test_reference.rb +18 -18
data/test/unit/bio/test_sequence.rb +1 -1
metadata +18 -30
data/lib/bio/io/biosql/biodatabase.rb +0 -64
data/lib/bio/io/biosql/bioentry.rb +0 -29
data/lib/bio/io/biosql/bioentry_dbxref.rb +0 -11
data/lib/bio/io/biosql/bioentry_path.rb +0 -12
data/lib/bio/io/biosql/bioentry_qualifier_value.rb +0 -10
data/lib/bio/io/biosql/bioentry_reference.rb +0 -10
data/lib/bio/io/biosql/bioentry_relationship.rb +0 -10
data/lib/bio/io/biosql/biosequence.rb +0 -11
data/lib/bio/io/biosql/comment.rb +0 -7
data/lib/bio/io/biosql/dbxref.rb +0 -13
data/lib/bio/io/biosql/dbxref_qualifier_value.rb +0 -12
data/lib/bio/io/biosql/location.rb +0 -32
data/lib/bio/io/biosql/location_qualifier_value.rb +0 -11
data/lib/bio/io/biosql/ontology.rb +0 -10
data/lib/bio/io/biosql/reference.rb +0 -9
data/lib/bio/io/biosql/seqfeature.rb +0 -32
data/lib/bio/io/biosql/seqfeature_dbxref.rb +0 -11
data/lib/bio/io/biosql/seqfeature_path.rb +0 -11
data/lib/bio/io/biosql/seqfeature_qualifier_value.rb +0 -20
data/lib/bio/io/biosql/seqfeature_relationship.rb +0 -11
data/lib/bio/io/biosql/taxon.rb +0 -12
data/lib/bio/io/biosql/taxon_name.rb +0 -9
data/lib/bio/io/biosql/term.rb +0 -27
data/lib/bio/io/biosql/term_dbxref.rb +0 -11
data/lib/bio/io/biosql/term_path.rb +0 -12
data/lib/bio/io/biosql/term_relationship.rb +0 -13
data/lib/bio/io/biosql/term_relationship_term.rb +0 -11
data/lib/bio/io/biosql/term_synonym.rb +0 -10

data/README.rdoc CHANGED

@@ -239,10 +239,12 @@ RubyGems 0.9.0 and removed in RubyGems 1.0.1.
 == LICENSE
 BioRuby can be freely distributed under the same terms as Ruby.
+See the file COPYING (or COPYING.ja written in Japanese).
-Note that setup.rb included in the BioRuby package comes from
+As written in the file COPYING, see the file LEGAL for files distributed
+under different license. For example, setup.rb which comes from
 {RAA:setup}[http://raa.ruby-lang.org/project/setup/] developed by Minero Aoki
-(http://i.loveruby.net/en/projects/setup/).
+(http://i.loveruby.net/en/projects/setup/) is licensed under LGPL 2.1.
 == CONTACT

data/Rakefile CHANGED

@@ -61,7 +61,7 @@ task :gemspec => GEM_SPEC_FILE
 desc "Force update gem spec file"
 task :regemspec do
   #rm GEM_SPEC_FILE, :force => true
-  Rake::Task[GEM_SPEC_FILE].execute
+  Rake::Task[GEM_SPEC_FILE].execute(nil)
 end
 desc "Update #{GEM_SPEC_FILE}"
@@ -137,7 +137,7 @@ desc "Force update doc/Tutorial*.html"
 task :retutorial2html do
   # safe_unlink HTMLFILES_TUTORIAL
   HTMLFILES_TUTORIAL.each do |x|
-    Rake::Task[x].execute
+    Rake::Task[x].execute(nil)
   end
 end

data/bioruby.gemspec CHANGED

@@ -3,7 +3,7 @@
 #
 Gem::Specification.new do |s|
   s.name = 'bio'
-  s.version = "1.3.0"
+  s.version = "1.3.1"
   s.author = "BioRuby project"
   s.email = "staff@bioruby.org"
@@ -14,8 +14,13 @@ Gem::Specification.new do |s|
   s.platform = Gem::Platform::RUBY
   s.files = [
+    "COPYING",
+    "COPYING.ja",
     "ChangeLog",
+    "GPL",
     "KNOWN_ISSUES.rdoc",
+    "LEGAL",
+    "LGPL",
     "README.rdoc",
     "README_DEV.rdoc",
     "Rakefile",
@@ -153,35 +158,9 @@ Gem::Specification.new do |s|
     "lib/bio/db/soft.rb",
     "lib/bio/db/transfac.rb",
     "lib/bio/feature.rb",
-    "lib/bio/io/biosql/biodatabase.rb",
-    "lib/bio/io/biosql/bioentry.rb",
-    "lib/bio/io/biosql/bioentry_dbxref.rb",
-    "lib/bio/io/biosql/bioentry_path.rb",
-    "lib/bio/io/biosql/bioentry_qualifier_value.rb",
-    "lib/bio/io/biosql/bioentry_reference.rb",
-    "lib/bio/io/biosql/bioentry_relationship.rb",
-    "lib/bio/io/biosql/biosequence.rb",
-    "lib/bio/io/biosql/comment.rb",
+    "lib/bio/io/biosql/ar-biosql.rb",
+    "lib/bio/io/biosql/biosql.rb",
     "lib/bio/io/biosql/config/database.yml",
-    "lib/bio/io/biosql/dbxref.rb",
-    "lib/bio/io/biosql/dbxref_qualifier_value.rb",
-    "lib/bio/io/biosql/location.rb",
-    "lib/bio/io/biosql/location_qualifier_value.rb",
-    "lib/bio/io/biosql/ontology.rb",
-    "lib/bio/io/biosql/reference.rb",
-    "lib/bio/io/biosql/seqfeature.rb",
-    "lib/bio/io/biosql/seqfeature_dbxref.rb",
-    "lib/bio/io/biosql/seqfeature_path.rb",
-    "lib/bio/io/biosql/seqfeature_qualifier_value.rb",
-    "lib/bio/io/biosql/seqfeature_relationship.rb",
-    "lib/bio/io/biosql/taxon.rb",
-    "lib/bio/io/biosql/taxon_name.rb",
-    "lib/bio/io/biosql/term.rb",
-    "lib/bio/io/biosql/term_dbxref.rb",
-    "lib/bio/io/biosql/term_path.rb",
-    "lib/bio/io/biosql/term_relationship.rb",
-    "lib/bio/io/biosql/term_relationship_term.rb",
-    "lib/bio/io/biosql/term_synonym.rb",
     "lib/bio/io/das.rb",
     "lib/bio/io/dbget.rb",
     "lib/bio/io/ddbjxml.rb",
@@ -345,6 +324,7 @@ Gem::Specification.new do |s|
     "test/data/embl/AB090716.embl.rel89",
     "test/data/fasta/example1.txt",
     "test/data/fasta/example2.txt",
+    "test/data/gcg/pileup-aa.msf",
     "test/data/genscan/sample.report",
     "test/data/iprscan/merged.raw",
     "test/data/iprscan/merged.txt",
@@ -354,11 +334,15 @@ Gem::Specification.new do |s|
     "test/data/prosite/prosite.dat",
     "test/data/refseq/nm_126355.entret",
     "test/data/rpsblast/misc.rpsblast",
+    "test/data/sim4/complement-A4.sim4",
+    "test/data/sim4/simple-A4.sim4",
+    "test/data/sim4/simple2-A4.sim4",
     "test/data/soft/GDS100_partial.soft",
     "test/data/soft/GSE3457_family_partial.soft",
     "test/data/uniprot/p53_human.uniprot",
     "test/functional/bio/appl/test_pts1.rb",
     "test/functional/bio/io/test_ensembl.rb",
+    "test/functional/bio/io/test_pubmed.rb",
     "test/functional/bio/io/test_soapwsdl.rb",
     "test/functional/bio/io/test_togows.rb",
     "test/functional/bio/sequence/test_output_embl.rb",
@@ -368,6 +352,7 @@ Gem::Specification.new do |s|
     "test/unit/bio/appl/blast/test_ncbioptions.rb",
     "test/unit/bio/appl/blast/test_report.rb",
     "test/unit/bio/appl/blast/test_rpsblast.rb",
+    "test/unit/bio/appl/gcg/test_msf.rb",
     "test/unit/bio/appl/genscan/test_report.rb",
     "test/unit/bio/appl/hmmer/test_report.rb",
     "test/unit/bio/appl/iprscan/test_report.rb",
@@ -375,6 +360,7 @@ Gem::Specification.new do |s|
     "test/unit/bio/appl/paml/codeml/test_rates.rb",
     "test/unit/bio/appl/paml/codeml/test_report.rb",
     "test/unit/bio/appl/paml/test_codeml.rb",
+    "test/unit/bio/appl/sim4/test_report.rb",
     "test/unit/bio/appl/sosui/test_report.rb",
     "test/unit/bio/appl/targetp/test_report.rb",
     "test/unit/bio/appl/test_blast.rb",
@@ -384,6 +370,8 @@ Gem::Specification.new do |s|
     "test/unit/bio/data/test_aa.rb",
     "test/unit/bio/data/test_codontable.rb",
     "test/unit/bio/data/test_na.rb",
+    "test/unit/bio/db/biosql/tc_biosql.rb",
+    "test/unit/bio/db/biosql/ts_suite_biosql.rb",
     "test/unit/bio/db/embl/test_common.rb",
     "test/unit/bio/db/embl/test_embl.rb",
     "test/unit/bio/db/embl/test_embl_rel89.rb",

data/doc/Tutorial.rd CHANGED

@@ -2,45 +2,43 @@
 #
 # A possible test run could be from rdtool (on Debian package rdtool)
 #
-#   ruby -I lib ./bin/rd2 ~/cvs/opensource/bioruby/doc/Tutorial.rd
+#   rd2 $BIORUBYPATH/doc/Tutorial.rd
 #
 # or with style sheet:
 #
-#   ruby -I lib ./bin/rd2 -r rd/rd2html-lib.rb --with-c
-ss=bioruby.css ~/cvs/opensource/bioruby/doc/Tutorial.rd > ~/bioruby.html
+#   rd2 -r rd/rd2html-lib.rb --with-css=bioruby.css $BIORUBYPATH/doc/Tutorial.rd > ~/bioruby.html
 #
 # in Debian:
 #
-#   rd2 -r rd/rd2html-lib  --with-css="/home/wrk/izip/cvs/opensource/bioruby/lib/bio/shell/rails/vendor/plugins/bioruby/generators/bioruby/templates/bioruby.css" Tutorial.rd > index.html
+#   rd2 -r rd/rd2html-lib  --with-css="../lib/bio/shell/rails/vendor/plugins/bioruby/generators/bioruby/templates/bioruby.css" Tutorial.rd > Tutorial.rd.html
 #
 # A common problem is tabs in the text file! TABs are not allowed.
 #
 # To add tests run Toshiaki's bioruby shell and paste in the query plus
 # results.
 #
-# To run the embedded Ruby doctests you can get the doctest.rb from Pjotr.
+# To run the embedded Ruby doctests you can use the rubydoctest tool, part
+# of the bioruby-support repository at http://github.com/pjotrp/bioruby-support/
+#
 =begin
 #doctest Testing bioruby
 = BioRuby Tutorial
-Editor: PjotrPrins <p .at. bioruby.org>
 * Copyright (C) 2001-2003 KATAYAMA Toshiaki <k .at. bioruby.org>
-* Copyright (C) 2005-2008 Pjotr Prins, Naohisa Goto and others
+* Copyright (C) 2005-2009 Pjotr Prins, Naohisa Goto and others
-The latest version resides in the CVS repository ./doc/((<Tutorial.rd|URL:http://cvs.open-bio.org/cgi-bin/viewcvs/viewcvs.cgi/*checkout*/bioruby/doc/Tutorial.rd?rev=HEAD&cvsroot=bioruby&content-type=text/plain>)). This one was updated:
+This document was last modified: 2009/03/17
+Current editor: Pjotr Prins <p .at. bioruby.org>
-  $Id: Tutorial.rd,v 1.22 2008/05/19 12:22:05 pjotr Exp $
-in preparation for the ((<BioHackathlon 2008|URL:http://hackathon.dbcls.jp/>))
+The latest version resides in the GIT source code repository:  ./doc/((<Tutorial.rd|URL:http://github.com/pjotrp/bioruby/raw/documentation/doc/Tutorial.rd>)).
 == Introduction
 This is a tutorial for using Bioruby. A basic knowledge of Ruby is required.
 If you want to know more about the programming langauge Ruby we recommend the
-excellent book ((<Programming Ruby|URL:http://www.pragprog.com/titles/ruby>))
+latest Ruby book ((<Programming Ruby|URL:http://www.pragprog.com/titles/ruby>))
 by Dave Thomas and Andy Hunt - some of it is online
 ((<here|URL:http://www.rubycentral.com/pickaxe/>)).
@@ -53,7 +51,7 @@ version it has with the
 command. Showing something like:
-  ruby 1.8.5 (2006-08-25) [powerpc-linux]
+  ruby 1.8.7 (2008-08-11 patchlevel 72) [i486-linux]
 If you see no such thing you'll have to install Ruby using your installation
 manager. For more information see the
@@ -81,6 +79,7 @@ and you should see a prompt
 Now test the following:
+  bioruby> require 'bio'
   bioruby> seq = Bio::Sequence::NA.new("atgcatgcaaaa")
   ==> "atgcatgcaaaa"
@@ -182,37 +181,35 @@ way of writing concise and clear code using 'closures'. Each sliding
 window creates a subsequence which is supplied to the enclosed block
 through a variable named +s+.
-Show average percentage of GC content for 20 bases (stepping the default one base at a time)
+* Show average percentage of GC content for 20 bases (stepping the default one base at a time)
-  bioruby> seq = Bio::Sequence::NA.new("atgcatgcaattaagctaatcccaattagatcatcccgatcatcaaaaaaaaaa")
-  ==> "atgcatgcaattaagctaatcccaattagatcatcccgatcatcaaaaaaaaaa"
+   bioruby> seq = Bio::Sequence::NA.new("atgcatgcaattaagctaatcccaattagatcatcccgatcatcaaaaaaaaaa")
+   ==> "atgcatgcaattaagctaatcccaattagatcatcccgatcatcaaaaaaaaaa"
-  bioruby> a=[]; seq.window_search(20) { |s| a.push s.gc_percent }
-  bioruby> a
-  ==> [30, 35, 40, 40, 35, 35, 35, 30, 25, 30, 30, 30, 35, 35, 35, 35, 35, 40, 45, 45, 45, 45, 40, 35, 40, 40, 40, 40, 40, 35, 35, 35, 30, 30, 30]
+   bioruby> a=[]; seq.window_search(20) { |s| a.push s.gc_percent }
+   bioruby> a
+   ==> [30, 35, 40, 40, 35, 35, 35, 30, 25, 30, 30, 30, 35, 35, 35, 35, 35, 40, 45, 45, 45, 45, 40, 35, 40, 40, 40, 40, 40, 35, 35, 35, 30, 30, 30]
 Since the class of each subsequence is the same as original sequence
 (Bio::Sequence::NA or Bio::Sequence::AA or Bio::Sequence), you can
 use all methods on the subsequence. For example,
-Shows translation results for 15 bases shifting a codon at a time
+* Shows translation results for 15 bases shifting a codon at a time
-  bioruby> a = []
-  bioruby> seq.window_search(15, 3) do |s|
-  bioruby>   a.push s.translate
-  bioruby> end
-  bioruby> a
-  ==> ["MHAIK", "HAIKL", "AIKLI", "IKLIP", "KLIPI", "LIPIR", "IPIRS", "PIRSS", "IRSSR", "RSSRS", "SSRSS", "SRSSK", "RSSKK", "SSKKK"]
+   bioruby> a = []
+   bioruby> seq.window_search(15, 3) { | s | a.push s.translate }
+   bioruby> a
+   ==> ["MHAIK", "HAIKL", "AIKLI", "IKLIP", "KLIPI", "LIPIR", "IPIRS", "PIRSS", "IRSSR", "RSSRS", "SSRSS", "SRSSK", "RSSKK", "SSKKK"]
 Finally, the window_search method returns the last leftover
 subsequence. This allows for example
-Divide a genome sequence into sections of 10000bp and
-output FASTA formatted sequences (line width 60 chars). The 1000bp at the
-start and end of each subsequence overlapped. At the 3' end of the sequence
-the leftover is also added:
+* Divide a genome sequence into sections of 10000bp and
+  output FASTA formatted sequences (line width 60 chars). The 1000bp at the
+  start and end of each subsequence overlapped. At the 3' end of the sequence
+  the leftover is also added:
     i = 1
     textwidth=60
@@ -229,24 +226,20 @@ size to equal values.
 Other examples
-Count the codon usage
+* Count the codon usage
-  bioruby> codon_usage = Hash.new(0)
-  bioruby> seq.window_search(3, 3) do |s|
-  bioruby>   codon_usage[s] += 1
-  bioruby> end
-  bioruby> codon_usage
-  ==> {"cat"=>1, "aaa"=>3, "cca"=>1, "att"=>2, "aga"=>1, "atc"=>1, "cta"=>1, "gca"=>1, "cga"=>1, "tca"=>3, "aag"=>1, "tcc"=>1, "atg"=>1}
+   bioruby> codon_usage = Hash.new(0)
+   bioruby> seq.window_search(3, 3) { |s| codon_usage[s] += 1 }
+   bioruby> codon_usage
+   ==> {"cat"=>1, "aaa"=>3, "cca"=>1, "att"=>2, "aga"=>1, "atc"=>1, "cta"=>1, "gca"=>1, "cga"=>1, "tca"=>3, "aag"=>1, "tcc"=>1, "atg"=>1}
-Calculate molecular weight for each 10-aa peptide (or 10-nt nucleic acid)
+* Calculate molecular weight for each 10-aa peptide (or 10-nt nucleic acid)
-  bioruby> a = []
-  bioruby> seq.window_search(10, 10) do |s|
-  bioruby>   a.push s.molecular_weight
-  bioruby> end
-  bioruby> a
-  ==> [3096.2062, 3086.1962, 3056.1762, 3023.1262, 3073.2262]
+   bioruby> a = []
+   bioruby> seq.window_search(10, 10) { |s| a.push s.molecular_weight }
+   bioruby> a
+   ==> [3096.2062, 3086.1962, 3056.1762, 3023.1262, 3073.2262]
 In most cases, sequences are read from files or retrieved from databases.
 For example:
@@ -398,12 +391,12 @@ very complicated:
       end
     end
-Note: In this example Feature#assoc method makes a Hash from a
-feature object. It is useful because you can get data from the hash
-by using qualifiers as keys.
-(But there is a risk some information is lost when two or more
-qualifiers are the same. Therefore an Array is returned by
-Feature#feature)
+* Note: In this example Feature#assoc method makes a Hash from a
+  feature object. It is useful because you can get data from the hash
+  by using qualifiers as keys.
+  (But there is a risk some information is lost when two or more
+  qualifiers are the same. Therefore an Array is returned by
+  Feature#feature)
 Bio::Sequence#splicing splices subsequence from nucleic acid sequence
 according to location information used in GenBank, EMBL and DDBJ.
@@ -417,11 +410,11 @@ feature style location text but also Bio::Locations object. For more
 information about location format and Bio::Locations class, see
 bio/location.rb.
-Splice according to location string used in a GenBank entry
+* Splice according to location string used in a GenBank entry
     naseq.splicing('join(2035..2050,complement(1775..1818),13..345')
-Generate Bio::Locations object and pass the splicing method
+* Generate Bio::Locations object and pass the splicing method
     locs = Bio::Locations.new('join((8298.8300)..10206,1..855)')
     naseq.splicing(locs)
@@ -429,7 +422,7 @@ Generate Bio::Locations object and pass the splicing method
 You can also use the splicing method for amino acid sequences
 (Bio::Sequence::AA objects).
-Splicing peptide from a protein (e.g. signal peptide)
+* Splicing peptide from a protein (e.g. signal peptide)
     aaseq.splicing('21..119')
@@ -469,7 +462,7 @@ to a FASTA file can be found in sample/any2fasta.rb. With this technique it is
 possible to write a Unix type grep/sort pipe for sequence information. One
 example using scripts in the BIORUBY sample folder:
-  fastagrep.rb '/At|Dm/' database.seq | fastasort.rb
+ fastagrep.rb '/At|Dm/' database.seq | fastasort.rb
 greps the database for Arabidopsis and Drosophila entries and sorts the output
 to FASTA.
@@ -505,23 +498,23 @@ Array and BioPerl's Bio::SimpleAlign.  A very simple example is:
   bioruby> a.consensus
   ==> "a?gc?"
   # shows IUPAC consensus
-  a.consensus_iupac
-  ==> "ahgcr"
+  p a.consensus_iupac       # ==> "ahgcr"
   # iterates over each seq
   a.each { |x| p x }
-  # ==>
-  #    "atgca"
-  #    "aagca"
-  #    "acgca"
-  #    "acgcg"
+    # ==>
+    #    "atgca"
+    #    "aagca"
+    #    "acgca"
+    #    "acgcg"
   # iterates over each site
   a.each_site { |x| p x }
-  # ==>
-  #    ["a", "a", "a", "a"]
-  #    ["t", "a", "c", "c"]
-  #    ["g", "g", "g", "g"]
-  #    ["c", "c", "c", "c"]
-  #    ["a", "a", "a", "g"]
+    # ==>
+    #    ["a", "a", "a", "a"]
+    #    ["t", "a", "c", "c"]
+    #    ["g", "g", "g", "g"]
+    #    ["c", "c", "c", "c"]
+    #    ["a", "a", "a", "g"]
   # doing alignment by using CLUSTAL W.
   # clustalw command must be installed.
@@ -671,7 +664,7 @@ method of the factory object after the "query" method.
 === using FASTA from a remote internet site
 * Note: Currently, only GenomeNet (fasta.genome.jp) is
-supported. check the class documentation for updates.
+  supported. check the class documentation for updates.
 For accessing a remote site the Bio::Fasta.remote method is used
 instead of Bio::Fasta.local.  When using a remote method, the
@@ -774,7 +767,7 @@ Check the documentation for Bio::Blast::Report to see what can be
 retrieved. For now suffice to state that Bio::Blast::Report has a
 hierarchical structure mirroring the general BLAST output stream:
-  * In a Bio::Blast::Report object, @iteratinos is an array of
+  * In a Bio::Blast::Report object, @iterations is an array of
     Bio::Blast::Report::Iteration objects.
     * In a Bio::Blast::Report::Iteration object, @hits is an array of
       Bio::Blast::Report::Hits objects.
@@ -790,13 +783,26 @@ you can directly create Bio::Blast::Report objects without the
 Bio::Blast factory object. For this purpose use Bio::Blast.reports,
 which supports the "-m 0" default and "-m 7" XML type output format.
-    #!/usr/bin/env ruby
+* For example:
-    require 'bio'
+   bioruby> blast_version = nil; result = []
+   bioruby> Bio::Blast.reports(File.new("../test/data/blast/blastp-multi.m7")) do |report|
+   bioruby>   blast_version = report.version
+   bioruby>   report.iterations.each do |itr|
+   bioruby>     itr.hits.each do |hit|
+   bioruby>       result.push hit.target_id
+   bioruby>     end
+   bioruby>   end
+   bioruby> end
+   bioruby> blast_version
+   ==> "blastp 2.2.18 [Mar-02-2008]"
+   bioruby> result
+   ==> ["BAB38768", "BAB38768", "BAB38769", "BAB37741"]
-    # Iterates over each XML result.
-    # The variable "report" is a Bio::Blast::Report object.
-    Bio::Blast.reports(ARGF) do |report|
+* another example:
+    require 'bio'
+    Bio::Blast.reports(ARGF) do |report|
       puts "Hits for " + report.query_def + " against " + report.db
       report.each do |hit|
         print hit.target_id, "\t", hit.evalue, "\n" if hit.evalue < 0.001
@@ -804,14 +810,16 @@ which supports the "-m 0" default and "-m 7" XML type output format.
     end
 Save the script as hits_under_0.001.rb and to process BLAST output
-files *.xml, you can
+files *.xml, you can run it with:
    % ruby hits_under_0.001.rb *.xml
-Sometimes BLAST XML output may be wrong and can not be parsed. We
-recommended to install BLAST 2.2.5 or later, and try combinations of
-the -D and -m options when you encounter problems.
+Sometimes BLAST XML output may be wrong and can not be parsed. Check whether
+blast is version 2.2.5 or later. See also blast --help.
+Bio::Blast loads the full XML file into memory. If this causes a problem
+you can split the BLAST XML file into smaller chunks using XML-Twig. An
+example can be found in ((<Biotools|URL:http://github.com/pjotrp/biotools/>)).
 === Add remote BLAST search sites
@@ -838,10 +846,6 @@ they may be included.
 Below script is an example which seaches PubMed and creates a reference list.
-    #!/usr/bin/env ruby
-    require 'bio'
     ARGV.each do |id|
       entry = Bio::PubMed.query(id)     # searches PubMed and get entry
       medline = Bio::MEDLINE.new(entry) # creates Bio::MEDLINE object from entry text
@@ -1010,10 +1014,6 @@ BioRuby and other projects' members (2002).
 Here we give a quick overview. Check out
 ((<URL:http://obda.open-bio.org/>)) for more extensive details.
-The specification is stored on CVS repository at cvs.open-bio.org,
-also available via http from:
-((<URL:http://cvs.open-bio.org/cgi-bin/viewcvs/viewcvs.cgi/obda-specs/?cvsroot=obf-common>))
 == BioRegistry
 BioRegistry allows for locating retrieval methods and database
@@ -1254,6 +1254,34 @@ Please refer to KEGG_API.rd.ja (English version: ((<URL:http://www.genome.jp/keg
   * ((<URL:http://www.genome.jp/kegg/soap/>))
+== Ruby Ensembl API
+Ruby Ensembl API is a ruby API to the Ensembl database. It is NOT currently
+included in the BioRuby archives. To install it, see
+((<URL:http://wiki.github.com/jandot/ruby-ensembl-api>))
+for more information.
+=== Gene Ontology (GO) through the Ruby Ensembl API
+Gene Ontologies can be fetched through the Ruby Ensembl API package:
+   require 'ensembl'
+   Ensembl::Core::DBConnection.connect('drosophila_melanogaster')
+   infile = IO.readlines(ARGV.shift) # reading your comma-separated accession mapping file (one line per mapping)
+   infile.each do |line|
+     accs = line.split(",")          # Split the comma-sep.entries into an array
+     drosphila_acc = accs.shift      # the first entry is the Drosophila acc
+     mosq_acc = accs.shift           # the second entry is you Mosq. acc
+     gene = Ensembl::Core::Gene.find_by_stable_id(drosophila_acc)
+     print "#{mosq_acc}"
+     gene.go_terms.each do |go|
+        print ",#{go}"
+     end
+   end
+Prints each mosq. accession/uniq identifier and the GO terms from the Drosphila
+homologues.
 == Comparing BioProjects
 For a quick functional comparison of BioRuby, BioPerl, BioPython and Bioconductor (R) see ((<URL:http://sciruby.codeforpeople.com/sr.cgi/BioProjects>))
@@ -1284,13 +1312,13 @@ carefully that come with each package.
 Ruby fails to find the BioRuby libraries - add it to the RUBYLIB path, or pass
 it to the interpeter. For example:
-  ruby -I~/cvs/bioruby/lib yourprogram.rb
+  ruby -I$BIORUBYPATH/lib yourprogram.rb
 == Modifying this page
-IMPORTANT NOTICE: This page is maintained in the BioRuby CVS
+IMPORTANT NOTICE: This page is maintained in the BioRuby source code
 repository. Please edit the file there otherwise changes may get
-lost. See ((<BioRuby Developer Information>)) for CVS and mailing list
+lost. See ((<BioRuby Developer Information>)) for repository and mailing list
 access.
 =end