bio-bigbio 0.1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/Gemfile +15 -0
- data/Gemfile.lock +34 -0
- data/LICENSE +34 -0
- data/README.rdoc +28 -0
- data/Rakefile +50 -0
- data/VERSION +1 -0
- data/bin/getorf +118 -0
- data/bin/nt2aa.rb +56 -0
- data/bio-bigbio.gemspec +102 -0
- data/doc/bigbio_getorf.wtex +14 -0
- data/lib/bigbio/adapters/translate.rb +64 -0
- data/lib/bigbio/db/blast/blastclust.rb +16 -0
- data/lib/bigbio/db/blast.rb +2 -0
- data/lib/bigbio/db/emitters/fasta_emitter.rb +48 -0
- data/lib/bigbio/db/emitters/orf_emitter.rb +289 -0
- data/lib/bigbio/db/fasta/fastaindex.rb +3 -0
- data/lib/bigbio/db/fasta/fastapairedreader.rb +19 -0
- data/lib/bigbio/db/fasta/fastapairedwriter.rb +21 -0
- data/lib/bigbio/db/fasta/fastareader.rb +132 -0
- data/lib/bigbio/db/fasta/fastarecord.rb +39 -0
- data/lib/bigbio/db/fasta/fastawriter.rb +20 -0
- data/lib/bigbio/db/fasta/indexer.rb +33 -0
- data/lib/bigbio/db/fasta.rb +13 -0
- data/lib/bigbio/environment.rb +12 -0
- data/lib/bigbio/sequence/predictorf.rb +140 -0
- data/lib/bigbio/sequence/translate.rb +52 -0
- data/lib/bigbio.rb +38 -0
- data/spec/emitter_spec.rb +265 -0
- data/spec/predictorf_spec.rb +199 -0
- data/test/data/EMBOSS/EGC.1 +32 -0
- data/test/data/fasta/nt.fa +1000 -0
- data/test/doctest/test_fasta.rb +112 -0
- data/test/doctest/test_frames.rb +76 -0
- data/test/doctest/test_getorf.rb +154 -0
- data/test/doctest/test_paired.rb +55 -0
- data/test/performance/translate_with_biolib.rb +67 -0
- data/test/performance/translate_with_bioruby.rb +64 -0
- metadata +163 -0
@@ -0,0 +1,32 @@
|
|
1
|
+
# Genetic Code Table
|
2
|
+
#
|
3
|
+
# Obtained from: http://www3.ncbi.nlm.nih.gov/Taxonomy/Utils/wprintgc.cgi
|
4
|
+
#
|
5
|
+
# Version 3.4
|
6
|
+
# Added CTG, TTG as allowed alternate start codons in Standard code.
|
7
|
+
# Prats et al. 1989, Hann et al. 1992
|
8
|
+
#
|
9
|
+
# Initiation Codon:
|
10
|
+
#
|
11
|
+
# AUG
|
12
|
+
#
|
13
|
+
# Alternative Initiation Codons
|
14
|
+
#
|
15
|
+
# In rare cases, translation in eukaryotes can be initiated from codons
|
16
|
+
# other than AUG. A well-documented case (including direct protein
|
17
|
+
# sequencing) is the GUG start of a ribosomal P protein of the fungus
|
18
|
+
# Candida albicans (Abramczyk et al.). Other examples can be found in the
|
19
|
+
# following references: Peabody 1989; Prats et al. 1989; Hann et al.
|
20
|
+
# 1992; Sugihara et al. 1990.
|
21
|
+
#
|
22
|
+
# GUG, CUG, UUG
|
23
|
+
|
24
|
+
Genetic Code [1]
|
25
|
+
|
26
|
+
Standard
|
27
|
+
|
28
|
+
AAs = FFLLSSSSYY**CC*WLLLLPPPPHHQQRRRRIIIMTTTTNNKKSSRRVVVVAAAADDEEGGGG
|
29
|
+
Starts = ---M---------------M---------------M----------------------------
|
30
|
+
Base1 = TTTTTTTTTTTTTTTTCCCCCCCCCCCCCCCCAAAAAAAAAAAAAAAAGGGGGGGGGGGGGGGG
|
31
|
+
Base2 = TTTTCCCCAAAAGGGGTTTTCCCCAAAAGGGGTTTTCCCCAAAAGGGGTTTTCCCCAAAAGGGG
|
32
|
+
Base3 = TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
|