bio-bigbio 0.1.1
Sign up to get free protection for your applications and to get access to all the features.
- data/Gemfile +15 -0
- data/Gemfile.lock +34 -0
- data/LICENSE +34 -0
- data/README.rdoc +28 -0
- data/Rakefile +50 -0
- data/VERSION +1 -0
- data/bin/getorf +118 -0
- data/bin/nt2aa.rb +56 -0
- data/bio-bigbio.gemspec +102 -0
- data/doc/bigbio_getorf.wtex +14 -0
- data/lib/bigbio/adapters/translate.rb +64 -0
- data/lib/bigbio/db/blast/blastclust.rb +16 -0
- data/lib/bigbio/db/blast.rb +2 -0
- data/lib/bigbio/db/emitters/fasta_emitter.rb +48 -0
- data/lib/bigbio/db/emitters/orf_emitter.rb +289 -0
- data/lib/bigbio/db/fasta/fastaindex.rb +3 -0
- data/lib/bigbio/db/fasta/fastapairedreader.rb +19 -0
- data/lib/bigbio/db/fasta/fastapairedwriter.rb +21 -0
- data/lib/bigbio/db/fasta/fastareader.rb +132 -0
- data/lib/bigbio/db/fasta/fastarecord.rb +39 -0
- data/lib/bigbio/db/fasta/fastawriter.rb +20 -0
- data/lib/bigbio/db/fasta/indexer.rb +33 -0
- data/lib/bigbio/db/fasta.rb +13 -0
- data/lib/bigbio/environment.rb +12 -0
- data/lib/bigbio/sequence/predictorf.rb +140 -0
- data/lib/bigbio/sequence/translate.rb +52 -0
- data/lib/bigbio.rb +38 -0
- data/spec/emitter_spec.rb +265 -0
- data/spec/predictorf_spec.rb +199 -0
- data/test/data/EMBOSS/EGC.1 +32 -0
- data/test/data/fasta/nt.fa +1000 -0
- data/test/doctest/test_fasta.rb +112 -0
- data/test/doctest/test_frames.rb +76 -0
- data/test/doctest/test_getorf.rb +154 -0
- data/test/doctest/test_paired.rb +55 -0
- data/test/performance/translate_with_biolib.rb +67 -0
- data/test/performance/translate_with_bioruby.rb +64 -0
- metadata +163 -0
@@ -0,0 +1,32 @@
|
|
1
|
+
# Genetic Code Table
|
2
|
+
#
|
3
|
+
# Obtained from: http://www3.ncbi.nlm.nih.gov/Taxonomy/Utils/wprintgc.cgi
|
4
|
+
#
|
5
|
+
# Version 3.4
|
6
|
+
# Added CTG,TTG as allowed alternate start codons in Standard code.
|
7
|
+
# Prats et al. 1989, Hann et al. 1992
|
8
|
+
#
|
9
|
+
# Initiation Codon:
|
10
|
+
#
|
11
|
+
# AUG
|
12
|
+
#
|
13
|
+
# Alternative Initiation Codons
|
14
|
+
#
|
15
|
+
# In rare cases, translation in eukaryotes can be initiated from codons
|
16
|
+
# other than AUG. A well documented case (including direct protein
|
17
|
+
# sequencing) is the GUG start of a ribosomal P protein of the fungus
|
18
|
+
# Candida albicans (Abramczyk et al.). Other examples can be found in the
|
19
|
+
# following references: Peabody 1989; Prats et al. 1989; Hann et al.
|
20
|
+
# 1992; Sugihara et al. 1990.
|
21
|
+
#
|
22
|
+
# GUG, CUG, UUG
|
23
|
+
|
24
|
+
Genetic Code [1]
|
25
|
+
|
26
|
+
Standard
|
27
|
+
|
28
|
+
AAs = FFLLSSSSYY**CC*WLLLLPPPPHHQQRRRRIIIMTTTTNNKKSSRRVVVVAAAADDEEGGGG
|
29
|
+
Starts = ---M---------------M---------------M----------------------------
|
30
|
+
Base1 = TTTTTTTTTTTTTTTTCCCCCCCCCCCCCCCCAAAAAAAAAAAAAAAAGGGGGGGGGGGGGGGG
|
31
|
+
Base2 = TTTTCCCCAAAAGGGGTTTTCCCCAAAAGGGGTTTTCCCCAAAAGGGGTTTTCCCCAAAAGGGG
|
32
|
+
Base3 = TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
|