bio 1.4.1 → 1.4.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/ChangeLog +954 -0
- data/KNOWN_ISSUES.rdoc +40 -5
- data/README.rdoc +36 -35
- data/RELEASE_NOTES.rdoc +87 -59
- data/bioruby.gemspec +24 -2
- data/doc/RELEASE_NOTES-1.4.1.rdoc +104 -0
- data/doc/Tutorial.rd +162 -200
- data/doc/Tutorial.rd.html +149 -146
- data/lib/bio.rb +1 -0
- data/lib/bio/appl/blast.rb +1 -1
- data/lib/bio/appl/blast/ddbj.rb +26 -34
- data/lib/bio/appl/blast/genomenet.rb +21 -11
- data/lib/bio/db/embl/sptr.rb +193 -21
- data/lib/bio/db/fasta.rb +1 -1
- data/lib/bio/db/fastq.rb +14 -0
- data/lib/bio/db/fastq/format_fastq.rb +2 -2
- data/lib/bio/db/genbank/ddbj.rb +1 -2
- data/lib/bio/db/genbank/format_genbank.rb +1 -1
- data/lib/bio/db/medline.rb +1 -0
- data/lib/bio/db/newick.rb +3 -1
- data/lib/bio/db/pdb/pdb.rb +9 -9
- data/lib/bio/db/pdb/residue.rb +2 -2
- data/lib/bio/io/ddbjrest.rb +344 -0
- data/lib/bio/io/ncbirest.rb +121 -1
- data/lib/bio/location.rb +2 -2
- data/lib/bio/reference.rb +3 -4
- data/lib/bio/shell/plugin/entry.rb +7 -3
- data/lib/bio/shell/plugin/ncbirest.rb +5 -1
- data/lib/bio/util/restriction_enzyme.rb +3 -0
- data/lib/bio/util/restriction_enzyme/dense_int_array.rb +195 -0
- data/lib/bio/util/restriction_enzyme/range/sequence_range.rb +7 -7
- data/lib/bio/util/restriction_enzyme/range/sequence_range/calculated_cuts.rb +57 -18
- data/lib/bio/util/restriction_enzyme/range/sequence_range/fragment.rb +2 -2
- data/lib/bio/util/restriction_enzyme/sorted_num_array.rb +219 -0
- data/lib/bio/version.rb +1 -1
- data/sample/test_restriction_enzyme_long.rb +4403 -0
- data/test/data/fasta/EFTU_BACSU.fasta +8 -0
- data/test/data/genbank/CAA35997.gp +48 -0
- data/test/data/genbank/SCU49845.gb +167 -0
- data/test/data/litdb/1717226.litdb +13 -0
- data/test/data/pir/CRAB_ANAPL.pir +6 -0
- data/test/functional/bio/appl/blast/test_remote.rb +93 -0
- data/test/functional/bio/appl/test_blast.rb +61 -0
- data/test/functional/bio/io/test_ddbjrest.rb +47 -0
- data/test/functional/bio/test_command.rb +3 -3
- data/test/unit/bio/db/embl/test_sptr.rb +6 -6
- data/test/unit/bio/db/embl/test_uniprot_new_part.rb +208 -0
- data/test/unit/bio/db/genbank/test_common.rb +274 -0
- data/test/unit/bio/db/genbank/test_genbank.rb +401 -0
- data/test/unit/bio/db/genbank/test_genpept.rb +81 -0
- data/test/unit/bio/db/pdb/test_pdb.rb +3287 -11
- data/test/unit/bio/db/test_fasta.rb +34 -12
- data/test/unit/bio/db/test_fastq.rb +26 -0
- data/test/unit/bio/db/test_litdb.rb +95 -0
- data/test/unit/bio/db/test_medline.rb +1 -0
- data/test/unit/bio/db/test_nbrf.rb +82 -0
- data/test/unit/bio/db/test_newick.rb +22 -4
- data/test/unit/bio/test_reference.rb +35 -0
- data/test/unit/bio/util/restriction_enzyme/test_dense_int_array.rb +201 -0
- data/test/unit/bio/util/restriction_enzyme/test_sorted_num_array.rb +281 -0
- metadata +44 -38
@@ -0,0 +1,8 @@
|
|
1
|
+
>sp|P33166|EFTU_BACSU Elongation factor Tu;
|
2
|
+
MAKEKFDRSKSHANIGTIGHVDHGKTTLTAAITTVLHKKSGKGTAMAYDQIDGAPEERER
|
3
|
+
GITISTAHVEYETETRHYAHVDCPGHADYVKNMITGAAQMDGAILVVSAADGPMPQTREH
|
4
|
+
ILLSKNVGVPYIVVFLNKCDMVDDEELLELVEMEVRDLLSEYDFPGDDVPVVKGSALKAL
|
5
|
+
EGDAEWEAKIFELMDAVDEYIPTPERDTEKPFMMPVEDVFSITGRGTVATGRVERGQVKV
|
6
|
+
GDEVEIIGLQEENKKTTVTGVEMFRKLLDYAEAGDNIGALLRGVSREEIQRGQVLAKPGT
|
7
|
+
ITPHSKFKAEVYVLSKEEGGRHTPFFSNYRPQFYFRTTDVTGIIHLPEGVEMVMPGDNTE
|
8
|
+
MNVELISTIAIEEGTRFSIREGGRTVGSGVVSTITE
|
@@ -0,0 +1,48 @@
|
|
1
|
+
LOCUS CAA35997 100 aa linear MAM 12-SEP-1993
|
2
|
+
DEFINITION unnamed protein product [Bos taurus].
|
3
|
+
ACCESSION CAA35997
|
4
|
+
VERSION CAA35997.1 GI:8
|
5
|
+
DBSOURCE embl accession X51700.1
|
6
|
+
KEYWORDS .
|
7
|
+
SOURCE Bos taurus (cattle)
|
8
|
+
ORGANISM Bos taurus
|
9
|
+
Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
|
10
|
+
Mammalia; Eutheria; Laurasiatheria; Cetartiodactyla; Ruminantia;
|
11
|
+
Pecora; Bovidae; Bovinae; Bos.
|
12
|
+
REFERENCE 1 (residues 1 to 100)
|
13
|
+
AUTHORS Kiefer,M.C., Saphire,A.C.S., Bauer,D.M. and Barr,P.J.
|
14
|
+
JOURNAL Unpublished
|
15
|
+
REFERENCE 2 (residues 1 to 100)
|
16
|
+
AUTHORS Kiefer,M.C.
|
17
|
+
TITLE Direct Submission
|
18
|
+
JOURNAL Submitted (30-JAN-1990) Kiefer M.C., Chiron Corporation, 4560
|
19
|
+
Hortom St, Emeryville CA 94608-2916, U S A
|
20
|
+
COMMENT See <X15699> for Human sequence.
|
21
|
+
Data kindly reviewed (08-MAY-1990) by Kiefer M.C.
|
22
|
+
FEATURES Location/Qualifiers
|
23
|
+
source 1..100
|
24
|
+
/organism="Bos taurus"
|
25
|
+
/db_xref="taxon:9913"
|
26
|
+
/clone="bBGP-3"
|
27
|
+
/tissue_type="bone matrix"
|
28
|
+
/clone_lib="Zap-bb"
|
29
|
+
Protein 1..100
|
30
|
+
/name="unnamed protein product"
|
31
|
+
Region 33..97
|
32
|
+
/region_name="Gla"
|
33
|
+
/note="Vitamin K-dependent
|
34
|
+
carboxylation/gamma-carboxyglutamic (GLA) domain; cl02449"
|
35
|
+
/db_xref="CDD:141428"
|
36
|
+
CDS 1..100
|
37
|
+
/coded_by="X51700.1:28..330"
|
38
|
+
/note="bone Gla precursor (100 AA)"
|
39
|
+
/db_xref="GOA:P02820"
|
40
|
+
/db_xref="InterPro:IPR000294"
|
41
|
+
/db_xref="InterPro:IPR002384"
|
42
|
+
/db_xref="PDB:1Q3M"
|
43
|
+
/db_xref="UniProtKB/Swiss-Prot:P02820"
|
44
|
+
ORIGIN
|
45
|
+
1 mrtpmllall alatlclagr adakpgdaes gkgaafvskq egsevvkrlr ryldhwlgap
|
46
|
+
61 apypdplepk revcelnpdc deladhigfq eayrrfygpv
|
47
|
+
//
|
48
|
+
|
@@ -0,0 +1,167 @@
|
|
1
|
+
LOCUS SCU49845 5028 bp DNA linear PLN 23-MAR-2010
|
2
|
+
DEFINITION Saccharomyces cerevisiae TCP1-beta gene, partial cds; and Axl2p
|
3
|
+
(AXL2) and Rev7p (REV7) genes, complete cds.
|
4
|
+
ACCESSION U49845
|
5
|
+
VERSION U49845.1 GI:1293613
|
6
|
+
KEYWORDS .
|
7
|
+
SOURCE Saccharomyces cerevisiae (baker's yeast)
|
8
|
+
ORGANISM Saccharomyces cerevisiae
|
9
|
+
Eukaryota; Fungi; Dikarya; Ascomycota; Saccharomyceta;
|
10
|
+
Saccharomycotina; Saccharomycetes; Saccharomycetales;
|
11
|
+
Saccharomycetaceae; Saccharomyces.
|
12
|
+
REFERENCE 1 (bases 1 to 5028)
|
13
|
+
AUTHORS Roemer,T., Madden,K., Chang,J. and Snyder,M.
|
14
|
+
TITLE Selection of axial growth sites in yeast requires Axl2p, a novel
|
15
|
+
plasma membrane glycoprotein
|
16
|
+
JOURNAL Genes Dev. 10 (7), 777-793 (1996)
|
17
|
+
PUBMED 8846915
|
18
|
+
REFERENCE 2 (bases 1 to 5028)
|
19
|
+
AUTHORS Roemer,T.
|
20
|
+
TITLE Direct Submission
|
21
|
+
JOURNAL Submitted (22-FEB-1996) Biology, Yale University, New Haven, CT
|
22
|
+
06520, USA
|
23
|
+
FEATURES Location/Qualifiers
|
24
|
+
source 1..5028
|
25
|
+
/organism="Saccharomyces cerevisiae"
|
26
|
+
/mol_type="genomic DNA"
|
27
|
+
/db_xref="taxon:4932"
|
28
|
+
/chromosome="IX"
|
29
|
+
mRNA <1..>206
|
30
|
+
/product="TCP1-beta"
|
31
|
+
CDS <1..206
|
32
|
+
/codon_start=3
|
33
|
+
/product="TCP1-beta"
|
34
|
+
/protein_id="AAA98665.1"
|
35
|
+
/db_xref="GI:1293614"
|
36
|
+
/translation="SSIYNGISTSGLDLNNGTIADMRQLGIVESYKLKRAVVSSASEA
|
37
|
+
AEVLLRVDNIIRARPRTANRQHM"
|
38
|
+
gene <687..>3158
|
39
|
+
/gene="AXL2"
|
40
|
+
mRNA <687..>3158
|
41
|
+
/gene="AXL2"
|
42
|
+
/product="Axl2p"
|
43
|
+
CDS 687..3158
|
44
|
+
/gene="AXL2"
|
45
|
+
/note="plasma membrane glycoprotein"
|
46
|
+
/codon_start=1
|
47
|
+
/product="Axl2p"
|
48
|
+
/protein_id="AAA98666.1"
|
49
|
+
/db_xref="GI:1293615"
|
50
|
+
/translation="MTQLQISLLLTATISLLHLVVATPYEAYPIGKQYPPVARVNESF
|
51
|
+
TFQISNDTYKSSVDKTAQITYNCFDLPSWLSFDSSSRTFSGEPSSDLLSDANTTLYFN
|
52
|
+
VILEGTDSADSTSLNNTYQFVVTNRPSISLSSDFNLLALLKNYGYTNGKNALKLDPNE
|
53
|
+
VFNVTFDRSMFTNEESIVSYYGRSQLYNAPLPNWLFFDSGELKFTGTAPVINSAIAPE
|
54
|
+
TSYSFVIIATDIEGFSAVEVEFELVIGAHQLTTSIQNSLIINVTDTGNVSYDLPLNYV
|
55
|
+
YLDDDPISSDKLGSINLLDAPDWVALDNATISGSVPDELLGKNSNPANFSVSIYDTYG
|
56
|
+
DVIYFNFEVVSTTDLFAISSLPNINATRGEWFSYYFLPSQFTDYVNTNVSLEFTNSSQ
|
57
|
+
DHDWVKFQSSNLTLAGEVPKNFDKLSLGLKANQGSQSQELYFNIIGMDSKITHSNHSA
|
58
|
+
NATSTRSSHHSTSTSSYTSSTYTAKISSTSAAATSSAPAALPAANKTSSHNKKAVAIA
|
59
|
+
CGVAIPLGVILVALICFLIFWRRRRENPDDENLPHAISGPDLNNPANKPNQENATPLN
|
60
|
+
NPFDDDASSYDDTSIARRLAALNTLKLDNHSATESDISSVDEKRDSLSGMNTYNDQFQ
|
61
|
+
SQSKEELLAKPPVQPPESPFFDPQNRSSSVYMDSEPAVNKSWRYTGNLSPVSDIVRDS
|
62
|
+
YGSQKTVDTEKLFDLEAPEKEKRTSRDVTMSSLDPWNSNISPSPVRKSVTPSPYNVTK
|
63
|
+
HRNRHLQNIQDSQSGKNGITPTTMSTSSSDDFVPVKDGENFCWVHSMEPDRRPSKKRL
|
64
|
+
VDFSNKSNVNVGQVKDIHGRIPEML"
|
65
|
+
gene complement(<3300..>4037)
|
66
|
+
/gene="REV7"
|
67
|
+
mRNA complement(<3300..>4037)
|
68
|
+
/gene="REV7"
|
69
|
+
/product="Rev7p"
|
70
|
+
CDS complement(3300..4037)
|
71
|
+
/gene="REV7"
|
72
|
+
/codon_start=1
|
73
|
+
/product="Rev7p"
|
74
|
+
/protein_id="AAA98667.1"
|
75
|
+
/db_xref="GI:1293616"
|
76
|
+
/translation="MNRWVEKWLRVYLKCYINLILFYRNVYPPQSFDYTTYQSFNLPQ
|
77
|
+
FVPINRHPALIDYIEELILDVLSKLTHVYRFSICIINKKNDLCIEKYVLDFSELQHVD
|
78
|
+
KDDQIITETEVFDEFRSSLNSLIMHLEKLPKVNDDTITFEAVINAIELELGHKLDRNR
|
79
|
+
RVDSLEEKAEIERDSNWVKCQEDENLPDNNGFQPPKIKLTSLVGSDVGPLIIHQFSEK
|
80
|
+
LISGDDKILNGVYSQYEEGESIFGSLF"
|
81
|
+
ORIGIN
|
82
|
+
1 gatcctccat atacaacggt atctccacct caggtttaga tctcaacaac ggaaccattg
|
83
|
+
61 ccgacatgag acagttaggt atcgtcgaga gttacaagct aaaacgagca gtagtcagct
|
84
|
+
121 ctgcatctga agccgctgaa gttctactaa gggtggataa catcatccgt gcaagaccaa
|
85
|
+
181 gaaccgccaa tagacaacat atgtaacata tttaggatat acctcgaaaa taataaaccg
|
86
|
+
241 ccacactgtc attattataa ttagaaacag aacgcaaaaa ttatccacta tataattcaa
|
87
|
+
301 agacgcgaaa aaaaaagaac aacgcgtcat agaacttttg gcaattcgcg tcacaaataa
|
88
|
+
361 attttggcaa cttatgtttc ctcttcgagc agtactcgag ccctgtctca agaatgtaat
|
89
|
+
421 aatacccatc gtaggtatgg ttaaagatag catctccaca acctcaaagc tccttgccga
|
90
|
+
481 gagtcgccct cctttgtcga gtaattttca cttttcatat gagaacttat tttcttattc
|
91
|
+
541 tttactctca catcctgtag tgattgacac tgcaacagcc accatcacta gaagaacaga
|
92
|
+
601 acaattactt aatagaaaaa ttatatcttc ctcgaaacga tttcctgctt ccaacatcta
|
93
|
+
661 cgtatatcaa gaagcattca cttaccatga cacagcttca gatttcatta ttgctgacag
|
94
|
+
721 ctactatatc actactccat ctagtagtgg ccacgcccta tgaggcatat cctatcggaa
|
95
|
+
781 aacaataccc cccagtggca agagtcaatg aatcgtttac atttcaaatt tccaatgata
|
96
|
+
841 cctataaatc gtctgtagac aagacagctc aaataacata caattgcttc gacttaccga
|
97
|
+
901 gctggctttc gtttgactct agttctagaa cgttctcagg tgaaccttct tctgacttac
|
98
|
+
961 tatctgatgc gaacaccacg ttgtatttca atgtaatact cgagggtacg gactctgccg
|
99
|
+
1021 acagcacgtc tttgaacaat acataccaat ttgttgttac aaaccgtcca tccatctcgc
|
100
|
+
1081 tatcgtcaga tttcaatcta ttggcgttgt taaaaaacta tggttatact aacggcaaaa
|
101
|
+
1141 acgctctgaa actagatcct aatgaagtct tcaacgtgac ttttgaccgt tcaatgttca
|
102
|
+
1201 ctaacgaaga atccattgtg tcgtattacg gacgttctca gttgtataat gcgccgttac
|
103
|
+
1261 ccaattggct gttcttcgat tctggcgagt tgaagtttac tgggacggca ccggtgataa
|
104
|
+
1321 actcggcgat tgctccagaa acaagctaca gttttgtcat catcgctaca gacattgaag
|
105
|
+
1381 gattttctgc cgttgaggta gaattcgaat tagtcatcgg ggctcaccag ttaactacct
|
106
|
+
1441 ctattcaaaa tagtttgata atcaacgtta ctgacacagg taacgtttca tatgacttac
|
107
|
+
1501 ctctaaacta tgtttatctc gatgacgatc ctatttcttc tgataaattg ggttctataa
|
108
|
+
1561 acttattgga tgctccagac tgggtggcat tagataatgc taccatttcc gggtctgtcc
|
109
|
+
1621 cagatgaatt actcggtaag aactccaatc ctgccaattt ttctgtgtcc atttatgata
|
110
|
+
1681 cttatggtga tgtgatttat ttcaacttcg aagttgtctc cacaacggat ttgtttgcca
|
111
|
+
1741 ttagttctct tcccaatatt aacgctacaa ggggtgaatg gttctcctac tattttttgc
|
112
|
+
1801 cttctcagtt tacagactac gtgaatacaa acgtttcatt agagtttact aattcaagcc
|
113
|
+
1861 aagaccatga ctgggtgaaa ttccaatcat ctaatttaac attagctgga gaagtgccca
|
114
|
+
1921 agaatttcga caagctttca ttaggtttga aagcgaacca aggttcacaa tctcaagagc
|
115
|
+
1981 tatattttaa catcattggc atggattcaa agataactca ctcaaaccac agtgcgaatg
|
116
|
+
2041 caacgtccac aagaagttct caccactcca cctcaacaag ttcttacaca tcttctactt
|
117
|
+
2101 acactgcaaa aatttcttct acctccgctg ctgctacttc ttctgctcca gcagcgctgc
|
118
|
+
2161 cagcagccaa taaaacttca tctcacaata aaaaagcagt agcaattgcg tgcggtgttg
|
119
|
+
2221 ctatcccatt aggcgttatc ctagtagctc tcatttgctt cctaatattc tggagacgca
|
120
|
+
2281 gaagggaaaa tccagacgat gaaaacttac cgcatgctat tagtggacct gatttgaata
|
121
|
+
2341 atcctgcaaa taaaccaaat caagaaaacg ctacaccttt gaacaacccc tttgatgatg
|
122
|
+
2401 atgcttcctc gtacgatgat acttcaatag caagaagatt ggctgctttg aacactttga
|
123
|
+
2461 aattggataa ccactctgcc actgaatctg atatttccag cgtggatgaa aagagagatt
|
124
|
+
2521 ctctatcagg tatgaataca tacaatgatc agttccaatc ccaaagtaaa gaagaattat
|
125
|
+
2581 tagcaaaacc cccagtacag cctccagaga gcccgttctt tgacccacag aataggtctt
|
126
|
+
2641 cttctgtgta tatggatagt gaaccagcag taaataaatc ctggcgatat actggcaacc
|
127
|
+
2701 tgtcaccagt ctctgatatt gtcagagaca gttacggatc acaaaaaact gttgatacag
|
128
|
+
2761 aaaaactttt cgatttagaa gcaccagaga aggaaaaacg tacgtcaagg gatgtcacta
|
129
|
+
2821 tgtcttcact ggacccttgg aacagcaata ttagcccttc tcccgtaaga aaatcagtaa
|
130
|
+
2881 caccatcacc atataacgta acgaagcatc gtaaccgcca cttacaaaat attcaagact
|
131
|
+
2941 ctcaaagcgg taaaaacgga atcactccca caacaatgtc aacttcatct tctgacgatt
|
132
|
+
3001 ttgttccggt taaagatggt gaaaattttt gctgggtcca tagcatggaa ccagacagaa
|
133
|
+
3061 gaccaagtaa gaaaaggtta gtagattttt caaataagag taatgtcaat gttggtcaag
|
134
|
+
3121 ttaaggacat tcacggacgc atcccagaaa tgctgtgatt atacgcaacg atattttgct
|
135
|
+
3181 taattttatt ttcctgtttt attttttatt agtggtttac agatacccta tattttattt
|
136
|
+
3241 agtttttata cttagagaca tttaatttta attccattct tcaaatttca tttttgcact
|
137
|
+
3301 taaaacaaag atccaaaaat gctctcgccc tcttcatatt gagaatacac tccattcaaa
|
138
|
+
3361 attttgtcgt caccgctgat taatttttca ctaaactgat gaataatcaa aggccccacg
|
139
|
+
3421 tcagaaccga ctaaagaagt gagttttatt ttaggaggtt gaaaaccatt attgtctggt
|
140
|
+
3481 aaattttcat cttcttgaca tttaacccag tttgaatccc tttcaatttc tgctttttcc
|
141
|
+
3541 tccaaactat cgaccctcct gtttctgtcc aacttatgtc ctagttccaa ttcgatcgca
|
142
|
+
3601 ttaataactg cttcaaatgt tattgtgtca tcgttgactt taggtaattt ctccaaatgc
|
143
|
+
3661 ataatcaaac tatttaagga agatcggaat tcgtcgaaca cttcagtttc cgtaatgatc
|
144
|
+
3721 tgatcgtctt tatccacatg ttgtaattca ctaaaatcta aaacgtattt ttcaatgcat
|
145
|
+
3781 aaatcgttct ttttattaat aatgcagatg gaaaatctgt aaacgtgcgt taatttagaa
|
146
|
+
3841 agaacatcca gtataagttc ttctatatag tcaattaaag caggatgcct attaatggga
|
147
|
+
3901 acgaactgcg gcaagttgaa tgactggtaa gtagtgtagt cgaatgactg aggtgggtat
|
148
|
+
3961 acatttctat aaaataaaat caaattaatg tagcatttta agtataccct cagccacttc
|
149
|
+
4021 tctacccatc tattcataaa gctgacgcaa cgattactat tttttttttc ttcttggatc
|
150
|
+
4081 tcagtcgtcg caaaaacgta taccttcttt ttccgacctt ttttttagct ttctggaaaa
|
151
|
+
4141 gtttatatta gttaaacagg gtctagtctt agtgtgaaag ctagtggttt cgattgactg
|
152
|
+
4201 atattaagaa agtggaaatt aaattagtag tgtagacgta tatgcatatg tatttctcgc
|
153
|
+
4261 ctgtttatgt ttctacgtac ttttgattta tagcaagggg aaaagaaata catactattt
|
154
|
+
4321 tttggtaaag gtgaaagcat aatgtaaaag ctagaataaa atggacgaaa taaagagagg
|
155
|
+
4381 cttagttcat cttttttcca aaaagcaccc aatgataata actaaaatga aaaggatttg
|
156
|
+
4441 ccatctgtca gcaacatcag ttgtgtgagc aataataaaa tcatcacctc cgttgccttt
|
157
|
+
4501 agcgcgtttg tcgtttgtat cttccgtaat tttagtctta tcaatgggaa tcataaattt
|
158
|
+
4561 tccaatgaat tagcaatttc gtccaattct ttttgagctt cttcatattt gctttggaat
|
159
|
+
4621 tcttcgcact tcttttccca ttcatctctt tcttcttcca aagcaacgat ccttctaccc
|
160
|
+
4681 atttgctcag agttcaaatc ggcctctttc agtttatcca ttgcttcctt cagtttggct
|
161
|
+
4741 tcactgtctt ctagctgttg ttctagatcc tggtttttct tggtgtagtt ctcattatta
|
162
|
+
4801 gatctcaagt tattggagtc ttcagccaat tgctttgtat cagacaattg actctctaac
|
163
|
+
4861 ttctccactt cactgtcgag ttgctcgttt ttagcggaca aagatttaat ctcgttttct
|
164
|
+
4921 ttttcagtgt tagattgctc taattctttg agctgttctc tcagctcctc atatttttct
|
165
|
+
4981 tgccatgact cagattctaa ttttaagcta ttcaatttct ctttgatc
|
166
|
+
//
|
167
|
+
|
@@ -0,0 +1,13 @@
|
|
1
|
+
CODE 1717226
|
2
|
+
TITLE Characterization of an Escherichia coli gene encoding
|
3
|
+
betaine aldehyde dehydrogenase (BADH). Structural similarity
|
4
|
+
to mammalian ALDHs and a plant BADH.
|
5
|
+
FIELD q (sequence analysis)
|
6
|
+
JOURNAL Gene
|
7
|
+
VOLUME Vol.103, No.1, 45-52 (1991)
|
8
|
+
KEYWORD *Betaine Aldehyde Dehydrogenase;;*betB Gene;E.coli;;
|
9
|
+
Seq Determination;1854bp;491AAs;;Hydropathy Plot;*EC1.2.1.8;;
|
10
|
+
Seq Comparison
|
11
|
+
AUTHOR Boyd,L.A.;Adam,L.;Pelcher,L.E.;McHughen,A.;Hirji,R.;
|
12
|
+
Selvaraj,G.
|
13
|
+
END
|
@@ -0,0 +1,93 @@
|
|
1
|
+
#
|
2
|
+
# = test/functional/bio/appl/blast/test_remote.rb - Unit test for Bio::Blast::Remote::Genomenet and Bio::Blast::Remote::DDBJ with network connection
|
3
|
+
#
|
4
|
+
# Copyright:: Copyright (C) 2011
|
5
|
+
# Naohisa Goto <ng@bioruby.org>
|
6
|
+
# License:: The Ruby License
|
7
|
+
#
|
8
|
+
|
9
|
+
# loading helper routine for testing bioruby
|
10
|
+
require 'pathname'
|
11
|
+
load Pathname.new(File.join(File.dirname(__FILE__), ['..'] * 4,
|
12
|
+
'bioruby_test_helper.rb')).cleanpath.to_s
|
13
|
+
|
14
|
+
# libraries needed for the tests
|
15
|
+
require 'test/unit'
|
16
|
+
require 'bio/sequence'
|
17
|
+
require 'bio/appl/blast'
|
18
|
+
|
19
|
+
module Bio
|
20
|
+
module FuncTestBlastRemote
|
21
|
+
|
22
|
+
module NetTestBlastRemoteCommon
|
23
|
+
|
24
|
+
Programs = %w( blastn tblastn tblastx blastp blastx ).freeze
|
25
|
+
Programs.each { |x| x.freeze }
|
26
|
+
|
27
|
+
def test_databases
|
28
|
+
Programs.each do |prog|
|
29
|
+
databases = nil
|
30
|
+
assert_nothing_raised {
|
31
|
+
databases = @klass.databases(prog)
|
32
|
+
}
|
33
|
+
assert_kind_of(Array, databases, "wrong data type for #{prog}")
|
34
|
+
assert(!databases.empty?, "no database found for #{prog}")
|
35
|
+
end
|
36
|
+
end
|
37
|
+
|
38
|
+
# sampling test for blastn database
|
39
|
+
def test_databases_blastn
|
40
|
+
databases = @klass.databases("blastn")
|
41
|
+
self.class::BLASTN_DBNAME_KEYWORDS.each do |re|
|
42
|
+
assert(databases.find { |x| re =~ x })
|
43
|
+
end
|
44
|
+
end
|
45
|
+
|
46
|
+
# sampling test for blastp database
|
47
|
+
def test_databases_blastp
|
48
|
+
databases = @klass.databases("blastp")
|
49
|
+
self.class::BLASTP_DBNAME_KEYWORDS.each do |re|
|
50
|
+
assert(databases.find { |x| re =~ x })
|
51
|
+
end
|
52
|
+
end
|
53
|
+
|
54
|
+
def test_database_description
|
55
|
+
Programs.each do |prog|
|
56
|
+
@klass.databases(prog).each do |db|
|
57
|
+
assert_kind_of(String, @klass.database_description(prog, db))
|
58
|
+
end
|
59
|
+
end
|
60
|
+
end
|
61
|
+
end #module NetTestBlastRemoteCommon
|
62
|
+
|
63
|
+
# This test class only contains tests for meta information.
|
64
|
+
# BLAST execution tests are written in ../test_blast.rb
|
65
|
+
class NetTestBlastRemoteGenomeNet < Test::Unit::TestCase
|
66
|
+
|
67
|
+
include NetTestBlastRemoteCommon
|
68
|
+
|
69
|
+
BLASTN_DBNAME_KEYWORDS = [ /genes/, /nt/ ]
|
70
|
+
BLASTP_DBNAME_KEYWORDS = [ /genes/, /uniprot/, /nr/ ]
|
71
|
+
|
72
|
+
def setup
|
73
|
+
@klass = Bio::Blast::Remote::GenomeNet
|
74
|
+
end
|
75
|
+
end #class NetTestBlastRemoteGenomeNet
|
76
|
+
|
77
|
+
# This test class only contains tests for meta information.
|
78
|
+
# BLAST execution tests are written in ../test_blast.rb
|
79
|
+
class NetTestBlastRemoteDDBJ < Test::Unit::TestCase
|
80
|
+
|
81
|
+
include NetTestBlastRemoteCommon
|
82
|
+
|
83
|
+
BLASTN_DBNAME_KEYWORDS = [ /ddbj/i, /nt/i ]
|
84
|
+
BLASTP_DBNAME_KEYWORDS = [ /uniprot/i, /pdb/i ]
|
85
|
+
|
86
|
+
def setup
|
87
|
+
@klass = Bio::Blast::Remote::DDBJ
|
88
|
+
end
|
89
|
+
end #class NetTestBlastRemoteDDBJ
|
90
|
+
|
91
|
+
end #module FuncTestBlastRemote
|
92
|
+
end #module Bio
|
93
|
+
|
@@ -0,0 +1,61 @@
|
|
1
|
+
#
|
2
|
+
# = test/functional/bio/appl/test_blast.rb - Unit test for Bio::Blast with network connection
|
3
|
+
#
|
4
|
+
# Copyright:: Copyright (C) 2011
|
5
|
+
# Naohisa Goto <ng@bioruby.org>
|
6
|
+
# License:: The Ruby License
|
7
|
+
#
|
8
|
+
|
9
|
+
# loading helper routine for testing bioruby
|
10
|
+
require 'pathname'
|
11
|
+
load Pathname.new(File.join(File.dirname(__FILE__), ['..'] * 3,
|
12
|
+
'bioruby_test_helper.rb')).cleanpath.to_s
|
13
|
+
|
14
|
+
# libraries needed for the tests
|
15
|
+
require 'test/unit'
|
16
|
+
require 'bio/sequence'
|
17
|
+
require 'bio/appl/blast'
|
18
|
+
|
19
|
+
module Bio
|
20
|
+
module FunctTestBlast
|
21
|
+
|
22
|
+
module NetTestBlastCommonProteinQuery
|
23
|
+
filename = File.join(BioRubyTestDataPath, 'fasta', 'EFTU_BACSU.fasta')
|
24
|
+
QuerySequence = File.read(filename).freeze
|
25
|
+
|
26
|
+
def test_query
|
27
|
+
report = nil
|
28
|
+
assert_nothing_raised {
|
29
|
+
report = @blast.query(QuerySequence)
|
30
|
+
}
|
31
|
+
assert(report.hits.size > 0)
|
32
|
+
end
|
33
|
+
end #module NetTestBlastCommonProteinQuery
|
34
|
+
|
35
|
+
class NetTestBlast_GenomeNet < Test::Unit::TestCase
|
36
|
+
include NetTestBlastCommonProteinQuery
|
37
|
+
|
38
|
+
def setup
|
39
|
+
@blast = Bio::Blast.new('blastp', 'mine-aa eco',
|
40
|
+
[ '-e', '1e-10',
|
41
|
+
'-v', '10',
|
42
|
+
'-b', '10' ],
|
43
|
+
'genomenet')
|
44
|
+
end
|
45
|
+
end #class NetTestBlast_GenomeNet
|
46
|
+
|
47
|
+
class NetTestBlast_DDBJ < Test::Unit::TestCase
|
48
|
+
include NetTestBlastCommonProteinQuery
|
49
|
+
|
50
|
+
def setup
|
51
|
+
@blast = Bio::Blast.new('blastp', 'SWISS',
|
52
|
+
['-e', '1e-10',
|
53
|
+
'-v', '10',
|
54
|
+
'-b', '10' ],
|
55
|
+
'ddbj')
|
56
|
+
end
|
57
|
+
end #class NetTestBlast_DDBJ
|
58
|
+
|
59
|
+
end #module FuncTestBlast
|
60
|
+
end #module Bio
|
61
|
+
|
@@ -0,0 +1,47 @@
|
|
1
|
+
#
|
2
|
+
# test/functional/bio/io/test_ddbjrest.rb - Functional test for Bio::DDBJ::REST
|
3
|
+
#
|
4
|
+
# Copyright:: Copyright (C) 2011
|
5
|
+
# Naohisa Goto <ng@bioruby.org>
|
6
|
+
# License:: The Ruby License
|
7
|
+
#
|
8
|
+
|
9
|
+
# loading helper routine for testing bioruby
|
10
|
+
require 'pathname'
|
11
|
+
load Pathname.new(File.join(File.dirname(__FILE__), ['..'] * 3,
|
12
|
+
'bioruby_test_helper.rb')).cleanpath.to_s
|
13
|
+
|
14
|
+
# libraries needed for the tests
|
15
|
+
require 'bio/io/ddbjrest'
|
16
|
+
require 'test/unit'
|
17
|
+
|
18
|
+
module Bio
|
19
|
+
module NetTestDDBJREST
|
20
|
+
|
21
|
+
class TestDDBJ < Test::Unit::TestCase
|
22
|
+
|
23
|
+
def setup
|
24
|
+
@obj = Bio::DDBJ::REST::DDBJ.new
|
25
|
+
end
|
26
|
+
|
27
|
+
def test_countBasePair
|
28
|
+
text = @obj.countBasePair("AF237819")
|
29
|
+
expected = {
|
30
|
+
"a" => 47,
|
31
|
+
"t" => 38,
|
32
|
+
"g" => 48,
|
33
|
+
"c" => 38
|
34
|
+
}
|
35
|
+
h = {}
|
36
|
+
text.each_line do |line|
|
37
|
+
base, count, percent = line.split(/\t/)
|
38
|
+
count = count.to_i
|
39
|
+
h[base] = count if count > 0
|
40
|
+
end
|
41
|
+
assert_equal(expected, h)
|
42
|
+
end
|
43
|
+
|
44
|
+
end #class TestDDBJ
|
45
|
+
|
46
|
+
end #module NetTestDDBJREST
|
47
|
+
end #module Bio
|