swissparser 0.5.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/History.txt +8 -0
- data/LICENSE +675 -0
- data/README.txt +32 -0
- data/Rakefile +23 -0
- data/examples/data/EColPositives_noTAT.bas +520 -0
- data/examples/data/kegg_enzyme_short.txt +881 -0
- data/examples/data/uniprot.txt +2855 -0
- data/examples/kegg_demo.rb +103 -0
- data/examples/signal_demo.rb +100 -0
- data/examples/uniprot_demo.rb +83 -0
- data/lib/swiss_parser.rb +214 -0
- metadata +76 -0
data/README.txt
ADDED
@@ -0,0 +1,32 @@
|
|
1
|
+
= SwissParser
|
2
|
+
by Paradigmatic
|
3
|
+
http://github.com/paradigmatic/SwissParser
|
4
|
+
|
5
|
+
== DESCRIPTION:
|
6
|
+
|
7
|
+
Simple DSL to define parsers for flat-file formats common in bioinformatics.
|
8
|
+
|
9
|
+
== FEATURES:
|
10
|
+
|
11
|
+
* Defines parsers with a declarative syntax.
|
12
|
+
* The whole parsing workflow is configurable.
|
13
|
+
* The user can create new parsers by extending existing parsers.
|
14
|
+
|
15
|
+
== SYNOPSIS:
|
16
|
+
|
17
|
+
See examples
|
18
|
+
|
19
|
+
== REQUIREMENTS:
|
20
|
+
|
21
|
+
Only pure standard Ruby. Tested with version 1.8.7 only, but should work with JRuby and others.
|
22
|
+
|
23
|
+
If you want to participate in SwissParser development, you will need the gem *bones*.
|
24
|
+
|
25
|
+
== INSTALL:
|
26
|
+
|
27
|
+
Soon available as a gem...
|
28
|
+
|
29
|
+
== LICENSE:
|
30
|
+
|
31
|
+
Distributed under GPLv3. See included LICENSE file.
|
32
|
+
|
data/Rakefile
ADDED
@@ -0,0 +1,23 @@
|
|
1
|
+
begin
|
2
|
+
require 'bones'
|
3
|
+
rescue LoadError
|
4
|
+
abort '### Please install the "bones" gem ###'
|
5
|
+
end
|
6
|
+
|
7
|
+
ensure_in_path 'lib'
|
8
|
+
require 'swiss_parser'
|
9
|
+
|
10
|
+
#task :default => 'test:run'
|
11
|
+
#task 'gem:release' => 'test:run'
|
12
|
+
|
13
|
+
Bones {
|
14
|
+
name 'swissparser'
|
15
|
+
authors 'paradigmatic'
|
16
|
+
email 'paradigmatic@streum.org'
|
17
|
+
url 'http://github.com/paradigmatic/SwissParser'
|
18
|
+
version Swiss::VERSION
|
19
|
+
ignore_file '.gitignore'
|
20
|
+
rdoc.exclude ["examples/data"]
|
21
|
+
}
|
22
|
+
|
23
|
+
# EOF
|
@@ -0,0 +1,520 @@
|
|
1
|
+
N Serine protease espP precursor
|
2
|
+
T SIG
|
3
|
+
C 55
|
4
|
+
S MNKIYSLKYSHITGGLIAVSELSGRVSSRATGKKKHKRILALCFLGLLQSYSFASQMDISNFYIRDYMDF
|
5
|
+
/
|
6
|
+
N Serine protease pet precursor
|
7
|
+
T SIG
|
8
|
+
C 52
|
9
|
+
S MNKIYSIKYSAATGGLIAVSELAKKVICKTNRKISAALLSLAVISYTNIIAANMDISKAWARDYLDLAQN
|
10
|
+
/
|
11
|
+
N Hemoglobin-binding protease hbp precursor
|
12
|
+
T SIG
|
13
|
+
C 52
|
14
|
+
S MNRIYSLRYSAVARGFIAVSEFARKCVHKSVRRLCFPVLLLIPVLFSAGSAGTVNNELGYQLFRDFAENK
|
15
|
+
/
|
16
|
+
N Alkaline phosphatase precursor
|
17
|
+
T SIG
|
18
|
+
C 21
|
19
|
+
S MKQSTIALALLPLLFTPVTKARTPEMPVLENRAAQGDITAPGGARRLTGDTAALRDSLSDKPAKNIILLI
|
20
|
+
/
|
21
|
+
N L-asparaginase 2 precursor
|
22
|
+
T SIG
|
23
|
+
C 22
|
24
|
+
S MEFFKKTALAALVMGFSGAALALPNITILATGGTIAGGGDSATKSNYTVGVGVENLVNAVPQLKDIANVK
|
25
|
+
/
|
26
|
+
N Beta-lactamase precursor
|
27
|
+
T SIG
|
28
|
+
C 19
|
29
|
+
S MFKTTLCALLITASCSTFAAPQQINDIVHRTITPLIEQQKIPGMAVAVIYGKPYYFTWGYADIAKKQPVT
|
30
|
+
/
|
31
|
+
N L-arabinose-binding periplasmic protein precursor
|
32
|
+
T SIG
|
33
|
+
C 23
|
34
|
+
S MHKFTKALAAIGLAAVMSQSAMAENLKLGFLVKQPEEPWFQTEWKFADKAKDLGFEVIKIAVPDGEKTLN
|
35
|
+
/
|
36
|
+
N D-ribose-binding periplasmic protein precursor
|
37
|
+
T SIG
|
38
|
+
C 25
|
39
|
+
S MNMKKLATLVSAVALSATVSANAMAKDTIALVVSTLNNPFFVSLKDGAQKADKLGYNLVVLDSQNNPAKE
|
40
|
+
/
|
41
|
+
N Outer membrane protein tolC precursor
|
42
|
+
T SIG
|
43
|
+
C 22
|
44
|
+
S MKKLLPILIGLSLSGFSSLSQAENLMQVYQQARLSNPELRKSAADRDAAFKINEARSPLLPQLGLGADYT
|
45
|
+
/
|
46
|
+
N Maltoporin precursor
|
47
|
+
T SIG
|
48
|
+
C 25
|
49
|
+
S MMITLRKLPLAVAVAAGVMSAQAMAVDFHGYARSGIGWTGSGGEQQCFQTGAQSKYRLGNECETYAELKL
|
50
|
+
/
|
51
|
+
N K88 fimbrial protein AB precursor
|
52
|
+
T SIG
|
53
|
+
C 21
|
54
|
+
S MKKTLIALAIAASAASGMAHAWMTGDFNGSVDIGGSITADDYRQKWEWKVTGLNGFGNVLNDLTNGGTKL
|
55
|
+
/
|
56
|
+
N CFA/I fimbrial subunit B precursor
|
57
|
+
T SIG
|
58
|
+
C 23
|
59
|
+
S MKFKKTIGAMALTTMFVAVSASAVEKNITVTASVDPVIDLLQADGNALPSVKLAYSPASKTFESYRVMTQ
|
60
|
+
/
|
61
|
+
N Pap fimbrial major pilin protein precursor
|
62
|
+
T SIG
|
63
|
+
C 22
|
64
|
+
S MIKSVIAGAVAMAVVSFGVNNAAPTIPQGQGKVTFNGTVVDAPCSISQKSDQSIDFGQLSKSFLEAGGVS
|
65
|
+
/
|
66
|
+
N Lipoprotein 28 precursor
|
67
|
+
T SIG
|
68
|
+
C 23
|
69
|
+
S MKLTTHHLRTGAALLLAGILLAGCDQSSSDAKHIKVGVINGAEQDVAEVAKVAKEKYGLDVELVGFSGSL
|
70
|
+
/
|
71
|
+
N Protease 3 precursor
|
72
|
+
T SIG
|
73
|
+
C 23
|
74
|
+
S MPRSTWFKALLLLVALWAPLSQAETGWQPIQETIRKSDKDNRQYQAIRLDGMVVLLVSDPQAVKSLSALV
|
75
|
+
/
|
76
|
+
N M-agglutinin precursor
|
77
|
+
T SIG
|
78
|
+
C 24
|
79
|
+
S MNLKKIAIASSVFAGITMALTCHAVTVTATHTVESDAEFTIDWVDAGPTTDAKDGEVWGHLDMTQTRGTP
|
80
|
+
/
|
81
|
+
N Ferrienterobactin receptor precursor
|
82
|
+
T SIG
|
83
|
+
C 22
|
84
|
+
S MNKKIHSLALLVNLGIYGVAQAQEPTDTPVSHDDTIVVTAAEQNLQAPGVTITADEIRKNPVARDVSKII
|
85
|
+
/
|
86
|
+
N Penicillin G acylase precursor
|
87
|
+
T SIG
|
88
|
+
C 26
|
89
|
+
S MKNRNRMIVNCVTASLMYYWSLPALAEQSSSEIKIVRDEYGMPHIYANDTHLFYGYGYVVAQDRLFQMEM
|
90
|
+
/
|
91
|
+
N Outer membrane usher protein faeD precursor
|
92
|
+
T SIG
|
93
|
+
C 35
|
94
|
+
S MKKYVTTKSVQPVAFRLTTLSLVMSAVLGSASVIAGEKLDMSFIQGGGGVPEVWAALNGSYAPGRYLVDL
|
95
|
+
/
|
96
|
+
N Ferrichrome-iron receptor precursor
|
97
|
+
T SIG
|
98
|
+
C 33
|
99
|
+
S MARSKTAQPKHSLRKIAVVVATAVSGMSVYAQAAVEPKEDTITVTAAPAPESAWGPAATIAARQSATGTK
|
100
|
+
/
|
101
|
+
N Outer membrane protein C precursor
|
102
|
+
T SIG
|
103
|
+
C 21
|
104
|
+
S MKVKVLSLLVPALLVAGAANAAEVYNKDGNKLDLYGKVDGLHYFSDNKDVGDQTYMRLGFKGETQVTDQL
|
105
|
+
/
|
106
|
+
N Protein ushA precursor
|
107
|
+
T SIG
|
108
|
+
C 25
|
109
|
+
S MKLLQRGVALALLTTFTLASETALAYEQDKTYKITVLHTNDHHGHFWRNEGEYGLAAQKTLVDGIRKEVA
|
110
|
+
/
|
111
|
+
N Outer membrane usher protein papC precursor
|
112
|
+
T SIG
|
113
|
+
C 24
|
114
|
+
S MKDRIPFAVNNITCVILLSLFCNAASAVEFNTDVLDAADKKNIDFTRFSEGYVLPGQYLLDVIVNGQSIS
|
115
|
+
/
|
116
|
+
N PAP fimbrial minor pilin protein precursor
|
117
|
+
T SIG
|
118
|
+
C 22
|
119
|
+
S MRLRFSVPLFFFGCVFVHGVFAGPFPPPGMSLPEYWGEEHVWWDGRAAFHEVVRPACTLAMEDAWQIIDM
|
120
|
+
/
|
121
|
+
N Ferrichrome-binding periplasmic protein precursor
|
122
|
+
T SIG
|
123
|
+
C 30
|
124
|
+
S MSGLPLISRRRLLTAMALSPLLWQMNTAHAAAIDPNRIVALEWLPVELLLLGIVPYGVADTINYRLWVSE
|
125
|
+
/
|
126
|
+
N Heat-stable enterotoxin A3/A4 precursor
|
127
|
+
T SIG
|
128
|
+
C 19
|
129
|
+
S MKKSILFIFLSVLSFSPFAQDAKPVESSKEKITLESKKCNIAKKSNKSGPSMNSSNYCCELCCNPACTGC
|
130
|
+
/
|
131
|
+
N Protease 7 precursor
|
132
|
+
T SIG
|
133
|
+
C 20
|
134
|
+
S MRAKLLGIVLTTPIAISSFASTETLSFTPDNINADISLGTLSGKTKERVYAEEGGRKVSQLDWKFNNAAI
|
135
|
+
/
|
136
|
+
N Glycerophosphoryl diester phosphodiesterase precursor
|
137
|
+
T SIG
|
138
|
+
C 25
|
139
|
+
S MKLTLKNLSMAIMMSTIVMGSSAMAADSNEKIVIAHRGASGYLPEHTLPAAMAYAQGADYLEQDLVMTKD
|
140
|
+
/
|
141
|
+
N Lysine-arginine-ornithine-binding periplasmic protein precursor
|
142
|
+
T SIG
|
143
|
+
C 22
|
144
|
+
S MKKSILALSLLVGLSTAASSYAALPETVRIGTDTTYAPFSSKDAKGDFVGDIDLGNEMCKRMQVKCTWVA
|
145
|
+
/
|
146
|
+
N Protein ybiS precursor
|
147
|
+
T SIG
|
148
|
+
C 24
|
149
|
+
S MNMKLKTLFAAAFAVVGFCSTASAVTYPLPTDGSRLVGQNQVITIPEGNTPLEYFAAEYQMGLSNMMEAN
|
150
|
+
/
|
151
|
+
N Rare lipoprotein A precursor
|
152
|
+
T SIG
|
153
|
+
C 17
|
154
|
+
S MRKQWLGICIAAGMLAACTSDDGQQQTVSVPQPAVCNGPIVEISGADPRFPLNATANQDYQRDGKSYKIV
|
155
|
+
/
|
156
|
+
N Long-chain fatty acid transport protein precursor
|
157
|
+
T SIG
|
158
|
+
C 27
|
159
|
+
S MVMSQKTLFTKSALAVAVALISTQAWSAGFQLNEFSSSGLGRAYSGEGAIDDAGNVSRNPALITMFDRPT
|
160
|
+
/
|
161
|
+
N F17 fimbrial protein precursor
|
162
|
+
T SIG
|
163
|
+
C 21
|
164
|
+
S MQKIQFILGILAAASSSATLAYDGKITFNGKVVDQTCSVTTESKNLTVKLTVSANSLASSGKVVGLTPFT
|
165
|
+
/
|
166
|
+
N F41 fimbrial protein precursor
|
167
|
+
T SIG
|
168
|
+
C 22
|
169
|
+
S MKKTLIALAVAASAAVSGSVMAADWTEGQPGDIIIGGEITSPSVKWLWKTEGLSSFSNTTNEIVKRKLNI
|
170
|
+
/
|
171
|
+
N S-fimbrial adhesin protein sfaS precursor
|
172
|
+
T SIG
|
173
|
+
C 22
|
174
|
+
S MKLKAIILATGLINCIAFSAQAVDTTITVTGNVLQRTCNVPGNVDVSLGNYVSDFPNAGSGSPWVNFDLS
|
175
|
+
/
|
176
|
+
N Periplasmic trehalase precursor
|
177
|
+
T SIG
|
178
|
+
C 30
|
179
|
+
S MKSPAPSRPQKMALIPACIFLCFAALSVQAEETPVTPQPPDILLGPLFNDQNAKLFPDQKTFADAVPNSD
|
180
|
+
/
|
181
|
+
N Fimbrial adhesin papG precursor
|
182
|
+
T SIG
|
183
|
+
C 21
|
184
|
+
S MKKWFPAFLFLSLSGGNDALAGWHNVMFYAFNDYLTTNAGNVKVIDQPQLIPWNTGSATATYYSCSGPEF
|
185
|
+
/
|
186
|
+
N Heat-labile enterotoxin IIA, A chain precursor
|
187
|
+
T SIG
|
188
|
+
C 18
|
189
|
+
S MIKHVLLFFVFISFSVSANDFFRADSRTPDEIRRAGGLLPRGQQEAYERGPININLYEHARGTVTGNTRY
|
190
|
+
/
|
191
|
+
N Heat-labile enterotoxin B chain precursor
|
192
|
+
T SIG
|
193
|
+
C 21
|
194
|
+
S MNKVKFYVLFTALLSSLCAHGAPQSITELCSEYHNTQIYTINDKILSYTEMAGKREMVIITFKSGATFQV
|
195
|
+
/
|
196
|
+
N Heat-labile enterotoxin IIA, B chain precursor
|
197
|
+
T SIG
|
198
|
+
C 19
|
199
|
+
S MSSKKIIGAFVLMTGILSGQVYAGVSEHFRNICNQTTADIVAGVQLKKYIDVNTNTRGIYVVSNTGGVWY
|
200
|
+
/
|
201
|
+
N K88 fimbrial protein AC precursor
|
202
|
+
T SIG
|
203
|
+
C 21
|
204
|
+
S MKKTLIALAIAASAASGMAHAWMTGDFNGSVDIGGSITADDYRQKWEWKVTGLNGFGNVLNDLTNGGTKL
|
205
|
+
/
|
206
|
+
N K88 fimbrial protein AD precursor
|
207
|
+
T SIG
|
208
|
+
C 21
|
209
|
+
S MKKTLIALAIAASAASGMAHAWMTGDFNGSVDIGGSITADDYRQKWEWKVTGLNGFGNVLNDLTNGGTKL
|
210
|
+
/
|
211
|
+
N Ferric aerobactin receptor precursor
|
212
|
+
T SIG
|
213
|
+
C 25
|
214
|
+
S MMISKKYTLWALNPLLLTMMAPAVAQQTDDETFVVSANRSNRTVAEMAQTWVIENAELEQQIQGGKELKD
|
215
|
+
/
|
216
|
+
N TraT complement resistance protein precursor
|
217
|
+
T SIG
|
218
|
+
C 20
|
219
|
+
S MKTKKLMMVALVSSTLALSGCGAMSTAIKKRNLEVKTQMSETIWLEPASETVFLQIKNTSDKDMSGLQGK
|
220
|
+
/
|
221
|
+
N CS3 fimbrial subunit A precursor
|
222
|
+
T SIG
|
223
|
+
C 22
|
224
|
+
S MLKIKYLLIGLSLSAMSSYSLAAAGPTLTKELALNVLSPAALDATWAPQDLTLSNTGVSNTLVGVLTLSN
|
225
|
+
/
|
226
|
+
N Thiosulfate-binding protein precursor
|
227
|
+
T SIG
|
228
|
+
C 25
|
229
|
+
S MAVNLLKKNSLALVASLLLAGHVQATELLNSSYDVSRELFAALNPPFEQQAKDNGGDKLTIKQSHAGSSK
|
230
|
+
/
|
231
|
+
N Colicin I receptor precursor
|
232
|
+
T SIG
|
233
|
+
C 25
|
234
|
+
S MFRLNPFVRVGLCLSAISCAWPVLAVDDDGETMVVTASSVEQNLKDAPASSVITQEDLQRKPVQNLKDVL
|
235
|
+
/
|
236
|
+
N Protein papJ precursor
|
237
|
+
T SIG
|
238
|
+
C 27
|
239
|
+
S MVVNKTTAVLYLIALSLSGFIHTFLRAEERGIYDDVFTADALRHYRINERGRTGSLTCSGALLSSPCTLV
|
240
|
+
/
|
241
|
+
N K99 fimbrial protein precursor
|
242
|
+
T SIG
|
243
|
+
C 22
|
244
|
+
S MKKTLLAIILGGMAFATTNASANTGTINFNGKITSATCTIDPEVNGNRTSIDLGQAAISGHGTVVDFKLK
|
245
|
+
/
|
246
|
+
N Periplasmic protein trbC precursor
|
247
|
+
T SIG
|
248
|
+
C 21
|
249
|
+
S MKLSMKSLAALLMMLNGAVMASENVNTPENRQFLKQQENLSRQLREKPDHLKAWAEKQVLENPLQRSDNH
|
250
|
+
/
|
251
|
+
N Glucose-1-phosphatase precursor
|
252
|
+
T SIG
|
253
|
+
C 22
|
254
|
+
S MNKTLIAAAVAGIVLLASNAQAQTVPEGYQLQQVLMMSRHNLRAPLANNGVLEQSTPNKWPEWDVPGGQL
|
255
|
+
/
|
256
|
+
N Protein fanG precursor
|
257
|
+
T SIG
|
258
|
+
C 21
|
259
|
+
S MKKLYKAITVICILMSNLQSAQGATKSVQVPIRTEVKIPTCQLEIDSSIDSFVKIEDIISSRATSKEANL
|
260
|
+
/
|
261
|
+
N Protein fanH precursor
|
262
|
+
T SIG
|
263
|
+
C 20
|
264
|
+
S MIKKVPVLLFFMASISITHASQTATKSLGVSITLSKAQCKINNRAGISGSVLPMISTSGQIISSKKFTTV
|
265
|
+
/
|
266
|
+
N Fimbrial protein 987P precursor
|
267
|
+
T SIG
|
268
|
+
C 23
|
269
|
+
S MRMKKSALTLAVLSSLFSGYSLAAPAENNTSQANLDFTGKVTASLCQVDTNLSQTIDLGELSTSALKATG
|
270
|
+
/
|
271
|
+
N Outer membrane porin protein nmpC precursor
|
272
|
+
T SIG
|
273
|
+
C 23
|
274
|
+
S MKKLTVAISAVAASVLMAMSAQAAEIYNKDSNKLDLYGKVNAKHYFSSNDDDGDTTYARLGFKGETQIND
|
275
|
+
/
|
276
|
+
N Ecotin precursor
|
277
|
+
T SIG
|
278
|
+
C 20
|
279
|
+
S MKTILPAVLFAAFATTSAWAAESVQPLEKIAPYPQAEKGMKRQVIQLTPQDESTLKVELLIGQTLEVDCN
|
280
|
+
/
|
281
|
+
N Periplasmic oligopeptide-binding protein precursor
|
282
|
+
T SIG
|
283
|
+
C 26
|
284
|
+
S MTNITKRSLVAAGVLAALMAGNVALAADVPAGVTLAEKQTLVRNNGSEVQLDPHKIEGVPESNISRDLFE
|
285
|
+
/
|
286
|
+
N Periplasmic dipeptide transport protein precursor
|
287
|
+
T SIG
|
288
|
+
C 28
|
289
|
+
S MRISLKKSGMLKLGLSLVAMTVAASVQAKTLVYCSEGSPEGFNPQLFTSGTYDASSVPLYNRLVEFKIGT
|
290
|
+
/
|
291
|
+
N Penicillin-binding protein 4 precursor
|
292
|
+
T SIG
|
293
|
+
C 20
|
294
|
+
S MRFSRFIIGLTSCIAFSVQAANVDEYITQLPAGANLALMVQKVGASAPAIYHSQQMALPASTQKVITALA
|
295
|
+
/
|
296
|
+
N F107 fimbrial protein precursor
|
297
|
+
T SIG
|
298
|
+
C 21
|
299
|
+
S MKRLVFISFVALSMTAGSAMAQQGDVKFFGNVSATTCNLTPQISGTVGDTQLGTVAPSGTGSEIPFALKA
|
300
|
+
/
|
301
|
+
N Alpha-amylase precursor
|
302
|
+
T SIG
|
303
|
+
C 17
|
304
|
+
S MKLAACFLTLLPGFAVAASWTSPGFPAFSEQGTGTFVSHAQLPKGTRPLTNFDQQCWQPADAIKLNQMLS
|
305
|
+
/
|
306
|
+
N Arginine-binding periplasmic protein 2 precursor
|
307
|
+
T SIG
|
308
|
+
C 19
|
309
|
+
S MKKLVLAALLASFTFGASAAEKINFGVSATYPPFESIGANNEIVGFDIDLKALCKQMQAECTFTNHAFDS
|
310
|
+
/
|
311
|
+
N Thiamine-binding periplasmic protein precursor
|
312
|
+
T SIG
|
313
|
+
C 18
|
314
|
+
S MLKKCLPLLLLCTAPVFAKPVLTVYTYDSFAADWGPGPVVKKAFEADCNCLKLVALEDGVSLLNRLRMEG
|
315
|
+
/
|
316
|
+
N Organic solvent tolerance protein precursor
|
317
|
+
T SIG
|
318
|
+
C 24
|
319
|
+
S MKKRIPTLLATMIATALYSQQGLAADLASQCMLGVPSYDRPLVQGDTNDLVTINADHAKGDYPDDAVFTG
|
320
|
+
/
|
321
|
+
N Outer membrane usher protein htrE precursor
|
322
|
+
T SIG
|
323
|
+
C 29
|
324
|
+
S MTIEYTKNYHHLTRIATFCALLYCNTAFSAELVEYDHTFLMGQNASNIDLRYSEGNPAIPGVYDVSVYVN
|
325
|
+
/
|
326
|
+
N Glucans biosynthesis protein G precursor
|
327
|
+
T SIG
|
328
|
+
C 22
|
329
|
+
S MMKMRWLSAAVMLTLYTSSSWAFSIDDVAKQAQSLAGKGYETPKSNLPSVRDMKYADYQQIQFNHDKAYW
|
330
|
+
/
|
331
|
+
N Protein yebF precursor
|
332
|
+
T SIG
|
333
|
+
C 21
|
334
|
+
S MKKRGAFLGLLLVSACASVFAANNETSKSVTFPKCEDLDAAGIAASVKRDQQNRVARWADDQKIVGQADP
|
335
|
+
/
|
336
|
+
N Nickel-binding periplasmic protein precursor
|
337
|
+
T SIG
|
338
|
+
C 22
|
339
|
+
S MLSTLRRTLFALLACASFIVHAAAPDEITTAWPVNVGPLNPHLYTPNQMFQSMVYEPLVKYQADGSVIPW
|
340
|
+
/
|
341
|
+
N Outer membrane protease ompP precursor
|
342
|
+
T SIG
|
343
|
+
C 23
|
344
|
+
S MQTKLLAIMLAAPVVFSSQEASASDFFGPEKISTEINLGTLSGKTKERVYPEEGGRKVSQLDWKYSNAAI
|
345
|
+
/
|
346
|
+
N Thiol:disulfide interchange protein dsbD precursor
|
347
|
+
T SIG
|
348
|
+
C 19
|
349
|
+
S MAQRIFTLILLLCSTSVFAGLFDAPGRSQFVPADQAFAFDFQQNQHDLNLWQIKDGYYLYRKQIRITPEH
|
350
|
+
/
|
351
|
+
N Outer membrane protein slp precursor
|
352
|
+
T SIG
|
353
|
+
C 18
|
354
|
+
S MNMTKGALILSLSFLLAACSSIPQNIKGNNQPDIQKSFVAVHNQPGLYVGQARFGGKVINVINGKTDTLL
|
355
|
+
/
|
356
|
+
N Molybdate-binding periplasmic protein precursor
|
357
|
+
T SIG
|
358
|
+
C 24
|
359
|
+
S MARKWLNLFAGAALSFAVAGNALADEGKITVFAAASLTNAMQDIATQFKKKGVDVVSSFASSSTLARQIE
|
360
|
+
/
|
361
|
+
N D-xylose-binding periplasmic protein precursor
|
362
|
+
T SIG
|
363
|
+
C 23
|
364
|
+
S MKIKNILLTLCTSLLLTNVAAHAKEVKIGMAIDDLRLERWQKDRDIFVKKESLGAKVFVQSANGNEETQM
|
365
|
+
/
|
366
|
+
N Protein yhjJ precursor
|
367
|
+
T SIG
|
368
|
+
C 24
|
369
|
+
S MQGTKIRLLAGGLLMMATAGYVQADALQPDPAWQQGTLSNGLQWQVLTTPRPSDRVEIRLLVNTGSLAES
|
370
|
+
/
|
371
|
+
N Glutamate/aspartate periplasmic-binding protein precursor
|
372
|
+
T SIG
|
373
|
+
C 22
|
374
|
+
S MQLRKPATAILALALSAGLAQADDAAPAAGSTLDKIAKNGVIVVGHRESSPFSYYDNQQKVVGYSQDYSN
|
375
|
+
/
|
376
|
+
N Periplasmic protein torT precursor
|
377
|
+
T SIG
|
378
|
+
C 18
|
379
|
+
S MRVLLFLLLSLFMLPAFSADNLLRWHDAQHFTVQASTPLKAKRAWKLCALPSLKDSYWLSLNYGMQEAAR
|
380
|
+
/
|
381
|
+
N Protease degQ precursor
|
382
|
+
T SIG
|
383
|
+
C 27
|
384
|
+
S MKKQTQLLSALALSVGLTLSASFQAVASIPGQVADQAPLPSLAPMLEKVLAVVSVRVEGTASQGQKIPEE
|
385
|
+
/
|
386
|
+
N High-affinity zinc uptake system protein znuA precursor
|
387
|
+
T SIG
|
388
|
+
C 26
|
389
|
+
S MLHKKTLLFAALSAALWGGATQAADAAVVASLKPVGFIASAIADGVTETELLPDGASEHDYSLRPSDVKR
|
390
|
+
/
|
391
|
+
N Protein erfK/srfK precursor
|
392
|
+
T SIG
|
393
|
+
C 21
|
394
|
+
S MRRVNILCSFALLFASHTSLAVTYPLPPEGSRLVGQSFTVTVPDHNTQPLTFAAQYGQGLSNMLEANPGA
|
395
|
+
/
|
396
|
+
N D-allose-binding periplasmic protein precursor
|
397
|
+
T SIG
|
398
|
+
C 23
|
399
|
+
S MNKYLKYFSGTLVGLMLSTSAFAAAEYAVVLKTLSNPFWVDMKKGIEDEATLGVSVDIFASPSEGDFQSQ
|
400
|
+
/
|
401
|
+
N ABC transporter periplasmic-binding protein ytfQ precursor
|
402
|
+
T SIG
|
403
|
+
C 21
|
404
|
+
S MWKRLLIVSAVSAAMSSMALAAPLTVGFSQVGSESGWRAAETNVAKSEAERGITLKIADGQQKQENQIKA
|
405
|
+
/
|
406
|
+
N Copper homeostasis protein cutF precursor
|
407
|
+
T SIG
|
408
|
+
C 20
|
409
|
+
S MVKKAIVTAMAVISLFTLMGCNNRAEVDTLSPAQAAELKPMPQSWRGVLPADCEGIETSLFLEKDGTWVM
|
410
|
+
/
|
411
|
+
N Heat-labile enterotoxin IIB, A chain precursor
|
412
|
+
T SIG
|
413
|
+
C 20
|
414
|
+
S MAKVISFFISLFLISFPLYANDYFRADSRTPDEVRRSGGLIPRGQDEAYEGTPININLYDHARGTATGNT
|
415
|
+
/
|
416
|
+
N Heat-labile enterotoxin IIB, B chain precursor
|
417
|
+
T SIG
|
418
|
+
C 23
|
419
|
+
S MSFKKIIKAFVIMAALVSVQAHAGASQFFKDNCNRTTASLVEGVELTKYIDINNNTDGMYVVSSTGGVWR
|
420
|
+
/
|
421
|
+
N FKBP-type peptidyl-prolyl cis-trans isomerase fkpA precursor
|
422
|
+
T SIG
|
423
|
+
C 25
|
424
|
+
S MKSLFKVTLLATTMAVALHAPITFAAEAAKPATAADSKAAFKNDDQKSAYLGASLGRYMENSLKEQEKLG
|
425
|
+
/
|
426
|
+
N Nonfimbrial adhesin 1 precursor
|
427
|
+
T SIG
|
428
|
+
C 28
|
429
|
+
S MKAKKYENQIYNENGRRCQRHGRRLAIADANGLNTVNAGDGKNLGTATATTTLQSCSVDLNLVTPNATVN
|
430
|
+
/
|
431
|
+
N Copper amine oxidase precursor
|
432
|
+
T SIG
|
433
|
+
C 30
|
434
|
+
S MGSPSLYSARKTTLALAVALSFAWQAPVFAHGGEAHMVPMDKTLKEFGADQWDDYAQLFTLIKDGAYVKV
|
435
|
+
/
|
436
|
+
N Outer membrane protein G precursor
|
437
|
+
T SIG
|
438
|
+
C 21
|
439
|
+
S MKKLLPCTALVMCAGMACAQAEERNDWHFNIGAMYEIENVEGYGEDMDGLEPSVYFNAANGPWRIALAYY
|
440
|
+
/
|
441
|
+
N Transthyretin-like protein precursor
|
442
|
+
T SIG
|
443
|
+
C 23
|
444
|
+
S MLKRYLVLSVATAAFSLPSLVNAAQQNILSVHILNQQTGKPAADVTVTLEKADNGWLQLNTAKTDKDGRI
|
445
|
+
/
|
446
|
+
N Metal-binding protein yodA precursor
|
447
|
+
T SIG
|
448
|
+
C 23
|
449
|
+
S MAIRLYKLAVALGVFIVSAPAFSHGHHSHGKPLTEVEQKAANGVFDDANVNRTLSDWDGVWQSVYPLLQS
|
450
|
+
/
|
451
|
+
N Protein yfdX precursor
|
452
|
+
T SIG
|
453
|
+
C 21
|
454
|
+
S MKRLIMATMVTAILASSTVWAADNAPVAAQQQTQQVQQTQKTAAAAERISQGLYAMRDVQVARLALFHGD
|
455
|
+
/
|
456
|
+
N Thiol:disulfide interchange protein dsbG precursor
|
457
|
+
T SIG
|
458
|
+
C 17
|
459
|
+
S MLKKILLLALLPAIAFAEELPAPVKAIEKQGITIIKTFDAPGGMKGYLGKQDMGVTIYLTPDGKHAISGY
|
460
|
+
/
|
461
|
+
N Periplasmic murein peptide-binding protein precursor
|
462
|
+
T SIG
|
463
|
+
C 22
|
464
|
+
S MKHSVSVTCCALLVSSISLSYAAEVPSGTVLAEKQELVRHIKDEPASLDPKAVGLPEIQVIRDLFEGLVN
|
465
|
+
/
|
466
|
+
N UPF0098 protein ybcL precursor
|
467
|
+
T SIG
|
468
|
+
C 21
|
469
|
+
S MKTLIVSTVLAFITFSAQAAAFQVTSNEIKTGEQLTTSHVFSGFGCEGGNSPSLTWSGVPEGTKSFAVTV
|
470
|
+
/
|
471
|
+
N Outer membrane protein N precursor
|
472
|
+
T SIG
|
473
|
+
C 21
|
474
|
+
S MKSKVLALLIPALLAAGAAHAAEVYNKDGNKLDLYGKVDGLHYFSDNSAKGDQSYARLGFKGETQINDQL
|
475
|
+
/
|
476
|
+
N Adhesin AIDA-I precursor
|
477
|
+
T SIG
|
478
|
+
C 49
|
479
|
+
S MNKAYSIIWSHSRQAWIVASELARGHGFVLAKNTLLVLAVVSTIGNAFAVISGTVSSGGTVSSGETQIVY
|
480
|
+
/
|
481
|
+
N Probable copper-binding protein pcoE precursor
|
482
|
+
T SIG
|
483
|
+
C 20
|
484
|
+
S MKKILVSFVAIMAVASSAMAAETMNMHDQVNNAQAPAHQMQSSAEKSAVQDSMTMMDMSSHDQAAMSHDM
|
485
|
+
/
|
486
|
+
N Taurine-binding periplasmic protein precursor
|
487
|
+
T SIG
|
488
|
+
C 22
|
489
|
+
S MAISSRNTLLAALAFIAFQAQAVNVTVAYQTSAEPAKVAQADNTFAKESGTVDWRKFDSGASIVRALASG
|
490
|
+
/
|
491
|
+
N Temperature-sensitive hemagglutinin tsh precursor
|
492
|
+
T SIG
|
493
|
+
C 52
|
494
|
+
S MNRIYSLRYSAVARGFIAVSEFARKCVHKSVRRLCFPVLLLIPVLFSAGSAGTVNNELGYQLFRDFAENK
|
495
|
+
/
|
496
|
+
N Serine protease pic precursor
|
497
|
+
T SIG
|
498
|
+
C 55
|
499
|
+
S MNKVYSLKYCPVTGGLIAVSELARRVIKKTCRRLTHILLAGIPAICLCYSISQAGIVRSDIAYQIYRDFA
|
500
|
+
/
|
501
|
+
N Serine protease espP precursor
|
502
|
+
T SIG
|
503
|
+
C 55
|
504
|
+
S MNKIYSLKYSHITGGLIAVSELSGRVSSRATGKKKHKRILALCFLGLLQSYSFASQMDISNFYIRDYMDF
|
505
|
+
/
|
506
|
+
N Serine protease pic precursor
|
507
|
+
T SIG
|
508
|
+
C 55
|
509
|
+
S MNKVYSLKYCPVTGGLIVVSELASRVIKKTCRRLTHILLAGIPAVYLYYPISQAGIVRSDIAYQIYRDFA
|
510
|
+
/
|
511
|
+
N Serine protease sat precursor
|
512
|
+
T SIG
|
513
|
+
C 49
|
514
|
+
S MNKIYSLKYSAATGGLIAVSELAKRVSGKTNRKLVATMLSLAVAGTVNAAIDISNVWARDYLDLAQNKGI
|
515
|
+
/
|
516
|
+
N Serine protease espC precursor
|
517
|
+
T SIG
|
518
|
+
C 53
|
519
|
+
S MNKIYALKYCHATGGLIAVSELASRVMKKAARGSLLALFNLSLYGAFLSAQAAQLNIDNVWARDYLDLAQ
|
520
|
+
/
|