neurohmmer 0.1.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/.gitignore +35 -0
- data/CODE_OF_CONDUCT.md +13 -0
- data/Gemfile +4 -0
- data/LICENSE +662 -0
- data/README.md +136 -0
- data/Rakefile +17 -0
- data/bin/neurohmmer +69 -0
- data/data/hmm/CRH_DH44.fa.hmm +427 -0
- data/data/hmm/Chordate_Glucagon_PACAP.fa.hmm +484 -0
- data/data/hmm/Chordate_Neurotensin_precursors_neurotensin_like_Ciona.fa.hmm +526 -0
- data/data/hmm/Deutrostomian_tachykinin.fa.hmm +367 -0
- data/data/hmm/Gastrin_releasing_peptide.fa.hmm +448 -0
- data/data/hmm/GnRH.fa.hmm +370 -0
- data/data/hmm/Hypocretin_orexin.fa.hmm +451 -0
- data/data/hmm/Lophotrochozoan_luqin_arthropod_RYamide.fa.hmm +385 -0
- data/data/hmm/NPFF.fa.hmm +430 -0
- data/data/hmm/NPS.fa.hmm +790 -0
- data/data/hmm/PTH.fa.hmm +502 -0
- data/data/hmm/Protostomian_Allatostatin_B.fa.hmm +835 -0
- data/data/hmm/Protostomian_CCH_amide.fa.hmm +415 -0
- data/data/hmm/Protostomian_Ecdysis_Triggering_Hormone.fa.hmm +433 -0
- data/data/hmm/Protostomian_PDF.fa.hmm +265 -0
- data/data/hmm/Protostomian_allatostatin_C.fa.hmm +352 -0
- data/data/hmm/Protostomian_proctolin.fa.hmm +346 -0
- data/data/hmm/Putative_chordate_Opioid.fa.hmm +802 -0
- data/data/hmm/SIF.fa.hmm +286 -0
- data/data/hmm/TRH.fa.hmm +910 -0
- data/data/hmm/allatotropin.fa.hmm +433 -0
- data/data/hmm/ambulacrarian_amphioxus_NPS-like.fa.hmm +847 -0
- data/data/hmm/avp.fa.hmm +475 -0
- data/data/hmm/calcitonin_DH31.fa.hmm +418 -0
- data/data/hmm/cholecystokinin_sulfakinin.fa.hmm +433 -0
- data/data/hmm/chordate_OX26_QRFP.fa.hmm +475 -0
- data/data/hmm/chordate_somatostatin_cortistatin_like.fa.hmm +361 -0
- data/data/hmm/f_type_SALMF.fa.hmm +811 -0
- data/data/hmm/galanin.fa.hmm +391 -0
- data/data/hmm/l_type_SALMF.fa.hmm +523 -0
- data/data/hmm/nmu_pyrokinin.fa.hmm +424 -0
- data/data/hmm/npy_npf.fa.hmm +301 -0
- data/data/hmm/protostomian_CCAP.fa.hmm +415 -0
- data/data/hmm/protostomian_allatostatinA_buccalin.fa.hmm +706 -0
- data/data/hmm/protostomian_leucokinin.fa.hmm +511 -0
- data/data/hmm/protostomian_tackykinin.fa.hmm +760 -0
- data/data/hmm/tachykinin.fa.hmm +541 -0
- data/data/hmm/vertebrate_ghrelin_motilin.fa.hmm +382 -0
- data/data/raw_data/CRH_DH44.fa +44 -0
- data/data/raw_data/CRH_DH44.fa.aligned.fa +242 -0
- data/data/raw_data/Chordate_Glucagon_PACAP.fa +18 -0
- data/data/raw_data/Chordate_Glucagon_PACAP.fa.aligned.fa +72 -0
- data/data/raw_data/Chordate_Neurotensin_precursors_neurotensin_like_Ciona.fa +10 -0
- data/data/raw_data/Chordate_Neurotensin_precursors_neurotensin_like_Ciona.fa.aligned.fa +25 -0
- data/data/raw_data/Deutrostomian_tachykinin.fa +1283 -0
- data/data/raw_data/Deutrostomian_tachykinin.fa.aligned.fa +5707 -0
- data/data/raw_data/Gastrin_releasing_peptide.fa +12 -0
- data/data/raw_data/Gastrin_releasing_peptide.fa.aligned.fa +25 -0
- data/data/raw_data/GnRH.fa +22 -0
- data/data/raw_data/GnRH.fa.aligned.fa +66 -0
- data/data/raw_data/Hypocretin_orexin.fa +14 -0
- data/data/raw_data/Hypocretin_orexin.fa.aligned.fa +49 -0
- data/data/raw_data/Lophotrochozoan_luqin_arthropod_RYamide.fa +26 -0
- data/data/raw_data/Lophotrochozoan_luqin_arthropod_RYamide.fa.aligned.fa +91 -0
- data/data/raw_data/NPFF.fa +16 -0
- data/data/raw_data/NPFF.fa.aligned.fa +48 -0
- data/data/raw_data/NPS.fa +8 -0
- data/data/raw_data/NPS.fa.aligned.fa +24 -0
- data/data/raw_data/PTH.fa +24 -0
- data/data/raw_data/PTH.fa.aligned.fa +144 -0
- data/data/raw_data/Protostomian_Allatostatin_B.fa +17 -0
- data/data/raw_data/Protostomian_Allatostatin_B.fa.aligned.fa +120 -0
- data/data/raw_data/Protostomian_CCH_amide.fa +24 -0
- data/data/raw_data/Protostomian_CCH_amide.fa.aligned.fa +72 -0
- data/data/raw_data/Protostomian_Ecdysis_Triggering_Hormone.fa +24 -0
- data/data/raw_data/Protostomian_Ecdysis_Triggering_Hormone.fa.aligned.fa +84 -0
- data/data/raw_data/Protostomian_PDF.fa +16 -0
- data/data/raw_data/Protostomian_PDF.fa.aligned.fa +32 -0
- data/data/raw_data/Protostomian_allatostatin_C.fa +28 -0
- data/data/raw_data/Protostomian_allatostatin_C.fa.aligned.fa +56 -0
- data/data/raw_data/Protostomian_proctolin.fa +16 -0
- data/data/raw_data/Protostomian_proctolin.fa.aligned.fa +32 -0
- data/data/raw_data/Putative_chordate_Opioid.fa +8 -0
- data/data/raw_data/Putative_chordate_Opioid.fa.aligned.fa +32 -0
- data/data/raw_data/SIF.fa +28 -0
- data/data/raw_data/SIF.fa.aligned.fa +70 -0
- data/data/raw_data/TRH.fa +10 -0
- data/data/raw_data/TRH.fa.aligned.fa +50 -0
- data/data/raw_data/allatotropin.fa +31 -0
- data/data/raw_data/allatotropin.fa.aligned.fa +90 -0
- data/data/raw_data/ambulacrarian_amphioxus_NPS-like.fa +8 -0
- data/data/raw_data/ambulacrarian_amphioxus_NPS-like.fa.aligned.fa +24 -0
- data/data/raw_data/avp.fa +28 -0
- data/data/raw_data/avp.fa.aligned.fa +70 -0
- data/data/raw_data/calcitonin_DH31.fa +36 -0
- data/data/raw_data/calcitonin_DH31.fa.aligned.fa +126 -0
- data/data/raw_data/cholecystokinin_sulfakinin.fa +28 -0
- data/data/raw_data/cholecystokinin_sulfakinin.fa.aligned.fa +84 -0
- data/data/raw_data/chordate_OX26_QRFP.fa +10 -0
- data/data/raw_data/chordate_OX26_QRFP.fa.aligned.fa +25 -0
- data/data/raw_data/chordate_somatostatin_cortistatin_like.fa +10 -0
- data/data/raw_data/chordate_somatostatin_cortistatin_like.fa.aligned.fa +20 -0
- data/data/raw_data/f_type_SALMF.fa +118 -0
- data/data/raw_data/f_type_SALMF.fa.aligned.fa +590 -0
- data/data/raw_data/galanin.fa +93 -0
- data/data/raw_data/galanin.fa.aligned.fa +552 -0
- data/data/raw_data/kisspeptin.fa +16 -0
- data/data/raw_data/kisspeptin.fa.aligned.fa +0 -0
- data/data/raw_data/l_type_SALMF.fa +68 -0
- data/data/raw_data/l_type_SALMF.fa.aligned.fa +170 -0
- data/data/raw_data/nmu_pyrokinin.fa +18 -0
- data/data/raw_data/nmu_pyrokinin.fa.aligned.fa +63 -0
- data/data/raw_data/npy_npf.fa +20 -0
- data/data/raw_data/npy_npf.fa.aligned.fa +40 -0
- data/data/raw_data/protostomian_CCAP.fa +14 -0
- data/data/raw_data/protostomian_CCAP.fa.aligned.fa +42 -0
- data/data/raw_data/protostomian_allatostatinA_buccalin.fa +100 -0
- data/data/raw_data/protostomian_allatostatinA_buccalin.fa.aligned.fa +1350 -0
- data/data/raw_data/protostomian_leucokinin.fa +18 -0
- data/data/raw_data/protostomian_leucokinin.fa.aligned.fa +63 -0
- data/data/raw_data/protostomian_tackykinin.fa +504 -0
- data/data/raw_data/protostomian_tackykinin.fa.aligned.fa +2002 -0
- data/data/raw_data/tachykinin.fa.aligned.fa +13546 -0
- data/data/raw_data/vertebrate_ghrelin_motilin.fa +16 -0
- data/data/raw_data/vertebrate_ghrelin_motilin.fa.aligned.fa +32 -0
- data/lib/neurohmmer.rb +89 -0
- data/lib/neurohmmer/arg_validators.rb +71 -0
- data/lib/neurohmmer/hmmer.rb +71 -0
- data/lib/neurohmmer/output.rb +50 -0
- data/lib/neurohmmer/version.rb +4 -0
- data/neurohmmer.gemspec +34 -0
- data/spec/neurohmmer_spec.rb +11 -0
- data/spec/spec_helper.rb +2 -0
- data/template/contents.slim +55 -0
- metadata +269 -0
@@ -0,0 +1,16 @@
|
|
1
|
+
>Ensembl_FBtr0085024_PDF_Dmel
|
2
|
+
MARYTYLVALVLLAICCQWGYCGAMAMPDEERYVRKEYNRDLLDWFNNVGVGQFSPGQVATLCRYPLILENSLGPSVPIRKRNSELINSLLSLPKNMNDAGK
|
3
|
+
>gi_45650472_Pmon
|
4
|
+
MCRVAMLLVVLAVTAVVVTEAQREPAASKCQAATELAIQILQAVKGAHPGVAVGPHKRNSELINSLLGLPKFMIDAGRR
|
5
|
+
>gi_283526164_Psed
|
6
|
+
MNSIIVLSLAVLAIFTSSIQSSPLNRAEDLQPVERQIIAEMASKILKVAEDGLVYSKRNAELINSLLGLPKMMNDAGK
|
7
|
+
>CO508274_Hypsibius_dujardini_Tardigrada
|
8
|
+
MDVKAFLFAVAMSTFLTSSSAIWVFLEPRFDAEFISRNSEMVGQEVYSQFPSGSEGPAQLLSQGYQPVELTRIPIRKRNSEILNTIIGLPNKLRQRG
|
9
|
+
>Ensembl_F48B9.4_Cele
|
10
|
+
MSSRISVSLLLLAVVATMFFTANVVDATPRSQGNMMRYGNSLPAYAPHVLYRFYNSRQFAPINKRNNAEVVNHILKNFGALDRLGDVGK
|
11
|
+
>Ensembl_T07E3.6a_Cele
|
12
|
+
MNRFIISMIALLAVFCAVSTASPLLYRAPQYQMYDDVQFVKRSNAELINGLIGMDLGKLSAVGKRSNAELINGLLSMNLNKLSGAGRR
|
13
|
+
>jgi_239524_Lgig
|
14
|
+
MVALSPEMNSCTKCLLLLVFVGLTVLVKLSESSPLRPYQTQIEEKSRQDIITLAARVIKIAMYGSNQYDVIKRNAGTVDHLLNFPDLSVGK
|
15
|
+
>gi_187067819_Skow
|
16
|
+
MASYKSMMVIYCVFLLVADIEGFLKVVAKKSGRIQREVAEKRDLLRDKEIEKRPHGERDLRNYGNTKQEVDIPRHMVLGR
|
@@ -0,0 +1,32 @@
|
|
1
|
+
>Ensembl_FBtr0085024_PDF_Dmel
|
2
|
+
MARYTYLV-----ALVLLAICCQWG---YCGAMAMPDEERY----------VRKEY--NR
|
3
|
+
DLLD--WFNNVGVGQFSPGQVATLCRYPLILENSLGP----SVPIRKRNSELINSLL---
|
4
|
+
-SLP-KNMNDAGK-
|
5
|
+
>gi_45650472_Pmon
|
6
|
+
MCRVAML-------LVVLAVT----------AVVVTEAQREPA--------ASKCQA-AT
|
7
|
+
ELAI------------------------QILQAVKGAHPGVAVGPHKRNSELINSLL---
|
8
|
+
-GLP-KFMIDAGRR
|
9
|
+
>gi_283526164_Psed
|
10
|
+
MNSIIVL------SLAVLAIF--------TSSIQSSPLNRAE-----DLQPVERQI--IA
|
11
|
+
EMAS------------------------KILKVAEDGLVY-----SKRNAELINSLL---
|
12
|
+
-GLP-KMMNDAGK-
|
13
|
+
>CO508274_Hypsibius_dujardini_Tardigrada
|
14
|
+
MDVKAFL------FAVAMSTFLT-----SSSAIWVFLEPRF------DAEFISR----NS
|
15
|
+
EMVGQEVYSQFPSGSEGPA---------QLLSQGYQPVELTRIPIRKRNSEILNTII---
|
16
|
+
-GLP-NKLRQRG--
|
17
|
+
>Ensembl_F48B9.4_Cele
|
18
|
+
MSSRISV------SLLLLAVVATMF----FTANVVDATPRS-----------------QG
|
19
|
+
NMMR--------YGNSLPA------YAPHVLYRFYNSRQFAPIN-KRNNAEVVNHILKNF
|
20
|
+
GALD--RLGDVGK-
|
21
|
+
>Ensembl_T07E3.6a_Cele
|
22
|
+
MNRFIIS------MIALLAVFCAVS----TASPLLYRAPQYQM--YDDVQFVKRS---NA
|
23
|
+
ELIN------------------------GLIGMDLG--KLSAVG-KRSNAELINGLL---
|
24
|
+
-SMNLNKLSGAGRR
|
25
|
+
>jgi_239524_Lgig
|
26
|
+
MVALSPEMNSCTKCLLLLVFV--------GLTVLVKLSESSPLRPY-QTQIEEKS---RQ
|
27
|
+
DIIT---------------------LAARVIKIAMYGSNQYDV--IKRNAGTVDHLL-NF
|
28
|
+
PDLS------VGK-
|
29
|
+
>gi_187067819_Skow
|
30
|
+
MASYKSM-------MVIYCVFLLVADIEGFLKVVAKKSGR-----------IQREVAEKR
|
31
|
+
DLLRDK----------------------EIEKRPHGERDLRNYGNTKQEVDIPRHMV---
|
32
|
+
----------LGR-
|
@@ -0,0 +1,28 @@
|
|
1
|
+
>gi_161295377_Ctel
|
2
|
+
MVPSKSVCAIVVVMSCYVLCGFIVNAVPTQDGGSNLSHGYNEVSEMGLTDTKLAFLEKKLREEIERDLADLLVMEHQHRHNLNFIQEKKRQLEIKKREPVQCLVNIVSCWKRK
|
3
|
+
>jgi_181187_Hrob
|
4
|
+
MKNVTFLLLAMSATLLLLLASALPPRRRSLISKNYIFPKTHSKRFAKNNDAEDPLYSSYPFEYNNNEPISMDSNKYANSLNKEFPKAPKGKQVFKKAHVPCLFSIISCWK
|
5
|
+
>gi_163505903_Lgig
|
6
|
+
MKSLPVLTLTLFCICLNEVSSNKILPGEEHRQLVQITEESSNNDRLLKRSTLQDAYESHLAMLMEAEQSLTKQIEELKLRREELSNRKRSHVMCLVNLISCFRKR
|
7
|
+
>gi_260628238_Cgig
|
8
|
+
MELTQSVFVLKLYAAVVAVLLVAEVHAQPQKFSTEIQQTGDESSTDLNLFKMALREAYNRELEFYEQQEAQIVKQLAALENDRNQIRERKRSHIRCLVNVIACYRKK
|
9
|
+
>gi_203663510_Acal
|
10
|
+
MSVSVRTWRAVNTCLLLTLLTLWADVLVVRAAVIPVSSPEPMEEASALQLLPGKIGRASLLREMERQLMILQAAEENIVSGLQELEEERRVLSGRKRSHYSSMCMFNVVACYRKRK
|
11
|
+
>jgi_290676_Dpul
|
12
|
+
MMAKISAVVPVAILLYLAASGAAKSTDREETESTDFGQDIEVLGAVPDDGSVETALLNYLFAKQIVARLRTNANPQDLMRKRSYWKQCAFNAVSCFGK
|
13
|
+
>BCM_GLEAN_05428_Tcas
|
14
|
+
MAAQLPRYLTKTLFIFLIATLVVANARPNHFGDASQNSISGLKFQVVGEPADGNNLLDSRLKPWELEMLVQRLSEISSQTGGDFAWDKSIRLPEAKRQSRYRQCYFNPISCFRK
|
15
|
+
>Ensembl_FBtr0080234_AstC_Dmel
|
16
|
+
MMKFVQILLCYGLLLTLFFALSEARPSGAETGPDSDGLDGQDAEDVRGAYGGGYDMPAQAIYPNIPMDRLQMLFAQYRPTSYSAYLRSPTYGNVNELYRLPESKRQVRYRQCYFNPISCFRK
|
17
|
+
>Ensembl_FBtr0114455_AstCC_Dmel
|
18
|
+
MVVPKRAALLLDRLMVALHHALEQERSEQRIGEFFGDRNILSGKFGDSHNGMEHHQAREDGMYSDDDAGTLLDYDFKDLNQINRATGETRRAGADRSGTSTHSGSPAGSRRIQPSGSGGGRAYWRCYFNAVSCF
|
19
|
+
>Ensembl_F33D11.8_Cele
|
20
|
+
MVKFFVFLLFFAFLCSFTSAIPLRSLFLRSYDDINQESIARGYFAPQPVDDDNADNRPKRGIDLLKRRVEIIERNRCFFNPITCY
|
21
|
+
>Ensembl_M02E1.2_Cele
|
22
|
+
MMAQKTLIIAVMLVCSILQPMLALGSLTPSAAFRANMQQRERSPNTLFYMDGASKQYGDEIKDPIYKRFKPCYYSPIQCLIKRK
|
23
|
+
>Ensembl_R11.2_Cele
|
24
|
+
MRVLTFLLVTLFALANVMQAQRYDRAIYEALLNDLEREFVERELAQHVLEKRELLRQDRQELDRVRRASEKKSYPRNCYFSPIQCLFTRN
|
25
|
+
>Ensembl_Y73B6BL.35_Cele
|
26
|
+
MKSSSVLSVALIVLVIVQLISASLASVPSSSAVSDGQIDFDALAAKIEMLRPNRYWKRAHNIDTRALNQFKNCYFSPIQCVLMERRRK
|
27
|
+
>Ensembl_R08B4.5_Cele
|
28
|
+
MSSGKLFQFFIVFLATLLLADAIPMVSSRDEDDQIIQKRLSNDALIRLLMRNRGTQTQLGLKRGLVKKAEVERRSIDEDFSNCFLSPVQCMLPSSRK
|
@@ -0,0 +1,56 @@
|
|
1
|
+
>gi_161295377_Ctel
|
2
|
+
MVPSKS--------VCAIVVVMSCYVLCGFIVNAVPTQDGGSN-------------LSHG
|
3
|
+
YNEVSEMGLTDTKL--AFLEKKLREEIERDLADLLVME---------------HQHRHNL
|
4
|
+
NFIQEKKR-------------QLEIKKREPV----------QCLVNIVSCW----KRK
|
5
|
+
>jgi_181187_Hrob
|
6
|
+
MKN-----------VTFLLLAMSATLLLLLASALPPRRRSLIS-----------------
|
7
|
+
------------------KNYIFPKTHSKRFAKNNDAEDPLYSSYPF------EYNNNEP
|
8
|
+
ISMDSNKYANSLNKEFPKAPKGKQVFKKAHV----------PCLFSIISCW------K
|
9
|
+
>gi_163505903_Lgig
|
10
|
+
MKS-------------LPVLTLTLFCICLNEVSSNKILPGEEHRQ----------LVQIT
|
11
|
+
EESSNNDRLL--------KRSTLQDAYESHLAMLMEAE---------------QSLTKQI
|
12
|
+
EELKLRRE-------------ELSNRKRSHV----------MCLVNLISCF----RKR
|
13
|
+
>gi_260628238_Cgig
|
14
|
+
MELT----------QSVFVLKLYAAVVAVLLVAEVHAQPQKFSTE----------IQQTG
|
15
|
+
DESSTDLNL---------FKMALREAYNRELEFYEQQE---------------AQIVKQL
|
16
|
+
AALENDRN-------------QIRERKRSHI----------RCLVNVIACY----RKK
|
17
|
+
>gi_203663510_Acal
|
18
|
+
MSVSVRTWRAVNTCLLLTLLTLWADVLVVRAAVIPVSSPEPM------------------
|
19
|
+
-EEASALQLLPGKI----GRASLLREMERQLMILQAAE---------------ENIVSGL
|
20
|
+
QELEEERR-------------VLSGRKRSHY--------SSMCMFNVVACYR---KRK
|
21
|
+
>jgi_290676_Dpul
|
22
|
+
MMA-------------KISAVVPVAILLYLAASGAAKSTDREETESTDFGQD----IEVL
|
23
|
+
GAVPDDGSVETALL----NYLFAKQIVAR-------------------------------
|
24
|
+
--LRTNANP------------QDLMRKRSY---------WKQCAFNAVSCF-----GK
|
25
|
+
>BCM_GLEAN_05428_Tcas
|
26
|
+
MAAQ---------LPRYLTKTLFIFLIATLVVANARPNHFGDASQNSISGLK----FQVV
|
27
|
+
GEPADGNNLLDSRL----KPWELEMLVQR-------------------------------
|
28
|
+
--LSEISSQTGGDFAWDKSIRLPEAKRQSR---------YRQCYFNPISCF-----RK
|
29
|
+
>Ensembl_FBtr0080234_AstC_Dmel
|
30
|
+
MMK-------------FVQILLCYGLLLTLFFALSEARPSGAETGPDSDGLDGQDAEDVR
|
31
|
+
GAYGGGYDMPAQAIYPNIPMDRLQMLFAQ------------------------YRPTSYS
|
32
|
+
AYLRSPTYGNVNELY-----RLPESKRQVR---------YRQCYFNPISCF-----RK
|
33
|
+
>Ensembl_FBtr0114455_AstCC_Dmel
|
34
|
+
MVVPKR------------AALLLDRLMVALHHALEQERS-----------------EQRI
|
35
|
+
GEFFGDRNILSGKF--GDSHNGMEHHQAREDGMYSDDDAGTLLDYDFKDLNQINRATGET
|
36
|
+
RRAGADRSGTSTHSG------SPAGSRRIQPSGSGGGRAYWRCYFNAVSCF-------
|
37
|
+
>Ensembl_F33D11.8_Cele
|
38
|
+
MVK-------------FFVFLLFFAFLCSFTSAIP-------------------------
|
39
|
+
----------------------LRSLFLRSYDDINQES--------------IARGYFAP
|
40
|
+
QPVDDDNADNRPKRG------IDLLKRRVEIIE------RNRCFFNPITCY-------
|
41
|
+
>Ensembl_M02E1.2_Cele
|
42
|
+
MMAQ----------KTLIIAVMLVCSILQPMLALGSLTP---------------------
|
43
|
+
------------------SAAFRANMQQR------------------------ERSPNTL
|
44
|
+
FYMDGASKQYGDEI-------KDPIYKR-----------FKPCYYSPIQCLI---KRK
|
45
|
+
>Ensembl_R11.2_Cele
|
46
|
+
MRV------------------LTFLLVTLFALA------------------------NVM
|
47
|
+
QAQRYDRAIYEALL-----NDLEREFVERELA---------------------QHVLEKR
|
48
|
+
ELLRQDRQE------------LDRVRRASEKKSY-----PRNCYFSPIQCLF---TRN
|
49
|
+
>Ensembl_Y73B6BL.35_Cele
|
50
|
+
MKS-----------SSVLSVALIVLVIVQLISASLASVPSS----------------SAV
|
51
|
+
SDGQIDFDALAAKI-----------EMLR-------------------------------
|
52
|
+
---------------------PNRYWKRAHNIDTRALNQFKNCYFSPIQCVLMERRRK
|
53
|
+
>Ensembl_R08B4.5_Cele
|
54
|
+
MSS-----------GKLFQFFIVFLATLLLADAIP-----------------------MV
|
55
|
+
SSRDEDDQIIQKRL----SNDALIRLLMR------------------------NRGTQTQ
|
56
|
+
LGLKRGLVK------------KAEVERRSIDED------FSNCFLSPVQCMLP-SSRK
|
@@ -0,0 +1,16 @@
|
|
1
|
+
>Ensembl_FBtr0079562_Dmel
|
2
|
+
MGVPRSHGTGIGCGSGHRWLLVWMTVLLLVVPPHLVDGRYLPTRSHGDDLDKLRELMLQILELSNEDPQQQQQQQQQQQHPQLRLHNEATGGSSSSSNINNPRVSNGNSNAAWLQKLSAMGALDELGGDGARFGPNYGRY
|
3
|
+
>BCM_GLEAN_15137_Tcas
|
4
|
+
MFDRKLVFALVFVVFATLAVEGRYLPTRSNGDRIEKLRELLKDLFENEVEKEEYQADAPPRWHPESKLFYKREAPAH
|
5
|
+
>gi_300039604_Apis
|
6
|
+
MAGKFSALFLVGFVAAVVVAPYMMAEARYLPTRGNDDRLTRLKELLTDLLDSGAQPNLEMERPYVDVNGDFSRLRPREYNIPEKSIMELFNPTVPHHQRPRS
|
7
|
+
>jgi_305680_Dpul
|
8
|
+
MLKSTSLKALVTLLVVSFVLMASSPRAADARYLMTRGKDPRFDRLYDIITKLLQNGGGDLEYQIKSQLDSGP
|
9
|
+
>jgi_21488_Ctel
|
10
|
+
MEIRLTLVLALLVAALGVVANALSIPSDALKDNQMDVADKDGDQSRRATWLETRDLEDDFKELVYLTIEELVNEGRMDPRVLSKEENEVKEKRGRWQGFCFKRTRSGRFLPYICWKGDRK
|
11
|
+
>gi_223843442_Apom
|
12
|
+
MDMCRLSAILVILYGTLCAVTNAMSIPASQLKDSGVELDSSENTALDEGRRASWLETRDLENDFKDLVFLTLQELAQEGRIDPRVIVEENSLDTKEKRGRWQGFCFRRTKTGRFLPYICWKGDRK
|
13
|
+
>gi_163376585_Lgig
|
14
|
+
MRSSTILSLLVVLLLAAPTFCLPPDQGSEIDDLDKRPKYMDTREELSVLKDMVYIVLQELAEDGKINPELFTIHDQKAVVKRMKYMGICMRRTKYNAVVPYPCLRSGR
|
15
|
+
>gi_121437918_Acal
|
16
|
+
MELQACNIFALFVVVVTLSVASSLPASRTDDVLQEASGLALNKRPKYMDTRRDLDVFKDLVLISIQELVDENRLNPALLPEEDAPKPVEKRMRYMGICMKKQYNNFIPFPCLRSGR
|
@@ -0,0 +1,32 @@
|
|
1
|
+
>Ensembl_FBtr0079562_Dmel
|
2
|
+
MGVPRSHGTGIGCGSGHRWLLVWMTVLL-LVVPPHLVD----------------------
|
3
|
+
--GRYLPTRSHGDDLDKLRELMLQILELSNEDPQQQQQQQQQQQHPQLRLHNEATGGSSS
|
4
|
+
SSNINNPRVSNGNSNAAWLQKLSAMGALDELGGDGARFGP----NYGRY----
|
5
|
+
>BCM_GLEAN_15137_Tcas
|
6
|
+
M--------------FDRKLVFALVF---VVFATLAVE----------------------
|
7
|
+
--GRYLPTRSNGDRIEKLRELLKDLFENEVEKEEYQADAP-----P--------------
|
8
|
+
------------------------------------RWHPESKLFYKREAPAH
|
9
|
+
>gi_300039604_Apis
|
10
|
+
M-----------AGKFSALFLVGFVAAV-VVAPYMMAE----------------------
|
11
|
+
--ARYLPTRGNDDRLTRLKELLTDLLDSGAQ--------------PNLEMERPYVDVNGD
|
12
|
+
FSR-----LRPREYN---IPEKSIME----------LFNPTVP-HHQR--PRS
|
13
|
+
>jgi_305680_Dpul
|
14
|
+
M--------------LKSTSLKALVTLL-VVSFVLMASSPRAAD----------------
|
15
|
+
--ARYLMTRGKDPRFDRLYDIITKLLQNGGGDLEYQIKSQLDSG-P--------------
|
16
|
+
-----------------------------------------------------
|
17
|
+
>jgi_21488_Ctel
|
18
|
+
MEI------------RLTLVLALLVAALGVVANALSIPSDALKDN--QMDVADKDG-DQS
|
19
|
+
RRATWLETR---DLEDDFKELVYLTIEELVNEGRMD---------PRVLSKEEN-EVKEK
|
20
|
+
RGRWQGFCFKRTRSG---------------------RFLPYICWKGDRK----
|
21
|
+
>gi_223843442_Apom
|
22
|
+
MDM---------C--RLSAILVILYGTLCAVTNAMSIPASQLKDSGVELDSSENTALDEG
|
23
|
+
RRASWLETR---DLENDFKDLVFLTLQELAQEGRID---------PRVIVEENSLDTKEK
|
24
|
+
RGRWQGFCFRRTKTG---------------------RFLPYICWKGDRK----
|
25
|
+
>gi_163376585_Lgig
|
26
|
+
M--------------RSSTILSLLVVLL-LAAPTFCLPPDQGSEI----D-------DLD
|
27
|
+
KRPKYMDTR---EELSVLKDMVYIVLQELAEDGKIN---------PELFTIHDQ-KAVVK
|
28
|
+
RMKYMGICMRRTKYN---------------------AVVPYPCLRSGR-----
|
29
|
+
>gi_121437918_Acal
|
30
|
+
MEL------------QACNIFALFVVVV-TLSVASSLPASRTDDV-----LQEASGLALN
|
31
|
+
KRPKYMDTR---RDLDVFKDLVLISIQELVDENRLN---------PALLPEEDAPKPVEK
|
32
|
+
RMRYMGICMKK-QYN---------------------NFIPFPCLRSGR-----
|
@@ -0,0 +1,8 @@
|
|
1
|
+
>PENK_Hsap
|
2
|
+
MARFLTLCTWLLLLGPGLLATVRAECSQDCATCSYRLVRPADINFLACVMECEGKLPSLKIWETCKELLQLSKPELPQDGTSTLRENSKPEESHLLAKRYGGFMKRYGGFMKKMDELYPMEPEEEANGSEILAKRYGGFMKKDAEEDDSLANSSDLLKELLETGDNRERSHHQDGSDNEEEVSKRYGGFMRGLKRSPQLEDEAKELQKRYGGFMRRVGRPEWWMDYQKRYGGFLKRFAEALPSDEEGESYSKEVPEMEKRYGGFMRF
|
3
|
+
>PDYN_Hsap
|
4
|
+
MAWQGLVLAACLLMFPSTTADCLSRCSLCAVKTQDGPKPINPLICSLQCQAALLPSEEWERCQSFLSFFTPSTLGLNDKEDLGSKSVGEGPYSELAKLSGSFLKELEKSKFLPSISTKENTLSKSLEEKLRGLSDGFREGAESELMRDAQLNDGAMETGTLYLAEEDPKEQVKRYGGFLRKYPKRSSEVAGEGDGDSMGHEDLYKRYGGFLRRIRPKLKWDNQKRYGGFLRRQFKVVTRSQEDPNAYSGELFDA
|
5
|
+
>Ghost_KH.C10.27.v1.A.SL11_Cint
|
6
|
+
MKLVKKFSILAAIVVCYFGCIADAVPVDTVEKQLLQREGTGNPENFLDWTNQLNSTDDAEDNPFLAENRNSDEENNDYSPGQAESIQSDKRFQSLFKRYPGFQGLFKRHNPHLPDLFKRYNSMGLFKRSPGMLGLFKRGLLGLFKRSDARLQGLFKRDSATQGSFKRSSEAQALPKRYPNFQGLFKRLSEATEYPEDDSSNDDTKQRGNLHSLFKRDTSAHYLEDRGESIPFLFRRS
|
7
|
+
>ENsembl_SNAP00000092003_Csav
|
8
|
+
MYSIQACLLLSILFNPDSIIVKAVPAIDAIERELISKQINKEEVNFIDFTKALNSTALDDMSDDELLWMLGQMIQPIQESTSVNDEEQLSGIDDIEEIDKEQGTNDELNLGKDGDQNQAYFSPQMKRHFGPLFKRMRGLFKRAPNAPLKRGLSGLFRRDPNTPGEPDARKVSDGGRTDTRGMQGLFKREPAFPVDADNSYDGKSHQVKLDRRRMPGLFKRGLQNLFKRAGGANSLFKREDGIENEVGARNRKSDLQEIFKRGIQGLFKRMTTDDLNAENNLGEAPHYRRSFHSLFKRDLSLSWNKSSGENKNKVHSLEKRGENIPFIFKRN
|
@@ -0,0 +1,32 @@
|
|
1
|
+
>PENK_Hsap
|
2
|
+
MA---RFLTLCTWLLLLGPGLLATVRAECSQDCATCSYRLVR-PADINFLACVMECEGKL
|
3
|
+
PSLKIWETCKELLQLSKPELPQDGTSTLRENSKPEESHL---------------------
|
4
|
+
-----------------------------------LAKR-----YGGFMKRY--------
|
5
|
+
-----GGFMKKMDE--LYPMEPEEEANGSEILAKRYGGF---MKKDAEEDDSLANSSD--
|
6
|
+
-------------LLKELLETGDNRERSHHQDGSDNEEEVSKRYGGFMRGL-KRSPQLED
|
7
|
+
E---------AKELQKRY---GGFMRRVG----RPEW--WMDYQKRYGGFL-----KR-F
|
8
|
+
AEALPSDEEGESYSK-------EVPEMEKRYGG----FMRF
|
9
|
+
>PDYN_Hsap
|
10
|
+
MAW--QGLVLAACLLMF-----PSTTADCLSRCSLCAVKTQDGPKPINPLICSLQCQAAL
|
11
|
+
LPSEEWERCQSFLSFFTP-------STLGLNDKED---L---------------------
|
12
|
+
-----------------------------------GSKSVGEGPYSELAKLS--------
|
13
|
+
-----GSFLKELEKSKFLPSISTKENTLSKSLEEKLRGLSDGFREGAESE--LMRDAQ--
|
14
|
+
-------------LNDGAMETGTLYLA------EEDPKEQVKRYGGFLRKYPKRSSEVAG
|
15
|
+
EG--DGDSMGHEDLYKRY---GGFLRRI-----RPKL--KWDNQKRYGGFL-----RRQF
|
16
|
+
KVVTRSQEDPNAYSG-------ELFDA--------------
|
17
|
+
>Ghost_KH.C10.27.v1.A.SL11_Cint
|
18
|
+
MKLVKKFSILAAIVV-------------CYFGCIADAVP-VD------------TVEKQL
|
19
|
+
LQREGTGNPENFLDWTNQL-----NST---DDAEDNPFLA--------------------
|
20
|
+
------------ENRNSDEEN--NDYSPGQAESIQSDKR-----FQSLFKRY--------
|
21
|
+
-----PGFQGLFKR--HNPHLPDLFK------RYNSMGL---FKRSPG------------
|
22
|
+
--------------MLGLFKRGLLGL--------------FKRSDARLQGLFKRDSATQG
|
23
|
+
S---FKRSSEAQALPKRYPNFQGLFKRLSEATEYPEDDSSNDDTKQRGNL----------
|
24
|
+
HSLFKRDTS--------------AHYLEDRGESIPFLFRRS
|
25
|
+
>ENsembl_SNAP00000092003_Csav
|
26
|
+
MYSI-QACLLLSILF-------------NPDSIIVKAVPAID------------AIEREL
|
27
|
+
ISKQINKEEVNFIDFTKAL-----NST-ALDDMSDDELLWMLGQMIQPIQESTSVNDEEQ
|
28
|
+
LSGIDDIEEIDKEQGTNDELNLGKDGDQNQAYFSPQMKR----HFGPLFKRMRGLFKRAP
|
29
|
+
NAPLKRGLSGLFRRDPNTPGEPDARK-VSDGGRTDTRGMQGLFKREPA----FPVDADNS
|
30
|
+
YDGKSHQVKLDRRRMPGLFKRGLQNL--------------FKRAGG-ANSLFKREDGIEN
|
31
|
+
EVGARNRKSDLQEIFKRG--IQGLFKRM-----------TTDDLNAENNLGEAPHYRRSF
|
32
|
+
HSLFKRDLS-LSWNKSSGENKNKVHSLEKRGENIPFIFKRN
|
@@ -0,0 +1,28 @@
|
|
1
|
+
>jgi_176362_Lgig
|
2
|
+
MVAKGTVGILIVLFNTICANIDLNYNQVPVANPLLFGRRGINPDMSSLFFGKRSGNSDHRDLRKMKDTCKAVLSSCKILFSDYEDDTVRNKVQDGFGRFK
|
3
|
+
>gi_207118044_Hasi
|
4
|
+
MNCKIPCLLLVLTFCIMSFTHAQANPRNLNRLVGQQPLLFGRRGVNPNMNSLFFGKRAPSMNNMDVRTMCNAVLSACAAWQADMTDN
|
5
|
+
>gi_260928914_Cgig
|
6
|
+
MKIYSIISIVIALVAVIVLKTSASKENSRGLTRLVGQQPLLFGRRGMNPNMNSLFFGKRAVDRPTLDDIIVEKCSRIMAACREYAHERMGEDDI
|
7
|
+
>gi_117945496_Ipar
|
8
|
+
MSGRRNLLVPASLVLILSAILFFGHETQQVEAAYSPTRGQQNTHSFGRRGLNPNVNSLFFGKRGGSEQEALSNTEMGRKCLAAMSMCNMYFETNTINES
|
9
|
+
>jgi_175046_Lgig
|
10
|
+
MNRCTACLVLVLVVILTVNAVQSARGNGRQRPQLFGRHGVRPGMNGLVFGKRNSESQEMQQDCWSSLNLCLKVILNNGDMEEV
|
11
|
+
>gi_161198869_Ctel
|
12
|
+
MDCRLVTFVALFCSMLLVQQVLSDPLEDHLPETSGLFFGKRSSHPNMNNLLFGRRSYAQMAANYQVEEARQGICKSMKETCGKWGFDVEN
|
13
|
+
>gi_301553931_Apom
|
14
|
+
MQTKIVISACILAAMLVFQCACADPLRDQLPDTTGLFFGKRGSHPNMNNLLFGRRSYPIEDLEDARKVCRAVQATCARWGLDEN
|
15
|
+
>gi_326351257_Ecom
|
16
|
+
MDIKIVILACSLTVLLLSRQASTEPLEDQLPEDTGLFFGKRTSHNPNMNNLVFGRRSYQPKVQRRMNAEDAKRICLNVRLTCAKWFAEEDQMRNLKH
|
17
|
+
>BCM_GLEAN_08645_Tcas
|
18
|
+
MQLALAKVFSVCIVVIILTSWIEMTEATYRKPPFNGSIFGKRGATIGKLLTFVIFLSKIISSEYDSASKALSAMCEIASEACQTWFPSQEK
|
19
|
+
>gi_118778560_Agam
|
20
|
+
MAAFKVLGSLIVVLLVVLALSGHAEAGYRKPPFNGSIFGKRNGNSVDYEGNAKVLSTMCEIAAEACQSWFTQEQK
|
21
|
+
>Ensembl_FBtr0091490_IFa_Dmel
|
22
|
+
MALRFTLTLLLVTILVAAILLGSSEAAYRKPPFNGSIFGKRNSLGKSKIRIPLKPPPISPSRLRQRQNERRLRGGHGGVSHVVSPERQQIGPRPATPPPRTDLEPTTNTPATGGQMLCLLVRLNVEMPDVKKVMYKIYNVSRAYRYIELMPYIYIKYSINLQH
|
23
|
+
>jgi_260818_Dpul
|
24
|
+
MRSSFIVVMVCVVVVLTFWGQVAEATRKLPFNGSIFGKRSNQGTDKLESPSNLQLLCDAAMNACSDWLPIGSK
|
25
|
+
>Ensembl_F37A8.4_Cele
|
26
|
+
MWYIALLLAVIATSVTAQKADDEPIVFLVRVPIDEMDDDSSLLESYYHPRDILSKRAIPFNGGMYGKRSTMPFSGGMYGKRSGQIFAQRRAAIPFSGGMYGKRSLVPQSYSNNENQIKRGAMPFSGGMYGR
|
27
|
+
>MPI_GENEPREDICTION_JIGTRA00000189416_Ppac
|
28
|
+
MTFSGGMYGKRAAPSQFSGGMYGKRSETNYKRGPVMFSGGMYGKRAAPSQFSGGMYGKRAVPMTFSGGMYGKRASSPMMFGGGMYGKRAPMPYSGGMYGR
|
@@ -0,0 +1,70 @@
|
|
1
|
+
>jgi_176362_Lgig
|
2
|
+
MVAKGTVGILIVLFNTI---------CANIDLNYNQVPVANPL---------LFGRRGIN
|
3
|
+
-PDMSSLFFGKRSGNSDHR-----------------------------------------
|
4
|
+
---------------------------DLRKMKD-TCKAVLSSCKILFSD---YEDDTVR
|
5
|
+
NKVQDGFG-----RF----------------K
|
6
|
+
>gi_207118044_Hasi
|
7
|
+
MNCKIPCLLLVLTFCIMSFTH-----AQANPRNLNRLVGQQPL---------LFGRRGVN
|
8
|
+
-PNMNSLFFGKRA-----------------------------------------------
|
9
|
+
------PSM------------------NNMDVRT-MCNAVLSACAAWQAD---MTDN---
|
10
|
+
--------------------------------
|
11
|
+
>gi_260928914_Cgig
|
12
|
+
MKIYSIISIVIALVAVIVLKTSA---SKENSRGLTRLVGQQPL---------LFGRRGMN
|
13
|
+
-PNMNSLFFGKRAVD---------RP----------------------------------
|
14
|
+
---------------------------TLDDIIVEKCSRIMAACREYAHER-MGEDD---
|
15
|
+
-------------------------------I
|
16
|
+
>gi_117945496_Ipar
|
17
|
+
MSGRRNLLVPASLVLILSAILFFGHETQQVEAAYSPTRGQQNT-----H---SFGRRGLN
|
18
|
+
-PNVNSLFFGKRGGS---------------------------------------------
|
19
|
+
----EQEAL------------------SNTEMGR-KCLAAMSMCNMYFETNTINES----
|
20
|
+
--------------------------------
|
21
|
+
>jgi_175046_Lgig
|
22
|
+
MNRCTACLVLVLVVILTVNA------VQSARGNGRQRPQ-------------LFGRHGVR
|
23
|
+
-PGMNGLVFGKRNS----------------------------------------------
|
24
|
+
---------------------------ESQEMQQ-DCWSSLNLCLKVILN---NGD--ME
|
25
|
+
EV------------------------------
|
26
|
+
>gi_161198869_Ctel
|
27
|
+
MDCRLVTFVALFCSMLLVQ-------QVLSDPLEDHLPETSGL---------FFGKRSSH
|
28
|
+
-PNMNNLLFGRRSY----------------------------------------------
|
29
|
+
------AQM---AANY-----------QVEEARQGICKSMKETCGKWGFD---VEN----
|
30
|
+
--------------------------------
|
31
|
+
>gi_301553931_Apom
|
32
|
+
MQTKIVISACILAAMLVFQ-------CACADPLRDQLPDTTGL---------FFGKRGSH
|
33
|
+
-PNMNNLLFGRRSYP---------------------------------------------
|
34
|
+
----IE---------------------DLEDARK-VCRAVQATCARWGLD----EN----
|
35
|
+
--------------------------------
|
36
|
+
>gi_326351257_Ecom
|
37
|
+
MDIKIVILACSLTVLLLSR-------QASTEPLEDQLPEDTGL---------FFGKRTSH
|
38
|
+
NPNMNNLVFGRRSYQ---------------------------------------------
|
39
|
+
--PKVQRRM------------------NAEDAKR-ICLNVRLTCAKWFAE----EDQ-MR
|
40
|
+
NLKH----------------------------
|
41
|
+
>BCM_GLEAN_08645_Tcas
|
42
|
+
MQLALAKVFSVCIVVIILTSW-----IEMTEATYRKPP----------------------
|
43
|
+
---FNGSIFGKRGAT--------------------------------IGKLLTFVIFLSK
|
44
|
+
IISSEYD--------------------SASKALSAMCEIASEACQTWFPS---QEK----
|
45
|
+
--------------------------------
|
46
|
+
>gi_118778560_Agam
|
47
|
+
MAAFKVLGSLIVVLLVVLAL------SGHAEAGYRKPP----------------------
|
48
|
+
---FNGSIFGKRNGN---------------------------------------------
|
49
|
+
--SVDYE--------------------GNAKVLSTMCEIAAEACQSWFTQ---EQK----
|
50
|
+
--------------------------------
|
51
|
+
>Ensembl_FBtr0091490_IFa_Dmel
|
52
|
+
MALRFTLTLLLVTILVAAIL------LGSSEAAYRKPP----------------------
|
53
|
+
---FNGSIFGKRNSLGKSKIRIPLKPPPISPSRLRQRQNERRLRGGHGG--------VSH
|
54
|
+
VVSPERQQI-------GPRPATPPPRTDLEPTTNTPATGGQMLCLLVRLN---VEMPDVK
|
55
|
+
KVMYKIYNVSRAYRYIELMPYIYIKYSINLQH
|
56
|
+
>jgi_260818_Dpul
|
57
|
+
MRSSFIVVMVCVVVVLTF--------WGQVAEATRKLP----------------------
|
58
|
+
---FNGSIFGKRSNQGTDKL----------------------------------------
|
59
|
+
---------------------------ESPSNLQLLCDAAMNACSDWLPI---GSK----
|
60
|
+
--------------------------------
|
61
|
+
>Ensembl_F37A8.4_Cele
|
62
|
+
MWYIALLLAVIATSVTAQKADDEP-IVFLVRVPIDEMDDDSSLLESYYHPRDILSKRAIP
|
63
|
+
---FNGGMYGKRSTM------------PFS--------------GGMYGKR------SGQ
|
64
|
+
IFAQRRAAIPFSGGMYGKRSLVPQSYSNNENQIK--------------------------
|
65
|
+
-------------R--GAMPFSGGMYG----R
|
66
|
+
>MPI_GENEPREDICTION_JIGTRA00000189416_Ppac
|
67
|
+
MTFS----------------------------------------------GGMYGKRAAP
|
68
|
+
-SQFSGGMYGKRSETNYKR-----GPVMFS--------------GGMYGKRAAPSQFSGG
|
69
|
+
MYGKRAVPMTFSGGMYGKRASSPMMFGGGMYGKR--------------------------
|
70
|
+
----------------APMPYSGGMYG----R
|
@@ -0,0 +1,10 @@
|
|
1
|
+
>Uniprot_TRH_Hsap
|
2
|
+
MPGPWLLLALALTLNLTGVPGGRAQPEAAQQEAVTAAEHPGLDDFLRQVERLLFLRENIQRLQGDQGEHSASQIFQSDWLSKRQHPGKREEEEEEGVEEEEEEEGGAVGPHKRQHPGRREDEASWSVDVTQHKRQHPGRRSPWLAYAVPKRQHPGRRLADPKAQRSWEEEEEEEEREEDLMPEKRQHPGKRALGGPCGPQGAYGQAGLLLGLLDDLSRSQGAEEKRQHPGRRAAWVREPLEE
|
3
|
+
>Ensembl_ENSGALT00000013835_Ggal
|
4
|
+
MPSIQLPVLLLCLTLSGVCLNGRQFPPELSENMGRSSLDDILQRSGSHMLQSVLKKVEKKEEMNKELNMPLPQWLSKRQHPGKRYISDPEKRQHPGKRDVEEKASFGDIQKRQHLGKTEVEGYLVNYLELKKRQHPGRRSLWDQSTDISSSQLTYLNELSKRQHPGRRYLMYKHQHPSKRGWNDELDLSDQNWEKHQQFGNRDRDSDSPDYTGPCDLQQSAICNKDSLLLDLAEKFSKEGVEEKHQHPGRRSAWENETEE
|
5
|
+
>Ensembl_ENSDART00000018054_Drer
|
6
|
+
MRAVCVFVLACVAVSGAPGVRGQDGPAEEELFQRAEDLLLRSILTQMEEQNSENDQPEWMEKRQHPGKRQHPGKREEDLEPEVEMERWRRQHPGKRAPLDLGMLEDPTALSELSKRQHPGKRYLMLLHKRQHPGRRELQEADGHSAELEKRQHPGKRRCEGWADAGCGLLELLDTSGAPEKRQHPGRRAELEDELPGLE
|
7
|
+
>jgi_102993_Bflo
|
8
|
+
MAAHLCILLLLTAIRLAHGAEPAHGAEPAHGAEPAHGAEPAHGAEPGPLAHGAEPAHGAEPGPLAHGAEPAHGAEPGPLAPWPDTEAPRERDSGTTREPWERALLEDMARVLGALALYDADMEVMNQEETSPPFTHGGAELGQLLTDSFLLQSTDKRQSPGKRQSPGKRQSPGKRQSPGKRQSPGKRQSPGKRGDDEITLPMGLRFEPLFSSALSESSTDKRQSAGKRQSPGKRQSPGKRQSPGKRQSPGKRTFPFPGTPQMETHDATDARANLLTLLDLVEQKRQSPGKRQHPGKRADWLRPSPEEPWLLYPPEKPDVLLPFISSWSPESGIEDGGMASDGARDDKRQSPGKRQSPGKRQSPGKRQSPGKRDDAETGLPQGLPFDPLFYSAFGESSTDKRQSPGKRQSPGKRQSPGKRQSPGKRQSPGKRQSPGKRGGELSAAAAGQGAYAPAGSRKDWTEKPAIYTTFPAGF
|
9
|
+
>gi109402869_Spur
|
10
|
+
MKGTVGLYMWACILGYVTWGGAALPTILGKELVLSENDGPEIADWVQGKEIPLRNQYWGDVAEEEEEDELGMLSPDSEKRQYPGGKRQYPGGKRQYPGGKRQYPGGKRQFPAGKRQFVGGELIPSPELRQWPGGXRQWPGGXRQWPGGKRQYPGGKRQYPGGKRQWPEIKRQYPGGKRSEDDQDLLAMEIRQYPGG
|
@@ -0,0 +1,50 @@
|
|
1
|
+
>Uniprot_TRH_Hsap
|
2
|
+
MPGPWLLLALALTLNLT-GVPGGRAQPE--------------------------------
|
3
|
+
---------------------------AAQQEAVTAAEHPG---LDDFLRQVERLLFLRE
|
4
|
+
NIQRLQGDQGEH-------SASQIFQSDWL-----SKRQHPGKREEEEEEGVEEEEEEEG
|
5
|
+
GAVGPHKRQHPGRREDEAS-----------------------------------------
|
6
|
+
---------------------WSVD-----------------VTQH-----KRQHPGRRS
|
7
|
+
PWLAYAV--------P--------------------------------KRQHPGRRL---
|
8
|
+
----ADPKAQRSWEEEEEEEEREE---------------DLMPEKRQHPGKRA-------
|
9
|
+
LGGPCGPQGAYGQA--GLLLGLLDDLSRSQGAEEKRQHPGRRAA----------------
|
10
|
+
----WVREPLE-------E
|
11
|
+
>Ensembl_ENSGALT00000013835_Ggal
|
12
|
+
MPSIQLPVLL-LCLTLS-GV-CLNGRQF--------------------------------
|
13
|
+
---------------------------PPE-----LSENMGRSSLDDILQRSGSHM-LQS
|
14
|
+
VLKKVEKKEEMN-------KELNMPLPQWL-----SKRQHPGKRYISD------------
|
15
|
+
----PEKRQHPGKRDVEEKA------------------------SFGDIQ----------
|
16
|
+
------KRQHLGK--------TEVEGY-----------LVNYLELK-----KRQHPGRRS
|
17
|
+
LWDQST----------DISSSQLTYLNELS------------------KRQHPGRRY--L
|
18
|
+
MYKHQHP-SKRGWNDELDLS-------------------DQNWEKHQQFGNRDRDSDSPD
|
19
|
+
YTGPCDLQQSAICNKDSLLLDLAEKFSKE-GVEEKHQHPGRRSA----------------
|
20
|
+
----WENETEE--------
|
21
|
+
>Ensembl_ENSDART00000018054_Drer
|
22
|
+
MRAVCVFVL--ACVAVS-GAPGVRGQDG--------------------------------
|
23
|
+
---------------------------PAE---------------EELFQRAEDLL-LRS
|
24
|
+
ILTQMEEQNSEN-------DQ-----PEWM-----EKRQHPG------------------
|
25
|
+
------KRQHPGKREEDLE-----------------------------------------
|
26
|
+
---------------------PEVE-----------------MERW-----RRQHPGKRA
|
27
|
+
PLDLGMLED------P-------TALSELS------------------KRQHPGKRYLML
|
28
|
+
LHKRQHP-GRRELQEADGHS--------------------AELEKRQHPGKRR-------
|
29
|
+
----CEGWADAGCG-------LLELLDTS-GAPEKRQHPGRRAE----------------
|
30
|
+
----LEDELPGL------E
|
31
|
+
>jgi_102993_Bflo
|
32
|
+
MAAHLCILLLLTAIRLAHGAEPAHGAEPAHGAEPAHGAEPAHGAEPGPLAHGAEPAHGAE
|
33
|
+
PGPLAHGAEPAHGAEPGPLAPWPDTEAPRERDSGTTREPWERALLEDMARVLGALA-LYD
|
34
|
+
ADMEVMNQEETSPPFTHGGAELGQLLTDSFLLQSTDKRQSPGKRQSPGKRQSPGKRQSPG
|
35
|
+
KRQSPGKRQSPGKRGDDEITLPMGLRFEPLFSSALSESSTDKRQSAGKRQSPGKRQSPGK
|
36
|
+
RQSP-GKRQSPGKRTFPFPGTPQMETHDATDARANLLTLLDLVEQKRQSPGKRQHPGKRA
|
37
|
+
DWLRPSPEEPWLLYPPEKPDVLLPFISSWSPESGIEDGGMASDGARDDKRQSPGKRQ--S
|
38
|
+
PGKRQSP-GKRQSPGKRDDAETGLPQGLPFDPLFYSAFGESSTDKRQSPGKRQ----SPG
|
39
|
+
KRQSPGKRQSPGKR----------------QSPGKRQSPGKRGGELSAAAAGQGAYAPAG
|
40
|
+
SRKDWTEKPAIYTTFPAGF
|
41
|
+
>gi109402869_Spur
|
42
|
+
MKGTVGLYMW-ACIL---GYVTWGGAAL--------------------------------
|
43
|
+
---------------PTIL--------GKE---LVLSENDG-PEIADWVQGKEIPL-RNQ
|
44
|
+
YWGDVAEEEEE--------DELGMLSPDS------EKRQYPG-----------GKRQYPG
|
45
|
+
G-----KRQYPG----------------------------------GKRQYPG-----GK
|
46
|
+
RQFPAGKRQFVGGELI-----PSPE-----------------LRQW--PGGXRQWPGGXR
|
47
|
+
QW-------------P---------------------GG---------KRQYPG------
|
48
|
+
-GKRQYPGGKRQWPEI----------------------------KRQYPGGKRSED----
|
49
|
+
--------------------------DQDLLAMEIRQYPG--------------------
|
50
|
+
------------------G
|
@@ -0,0 +1,31 @@
|
|
1
|
+
>gi_223023872_Mgal
|
2
|
+
MRLCGLLALISVSIVIVDSSPALSRHKRGFLAGVHDRMGHGFGKRTDPILSSYVDDVDKDDLMTVEDLVRHIMQSEVLADAIVRKFIDINDDGSVSYQELLRKLMR
|
3
|
+
>gi_148318561_Lsta
|
4
|
+
MSRTSLTLQVGVVLLAICLFDITYADERIHRQKRGFRANSASRVAHGYGKRGYLSSNENLPTLSLDQLESSTGLMEEISDGSLMTVNEFSQLLTSHPNLARALVKKFVDINGDDVISTDELFRPILKK
|
5
|
+
>gi_121313125_Acal
|
6
|
+
MLSAPSIAHTGVALLVLMCLCPFSQSTEASLSRAKRGFRLNSASRVAHGYGKRGYASSSGAVPYPELARDVLDNLRAEEEEKELEWSIMSVDELASLLQSHPKLARALVKKFVDINGDNLVTAEELFRPPTRK
|
7
|
+
>gi_163522278_Lgig
|
8
|
+
MKLTLVLVTVTLTITILANAYPQSPSLSHHRSKRGFKANSASRVAHGYGKRGFPSWKNYFQDGGSDVLSVEDMAELVAENPSLAKALLRKFVDTDNDGIISTTELLGTKQMLK
|
9
|
+
>jgi_226681_Ctel
|
10
|
+
MKVSICFIVVALVVCIEVMTSHAANLSRSKRGFRMGAADRFSHGFGKRGGDFNSLIDGESDMVMSDEDLTEIIRADARLAQTFVKRFIDTDGDGFVSRQELFEA
|
11
|
+
>gi_223784927_Apom
|
12
|
+
MKSILCLSVAALMLVAVSGVSSKLTVTGNSRRVARGFRLGAADRFSHGFGKRTDDHLPEVIPGAESDVLLSNAEFAELLRSDEKLANLIVQDFVDKNGDGFITRNELMGYRK
|
13
|
+
>gi_112983783_AT_Bmor
|
14
|
+
MNLTMQLEVIVAVCLVLAEGAPDVRLVRTKQQRPTRGFKNVEMMTARGFGRRDRPHPRAELYGLDNFWVMSEPSPEREVQEVDEKTFESIPLDWFVNEMLNNPDFARFVVEKFIDLNQDGMLSSEELRNV
|
15
|
+
>gi_240248407_Rpro
|
16
|
+
MMRWSSLLVLVALASIINCIKAGSPSSALYSSAARASGRTRTIRGFKNVQLSTARGFGKRTYPDSQLQPDLIPADWMAEELSSNPELARFIIRRFIDVDQDGLVSPVELLRNTVCQEPN
|
17
|
+
>BCM_Contig45963_Apis
|
18
|
+
MAVNNNIMVRLLVIEITFLILAVVNSYPAFEDSEFKHKHRDKGRTIRGFKNMDLSTARGFGKRTDHYMNLMPLDLFVDNKEDSFNQNIPMEVSLEKILKNKYKHFIEKLIDVNHDGYISGEELLLSIDGES
|
19
|
+
>jgi_255977_Dpul
|
20
|
+
MKGKGAFLMVLAGWGLIGLMILTTAVEAAPHPADYTSSSVNNQRDFRSRRGFKTVGLATARGFGKRAPSLSNFNSFQDAAEQMMQQQEENPNSDPDVNGKV
|
21
|
+
>jgi_50560525_Homalodisca_vitripennis
|
22
|
+
MRVYTLLLWLVVLLMSVTANSVPVYLRDKPRSIRGFKNHALSTARGFGKRSDSELSSSETSQFTDRDSFPADWFASEVQNNGELARLVVHKFIDTNQDGELSADELLRPLYGPPTTTYK
|
23
|
+
>sp|P21786|ALLT_MANSE Allatotropin OS=Manduca sexta PE=1 SV=2
|
24
|
+
MNLTMQLAVIVAVCLCLAEGAPDVRLTRTKQQRPTRGFKNVEMMTARGFGKRDRPHPRAERDVDHQAPSARPNRGTPTFKSPTVGIARDFGKRASQYGNEEEIRVTRGTFKPNSNILIARGYGKRTQLPQIDGVYGLDNFWEMLETSPEREVQEVDEKTLESIPLDWFVNEMLNNPDFARSVVRKFIDLNQDGMLSSEELLRNF
|
25
|
+
>sp|Q70XC3|ALLT_SPOFR Allatotropin OS=Spodoptera frugiperda PE=2 SV=2
|
26
|
+
MNISMHLAVAVAAAACLCVCAAAPENRLARTKQQRPTRGFKNVEMMTARGFGKRDRPHTRAEHQDSYDSHARRKFNPKSNLMVAYDFGKRSGNDDVTDEVYGLDNFWEMLEATPEREGQENDEKTLESIPLDWFVNEMLNNPDFARSVVRKFIDLNQHSFGLVRERDAEQSRFRAICGPQVH
|
27
|
+
>tr|G6DGJ8|G6DGJ8_DANPL Allatotropin OS=Danaus plexippus GN=KGM_16925 PE=4 SV=1
|
28
|
+
MVATYYGKRTDNDYLREEEEVVRVIRGSFKPNAKILIARGYGKRQEDPKGEEEIRVTRGTFNPHSNVLIARGYGKRESRDEEHEPNNFWENLEASQDGDNGNDEKTVDR
|
29
|
+
>tr|W5RWF8|W5RWF8_CULPI Allatotropin (Fragment) OS=Culex pipiens PE=4 SV=1
|
30
|
+
LCSVLLCCHTSSAGPARQLASLAARASKIPRSIRAPFRNSEMMTARGFGKRRAPIGANVGGGSASGTMVKHVADETPWGYDKHEAGKLIEELVADGVDSLQMGGAGEQESFPLDWFASEMTTNPALARTILQRFVDTNRDGILTTSELISSPMGGGGAAASDSNDLF
|
31
|
+
|
@@ -0,0 +1,90 @@
|
|
1
|
+
>gi_223023872_Mgal
|
2
|
+
MRLCGLLALISVSIVIV-------------------------DSSPALSRHKRG-FLAGV
|
3
|
+
HDRMGHGFGKR-------------------------------------------------
|
4
|
+
-------TDPILSSYV----------------------DDVDKDDL--------------
|
5
|
+
-----------MTVEDLVRHIMQSEVLADAIVRKFIDINDD----GSVSYQEL----L--
|
6
|
+
RKLMR-------
|
7
|
+
>gi_148318561_Lsta
|
8
|
+
MSRTSLTLQVGVVLLAICLFDITYA-------------------DERIHRQKRG-FRANS
|
9
|
+
ASRVAHGYGKR-------------------------------------------------
|
10
|
+
-------GYLSSNENL----------------------PTLSLDQLESST--------GL
|
11
|
+
MEEISD--GSLMTVNEFSQLLTSHPNLARALVKKFVDINGD----DVISTDEL----F--
|
12
|
+
RPILKK------
|
13
|
+
>gi_121313125_Acal
|
14
|
+
MLSAPSIAHTGVALLVLMCLCPFSQ-----------------STEASLSRAKRG-FRLNS
|
15
|
+
ASRVAHGYGKR-------------------------------------------------
|
16
|
+
-------GYASSSGAVPY--------------------PELARDVLDNLR--------AE
|
17
|
+
EEEKELE-WSIMSVDELASLLQSHPKLARALVKKFVDINGD----NLVTAEEL----F--
|
18
|
+
RPPTRK------
|
19
|
+
>gi_163522278_Lgig
|
20
|
+
-MKLTLV-LVTVTLTITILANAYPQ-----------------SPSLSHHRSKRG-FKANS
|
21
|
+
ASRVAHGYGKR-------------------------------------------------
|
22
|
+
-------GFPSWKNYF----------------------QDGGSDVL--------------
|
23
|
+
------------SVEDMAELVAENPSLAKALLRKFVDTDND----GIISTTEL----LGT
|
24
|
+
KQMLK-------
|
25
|
+
>jgi_226681_Ctel
|
26
|
+
-MKVSIC-FIVVAL-VVCIEVMTSH-------------------AANLSRSKRG-FRMGA
|
27
|
+
ADRFSHGFGKR-------------------------------------------------
|
28
|
+
-------GGD-FNSLI----------------------DG-ESDMV--------------
|
29
|
+
-----------MSDEDLTEIIRADARLAQTFVKRFIDTDGD----GFVSRQEL----FEA
|
30
|
+
------------
|
31
|
+
>gi_223784927_Apom
|
32
|
+
-MKSILC-LSVAALMLVAVSGVSSK---------L-------TVTGNSRRVARG-FRLGA
|
33
|
+
ADRFSHGFGKR-------------------------------------------------
|
34
|
+
-------TDDHLPEVI----------------------PGAESDVL--------------
|
35
|
+
-----------LSNAEFAELLRSDEKLANLIVQDFVDKNGD----GFITRNEL----MGY
|
36
|
+
RK----------
|
37
|
+
>gi_112983783_AT_Bmor
|
38
|
+
-MNLTMQLEVIVAV---CLVLAEGA----PDVRLV-------RTKQQ--RPTRG-FK-NV
|
39
|
+
EMMTARGFGRRDRPHPRAE-----------------------------------------
|
40
|
+
---------------------------------------LYGLDNFWVMSEPSPEREVQE
|
41
|
+
VDEKT---FESIPLDWFVNEMLNNPDFARFVVEKFIDLNQD----GMLSSEEL-------
|
42
|
+
RNV---------
|
43
|
+
>gi_240248407_Rpro
|
44
|
+
-MMRWSSLLVLVALASIINCIKAGS----PSSALYSSAA---RASGR-TRTIRG-FK-NV
|
45
|
+
QLSTARGFGKRTYPDSQLQ-----------------------------------------
|
46
|
+
------------------------------------------------------------
|
47
|
+
--------PDLIPADWMAEELSSNPELARFIIRRFIDVDQD----GLVSPVEL----L--
|
48
|
+
RNTVCQEPN---
|
49
|
+
>BCM_Contig45963_Apis
|
50
|
+
-MAVNNNIMVRLLVIEITFLILAVV----NSYPAFEDSEFKHKHRDK-GRTIRG-FK-NM
|
51
|
+
DLSTARGFGKRT------------------------------------------------
|
52
|
+
-------------------------------------------DHYMNLMPLD-----LF
|
53
|
+
VDNKEDSFNQNIPMEVSLEKILKNK--YKHFIEKLIDVNHD----GYISGEEL----L--
|
54
|
+
LSIDGES-----
|
55
|
+
>jgi_255977_Dpul
|
56
|
+
MKGKGAFLMVLAGWGLIGLMILTTAVEAAPHPADYTSSS---VNNQRDFRSRRG-FK-TV
|
57
|
+
GLATARGFGKRAP-----------------------------------------------
|
58
|
+
-------SLSNFNSFQD-------------------------------------------
|
59
|
+
------------AAEQMMQQQEENP-------------NSDPDVNGKV------------
|
60
|
+
------------
|
61
|
+
>jgi_50560525_Homalodisca_vitripennis
|
62
|
+
-MRVYTLLLWLVVL-----LMSVTA----NSVPVY--------LRDK-PRSIRG-FK-NH
|
63
|
+
ALSTARGFGKRS------------------------------------------------
|
64
|
+
-------------------------------------------DSELSSSETS-----QF
|
65
|
+
TD------RDSFPADWFASEVQNNGELARLVVHKFIDTNQD----GELSADEL----L--
|
66
|
+
RPLYGPPTTTYK
|
67
|
+
>sp|P21786|ALLT_MANSE Allatotropin OS=Manduca sexta PE=1 SV=2
|
68
|
+
-MNLTMQLAVIVAV---CLCLAEGA----PDVRLT-------RTKQQ--RPTRG-FK-NV
|
69
|
+
EMMTARGFGKRDRPHPRAERDVDHQAPSARPNRGTPTFKSPTVGIARDFGKRASQYGNEE
|
70
|
+
EIRVTRGTFKPNSNIL------IARGYGKRTQLPQI-DGVYGLDNFWEMLETSPEREVQE
|
71
|
+
VDEKT---LESIPLDWFVNEMLNNPDFARSVVRKFIDLNQD----GMLSSEEL----L--
|
72
|
+
RNF---------
|
73
|
+
>sp|Q70XC3|ALLT_SPOFR Allatotropin OS=Spodoptera frugiperda PE=2 SV=2
|
74
|
+
-MNISMHLAVAVAA-AACLCVCAAA----PENRLA-------RTKQQ--RPTRG-FK-NV
|
75
|
+
EMMTARGFGKRDRPHTRAE----HQ----------------------------DSYDSH-
|
76
|
+
----ARRKFNPKSNLM------VAYDFGKRSGNDDVTDEVYGLDNFWEMLEATPEREGQE
|
77
|
+
NDEKT---LESIPLDWFVNEMLNNPDFARSVVRKFIDLNQHS--FGLVRERDAEQSRF--
|
78
|
+
RAICGPQVH---
|
79
|
+
>tr|G6DGJ8|G6DGJ8_DANPL Allatotropin OS=Danaus plexippus GN=KGM_16925 PE=4 SV=1
|
80
|
+
----------MVA------TYYGKR----TDNDYL-------REEEEVVRVIRGSFKPNA
|
81
|
+
KILIARGYGKRQE-DPKGE----EE-----------------------------------
|
82
|
+
-IRVTRGTFNPHSNVL------IARGYGKRESR----DEEHEPNNFWENLEASQDGD-NG
|
83
|
+
NDEKT---VDR-------------------------------------------------
|
84
|
+
------------
|
85
|
+
>tr|W5RWF8|W5RWF8_CULPI Allatotropin (Fragment) OS=Culex pipiens PE=4 SV=1
|
86
|
+
-------------LCSVLLCCHTSS--AGPARQLASLA----ARASKIPRSIRAPFR-NS
|
87
|
+
EMMTARGFGKRRAP----------------------------------------------
|
88
|
+
-IGANVGGGSASGTMVKHVADETPWGYDKHEAGKLI--EELVADGVDSLQMGG-AGE---
|
89
|
+
--------QESFPLDWFASEMTTNPALARTILQRFVDTNRD----GILTTSELISSPMGG
|
90
|
+
GGAAASDSNDLF
|