protk 1.2.0 → 1.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/README.md +69 -36
- data/bin/gffmerge.rb +16 -5
- data/bin/mascot_search.rb +174 -97
- data/bin/omssa_search.rb +31 -8
- data/bin/protk_setup.rb +0 -3
- data/bin/sixframe.rb +0 -6
- data/bin/tandem_search.rb +97 -6
- data/bin/template_search.rb +144 -0
- data/bin/uniprot_annotation.rb +130 -0
- data/lib/convert_util.rb +27 -0
- data/lib/pepxml.rb +22 -0
- data/lib/protk/big_search_rakefile.rake +16 -0
- data/lib/protk/big_search_tool.rb +23 -0
- data/lib/protk/bio_sptr_extensions.rb +41 -2
- data/lib/protk/constants.rb +13 -0
- data/lib/protk/data/apt-get_packages.yaml +4 -0
- data/lib/protk/data/default_config.yml +1 -0
- data/lib/protk/data/make_uniprot_table.rb +29 -0
- data/lib/protk/data/predefined_db.trembl_annotation.yaml +20 -0
- data/lib/protk/data/uniprot_accessions.loc +96 -0
- data/lib/protk/data/uniprot_accessions_table.txt +97 -0
- data/lib/protk/data/uniprot_input_accessions.loc +95 -0
- data/lib/protk/manage_db_rakefile.rake +25 -11
- data/lib/protk/omssa_util.rb +1 -1
- data/lib/protk/setup_rakefile.rake +39 -2
- metadata +13 -1
data/lib/convert_util.rb
ADDED
@@ -0,0 +1,27 @@
|
|
1
|
+
require 'libxml'
|
2
|
+
require 'constants'
|
3
|
+
|
4
|
+
class ConvertUtil
|
5
|
+
|
6
|
+
def self.ensure_mzml_indexed(run_file)
|
7
|
+
if unindexed_mzml?(run_file)
|
8
|
+
index_mzml(run_file)
|
9
|
+
end
|
10
|
+
end
|
11
|
+
|
12
|
+
def self.index_mzml(mzml_file)
|
13
|
+
Dir.mktmpdir do |tmpdir|
|
14
|
+
genv=Constants.new
|
15
|
+
%x["#{genv.tpp_bin}/msconvert -o #{tmpdir} #{mzml_file}"]
|
16
|
+
indexed_file = Dir["#{tmpdir}/*"][0]
|
17
|
+
FileUtils.mv(indexed_file, mzml_file)
|
18
|
+
end
|
19
|
+
end
|
20
|
+
|
21
|
+
def self.unindexed_mzml?(mzml_file)
|
22
|
+
reader = LibXML::XML::Reader.file(mzml_file)
|
23
|
+
reader.read
|
24
|
+
reader.name == "mzML"
|
25
|
+
end
|
26
|
+
|
27
|
+
end
|
data/lib/pepxml.rb
ADDED
@@ -0,0 +1,22 @@
|
|
1
|
+
require 'rubygems'
|
2
|
+
require 'rexml/document'
|
3
|
+
require 'rexml/xpath'
|
4
|
+
|
5
|
+
class PepXML
|
6
|
+
def initialize(file_name)
|
7
|
+
@doc=REXML::Document.new(File.new(file_name))
|
8
|
+
end
|
9
|
+
|
10
|
+
def find_runs()
|
11
|
+
runs = {}
|
12
|
+
REXML::XPath.each(@doc,"//msms_run_summary") do |summary|
|
13
|
+
base_name = summary.attributes["base_name"]
|
14
|
+
if not runs.has_key?(base_name)
|
15
|
+
runs[base_name] = {:base_name => summary.attributes["base_name"],
|
16
|
+
:type => summary.attributes["raw_data"]}
|
17
|
+
end
|
18
|
+
end
|
19
|
+
runs
|
20
|
+
end
|
21
|
+
|
22
|
+
end
|
@@ -0,0 +1,23 @@
|
|
1
|
+
# create rake dependencies
|
2
|
+
# run rakefile
|
3
|
+
#
|
4
|
+
require 'optparse'
|
5
|
+
require 'pathname'
|
6
|
+
require 'protk/tool'
|
7
|
+
require 'protk/command_runner'
|
8
|
+
require 'pp'
|
9
|
+
require 'rake'
|
10
|
+
|
11
|
+
class BigSearchTool < Tool
|
12
|
+
|
13
|
+
def run input_files
|
14
|
+
command = "rake -f #{rakefile_path} #{input_files.join(" ")}"
|
15
|
+
runner=CommandRunner.new(Constants.new)
|
16
|
+
runner.run_local(command)
|
17
|
+
end
|
18
|
+
|
19
|
+
def rakefile_path
|
20
|
+
"#{File.dirname(__FILE__)}/big_search_rakefile.rake"
|
21
|
+
end
|
22
|
+
|
23
|
+
end
|
@@ -177,7 +177,26 @@ class Bio::SPTR < Bio::EMBLDB
|
|
177
177
|
return self.safely_get_drentry_for_key("NextBio")
|
178
178
|
end
|
179
179
|
|
180
|
-
|
180
|
+
def uniprot_link
|
181
|
+
return "http://www.uniprot.org/uniprot/#{self.accession}.html"
|
182
|
+
end
|
183
|
+
|
184
|
+
def nextbio_link
|
185
|
+
return "http://www.nextbio.com/b/home/home.nb?id=#{self.nextbio}&type=feature"
|
186
|
+
end
|
187
|
+
|
188
|
+
def intact_link
|
189
|
+
return "http://www.ebi.ac.uk/intact/pages/interactions/interactions.xhtml?query=#{self.intact}*"
|
190
|
+
end
|
191
|
+
|
192
|
+
def pride_link
|
193
|
+
return "http://www.ebi.ac.uk/pride/searchSummary.do?queryTypeSelected=identification%20accession%20number&identificationAccessionNumber=#{self.pride}"
|
194
|
+
end
|
195
|
+
|
196
|
+
def ensembl_link
|
197
|
+
return "http://www.ensembl.org/Homo_sapiens/Transcript/Summary?db=core;t=#{self.ensembl}"
|
198
|
+
end
|
199
|
+
|
181
200
|
# Number of transmembrane regions
|
182
201
|
#
|
183
202
|
def num_transmem
|
@@ -206,5 +225,25 @@ class Bio::SPTR < Bio::EMBLDB
|
|
206
225
|
p "Warning: Unable to parse feature table for entry #{self.accession}"
|
207
226
|
end
|
208
227
|
end
|
209
|
-
|
228
|
+
|
229
|
+
def ref_dump
|
230
|
+
return self.ref.to_s
|
231
|
+
end
|
232
|
+
|
233
|
+
def seq_dump
|
234
|
+
return self.seq.to_s
|
235
|
+
end
|
236
|
+
|
237
|
+
def tax_dump
|
238
|
+
return self.ox.to_s
|
239
|
+
end
|
240
|
+
|
241
|
+
def species_dump
|
242
|
+
return self.os.to_s
|
243
|
+
end
|
244
|
+
|
245
|
+
def feature_dump
|
246
|
+
return self.ft.to_s
|
247
|
+
end
|
248
|
+
|
210
249
|
end
|
data/lib/protk/constants.rb
CHANGED
@@ -169,6 +169,19 @@ class Constants
|
|
169
169
|
return "#{self.openms_root}/bin/ExecutePipeline"
|
170
170
|
end
|
171
171
|
|
172
|
+
def tandem_root
|
173
|
+
path=@env['tandem_root']
|
174
|
+
if ( path =~ /^\//)
|
175
|
+
return path
|
176
|
+
else
|
177
|
+
return "#{@protk_dir}/#{@env['tandem_root']}"
|
178
|
+
end
|
179
|
+
end
|
180
|
+
|
181
|
+
def gpmtandem
|
182
|
+
return "#{self.tandem_root}/bin/tandem"
|
183
|
+
end
|
184
|
+
|
172
185
|
def protein_database_root
|
173
186
|
path=@env['protein_database_root']
|
174
187
|
if ( path =~ /^\// )
|
@@ -0,0 +1,29 @@
|
|
1
|
+
#!/usr/bin/env ruby
|
2
|
+
|
3
|
+
file_name = ARGV[0]
|
4
|
+
|
5
|
+
out_fh = File.new("uniprot_accessions.loc",'w')
|
6
|
+
|
7
|
+
File.foreach(file_name) { |line|
|
8
|
+
cols= line.chomp.split("\t")
|
9
|
+
if ( cols[2]!="from" )
|
10
|
+
db_key = "#{cols[0].gsub(" ","_").downcase}_"
|
11
|
+
out_fh.write "#{cols[0]}\t#{db_key}\t#{cols[1]}\t#{db_key}\n"
|
12
|
+
end
|
13
|
+
}
|
14
|
+
|
15
|
+
out_fh.close
|
16
|
+
|
17
|
+
|
18
|
+
|
19
|
+
out_fh = File.new("uniprot_input_accessions.loc",'w')
|
20
|
+
|
21
|
+
File.foreach(file_name) { |line|
|
22
|
+
cols= line.chomp.split("\t")
|
23
|
+
if ( cols[2]!="to" )
|
24
|
+
db_key = "#{cols[0].gsub(" ","_").downcase}_"
|
25
|
+
out_fh.write "#{cols[0]}\t#{db_key}\t#{cols[1]}\t#{db_key}\n"
|
26
|
+
end
|
27
|
+
}
|
28
|
+
|
29
|
+
out_fh.close
|
@@ -0,0 +1,20 @@
|
|
1
|
+
#
|
2
|
+
# This is a predefined setup file for manage_db
|
3
|
+
#
|
4
|
+
# Swissprot_uniprot annotation database (full entries for each protein)
|
5
|
+
#
|
6
|
+
---
|
7
|
+
:description: Swissprot Trembl annotation database (full entries for each protein)
|
8
|
+
:archive_old: false
|
9
|
+
:is_annotation_db: true
|
10
|
+
:decoy_prefix: decoy_
|
11
|
+
:include_filters: []
|
12
|
+
|
13
|
+
:format: dat
|
14
|
+
:id_regexes: []
|
15
|
+
|
16
|
+
:make_blast_index: false
|
17
|
+
:sources:
|
18
|
+
- - ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_trembl.dat.gz
|
19
|
+
- ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/reldate.txt
|
20
|
+
:decoys: false
|
@@ -0,0 +1,96 @@
|
|
1
|
+
UniProtKB AC uniprotkb_ac_ ACC uniprotkb_ac_
|
2
|
+
UniProtKB ID uniprotkb_id_ ID uniprotkb_id_
|
3
|
+
UniParc uniparc_ UPARC uniparc_
|
4
|
+
UniRef50 uniref50_ NF50 uniref50_
|
5
|
+
UniRef90 uniref90_ NF90 uniref90_
|
6
|
+
UniRef100 uniref100_ NF100 uniref100_
|
7
|
+
EMBL/GenBank/DDBJ embl/genbank/ddbj_ EMBL_ID embl/genbank/ddbj_
|
8
|
+
EMBL/GenBank/DDBJ CDS embl/genbank/ddbj_cds_ EMBL embl/genbank/ddbj_cds_
|
9
|
+
PIR pir_ PIR pir_
|
10
|
+
UniGene unigene_ UNIGENE_ID unigene_
|
11
|
+
Entrez Gene (GeneID) entrez_gene_(geneid)_ P_ENTREZGENEID entrez_gene_(geneid)_
|
12
|
+
GI number* gi_number*_ P_GI gi_number*_
|
13
|
+
IPI ipi_ P_IPI ipi_
|
14
|
+
RefSeq Protein refseq_protein_ P_REFSEQ_AC refseq_protein_
|
15
|
+
RefSeq Nucleotide refseq_nucleotide_ REFSEQ_NT_ID refseq_nucleotide_
|
16
|
+
PDB pdb_ PDB_ID pdb_
|
17
|
+
DisProt disprot_ DISPROT_ID disprot_
|
18
|
+
HSSP hssp_ HSSP_ID hssp_
|
19
|
+
DIP dip_ DIP_ID dip_
|
20
|
+
MINT mint_ MINT_ID mint_
|
21
|
+
Allergome allergome_ ALLERGOME_ID allergome_
|
22
|
+
MEROPS merops_ MEROPS_ID merops_
|
23
|
+
PeroxiBase peroxibase_ PEROXIBASE_ID peroxibase_
|
24
|
+
PptaseDB pptasedb_ PPTASEDB_ID pptasedb_
|
25
|
+
REBASE rebase_ REBASE_ID rebase_
|
26
|
+
TCDB tcdb_ TCDB_ID tcdb_
|
27
|
+
PhosSite phossite_ PHOSSITE_ID phossite_
|
28
|
+
DMDM dmdm_ DMDM_ID dmdm_
|
29
|
+
Aarhus/Ghent-2DPAGE aarhus/ghent-2dpage_ AARHUS_GHENT_2DPAGE_ID aarhus/ghent-2dpage_
|
30
|
+
World-2DPAGE world-2dpage_ WORLD_2DPAGE_ID world-2dpage_
|
31
|
+
DNASU dnasu_ DNASU_ID dnasu_
|
32
|
+
Ensembl ensembl_ ENSEMBL_ID ensembl_
|
33
|
+
Ensembl Protein ensembl_protein_ ENSEMBL_PRO_ID ensembl_protein_
|
34
|
+
Ensembl Transcript ensembl_transcript_ ENSEMBL_TRS_ID ensembl_transcript_
|
35
|
+
Ensembl Genomes ensembl_genomes_ ENSEMBLGENOME_ID ensembl_genomes_
|
36
|
+
Ensembl Genomes Protein ensembl_genomes_protein_ ENSEMBLGENOME_PRO_ID ensembl_genomes_protein_
|
37
|
+
Ensembl Genomes Transcript ensembl_genomes_transcript_ ENSEMBLGENOME_TRS_ID ensembl_genomes_transcript_
|
38
|
+
GeneID geneid_ P_ENTREZGENEID geneid_
|
39
|
+
GenomeReviews genomereviews_ GENOMEREVIEWS_ID genomereviews_
|
40
|
+
KEGG kegg_ KEGG_ID kegg_
|
41
|
+
PATRIC patric_ PATRIC_ID patric_
|
42
|
+
UCSC ucsc_ UCSC_ID ucsc_
|
43
|
+
VectorBase vectorbase_ VECTORBASE_ID vectorbase_
|
44
|
+
AGD agd_ AGD_ID agd_
|
45
|
+
ArachnoServer arachnoserver_ ARACHNOSERVER_ID arachnoserver_
|
46
|
+
CGD cgd_ CGD cgd_
|
47
|
+
ConoServer conoserver_ CONOSERVER_ID conoserver_
|
48
|
+
CYGD cygd_ CYGD_ID cygd_
|
49
|
+
dictyBase dictybase_ DICTYBASE_ID dictybase_
|
50
|
+
EchoBASE echobase_ ECHOBASE_ID echobase_
|
51
|
+
EcoGene ecogene_ ECOGENE_ID ecogene_
|
52
|
+
euHCVdb euhcvdb_ EUHCVDB_ID euhcvdb_
|
53
|
+
EuPathDB eupathdb_ EUPATHDB_ID eupathdb_
|
54
|
+
FlyBase flybase_ FLYBASE_ID flybase_
|
55
|
+
GeneCards genecards_ GENECARDS_ID genecards_
|
56
|
+
GeneFarm genefarm_ GENEFARM_ID genefarm_
|
57
|
+
GenoList genolist_ GENOLIST_ID genolist_
|
58
|
+
H-InvDB h-invdb_ H_INVDB_ID h-invdb_
|
59
|
+
HGNC hgnc_ HGNC_ID hgnc_
|
60
|
+
HPA hpa_ HPA_ID hpa_
|
61
|
+
LegioList legiolist_ LEGIOLIST_ID legiolist_
|
62
|
+
Leproma leproma_ LEPROMA_ID leproma_
|
63
|
+
MaizeGDB maizegdb_ MAIZEGDB_ID maizegdb_
|
64
|
+
MIM mim_ MIM_ID mim_
|
65
|
+
MGI mgi_ MGI_ID mgi_
|
66
|
+
neXtProt nextprot_ NEXTPROT_ID nextprot_
|
67
|
+
Orphanet orphanet_ ORPHANET_ID orphanet_
|
68
|
+
PharmGKB pharmgkb_ PHARMGKB_ID pharmgkb_
|
69
|
+
PomBase pombase_ POMBASE_ID pombase_
|
70
|
+
PseudoCAP pseudocap_ PSEUDOCAP_ID pseudocap_
|
71
|
+
RGD rgd_ RGD_ID rgd_
|
72
|
+
SGD sgd_ SGD_ID sgd_
|
73
|
+
TAIR tair_ TAIR_ID tair_
|
74
|
+
TubercuList tuberculist_ TUBERCULIST_ID tuberculist_
|
75
|
+
WormBase wormbase_ WORMBASE_ID wormbase_
|
76
|
+
WormBase Transcript wormbase_transcript_ WORMBASE_TRS_ID wormbase_transcript_
|
77
|
+
WormBase Protein wormbase_protein_ WORMBASE_PRO_ID wormbase_protein_
|
78
|
+
Xenbase xenbase_ XENBASE_ID xenbase_
|
79
|
+
ZFIN zfin_ ZFIN_ID zfin_
|
80
|
+
eggNOG eggnog_ EGGNOG_ID eggnog_
|
81
|
+
GeneTree genetree_ GENETREE_ID genetree_
|
82
|
+
HOGENOM hogenom_ HOGENOM_ID hogenom_
|
83
|
+
HOVERGEN hovergen_ HOVERGEN_ID hovergen_
|
84
|
+
KO ko_ KO_ID ko_
|
85
|
+
OMA oma_ OMA_ID oma_
|
86
|
+
OrthoDB orthodb_ ORTHODB_ID orthodb_
|
87
|
+
ProtClustDB protclustdb_ PROTCLUSTDB_ID protclustdb_
|
88
|
+
BioCyc biocyc_ BIOCYC_ID biocyc_
|
89
|
+
Reactome reactome_ REACTOME_ID reactome_
|
90
|
+
UniPathWay unipathway_ UNIPATHWAY_ID unipathway_
|
91
|
+
CleanEx cleanex_ CLEANEX_ID cleanex_
|
92
|
+
GermOnline germonline_ GERMONLINE_ID germonline_
|
93
|
+
ChEMBL chembl_ CHEMBL chembl_
|
94
|
+
DrugBank drugbank_ DRUGBANK_ID drugbank_
|
95
|
+
GenomeRNAi genomernai_ GENOMERNAI_ID genomernai_
|
96
|
+
NextBio nextbio_ NEXTBIO_ID nextbio_
|
@@ -0,0 +1,97 @@
|
|
1
|
+
UniProtKB AC/ID ACC+ID from
|
2
|
+
UniProtKB AC ACC to
|
3
|
+
UniProtKB ID ID to
|
4
|
+
UniParc UPARC both
|
5
|
+
UniRef50 NF50 both
|
6
|
+
UniRef90 NF90 both
|
7
|
+
UniRef100 NF100 both
|
8
|
+
EMBL/GenBank/DDBJ EMBL_ID both
|
9
|
+
EMBL/GenBank/DDBJ CDS EMBL both
|
10
|
+
PIR PIR both
|
11
|
+
UniGene UNIGENE_ID both
|
12
|
+
Entrez Gene (GeneID) P_ENTREZGENEID both
|
13
|
+
GI number* P_GI both
|
14
|
+
IPI P_IPI both
|
15
|
+
RefSeq Protein P_REFSEQ_AC both
|
16
|
+
RefSeq Nucleotide REFSEQ_NT_ID both
|
17
|
+
PDB PDB_ID both
|
18
|
+
DisProt DISPROT_ID both
|
19
|
+
HSSP HSSP_ID both
|
20
|
+
DIP DIP_ID both
|
21
|
+
MINT MINT_ID both
|
22
|
+
Allergome ALLERGOME_ID both
|
23
|
+
MEROPS MEROPS_ID both
|
24
|
+
PeroxiBase PEROXIBASE_ID both
|
25
|
+
PptaseDB PPTASEDB_ID both
|
26
|
+
REBASE REBASE_ID both
|
27
|
+
TCDB TCDB_ID both
|
28
|
+
PhosSite PHOSSITE_ID both
|
29
|
+
DMDM DMDM_ID both
|
30
|
+
Aarhus/Ghent-2DPAGE AARHUS_GHENT_2DPAGE_ID both
|
31
|
+
World-2DPAGE WORLD_2DPAGE_ID both
|
32
|
+
DNASU DNASU_ID both
|
33
|
+
Ensembl ENSEMBL_ID both
|
34
|
+
Ensembl Protein ENSEMBL_PRO_ID both
|
35
|
+
Ensembl Transcript ENSEMBL_TRS_ID both
|
36
|
+
Ensembl Genomes ENSEMBLGENOME_ID both
|
37
|
+
Ensembl Genomes Protein ENSEMBLGENOME_PRO_ID both
|
38
|
+
Ensembl Genomes Transcript ENSEMBLGENOME_TRS_ID both
|
39
|
+
GeneID P_ENTREZGENEID both
|
40
|
+
GenomeReviews GENOMEREVIEWS_ID both
|
41
|
+
KEGG KEGG_ID both
|
42
|
+
PATRIC PATRIC_ID both
|
43
|
+
UCSC UCSC_ID both
|
44
|
+
VectorBase VECTORBASE_ID both
|
45
|
+
AGD AGD_ID both
|
46
|
+
ArachnoServer ARACHNOSERVER_ID both
|
47
|
+
CGD CGD both
|
48
|
+
ConoServer CONOSERVER_ID both
|
49
|
+
CYGD CYGD_ID both
|
50
|
+
dictyBase DICTYBASE_ID both
|
51
|
+
EchoBASE ECHOBASE_ID both
|
52
|
+
EcoGene ECOGENE_ID both
|
53
|
+
euHCVdb EUHCVDB_ID both
|
54
|
+
EuPathDB EUPATHDB_ID both
|
55
|
+
FlyBase FLYBASE_ID both
|
56
|
+
GeneCards GENECARDS_ID both
|
57
|
+
GeneFarm GENEFARM_ID both
|
58
|
+
GenoList GENOLIST_ID both
|
59
|
+
H-InvDB H_INVDB_ID both
|
60
|
+
HGNC HGNC_ID both
|
61
|
+
HPA HPA_ID both
|
62
|
+
LegioList LEGIOLIST_ID both
|
63
|
+
Leproma LEPROMA_ID both
|
64
|
+
MaizeGDB MAIZEGDB_ID both
|
65
|
+
MIM MIM_ID both
|
66
|
+
MGI MGI_ID both
|
67
|
+
neXtProt NEXTPROT_ID both
|
68
|
+
Orphanet ORPHANET_ID both
|
69
|
+
PharmGKB PHARMGKB_ID both
|
70
|
+
PomBase POMBASE_ID both
|
71
|
+
PseudoCAP PSEUDOCAP_ID both
|
72
|
+
RGD RGD_ID both
|
73
|
+
SGD SGD_ID both
|
74
|
+
TAIR TAIR_ID both
|
75
|
+
TubercuList TUBERCULIST_ID both
|
76
|
+
WormBase WORMBASE_ID both
|
77
|
+
WormBase Transcript WORMBASE_TRS_ID both
|
78
|
+
WormBase Protein WORMBASE_PRO_ID both
|
79
|
+
Xenbase XENBASE_ID both
|
80
|
+
ZFIN ZFIN_ID both
|
81
|
+
eggNOG EGGNOG_ID both
|
82
|
+
GeneTree GENETREE_ID both
|
83
|
+
HOGENOM HOGENOM_ID both
|
84
|
+
HOVERGEN HOVERGEN_ID both
|
85
|
+
KO KO_ID both
|
86
|
+
OMA OMA_ID both
|
87
|
+
OrthoDB ORTHODB_ID both
|
88
|
+
ProtClustDB PROTCLUSTDB_ID both
|
89
|
+
BioCyc BIOCYC_ID both
|
90
|
+
Reactome REACTOME_ID both
|
91
|
+
UniPathWay UNIPATHWAY_ID both
|
92
|
+
CleanEx CLEANEX_ID both
|
93
|
+
GermOnline GERMONLINE_ID both
|
94
|
+
ChEMBL CHEMBL both
|
95
|
+
DrugBank DRUGBANK_ID both
|
96
|
+
GenomeRNAi GENOMERNAI_ID both
|
97
|
+
NextBio NEXTBIO_ID both
|
@@ -0,0 +1,95 @@
|
|
1
|
+
UniProtKB AC/ID uniprotkb_ac/id_ ACC+ID uniprotkb_ac/id_
|
2
|
+
UniParc uniparc_ UPARC uniparc_
|
3
|
+
UniRef50 uniref50_ NF50 uniref50_
|
4
|
+
UniRef90 uniref90_ NF90 uniref90_
|
5
|
+
UniRef100 uniref100_ NF100 uniref100_
|
6
|
+
EMBL/GenBank/DDBJ embl/genbank/ddbj_ EMBL_ID embl/genbank/ddbj_
|
7
|
+
EMBL/GenBank/DDBJ CDS embl/genbank/ddbj_cds_ EMBL embl/genbank/ddbj_cds_
|
8
|
+
PIR pir_ PIR pir_
|
9
|
+
UniGene unigene_ UNIGENE_ID unigene_
|
10
|
+
Entrez Gene (GeneID) entrez_gene_(geneid)_ P_ENTREZGENEID entrez_gene_(geneid)_
|
11
|
+
GI number* gi_number*_ P_GI gi_number*_
|
12
|
+
IPI ipi_ P_IPI ipi_
|
13
|
+
RefSeq Protein refseq_protein_ P_REFSEQ_AC refseq_protein_
|
14
|
+
RefSeq Nucleotide refseq_nucleotide_ REFSEQ_NT_ID refseq_nucleotide_
|
15
|
+
PDB pdb_ PDB_ID pdb_
|
16
|
+
DisProt disprot_ DISPROT_ID disprot_
|
17
|
+
HSSP hssp_ HSSP_ID hssp_
|
18
|
+
DIP dip_ DIP_ID dip_
|
19
|
+
MINT mint_ MINT_ID mint_
|
20
|
+
Allergome allergome_ ALLERGOME_ID allergome_
|
21
|
+
MEROPS merops_ MEROPS_ID merops_
|
22
|
+
PeroxiBase peroxibase_ PEROXIBASE_ID peroxibase_
|
23
|
+
PptaseDB pptasedb_ PPTASEDB_ID pptasedb_
|
24
|
+
REBASE rebase_ REBASE_ID rebase_
|
25
|
+
TCDB tcdb_ TCDB_ID tcdb_
|
26
|
+
PhosSite phossite_ PHOSSITE_ID phossite_
|
27
|
+
DMDM dmdm_ DMDM_ID dmdm_
|
28
|
+
Aarhus/Ghent-2DPAGE aarhus/ghent-2dpage_ AARHUS_GHENT_2DPAGE_ID aarhus/ghent-2dpage_
|
29
|
+
World-2DPAGE world-2dpage_ WORLD_2DPAGE_ID world-2dpage_
|
30
|
+
DNASU dnasu_ DNASU_ID dnasu_
|
31
|
+
Ensembl ensembl_ ENSEMBL_ID ensembl_
|
32
|
+
Ensembl Protein ensembl_protein_ ENSEMBL_PRO_ID ensembl_protein_
|
33
|
+
Ensembl Transcript ensembl_transcript_ ENSEMBL_TRS_ID ensembl_transcript_
|
34
|
+
Ensembl Genomes ensembl_genomes_ ENSEMBLGENOME_ID ensembl_genomes_
|
35
|
+
Ensembl Genomes Protein ensembl_genomes_protein_ ENSEMBLGENOME_PRO_ID ensembl_genomes_protein_
|
36
|
+
Ensembl Genomes Transcript ensembl_genomes_transcript_ ENSEMBLGENOME_TRS_ID ensembl_genomes_transcript_
|
37
|
+
GeneID geneid_ P_ENTREZGENEID geneid_
|
38
|
+
GenomeReviews genomereviews_ GENOMEREVIEWS_ID genomereviews_
|
39
|
+
KEGG kegg_ KEGG_ID kegg_
|
40
|
+
PATRIC patric_ PATRIC_ID patric_
|
41
|
+
UCSC ucsc_ UCSC_ID ucsc_
|
42
|
+
VectorBase vectorbase_ VECTORBASE_ID vectorbase_
|
43
|
+
AGD agd_ AGD_ID agd_
|
44
|
+
ArachnoServer arachnoserver_ ARACHNOSERVER_ID arachnoserver_
|
45
|
+
CGD cgd_ CGD cgd_
|
46
|
+
ConoServer conoserver_ CONOSERVER_ID conoserver_
|
47
|
+
CYGD cygd_ CYGD_ID cygd_
|
48
|
+
dictyBase dictybase_ DICTYBASE_ID dictybase_
|
49
|
+
EchoBASE echobase_ ECHOBASE_ID echobase_
|
50
|
+
EcoGene ecogene_ ECOGENE_ID ecogene_
|
51
|
+
euHCVdb euhcvdb_ EUHCVDB_ID euhcvdb_
|
52
|
+
EuPathDB eupathdb_ EUPATHDB_ID eupathdb_
|
53
|
+
FlyBase flybase_ FLYBASE_ID flybase_
|
54
|
+
GeneCards genecards_ GENECARDS_ID genecards_
|
55
|
+
GeneFarm genefarm_ GENEFARM_ID genefarm_
|
56
|
+
GenoList genolist_ GENOLIST_ID genolist_
|
57
|
+
H-InvDB h-invdb_ H_INVDB_ID h-invdb_
|
58
|
+
HGNC hgnc_ HGNC_ID hgnc_
|
59
|
+
HPA hpa_ HPA_ID hpa_
|
60
|
+
LegioList legiolist_ LEGIOLIST_ID legiolist_
|
61
|
+
Leproma leproma_ LEPROMA_ID leproma_
|
62
|
+
MaizeGDB maizegdb_ MAIZEGDB_ID maizegdb_
|
63
|
+
MIM mim_ MIM_ID mim_
|
64
|
+
MGI mgi_ MGI_ID mgi_
|
65
|
+
neXtProt nextprot_ NEXTPROT_ID nextprot_
|
66
|
+
Orphanet orphanet_ ORPHANET_ID orphanet_
|
67
|
+
PharmGKB pharmgkb_ PHARMGKB_ID pharmgkb_
|
68
|
+
PomBase pombase_ POMBASE_ID pombase_
|
69
|
+
PseudoCAP pseudocap_ PSEUDOCAP_ID pseudocap_
|
70
|
+
RGD rgd_ RGD_ID rgd_
|
71
|
+
SGD sgd_ SGD_ID sgd_
|
72
|
+
TAIR tair_ TAIR_ID tair_
|
73
|
+
TubercuList tuberculist_ TUBERCULIST_ID tuberculist_
|
74
|
+
WormBase wormbase_ WORMBASE_ID wormbase_
|
75
|
+
WormBase Transcript wormbase_transcript_ WORMBASE_TRS_ID wormbase_transcript_
|
76
|
+
WormBase Protein wormbase_protein_ WORMBASE_PRO_ID wormbase_protein_
|
77
|
+
Xenbase xenbase_ XENBASE_ID xenbase_
|
78
|
+
ZFIN zfin_ ZFIN_ID zfin_
|
79
|
+
eggNOG eggnog_ EGGNOG_ID eggnog_
|
80
|
+
GeneTree genetree_ GENETREE_ID genetree_
|
81
|
+
HOGENOM hogenom_ HOGENOM_ID hogenom_
|
82
|
+
HOVERGEN hovergen_ HOVERGEN_ID hovergen_
|
83
|
+
KO ko_ KO_ID ko_
|
84
|
+
OMA oma_ OMA_ID oma_
|
85
|
+
OrthoDB orthodb_ ORTHODB_ID orthodb_
|
86
|
+
ProtClustDB protclustdb_ PROTCLUSTDB_ID protclustdb_
|
87
|
+
BioCyc biocyc_ BIOCYC_ID biocyc_
|
88
|
+
Reactome reactome_ REACTOME_ID reactome_
|
89
|
+
UniPathWay unipathway_ UNIPATHWAY_ID unipathway_
|
90
|
+
CleanEx cleanex_ CLEANEX_ID cleanex_
|
91
|
+
GermOnline germonline_ GERMONLINE_ID germonline_
|
92
|
+
ChEMBL chembl_ CHEMBL chembl_
|
93
|
+
DrugBank drugbank_ DRUGBANK_ID drugbank_
|
94
|
+
GenomeRNAi genomernai_ GENOMERNAI_ID genomernai_
|
95
|
+
NextBio nextbio_ NEXTBIO_ID nextbio_
|