protk 1.2.0 → 1.2.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- data/README.md +69 -36
- data/bin/gffmerge.rb +16 -5
- data/bin/mascot_search.rb +174 -97
- data/bin/omssa_search.rb +31 -8
- data/bin/protk_setup.rb +0 -3
- data/bin/sixframe.rb +0 -6
- data/bin/tandem_search.rb +97 -6
- data/bin/template_search.rb +144 -0
- data/bin/uniprot_annotation.rb +130 -0
- data/lib/convert_util.rb +27 -0
- data/lib/pepxml.rb +22 -0
- data/lib/protk/big_search_rakefile.rake +16 -0
- data/lib/protk/big_search_tool.rb +23 -0
- data/lib/protk/bio_sptr_extensions.rb +41 -2
- data/lib/protk/constants.rb +13 -0
- data/lib/protk/data/apt-get_packages.yaml +4 -0
- data/lib/protk/data/default_config.yml +1 -0
- data/lib/protk/data/make_uniprot_table.rb +29 -0
- data/lib/protk/data/predefined_db.trembl_annotation.yaml +20 -0
- data/lib/protk/data/uniprot_accessions.loc +96 -0
- data/lib/protk/data/uniprot_accessions_table.txt +97 -0
- data/lib/protk/data/uniprot_input_accessions.loc +95 -0
- data/lib/protk/manage_db_rakefile.rake +25 -11
- data/lib/protk/omssa_util.rb +1 -1
- data/lib/protk/setup_rakefile.rake +39 -2
- metadata +13 -1
    
        data/lib/convert_util.rb
    ADDED
    
    | @@ -0,0 +1,27 @@ | |
| 1 | 
            +
            require 'libxml'
         | 
| 2 | 
            +
            require 'constants'
         | 
| 3 | 
            +
             | 
| 4 | 
            +
            class ConvertUtil
         | 
| 5 | 
            +
             | 
| 6 | 
            +
              def self.ensure_mzml_indexed(run_file)
         | 
| 7 | 
            +
                if unindexed_mzml?(run_file)
         | 
| 8 | 
            +
                  index_mzml(run_file)
         | 
| 9 | 
            +
                end
         | 
| 10 | 
            +
              end
         | 
| 11 | 
            +
             | 
| 12 | 
            +
              def self.index_mzml(mzml_file)
         | 
| 13 | 
            +
                Dir.mktmpdir do |tmpdir|
         | 
| 14 | 
            +
                  genv=Constants.new
         | 
| 15 | 
            +
                  %x["#{genv.tpp_bin}/msconvert -o #{tmpdir} #{mzml_file}"]
         | 
| 16 | 
            +
                  indexed_file = Dir["#{tmpdir}/*"][0]
         | 
| 17 | 
            +
                  FileUtils.mv(indexed_file, mzml_file)
         | 
| 18 | 
            +
                end
         | 
| 19 | 
            +
              end
         | 
| 20 | 
            +
              
         | 
| 21 | 
            +
              def self.unindexed_mzml?(mzml_file)
         | 
| 22 | 
            +
                reader = LibXML::XML::Reader.file(mzml_file)
         | 
| 23 | 
            +
                reader.read
         | 
| 24 | 
            +
                reader.name == "mzML"
         | 
| 25 | 
            +
              end
         | 
| 26 | 
            +
             | 
| 27 | 
            +
            end
         | 
    
        data/lib/pepxml.rb
    ADDED
    
    | @@ -0,0 +1,22 @@ | |
| 1 | 
            +
            require 'rubygems'
         | 
| 2 | 
            +
            require 'rexml/document'
         | 
| 3 | 
            +
            require 'rexml/xpath'
         | 
| 4 | 
            +
             | 
| 5 | 
            +
            class PepXML
         | 
| 6 | 
            +
              def initialize(file_name)
         | 
| 7 | 
            +
                @doc=REXML::Document.new(File.new(file_name))
         | 
| 8 | 
            +
              end
         | 
| 9 | 
            +
             | 
| 10 | 
            +
              def find_runs() 
         | 
| 11 | 
            +
                runs = {}
         | 
| 12 | 
            +
                REXML::XPath.each(@doc,"//msms_run_summary") do |summary|
         | 
| 13 | 
            +
                  base_name = summary.attributes["base_name"]
         | 
| 14 | 
            +
                  if not runs.has_key?(base_name)
         | 
| 15 | 
            +
                    runs[base_name] = {:base_name => summary.attributes["base_name"],
         | 
| 16 | 
            +
                                       :type => summary.attributes["raw_data"]}
         | 
| 17 | 
            +
                  end
         | 
| 18 | 
            +
                end
         | 
| 19 | 
            +
                runs
         | 
| 20 | 
            +
              end
         | 
| 21 | 
            +
              
         | 
| 22 | 
            +
            end
         | 
| @@ -0,0 +1,23 @@ | |
| 1 | 
            +
            # create rake dependencies
         | 
| 2 | 
            +
            # run rakefile
         | 
| 3 | 
            +
            #
         | 
| 4 | 
            +
            require 'optparse'
         | 
| 5 | 
            +
            require 'pathname'
         | 
| 6 | 
            +
            require 'protk/tool'
         | 
| 7 | 
            +
            require 'protk/command_runner'
         | 
| 8 | 
            +
            require 'pp'
         | 
| 9 | 
            +
            require 'rake'
         | 
| 10 | 
            +
             | 
| 11 | 
            +
            class BigSearchTool < Tool
         | 
| 12 | 
            +
             | 
| 13 | 
            +
              def run input_files
         | 
| 14 | 
            +
            	command = "rake -f #{rakefile_path} #{input_files.join(" ")}"
         | 
| 15 | 
            +
            	runner=CommandRunner.new(Constants.new)
         | 
| 16 | 
            +
                runner.run_local(command)
         | 
| 17 | 
            +
              end
         | 
| 18 | 
            +
             | 
| 19 | 
            +
              def rakefile_path
         | 
| 20 | 
            +
                "#{File.dirname(__FILE__)}/big_search_rakefile.rake"
         | 
| 21 | 
            +
              end
         | 
| 22 | 
            +
             | 
| 23 | 
            +
            end
         | 
| @@ -177,7 +177,26 @@ class Bio::SPTR < Bio::EMBLDB | |
| 177 177 | 
             
                return self.safely_get_drentry_for_key("NextBio")
         | 
| 178 178 | 
             
              end
         | 
| 179 179 |  | 
| 180 | 
            -
              
         | 
| 180 | 
            +
              def uniprot_link
         | 
| 181 | 
            +
                return "http://www.uniprot.org/uniprot/#{self.accession}.html"
         | 
| 182 | 
            +
              end
         | 
| 183 | 
            +
             | 
| 184 | 
            +
              def nextbio_link
         | 
| 185 | 
            +
                return "http://www.nextbio.com/b/home/home.nb?id=#{self.nextbio}&type=feature"
         | 
| 186 | 
            +
              end
         | 
| 187 | 
            +
             | 
| 188 | 
            +
              def intact_link
         | 
| 189 | 
            +
                return "http://www.ebi.ac.uk/intact/pages/interactions/interactions.xhtml?query=#{self.intact}*"
         | 
| 190 | 
            +
              end
         | 
| 191 | 
            +
             | 
| 192 | 
            +
              def pride_link
         | 
| 193 | 
            +
                return "http://www.ebi.ac.uk/pride/searchSummary.do?queryTypeSelected=identification%20accession%20number&identificationAccessionNumber=#{self.pride}"
         | 
| 194 | 
            +
              end
         | 
| 195 | 
            +
             | 
| 196 | 
            +
              def ensembl_link
         | 
| 197 | 
            +
                return "http://www.ensembl.org/Homo_sapiens/Transcript/Summary?db=core;t=#{self.ensembl}"
         | 
| 198 | 
            +
              end
         | 
| 199 | 
            +
             | 
| 181 200 | 
             
              # Number of transmembrane regions
         | 
| 182 201 | 
             
              #
         | 
| 183 202 | 
             
              def num_transmem
         | 
| @@ -206,5 +225,25 @@ class Bio::SPTR < Bio::EMBLDB | |
| 206 225 | 
             
                  p "Warning: Unable to parse feature table for entry #{self.accession}"      
         | 
| 207 226 | 
             
                end
         | 
| 208 227 | 
             
              end
         | 
| 209 | 
            -
             | 
| 228 | 
            +
             | 
| 229 | 
            +
              def ref_dump
         | 
| 230 | 
            +
                return self.ref.to_s
         | 
| 231 | 
            +
              end
         | 
| 232 | 
            +
             | 
| 233 | 
            +
              def seq_dump
         | 
| 234 | 
            +
                return self.seq.to_s
         | 
| 235 | 
            +
              end
         | 
| 236 | 
            +
             | 
| 237 | 
            +
              def tax_dump
         | 
| 238 | 
            +
                return self.ox.to_s
         | 
| 239 | 
            +
              end
         | 
| 240 | 
            +
             | 
| 241 | 
            +
              def species_dump
         | 
| 242 | 
            +
                return self.os.to_s
         | 
| 243 | 
            +
              end
         | 
| 244 | 
            +
             | 
| 245 | 
            +
              def feature_dump
         | 
| 246 | 
            +
                return self.ft.to_s
         | 
| 247 | 
            +
              end
         | 
| 248 | 
            +
             | 
| 210 249 | 
             
            end
         | 
    
        data/lib/protk/constants.rb
    CHANGED
    
    | @@ -169,6 +169,19 @@ class Constants | |
| 169 169 | 
             
                return "#{self.openms_root}/bin/ExecutePipeline"
         | 
| 170 170 | 
             
              end
         | 
| 171 171 |  | 
| 172 | 
            +
              def tandem_root
         | 
| 173 | 
            +
                path=@env['tandem_root']
         | 
| 174 | 
            +
                if ( path =~ /^\//)
         | 
| 175 | 
            +
                  return path 
         | 
| 176 | 
            +
                else
         | 
| 177 | 
            +
                  return "#{@protk_dir}/#{@env['tandem_root']}"
         | 
| 178 | 
            +
                end
         | 
| 179 | 
            +
              end
         | 
| 180 | 
            +
             | 
| 181 | 
            +
              def gpmtandem
         | 
| 182 | 
            +
                return "#{self.tandem_root}/bin/tandem"
         | 
| 183 | 
            +
              end
         | 
| 184 | 
            +
             | 
| 172 185 | 
             
              def protein_database_root
         | 
| 173 186 | 
             
                path=@env['protein_database_root']
         | 
| 174 187 | 
             
                if ( path =~ /^\// )
         | 
| @@ -0,0 +1,29 @@ | |
| 1 | 
            +
            #!/usr/bin/env ruby
         | 
| 2 | 
            +
             | 
| 3 | 
            +
            file_name = ARGV[0]
         | 
| 4 | 
            +
             | 
| 5 | 
            +
            out_fh = File.new("uniprot_accessions.loc",'w')
         | 
| 6 | 
            +
             | 
| 7 | 
            +
            File.foreach(file_name) { |line|  
         | 
| 8 | 
            +
            	cols= line.chomp.split("\t")
         | 
| 9 | 
            +
            	if ( cols[2]!="from" )
         | 
| 10 | 
            +
            		db_key = "#{cols[0].gsub(" ","_").downcase}_"
         | 
| 11 | 
            +
            		out_fh.write "#{cols[0]}\t#{db_key}\t#{cols[1]}\t#{db_key}\n"
         | 
| 12 | 
            +
            	end
         | 
| 13 | 
            +
            }
         | 
| 14 | 
            +
             | 
| 15 | 
            +
            out_fh.close
         | 
| 16 | 
            +
             | 
| 17 | 
            +
             | 
| 18 | 
            +
             | 
| 19 | 
            +
            out_fh = File.new("uniprot_input_accessions.loc",'w')
         | 
| 20 | 
            +
             | 
| 21 | 
            +
            File.foreach(file_name) { |line|  
         | 
| 22 | 
            +
            	cols= line.chomp.split("\t")
         | 
| 23 | 
            +
            	if ( cols[2]!="to" )
         | 
| 24 | 
            +
            		db_key = "#{cols[0].gsub(" ","_").downcase}_"
         | 
| 25 | 
            +
            		out_fh.write "#{cols[0]}\t#{db_key}\t#{cols[1]}\t#{db_key}\n"
         | 
| 26 | 
            +
            	end
         | 
| 27 | 
            +
            }
         | 
| 28 | 
            +
             | 
| 29 | 
            +
            out_fh.close
         | 
| @@ -0,0 +1,20 @@ | |
| 1 | 
            +
            #
         | 
| 2 | 
            +
            # This is a predefined setup file for manage_db 
         | 
| 3 | 
            +
            #
         | 
| 4 | 
            +
            # Swissprot_uniprot annotation database (full entries for each protein)
         | 
| 5 | 
            +
            #
         | 
| 6 | 
            +
            --- 
         | 
| 7 | 
            +
            :description: Swissprot Trembl annotation database (full entries for each protein)
         | 
| 8 | 
            +
            :archive_old: false
         | 
| 9 | 
            +
            :is_annotation_db: true
         | 
| 10 | 
            +
            :decoy_prefix: decoy_
         | 
| 11 | 
            +
            :include_filters: []
         | 
| 12 | 
            +
             | 
| 13 | 
            +
            :format: dat
         | 
| 14 | 
            +
            :id_regexes: []
         | 
| 15 | 
            +
             | 
| 16 | 
            +
            :make_blast_index: false
         | 
| 17 | 
            +
            :sources: 
         | 
| 18 | 
            +
            - - ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/uniprot_trembl.dat.gz
         | 
| 19 | 
            +
              - ftp://ftp.uniprot.org/pub/databases/uniprot/current_release/knowledgebase/complete/reldate.txt
         | 
| 20 | 
            +
            :decoys: false
         | 
| @@ -0,0 +1,96 @@ | |
| 1 | 
            +
            UniProtKB AC	uniprotkb_ac_	ACC	uniprotkb_ac_
         | 
| 2 | 
            +
            UniProtKB ID	uniprotkb_id_	ID	uniprotkb_id_
         | 
| 3 | 
            +
            UniParc	uniparc_	UPARC	uniparc_
         | 
| 4 | 
            +
            UniRef50	uniref50_	NF50	uniref50_
         | 
| 5 | 
            +
            UniRef90	uniref90_	NF90	uniref90_
         | 
| 6 | 
            +
            UniRef100	uniref100_	NF100	uniref100_
         | 
| 7 | 
            +
            EMBL/GenBank/DDBJ	embl/genbank/ddbj_	EMBL_ID	embl/genbank/ddbj_
         | 
| 8 | 
            +
            EMBL/GenBank/DDBJ CDS	embl/genbank/ddbj_cds_	EMBL	embl/genbank/ddbj_cds_
         | 
| 9 | 
            +
            PIR	pir_	PIR	pir_
         | 
| 10 | 
            +
            UniGene	unigene_	UNIGENE_ID	unigene_
         | 
| 11 | 
            +
            Entrez Gene (GeneID)	entrez_gene_(geneid)_	P_ENTREZGENEID	entrez_gene_(geneid)_
         | 
| 12 | 
            +
            GI number*	gi_number*_	P_GI	gi_number*_
         | 
| 13 | 
            +
            IPI	ipi_	P_IPI	ipi_
         | 
| 14 | 
            +
            RefSeq Protein	refseq_protein_	P_REFSEQ_AC	refseq_protein_
         | 
| 15 | 
            +
            RefSeq Nucleotide	refseq_nucleotide_	REFSEQ_NT_ID	refseq_nucleotide_
         | 
| 16 | 
            +
            PDB	pdb_	PDB_ID	pdb_
         | 
| 17 | 
            +
            DisProt	disprot_	DISPROT_ID	disprot_
         | 
| 18 | 
            +
            HSSP	hssp_	HSSP_ID	hssp_
         | 
| 19 | 
            +
            DIP	dip_	DIP_ID	dip_
         | 
| 20 | 
            +
            MINT	mint_	MINT_ID	mint_
         | 
| 21 | 
            +
            Allergome	allergome_	ALLERGOME_ID	allergome_
         | 
| 22 | 
            +
            MEROPS	merops_	MEROPS_ID	merops_
         | 
| 23 | 
            +
            PeroxiBase	peroxibase_	PEROXIBASE_ID	peroxibase_
         | 
| 24 | 
            +
            PptaseDB	pptasedb_	PPTASEDB_ID	pptasedb_
         | 
| 25 | 
            +
            REBASE	rebase_	REBASE_ID	rebase_
         | 
| 26 | 
            +
            TCDB	tcdb_	TCDB_ID	tcdb_
         | 
| 27 | 
            +
            PhosSite	phossite_	PHOSSITE_ID	phossite_
         | 
| 28 | 
            +
            DMDM	dmdm_	DMDM_ID	dmdm_
         | 
| 29 | 
            +
            Aarhus/Ghent-2DPAGE	aarhus/ghent-2dpage_	AARHUS_GHENT_2DPAGE_ID	aarhus/ghent-2dpage_
         | 
| 30 | 
            +
            World-2DPAGE	world-2dpage_	WORLD_2DPAGE_ID	world-2dpage_
         | 
| 31 | 
            +
            DNASU	dnasu_	DNASU_ID	dnasu_
         | 
| 32 | 
            +
            Ensembl	ensembl_	ENSEMBL_ID	ensembl_
         | 
| 33 | 
            +
            Ensembl Protein	ensembl_protein_	ENSEMBL_PRO_ID	ensembl_protein_
         | 
| 34 | 
            +
            Ensembl Transcript	ensembl_transcript_	ENSEMBL_TRS_ID	ensembl_transcript_
         | 
| 35 | 
            +
            Ensembl Genomes	ensembl_genomes_	ENSEMBLGENOME_ID	ensembl_genomes_
         | 
| 36 | 
            +
            Ensembl Genomes Protein	ensembl_genomes_protein_	ENSEMBLGENOME_PRO_ID	ensembl_genomes_protein_
         | 
| 37 | 
            +
            Ensembl Genomes Transcript	ensembl_genomes_transcript_	ENSEMBLGENOME_TRS_ID	ensembl_genomes_transcript_
         | 
| 38 | 
            +
            GeneID	geneid_	P_ENTREZGENEID	geneid_
         | 
| 39 | 
            +
            GenomeReviews	genomereviews_	GENOMEREVIEWS_ID	genomereviews_
         | 
| 40 | 
            +
            KEGG	kegg_	KEGG_ID	kegg_
         | 
| 41 | 
            +
            PATRIC	patric_	PATRIC_ID	patric_
         | 
| 42 | 
            +
            UCSC	ucsc_	UCSC_ID	ucsc_
         | 
| 43 | 
            +
            VectorBase	vectorbase_	VECTORBASE_ID	vectorbase_
         | 
| 44 | 
            +
            AGD	agd_	AGD_ID	agd_
         | 
| 45 | 
            +
            ArachnoServer	arachnoserver_	ARACHNOSERVER_ID	arachnoserver_
         | 
| 46 | 
            +
            CGD	cgd_	CGD	cgd_
         | 
| 47 | 
            +
            ConoServer	conoserver_	CONOSERVER_ID	conoserver_
         | 
| 48 | 
            +
            CYGD	cygd_	CYGD_ID	cygd_
         | 
| 49 | 
            +
            dictyBase	dictybase_	DICTYBASE_ID	dictybase_
         | 
| 50 | 
            +
            EchoBASE	echobase_	ECHOBASE_ID	echobase_
         | 
| 51 | 
            +
            EcoGene	ecogene_	ECOGENE_ID	ecogene_
         | 
| 52 | 
            +
            euHCVdb	euhcvdb_	EUHCVDB_ID	euhcvdb_
         | 
| 53 | 
            +
            EuPathDB	eupathdb_	EUPATHDB_ID	eupathdb_
         | 
| 54 | 
            +
            FlyBase	flybase_	FLYBASE_ID	flybase_
         | 
| 55 | 
            +
            GeneCards	genecards_	GENECARDS_ID	genecards_
         | 
| 56 | 
            +
            GeneFarm	genefarm_	GENEFARM_ID	genefarm_
         | 
| 57 | 
            +
            GenoList	genolist_	GENOLIST_ID	genolist_
         | 
| 58 | 
            +
            H-InvDB	h-invdb_	H_INVDB_ID	h-invdb_
         | 
| 59 | 
            +
            HGNC	hgnc_	HGNC_ID	hgnc_
         | 
| 60 | 
            +
            HPA	hpa_	HPA_ID	hpa_
         | 
| 61 | 
            +
            LegioList	legiolist_	LEGIOLIST_ID	legiolist_
         | 
| 62 | 
            +
            Leproma	leproma_	LEPROMA_ID	leproma_
         | 
| 63 | 
            +
            MaizeGDB	maizegdb_	MAIZEGDB_ID	maizegdb_
         | 
| 64 | 
            +
            MIM	mim_	MIM_ID	mim_
         | 
| 65 | 
            +
            MGI	mgi_	MGI_ID	mgi_
         | 
| 66 | 
            +
            neXtProt	nextprot_	NEXTPROT_ID	nextprot_
         | 
| 67 | 
            +
            Orphanet	orphanet_	ORPHANET_ID	orphanet_
         | 
| 68 | 
            +
            PharmGKB	pharmgkb_	PHARMGKB_ID	pharmgkb_
         | 
| 69 | 
            +
            PomBase	pombase_	POMBASE_ID	pombase_
         | 
| 70 | 
            +
            PseudoCAP	pseudocap_	PSEUDOCAP_ID	pseudocap_
         | 
| 71 | 
            +
            RGD	rgd_	RGD_ID	rgd_
         | 
| 72 | 
            +
            SGD	sgd_	SGD_ID	sgd_
         | 
| 73 | 
            +
            TAIR	tair_	TAIR_ID	tair_
         | 
| 74 | 
            +
            TubercuList	tuberculist_	TUBERCULIST_ID	tuberculist_
         | 
| 75 | 
            +
            WormBase	wormbase_	WORMBASE_ID	wormbase_
         | 
| 76 | 
            +
            WormBase Transcript	wormbase_transcript_	WORMBASE_TRS_ID	wormbase_transcript_
         | 
| 77 | 
            +
            WormBase Protein	wormbase_protein_	WORMBASE_PRO_ID	wormbase_protein_
         | 
| 78 | 
            +
            Xenbase	xenbase_	XENBASE_ID	xenbase_
         | 
| 79 | 
            +
            ZFIN	zfin_	ZFIN_ID	zfin_
         | 
| 80 | 
            +
            eggNOG	eggnog_	EGGNOG_ID	eggnog_
         | 
| 81 | 
            +
            GeneTree	genetree_	GENETREE_ID	genetree_
         | 
| 82 | 
            +
            HOGENOM	hogenom_	HOGENOM_ID	hogenom_
         | 
| 83 | 
            +
            HOVERGEN	hovergen_	HOVERGEN_ID	hovergen_
         | 
| 84 | 
            +
            KO	ko_	KO_ID	ko_
         | 
| 85 | 
            +
            OMA	oma_	OMA_ID	oma_
         | 
| 86 | 
            +
            OrthoDB	orthodb_	ORTHODB_ID	orthodb_
         | 
| 87 | 
            +
            ProtClustDB	protclustdb_	PROTCLUSTDB_ID	protclustdb_
         | 
| 88 | 
            +
            BioCyc	biocyc_	BIOCYC_ID	biocyc_
         | 
| 89 | 
            +
            Reactome	reactome_	REACTOME_ID	reactome_
         | 
| 90 | 
            +
            UniPathWay	unipathway_	UNIPATHWAY_ID	unipathway_
         | 
| 91 | 
            +
            CleanEx	cleanex_	CLEANEX_ID	cleanex_
         | 
| 92 | 
            +
            GermOnline	germonline_	GERMONLINE_ID	germonline_
         | 
| 93 | 
            +
            ChEMBL	chembl_	CHEMBL	chembl_
         | 
| 94 | 
            +
            DrugBank	drugbank_	DRUGBANK_ID	drugbank_
         | 
| 95 | 
            +
            GenomeRNAi	genomernai_	GENOMERNAI_ID	genomernai_
         | 
| 96 | 
            +
            NextBio	nextbio_	NEXTBIO_ID	nextbio_
         | 
| @@ -0,0 +1,97 @@ | |
| 1 | 
            +
            UniProtKB AC/ID	ACC+ID	from
         | 
| 2 | 
            +
            UniProtKB AC	ACC	to
         | 
| 3 | 
            +
            UniProtKB ID	ID	to
         | 
| 4 | 
            +
            UniParc	UPARC	both
         | 
| 5 | 
            +
            UniRef50	NF50	both
         | 
| 6 | 
            +
            UniRef90	NF90	both
         | 
| 7 | 
            +
            UniRef100	NF100	both
         | 
| 8 | 
            +
            EMBL/GenBank/DDBJ	EMBL_ID	both
         | 
| 9 | 
            +
            EMBL/GenBank/DDBJ CDS	EMBL	both
         | 
| 10 | 
            +
            PIR	PIR	both
         | 
| 11 | 
            +
            UniGene	UNIGENE_ID	both
         | 
| 12 | 
            +
            Entrez Gene (GeneID)	P_ENTREZGENEID	both
         | 
| 13 | 
            +
            GI number*	P_GI	both
         | 
| 14 | 
            +
            IPI	P_IPI	both
         | 
| 15 | 
            +
            RefSeq Protein	P_REFSEQ_AC	both
         | 
| 16 | 
            +
            RefSeq Nucleotide	REFSEQ_NT_ID	both
         | 
| 17 | 
            +
            PDB	PDB_ID	both
         | 
| 18 | 
            +
            DisProt	DISPROT_ID	both
         | 
| 19 | 
            +
            HSSP	HSSP_ID	both
         | 
| 20 | 
            +
            DIP	DIP_ID	both
         | 
| 21 | 
            +
            MINT	MINT_ID	both
         | 
| 22 | 
            +
            Allergome	ALLERGOME_ID	both
         | 
| 23 | 
            +
            MEROPS	MEROPS_ID	both
         | 
| 24 | 
            +
            PeroxiBase	PEROXIBASE_ID	both
         | 
| 25 | 
            +
            PptaseDB	PPTASEDB_ID	both
         | 
| 26 | 
            +
            REBASE	REBASE_ID	both
         | 
| 27 | 
            +
            TCDB	TCDB_ID	both
         | 
| 28 | 
            +
            PhosSite	PHOSSITE_ID	both
         | 
| 29 | 
            +
            DMDM	DMDM_ID	both
         | 
| 30 | 
            +
            Aarhus/Ghent-2DPAGE	AARHUS_GHENT_2DPAGE_ID	both
         | 
| 31 | 
            +
            World-2DPAGE	WORLD_2DPAGE_ID	both
         | 
| 32 | 
            +
            DNASU	DNASU_ID	both
         | 
| 33 | 
            +
            Ensembl	ENSEMBL_ID	both
         | 
| 34 | 
            +
            Ensembl Protein	ENSEMBL_PRO_ID	both
         | 
| 35 | 
            +
            Ensembl Transcript	ENSEMBL_TRS_ID	both
         | 
| 36 | 
            +
            Ensembl Genomes	ENSEMBLGENOME_ID	both
         | 
| 37 | 
            +
            Ensembl Genomes Protein	ENSEMBLGENOME_PRO_ID	both
         | 
| 38 | 
            +
            Ensembl Genomes Transcript	ENSEMBLGENOME_TRS_ID	both
         | 
| 39 | 
            +
            GeneID	P_ENTREZGENEID	both
         | 
| 40 | 
            +
            GenomeReviews	GENOMEREVIEWS_ID	both
         | 
| 41 | 
            +
            KEGG	KEGG_ID	both
         | 
| 42 | 
            +
            PATRIC	PATRIC_ID	both
         | 
| 43 | 
            +
            UCSC	UCSC_ID	both
         | 
| 44 | 
            +
            VectorBase	VECTORBASE_ID	both
         | 
| 45 | 
            +
            AGD	AGD_ID	both
         | 
| 46 | 
            +
            ArachnoServer	ARACHNOSERVER_ID	both
         | 
| 47 | 
            +
            CGD	CGD	both
         | 
| 48 | 
            +
            ConoServer	CONOSERVER_ID	both
         | 
| 49 | 
            +
            CYGD	CYGD_ID	both
         | 
| 50 | 
            +
            dictyBase	DICTYBASE_ID	both
         | 
| 51 | 
            +
            EchoBASE	ECHOBASE_ID	both
         | 
| 52 | 
            +
            EcoGene	ECOGENE_ID	both
         | 
| 53 | 
            +
            euHCVdb	EUHCVDB_ID	both
         | 
| 54 | 
            +
            EuPathDB	EUPATHDB_ID	both
         | 
| 55 | 
            +
            FlyBase	FLYBASE_ID	both
         | 
| 56 | 
            +
            GeneCards	GENECARDS_ID	both
         | 
| 57 | 
            +
            GeneFarm	GENEFARM_ID	both
         | 
| 58 | 
            +
            GenoList	GENOLIST_ID	both
         | 
| 59 | 
            +
            H-InvDB	H_INVDB_ID	both
         | 
| 60 | 
            +
            HGNC	HGNC_ID	both
         | 
| 61 | 
            +
            HPA	HPA_ID	both
         | 
| 62 | 
            +
            LegioList	LEGIOLIST_ID	both
         | 
| 63 | 
            +
            Leproma	LEPROMA_ID	both
         | 
| 64 | 
            +
            MaizeGDB	MAIZEGDB_ID	both
         | 
| 65 | 
            +
            MIM	MIM_ID	both
         | 
| 66 | 
            +
            MGI	MGI_ID	both
         | 
| 67 | 
            +
            neXtProt	NEXTPROT_ID	both
         | 
| 68 | 
            +
            Orphanet	ORPHANET_ID	both
         | 
| 69 | 
            +
            PharmGKB	PHARMGKB_ID	both
         | 
| 70 | 
            +
            PomBase	POMBASE_ID	both
         | 
| 71 | 
            +
            PseudoCAP	PSEUDOCAP_ID	both
         | 
| 72 | 
            +
            RGD	RGD_ID	both
         | 
| 73 | 
            +
            SGD	SGD_ID	both
         | 
| 74 | 
            +
            TAIR	TAIR_ID	both
         | 
| 75 | 
            +
            TubercuList	TUBERCULIST_ID	both
         | 
| 76 | 
            +
            WormBase	WORMBASE_ID	both
         | 
| 77 | 
            +
            WormBase Transcript	WORMBASE_TRS_ID	both
         | 
| 78 | 
            +
            WormBase Protein	WORMBASE_PRO_ID	both
         | 
| 79 | 
            +
            Xenbase	XENBASE_ID	both
         | 
| 80 | 
            +
            ZFIN	ZFIN_ID	both
         | 
| 81 | 
            +
            eggNOG	EGGNOG_ID	both
         | 
| 82 | 
            +
            GeneTree	GENETREE_ID	both
         | 
| 83 | 
            +
            HOGENOM	HOGENOM_ID	both
         | 
| 84 | 
            +
            HOVERGEN	HOVERGEN_ID	both
         | 
| 85 | 
            +
            KO	KO_ID	both
         | 
| 86 | 
            +
            OMA	OMA_ID	both
         | 
| 87 | 
            +
            OrthoDB	ORTHODB_ID	both
         | 
| 88 | 
            +
            ProtClustDB	PROTCLUSTDB_ID	both
         | 
| 89 | 
            +
            BioCyc	BIOCYC_ID	both
         | 
| 90 | 
            +
            Reactome	REACTOME_ID	both
         | 
| 91 | 
            +
            UniPathWay	UNIPATHWAY_ID	both
         | 
| 92 | 
            +
            CleanEx	CLEANEX_ID	both
         | 
| 93 | 
            +
            GermOnline	GERMONLINE_ID	both
         | 
| 94 | 
            +
            ChEMBL	CHEMBL	both
         | 
| 95 | 
            +
            DrugBank	DRUGBANK_ID	both
         | 
| 96 | 
            +
            GenomeRNAi	GENOMERNAI_ID	both
         | 
| 97 | 
            +
            NextBio	NEXTBIO_ID	both
         | 
| @@ -0,0 +1,95 @@ | |
| 1 | 
            +
            UniProtKB AC/ID	uniprotkb_ac/id_	ACC+ID	uniprotkb_ac/id_
         | 
| 2 | 
            +
            UniParc	uniparc_	UPARC	uniparc_
         | 
| 3 | 
            +
            UniRef50	uniref50_	NF50	uniref50_
         | 
| 4 | 
            +
            UniRef90	uniref90_	NF90	uniref90_
         | 
| 5 | 
            +
            UniRef100	uniref100_	NF100	uniref100_
         | 
| 6 | 
            +
            EMBL/GenBank/DDBJ	embl/genbank/ddbj_	EMBL_ID	embl/genbank/ddbj_
         | 
| 7 | 
            +
            EMBL/GenBank/DDBJ CDS	embl/genbank/ddbj_cds_	EMBL	embl/genbank/ddbj_cds_
         | 
| 8 | 
            +
            PIR	pir_	PIR	pir_
         | 
| 9 | 
            +
            UniGene	unigene_	UNIGENE_ID	unigene_
         | 
| 10 | 
            +
            Entrez Gene (GeneID)	entrez_gene_(geneid)_	P_ENTREZGENEID	entrez_gene_(geneid)_
         | 
| 11 | 
            +
            GI number*	gi_number*_	P_GI	gi_number*_
         | 
| 12 | 
            +
            IPI	ipi_	P_IPI	ipi_
         | 
| 13 | 
            +
            RefSeq Protein	refseq_protein_	P_REFSEQ_AC	refseq_protein_
         | 
| 14 | 
            +
            RefSeq Nucleotide	refseq_nucleotide_	REFSEQ_NT_ID	refseq_nucleotide_
         | 
| 15 | 
            +
            PDB	pdb_	PDB_ID	pdb_
         | 
| 16 | 
            +
            DisProt	disprot_	DISPROT_ID	disprot_
         | 
| 17 | 
            +
            HSSP	hssp_	HSSP_ID	hssp_
         | 
| 18 | 
            +
            DIP	dip_	DIP_ID	dip_
         | 
| 19 | 
            +
            MINT	mint_	MINT_ID	mint_
         | 
| 20 | 
            +
            Allergome	allergome_	ALLERGOME_ID	allergome_
         | 
| 21 | 
            +
            MEROPS	merops_	MEROPS_ID	merops_
         | 
| 22 | 
            +
            PeroxiBase	peroxibase_	PEROXIBASE_ID	peroxibase_
         | 
| 23 | 
            +
            PptaseDB	pptasedb_	PPTASEDB_ID	pptasedb_
         | 
| 24 | 
            +
            REBASE	rebase_	REBASE_ID	rebase_
         | 
| 25 | 
            +
            TCDB	tcdb_	TCDB_ID	tcdb_
         | 
| 26 | 
            +
            PhosSite	phossite_	PHOSSITE_ID	phossite_
         | 
| 27 | 
            +
            DMDM	dmdm_	DMDM_ID	dmdm_
         | 
| 28 | 
            +
            Aarhus/Ghent-2DPAGE	aarhus/ghent-2dpage_	AARHUS_GHENT_2DPAGE_ID	aarhus/ghent-2dpage_
         | 
| 29 | 
            +
            World-2DPAGE	world-2dpage_	WORLD_2DPAGE_ID	world-2dpage_
         | 
| 30 | 
            +
            DNASU	dnasu_	DNASU_ID	dnasu_
         | 
| 31 | 
            +
            Ensembl	ensembl_	ENSEMBL_ID	ensembl_
         | 
| 32 | 
            +
            Ensembl Protein	ensembl_protein_	ENSEMBL_PRO_ID	ensembl_protein_
         | 
| 33 | 
            +
            Ensembl Transcript	ensembl_transcript_	ENSEMBL_TRS_ID	ensembl_transcript_
         | 
| 34 | 
            +
            Ensembl Genomes	ensembl_genomes_	ENSEMBLGENOME_ID	ensembl_genomes_
         | 
| 35 | 
            +
            Ensembl Genomes Protein	ensembl_genomes_protein_	ENSEMBLGENOME_PRO_ID	ensembl_genomes_protein_
         | 
| 36 | 
            +
            Ensembl Genomes Transcript	ensembl_genomes_transcript_	ENSEMBLGENOME_TRS_ID	ensembl_genomes_transcript_
         | 
| 37 | 
            +
            GeneID	geneid_	P_ENTREZGENEID	geneid_
         | 
| 38 | 
            +
            GenomeReviews	genomereviews_	GENOMEREVIEWS_ID	genomereviews_
         | 
| 39 | 
            +
            KEGG	kegg_	KEGG_ID	kegg_
         | 
| 40 | 
            +
            PATRIC	patric_	PATRIC_ID	patric_
         | 
| 41 | 
            +
            UCSC	ucsc_	UCSC_ID	ucsc_
         | 
| 42 | 
            +
            VectorBase	vectorbase_	VECTORBASE_ID	vectorbase_
         | 
| 43 | 
            +
            AGD	agd_	AGD_ID	agd_
         | 
| 44 | 
            +
            ArachnoServer	arachnoserver_	ARACHNOSERVER_ID	arachnoserver_
         | 
| 45 | 
            +
            CGD	cgd_	CGD	cgd_
         | 
| 46 | 
            +
            ConoServer	conoserver_	CONOSERVER_ID	conoserver_
         | 
| 47 | 
            +
            CYGD	cygd_	CYGD_ID	cygd_
         | 
| 48 | 
            +
            dictyBase	dictybase_	DICTYBASE_ID	dictybase_
         | 
| 49 | 
            +
            EchoBASE	echobase_	ECHOBASE_ID	echobase_
         | 
| 50 | 
            +
            EcoGene	ecogene_	ECOGENE_ID	ecogene_
         | 
| 51 | 
            +
            euHCVdb	euhcvdb_	EUHCVDB_ID	euhcvdb_
         | 
| 52 | 
            +
            EuPathDB	eupathdb_	EUPATHDB_ID	eupathdb_
         | 
| 53 | 
            +
            FlyBase	flybase_	FLYBASE_ID	flybase_
         | 
| 54 | 
            +
            GeneCards	genecards_	GENECARDS_ID	genecards_
         | 
| 55 | 
            +
            GeneFarm	genefarm_	GENEFARM_ID	genefarm_
         | 
| 56 | 
            +
            GenoList	genolist_	GENOLIST_ID	genolist_
         | 
| 57 | 
            +
            H-InvDB	h-invdb_	H_INVDB_ID	h-invdb_
         | 
| 58 | 
            +
            HGNC	hgnc_	HGNC_ID	hgnc_
         | 
| 59 | 
            +
            HPA	hpa_	HPA_ID	hpa_
         | 
| 60 | 
            +
            LegioList	legiolist_	LEGIOLIST_ID	legiolist_
         | 
| 61 | 
            +
            Leproma	leproma_	LEPROMA_ID	leproma_
         | 
| 62 | 
            +
            MaizeGDB	maizegdb_	MAIZEGDB_ID	maizegdb_
         | 
| 63 | 
            +
            MIM	mim_	MIM_ID	mim_
         | 
| 64 | 
            +
            MGI	mgi_	MGI_ID	mgi_
         | 
| 65 | 
            +
            neXtProt	nextprot_	NEXTPROT_ID	nextprot_
         | 
| 66 | 
            +
            Orphanet	orphanet_	ORPHANET_ID	orphanet_
         | 
| 67 | 
            +
            PharmGKB	pharmgkb_	PHARMGKB_ID	pharmgkb_
         | 
| 68 | 
            +
            PomBase	pombase_	POMBASE_ID	pombase_
         | 
| 69 | 
            +
            PseudoCAP	pseudocap_	PSEUDOCAP_ID	pseudocap_
         | 
| 70 | 
            +
            RGD	rgd_	RGD_ID	rgd_
         | 
| 71 | 
            +
            SGD	sgd_	SGD_ID	sgd_
         | 
| 72 | 
            +
            TAIR	tair_	TAIR_ID	tair_
         | 
| 73 | 
            +
            TubercuList	tuberculist_	TUBERCULIST_ID	tuberculist_
         | 
| 74 | 
            +
            WormBase	wormbase_	WORMBASE_ID	wormbase_
         | 
| 75 | 
            +
            WormBase Transcript	wormbase_transcript_	WORMBASE_TRS_ID	wormbase_transcript_
         | 
| 76 | 
            +
            WormBase Protein	wormbase_protein_	WORMBASE_PRO_ID	wormbase_protein_
         | 
| 77 | 
            +
            Xenbase	xenbase_	XENBASE_ID	xenbase_
         | 
| 78 | 
            +
            ZFIN	zfin_	ZFIN_ID	zfin_
         | 
| 79 | 
            +
            eggNOG	eggnog_	EGGNOG_ID	eggnog_
         | 
| 80 | 
            +
            GeneTree	genetree_	GENETREE_ID	genetree_
         | 
| 81 | 
            +
            HOGENOM	hogenom_	HOGENOM_ID	hogenom_
         | 
| 82 | 
            +
            HOVERGEN	hovergen_	HOVERGEN_ID	hovergen_
         | 
| 83 | 
            +
            KO	ko_	KO_ID	ko_
         | 
| 84 | 
            +
            OMA	oma_	OMA_ID	oma_
         | 
| 85 | 
            +
            OrthoDB	orthodb_	ORTHODB_ID	orthodb_
         | 
| 86 | 
            +
            ProtClustDB	protclustdb_	PROTCLUSTDB_ID	protclustdb_
         | 
| 87 | 
            +
            BioCyc	biocyc_	BIOCYC_ID	biocyc_
         | 
| 88 | 
            +
            Reactome	reactome_	REACTOME_ID	reactome_
         | 
| 89 | 
            +
            UniPathWay	unipathway_	UNIPATHWAY_ID	unipathway_
         | 
| 90 | 
            +
            CleanEx	cleanex_	CLEANEX_ID	cleanex_
         | 
| 91 | 
            +
            GermOnline	germonline_	GERMONLINE_ID	germonline_
         | 
| 92 | 
            +
            ChEMBL	chembl_	CHEMBL	chembl_
         | 
| 93 | 
            +
            DrugBank	drugbank_	DRUGBANK_ID	drugbank_
         | 
| 94 | 
            +
            GenomeRNAi	genomernai_	GENOMERNAI_ID	genomernai_
         | 
| 95 | 
            +
            NextBio	nextbio_	NEXTBIO_ID	nextbio_
         |