rbbt-sources 0.4.0 → 1.0.0

Sign up to get free protection for your applications and to get access to all the features.
@@ -1,9 +1,9 @@
1
- require 'rbbt-util'
1
+ require 'rbbt'
2
2
  require 'rbbt/sources/biomart'
3
3
  require 'rbbt/sources/entrez'
4
4
 
5
5
  def tsv_file(url, native, extra, options = {})
6
- options = Misc.add_defaults options, :persistence => false, :keep_empty => true
6
+ options = Misc.add_defaults options, :persist => false, :keep_empty => true
7
7
 
8
8
  case
9
9
  when Array === native
@@ -27,7 +27,7 @@ def tsv_file(url, native, extra, options = {})
27
27
  fields = nil
28
28
  end
29
29
 
30
- tsv = TSV.new(Open.open(url), options)
30
+ tsv = TSV.open(Open.open(url), options)
31
31
  tsv.key_field ||= key_field
32
32
  tsv.fields ||= fields
33
33
  tsv
@@ -35,13 +35,14 @@ end
35
35
 
36
36
  def merge_entrez(data, taxs, native, fix = nil, select = nil)
37
37
  entrez = Entrez.entrez2native(taxs, :fix => fix, :select => select)
38
+ entrez.key_field = "Entrez Gene ID"
38
39
  entrez.fields = [native]
39
40
  entrez
40
41
 
41
- data.smart_merge entrez, native
42
+ data.attach entrez, "Entrez Gene ID"
42
43
  end
43
44
 
44
45
  def merge_biomart(lexicon, db, native, other, match = nil)
45
46
  match ||= native.first
46
- lexicon.smart_merge BioMart.tsv(db, native, other), match
47
+ lexicon.attach BioMart.tsv(db, native, other)
47
48
  end
@@ -1,4 +1,7 @@
1
- require File.dirname(__FILE__) + '/../../test_helper'
1
+ require File.expand_path(File.dirname(__FILE__) + '/../../test_helper')
2
+
3
+ require 'rbbt/sources/pubmed'
4
+ require 'test/unit'
2
5
  require 'rbbt/sources/biomart'
3
6
  require 'rbbt/util/tmpfile'
4
7
  require 'test/unit'
@@ -11,11 +14,11 @@ class TestBioMart < Test::Unit::TestCase
11
14
  end
12
15
 
13
16
  data = BioMart.get('scerevisiae_gene_ensembl','entrezgene', ['protein_id'],[], nil, :nocache => false, :merge => true, :wget_options => {:quiet => false})
14
- tsv = TSV.new data, :double, :merge => true
17
+ tsv = TSV.open data, :double, :merge => true
15
18
  assert(tsv['852236'][0].include? 'CAA84864')
16
19
 
17
20
  data = BioMart.get('scerevisiae_gene_ensembl','entrezgene', ['external_gene_id'],[], data, :nocache => false, :wget_options => { :quiet => false} )
18
- tsv = TSV.new data, :double, :merge => true
21
+ tsv = TSV.open data, :double, :merge => true
19
22
  assert(tsv['852236'][1].include? 'YBL044W')
20
23
  end
21
24
 
@@ -25,7 +28,7 @@ class TestBioMart < Test::Unit::TestCase
25
28
 
26
29
  TmpFile.with_file do |f|
27
30
  filename = BioMart.query('scerevisiae_gene_ensembl','entrezgene', ['protein_id','refseq_peptide','external_gene_id','ensembl_gene_id'], [], nil, :nocache => false, :wget_options => { :quiet => false}, :filename => f)
28
- data = TSV.new Open.open(filename)
31
+ data = TSV.open Open.open(filename)
29
32
  assert(data['852236']['external_gene_id'].include? 'YBL044W')
30
33
  end
31
34
  end
@@ -38,7 +41,7 @@ class TestBioMart < Test::Unit::TestCase
38
41
 
39
42
  TmpFile.with_file do |f|
40
43
  filename = BioMart.tsv('scerevisiae_gene_ensembl',['Entrez Gene', 'entrezgene'], [['Protein ID', 'protein_id'],['RefSeq Peptide','refseq_peptide']], [], nil, :nocache => false, :wget_options => { :quiet => false}, :filename => f)
41
- data = TSV.new Open.open(filename, :merge => true)
44
+ data = TSV.open Open.open(filename, :merge => true)
42
45
  assert(data['852236']['Protein ID'].include? 'CAA84864')
43
46
  assert_equal 'Entrez Gene', data.key_field
44
47
  assert_equal ['Protein ID', 'RefSeq Peptide'], data.fields
@@ -1,24 +1,28 @@
1
1
  require File.expand_path(File.dirname(__FILE__) + '/../../test_helper')
2
2
  require 'rbbt/sources/organism'
3
- require 'rbbt/sources/organism/sequence'
4
3
  require 'test/unit'
5
4
 
6
5
  class TestEntrez < Test::Unit::TestCase
6
+ def test_location
7
+ assert_equal "share/organisms/Sce/identifiers", Organism.identifiers('Sce')
8
+ end
9
+
10
+
7
11
  def test_identifiers
8
- assert Organism.identifiers('Sce').tsv['S000006120']["Ensembl Gene ID"].include?('YPL199C')
9
- assert Organism::Sce.identifiers.tsv['S000006120']["Ensembl Gene ID"].include?('YPL199C')
10
- assert Organism.identifiers('Hsa').tsv(:key => "Entrez Gene ID")['1020']["Associated Gene Name"].include?('CDK5')
12
+ assert Organism.identifiers('Hsa').tsv(:key_field => "Entrez Gene ID", :persist => true)['1020']["Associated Gene Name"].include?('CDK5')
13
+ assert Organism.identifiers('Sce').tsv(:persist => true)['S000006120']["Ensembl Gene ID"].include?('YPL199C')
14
+ assert Organism::Sce.identifiers.tsv(:persist => true)['S000006120']["Ensembl Gene ID"].include?('YPL199C')
11
15
  end
12
16
 
13
17
  def test_lexicon
14
- assert TSV.new(Organism.lexicon('Sce'))['S000006120'].flatten.include?('YPL199C')
18
+ assert TSV.open(Organism.lexicon('Sce'))['S000006120'].flatten.include?('YPL199C')
15
19
  end
16
20
 
17
21
  def test_guess_id
18
22
  ensembl = %w(YOL044W YDR289C YAL034C YGR246C ARS519 tH(GUG)E2 YDR218C YLR002C YGL224C)
19
23
  gene_name = %w(SNR64 MIP1 MRPS18 TFB2 JEN1 IVY1 TRS33 GAS3)
20
- assert_equal "Ensembl Gene ID", Organism::Sce.guess_id(ensembl).first
21
24
  assert_equal "Associated Gene Name", Organism::Sce.guess_id(gene_name).first
25
+ assert_equal "Ensembl Gene ID", Organism::Sce.guess_id(ensembl).first
22
26
  end
23
27
 
24
28
  def test_organisms
@@ -27,7 +31,7 @@ class TestEntrez < Test::Unit::TestCase
27
31
  end
28
32
 
29
33
  def test_attach_translations
30
- tsv = TSV.new({"1020" => []}, :list)
34
+ tsv = TSV.setup({"1020" => []}, :type => :list)
31
35
  tsv.key_field = "Entrez Gene ID"
32
36
  tsv.fields = []
33
37
  tsv.namespace = "Hsa"
@@ -38,20 +42,20 @@ class TestEntrez < Test::Unit::TestCase
38
42
  assert_equal "CDK5", tsv["1020"]["Associated Gene Name"]
39
43
  end
40
44
 
41
- def test_genes_at_chromosome
42
- pos = [12, 117799500]
43
- assert_equal "ENSG00000089250", Organism::Hsa.genes_at_chromosome_positions(pos.first, pos.last)
44
- end
45
+ #def test_genes_at_chromosome
46
+ # pos = [12, 117799500]
47
+ # assert_equal "ENSG00000089250", Organism::Hsa.genes_at_chromosome_positions(pos.first, pos.last)
48
+ #end
45
49
 
46
- def test_genes_at_chromosome_array
47
- pos = [12, [117799500, 106903900]]
48
- assert_equal ["ENSG00000089250", "ENSG00000013503"], Organism::Hsa.genes_at_chromosome_positions(pos.first, pos.last)
49
- end
50
+ #def test_genes_at_chromosome_array
51
+ # pos = [12, [117799500, 106903900]]
52
+ # assert_equal ["ENSG00000089250", "ENSG00000013503"], Organism::Hsa.genes_at_chromosome_positions(pos.first, pos.last)
53
+ #end
50
54
 
51
- def test_genes_at_genomic_positions
52
- pos = [[12, 117799500], [12, 106903900], [1, 115259500]]
53
- assert_equal ["ENSG00000089250", "ENSG00000013503", "ENSG00000213281"], Organism::Hsa.genes_at_genomic_positions(pos)
54
- end
55
+ #def test_genes_at_genomic_positions
56
+ # pos = [[12, 117799500], [12, 106903900], [1, 115259500]]
57
+ # assert_equal ["ENSG00000089250", "ENSG00000013503", "ENSG00000213281"], Organism::Hsa.genes_at_genomic_positions(pos)
58
+ #end
55
59
 
56
60
  end
57
61
 
metadata CHANGED
@@ -1,13 +1,13 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: rbbt-sources
3
3
  version: !ruby/object:Gem::Version
4
- hash: 15
5
- prerelease:
4
+ hash: 23
5
+ prerelease: false
6
6
  segments:
7
+ - 1
7
8
  - 0
8
- - 4
9
9
  - 0
10
- version: 0.4.0
10
+ version: 1.0.0
11
11
  platform: ruby
12
12
  authors:
13
13
  - Miguel Vazquez
@@ -15,7 +15,7 @@ autorequire:
15
15
  bindir: bin
16
16
  cert_chain: []
17
17
 
18
- date: 2011-03-23 00:00:00 +01:00
18
+ date: 2011-09-07 00:00:00 +02:00
19
19
  default_executable:
20
20
  dependencies:
21
21
  - !ruby/object:Gem::Dependency
@@ -26,10 +26,12 @@ dependencies:
26
26
  requirements:
27
27
  - - ">="
28
28
  - !ruby/object:Gem::Version
29
- hash: 3
29
+ hash: 63
30
30
  segments:
31
+ - 4
31
32
  - 0
32
- version: "0"
33
+ - 0
34
+ version: 4.0.0
33
35
  type: :runtime
34
36
  version_requirements: *id001
35
37
  - !ruby/object:Gem::Dependency
@@ -74,6 +76,20 @@ dependencies:
74
76
  version: "0"
75
77
  type: :runtime
76
78
  version_requirements: *id004
79
+ - !ruby/object:Gem::Dependency
80
+ name: bio
81
+ prerelease: false
82
+ requirement: &id005 !ruby/object:Gem::Requirement
83
+ none: false
84
+ requirements:
85
+ - - ">="
86
+ - !ruby/object:Gem::Version
87
+ hash: 3
88
+ segments:
89
+ - 0
90
+ version: "0"
91
+ type: :runtime
92
+ version_requirements: *id005
77
93
  description: Data sources like PubMed, Entrez Gene, or Gene Ontology
78
94
  email: miguel.vazquez@fdi.ucm.es
79
95
  executables: []
@@ -83,28 +99,37 @@ extensions: []
83
99
  extra_rdoc_files: []
84
100
 
85
101
  files:
102
+ - etc/biomart/missing_in_archive
103
+ - lib/rbbt/sources/COSMIC.rb
86
104
  - lib/rbbt/sources/COSTART.rb
87
105
  - lib/rbbt/sources/CTCAE.rb
106
+ - lib/rbbt/sources/InterPro.rb
107
+ - lib/rbbt/sources/NCI.rb
88
108
  - lib/rbbt/sources/bibtex.rb
89
109
  - lib/rbbt/sources/biomart.rb
90
110
  - lib/rbbt/sources/entrez.rb
91
111
  - lib/rbbt/sources/go.rb
92
112
  - lib/rbbt/sources/gscholar.rb
113
+ - lib/rbbt/sources/jochem.rb
93
114
  - lib/rbbt/sources/organism.rb
94
115
  - lib/rbbt/sources/organism/sequence.rb
95
116
  - lib/rbbt/sources/polysearch.rb
96
117
  - lib/rbbt/sources/pubmed.rb
118
+ - lib/rbbt/sources/wgEncodeBroadHmm.rb
119
+ - share/install/InterPro/Rakefile
120
+ - share/install/JoChem/Rakefile
121
+ - share/install/NCI/Rakefile
97
122
  - share/install/Organism/Hsa/Rakefile
98
123
  - share/install/Organism/Rno/Rakefile
99
124
  - share/install/Organism/Sce/Rakefile
100
125
  - share/install/Organism/organism_helpers.rb
101
126
  - share/install/lib/helpers.rb
102
- - test/rbbt/sources/test_biomart.rb
127
+ - test/test_helper.rb
103
128
  - test/rbbt/sources/test_entrez.rb
129
+ - test/rbbt/sources/test_pubmed.rb
104
130
  - test/rbbt/sources/test_go.rb
131
+ - test/rbbt/sources/test_biomart.rb
105
132
  - test/rbbt/sources/test_organism.rb
106
- - test/rbbt/sources/test_pubmed.rb
107
- - test/test_helper.rb
108
133
  has_rdoc: true
109
134
  homepage: http://github.com/mikisvaz/rbbt-sources
110
135
  licenses: []
@@ -135,14 +160,14 @@ required_rubygems_version: !ruby/object:Gem::Requirement
135
160
  requirements: []
136
161
 
137
162
  rubyforge_project:
138
- rubygems_version: 1.4.2
163
+ rubygems_version: 1.3.7
139
164
  signing_key:
140
165
  specification_version: 3
141
166
  summary: Data sources for the Ruby Bioinformatics Toolkit (rbbt)
142
167
  test_files:
143
- - test/rbbt/sources/test_biomart.rb
168
+ - test/test_helper.rb
144
169
  - test/rbbt/sources/test_entrez.rb
170
+ - test/rbbt/sources/test_pubmed.rb
145
171
  - test/rbbt/sources/test_go.rb
172
+ - test/rbbt/sources/test_biomart.rb
146
173
  - test/rbbt/sources/test_organism.rb
147
- - test/rbbt/sources/test_pubmed.rb
148
- - test/test_helper.rb