rbbt-sources 3.2.15 → 3.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: df44bcf0d03a785f8aa9b36b123491ed49187f710e70a346b645f257701a0ac2
4
- data.tar.gz: feef523710ea56093cdf4ff2df36d28f57a426a906e13ce3edbe6f71f7272452
3
+ metadata.gz: b10dbe140b4c0733476823e5f5d94e57a3d9a755fc370f6b9640d1e7b8efc368
4
+ data.tar.gz: 38aaf56670a07537ad0ef0c025d17e655fc5d7fb87d97ee1c08d0af82c44fbbd
5
5
  SHA512:
6
- metadata.gz: 3766aa7ce01f4ad44b7f759faa7b2790d4cdd3808a546978a06312f95662aa1ba6dc8d916c8b29d3d8f10699adc21cb80e55a496a2d8c9ec5a39191cdcd415d0
7
- data.tar.gz: 4882abf0ac721753c7f31e2f85d66e3f537c6b28b4cb62337b76031d1109a89c1cfb7c6409c535a3f49990c6ce4b32a76c476da6c7736361480ea423d0b0a1c9
6
+ metadata.gz: a8ac9df1da30fc7aec3c54a5a200a0c7a9629807b9238089a1e8064e78b0ecd5bad36c4b6a77fac7e7cfdf332ad56be06149b12d0e0fd7f6506b0b82d2e03bcf
7
+ data.tar.gz: acff50e8bdb0d4443c3e1dbd237539953206b7d5dcb886db64ec0677f7bba43cf3a9782e4147985a9b3fc1b34df692e89fb2b7185f2aa0f93ccd196a4d19d54a
@@ -1,6 +1,8 @@
1
1
  may2009
2
2
  feb2014
3
3
  may2017
4
+ oct2018
4
5
  apr2019
5
6
  feb2021
6
7
  feb2023
8
+ oct2016
@@ -14,7 +14,7 @@ module PRO
14
14
  #self.search_paths[:default] = :lib
15
15
 
16
16
  PRO.claim PRO.identifiers, :proc do
17
- url = "ftp://ftp.pir.georgetown.edu/databases/ontology/pro_obo/PRO_mappings/uniprotmapping.txt"
17
+ url = "ftp://ftp.proteininformationresource.org/databases/ontology/pro_obo/PRO_mappings/uniprotmapping.txt"
18
18
 
19
19
  dumper = TSV::Dumper.new :key_field => "PRO ID", :fields => ["UniProt/SwissProt Accession"], :type => :double, :namespace => PRO.organism
20
20
  dumper.init
@@ -22,7 +22,7 @@ module PRO
22
22
  pro, uni = line.split("\t")
23
23
  [pro, [uni.split(":").last]]
24
24
  end
25
- TSV.collapse_stream dumper
25
+ dumper.tsv merge: true
26
26
  end
27
27
 
28
28
  PRO.claim PRO.uniprot_equivalences, :proc do
@@ -15,7 +15,7 @@ module BioMart
15
15
 
16
16
  BIOMART_URL = 'http://www.ensembl.org/biomart/martservice?query='
17
17
 
18
- MISSING_IN_ARCHIVE = Rbbt.etc.biomart.missing_in_archive.exists? ? Rbbt.etc.biomart.missing_in_archive.yaml : {}
18
+ MISSING_IN_ARCHIVE = Rbbt.etc.biomart.missing_in_archive.exists? ? Rbbt.etc.biomart.missing_in_archive.find.yaml : {}
19
19
 
20
20
  private
21
21
 
@@ -33,7 +33,7 @@ module BioMart
33
33
 
34
34
  def self.set_archive(date)
35
35
  if defined? Rbbt and Rbbt.etc.allowed_biomart_archives.exists?
36
- raise "Biomart archive #{ date } is not allowed in this installation" unless Rbbt.etc.allowed_biomart_archives.read.split("\n").include? date
36
+ raise "Biomart archive #{ date } is not allowed in this installation" unless Rbbt.etc.allowed_biomart_archives.find.read.split("\n").include? date
37
37
  end
38
38
  Thread.current['archive'] = date
39
39
  Thread.current['archive_url'] = BIOMART_URL.sub(/www/, date + '.archive')
@@ -18,7 +18,7 @@ module GO
18
18
 
19
19
 
20
20
  MULTIPLE_VALUE_FIELDS = %w(is_a)
21
- TSV_GENE_ONTOLOGY = File.join(Persist.cachedir, 'gene_ontology')
21
+ #TSV_GENE_ONTOLOGY = File.join(Persist.cachedir, 'gene_ontology')
22
22
 
23
23
  # This method needs to be called before any translations can be made, it is
24
24
  # called automatically the first time the id2name method is called. It loads
@@ -241,11 +241,13 @@ module PubMed
241
241
  pmids = [pmids] unless Array === pmids
242
242
  pmids = pmids.compact.collect{|id| id}
243
243
 
244
+ chunk_size = 50
244
245
  result_files = FileCache.cache_online_elements(pmids, 'pubmed-{ID}.xml') do |ids|
245
246
  result = {}
246
247
  values = []
247
- chunks = Misc.divide(ids, (ids.length / 20) + 1)
248
+ chunks = Misc.divide(ids, (ids.length / chunk_size) + 1)
248
249
  Log::ProgressBar.with_bar(chunks.length, :desc => "Downloading articles from PubMed") do |bar|
250
+ bar.init
249
251
  chunks.each do |list|
250
252
  begin
251
253
  Misc.try3times do
@@ -19,7 +19,11 @@ module Signor
19
19
  end
20
20
 
21
21
  Signor.claim Signor.data, :proc do
22
- Signor[".source/all.csv"].tsv :header_hash => '', :merge => true, :zipped => true
22
+ begin
23
+ Signor[".source/all.csv"].tsv :header_hash => '', :merge => true, :zipped => true
24
+ rescue
25
+ Signor[".source/all.csv"].tsv :header_hash => '', :merge => true, :one2one => true
26
+ end
23
27
  end
24
28
 
25
29
  Signor.claim Signor.protein_protein, :proc do
@@ -57,7 +61,7 @@ module Signor
57
61
  #uni2name = Organism.identifiers(organism).index :target => "Associated Gene Name", :fields => ["UniProt/SwissProt Accession"], :persist => true
58
62
  uni2name = UniProt.identifiers.Hsa.index :target => "Associated Gene Name", :fields => ["UniProt/SwissProt Accession"], :persist => true
59
63
 
60
- parser = TSV::Parser.new Signor.data
64
+ parser = TSV::Parser.new Signor.data.produce
61
65
  fields = parser.fields
62
66
  dumper = TSV::Dumper.new :key_field => "Source (UniProt/SwissProt Accession)", :fields => ["Target (Associated Gene Name)", "Effect", "Sign", "PMID"], :type => :double, :merge => true, :organism => Signor.organism
63
67
  dumper.init
@@ -114,6 +114,7 @@ module TFactS
114
114
  pmids = "" if pmids.nil?
115
115
 
116
116
  values = [target, "", species, source, pmids]
117
+ values = values.collect{|v| [v]}
117
118
  tsv.zip_new(tf, values)
118
119
  end
119
120
 
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: rbbt-sources
3
3
  version: !ruby/object:Gem::Version
4
- version: 3.2.15
4
+ version: 3.3.0
5
5
  platform: ruby
6
6
  authors:
7
7
  - Miguel Vazquez
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2023-03-29 00:00:00.000000000 Z
11
+ date: 2023-12-21 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: rbbt-util
@@ -24,20 +24,6 @@ dependencies:
24
24
  - - ">="
25
25
  - !ruby/object:Gem::Version
26
26
  version: 4.0.0
27
- - !ruby/object:Gem::Dependency
28
- name: nokogiri
29
- requirement: !ruby/object:Gem::Requirement
30
- requirements:
31
- - - ">="
32
- - !ruby/object:Gem::Version
33
- version: '0'
34
- type: :runtime
35
- prerelease: false
36
- version_requirements: !ruby/object:Gem::Requirement
37
- requirements:
38
- - - ">="
39
- - !ruby/object:Gem::Version
40
- version: '0'
41
27
  - !ruby/object:Gem::Dependency
42
28
  name: net-ftp
43
29
  requirement: !ruby/object:Gem::Requirement
@@ -178,24 +164,24 @@ required_rubygems_version: !ruby/object:Gem::Requirement
178
164
  - !ruby/object:Gem::Version
179
165
  version: '0'
180
166
  requirements: []
181
- rubygems_version: 3.4.8
167
+ rubygems_version: 3.5.0.dev
182
168
  signing_key:
183
169
  specification_version: 4
184
170
  summary: Data sources for the Ruby Bioinformatics Toolkit (rbbt)
185
171
  test_files:
172
+ - test/rbbt/sources/test_HPRD.rb
173
+ - test/rbbt/sources/test_biomart.rb
174
+ - test/rbbt/sources/test_entrez.rb
186
175
  - test/rbbt/sources/test_go.rb
187
- - test/rbbt/sources/test_pubmed.rb
188
- - test/rbbt/sources/test_pina.rb
189
- - test/rbbt/sources/test_pharmagkb.rb
176
+ - test/rbbt/sources/test_gscholar.rb
177
+ - test/rbbt/sources/test_kegg.rb
178
+ - test/rbbt/sources/test_matador.rb
190
179
  - test/rbbt/sources/test_organism.rb
191
- - test/rbbt/sources/test_synapse.rb
192
- - test/rbbt/sources/test_entrez.rb
180
+ - test/rbbt/sources/test_pharmagkb.rb
181
+ - test/rbbt/sources/test_pina.rb
182
+ - test/rbbt/sources/test_pubmed.rb
193
183
  - test/rbbt/sources/test_stitch.rb
194
- - test/rbbt/sources/test_biomart.rb
195
- - test/rbbt/sources/test_HPRD.rb
196
184
  - test/rbbt/sources/test_string.rb
197
- - test/rbbt/sources/test_kegg.rb
185
+ - test/rbbt/sources/test_synapse.rb
198
186
  - test/rbbt/sources/test_tfacts.rb
199
- - test/rbbt/sources/test_matador.rb
200
- - test/rbbt/sources/test_gscholar.rb
201
187
  - test/test_helper.rb