genecache 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA1:
3
+ metadata.gz: 15de64a20d8f2335e5c101e3d93045ad3a78c6be
4
+ data.tar.gz: 35c7e5cdb8309c2ac1d1ce775ee8bad258d3128f
5
+ SHA512:
6
+ metadata.gz: 7e95d8bc1be6881cb5464c70ee6d0c5d7ee41a9bf15bf99d762c283f89f8d6926786030a1ae623fe7cd33036e26b846059b12fbab6f070c37f0b4e63e374f8a4
7
+ data.tar.gz: 129d3188032666eafa3903ad92092a6bb03f2139c66f7a1537e436bc4f72088fea453598d1819c9af2b6b1af0b01f24b30f16c557185747336a485bad78e207c
@@ -0,0 +1,17 @@
1
+ *.gem
2
+ *.rbc
3
+ .bundle
4
+ .config
5
+ .yardoc
6
+ Gemfile.lock
7
+ InstalledFiles
8
+ _yardoc
9
+ coverage
10
+ doc/
11
+ lib/bundler/man
12
+ pkg
13
+ rdoc
14
+ spec/reports
15
+ test/tmp
16
+ test/version_tmp
17
+ tmp
data/Gemfile ADDED
@@ -0,0 +1,4 @@
1
+ source 'https://rubygems.org'
2
+
3
+ # Specify your gem's dependencies in genecache.gemspec
4
+ gemspec
@@ -0,0 +1,22 @@
1
+ Copyright (c) 2013 Fedor Gusev
2
+
3
+ MIT License
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining
6
+ a copy of this software and associated documentation files (the
7
+ "Software"), to deal in the Software without restriction, including
8
+ without limitation the rights to use, copy, modify, merge, publish,
9
+ distribute, sublicense, and/or sell copies of the Software, and to
10
+ permit persons to whom the Software is furnished to do so, subject to
11
+ the following conditions:
12
+
13
+ The above copyright notice and this permission notice shall be
14
+ included in all copies or substantial portions of the Software.
15
+
16
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
17
+ EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
18
+ MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
19
+ NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
20
+ LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
21
+ OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
22
+ WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
@@ -0,0 +1,32 @@
1
+ # Genecache
2
+
3
+ Simple and fast conversion of GENE IDs. Major source of data is http://biodb.jp. Conversion tables are downloaded and stored in local SQLite database for very fast access.
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ gem 'genecache'
10
+
11
+ And then execute:
12
+
13
+ $ bundle
14
+
15
+ Or install it yourself as:
16
+
17
+ $ gem install genecache
18
+
19
+ ## Usage
20
+
21
+ require 'genecache'
22
+
23
+ GeneCache.convert('hsa', 'ensg_id', 'omim_id', 'ENSG00000142192') # APP
24
+ # returns ['104300', '104760', '605714']
25
+
26
+ ## Contributing
27
+
28
+ 1. Fork it
29
+ 2. Create your feature branch (`git checkout -b my-new-feature`)
30
+ 3. Commit your changes (`git commit -am 'Add some feature'`)
31
+ 4. Push to the branch (`git push origin my-new-feature`)
32
+ 5. Create new Pull Request
@@ -0,0 +1 @@
1
+ require "bundler/gem_tasks"
@@ -0,0 +1,27 @@
1
+ # coding: utf-8
2
+ lib = File.expand_path('../lib', __FILE__)
3
+ $LOAD_PATH.unshift(lib) unless $LOAD_PATH.include?(lib)
4
+ require 'genecache/version'
5
+
6
+ Gem::Specification.new do |spec|
7
+ spec.name = "genecache"
8
+ spec.version = Genecache::VERSION
9
+ spec.authors = ["Fedor Gusev"]
10
+ spec.email = ["gusevfe@gmail.com"]
11
+ spec.description = %q{Very simple GENE ID conversion tool with a local SQLite3 DB for caching}
12
+ spec.summary = %q{Simple and fast conversion of GENE IDs. Major source of data is http://biodb.jp. Conversion tables are downloaded and stored in local SQLite database for very fast access.}
13
+ spec.homepage = ""
14
+ spec.license = "MIT"
15
+
16
+ spec.files = `git ls-files`.split($/)
17
+ spec.executables = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
18
+ spec.test_files = spec.files.grep(%r{^(test|spec|features)/})
19
+ spec.require_paths = ["lib"]
20
+
21
+ spec.add_development_dependency "bundler", "~> 1.3"
22
+ spec.add_development_dependency "rake"
23
+ spec.add_development_dependency "rspec"
24
+
25
+ spec.add_dependency 'sqlite3'
26
+ spec.add_dependency 'zipruby'
27
+ end
@@ -0,0 +1,65 @@
1
+ require "genecache/version"
2
+ require 'open-uri'
3
+ require 'zipruby'
4
+ require 'csv'
5
+ require 'tempfile'
6
+ require 'sqlite3'
7
+ require 'logger'
8
+ require 'fileutils'
9
+
10
+ $log = Logger.new STDERR
11
+
12
+ # TODO: check we have working sqlite3 executable for fast import of data
13
+
14
+ class GeneCache
15
+ def self.db_path
16
+ FileUtils.mkdir_p ENV['HOME'] + "/.genecache"
17
+ return ENV['HOME'] + "/.genecache/db.sqlite3"
18
+ end
19
+
20
+ @@db = SQLite3::Database.new GeneCache.db_path
21
+ @@tables = @@db.execute("SELECT name FROM sqlite_master where type = 'table'")
22
+
23
+ def self.convert(species, from, to, id)
24
+ table = "#{species}_#{from}_#{to}"
25
+ unless @@tables.include?([table])
26
+ # TODO: Update table sometimes!
27
+ self.download!(species, from, to)
28
+ end
29
+
30
+ r = @@db.execute "select #{to} from #{table} where #{from} = '#{id}'"
31
+ r.flatten
32
+ end
33
+
34
+ def self.download!(species, from, to)
35
+ table = "#{species}_#{from}_#{to}"
36
+ $log.info "Downloading table: #{table}"
37
+ @@db.execute "drop table if exists #{table}"
38
+ @@db.execute "drop index if exists from_index"
39
+ @@db.execute "drop index if exists to_index"
40
+
41
+ url = "http://biodb.jp/tmp/#{table}.zip"
42
+ zip_data = open(url).read
43
+
44
+ Zip::Archive.open_buffer(zip_data) do |ar|
45
+ ar.fopen(0) do |f|
46
+ tmp = Tempfile.new 'biodb'
47
+ data = f.read.split("\n")
48
+ header = data.first.split
49
+ throw "Invalid header!" if header.sort != [from, to].sort
50
+ @@db.execute "create table #{table} (#{header.first} VARCHAR(255), #{header.last} VARCHAR(255))"
51
+
52
+ rest = data[1..-5] * "\n"
53
+ tmp.write rest
54
+ tmp.close
55
+
56
+ system(%$echo -e ".mode tabs \\n.import #{File.expand_path(tmp.path)} #{table}" | sqlite3 #{self.db_path}$)
57
+ @@db.execute "create index from_index on #{table} (#{header.first})"
58
+ @@db.execute "create index to_index on #{table} (#{header.last})"
59
+ end
60
+
61
+ # Update local list of tables
62
+ @@tables = @@db.execute("SELECT name FROM sqlite_master where type = 'table' and name = '#{table}'")
63
+ end
64
+ end
65
+ end
@@ -0,0 +1,3 @@
1
+ module Genecache
2
+ VERSION = "0.0.1"
3
+ end
@@ -0,0 +1,8 @@
1
+ require 'spec_helper'
2
+
3
+ describe GeneCache do
4
+ it "does the job" do
5
+ r = GeneCache.convert('hsa', 'ensg_id', 'omim_id', 'ENSG00000142192') # APP
6
+ expect(r.sort).to eq(%w{104300 104760 605714}.sort)
7
+ end
8
+ end
@@ -0,0 +1,8 @@
1
+ require 'rubygems'
2
+ require 'bundler/setup'
3
+
4
+ require 'genecache' # and any other gems you need
5
+
6
+ RSpec.configure do |config|
7
+ # some (optional) config here
8
+ end
metadata ADDED
@@ -0,0 +1,129 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: genecache
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.0.1
5
+ platform: ruby
6
+ authors:
7
+ - Fedor Gusev
8
+ autorequire:
9
+ bindir: bin
10
+ cert_chain: []
11
+ date: 2013-12-22 00:00:00.000000000 Z
12
+ dependencies:
13
+ - !ruby/object:Gem::Dependency
14
+ name: bundler
15
+ requirement: !ruby/object:Gem::Requirement
16
+ requirements:
17
+ - - ~>
18
+ - !ruby/object:Gem::Version
19
+ version: '1.3'
20
+ type: :development
21
+ prerelease: false
22
+ version_requirements: !ruby/object:Gem::Requirement
23
+ requirements:
24
+ - - ~>
25
+ - !ruby/object:Gem::Version
26
+ version: '1.3'
27
+ - !ruby/object:Gem::Dependency
28
+ name: rake
29
+ requirement: !ruby/object:Gem::Requirement
30
+ requirements:
31
+ - - '>='
32
+ - !ruby/object:Gem::Version
33
+ version: '0'
34
+ type: :development
35
+ prerelease: false
36
+ version_requirements: !ruby/object:Gem::Requirement
37
+ requirements:
38
+ - - '>='
39
+ - !ruby/object:Gem::Version
40
+ version: '0'
41
+ - !ruby/object:Gem::Dependency
42
+ name: rspec
43
+ requirement: !ruby/object:Gem::Requirement
44
+ requirements:
45
+ - - '>='
46
+ - !ruby/object:Gem::Version
47
+ version: '0'
48
+ type: :development
49
+ prerelease: false
50
+ version_requirements: !ruby/object:Gem::Requirement
51
+ requirements:
52
+ - - '>='
53
+ - !ruby/object:Gem::Version
54
+ version: '0'
55
+ - !ruby/object:Gem::Dependency
56
+ name: sqlite3
57
+ requirement: !ruby/object:Gem::Requirement
58
+ requirements:
59
+ - - '>='
60
+ - !ruby/object:Gem::Version
61
+ version: '0'
62
+ type: :runtime
63
+ prerelease: false
64
+ version_requirements: !ruby/object:Gem::Requirement
65
+ requirements:
66
+ - - '>='
67
+ - !ruby/object:Gem::Version
68
+ version: '0'
69
+ - !ruby/object:Gem::Dependency
70
+ name: zipruby
71
+ requirement: !ruby/object:Gem::Requirement
72
+ requirements:
73
+ - - '>='
74
+ - !ruby/object:Gem::Version
75
+ version: '0'
76
+ type: :runtime
77
+ prerelease: false
78
+ version_requirements: !ruby/object:Gem::Requirement
79
+ requirements:
80
+ - - '>='
81
+ - !ruby/object:Gem::Version
82
+ version: '0'
83
+ description: Very simple GENE ID conversion tool with a local SQLite3 DB for caching
84
+ email:
85
+ - gusevfe@gmail.com
86
+ executables: []
87
+ extensions: []
88
+ extra_rdoc_files: []
89
+ files:
90
+ - .gitignore
91
+ - Gemfile
92
+ - LICENSE.txt
93
+ - README.md
94
+ - Rakefile
95
+ - genecache.gemspec
96
+ - lib/genecache.rb
97
+ - lib/genecache/version.rb
98
+ - spec/genecache_spec.rb
99
+ - spec/spec_helper.rb
100
+ homepage: ''
101
+ licenses:
102
+ - MIT
103
+ metadata: {}
104
+ post_install_message:
105
+ rdoc_options: []
106
+ require_paths:
107
+ - lib
108
+ required_ruby_version: !ruby/object:Gem::Requirement
109
+ requirements:
110
+ - - '>='
111
+ - !ruby/object:Gem::Version
112
+ version: '0'
113
+ required_rubygems_version: !ruby/object:Gem::Requirement
114
+ requirements:
115
+ - - '>='
116
+ - !ruby/object:Gem::Version
117
+ version: '0'
118
+ requirements: []
119
+ rubyforge_project:
120
+ rubygems_version: 2.0.2
121
+ signing_key:
122
+ specification_version: 4
123
+ summary: Simple and fast conversion of GENE IDs. Major source of data is http://biodb.jp.
124
+ Conversion tables are downloaded and stored in local SQLite database for very fast
125
+ access.
126
+ test_files:
127
+ - spec/genecache_spec.rb
128
+ - spec/spec_helper.rb
129
+ has_rdoc: