PRbed 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,7 @@
1
+ ---
2
+ SHA256:
3
+ metadata.gz: 46d90436d24fa45018d5edf825ba7f686fd1be4b658810790ed4228a4efad27a
4
+ data.tar.gz: d7b280dc3a680d456bbb379da04c372f969b4620302ed5a37cd099a7c4ed58c4
5
+ SHA512:
6
+ metadata.gz: 70feca0fe8180d84c7ada8e44bcaf1be6a6d3b4744533c240a796376ee8387d04b97d30983ecb630c73e872336b4224de617e2610e5b23966903938e9fd23a5e
7
+ data.tar.gz: a69beb9d167cb621531eeff54cd3d9b025c65e4e61c236ab0721f9c87ec69ece61fb8bfcd7449dba3bb13576ac7169b950ebca08a586fdfefc9ace1a1ecf9d34
@@ -0,0 +1,9 @@
1
+ /.bundle/
2
+ /.yardoc
3
+ /_yardoc/
4
+ /coverage/
5
+ /doc/
6
+ /pkg/
7
+ /spec/reports/
8
+ /tmp/
9
+ Gemfile.lock
@@ -0,0 +1,6 @@
1
+ ---
2
+ language: ruby
3
+ cache: bundler
4
+ rvm:
5
+ - 2.7.1
6
+ before_install: gem install bundler -v 2.1.4
data/Gemfile ADDED
@@ -0,0 +1,7 @@
1
+ source "https://rubygems.org"
2
+
3
+ # Specify your gem's dependencies in PRbed.gemspec
4
+ gemspec
5
+
6
+ gem "rake", "~> 12.0"
7
+ gem "minitest", "~> 5.0"
data/LICENSE ADDED
@@ -0,0 +1,21 @@
1
+ MIT License
2
+
3
+ Copyright (c) 2020 holrock <ispeporez@gmail.com>
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
@@ -0,0 +1,23 @@
1
+ require_relative 'lib/PRbed/version'
2
+
3
# Gem specification for PRbed: identity, metadata and the list of packaged files.
Gem::Specification.new do |gem|
  gem.name    = "PRbed"
  gem.version = PRbed::VERSION
  gem.authors = ["holrock"]
  gem.email   = ["ispeporez@gmail.com"]

  gem.summary     = %q{PLINK bed file reader}
  gem.description = %q{pure ruby implementation of PLINK bed file stream reader}
  gem.homepage    = "https://github.com/holrock/PRbed"
  gem.license     = "MIT"
  gem.required_ruby_version = Gem::Requirement.new(">= 2.3.0")

  # Package every git-tracked file except those under test/, spec/ or features/.
  # `git ls-files -z` is run from the directory that contains this gemspec and
  # separates the paths with NUL bytes.
  project_root = File.expand_path('..', __FILE__)
  gem.files = Dir.chdir(project_root) do
    tracked_paths = `git ls-files -z`.split("\x0")
    tracked_paths.reject { |path| path.match(%r{^(test|spec|features)/}) }
  end

  # Executables are whatever packaged files live under exe/.
  gem.bindir        = "exe"
  gem.executables   = gem.files.grep(%r{^exe/}) { |path| File.basename(path) }
  gem.require_paths = ["lib"]
end
@@ -0,0 +1,40 @@
1
+ # PRbed
2
+
3
+ A pure-Ruby streaming reader for PLINK `.bed` files.
4
+
5
+ ## Installation
6
+
7
+ Add this line to your application's Gemfile:
8
+
9
+ ```ruby
10
+ gem 'PRbed'
11
+ ```
12
+
13
+ And then execute:
14
+
15
+ $ bundle install
16
+
17
+ Or install it yourself as:
18
+
19
+ $ gem install PRbed
20
+
21
+ ## Usage
22
+
23
+ ```ruby
24
+ require "PRbed"
25
+ r = PRbed::Reader.new("test/test") # bfile prefix
26
+ r.each_variants do |variant, fam, genotypes|
27
+ p [variant, fam, genotypes]
28
+ end
29
+ ```
30
+
31
+ ## Development
32
+
33
+ After checking out the repo, run `bin/setup` to install dependencies. Then, run `rake test` to run the tests. You can also run `bin/console` for an interactive prompt that will allow you to experiment.
34
+
35
+ To install this gem onto your local machine, run `bundle exec rake install`. To release a new version, update the version number in `version.rb`, and then run `bundle exec rake release`, which will create a git tag for the version, push git commits and tags, and push the `.gem` file to [rubygems.org](https://rubygems.org).
36
+
37
+ ## Contributing
38
+
39
+ Bug reports and pull requests are welcome on GitHub at https://github.com/holrock/PRbed.
40
+
@@ -0,0 +1,10 @@
1
+ require "bundler/gem_tasks"
2
+ require "rake/testtask"
3
+
4
# Defines `rake test`: adds test/ and lib/ to the load path and runs every
# file matching test/**/*_test.rb.
Rake::TestTask.new(:test) do |test_task|
  test_task.libs.push("test", "lib")
  test_task.test_files = FileList["test/**/*_test.rb"]
end

# A bare `rake` invocation runs the test task.
task default: :test
@@ -0,0 +1,14 @@
1
+ #!/usr/bin/env ruby
2
+
3
+ require "bundler/setup"
4
+ require "PRbed"
5
+
6
+ # You can add fixtures and/or initialization code here to make experimenting
7
+ # with your gem easier. You can also use a different console, if you like.
8
+
9
+ # (If you use this, don't forget to add pry to your Gemfile!)
10
+ # require "pry"
11
+ # Pry.start
12
+
13
+ require "irb"
14
+ IRB.start(__FILE__)
@@ -0,0 +1,8 @@
1
+ #!/usr/bin/env bash
2
+ set -euo pipefail
3
+ IFS=$'\n\t'
4
+ set -vx
5
+
6
+ bundle install
7
+
8
+ # Do any other automated setup that you need to do here
@@ -0,0 +1,94 @@
1
+ require "PRbed/version"
2
+
3
module PRbed
  # Raised when a .bed file does not start with the expected header bytes or
  # ends before every variant listed in the .bim file has been read.
  class PRBedError < StandardError; end

  # Two-bit genotype codes produced by BytesParser#parse.
  HOMO_A1 = 0
  MISSING = 1
  HETERO = 2
  HOMO_A2 = 3

  # Number of genotype codes packed into one byte of a variant record.
  SAMPLES_PER_BYTE = 4

  # The three bytes every accepted .bed file must start with.
  BED_MAGIC = "\x6c\x1b\x01".b.freeze

  # One row of the .fam file (columns 1, 2, 5 and 6).
  Fam = Struct.new(:fid, :iid, :sex, :phenotype)
  # One row of the .bim file (columns 1, 2, 4, 5 and 6).
  Bim = Struct.new(:chr, :vid, :bp, :a1, :a2)

  # Unpacks the 2-bit genotype codes of one variant record.
  class BytesParser
    # @param nsamples [Integer] number of samples stored per variant
    def initialize(nsamples)
      @nsamples = nsamples
      # Sample count rounded up to a whole number of bytes (multiple of 4).
      @bufsize = (@nsamples + 3) & ~3
    end

    # Decodes one variant record into an array of genotype codes.
    #
    # The lowest two bits of each byte hold the first sample of that byte.
    # Samples not covered by +bs+ are reported as MISSING; bytes beyond the
    # expected record length are ignored, so the result always has exactly
    # +nsamples+ entries.
    #
    # @param bs [String] raw bytes of one variant record
    # @return [Array<Integer>] one code (0..3) per sample
    def parse(bs)
      codes = Array.new(@bufsize, MISSING)
      i = 0
      bs.each_byte do |byte|
        break if i >= @bufsize # surplus input must not grow the result

        codes[i]     = byte & 0b11
        codes[i + 1] = (byte >> 2) & 0b11
        codes[i + 2] = (byte >> 4) & 0b11
        codes[i + 3] = (byte >> 6) & 0b11
        i += SAMPLES_PER_BYTE
      end
      codes.pop(@bufsize - @nsamples) # drop the padding slots of the last byte
      codes
    end
  end

  # Streams genotypes from a PLINK fileset (<prefix>.bed/.bim/.fam).
  class Reader
    attr_reader :fam, :bim

    # Loads the .fam and .bim files eagerly; the .bed file is only opened
    # when iterating.
    #
    # @param bfile [String] fileset path prefix, without extension
    def initialize(bfile)
      @bfile = bfile
      @fam = load_fam("#{bfile}.fam")
      @bim = load_bim("#{bfile}.bim")
    end

    # Yields every variant together with the sample list and its genotypes.
    #
    # @yieldparam variant [Bim] the variant row from the .bim file
    # @yieldparam fam [Array<Fam>] all samples (the same array on every call)
    # @yieldparam genotypes [Array<Integer>] one genotype code per sample
    # @return [self, Enumerator] self when a block is given, otherwise an
    #   Enumerator over the same triples
    # @raise [PRBedError] if the header bytes are wrong or the file is shorter
    #   than the .bim/.fam files require
    def each_variants
      return enum_for(:each_variants) unless block_given?

      nsamples = @fam.size
      # Bytes per variant record: ceil(nsamples / 4).
      nread_bytes = (nsamples + SAMPLES_PER_BYTE - 1) / SAMPLES_PER_BYTE

      File.open("#{@bfile}.bed", "rb") do |f|
        raise PRBedError, "not plink bed file" unless f.read(3) == BED_MAGIC

        parser = BytesParser.new(nsamples)
        buf = String.new # reused as the read buffer for every record
        @bim.each do |variant|
          record = f.read(nread_bytes, buf)
          # IO#read returns nil at EOF and a shorter string on a partial
          # read; either one means the record is incomplete.
          unless record && record.bytesize == nread_bytes
            raise PRBedError, "unexpected file end"
          end

          yield(variant, @fam, parser.parse(record))
        end
      end
      self
    end

    alias_method :each, :each_variants

    private

    # Reads the .fam file into Fam rows. Fields may be separated by any run of
    # spaces or tabs; blank lines are skipped. Columns 3 and 4 are read but
    # not stored.
    #
    # @param fam [String] path to the .fam file
    # @return [Array<Fam>]
    # @raise [ArgumentError] if sex or phenotype is not a decimal integer
    def load_fam(fam)
      rows = []
      File.foreach(fam) do |line|
        fid, iid, _col3, _col4, sex, pheno = line.split
        next if fid.nil? # blank line

        rows << Fam.new(fid, iid, Integer(sex, 10), Integer(pheno, 10))
      end
      rows
    end

    # Reads the .bim file into Bim rows. Fields may be separated by any run of
    # spaces or tabs; blank lines are skipped. Column 3 is read but not stored.
    #
    # @param bim [String] path to the .bim file
    # @return [Array<Bim>]
    # @raise [ArgumentError] if the base-pair position is not a decimal integer
    def load_bim(bim)
      rows = []
      File.foreach(bim) do |line|
        chr, vid, _col3, bp, a1, a2 = line.split
        next if chr.nil? # blank line

        rows << Bim.new(parse_chromosome(chr), vid, Integer(bp, 10), a1, a2)
      end
      rows
    end

    # Returns the chromosome as an Integer when it is numeric, and as the
    # original String otherwise (e.g. "X", "Y", "MT"), so non-numeric
    # chromosome codes no longer abort loading.
    def parse_chromosome(chr)
      # Integer(str, exception: false) needs Ruby 2.6; the gem supports 2.3.
      Integer(chr, 10)
    rescue ArgumentError
      chr
    end
  end
end
@@ -0,0 +1,3 @@
1
module PRbed
  # Version string of the gem; PRbed.gemspec assigns it to spec.version.
  # Frozen so the constant cannot be mutated in place.
  VERSION = "0.1.0".freeze
end
metadata ADDED
@@ -0,0 +1,54 @@
1
+ --- !ruby/object:Gem::Specification
2
+ name: PRbed
3
+ version: !ruby/object:Gem::Version
4
+ version: 0.1.0
5
+ platform: ruby
6
+ authors:
7
+ - holrock
8
+ autorequire:
9
+ bindir: exe
10
+ cert_chain: []
11
+ date: 2020-07-24 00:00:00.000000000 Z
12
+ dependencies: []
13
+ description: pure ruby implementation of PLINK bed file stream reader
14
+ email:
15
+ - ispeporez@gmail.com
16
+ executables: []
17
+ extensions: []
18
+ extra_rdoc_files: []
19
+ files:
20
+ - ".gitignore"
21
+ - ".travis.yml"
22
+ - Gemfile
23
+ - LICENSE
24
+ - PRbed.gemspec
25
+ - README.md
26
+ - Rakefile
27
+ - bin/console
28
+ - bin/setup
29
+ - lib/PRbed.rb
30
+ - lib/PRbed/version.rb
31
+ homepage: https://github.com/holrock/PRbed
32
+ licenses:
33
+ - MIT
34
+ metadata: {}
35
+ post_install_message:
36
+ rdoc_options: []
37
+ require_paths:
38
+ - lib
39
+ required_ruby_version: !ruby/object:Gem::Requirement
40
+ requirements:
41
+ - - ">="
42
+ - !ruby/object:Gem::Version
43
+ version: 2.3.0
44
+ required_rubygems_version: !ruby/object:Gem::Requirement
45
+ requirements:
46
+ - - ">="
47
+ - !ruby/object:Gem::Version
48
+ version: '0'
49
+ requirements: []
50
+ rubygems_version: 3.1.2
51
+ signing_key:
52
+ specification_version: 4
53
+ summary: PLINK bed file reader
54
+ test_files: []