gfa 0.9.3 → 0.9.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (4) hide show
  1. checksums.yaml +4 -4
  2. data/lib/gfa/parser.rb +13 -10
  3. data/lib/gfa/version.rb +1 -1
  4. metadata +2 -2
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: 8919a697174aabef8c92bf7024d855c31c2adce2402e05474882cc03754e9ce2
4
- data.tar.gz: 3a03b9fd5446938df35974eb0e225a35ecdc69539546ff0c6873fdba0cb28928
3
+ metadata.gz: 77b3aea84dc5c5a0411e66da4947f418c051550c62c401a3eadb50043ec6ae0c
4
+ data.tar.gz: 9e901a36a7a22fa368b17e91b330dc4848dac8b647c684753618e7acef2ae1f1
5
5
  SHA512:
6
- metadata.gz: f72d49eb2fa08a89a8bf919cbc73161f65a1c2d083aa783856f33a5d872895a450d6de87a52977bfe69e5de35b0677cd00473b73d6a515449407c3705cfa3744
7
- data.tar.gz: b57b09ffd99e0744fbf686d328acf778d4dcb502ae88cb79cfc3722d2c0b0d415569db0a9cce27367e6c16048ac3788efd7d4af3bfa2f3bbce7e66fad8b0f776
6
+ metadata.gz: 84e37302e32e089c7644a2934bf3a101e064faff9fbbf2b36c82d24b3a99e2333a73fb0858a739f8857b08a464ad60858edf8ff074247490133ff40410099cc8
7
+ data.tar.gz: ec3c85a3da565babb7a0f1538a52321e567366cc56fcde09a82367b683669a57259a0603045b979205c763ad3198d7432edbe452fcdd20e66406036ed846fb3d
data/lib/gfa/parser.rb CHANGED
@@ -11,6 +11,8 @@ class GFA
11
11
  # - index_id: If the records should also be index by ID (default: false)
12
12
  # - comments: If the comment records should be saved (default: false)
13
13
  # - line_range: Two-integer array indicating the first and last lines to read
14
+ # - file_seek: Seek to this file position before start reading
15
+ # - until_line: Read until reaching this line only
14
16
  # (default: nil, read the entire file)
15
17
  def self.load(file, opts = {})
16
18
  gfa = GFA.new(opts)
@@ -23,11 +25,11 @@ class GFA
23
25
  def self.read_records(file, opts = {})
24
26
  rng = opts[:line_range]
25
27
  File.open(file, 'r') do |fh|
26
- lno = -1
27
- fh.each do |ln|
28
- lno += 1
29
- next if !rng.nil? && (lno < rng[0] || lno > rng[1])
30
- next if !opts[:comments] && ln[0] == '#'
28
+ fh.seek(opts[:file_seek], :SET) unless opts[:file_seek].nil?
29
+ fh.each_with_index do |ln, lno|
30
+ next if !rng.nil? && (lno < rng[0] || lno > rng[1])
31
+ break if !opts[:until_line].nil? && (lno == opts[:until_line])
32
+ next if !opts[:comments] && ln[0] == '#'
31
33
 
32
34
  yield(GFA::Record[ln])
33
35
  end
@@ -42,10 +44,10 @@ class GFA
42
44
  return self.load(file, opts) if thr < 1
43
45
 
44
46
  # Prepare data
45
- lno = 0
46
- File.open(file, 'r') { |fh| fh.each { lno += 1 } }
47
- thr = lno if thr > lno
48
- blk = (lno.to_f / thr).ceil
47
+ lsize = []
48
+ File.open(file, 'r') { |fh| fh.each { |ln| lsize << ln.size } }
49
+ thr = [lsize.size, thr].min
50
+ blk = (lsize.size.to_f / thr).ceil
49
51
 
50
52
  # Launch children processes
51
53
  advance_bar(blk + 1)
@@ -55,7 +57,8 @@ class GFA
55
57
  io[i] = IO.pipe
56
58
  pid << fork do
57
59
  io[i][0].close
58
- o = opts.merge(line_range: [i * blk, (i + 1) * blk - 1])
60
+ o = opts.merge(file_seek: lsize[0, blk * i].inject(:+), until_line: blk)
61
+ #o = opts.merge(line_range: [i * blk, (i + 1) * blk - 1])
59
62
  records = []
60
63
  read_records(file, o) do |record|
61
64
  records << record
data/lib/gfa/version.rb CHANGED
@@ -1,5 +1,5 @@
1
1
  class GFA
2
- VERSION = '0.9.3'
2
+ VERSION = '0.9.4'
3
3
  VERSION_ARRAY = VERSION.split(/\./).map { |x| x.to_i } # :nodoc:
4
4
  VERSION_MAJOR = VERSION_ARRAY[0] # :nodoc:
5
5
  VERSION_MINOR = VERSION_ARRAY[1] # :nodoc:
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: gfa
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.9.3
4
+ version: 0.9.4
5
5
  platform: ruby
6
6
  authors:
7
7
  - Luis M. Rodriguez-R
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2024-08-30 00:00:00.000000000 Z
11
+ date: 2024-09-01 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: rgl