minimap2 0.2.22.0 → 0.2.24.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (101) hide show
  1. checksums.yaml +4 -4
  2. data/README.md +60 -76
  3. data/ext/Rakefile +55 -0
  4. data/ext/cmappy/cmappy.c +129 -0
  5. data/ext/cmappy/cmappy.h +44 -0
  6. data/ext/minimap2/FAQ.md +46 -0
  7. data/ext/minimap2/LICENSE.txt +24 -0
  8. data/ext/minimap2/MANIFEST.in +10 -0
  9. data/ext/minimap2/Makefile +132 -0
  10. data/ext/minimap2/Makefile.simde +97 -0
  11. data/ext/minimap2/NEWS.md +821 -0
  12. data/ext/minimap2/README.md +403 -0
  13. data/ext/minimap2/align.c +1020 -0
  14. data/ext/minimap2/bseq.c +169 -0
  15. data/ext/minimap2/bseq.h +64 -0
  16. data/ext/minimap2/code_of_conduct.md +30 -0
  17. data/ext/minimap2/cookbook.md +243 -0
  18. data/ext/minimap2/esterr.c +64 -0
  19. data/ext/minimap2/example.c +63 -0
  20. data/ext/minimap2/format.c +559 -0
  21. data/ext/minimap2/hit.c +466 -0
  22. data/ext/minimap2/index.c +775 -0
  23. data/ext/minimap2/kalloc.c +205 -0
  24. data/ext/minimap2/kalloc.h +76 -0
  25. data/ext/minimap2/kdq.h +132 -0
  26. data/ext/minimap2/ketopt.h +120 -0
  27. data/ext/minimap2/khash.h +615 -0
  28. data/ext/minimap2/krmq.h +474 -0
  29. data/ext/minimap2/kseq.h +256 -0
  30. data/ext/minimap2/ksort.h +153 -0
  31. data/ext/minimap2/ksw2.h +184 -0
  32. data/ext/minimap2/ksw2_dispatch.c +96 -0
  33. data/ext/minimap2/ksw2_extd2_sse.c +402 -0
  34. data/ext/minimap2/ksw2_exts2_sse.c +416 -0
  35. data/ext/minimap2/ksw2_extz2_sse.c +313 -0
  36. data/ext/minimap2/ksw2_ll_sse.c +152 -0
  37. data/ext/minimap2/kthread.c +159 -0
  38. data/ext/minimap2/kthread.h +15 -0
  39. data/ext/minimap2/kvec.h +105 -0
  40. data/ext/minimap2/lchain.c +369 -0
  41. data/ext/minimap2/main.c +459 -0
  42. data/ext/minimap2/map.c +714 -0
  43. data/ext/minimap2/minimap.h +410 -0
  44. data/ext/minimap2/minimap2.1 +725 -0
  45. data/ext/minimap2/misc/README.md +179 -0
  46. data/ext/minimap2/misc/mmphase.js +335 -0
  47. data/ext/minimap2/misc/paftools.js +3149 -0
  48. data/ext/minimap2/misc.c +162 -0
  49. data/ext/minimap2/mmpriv.h +132 -0
  50. data/ext/minimap2/options.c +234 -0
  51. data/ext/minimap2/pe.c +177 -0
  52. data/ext/minimap2/python/README.rst +196 -0
  53. data/ext/minimap2/python/cmappy.h +152 -0
  54. data/ext/minimap2/python/cmappy.pxd +153 -0
  55. data/ext/minimap2/python/mappy.pyx +273 -0
  56. data/ext/minimap2/python/minimap2.py +39 -0
  57. data/ext/minimap2/sdust.c +213 -0
  58. data/ext/minimap2/sdust.h +25 -0
  59. data/ext/minimap2/seed.c +131 -0
  60. data/ext/minimap2/setup.py +55 -0
  61. data/ext/minimap2/sketch.c +143 -0
  62. data/ext/minimap2/splitidx.c +84 -0
  63. data/ext/minimap2/sse2neon/emmintrin.h +1689 -0
  64. data/ext/minimap2/test/MT-human.fa +278 -0
  65. data/ext/minimap2/test/MT-orang.fa +276 -0
  66. data/ext/minimap2/test/q-inv.fa +4 -0
  67. data/ext/minimap2/test/q2.fa +2 -0
  68. data/ext/minimap2/test/t-inv.fa +127 -0
  69. data/ext/minimap2/test/t2.fa +2 -0
  70. data/ext/minimap2/tex/Makefile +21 -0
  71. data/ext/minimap2/tex/bioinfo.cls +930 -0
  72. data/ext/minimap2/tex/blasr-mc.eval +17 -0
  73. data/ext/minimap2/tex/bowtie2-s3.sam.eval +28 -0
  74. data/ext/minimap2/tex/bwa-s3.sam.eval +52 -0
  75. data/ext/minimap2/tex/bwa.eval +55 -0
  76. data/ext/minimap2/tex/eval2roc.pl +33 -0
  77. data/ext/minimap2/tex/graphmap.eval +4 -0
  78. data/ext/minimap2/tex/hs38-simu.sh +10 -0
  79. data/ext/minimap2/tex/minialign.eval +49 -0
  80. data/ext/minimap2/tex/minimap2.bib +460 -0
  81. data/ext/minimap2/tex/minimap2.tex +724 -0
  82. data/ext/minimap2/tex/mm2-s3.sam.eval +62 -0
  83. data/ext/minimap2/tex/mm2-update.tex +240 -0
  84. data/ext/minimap2/tex/mm2.approx.eval +12 -0
  85. data/ext/minimap2/tex/mm2.eval +13 -0
  86. data/ext/minimap2/tex/natbib.bst +1288 -0
  87. data/ext/minimap2/tex/natbib.sty +803 -0
  88. data/ext/minimap2/tex/ngmlr.eval +38 -0
  89. data/ext/minimap2/tex/roc.gp +60 -0
  90. data/ext/minimap2/tex/snap-s3.sam.eval +62 -0
  91. data/ext/minimap2.patch +19 -0
  92. data/lib/minimap2/aligner.rb +4 -4
  93. data/lib/minimap2/alignment.rb +11 -11
  94. data/lib/minimap2/ffi/constants.rb +20 -16
  95. data/lib/minimap2/ffi/functions.rb +5 -0
  96. data/lib/minimap2/ffi.rb +4 -5
  97. data/lib/minimap2/version.rb +2 -2
  98. data/lib/minimap2.rb +51 -15
  99. metadata +97 -79
  100. data/lib/minimap2/ffi_helper.rb +0 -53
  101. data/vendor/libminimap2.so +0 -0
@@ -0,0 +1,38 @@
1
+ Q 60 23616 0 0.000000000
2
+ Q 45 3520 1 0.000036851
3
+ Q 41 1840 1 0.000069023
4
+ Q 37 328 2 0.000136500
5
+ Q 36 276 1 0.000169033
6
+ Q 35 480 1 0.000199601
7
+ Q 33 375 2 0.000262855
8
+ Q 31 178 2 0.000326659
9
+ Q 30 153 5 0.000487551
10
+ Q 29 200 1 0.000516696
11
+ Q 27 100 3 0.000611601
12
+ Q 26 93 3 0.000706056
13
+ Q 25 75 2 0.000768393
14
+ Q 24 82 1 0.000798314
15
+ Q 23 80 6 0.000987387
16
+ Q 22 71 6 0.001175835
17
+ Q 21 76 7 0.001394921
18
+ Q 20 63 9 0.001676897
19
+ Q 19 55 4 0.001800322
20
+ Q 18 62 8 0.002048987
21
+ Q 17 55 7 0.002265718
22
+ Q 16 60 10 0.002575539
23
+ Q 15 82 9 0.002850877
24
+ Q 14 67 7 0.003063745
25
+ Q 13 62 11 0.003401042
26
+ Q 12 64 13 0.003799084
27
+ Q 11 56 5 0.003947900
28
+ Q 10 58 17 0.004468303
29
+ Q 9 70 22 0.005139796
30
+ Q 8 23 9 0.005414604
31
+ Q 7 41 17 0.005933068
32
+ Q 6 42 18 0.006480881
33
+ Q 5 33 9 0.006751757
34
+ Q 4 29 9 0.007022948
35
+ Q 3 27 15 0.007478764
36
+ Q 2 23 10 0.007781024
37
+ Q 1 9 2 0.007840364
38
+ Q 0 13 8 0.008083105
@@ -0,0 +1,60 @@
1
+ set t po eps enh co so "Helvetica,26"
2
+
3
+ set style line 1 lt 1 pt 1 lc rgb "#e41a1c" lw 2;
4
+ set style line 2 lt 1 pt 2 lc rgb "#377eb8" lw 2;
5
+ set style line 3 lt 1 pt 3 lc rgb "#4daf4a" lw 2;
6
+ set style line 4 lt 1 pt 4 lc rgb "#984ea3" lw 2;
7
+ set style line 5 lt 1 pt 6 lc rgb "#ff7f00" lw 2;
8
+ set style line 6 lt 1 pt 8 lc rgb "#f781bf" lw 2;
9
+
10
+ set out "roc-color.eps"
11
+
12
+ set pointsize 2.0
13
+ set size 1.59,1.04
14
+ set multiplot layout 1,2
15
+
16
+ set label "(a)" at graph -0.245,1.06 font "Helvetica-bold,40"
17
+ set xlab "Error rate of mapped PacBio reads"
18
+ set ylab "Fraction of mapped reads" off +1.8
19
+ set ytics 0.02
20
+ set yran [0.9:1]
21
+
22
+ set size 0.8,1
23
+ set log x
24
+ set format x "10^{%L}"
25
+ set key bot right
26
+ plot "<./eval2roc.pl blasr-mc.eval" u 2:3 t "blasr-mc" w lp ls 4, \
27
+ "<./eval2roc.pl bwa.eval" u 2:3 t "bwa-mem" w lp ls 2, \
28
+ "<./eval2roc.pl graphmap.eval" u 2:3 t "graphmap" w lp ls 3, \
29
+ "<./eval2roc.pl minialign.eval" u 2:3 t "minialign" w lp ls 1, \
30
+ "<./eval2roc.pl mm2.eval" u 2:3 t "minimap2" w lp ls 6, \
31
+ "<./eval2roc.pl ngmlr.eval" u 2:3 t "ngm-lr" w lp ls 5
32
+ unset label
33
+
34
+ set origin 0.8,0
35
+ set size 0.79,1
36
+ set label "(b)" at graph -0.245,1.06 font "Helvetica-bold,40"
37
+ set xlab "Error rate of mapped short reads"
38
+
39
+ set key top left
40
+ plot "<./eval2roc.pl -n2e7 bowtie2-s3.sam.eval" u 2:3 t "bowtie2" w lp ls 5, \
41
+ "<./eval2roc.pl -n2e7 bwa-s3.sam.eval" u 2:3 t "bwa-mem" w lp ls 2, \
42
+ "<./eval2roc.pl -n2e7 mm2-s3.sam.eval" u 2:3 t "minimap2" w lp ls 6, \
43
+ "<./eval2roc.pl -n2e7 snap-s3.sam.eval" u 2:3 t "snap" w lp ls 3
44
+
45
+ #unset log
46
+ #unset format
47
+ #unset key
48
+ #set log y
49
+ #set ylab "Accumulative mapping error rate" off +0
50
+ #set xlab "Mapping quality"
51
+ #set yran [1e-5:0.1]
52
+ #set ytics 1e-5,0.1
53
+ #set format y "10^{%L}"
54
+ #set xran [60:0] reverse
55
+ #plot "<./eval2roc.pl blasr-mc.eval" u 1:2 w lp ls 4, \
56
+ # "<./eval2roc.pl bwa.eval" u 1:2 t "bwa-mem" w lp ls 2, \
57
+ # "<./eval2roc.pl graphmap.eval" u 1:2 t "graphmap" w lp ls 3, \
58
+ # "<./eval2roc.pl minialign.eval" u 1:2 t "minialign" w lp ls 1, \
59
+ # "<./eval2roc.pl mm2.eval" u 1:2 t "minimap2" w lp ls 6, \
60
+ # "<./eval2roc.pl ngmlr.eval" u 1:2 t "ngm-lr" w lp ls 5
@@ -0,0 +1,62 @@
1
+ Q 60 18993268 10320 0.000543350 18993268
2
+ Q 59 33156 216 0.000553756 19026424
3
+ Q 58 29982 295 0.000568365 19056406
4
+ Q 57 9412 278 0.000582666 19065818
5
+ Q 56 11012 228 0.000594281 19076830
6
+ Q 55 9968 235 0.000606283 19086798
7
+ Q 54 8602 292 0.000621301 19095400
8
+ Q 53 6094 259 0.000634662 19101494
9
+ Q 52 5026 257 0.000647946 19106520
10
+ Q 51 4278 224 0.000659522 19110798
11
+ Q 50 3682 178 0.000668708 19114480
12
+ Q 49 2750 156 0.000676772 19117230
13
+ Q 48 2314 112 0.000682548 19119544
14
+ Q 47 2056 96 0.000687495 19121600
15
+ Q 46 1658 62 0.000690677 19123258
16
+ Q 45 1492 74 0.000694493 19124750
17
+ Q 44 1150 56 0.000697379 19125900
18
+ Q 43 1062 48 0.000699850 19126962
19
+ Q 42 976 60 0.000702951 19127938
20
+ Q 41 884 36 0.000704800 19128822
21
+ Q 40 708 52 0.000707493 19129530
22
+ Q 39 870 26 0.000708819 19130400
23
+ Q 38 598 26 0.000710156 19130998
24
+ Q 37 542 34 0.000711913 19131540
25
+ Q 36 846 50 0.000714495 19132386
26
+ Q 35 590 50 0.000717087 19132976
27
+ Q 34 550 42 0.000719261 19133526
28
+ Q 33 2174 66 0.000722628 19135700
29
+ Q 32 876 86 0.000727089 19136576
30
+ Q 31 638 104 0.000732500 19137214
31
+ Q 30 1718 196 0.000742675 19138932
32
+ Q 29 91022 968 0.000789497 19229954
33
+ Q 28 12864 781 0.000829556 19242818
34
+ Q 27 5806 427 0.000851489 19248624
35
+ Q 26 25274 728 0.000888144 19273898
36
+ Q 25 7418 680 0.000923070 19281316
37
+ Q 24 11800 701 0.000958839 19293116
38
+ Q 23 57328 3933 0.001159250 19350444
39
+ Q 22 7662 846 0.001202494 19358106
40
+ Q 21 5924 617 0.001233989 19364030
41
+ Q 20 4623 574 0.001263330 19368653
42
+ Q 19 4988 942 0.001311627 19373641
43
+ Q 18 3968 793 0.001352282 19377609
44
+ Q 17 3630 681 0.001387166 19381239
45
+ Q 16 2921 513 0.001413422 19384160
46
+ Q 15 2716 424 0.001435095 19386876
47
+ Q 14 2366 365 0.001453744 19389242
48
+ Q 13 2169 412 0.001474828 19391411
49
+ Q 12 2077 360 0.001493233 19393488
50
+ Q 11 2016 441 0.001515815 19395504
51
+ Q 10 2292 738 0.001553682 19397796
52
+ Q 9 4165 1832 0.001647772 19401961
53
+ Q 8 3963 1862 0.001743385 19405924
54
+ Q 7 3927 1793 0.001835408 19409851
55
+ Q 6 3572 1639 0.001919497 19413423
56
+ Q 5 3270 1533 0.001998126 19416693
57
+ Q 4 3046 1610 0.002080718 19419739
58
+ Q 3 251447 125550 0.008436553 19671186
59
+ Q 2 24390 13537 0.009113417 19695576
60
+ Q 1 124406 86780 0.013434624 19819982
61
+ Q 0 171254 153874 0.021016609 19991236
62
+ U 8764
@@ -0,0 +1,19 @@
1
+ --- Makefile.org 2021-05-27 15:45:11.993128205 +0900
2
+ +++ Makefile 2021-05-27 15:46:02.320569154 +0900
3
+ @@ -1,9 +1,9 @@
4
+ -CFLAGS= -g -Wall -O2 -Wc++-compat #-Wextra
5
+ +CFLAGS= -g -Wall -O2 -Wc++-compat -fPIC #-Wextra
6
+ CPPFLAGS= -DHAVE_KALLOC
7
+ INCLUDES=
8
+ OBJS= kthread.o kalloc.o misc.o bseq.o sketch.o sdust.o options.o index.o \
9
+ lchain.o align.o hit.o seed.o map.o format.o pe.o esterr.o splitidx.o \
10
+ - ksw2_ll_sse.o
11
+ + ksw2_ll_sse.o cmappy.o
12
+ PROG= minimap2
13
+ PROG_EXTRA= sdust minimap2-lite
14
+ LIBS= -lm -lz -lpthread
15
+ @@ -130,3 +130,4 @@ sdust.o: kalloc.h kdq.h kvec.h sdust.h
16
+ seed.o: mmpriv.h minimap.h bseq.h kseq.h kalloc.h ksort.h
17
+ sketch.o: kvec.h kalloc.h mmpriv.h minimap.h bseq.h kseq.h
18
+ splitidx.o: mmpriv.h minimap.h bseq.h kseq.h
19
+ +cmappy.o: cmappy.h
@@ -90,7 +90,7 @@ module Minimap2
90
90
  end
91
91
 
92
92
  if fn_idx_in
93
- warn 'Since fn_idx_in is specified, the seq argument will be ignored.' if seq
93
+ warn "Since fn_idx_in is specified, the seq argument will be ignored." if seq
94
94
  reader = FFI.mm_idx_reader_open(fn_idx_in, idx_opt, fn_idx_out)
95
95
 
96
96
  # The Ruby version raises an error here
@@ -169,13 +169,13 @@ module Minimap2
169
169
  c = hit[:cigar32].read_array_of_uint32(hit[:n_cigar32])
170
170
  cigar = c.map { |x| [x >> 4, x & 0xf] } # 32-bit CIGAR encoding -> Ruby array
171
171
 
172
- _cs = ''
172
+ _cs = ""
173
173
  if cs
174
174
  l_cs_str = FFI.mm_gen_cs(km, cs_str, m_cs_str, @index, regs[i], seq, 1)
175
175
  _cs = cs_str.read_pointer.read_string(l_cs_str)
176
176
  end
177
177
 
178
- _md = ''
178
+ _md = ""
179
179
  if md
180
180
  l_cs_str = FFI.mm_gen_md(km, cs_str, m_cs_str, @index, regs[i], seq)
181
181
  _md = cs_str.read_pointer.read_string(l_cs_str)
@@ -204,7 +204,7 @@ module Minimap2
204
204
  lp = ::FFI::MemoryPointer.new(:int)
205
205
  s = FFI.mappy_fetch_seq(index, name, start, stop, lp)
206
206
  l = lp.read_int
207
- return nil if l.zero?
207
+ return nil if l == 0
208
208
 
209
209
  s.read_string(l)
210
210
  end
@@ -89,20 +89,20 @@ module Minimap2
89
89
  # Convert to the PAF format without the QueryName and QueryLength columns.
90
90
 
91
91
  def to_s
92
- strand = if @strand.positive?
93
- '+'
94
- elsif @strand.negative?
95
- '-'
92
+ strand = if @strand > 0
93
+ "+"
94
+ elsif @strand < 0
95
+ "-"
96
96
  else
97
- '?'
97
+ "?"
98
98
  end
99
- tp = @primary != 0 ? 'tp:A:P' : 'tp:A:S'
100
- ts = if @trans_strand.positive?
101
- 'ts:A:+'
102
- elsif @trans_strand.negative?
103
- 'ts:A:-'
99
+ tp = @primary != 0 ? "tp:A:P" : "tp:A:S"
100
+ ts = if @trans_strand > 0
101
+ "ts:A:+"
102
+ elsif @trans_strand < 0
103
+ "ts:A:-"
104
104
  else
105
- 'ts:A:.'
105
+ "ts:A:."
106
106
  end
107
107
  a = [@q_st, @q_en, strand, @ctg, @ctg_len, @r_st, @r_en,
108
108
  @mlen, @blen, @mapq, tp, ts, "cg:Z:#{@cigar_str}"]
@@ -36,7 +36,8 @@ module Minimap2
36
36
  SAM_HIT_ONLY = 0x40000000
37
37
  RMQ = 0x80000000 # LL
38
38
  QSTRAND = 0x100000000 # LL
39
- NO_INV = 0x200000000
39
+ NO_INV = 0x200000000 # LL
40
+ NO_HASH_NAME = 0x400000000 # LL
40
41
 
41
42
  HPC = 0x1
42
43
  NO_SEQ = 0x2
@@ -56,7 +57,7 @@ module Minimap2
56
57
  CIGAR_EQ_MATCH = 7
57
58
  CIGAR_X_MISMATCH = 8
58
59
 
59
- CIGAR_STR = 'MIDNSHP=XB'
60
+ CIGAR_STR = "MIDNSHP=XB"
60
61
 
61
62
  # emulate 128-bit integers
62
63
  class MM128 < ::FFI::Struct
@@ -101,6 +102,7 @@ module Minimap2
101
102
  :min_cnt, :int, # min number of minimizers on each chain
102
103
  :min_chain_score, :int, # min chaining score
103
104
  :chain_gap_scale, :float,
105
+ :chain_skip_scale, :float,
104
106
  :rmq_size_cap, :int,
105
107
  :rmq_inner_dist, :int,
106
108
  :rmq_rescue_size, :int,
@@ -132,6 +134,7 @@ module Minimap2
132
134
  :pe_ori, :int,
133
135
  :pe_bonus, :int,
134
136
  :mid_occ_frac, :float, # only used by mm_mapopt_update(); see below
137
+ :q_occ_frac, :float,
135
138
  :min_mid_occ, :int32_t,
136
139
  :mid_occ, :int32_t, # ignore seeds with occurrences above this threshold
137
140
  :max_occ, :int32_t,
@@ -188,7 +191,7 @@ module Minimap2
188
191
  :n_ambi_trans_strand, :uint32,
189
192
  :n_cigar, :uint32
190
193
 
191
- bitfields :n_ambi_trans_strand,
194
+ bit_field :n_ambi_trans_strand,
192
195
  :n_ambi, 30, # number of ambiguous bases
193
196
  :trans_strand, 2 # transcript strand: 0 for unknown, 1 for +, 2 for -
194
197
 
@@ -220,19 +223,20 @@ module Minimap2
220
223
  :div, :float,
221
224
  :p, Extra.ptr
222
225
 
223
- bitfields :fields,
224
- :mapq, 8,
225
- :split, 2,
226
- :rev, 1,
227
- :inv, 1,
228
- :sam_pri, 1,
229
- :proper_frag, 1,
230
- :pe_thru, 1,
231
- :seg_split, 1,
232
- :seg_id, 8,
233
- :split_inv, 1,
234
- :is_alt, 1,
235
- :dummy, 6
226
+ bit_field :fields,
227
+ :mapq, 8,
228
+ :split, 2,
229
+ :rev, 1,
230
+ :inv, 1,
231
+ :sam_pri, 1,
232
+ :proper_frag, 1,
233
+ :pe_thru, 1,
234
+ :seg_split, 1,
235
+ :seg_id, 8,
236
+ :split_inv, 1,
237
+ :is_alt, 1,
238
+ :strand_retained, 1,
239
+ :dummy, 5
236
240
  end
237
241
 
238
242
  # memory buffer for thread-local storage during mapping
@@ -2,6 +2,11 @@
2
2
 
3
3
  module Minimap2
4
4
  module FFI
5
+ attach_function \
6
+ :main,
7
+ %i[int pointer],
8
+ :int
9
+
5
10
  attach_function \
6
11
  :mm_set_opt_raw, :mm_set_opt,
7
12
  [:pointer, IdxOpt.by_ref, MapOpt.by_ref],
data/lib/minimap2/ffi.rb CHANGED
@@ -1,8 +1,7 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  # bit fields
4
- require_relative 'ffi_helper'
5
-
4
+ require "ffi/bit_struct"
6
5
  module Minimap2
7
6
  # Native APIs
8
7
  module FFI
@@ -22,6 +21,6 @@ module Minimap2
22
21
  end
23
22
  end
24
23
 
25
- require_relative 'ffi/constants'
26
- require_relative 'ffi/functions'
27
- require_relative 'ffi/mappy'
24
+ require_relative "ffi/constants"
25
+ require_relative "ffi/functions"
26
+ require_relative "ffi/mappy"
@@ -1,6 +1,6 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  module Minimap2
4
- # Minimap2-2.22 (r1101)
5
- VERSION = '0.2.22.0'
4
+ # Minimap2-2.23 (r1111)
5
+ VERSION = "0.2.24.1"
6
6
  end
data/lib/minimap2.rb CHANGED
@@ -1,15 +1,12 @@
1
1
  # frozen_string_literal: true
2
2
 
3
3
  # dependencies
4
- require 'ffi'
5
-
6
- # bit fields
7
- require_relative 'minimap2/ffi_helper'
4
+ require "ffi"
8
5
 
9
6
  # modules
10
- require_relative 'minimap2/aligner'
11
- require_relative 'minimap2/alignment'
12
- require_relative 'minimap2/version'
7
+ require_relative "minimap2/aligner"
8
+ require_relative "minimap2/alignment"
9
+ require_relative "minimap2/version"
13
10
 
14
11
  # Minimap2 mapper for long read sequences
15
12
  # https://github.com/lh3/minimap2
@@ -22,22 +19,56 @@ module Minimap2
22
19
  attr_accessor :ffi_lib
23
20
  end
24
21
 
25
- lib_name = ::FFI.map_library_name('minimap2')
26
- self.ffi_lib = if ENV['MINIMAPDIR']
27
- File.expand_path(lib_name, ENV['MINIMAPDIR'])
22
+ lib_name = ::FFI.map_library_name("minimap2")
23
+ self.ffi_lib = if ENV["MINIMAPDIR"]
24
+ File.expand_path(lib_name, ENV["MINIMAPDIR"])
28
25
  else
29
26
  File.expand_path("../vendor/#{lib_name}", __dir__)
30
27
  end
31
28
 
32
29
  # friendlier error message
33
- autoload :FFI, 'minimap2/ffi'
30
+ autoload :FFI, "minimap2/ffi"
34
31
 
35
32
  # methods from mappy
36
33
  class << self
34
+ # Execute minimap2 comannd with given options.
35
+ # @overload execute(arg0,arg1,...)
36
+ # @param [String] arg minimap2 command option.
37
+ # @example Get minimap2 version
38
+ # Minimap2.execute('--version')
39
+
40
+ def Minimap2.execute(*rb_argv)
41
+ str_ptrs = []
42
+ # First argument is the program name.
43
+ str_ptrs << ::FFI::MemoryPointer.from_string("minimap2")
44
+ rb_argv.each do |arg|
45
+ arg.to_s.split(/\s+/).each do |s|
46
+ str_ptrs << ::FFI::MemoryPointer.from_string(s)
47
+ end
48
+ end
49
+ str_ptrs << nil
50
+
51
+ # Load all the pointers into a native memory block
52
+ argv = ::FFI::MemoryPointer.new(:pointer, str_ptrs.length)
53
+ str_ptrs.each_with_index do |p, i|
54
+ argv[i].put_pointer(0, p)
55
+ end
56
+
57
+ FFI.main(str_ptrs.length - 1, argv)
58
+ end
59
+
60
+ # Get verbosity level.
61
+ # @return [Integer] verbosity level.
62
+
63
+ def verbose
64
+ FFI.mm_verbose_level(-1)
65
+ end
66
+
37
67
  # Set verbosity level.
38
- # @param [Integer] level
68
+ # @param [Integer] verbosity level
69
+ # @return [Integer] verbosity level.
39
70
 
40
- def verbose(level = -1)
71
+ def verbose=(level)
41
72
  FFI.mm_verbose_level(level)
42
73
  end
43
74
 
@@ -50,7 +81,12 @@ module Minimap2
50
81
 
51
82
  def fastx_read(file_path, comment: false, &block)
52
83
  path = File.expand_path(file_path)
84
+
85
+ # raise error in Ruby because ks.null? is false even if file not exist.
86
+ raise ArgumentError, "File not found: #{path}" unless File.exist?(path)
87
+
53
88
  ks = FFI.mm_fastx_open(path)
89
+
54
90
  if block_given?
55
91
  fastx_each(ks, comment, &block)
56
92
  else
@@ -80,11 +116,11 @@ module Minimap2
80
116
  end
81
117
 
82
118
  def fastx_next(ks, read_comment)
83
- qual = ks[:qual][:s] if (ks[:qual][:l]).positive?
119
+ qual = ks[:qual][:s] if (ks[:qual][:l]) > 0
84
120
  name = ks[:name][:s]
85
121
  seq = ks[:seq][:s]
86
122
  if read_comment
87
- comment = ks[:comment][:s] if (ks[:comment][:l]).positive?
123
+ comment = ks[:comment][:s] if (ks[:comment][:l]) > 0
88
124
  [name, seq, qual, comment]
89
125
  else
90
126
  [name, seq, qual]