minimap2 0.2.22.0 → 0.2.24.1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (101) hide show
  1. checksums.yaml +4 -4
  2. data/README.md +60 -76
  3. data/ext/Rakefile +55 -0
  4. data/ext/cmappy/cmappy.c +129 -0
  5. data/ext/cmappy/cmappy.h +44 -0
  6. data/ext/minimap2/FAQ.md +46 -0
  7. data/ext/minimap2/LICENSE.txt +24 -0
  8. data/ext/minimap2/MANIFEST.in +10 -0
  9. data/ext/minimap2/Makefile +132 -0
  10. data/ext/minimap2/Makefile.simde +97 -0
  11. data/ext/minimap2/NEWS.md +821 -0
  12. data/ext/minimap2/README.md +403 -0
  13. data/ext/minimap2/align.c +1020 -0
  14. data/ext/minimap2/bseq.c +169 -0
  15. data/ext/minimap2/bseq.h +64 -0
  16. data/ext/minimap2/code_of_conduct.md +30 -0
  17. data/ext/minimap2/cookbook.md +243 -0
  18. data/ext/minimap2/esterr.c +64 -0
  19. data/ext/minimap2/example.c +63 -0
  20. data/ext/minimap2/format.c +559 -0
  21. data/ext/minimap2/hit.c +466 -0
  22. data/ext/minimap2/index.c +775 -0
  23. data/ext/minimap2/kalloc.c +205 -0
  24. data/ext/minimap2/kalloc.h +76 -0
  25. data/ext/minimap2/kdq.h +132 -0
  26. data/ext/minimap2/ketopt.h +120 -0
  27. data/ext/minimap2/khash.h +615 -0
  28. data/ext/minimap2/krmq.h +474 -0
  29. data/ext/minimap2/kseq.h +256 -0
  30. data/ext/minimap2/ksort.h +153 -0
  31. data/ext/minimap2/ksw2.h +184 -0
  32. data/ext/minimap2/ksw2_dispatch.c +96 -0
  33. data/ext/minimap2/ksw2_extd2_sse.c +402 -0
  34. data/ext/minimap2/ksw2_exts2_sse.c +416 -0
  35. data/ext/minimap2/ksw2_extz2_sse.c +313 -0
  36. data/ext/minimap2/ksw2_ll_sse.c +152 -0
  37. data/ext/minimap2/kthread.c +159 -0
  38. data/ext/minimap2/kthread.h +15 -0
  39. data/ext/minimap2/kvec.h +105 -0
  40. data/ext/minimap2/lchain.c +369 -0
  41. data/ext/minimap2/main.c +459 -0
  42. data/ext/minimap2/map.c +714 -0
  43. data/ext/minimap2/minimap.h +410 -0
  44. data/ext/minimap2/minimap2.1 +725 -0
  45. data/ext/minimap2/misc/README.md +179 -0
  46. data/ext/minimap2/misc/mmphase.js +335 -0
  47. data/ext/minimap2/misc/paftools.js +3149 -0
  48. data/ext/minimap2/misc.c +162 -0
  49. data/ext/minimap2/mmpriv.h +132 -0
  50. data/ext/minimap2/options.c +234 -0
  51. data/ext/minimap2/pe.c +177 -0
  52. data/ext/minimap2/python/README.rst +196 -0
  53. data/ext/minimap2/python/cmappy.h +152 -0
  54. data/ext/minimap2/python/cmappy.pxd +153 -0
  55. data/ext/minimap2/python/mappy.pyx +273 -0
  56. data/ext/minimap2/python/minimap2.py +39 -0
  57. data/ext/minimap2/sdust.c +213 -0
  58. data/ext/minimap2/sdust.h +25 -0
  59. data/ext/minimap2/seed.c +131 -0
  60. data/ext/minimap2/setup.py +55 -0
  61. data/ext/minimap2/sketch.c +143 -0
  62. data/ext/minimap2/splitidx.c +84 -0
  63. data/ext/minimap2/sse2neon/emmintrin.h +1689 -0
  64. data/ext/minimap2/test/MT-human.fa +278 -0
  65. data/ext/minimap2/test/MT-orang.fa +276 -0
  66. data/ext/minimap2/test/q-inv.fa +4 -0
  67. data/ext/minimap2/test/q2.fa +2 -0
  68. data/ext/minimap2/test/t-inv.fa +127 -0
  69. data/ext/minimap2/test/t2.fa +2 -0
  70. data/ext/minimap2/tex/Makefile +21 -0
  71. data/ext/minimap2/tex/bioinfo.cls +930 -0
  72. data/ext/minimap2/tex/blasr-mc.eval +17 -0
  73. data/ext/minimap2/tex/bowtie2-s3.sam.eval +28 -0
  74. data/ext/minimap2/tex/bwa-s3.sam.eval +52 -0
  75. data/ext/minimap2/tex/bwa.eval +55 -0
  76. data/ext/minimap2/tex/eval2roc.pl +33 -0
  77. data/ext/minimap2/tex/graphmap.eval +4 -0
  78. data/ext/minimap2/tex/hs38-simu.sh +10 -0
  79. data/ext/minimap2/tex/minialign.eval +49 -0
  80. data/ext/minimap2/tex/minimap2.bib +460 -0
  81. data/ext/minimap2/tex/minimap2.tex +724 -0
  82. data/ext/minimap2/tex/mm2-s3.sam.eval +62 -0
  83. data/ext/minimap2/tex/mm2-update.tex +240 -0
  84. data/ext/minimap2/tex/mm2.approx.eval +12 -0
  85. data/ext/minimap2/tex/mm2.eval +13 -0
  86. data/ext/minimap2/tex/natbib.bst +1288 -0
  87. data/ext/minimap2/tex/natbib.sty +803 -0
  88. data/ext/minimap2/tex/ngmlr.eval +38 -0
  89. data/ext/minimap2/tex/roc.gp +60 -0
  90. data/ext/minimap2/tex/snap-s3.sam.eval +62 -0
  91. data/ext/minimap2.patch +19 -0
  92. data/lib/minimap2/aligner.rb +4 -4
  93. data/lib/minimap2/alignment.rb +11 -11
  94. data/lib/minimap2/ffi/constants.rb +20 -16
  95. data/lib/minimap2/ffi/functions.rb +5 -0
  96. data/lib/minimap2/ffi.rb +4 -5
  97. data/lib/minimap2/version.rb +2 -2
  98. data/lib/minimap2.rb +51 -15
  99. metadata +97 -79
  100. data/lib/minimap2/ffi_helper.rb +0 -53
  101. data/vendor/libminimap2.so +0 -0
@@ -0,0 +1,460 @@
1
+ @article{Chaisson:2012aa,
2
+ Author = {Chaisson, Mark J and Tesler, Glenn},
3
+ Journal = {BMC Bioinformatics},
4
+ Pages = {238},
5
+ Title = {{Mapping single molecule sequencing reads using basic local alignment with successive refinement (BLASR): application and theory}},
6
+ Volume = {13},
7
+ Year = {2012}}
8
+
9
+ @article{Liu:2016ab,
10
+ Author = {Liu, Bo and others},
11
+ Journal = {Bioinformatics},
12
+ Pages = {1625-31},
13
+ Title = {{rHAT}: fast alignment of noisy long reads with regional hashing},
14
+ Volume = {32},
15
+ Year = {2016}}
16
+
17
+ @article{Liu:2017aa,
18
+ Author = {Liu, Bo and others},
19
+ Journal = {Bioinformatics},
20
+ Pages = {192-201},
21
+ Title = {{LAMSA}: fast split read alignment with long approximate matches},
22
+ Volume = {33},
23
+ Year = {2017}}
24
+
25
+ @article{Lin:2017aa,
26
+ Author = {Lin, Hsin-Nan and Hsu, Wen-Lian},
27
+ Journal = {Bioinformatics},
28
+ Title = {Kart: a divide-and-conquer algorithm for {NGS} read alignment},
29
+ Year = {2017}}
30
+
31
+ @article{Li:2013aa,
32
+ Author = {Li, Heng},
33
+ Journal = {arXiv:1303.3997},
34
+ Title = {Aligning sequence reads, clone sequences and assembly contigs with {BWA-MEM}},
35
+ archivePrefix = "arXiv",
36
+ eprint = {1303.3997},
37
+ primaryClass = "q-bio",
38
+ Year = {2013}}
39
+
40
+ @article{Sovic:2016aa,
41
+ Author = {Sovi{\'c}, Ivan and others},
42
+ Journal = {Nat Commun},
43
+ Pages = {11307},
44
+ Title = {Fast and sensitive mapping of nanopore sequencing reads with {GraphMap}},
45
+ Volume = {7},
46
+ Year = {2016}}
47
+
48
+ @article{Langmead:2012fk,
49
+ Author = {Langmead, Ben and Salzberg, Steven L},
50
+ Journal = {Nat Methods},
51
+ Pages = {357-9},
52
+ Title = {Fast gapped-read alignment with {Bowtie} 2},
53
+ Volume = {9},
54
+ Year = {2012}}
55
+
56
+ @article{Li:2016aa,
57
+ Author = {Li, Heng},
58
+ Journal = {Bioinformatics},
59
+ Pages = {2103-10},
60
+ Title = {Minimap and miniasm: fast mapping and de novo assembly for noisy long sequences},
61
+ Volume = {32},
62
+ Year = {2016}}
63
+
64
+ @misc{Ruan:2016,
65
+ title = {Ultra-fast de novo assembler using long noisy reads},
66
+ author = {Jue Ruan},
67
+ journal = {Unpublished},
68
+ howpublished = {\href{https://github.com/ruanjue/smartdenovo}{https://github.com/ruanjue/smartdenovo}},
69
+ year = {2016}}
70
+
71
+ @article{Miller:1988aa,
72
+ Author = {Miller, W and Myers, E W},
73
+ Journal = {Bull Math Biol},
74
+ Number = {2},
75
+ Pages = {97-120},
76
+ Title = {Sequence comparison with concave weighting functions},
77
+ Volume = {50},
78
+ Year = {1988}}
79
+
80
+ @article{Gotoh:1990aa,
81
+ Author = {Gotoh, O},
82
+ Journal = {Bull Math Biol},
83
+ Pages = {359-73},
84
+ Title = {Optimal sequence alignment allowing for long gaps},
85
+ Volume = {52},
86
+ Year = {1990}}
87
+
88
+ @article{Wu:1996aa,
89
+ Author = {Wu, Sun and others},
90
+ Journal = {Algorithmica},
91
+ Pages = {50-67},
92
+ Title = {A subquadratic algorithm for approximate limited expression matching},
93
+ Volume = {15},
94
+ Year = {1996}}
95
+
96
+ @article{Daily:2016aa,
97
+ Author = {Daily, Jeff},
98
+ Journal = {BMC Bioinformatics},
99
+ Month = {Feb},
100
+ Pages = {81},
101
+ Title = {Parasail: {SIMD C} library for global, semi-global, and local pairwise sequence alignments},
102
+ Volume = {17},
103
+ Year = {2016}}
104
+
105
+ @article{Sedlazeck169557,
106
+ author = {Sedlazeck, Fritz J and others},
107
+ title = {Accurate detection of complex structural variations using single molecule sequencing},
108
+ note = {doi:10.1101/169557},
109
+ journal = {bioRxiv},
110
+ year = {2017}}
111
+
112
+ @article{Altschul:1997vn,
113
+ Author = {Altschul, S F and others},
114
+ Journal = {Nucleic Acids Res},
115
+ Pages = {3389-402},
116
+ Title = {Gapped {BLAST} and {PSI-BLAST}: a new generation of protein database search programs},
117
+ Volume = {25},
118
+ Year = {1997}}
119
+
120
+ @article{Sosic:2017aa,
121
+ Author = {{\v S}o{\v s}i\'{c}, Martin and {\v S}iki\'{c}, Mile},
122
+ Journal = {Bioinformatics},
123
+ Pages = {1394-1395},
124
+ Title = {Edlib: a {C/C++} library for fast, exact sequence alignment using edit distance},
125
+ Volume = {33},
126
+ Year = {2017}}
127
+
128
+ @article{Abouelhoda:2005aa,
129
+ Author = {Mohamed Ibrahim Abouelhoda and Enno Ohlebusch},
130
+ Journal = {J. Discrete Algorithms},
131
+ Pages = {321-41},
132
+ Title = {Chaining algorithms for multiple genome comparison},
133
+ Volume = {3},
134
+ Year = {2005}}
135
+
136
+ @article{Ono:2013aa,
137
+ Author = {Ono, Yukiteru and others},
138
+ Journal = {Bioinformatics},
139
+ Pages = {119-21},
140
+ Title = {{PBSIM}: {PacBio} reads simulator--toward accurate genome assembly},
141
+ Volume = {29},
142
+ Year = {2013}}
143
+
144
+ @article {Jain128835,
145
+ author = {Jain, Miten and others},
146
+ title = {Nanopore sequencing and assembly of a human genome with ultra-long reads},
147
+ year = {2017},
148
+ note = {doi:10.1101/128835},
149
+ publisher = {Cold Spring Harbor Labs Journals},
150
+ journal = {bioRxiv}}
151
+
152
+ @article{Lau:2016aa,
153
+ Author = {Lau, Bayo and others},
154
+ Journal = {Bioinformatics},
155
+ Pages = {3829-3832},
156
+ Title = {{LongISLND}: in silico sequencing of lengthy and noisy datatypes},
157
+ Volume = {32},
158
+ Year = {2016}}
159
+
160
+ @article{Robinson:2011aa,
161
+ Author = {Robinson, James T and others},
162
+ Journal = {Nat Biotechnol},
163
+ Pages = {24-6},
164
+ Title = {Integrative genomics viewer},
165
+ Volume = {29},
166
+ Year = {2011}}
167
+
168
+ @article{Gotoh:1982aa,
169
+ Author = {Gotoh, O},
170
+ Journal = {J Mol Biol},
171
+ Pages = {705-8},
172
+ Title = {An improved algorithm for matching biological sequences},
173
+ Volume = {162},
174
+ Year = {1982}}
175
+
176
+ @article{Altschul:1986aa,
177
+ Author = {Altschul, S F and Erickson, B W},
178
+ Journal = {Bull Math Biol},
179
+ Pages = {603-16},
180
+ Title = {Optimal sequence alignment using affine gap costs},
181
+ Volume = {48},
182
+ Year = {1986}}
183
+
184
+ @article{Wu:2005vn,
185
+ Author = {Wu, Thomas D and Watanabe, Colin K},
186
+ Journal = {Bioinformatics},
187
+ Pages = {1859-75},
188
+ Title = {{GMAP}: a genomic mapping and alignment program for {mRNA} and {EST} sequences},
189
+ Volume = {21},
190
+ Year = {2005}}
191
+
192
+ @article{Iwata:2012aa,
193
+ Author = {Iwata, Hiroaki and Gotoh, Osamu},
194
+ Journal = {Nucleic Acids Res},
195
+ Pages = {e161},
196
+ Title = {Benchmarking spliced alignment programs including {Spaln2}, an extended version of {Spaln} that incorporates additional species-specific features},
197
+ Volume = {40},
198
+ Year = {2012}}
199
+
200
+ @article{Dobin:2013kx,
201
+ Author = {Dobin, Alexander and others},
202
+ Journal = {Bioinformatics},
203
+ Pages = {15-21},
204
+ Title = {{STAR}: ultrafast universal {RNA-seq} aligner},
205
+ Volume = {29},
206
+ Year = {2013}}
207
+
208
+ @article{Byrne:2017aa,
209
+ Author = {Byrne, Ashley and others},
210
+ Journal = {Nat Commun},
211
+ Pages = {16027},
212
+ Title = {Nanopore long-read {RNAseq} reveals widespread transcriptional variation among the surface receptors of individual {B} cells},
213
+ Volume = {8},
214
+ Year = {2017}}
215
+
216
+ @article{Roberts:2004fv,
217
+ Author = {Roberts, Michael and others},
218
+ Journal = {Bioinformatics},
219
+ Pages = {3363-9},
220
+ Title = {Reducing storage requirements for biological sequence comparison},
221
+ Volume = {20},
222
+ Year = {2004}}
223
+
224
+ @article{Zhang:2006aa,
225
+ Author = {Zhang, Miao and Gish, Warren},
226
+ Journal = {Bioinformatics},
227
+ Pages = {13-20},
228
+ Title = {Improved spliced alignment from an information theoretic approach},
229
+ Volume = {22},
230
+ Year = {2006}}
231
+
232
+ @article{Li:2007aa,
233
+ Author = {Li, Heng and others},
234
+ Journal = {BMC Bioinformatics},
235
+ Pages = {349},
236
+ Title = {A cross-species alignment tool {(CAT)}},
237
+ Volume = {8},
238
+ Year = {2007}}
239
+
240
+ @article{Farrar:2007hs,
241
+ Author = {Farrar, Michael},
242
+ Journal = {Bioinformatics},
243
+ Pages = {156-61},
244
+ Title = {{Striped Smith-Waterman speeds database searches six times over other SIMD implementations}},
245
+ Volume = {23},
246
+ Year = {2007}}
247
+
248
+ @techreport{Holtgrewe:2010aa,
249
+ Address = {Freie Universit{\"a}t Berlin},
250
+ Author = {Holtgrewe, M.},
251
+ Institution = {Institut f{\"u}r Mathematik und Informatik},
252
+ Number = {TR-B-10-06},
253
+ Title = {Mason -- a read simulator for second generation sequencing data},
254
+ Year = {2010}}
255
+
256
+ @article{Zaharia:2011aa,
257
+ Author = {Zaharia, Matei and others},
258
+ Journal = {arXiv:1111.5572},
259
+ Title = {Faster and More Accurate Sequence Alignment with {SNAP}},
260
+ Year = {2011}}
261
+
262
+ @article{Irimia:2008aa,
263
+ Author = {Irimia, Manuel and Roy, Scott William},
264
+ Journal = {PLoS Genet},
265
+ Pages = {e1000148},
266
+ Title = {Evolutionary convergence on highly-conserved 3' intron structures in intron-poor eukaryotes and insights into the ancestral eukaryotic genome},
267
+ Volume = {4},
268
+ Year = {2008}}
269
+
270
+ @article{Depristo:2011vn,
271
+ Author = {Depristo, Mark A and others},
272
+ Journal = {Nat Genet},
273
+ Pages = {491-8},
274
+ Title = {A framework for variation discovery and genotyping using next-generation {DNA} sequencing data},
275
+ Volume = {43},
276
+ Year = {2011}}
277
+
278
+ @article{Kurtz:2004zr,
279
+ Author = {Kurtz, Stefan and others},
280
+ Journal = {Genome Biol},
281
+ Pages = {R12},
282
+ Title = {Versatile and open software for comparing large genomes},
283
+ Volume = {5},
284
+ Year = {2004}}
285
+
286
+ @article {Li223297,
287
+ author = {Li, Heng and others},
288
+ title = {New synthetic-diploid benchmark for accurate variant calling evaluation},
289
+ year = {2017},
290
+ note = {doi:10.1101/223297},
291
+ journal = {bioRxiv}
292
+ }
293
+
294
+ @article{Berlin:2015xy,
295
+ Author = {Berlin, Konstantin and others},
296
+ Journal = {Nat Biotechnol},
297
+ Pages = {623-30},
298
+ Title = {Assembling large genomes with single-molecule sequencing and locality-sensitive hashing},
299
+ Volume = {33},
300
+ Year = {2015}}
301
+
302
+ @article{Gurevich:2013aa,
303
+ Author = {Gurevich, Alexey and others},
304
+ Journal = {Bioinformatics},
305
+ Pages = {1072-5},
306
+ Title = {{QUAST}: quality assessment tool for genome assemblies},
307
+ Volume = {29},
308
+ Year = {2013}}
309
+
310
+ @article{Li:2010fk,
311
+ Author = {Li, Heng and Durbin, Richard},
312
+ Journal = {Bioinformatics},
313
+ Pages = {589-95},
314
+ Title = {Fast and accurate long-read alignment with {Burrows-Wheeler} transform},
315
+ Volume = {26},
316
+ Year = {2010}}
317
+
318
+ @article{Marcais:2018aa,
319
+ Author = {Mar{\c c}ais, Guillaume and others},
320
+ Journal = {PLoS Comput Biol},
321
+ Pages = {e1005944},
322
+ Title = {{MUMmer4}: A fast and versatile genome alignment system},
323
+ Volume = {14},
324
+ Year = {2018}}
325
+
326
+ @article{Li:2009ys,
327
+ Author = {Li, Heng and others},
328
+ Journal = {Bioinformatics},
329
+ Pages = {2078-9},
330
+ Title = {The {Sequence Alignment/Map format and SAMtools}},
331
+ Volume = {25},
332
+ Year = {2009}}
333
+
334
+ @article{Suzuki:2018aa,
335
+ Author = {Suzuki, Hajime and Kasahara, Masahiro},
336
+ Journal = {BMC Bioinformatics},
337
+ Pages = {45},
338
+ Title = {Introducing difference recurrence relations for faster semi-global alignment of long sequences},
339
+ Volume = {19},
340
+ Year = {2018}}
341
+
342
+ @article{Li:2018ab,
343
+ Author = {Li, Heng},
344
+ Journal = {Bioinformatics},
345
+ Pages = {3094-3100},
346
+ Title = {Minimap2: pairwise alignment for nucleotide sequences},
347
+ Volume = {34},
348
+ Year = {2018}}
349
+
350
+ @article{Jain:2020aa,
351
+ Author = {Jain, Chirag and others},
352
+ Journal = {Bioinformatics},
353
+ Pages = {i111-i118},
354
+ Title = {Weighted minimizer sampling improves long read mapping},
355
+ Volume = {36},
356
+ Year = {2020}}
357
+
358
+ @article{Miga:2020aa,
359
+ Author = {Miga, Karen H and others},
360
+ Journal = {Nature},
361
+ Pages = {79-84},
362
+ Title = {Telomere-to-telomere assembly of a complete human {X} chromosome},
363
+ Volume = {585},
364
+ Year = {2020}}
365
+
366
+ @article {Jain2020.11.01.363887,
367
+ author = {Jain, Chirag and others},
368
+ title = {A long read mapping method for highly repetitive reference sequences},
369
+ elocation-id = {2020.11.01.363887},
370
+ year = {2020},
371
+ doi = {10.1101/2020.11.01.363887},
372
+ publisher = {Cold Spring Harbor Laboratory},
373
+ URL = {https://www.biorxiv.org/content/early/2020/11/02/2020.11.01.363887},
374
+ eprint = {https://www.biorxiv.org/content/early/2020/11/02/2020.11.01.363887.full.pdf},
375
+ journal = {bioRxiv}
376
+ }
377
+
378
+ @article{Li:2020aa,
379
+ Author = {Li, Heng and others},
380
+ Journal = {Genome Biol},
381
+ Pages = {265},
382
+ Title = {The design and construction of reference pangenome graphs with minigraph},
383
+ Volume = {21},
384
+ Year = {2020}}
385
+
386
+ @article{Ren:2021aa,
387
+ Author = {Ren, Jingwen and Chaisson, Mark J P},
388
+ Journal = {PLoS Comput Biol},
389
+ Pages = {e1009078},
390
+ Title = {lra: A long read aligner for sequences and contigs},
391
+ Volume = {17},
392
+ Year = {2021}}
393
+
394
+ @inproceedings{DBLP:conf/wabi/AbouelhodaO03,
395
+ Author = {Mohamed Ibrahim Abouelhoda and Enno Ohlebusch},
396
+ Booktitle = {Algorithms in Bioinformatics, Third International Workshop, {WABI} 2003, Budapest, Hungary, September 15-20, 2003, Proceedings},
397
+ Crossref = {DBLP:conf/wabi/2003},
398
+ Pages = {1--16},
399
+ Title = {A Local Chaining Algorithm and Its Applications in Comparative Genomics},
400
+ Year = {2003}}
401
+
402
+ @article{Ono:2021aa,
403
+ Author = {Ono, Yukiteru and others},
404
+ Journal = {Bioinformatics},
405
+ Pages = {589-595},
406
+ Title = {{PBSIM2}: a simulator for long-read sequencers with a novel generative model of quality scores},
407
+ Volume = {37},
408
+ Year = {2021}}
409
+
410
+ @article{Sedlazeck:2018ab,
411
+ Author = {Sedlazeck, Fritz J and others},
412
+ Journal = {Nat Methods},
413
+ Pages = {461-468},
414
+ Title = {Accurate detection of complex structural variations using single-molecule sequencing},
415
+ Volume = {15},
416
+ Year = {2018}}
417
+
418
+ @article{Jeffares:2017aa,
419
+ Author = {Jeffares, Daniel C and others},
420
+ Journal = {Nat Commun},
421
+ Pages = {14061},
422
+ Title = {Transient structural variations have strong effects on quantitative traits and reproductive isolation in fission yeast},
423
+ Volume = {8},
424
+ Year = {2017}}
425
+
426
+ @article{Zook:2020aa,
427
+ Author = {Zook, Justin M and others},
428
+ Journal = {Nat Biotechnol},
429
+ Pages = {1347-1355},
430
+ Title = {A robust benchmark for detection of germline large deletions and insertions},
431
+ Volume = {38},
432
+ Year = {2020}}
433
+
434
+ @article{Harpak:2017aa,
435
+ Author = {Harpak, Arbel and others},
436
+ Journal = {Proc Natl Acad Sci U S A},
437
+ Pages = {12779-12784},
438
+ Title = {Frequent nonallelic gene conversion on the human lineage and its effect on the divergence of gene duplicates},
439
+ Volume = {114},
440
+ Year = {2017}}
441
+
442
+ @article{Li:2018aa,
443
+ Author = {Li, Heng and others},
444
+ Journal = {Nat Methods},
445
+ Month = {Aug},
446
+ Number = {8},
447
+ Pages = {595-597},
448
+ Title = {A synthetic-diploid benchmark for accurate variant-calling evaluation},
449
+ Volume = {15},
450
+ Year = {2018}}
451
+
452
+ @article{Gu:1995wt,
453
+ author = {Gu, X and Li, W H},
454
+ journal = {J Mol Evol},
455
+ month = {Apr},
456
+ number = {4},
457
+ pages = {464-73},
458
+ title = {The size distribution of insertions and deletions in human and rodent pseudogenes suggests the logarithmic gap penalty for sequence alignment},
459
+ volume = {40},
460
+ year = {1995}}