bio-polymarker 1.3.2

Sign up to get free protection for your applications and to get access to all the features.
Files changed (177) hide show
  1. checksums.yaml +7 -0
  2. data/.travis.yml +24 -0
  3. data/Gemfile +23 -0
  4. data/README.md +205 -0
  5. data/Rakefile +61 -0
  6. data/SECURITY.md +16 -0
  7. data/VERSION +1 -0
  8. data/bin/bfr.rb +128 -0
  9. data/bin/blast_triads.rb +166 -0
  10. data/bin/blast_triads_promoters.rb +192 -0
  11. data/bin/count_variations.rb +36 -0
  12. data/bin/filter_blat_by_target_coverage.rb +69 -0
  13. data/bin/filter_exonerate_by_identity.rb +38 -0
  14. data/bin/find_best_blat_hit.rb +33 -0
  15. data/bin/find_best_exonerate.rb +17 -0
  16. data/bin/get_longest_hsp_blastx_triads.rb +66 -0
  17. data/bin/hexaploid_primers.rb +168 -0
  18. data/bin/homokaryot_primers.rb +183 -0
  19. data/bin/mafft_triads.rb +120 -0
  20. data/bin/mafft_triads_promoters.rb +403 -0
  21. data/bin/map_markers_to_contigs.rb +66 -0
  22. data/bin/marker_to_vcf.rb +241 -0
  23. data/bin/markers_in_region.rb +42 -0
  24. data/bin/mask_triads.rb +169 -0
  25. data/bin/polymarker.rb +410 -0
  26. data/bin/polymarker_capillary.rb +443 -0
  27. data/bin/polymarker_deletions.rb +350 -0
  28. data/bin/snp_position_to_polymarker.rb +101 -0
  29. data/bin/snps_between_bams.rb +107 -0
  30. data/bin/tag_stats.rb +75 -0
  31. data/bin/vcfLineToTable.rb +56 -0
  32. data/bin/vcfToPolyMarker.rb +82 -0
  33. data/bio-polymarker.gemspec +227 -0
  34. data/conf/defaults.rb +1 -0
  35. data/conf/primer3_config/dangle.dh +128 -0
  36. data/conf/primer3_config/dangle.ds +128 -0
  37. data/conf/primer3_config/interpretations/dangle_i.dh +131 -0
  38. data/conf/primer3_config/interpretations/dangle_i.ds +131 -0
  39. data/conf/primer3_config/interpretations/loops_i.dh +34 -0
  40. data/conf/primer3_config/interpretations/loops_i.ds +31 -0
  41. data/conf/primer3_config/interpretations/stack_i.dh +257 -0
  42. data/conf/primer3_config/interpretations/stack_i.ds +256 -0
  43. data/conf/primer3_config/interpretations/stackmm_i_mm.dh +257 -0
  44. data/conf/primer3_config/interpretations/stackmm_i_mm.ds +256 -0
  45. data/conf/primer3_config/interpretations/tetraloop_i.dh +79 -0
  46. data/conf/primer3_config/interpretations/tetraloop_i.ds +81 -0
  47. data/conf/primer3_config/interpretations/triloop_i.dh +21 -0
  48. data/conf/primer3_config/interpretations/triloop_i.ds +18 -0
  49. data/conf/primer3_config/interpretations/tstack2_i.dh +256 -0
  50. data/conf/primer3_config/interpretations/tstack2_i.ds +256 -0
  51. data/conf/primer3_config/interpretations/tstack_i.dh +256 -0
  52. data/conf/primer3_config/interpretations/tstack_i.ds +256 -0
  53. data/conf/primer3_config/interpretations/tstack_tm_inf_i.dh +256 -0
  54. data/conf/primer3_config/interpretations/tstack_tm_inf_i.ds +256 -0
  55. data/conf/primer3_config/loops.dh +30 -0
  56. data/conf/primer3_config/loops.ds +30 -0
  57. data/conf/primer3_config/stack.dh +256 -0
  58. data/conf/primer3_config/stack.ds +256 -0
  59. data/conf/primer3_config/stackmm.dh +256 -0
  60. data/conf/primer3_config/stackmm.ds +256 -0
  61. data/conf/primer3_config/tetraloop.dh +77 -0
  62. data/conf/primer3_config/tetraloop.ds +77 -0
  63. data/conf/primer3_config/triloop.dh +16 -0
  64. data/conf/primer3_config/triloop.ds +16 -0
  65. data/conf/primer3_config/tstack.dh +256 -0
  66. data/conf/primer3_config/tstack2.dh +256 -0
  67. data/conf/primer3_config/tstack2.ds +256 -0
  68. data/conf/primer3_config/tstack_tm_inf.ds +256 -0
  69. data/lib/bio/BFRTools.rb +465 -0
  70. data/lib/bio/BIOExtensions.rb +153 -0
  71. data/lib/bio/PolyploidTools/ChromosomeArm.rb +63 -0
  72. data/lib/bio/PolyploidTools/ExonContainer.rb +245 -0
  73. data/lib/bio/PolyploidTools/Marker.rb +175 -0
  74. data/lib/bio/PolyploidTools/Mask.rb +116 -0
  75. data/lib/bio/PolyploidTools/NoSNPSequence.rb +292 -0
  76. data/lib/bio/PolyploidTools/PrimerRegion.rb +30 -0
  77. data/lib/bio/PolyploidTools/SNP.rb +804 -0
  78. data/lib/bio/PolyploidTools/SNPMutant.rb +86 -0
  79. data/lib/bio/PolyploidTools/SNPSequence.rb +55 -0
  80. data/lib/bio/db/blast.rb +114 -0
  81. data/lib/bio/db/exonerate.rb +333 -0
  82. data/lib/bio/db/primer3.rb +820 -0
  83. data/lib/bio-polymarker.rb +28 -0
  84. data/test/data/7B_amplicon_test.fa +12 -0
  85. data/test/data/7B_amplicon_test.fa.fai +1 -0
  86. data/test/data/7B_amplicon_test_reference.fa +110 -0
  87. data/test/data/7B_amplicon_test_reference.fa.fai +3 -0
  88. data/test/data/7B_marker_test.txt +1 -0
  89. data/test/data/BS00068396_51.fa +2 -0
  90. data/test/data/BS00068396_51_blast.tab +4 -0
  91. data/test/data/BS00068396_51_contigs.aln +1412 -0
  92. data/test/data/BS00068396_51_contigs.dnd +7 -0
  93. data/test/data/BS00068396_51_contigs.fa +8 -0
  94. data/test/data/BS00068396_51_contigs.fa.fai +4 -0
  95. data/test/data/BS00068396_51_contigs.fa.nhr +0 -0
  96. data/test/data/BS00068396_51_contigs.fa.nin +0 -0
  97. data/test/data/BS00068396_51_contigs.fa.nsq +0 -0
  98. data/test/data/BS00068396_51_contigs.nhr +0 -0
  99. data/test/data/BS00068396_51_contigs.nin +0 -0
  100. data/test/data/BS00068396_51_contigs.nsq +0 -0
  101. data/test/data/BS00068396_51_exonerate.tab +6 -0
  102. data/test/data/BS00068396_51_for_polymarker.txt +1 -0
  103. data/test/data/BS00068396_51_genes.txt +14 -0
  104. data/test/data/IWGSC_CSS_1AL_scaff_1455974.fa +112 -0
  105. data/test/data/IWGSC_CSS_1AL_scaff_1455974_aln_contigs.fa +2304 -0
  106. data/test/data/IWGSC_CSS_1AL_scaff_1455974_aln_contigs.fa.fai +11 -0
  107. data/test/data/LIB1716.bam +0 -0
  108. data/test/data/LIB1716.bam.bai +0 -0
  109. data/test/data/LIB1719.bam +0 -0
  110. data/test/data/LIB1719.bam.bai +0 -0
  111. data/test/data/LIB1721.bam +0 -0
  112. data/test/data/LIB1721.bam.bai +0 -0
  113. data/test/data/LIB1722.bam +0 -0
  114. data/test/data/LIB1722.bam.bai +0 -0
  115. data/test/data/PST130_7067.csv +1 -0
  116. data/test/data/PST130_7067.fa +2 -0
  117. data/test/data/PST130_7067.fa.fai +1 -0
  118. data/test/data/PST130_7067.fa.ndb +0 -0
  119. data/test/data/PST130_7067.fa.nhr +0 -0
  120. data/test/data/PST130_7067.fa.nin +0 -0
  121. data/test/data/PST130_7067.fa.not +0 -0
  122. data/test/data/PST130_7067.fa.nsq +0 -0
  123. data/test/data/PST130_7067.fa.ntf +0 -0
  124. data/test/data/PST130_7067.fa.nto +0 -0
  125. data/test/data/PST130_reverse_primer.csv +1 -0
  126. data/test/data/S22380157.fa +16 -0
  127. data/test/data/S22380157.fa.fai +1 -0
  128. data/test/data/S22380157.vcf +67 -0
  129. data/test/data/S58861868/LIB1716.bam +0 -0
  130. data/test/data/S58861868/LIB1716.sam +651 -0
  131. data/test/data/S58861868/LIB1719.bam +0 -0
  132. data/test/data/S58861868/LIB1719.sam +805 -0
  133. data/test/data/S58861868/LIB1721.bam +0 -0
  134. data/test/data/S58861868/LIB1721.sam +1790 -0
  135. data/test/data/S58861868/LIB1722.bam +0 -0
  136. data/test/data/S58861868/LIB1722.sam +1271 -0
  137. data/test/data/S58861868/S58861868.fa +16 -0
  138. data/test/data/S58861868/S58861868.fa.fai +1 -0
  139. data/test/data/S58861868/S58861868.vcf +76 -0
  140. data/test/data/S58861868/header.txt +9 -0
  141. data/test/data/S58861868/merged.bam +0 -0
  142. data/test/data/S58861868/merged_reheader.bam +0 -0
  143. data/test/data/S58861868/merged_reheader.bam.bai +0 -0
  144. data/test/data/Test3Aspecific.csv +2 -0
  145. data/test/data/Test3Aspecific_contigs.fa +6 -0
  146. data/test/data/bfr_out_test.csv +5 -0
  147. data/test/data/chr1A_C1145499T/chr1A_C1145499T.csv +1 -0
  148. data/test/data/chr1A_G540414846C/chr1A_G540414846C.csv +1 -0
  149. data/test/data/chr1A_G540414846C/chr1A_G540414846C.fa +2 -0
  150. data/test/data/chr1A_T517634750C/chr1A_T517634750C.csv +1 -0
  151. data/test/data/chr2D_C112180134A/chr2D_C112180134A.csv +1 -0
  152. data/test/data/chr4D_C14473543T/chr4D_C14473543T.csv +1 -0
  153. data/test/data/chr4D_C14473543T/chr4D_C14473543T.fa +2 -0
  154. data/test/data/headerMergeed.txt +9 -0
  155. data/test/data/headerS2238015 +1 -0
  156. data/test/data/mergedLibs.bam +0 -0
  157. data/test/data/mergedLibsReheader.bam +0 -0
  158. data/test/data/mergedLibsSorted.bam +0 -0
  159. data/test/data/mergedLibsSorted.bam.bai +0 -0
  160. data/test/data/patological_cases5D.csv +1 -0
  161. data/test/data/primer_3_input_header_test +5 -0
  162. data/test/data/short_primer_design_test.csv +10 -0
  163. data/test/data/some_tests/some_tests.csv +201 -0
  164. data/test/data/test_from_mutant.csv +3 -0
  165. data/test/data/test_iselect.csv +196 -0
  166. data/test/data/test_iselect_reference.fa +1868 -0
  167. data/test/data/test_iselect_reference.fa.fai +934 -0
  168. data/test/data/test_primer3_error.csv +4 -0
  169. data/test/data/test_primer3_error_contigs.fa +10 -0
  170. data/test/test_bfr.rb +135 -0
  171. data/test/test_blast.rb +47 -0
  172. data/test/test_exon_container.rb +17 -0
  173. data/test/test_exonearate.rb +48 -0
  174. data/test/test_integration.rb +76 -0
  175. data/test/test_snp_parsing.rb +121 -0
  176. data/test/test_wrong_selection.sh +5 -0
  177. metadata +356 -0
@@ -0,0 +1,11 @@
1
+ IWGSC_CSS_1AL_scaff_1455974 6657 29 60 61
2
+ IWGSC_CSS_1BL_scaff_3810460 17934 6826 60 61
3
+ IWGSC_CSS_1DL_scaff_2258883 12498 25088 60 61
4
+ IWGSC_CSS_6DS_scaff_2124533 31105 37824 60 61
5
+ IWGSC_CSS_6BS_scaff_2937320 8310 69477 60 61
6
+ IWGSC_CSS_6AS_scaff_4377549 11838 77955 60 61
7
+ IWGSC_CSS_5BL_scaff_10907528 20876 90021 60 61
8
+ IWGSC_CSS_5BL_scaff_10907771 11095 111275 60 61
9
+ IWGSC_CSS_1DS_scaff_1880574 10154 122584 60 61
10
+ IWGSC_CSS_1BS_scaff_3443604 3550 132937 60 61
11
+ IWGSC_CSS_1BS_scaff_3443603 3292 136576 60 61
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
@@ -0,0 +1 @@
1
+ PST130_7067,T,3334,G,7067
@@ -0,0 +1,2 @@
1
+ >PST130_7067
2
+ ggggggaggctaacttttggaaatcttttcctttctcttcttttcctatcatcttattatgaacattattattctatctgtgcacggagtgaactattatttattatttttgattgggatattctttttgttttgttttggagtgttattcagtaaggcagtaaggaagagatcagtccttattagttaaagaattctcttctcctttgggtcagaccttttagcgtgcaccacaaagtagcttacggagaagaggccatatttaccctccagctttcatctcaacctacctgtcccggaaacggacaggcaggtagttgctgagtaagttaaataactacttattctacaccaactcacttttctttccatagcgcaaagggccagcctccaaaggatccaaaggagggacttgttggggatactcaaatcttgcactgagagcatccactggtttggtgggcgattttttcccctgccttcacaacacctttgtggagctcaaaaatcacgcctgtgggacctgtttatgcacttttccgtccagcatggttacaaaacaacaacagaatgcttatgctccttagatctccagaggtagaaccaagaacacaagtgttgttgtgatgaagtcaatgagtgaggattcaattccaggcttgttttagataaagcttttcaccttacctagcatgtcttgttaaatagatatactgccgcagcagaatcgtgatgattatccagcaagccttatagtgtcttgcagttttttttgaggtgaagaggacggtagaagatagctacagttgtatgttgtaacgtcagtggactcctcggtagtctcgtttacggagaatggcccagcgaagtctgagccacaaaatatttcgaaaaacttcagtgctcgaagtcacgatagtcatattgcatcagatcaggaacctcaaagaaaattttcgggtgtggtacccaaaatgagcagacccttatttgaaagccaaccatcccgaccgtctaagtttactacttgaggcaagactaggtgtcaagcctctctcagaggctgatttcggaaggagttgaaacgtacaactgcgctcagctcgctgatagatcaagccaagacgaacgagccatcatcatcttagactgcaggaccaacaagccaggaaggtaaatctgtttcatgcattgcgagcacacaatcacgaatcacgggatgttcatttacagttctaaataacaaatggtgaaagtgacaaaaatggcgcgaagaggtttgctagcagttaggacaagccttcaagatcacgacgtatcgtccttcgccgatcggatagacgatataatgcagcaaagatgtttggaagagagcttgtgccagttcgttcaacccatcgagttcacccggtgctctacggatggtttcagagaattgatcatttggttagggtcccgtgtgcttaatagaagttgaaactggaagatagatcagtgatggcgtactgttagtggttccatcgttgtgaaattcggatagactgctgggctaggatactggaacgcaaccaaccgtctttgcttctgatactttgtgaccgcggttgacctttagtcgcagaacatttattggggtgaattcacaagtcttgcgtaatcagacaggcaatttgtgaaagaaatctgactcactgtcagtttgtaccgaggacaacaccagagcacgtcatgcggagcacatgttgggggatccaccgcgatgtctttcattccacatcaacagaggaaaaaacatgagcgtggtcaactctaagcgtgatttgaggagggaaaaaaagaatcacaaagattcctgtcgctttccttgccattgctgcacgcaggccacggagtgtcgccgctgcacttcgacgatacgaactcgctaagaccaaagacgcaaagtagaagtgcgggtttcatgaagttcatggtatcgaacaggcgacggggagtgcgatagggctgaagatgaagtggatgcttgtggatttgagggtgagttcgagaaaaatatgtgagttgttgacttctgagggcggccgaagtgaaaccactcgcctgttatatacatttccgaaagaagcctttcaaatgtatcaggtgtaatccaatcaccgaagattcctgcaaaaccttcagctgaggaatagacagcgggatgatttccccgacgacggtacagtcacagtgcccggtggcaccgcaggataacacacaaccccgtcgaaagctgtagctaacggggccgtcaagttgggccctgtgtggcctcggcgtactggctggcgaccctgagggtctccttggctttatacgattgcgtcgtgagcgcgcattgggtcaccggtcacccgtcgccacaaccaactcggtggggtccgatgctgtctgatggcgcctcgcggcgaccaaccttatgagctaagggaagtcacaaactcacacgaacaataaagtgggatatacatgctcgcaagagtcaggaaaatacaatggcttggagtgatgttagtgataaaaatgaatcagatggatgaaggtgctgaacccactttttgttctcttttcgagattactctatacatacaacctcagctgcaagtttatcggaaaaatgatcaaaacttgacataaatatcgaaaaaacctcaattgtcaatgtaactcagtgtaatgtttcgataagcaacaatcgttgctgattgaatttttcaaataagtggcatagagattgaagtatcgttaaaaatagatcaagaaagatacaatgagttattttgagtcattggaaggtcattgatgtaaaagatgatcaagcgaagtaaaatatggtaccgacgacttttcacaaactgatcaagaaaagaggattgtaaaactttcgacacagcgtggacaaagataaacaacaggaattgcttatgtctcttagatctcaagggaaagagaaaaaaaaaagcaagctgtgacatgatgggatcaatgagtttggccttgaaagtcgtgttttagatagagcttgtcgtatcttttagctagtctcctacaaatgaataaatccccatttcaaaagtggcattcttagtcagctggcctcatagtggcttgaagtttttcttggaggtgaagagacccttcaaggaaggtcgagacagtctgctgttgtagcgagaggtgacatgttgagataagagggacactcacattttctgaaaaaggcccagcgcattttgtgcttccaaagtttccaaaaagatttactcgtcaaagcagctatcatttccctacaccaaatcgagaatctgtaaaaatgcgtttgggtgtggtgcttggcttgacgcaaccgagacttggcagccaaccaccaaagttgacgttttggtatcccattatacttgtgacatttcttattagaatgacctcgttttactagtgttctttgttgtcgtccggtcattgtccgggattgaacgagactggtctccatgctttctcgctctctcaaacaatatatgagaagagcagcttcctcttcggcctcctctgagtcaacatcatcatttgctaagtcaaccctattggtttctacgattgaattctgggtcgaagaggttctttccaagggacctaatttcagctcatctcccgcttcttcgcccatggtaccggtttccttgttcccgagcgcgagcgtctttatggactctaagtcgtggattccattttctactccaactgggccatgtgcgacgcccccaatgccatgaagaggtattaaaagaaagatcaagtaaaatgggagatgcatgatttcttcactacttgtgagtaattttaaagttctcaaagggtgatggatggcaagatgaatgcaatctctcctccggcaaagattccaaggatgactgaaggttttatattgtttactccggagattgtgaggtacctgcgcagccgaatctagagctgcactgccttttgcttacttgtacgatagtcacatacacgactgtgaacactgacttcgcgcaaacatgaaagatactctccctaccacacaaggccatcgacgttctccaaatgtgtcggcgtctcaggtgatgtagaagcggggcatctcgtagatagtgccgtcatacggtgcaagaaaccctctgctgtgaagatagtggggaaatgtgggcggtcgcatcggaggtggcaagttgtgatcccttcaaactctcaatatatcaaagtgtccgaacaaccacgcggcaaaactgaccatgacttagcttgcaatcgggtgacgaaatcaaaatctcgtcatgctgacgttctgaatacgtatcctcaagttcgcgtgcaggcctgcacaggctcagtcgtcgtcacatacacaagtactgtgaacactgacctcgcgcagacatgacagatagcctgcctacaacgaggctatggaggttctgcgagttgaccggcgtctcaagtagtgtagtcacggagcgatgcaaggcataacctctgatgtggtaatagggggtcaaattttcgtggtcggatccagggtggcaagttgtgatcatttcaaactcatattagagtattgagactccgaacaaccgcaccacaaaaccaagacggccggcacgagtgtctctactaatcttacggtaatacgtagtctttcgttcaagcagcgttacctcttgactgtatgaatgtataattcagtaattctggttcaattttaatcagcatatgggaggacttccggccgatctgtaggatcagatctagacccccctggaaattgatttttccgggggcatctggttctgaggcaggcaaatctgactctgtaagggctgccaagggctacagaaaatgacgagaagtcctccattacatacgacatacaagtaatcaaacatatggcttactagagatcaattttacccaagaatacaaaatacacagatagagatatatgggtttagcaaatcacttttcctctcaattttcaacgttttttctagatagtgtgtgtgacgagatggtttggatgtacatggaatctgtgaagagattgggtgggtattgaatgaataagagattgcgtgaatataagaatcaagcttctaatttttcttgcgttcgctcagactgggtactaagatttcgaacaaagcttcttcccgttccctgaaagatggtatttggcttatgcctagagcgagtgtattgattcgattagctgcgaccctgacagtgcccatgggactaggagctcgattgttgtgactctcatctgggttttgtccggcttcccaattagtaccatgttccaagtcattcttgagtctatcgattttggtgggatgagttctttctccatggctcacactttctaccgcagattcatcgtcatctcgggctaaagcttgagtagaggaagcgatcaaaaataattgagcagctagtggttgaaggtgaggtggacaatcttccactttgaggatcgatggataaccgcttcctaaattcaccactcgtacttgacgatcagcgggattgacaagcgtcaatgaaacttctagaatagctagacagagtgcaccaaagtatgctcgagagagttgaccatcggttgaatttctggattgtaatatttcgaagactgttggggtggtataaaggatatcggtaagtgatgcgtacagcgtttcacgaataatactaagtgcaggatggttttccagagcggaatcaagcccagaaagaggtgatgtgttcaatttggcaccggagttcggagcgagagtaggaggtattgtagcgggggtagcatttccctcgtacgctggaggcggtcgaaaggtggaagaaggcactactgttggtgtagctctggtatcgtgaccgaattgaagcgcataatcaagatctacagtcaaagatggaggaggaagggttcagtaaacctcccaattccgtcagatggcccgagctggtgttcgaagatcacaactgactcaccttgagagaatctctcttgaaatgtacgccgctgagaaatttcaattgcgatcgctttcaaatctcgagccatgatcggaaggtcaattcggatcggttggcattgaggttcttgatcacaaatcattctggccaaatcgttgctcagatccggcggaagtgctttaatcttggggactgattgaaaagatgtacaggtgtgcatttttgaggattgattagataggtatgtcgtaactcgatggattgcagaaaacatagaagaagactgaccagcttcggaccagagtatgaaccagttccgaaaagaggcagggcaattatttgcgtccaagcatatcatggaggtggcaatgctgggaggtctcccttcgctacgaagtgctgccaggaagagacatatagcagggcccgcaatctggatatcagcttccgcggaactgaggacgctggtatctagcagtcgttcggcatgggcttgagccaaggcaccctagttttccacttcgaaaattagtaagccggccaatgattcgtcagaggggcgagtctggaaggctcacctggaggaaagagtgaaaggcaacaatgacctgaaacggagaatgtcgatcagctcacgttatctcgtcggagttctttgctcgtggacagcagctgaggatgactggagaactgatgatgagggactaacctgctcctccgaaatgttagtgtgtatcaagttgctgggcgacatccaatcagcagggtatcgtggaataagaaaacgggtcaagttctgttggactagcttcacatctgaattcttggcgtggcctggttttccccacacaaactccgcatacagcttgcaccgcaccctctgagctcaatcgggtcacccgatcccccggagtggcaatggagtcaaacgcccggcagggactcttggggctggaaaccagctctattcctgaattttggtgcttgatagcgtcaaatgggtgtatctccaagtagacatctgttaccctgcatcgaaaaagcgtcagcttgattgatccatcaagagttgaccaagtatttcaagattctttcaccctgctccaacccctctgtactagcagttaaggtcacccagctaggtacttcacaaaattcaagcatgttgctgaagagaagagggatgaaatgttacacccatatgtgcttctccacgggttgtacccctctttttccttctccccctttaccaatttgctgctcagaagctaaggcctacgaaggaaaagctgaaaagatactcaagatattactgatgtataaaccatttcaaacttctcctcttggacatgctgagagtcttatcttggcgtactcggttttaacatcagggttcccccaaatgcgagaaaatctcccaatgtgaacagagcatttctcaaggttcaaatcaaggatgtataaaggcagctttcctaggtcctcagtcagtctcttgctatgatcaagttattgattgatggtcgctcgggtcgtgaatccatttgccttcatttcacgcgcacctcattgctgtcggtggaaagcgtcgatgtttcgcgcagaggaccctgtgatctctatagctttgcttctttcatcctcatcacgttggagctgcaggacaaactgacacttgtgttgatctgcctaattttttactagacgcgaactgctctcgttaactggacgaataacagcagggaaaaaaaaatcatgcatcactttatctagcagctcttccgatcagaacaatggaaagcttattcttttgttactgaaagaatgcaggagctatggggtgttgttgtcgtaatattcgatagcagtgataaaggtttgcttggctttgtagaactgatcctgccaagtagcaaaccaagtcacgaagtaagttcgacttggaaaaccgtcggtttccgggatcagaggcacaaagtgaaggagtatgagaactaagcaagatgaaagacgagtgctaaggttttcagcctctcgagtaagctgatcgatgatgacgtgcttatacgtcgtctcagcttgttctatggataacttgatattggtgatggatttatgaacgtcgtccaccgagtcccccaaagtctgtagttgataagaatgcatccctgtgcacaacggaagtcgcctcttgttcatgcctcgtctggataattgcttgaaaaagagtctacacagcttcgtgattgttattgctgatctagccaggacaacgactggcgaaccgaggcgatcgctcacaagtgcttcagcttgaggtttcgcattttctccctcggcgttgtttggggaattggcaagcgttagaagattttgaagggtggactccattttctctaactgctggggccacttaatttgaacaacatccaattcggatccttcaaagcagagcatcatgtccttggtttcaatatgagttgagtagtcgaggaaataatgtctgatttcgtagatctcactctcatacggaggtctctctgtggagagctggagttgttttatgagcgaagaggtttctgcaacagcgtggacgagatgccgaaaacatggagcctcgatccagttcctgagcgcctcgactcggtacattttgaattctttgtgatgctggtcgtcacttttgtttgatgctaatatcttggtttctccacagttgacaaagaatagaggtgagatctgatcgacagctcgttcgatctccggttgaacggccaagatgagtttgagtgccgagcctggttctttgagtaagtcggatgtgtttaggagacgtgtaagaatcgaacattgatgaagtagtagcggcaggacgcttgagcgtagctggcccatgtaagctttgatcgggtcgtctccttcgatagactcaattgtaggcctcctctcgcggtaatgcaaatcccaaagtttggcagctattccttcaaagccttggatgaccaaatctagcacaagagttgtgggaagggtcagccactacgcccaaacatgtctggtgttgatcagatctggtgaatgagtcgctccagtacacaccaccttgttgccagacctctcgtcttgctgattcactcaaatgctcgagcgggtccgcggcgccttgaatgatcgagttgtaatcgatcgagcataccatcgtttgccgtagatttttcttggccttcccacaaaatttccgtggataaatccgtgttgagcagcggtctcaggcgcaaggtggccctgtacagtcagctgcttcttgctgaggcgagagcggatttcgtctaggaagccgtggaagattgaaggtgcggcgggcgacaaacttacaccaccgggtcaccttttgtgatcggtggccattaatacaatccatgcatgatttgtaagcagtttgccaacaaaatctcagatcgaggaccattggtccaacccaatccttgatcgtggactagtgtgggtcaacatgaaccacctcggccgcccgcggggcgtgggcgtggttgcgggacgattggcaggcgattgacgccacgcttgccccaaccttggcacttcgctgtcgttggcccaacctgaattcagacattttgtcgaacactcgggttgggaccggtcttgaccattgatgggctggcaggctgtccatgcctgcgggcccgcttggttgcaacatgtcagacggacaaatttcatcctttttgtccaagaagtcaagaaaactttgttagaaaaaaaaattaaaatgttaaaaaaaataaaaataaaacgttagacacttcaacagtgacacaattacccaagtgggtaatgaagtaaaatttagggtaattgagtatttttccatttttattcttctaattttcattatacatctacagaaaaaagatacaaaagagaaaaacaagctcattaccctgaattttactgaattacccacttgggtaattgtgtcactgttgaagtgagagtcaaaataaaaaataaataaatgacacttagaacgttcatagatgtttttgagtgtggatgaggaaagaaacaatggccaagtggttagcgtgatggctagagatgcgtgcatccggatgtagagggttcatacctgagtctatctttttggcaaatgcggccccttcggagggctcttggaggccattggagggccattgaagggccattggggggtcattgagaggagattggaggcaatggtgggttgatgtggtattgggaggaggttggtacagtccacacagccaacacatcgtgtgttcccatttggggacggcatcaaaatacggacacaatcttggttaccaaagcccaaattgtggcttggtccaatgcctccagaggtattgaaccactagcgagatgacccagtggtgtaacacaagtcccttgcttcggaggggataattttttgcgggtaaattgccgaccgagtgtgagcctccaaaggagggacttgttggaaatctggcctgggagctggaggtctcttggtggaagaaattttcccctgccaattccccctccttcccaaaaccaaaaacttccgctggatgtgaccaggcaaaaggcctgatttttccctttatttctgtccaggcaaaatggccttgggcctcctccttctgcagtgaaaaattgtgaaagatttcacttttcacttgaatttggaggagtgaaacagaagttccttgatcttccatgagcttccctctcttatttacagcagatcaattgaaatgcgcatggctgtggcatcaatcccttatgtacacattgaatcacaaatacagctcaagatggcatccggtacccggcacccgcccacacccgcctcacacccggttgggcggtccgggtgcggtgccaggtccctgatttcctcagcaaatttggatggcacccgggtgccgcctgccacacccgcccacagccacttattatgccgggggcttgggtgagccagggggttgcgcaagtgtaaattacattcaaaactcgccctaagcaatcaatcttcacggggggcttggggagactggagggcgcgcaacggtgaatctcatccgagcggatctggatatccacatatccagcccttcagatatcccccacccggaaccaacacaatgccctcgtcacgcaagcaaaaaaagaacaaccacccctcactcgaatcctcagccatctcctccccaaccaacccacccctaattgaagttggccattactcatagggtgggcggatacaaagtacgggtacgggtgttgatattttgtgattttccaagcgggtacccgagtaccgtcacccaattcctgtccgggtatccatgttccaccggttgcaacctaacctgttagtttacacacaatgagactcagctgctgctgataccaagaaggtatggtttatcggacaagagttcctctccaccagtcttccgctcttcacaccagtcttccgctcttcaccattcacaacgtcccttccatcaaatcttctcacaactaccaatgaccatgaatcgatgtccacgtaacaaggcccggccttgcagctcaccctcccccagctctgcaaccaaccatagcgcagtacctgactctttaacacaagaagaagaatcaattgacaaacccaccgaaagtgtagatctaacacccctcactgacaaagaagagcttggtcagttcctcaaagcaatttcttcatatgtatcaagctgacaatgtattttttcaacttagcccgtgcacagagaattgcaaaaacagctgtcagtttcagttacgcttcatacaaccgttcgcagctatcaaatcaaatggataagaacggacggcaaatgatcacatatccctgtaaaacgtgagctttttgcttatcatttttttggaggctgcactgattcttcttaacctgtagctgtggaaccaaaatcaatcgtcctatgaccgactctccatgtagcaacctccttaaacatgcagccagttgcaaaaggaaacagacggaaaaggaacaaacttgtttgctggcatcactcagagtttgaggaacaggggatatcaatgtttgtgaggtgagttatgtttgactaaaccaacaattttttttcatgttaattacctgacattccatcaaacaggtcaaccaactgtgtgcgatctggtgtgcagaggctgcccaaccattctcggcattggaagacaagagcctcaagagactatcacacccaacggtcctcaagcactaaccaactcaatgcacggtcttgagatccatccatctcctgtacactgtggtacaggaaagctttaagcttgaactcaaggtattttccattcccaattcctcacttgagaagatatactaacagataattgattctatgcttcatagaaccacactcgtgcgttttatctgggtgtcaatgcatggcaatcactgaatggattcaacatccttggtattttcatgtcctggatcaacaaatcggaagctttgagtcagaaacttcaatcaatgctgctggacttcatcaagttgtctcaaagccacacgggcaaatacttggctgaaatggtccaatttgtcgtggagaagttttggttcaaaacaaggtatgttgtgttcacctgtctggatatctaattgccagccactgaccatttttcatttcagatctgtggcattgtttcagataacgcttccaacaacgcagtgatggtcgatgagttgaaaaaacttaaatggcctcgtttcaagggagaaccccattggatctgttgctttgcgcacatactcaaccttatcgtgaaaaccatcttgagatcgtttggaaccgagaggaactcaagccaaaacatcaacattgattcagaacacaaaaaggaagctaatatacaacaggttgaccagtaagtttgaaaacatcgattgatctatattcttgcctgagactgacgaaatgttggttttacctaagctacactaaagggcaccccaattctcagttggccaaagaagatgatttggattcagatgaggatgacaagggagtgaccagagtcacataagttgaaggattggatatcacagacatcaacaatctgagtgacaaagacgatcaagatcagtacactgcgcacaattgtcaacagactcttgcaaaggtaataagaacgtaatgaatcatatttttgattccgcctggaaattaactcatctttctctgatgcagccacagttttgagcaattgctcgtaaattgaaaaagtcaccaaaatccaaagagttgtttgccgagatctgtgaagcccactcaattcaatcacctcatagaatcccacaagacgtacaaacgaggtggaactcaacgttcctggaactaaccagtgttgattggtgtcacaaggcaatgtaagtaatttcttatatgctgagatcaatcaaacaacaccatgctgatccaacaattcagccttgagtggcaacacgatgagaaatacggccttaatcaaaagtaccaagtcggtgctagtgacttggaattgtcgaacgattggggagttgttctccagccattctacaagattaccttgcaagtattgaccaaaggatcagctcgtttatcacatgttgtggttttcattgactagattactgaacatctgtcaacaatcatctctgaaaagaagtacccggccccattgaggaatgcctgttgggcgggtcttcagatccacgctaactgactgctctcctttgtaccaagttgcaatgagtaagccgctggttcctttatgtcttttctgaggctgcaatctgattttatttgttttttgcagtactccacccctcgttcaaagacgagtactttgaaattgccagatggagtccagagtggatcaaagcggccattgatctcacccaagagatgtggatctcacattacaagccccaagtcaaggaaacagtttccgaagacactacttcaaaatcaaaagtaagtgattggctttcttcgatcttttatttgttctcaaattaacgattcttaatgttctttcagtccctaaccggtttcgtatctcaactcggtgcagcttcagcagcacggtcaggtaattcatcaactgaaccaattgacatctggctctcaggaggcctcatcttgtaaggatcagcgccagtcaatgccctcaaatggtggctgcaacagaagtggggaggaaacacttacgttgggctttcaaacatggctctcaatgtcttgagttgcccaggtttgttttgattctttatcatatccattcactcagagattgtcaactgttacagcaacatccgtggtcgtcgagcgcacattcagctttggccgtgactatgtcacaaccaaaaggcaccgcttgagtgcagctttggtgagcaggggaatgacggtagcattctatttgaaaaataaaaagatcaaaagcggggaactcaacaggtttgaagagaagctcaaaacagaaaaaaaaaaaagatgaaggcaacaggaaaaggaaaaggaaaagaacgtgtagagattgttataaattaagagaaaattgtgtgaagtgaatctatgtgtctgaacaagataaaagaaattgttgtgtctgaatgaaactaaatgaatccatgtgtccaaacaaaataaaatgattattgcctgcaagtaccgacggtaccggccaaaatttcccggatacccgcccagcgggtcccgagtacgtgtctgtgtcttgagtttgagctaaaaacatgagaggtacccggacccgttgcgggtacctgggtccagtctgccatctttagttttgcctttagaattgttacttccatctccttgaagtggtgaagaagataaacaaaaactaatatggacttggtcaggtctgaaagcccaaaagcagcaaccaacaaaaggtgatggcaagcaacagtcttgtgtgtctaccaatgtagttggtttgaaagaaggattgattatctcagtttgtctatctgcgtagtccgtacaaaaacaagattggtcaactaatatcttatgagaatccaatagtgtgatcaagaatctctttgggtgatcaagtctctttaatgtttatcattctgcgtccattcagttaccaacccaaacaatccaaatacactattacatataactagagaaaggagtgaaaagtatgatttttgttgaagtacattgtttgtgggctgaggtgttgatactggtgggagtccgtgatcaattggtcttgacatgcacaagtggagacgagtcatgctggttgatattgggtgggtatgtcaaaggggatgggtgatgatgattgagatgagtgaagatgatctgatgattactgtgagtgattctggatgatgttgggtatgttgaggcagttggggtgttgctatgcttccctaagttgaggttaaggaggacccactacaaaatcaattgcatcacattccgaagatgcgcggtaacattgcatgtgacatgcaatgccactttgcattttcaaaatgcaattgaatttttggccccaaaaattcaatcacattttggaaatgcgaggtgacatcgcatgtcacctgcgatgttaccgcgcattttcggaatgcaatgtaacaccttctgtagtgacttgaggagctccgtaagatttggtaagtctaccggtccttaaagagttacggaggaatcccatagctactgagctctaaagagcaaaggggggtgggattttccgctaaagtcgtgtaagttgaggttacagagcgggcttaccaaaacaagggtggatgctcttagactgcacatgccatagggccatgaatttcctccctttgtatttcttttggcacttgacttgatttttattgcttctattatatcatactagagaacacccaagtgttagccaaagaccgaccttgaaggatggtacagagccgtgcgtaaaggggcctcaaagggggtatttgcgtgtgttttacaacatgccaaatttgccatatgtacaacagattggccacttctaaaaccacaaaacacatcactcaacctactacaattgttgttttgagaaaaaacagccctgatacctaaagcctaccctaacacctacaccacgactcaattttttttgaaatcacacggcgggcccacagcgtggttggagttgggttggcgcgggtcatggaggacctgtctgccatggatcccacgtcacaggcgggctgacagcaaattaaagtcagcctgacttgaacacacctgggtacgacttggatgtcatgccaaccctgccgatgagcctgcgtgggcagatgtgcttgacatctggtcattcaagttggccacaccaccgtgtccaaccagaatctgcccttcccattgagcggacagaaaccatagggggggccgccgtggattttaatttcatggcatcaagcctgcgtgggcagacgtgcttgacatctggtcattcaagtggggcacaccaccttgtccgactagagtcttccctgggcaccgggttgacgagagctgttggcagtgaggcaccgtgaatctcaaggcaacgaatgaccttctaatcaacgttgttgccatggagccacctcacagtcaagatcaatggcatacataaatagtccattatgtacatctatcatagttaattacatgtattatacatagtttgaaagctatttgatgtacaattacagccctatgtcattaaatctggatccgttgttgttatcaccaaagtcaatgccctttgtcttgcacgtgttactttcttcacaacatttgatgcccactccttaaacccattgtgaagtgcatccagtcactgaagtgggctaggtggatcagctgggatatctgagaacttttggtgataatcaattgaggagagtgaagctaagttgacaatgtattgctcgttaattggtgtgtgtcaactcaagtgtcttccttgtactcctctgccgctccacaatcacaatctttgttgcagtcaacttacattcaccgtgttgatagttgtgctgggcattcaatccagctttgacactctgtatagtgagtgtgaaaggaggttaatttctatcaaataactttgaatgattgattggttttacttacatgtgaattgacaaaagtagagtgagaagtcctttggatctctctcatcttataaaagtcattttttcccatcctttgaaacattgtcgtattgataaagaactggctctgatgagaaagtttctcaaccttccagattgaattgactgatccaatatgttgagtttcttgagtttgtgtaacattaaactacataaagaccagcaatttgagtaaacacaaggaggagagacctgaatggcaaaatcaaaagagaacgaagaaaagtaccaagatgaaagagtttttcttgagaacttgctttccattcaattttagttcagatatctgtttgattttgtgatcaggataagaattttggaggtcctaggagttgcaatccaatcaacatctggtactttgaggttcttaacaaaagggtagttaacattttgaagatatgatgactgattgtagcccaacatctgctggattaaagcattttgtttgaatatactcgtgattctgttgaaagcttgtatgtatttcttttgttttttttcaaagaagaaaccactggagataatctgacggaaggtgtggtaactagtgactgaacgtaatggctatatctctgagaatgcccttaaaaatttcaaatttcccagtcgcaaaaagagaggctggaccatatcgaagaattgattctggtagatgaagtaacatatggaacttagctttactaacccattgggctgaatcttgaattatgtgcttcaagaatatattgatagtactgatacccattactaatccccatgggttaaaaaactgagactgggagcaatttgttttcagtatcgggacaacttctggaccaccacagattctgtgaggcctatgatttcttcattgggtaaattactcaacttggaccttcgtacagtgatttgggctggagtaagtgaagtcctcaaaagtatcaggtacatagatccgatggctgatgagcaggcgttttgaatccgttaggacaaagactttatttgcaatgtgtttgtataatcatctaacaggctgagctgacttaaaagttgacctcaacaacattccaccaaattaattttgatttacgaatcaccttatggattgggagtccattggtctctcttagcaatgaaatggaaatattcccaatagtttgccaaggctccctagaagaacctcaccctctaggttagagtagggggagtttatagggttgcaggtataattccttgttctagttttacagtcctgctccgagtccaaaagagtgaccacaaagacactaaaaaattggatttctttatatcaggtcccttgacgtatataaacgtctacagtgcaggccacgaagttccagccttccagtcagtacttttcctatcccgctaaccccctcttgctgtgaaatgagacatttagaattgcctttcttgttcttcagacccgctttatcattggtgatatacaaacaaactatctcacatcaaaacattcatagcacgagttatctcacatcaaaaattcatagcacgagttaataaatgggacccggtccttgtcgaattccatacgagttccactttccctaccagggttcaggacttgtgtgacatctgacaaggaaactactaatttcaaatttcaaaaaaaaattaaaatcctgaattaagaagattctagatcagtcgggtagctcagaatctgagtaagcaaaattctagaaacttcttttcctttttctgctaaaatttagaatcttccagaaaagctttccttgtatttccctttttccctcttagaatatttaagctcaacaagtttgtactcgcgaagggtttctttccttcgtggcaaaaattttgtttcatctttttcatcaccctttctctctcagaaaatcaaatccaagaaattcataaacaaatctgattctctaaataaagaactttaagtgttgcacccaaccacaaaattaagaaaccttaaaccaatccccaaatccctacccaatcaaccttgtagtgtgtcttcagtgaggtttggaattctttagcttgtctacgaattcccggaattccccgttgcttacaacccgccagtcttcaagacaaaaaatttgaaaaaaaagtgttttctttgtgttgtcaattgtagccgtccatcacatcctagtaatttacaatcttatccagccctatatgctcaaaccacctgaatcttgtaatagatcatgaatactattccgcatcctgagtcacgcgatccacgctggtcatgactgggtaaaaaacaagacaattcatcaatccagaaaaaattcatttaaaaaacttcatcatgtaacttacatgttgaccctcttggaagtatttatctttcatttgagtattgatcaaacgcaggaaattcttccaaagcgtaaatgtggcatcatgtttcagcatctcaactttagcgctggtgggtacatggaattaaagatctattgaacaacagccttcatcaccgatcacttgtgttggtttctcttgaagagatgtaaccctcccttcaagtttagtaatttagacaacagaatattgacaatttgtgctttgatccatcactcctttggctgtccagtccaaagttatcagctctgagatatcaaagatagctggattttcacttgcgtttttttttgcgaccaacaattcaggttatcctttttattctatttactttgcaaagctccccagtaattcatttcaagcggttcgattccatctaacactgtgaacaaaactcaaacaattctcaactgctgacatccctcttgagttgaacaggatgttctcactgtgcaactttcaacaccgttcgtgtaagaaggttctctccaattgtacgtccttggagggtttttaattggtagagacaggggatgctcttagaaaattgatagatgcatgatacatcaagacctggaaactacttccttttgttggaccgcctcagttccaactgcaaagcctgaaatttggctacaaggctggttcttgacgatgatcccaacagcgaagtttatcagaaaattgaccccgtgccaacatcgttgcccatgacaatagatggcaatcgtgcgcctcatcgaatcaaggaacgctctacacaacttctcctctcgaaggtgagtatgctcatgtaaggggtaagcatttggattatcaaggagccgggcttatctggcgccgggagttcgtcacgagagggacaatcatgaacgtcaagtcgcgtaccgcgaggcaccctctcggctcgatcaccacgtcgaacaaatactgaaacctctcaaaatagagaatctgagtcaacatgcaccccttcacatggtatgtcagctcggggatccttcacagtcctcaatcatctacgcccgccgagcgatggggtggcaatagtgagaaaagttgggacaagtagggggtagcttaccgagcgggtttatcggcacgagggtggatgctcttattagagttgtaaggatcggatgaaatcggactgactgtgtggcccgacttcttccgccgcttatatgtattaacccctgcggaatagactctatatgcacccctttatttccgctcttgtacactcttttccacctctttgctcccggagtgaaggggggtgatctgctgcaggtgaagtcgatccgaccgccttccgtcgcactacctcagtcccctctcacaaattaattttttttatcctcttatctcgaagtcaggtgaaatggacgatcctgtggctgaggtacgtgaagtgtgatcccaaatgctttggtttttctccttatctttcttgcaagaaggggcccgaatcttaggtgaattacagagctaactgatgtcaggatttttgatttgaaattttcatgcgtaaatcagattagggacgttgtacgatcacttgttgaaccgtatgaagcatcagtgcttgcttcgaatgtggaaaagttagacttgaatatctgttgttgtgttgaactctgaagtcaaaggatgtaacaaaatctccgaattttttttcatttgtgctcacttccagatacttcactgaggacgcgttcatcttgcatccgcttttgaaccagactccttccaaaggtagccgagaacatctgagaggcatttacaaaattctgtgagtttttttttctctctggatcgtgcatcctaggacgtcttggatgtctaatcgtgaacgaatttcctgcgcagtcgagtttttactatcaacaataagatcgagtttcacgctgtgatgtttaacgaggataaaactcaaggttcaattggtaagtcttgaaaccttaacctagtgtaccagaacctaaccactgatcaacaacaaactttttcttatggttccctccaaccagaattgactgagcatctctacccacgactatttccatgcgaaagtttgaagatgtcacttccattatggatcagaatcgacttgattaaagataccgatgggaaatatcgaatatgcaggttagccaagtctggctagatattcccagtcacctgttaccaccatgctgaatttactttttatttatcctcagacaacacgacatgattccagctgatccaggaatcgttgcacttccgttcctttcgatctttacccacgggtttaacatcatcaaagcgtttaatggtttggctatgggaacaatcggaaagtttcttcttgatcggaaatattttggagcttgaaaatcgaaatctagtgtgaatgataatattgttggtgacaaatcatgttgtgatgacacaaagaaaaccgaaaaacaaaaatgtagcttttcctaaataatctgaattgaatcatcaaccactttcagtttggtatactatcacccgatgtagcctccttccttgaattgtttgcgttccgaataggcaagaccttgtggcaagggtcacagccagccagtccaagataatgattagaggaacgtatcgtccttgtttagctcgaccatgtgcaaagagagaatgcacaaaaattacaagtgatgaatgtgtgaagactatgattgcttgggttactcagatctaacctcaagagatcgatgtcgtgtgtgaagtggttgcatgaaatcttgttgatggagttgcagatccgccagtcatatgacgtgatccgacagtatccgaggctcgagggaagtagggtagttggcaacttgcctgttccacctgccaacgcatggtggactttcttcgagccagcaccacccaagaacatcttcactactaccaaaacgcaacagccatccagttcaactacagcccttagtaatccaatcaaccaaacgatgtctacctgcaccggctatctcgatccgatcaagcgctcctttgcggatgcaccagttgctgacgagggcgtggacacagtaccattcttggaagcctgcgaagacctcgtcaagctattcggtgagtgaatcgtctcattattatcttttctccgattcatagatcacgaattataacgtacgctttcatgtatatcttcagatctttttcggaagtaaagcgttcgccgtcgtgcagaatgatttgaccggcaatattactgtgagtacgcttcacgcccgagaccccaccttatgcgcttacagagactgacgtgtgtaactctttttttttcattggatcccacagaaaaatcgtactcgttataacgctttcccagagaaatcaaagactctcgagtcactcgtagagaacgatattcgtgaagagaagaaagatgcaacccacgcactactctggttaactcggtaaaatcacatttgatttcttgaatataaaaaaagattgagttataagctggaaggtgacttacatatcaagaactcttttttcttgtaggggtttacacttcacctctgaagggcttcgattatcccagaacaatccaggagaagagttatctatatcgtttacgaaaggttatgaagctacattaaaacagtatcattcctttgtaatgaaaccattactcggagtaagttcatatatctgattcctcgccatttccatcacaaagatgtggacatgtattctgactctgattgaaatcaccacagctcgccatgaaagcgtgcccttatccagcagatttatatcaaaaattgggaactaaggagaaagtggaagtcaaattagaaagatggctttcagctctagaaatgatcgttgtccgaatccaaaaattctatgaaaagggcaactatggcaacggtctttgagaaggcgtgattcaccacacccgcccaacaaatcttgaccatgttggaccagtaattgagcatgttcttctcttgctccggatcgtcaatcaatttggaggcctaggcaaggagattcttctggatatgccacacacagagcatttgtttggtgtcagggaaggtggtggctagagagttaattaatgcttgtttgcggtcagtgatgacaacagctgggaaaggtatcttgtgggatttgaagcccgtgaccaacgcttgcagcgcccagtcgcagaaagatttggtttgtttgctcatgaaacagaaggcaatactgaaagtcttgttggcaccagtgattcctgagatgtgaagcaagggcatgttgtatttatttgtcttgtacgtacagtcaagtagaatgatgtgagggtaagccgtgagcaattcaactgatctagcgtgacataaaaatagggctttgagaactccttcatcattgactttggttgttgtggtgaaatcggtgttgaggagagttttgttgagatgggcgatcgggctgagtccttgaagggattggagtcttgatttcttccttgccgtatatatggtgcttatggtcgctagaatcttctcgttggggtgagttttcttcattgcggtgaggattccctgtggtttcaagccagtgtcgccaagatccttcattttgataatgagtgcaggtgccagcttttgattagctgtatgtgcagctgcgtatgcagatggtgggtggttgtgtctaggttctttacaagtgaagtaccaagcttgctttttcttgtggaaataaccagtggcggtgaaaggacagtcaatcaattttgtcgaagctgtcgaggccttggtctctcctgggcgcctgttctggttgggattgccgccactggagaatgcacaagggaaaaaaaaacaggtgggtcagcatcaggaaggtgcaaaacatggcagagaaatgggggttggcaagtggattttgggagtcggcactcggaaaaagtgagtcggtgatagaatcttgggagttgggagtcaggaaaacaattcctgagccccttgtgtacaaaggagtggatttgggagtcagaaatgggagaatgagagctggaagtccaagtttggcagtcacagattgaaaactggaagtcggaatgacaaataaaagagaaagataaaaatcaaactcaccagtcacatttcattgtcttgctcttcccggctactcctcgtctacacactactgcaaagccattctcaaccctgaagcccttagcagtagagagcattttgtccacatcttctgaataagcgtccggagggcaaggaaaagcatatagacaatccccagtttttggatcaatttcgtcgtagtcaagactaaaaacaaagctagataatgagatgttatcgtccatttcactattgccgtcatcaggttccgctacaatatttttctttggcacatttttttttgagaattccagttttttctccaggtttttcatttttttgtatgattttttgattttttcttcgaatcttggtgcatttatttcttttgagttctcagtggcttcatcaatttcaatggaccgaaatgatgtccggttgaccgcacggcgacgtcgactcaaccgtcacccggacgtcgagtgcatttgggagtcagaactccaatttttgggagttgatcaaccaagccccaaaataaataacattgattatgaaaagaagtgaaagcggtatgaattcctggaatgatacacctgcgatcaggtagctgatcacaatcatcaagccactatcctcagtcatggaagatgagaacgggttccaatattgagtatccaatgaacttttgattcacaaagatatacaagaacgtatttgttgacaatcaaatagggtgtcaaatgtggtaagatttttgcccaaacgcgtcaggtgagcttcttttttttagtgcttattgatctgacattgcgcacttaagtggatactagttaatgtagacatgcggtgatgtttgatagactacacatgattgaatatgggaaaatattttcaaccttgagaacttataagatctgagtttgtacatgactgaaaaggaaaagaaaaaggacaaaagaacaacaataaaaaataaaatgaaatccatctcttttgaccgggtctgaaaatagcaaaaactggctccaaccgacttttggcaccctgcgacccagacaggacgcttcatgggtgctcaagccatgaaccctaaattgaggagcgggcagaaagttgattgaaaccaatagccacttgtatccagctcgacaaccctactgatatctatcctaaacaataaattcaaaattaacaatagggggtgtcaatgatgcaaaatccaccattagaaaccagttaatt
@@ -0,0 +1 @@
1
+ PST130_7067 26091 13 26091 26092
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
@@ -0,0 +1 @@
1
+ PST130_7067,T,3334,G,7067
@@ -0,0 +1,16 @@
1
+ >gnl|UG|Ta#S22380157 FGAS065873 Triticum aestivum FGAS: Library 2 Gate 3 Triticum aestivum cDNA, mRNA sequence /gb=CV771480 /gi=55676420 /ug=Ta.5437 /len=859
2
+ acgcttgaccttaggcctatttaggtgacactatagaacaagtttgtacaaaaaagcagg
3
+ ctggtaccggtccggaattcccgggatatcgtcgacCCACGCGTCCGCGTCCGACCAGCA
4
+ CAAACAAGACTGTACTCTGGGCTCCTCTGACTCCGTGTCTTGCTAAAATATCTTTGGTCG
5
+ ACTCGTTGCGAGGTTGATCAGATGGCGGAGGAAGCGAAGCAGGATGTGGCGCCACCCGCG
6
+ CCGGAGCCGACCGAGGACGTCGCGGACGAGAAGGTGGCGGTTCCGTCGCCGGAGGAGTCT
7
+ AAGGCCCTCGTTGTCGCCGAGAATGACGCTGAGAAGCCTGCAGCTACAGGGGGCTCACAC
8
+ GAACGAGATGCTCTGCTCACGAGGGTCGCGACCGAGAAGAGGATTTCGCTGATCAAGGCA
9
+ TGGGAGGAGAACGAGAAGGCCAAAGCCGAGAACAAGGCCGTGAAGTTGCTGGCGGACATC
10
+ ACCTCGTGGGAGAACTCCAAGGCCGCGGAACTGGAAGCCGAGCTCAAGAAGATGCAAGAG
11
+ CAGCTGGAGAAGAAGAAGGCGCGCTGCGTGGAGAAGCTCAAGAACAGCGCCGCGACGGTG
12
+ CACAAAGAGGCGGAANGAGAAGCGTGCCGCGGCggaagcgcggcacggcgaggagatcgt
13
+ cgcggcggaggagaccGCCGCCAAGTACCGCGCCAAGGGTGAAGCGCCGAAGAAGCTGCT
14
+ CTTCGGCAGAAGATAGATATCGCTTCATCTTCAGCTTCTCTCTGTTTGACCGNTTGCATG
15
+ TCTCCTGCCCATGGCATCACTTGTGTATTTATCTTTGGGGGNGATCTTAGTTTGTATGGT
16
+ ATCATCAAATGCGTCGTGA
@@ -0,0 +1 @@
1
+ gnl|UG|Ta#S22380157 859 158 60 61
@@ -0,0 +1,67 @@
1
+ ##fileformat=VCFv4.1
2
+ ##fileDate=20160614
3
+ ##source=freeBayes v1.0.2-dirty
4
+ ##reference=S22380157.fa
5
+ ##phasing=none
6
+ ##commandline="freebayes -f S22380157.fa mergedLibsSorted.bam"
7
+ ##INFO=<ID=NS,Number=1,Type=Integer,Description="Number of samples with data">
8
+ ##INFO=<ID=DP,Number=1,Type=Integer,Description="Total read depth at the locus">
9
+ ##INFO=<ID=DPB,Number=1,Type=Float,Description="Total read depth per bp at the locus; bases in reads overlapping / bases in haplotype">
10
+ ##INFO=<ID=AC,Number=A,Type=Integer,Description="Total number of alternate alleles in called genotypes">
11
+ ##INFO=<ID=AN,Number=1,Type=Integer,Description="Total number of alleles in called genotypes">
12
+ ##INFO=<ID=AF,Number=A,Type=Float,Description="Estimated allele frequency in the range (0,1]">
13
+ ##INFO=<ID=RO,Number=1,Type=Integer,Description="Reference allele observation count, with partial observations recorded fractionally">
14
+ ##INFO=<ID=AO,Number=A,Type=Integer,Description="Alternate allele observations, with partial observations recorded fractionally">
15
+ ##INFO=<ID=PRO,Number=1,Type=Float,Description="Reference allele observation count, with partial observations recorded fractionally">
16
+ ##INFO=<ID=PAO,Number=A,Type=Float,Description="Alternate allele observations, with partial observations recorded fractionally">
17
+ ##INFO=<ID=QR,Number=1,Type=Integer,Description="Reference allele quality sum in phred">
18
+ ##INFO=<ID=QA,Number=A,Type=Integer,Description="Alternate allele quality sum in phred">
19
+ ##INFO=<ID=PQR,Number=1,Type=Float,Description="Reference allele quality sum in phred for partial observations">
20
+ ##INFO=<ID=PQA,Number=A,Type=Float,Description="Alternate allele quality sum in phred for partial observations">
21
+ ##INFO=<ID=SRF,Number=1,Type=Integer,Description="Number of reference observations on the forward strand">
22
+ ##INFO=<ID=SRR,Number=1,Type=Integer,Description="Number of reference observations on the reverse strand">
23
+ ##INFO=<ID=SAF,Number=A,Type=Integer,Description="Number of alternate observations on the forward strand">
24
+ ##INFO=<ID=SAR,Number=A,Type=Integer,Description="Number of alternate observations on the reverse strand">
25
+ ##INFO=<ID=SRP,Number=1,Type=Float,Description="Strand balance probability for the reference allele: Phred-scaled upper-bounds estimate of the probability of observing the deviation between SRF and SRR given E(SRF/SRR) ~ 0.5, derived using Hoeffding's inequality">
26
+ ##INFO=<ID=SAP,Number=A,Type=Float,Description="Strand balance probability for the alternate allele: Phred-scaled upper-bounds estimate of the probability of observing the deviation between SAF and SAR given E(SAF/SAR) ~ 0.5, derived using Hoeffding's inequality">
27
+ ##INFO=<ID=AB,Number=A,Type=Float,Description="Allele balance at heterozygous sites: a number between 0 and 1 representing the ratio of reads showing the reference allele to all reads, considering only reads from individuals called as heterozygous">
28
+ ##INFO=<ID=ABP,Number=A,Type=Float,Description="Allele balance probability at heterozygous sites: Phred-scaled upper-bounds estimate of the probability of observing the deviation between ABR and ABA given E(ABR/ABA) ~ 0.5, derived using Hoeffding's inequality">
29
+ ##INFO=<ID=RUN,Number=A,Type=Integer,Description="Run length: the number of consecutive repeats of the alternate allele in the reference genome">
30
+ ##INFO=<ID=RPP,Number=A,Type=Float,Description="Read Placement Probability: Phred-scaled upper-bounds estimate of the probability of observing the deviation between RPL and RPR given E(RPL/RPR) ~ 0.5, derived using Hoeffding's inequality">
31
+ ##INFO=<ID=RPPR,Number=1,Type=Float,Description="Read Placement Probability for reference observations: Phred-scaled upper-bounds estimate of the probability of observing the deviation between RPL and RPR given E(RPL/RPR) ~ 0.5, derived using Hoeffding's inequality">
32
+ ##INFO=<ID=RPL,Number=A,Type=Float,Description="Reads Placed Left: number of reads supporting the alternate balanced to the left (5') of the alternate allele">
33
+ ##INFO=<ID=RPR,Number=A,Type=Float,Description="Reads Placed Right: number of reads supporting the alternate balanced to the right (3') of the alternate allele">
34
+ ##INFO=<ID=EPP,Number=A,Type=Float,Description="End Placement Probability: Phred-scaled upper-bounds estimate of the probability of observing the deviation between EL and ER given E(EL/ER) ~ 0.5, derived using Hoeffding's inequality">
35
+ ##INFO=<ID=EPPR,Number=1,Type=Float,Description="End Placement Probability for reference observations: Phred-scaled upper-bounds estimate of the probability of observing the deviation between EL and ER given E(EL/ER) ~ 0.5, derived using Hoeffding's inequality">
36
+ ##INFO=<ID=DPRA,Number=A,Type=Float,Description="Alternate allele depth ratio. Ratio between depth in samples with each called alternate allele and those without.">
37
+ ##INFO=<ID=ODDS,Number=1,Type=Float,Description="The log odds ratio of the best genotype combination to the second-best.">
38
+ ##INFO=<ID=GTI,Number=1,Type=Integer,Description="Number of genotyping iterations required to reach convergence or bailout.">
39
+ ##INFO=<ID=TYPE,Number=A,Type=String,Description="The type of allele, either snp, mnp, ins, del, or complex.">
40
+ ##INFO=<ID=CIGAR,Number=A,Type=String,Description="The extended CIGAR representation of each alternate allele, with the exception that '=' is replaced by 'M' to ease VCF parsing. Note that INDEL alleles do not have the first matched base (which is provided by default, per the spec) referred to by the CIGAR.">
41
+ ##INFO=<ID=NUMALT,Number=1,Type=Integer,Description="Number of unique non-reference alleles in called genotypes at this position.">
42
+ ##INFO=<ID=MEANALT,Number=A,Type=Float,Description="Mean number of unique non-reference allele observations per sample with the corresponding alternate alleles.">
43
+ ##INFO=<ID=LEN,Number=A,Type=Integer,Description="allele length">
44
+ ##INFO=<ID=MQM,Number=A,Type=Float,Description="Mean mapping quality of observed alternate alleles">
45
+ ##INFO=<ID=MQMR,Number=1,Type=Float,Description="Mean mapping quality of observed reference alleles">
46
+ ##INFO=<ID=PAIRED,Number=A,Type=Float,Description="Proportion of observed alternate alleles which are supported by properly paired read fragments">
47
+ ##INFO=<ID=PAIREDR,Number=1,Type=Float,Description="Proportion of observed reference alleles which are supported by properly paired read fragments">
48
+ ##INFO=<ID=MIN,Number=1,Type=Integer,Description="Minimum depth in gVCF output block.">
49
+ ##INFO=<ID=END,Number=1,Type=Integer,Description="Last position (inclusive) in gVCF output record.">
50
+ ##INFO=<ID=technology.Illumina,Number=A,Type=Float,Description="Fraction of observations supporting the alternate observed in reads from Illumina">
51
+ ##FORMAT=<ID=GT,Number=1,Type=String,Description="Genotype">
52
+ ##FORMAT=<ID=GQ,Number=1,Type=Float,Description="Genotype Quality, the Phred-scaled marginal (or unconditional) probability of the called genotype">
53
+ ##FORMAT=<ID=GL,Number=G,Type=Float,Description="Genotype Likelihood, log10-scaled likelihoods of the data given the called genotype for each possible genotype generated from the reference and alternate alleles given the sample ploidy">
54
+ ##FORMAT=<ID=DP,Number=1,Type=Integer,Description="Read Depth">
55
+ ##FORMAT=<ID=RO,Number=1,Type=Integer,Description="Reference allele observation count">
56
+ ##FORMAT=<ID=QR,Number=1,Type=Integer,Description="Sum of quality of the reference observations">
57
+ ##FORMAT=<ID=AO,Number=A,Type=Integer,Description="Alternate allele observation count">
58
+ ##FORMAT=<ID=QA,Number=A,Type=Integer,Description="Sum of quality of the alternate observations">
59
+ ##FORMAT=<ID=MIN,Number=1,Type=Integer,Description="Minimum depth in gVCF output block.">
60
+ #CHROM POS ID REF ALT QUAL FILTER INFO FORMAT AVS Yr15 R2 S2
61
+ gnl|UG|Ta#S22380157 103 . GTCCG CACCA 110.198 . AB=0;ABP=0;AC=8;AF=1;AN=8;AO=5;CIGAR=2X2M1X;DP=7;DPB=15.4;DPRA=2;EPP=13.8677;EPPR=0;GTI=0;LEN=5;MEANALT=1.33333;MQM=34.6;MQMR=0;NS=4;NUMALT=1;ODDS=8.46791;PAIRED=0;PAIREDR=0;PAO=10;PQA=295.5;PQR=0;PRO=0;QA=113;QR=0;RO=0;RPL=0;RPP=13.8677;RPPR=0;RPR=5;RUN=1;SAF=0;SAP=13.8677;SAR=5;SRF=0;SRP=0;SRR=0;TYPE=complex;technology.Illumina=1 GT:DP:RO:QR:AO:QA:GL 1/1:3:0:0:2:32:-5.6255,-3.31133,0 1/1:2:0:0:2:49:-4.02265,-3.61236,0 1/1:1:0:0:0:0:-2.84294,-2.10721,0 1/1:1:0:0:1:32:-3.04402,-2.70927,0
62
+ gnl|UG|Ta#S22380157 172 . CTT CT 7962.24 . AB=0.587891;ABP=37.3637;AC=4;AF=0.5;AN=8;AO=301;CIGAR=1M1D1M;DP=512;DPB=419.333;DPRA=0;EPP=3.3638;EPPR=3.8683;GTI=0;LEN=1;MEANALT=2;MQM=50.8306;MQMR=55.2293;NS=4;NUMALT=1;ODDS=200.967;PAIRED=0.601329;PAIREDR=0.834146;PAO=9.5;PQA=200;PQR=66;PRO=5.5;QA=11120;QR=7815;RO=205;RPL=83;RPP=134.489;RPPR=83.1853;RPR=218;RUN=1;SAF=126;SAP=20.3316;SAR=175;SRF=132;SRP=39.883;SRR=73;TYPE=del;technology.Illumina=1 GT:DP:RO:QR:AO:QA:GL 0/1:133:63:2420:68:2491:-178.443,0,-172.662 0/1:132:39:1500:91:3403:-257.087,0,-93.0558 0/1:124:51:1932:72:2658:-200.413,0,-132.449 0/1:123:52:1963:70:2568:-189.353,0,-136.176
63
+ gnl|UG|Ta#S22380157 177 . G A 8949.82 . AB=0.611615;ABP=62.6332;AC=4;AF=0.5;AN=8;AO=337;CIGAR=1X;DP=551;DPB=551;DPRA=0;EPP=6.41893;EPPR=3.65971;GTI=0;LEN=1;MEANALT=1;MQM=51.6053;MQMR=55.4299;NS=4;NUMALT=1;ODDS=204.975;PAIRED=0.635015;PAIREDR=0.841121;PAO=0;PQA=0;PQR=0;PRO=0;QA=12529;QR=8228;RO=214;RPL=107;RPP=100.495;RPPR=74.608;RPR=230;RUN=1;SAF=140;SAP=23.9454;SAR=197;SRF=138;SRP=42.0156;SRR=76;TYPE=snp;technology.Illumina=1 GT:DP:RO:QR:AO:QA:GL 0/1:143:66:2551:77:2853:-204.971,0,-179.577 0/1:142:41:1586:101:3776:-284.807,0,-95.8858 0/1:132:52:1994:80:2979:-220.768,0,-136.603 0/1:134:55:2097:79:2921:-212.665,0,-146.38
64
+ gnl|UG|Ta#S22380157 210 . G C 1400.07 . AB=0.188172;ABP=631.383;AC=4;AF=0.5;AN=8;AO=140;CIGAR=1X;DP=744;DPB=744;DPRA=0;EPP=9.21451;EPPR=4.59839;GTI=1;LEN=1;MEANALT=1.25;MQM=55.9143;MQMR=54.0116;NS=4;NUMALT=1;ODDS=6.55347;PAIRED=0.835714;PAIREDR=0.761194;PAO=0;PQA=0;PQR=0;PRO=0;QA=4961;QR=21949;RO=603;RPL=50;RPP=27.8271;RPPR=13.1258;RPR=90;RUN=1;SAF=78;SAP=6.98099;SAR=62;SRF=298;SRP=3.18675;SRR=305;TYPE=snp;technology.Illumina=1 GT:DP:RO:QR:AO:QA:GL 0/1:193:162:5923:31:1092:-39.117,0,-463.027 0/1:194:144:5267:49:1753:-98.1484,0,-401.844 0/1:179:153:5554:26:936:-30.3158,0,-436.408 0/1:178:144:5205:34:1180:-49.8312,0,-403.758
65
+ gnl|UG|Ta#S22380157 275 . T C 10383.1 . AB=0;ABP=0;AC=8;AF=1;AN=8;AO=372;CIGAR=1X;DP=373;DPB=373;DPRA=0;EPP=3.1037;EPPR=0;GTI=0;LEN=1;MEANALT=1.25;MQM=56.828;MQMR=0;NS=4;NUMALT=1;ODDS=114.919;PAIRED=0.892473;PAIREDR=0;PAO=0;PQA=0;PQR=0;PRO=0;QA=12770;QR=0;RO=0;RPL=364;RPP=742.805;RPPR=0;RPR=8;RUN=1;SAF=192;SAP=3.85087;SAR=180;SRF=0;SRP=0;SRR=0;TYPE=snp;technology.Illumina=1 GT:DP:RO:QR:AO:QA:GL 1/1:98:0:0:97:3332:-295.121,-29.1999,0 1/1:98:0:0:98:3365:-299.931,-29.5009,0 1/1:90:0:0:90:3088:-276.481,-27.0927,0 1/1:87:0:0:87:2985:-265.696,-26.1896,0
66
+ gnl|UG|Ta#S22380157 297 . G A 116.697 . AB=0.171171;ABP=211.511;AC=4;AF=0.5;AN=8;AO=38;CIGAR=1X;DP=222;DPB=222;DPRA=0;EPP=30.668;EPPR=5.32339;GTI=2;LEN=1;MEANALT=1;MQM=55.5789;MQMR=56.75;NS=4;NUMALT=1;ODDS=5.24021;PAIRED=0.921053;PAIREDR=0.880435;PAO=0;PQA=0;PQR=0;PRO=0;QA=1246;QR=6568;RO=184;RPL=38;RPP=85.5263;RPPR=402.561;RPR=0;RUN=1;SAF=30;SAP=30.668;SAR=8;SRF=85;SRP=5.32339;SRR=99;TYPE=snp;technology.Illumina=1 GT:DP:RO:QR:AO:QA:GL 0/1:58:49:1733:9:299:-9.50685,0,-137.27 0/1:57:44:1595:13:431:-21.9339,0,-124.308 0/1:55:45:1602:10:322:-12.5,0,-127.194 0/1:52:46:1638:6:194:-1.85608,0,-130.564
67
+ gnl|UG|Ta#S22380157 309 . C G 1804.05 . AB=0.589552;ABP=12.3444;AC=4;AF=0.5;AN=8;AO=79;CIGAR=1X;DP=134;DPB=134;DPRA=0;EPP=3.03779;EPPR=6.20829;GTI=0;LEN=1;MEANALT=1;MQM=56.8354;MQMR=58.3273;NS=4;NUMALT=1;ODDS=60.1531;PAIRED=0.911392;PAIREDR=0.945455;PAO=0;PQA=0;PQR=0;PRO=0;QA=2820;QR=1984;RO=55;RPL=79;RPP=174.557;RPPR=122.441;RPR=0;RUN=1;SAF=40;SAP=3.03779;SAR=39;SRF=32;SRP=6.20829;SRR=23;TYPE=snp;technology.Illumina=1 GT:DP:RO:QR:AO:QA:GL 0/1:35:12:445:23:821:-62.9805,0,-29.8575 0/1:34:13:471:21:756:-57.6467,0,-32.1685 0/1:33:14:508:19:675:-50.6881,0,-35.9275 0/1:32:16:560:16:568:-41.3553,0,-41.0568
Binary file