bio-polymarker 1.3.2
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/.travis.yml +24 -0
- data/Gemfile +23 -0
- data/README.md +205 -0
- data/Rakefile +61 -0
- data/SECURITY.md +16 -0
- data/VERSION +1 -0
- data/bin/bfr.rb +128 -0
- data/bin/blast_triads.rb +166 -0
- data/bin/blast_triads_promoters.rb +192 -0
- data/bin/count_variations.rb +36 -0
- data/bin/filter_blat_by_target_coverage.rb +69 -0
- data/bin/filter_exonerate_by_identity.rb +38 -0
- data/bin/find_best_blat_hit.rb +33 -0
- data/bin/find_best_exonerate.rb +17 -0
- data/bin/get_longest_hsp_blastx_triads.rb +66 -0
- data/bin/hexaploid_primers.rb +168 -0
- data/bin/homokaryot_primers.rb +183 -0
- data/bin/mafft_triads.rb +120 -0
- data/bin/mafft_triads_promoters.rb +403 -0
- data/bin/map_markers_to_contigs.rb +66 -0
- data/bin/marker_to_vcf.rb +241 -0
- data/bin/markers_in_region.rb +42 -0
- data/bin/mask_triads.rb +169 -0
- data/bin/polymarker.rb +410 -0
- data/bin/polymarker_capillary.rb +443 -0
- data/bin/polymarker_deletions.rb +350 -0
- data/bin/snp_position_to_polymarker.rb +101 -0
- data/bin/snps_between_bams.rb +107 -0
- data/bin/tag_stats.rb +75 -0
- data/bin/vcfLineToTable.rb +56 -0
- data/bin/vcfToPolyMarker.rb +82 -0
- data/bio-polymarker.gemspec +227 -0
- data/conf/defaults.rb +1 -0
- data/conf/primer3_config/dangle.dh +128 -0
- data/conf/primer3_config/dangle.ds +128 -0
- data/conf/primer3_config/interpretations/dangle_i.dh +131 -0
- data/conf/primer3_config/interpretations/dangle_i.ds +131 -0
- data/conf/primer3_config/interpretations/loops_i.dh +34 -0
- data/conf/primer3_config/interpretations/loops_i.ds +31 -0
- data/conf/primer3_config/interpretations/stack_i.dh +257 -0
- data/conf/primer3_config/interpretations/stack_i.ds +256 -0
- data/conf/primer3_config/interpretations/stackmm_i_mm.dh +257 -0
- data/conf/primer3_config/interpretations/stackmm_i_mm.ds +256 -0
- data/conf/primer3_config/interpretations/tetraloop_i.dh +79 -0
- data/conf/primer3_config/interpretations/tetraloop_i.ds +81 -0
- data/conf/primer3_config/interpretations/triloop_i.dh +21 -0
- data/conf/primer3_config/interpretations/triloop_i.ds +18 -0
- data/conf/primer3_config/interpretations/tstack2_i.dh +256 -0
- data/conf/primer3_config/interpretations/tstack2_i.ds +256 -0
- data/conf/primer3_config/interpretations/tstack_i.dh +256 -0
- data/conf/primer3_config/interpretations/tstack_i.ds +256 -0
- data/conf/primer3_config/interpretations/tstack_tm_inf_i.dh +256 -0
- data/conf/primer3_config/interpretations/tstack_tm_inf_i.ds +256 -0
- data/conf/primer3_config/loops.dh +30 -0
- data/conf/primer3_config/loops.ds +30 -0
- data/conf/primer3_config/stack.dh +256 -0
- data/conf/primer3_config/stack.ds +256 -0
- data/conf/primer3_config/stackmm.dh +256 -0
- data/conf/primer3_config/stackmm.ds +256 -0
- data/conf/primer3_config/tetraloop.dh +77 -0
- data/conf/primer3_config/tetraloop.ds +77 -0
- data/conf/primer3_config/triloop.dh +16 -0
- data/conf/primer3_config/triloop.ds +16 -0
- data/conf/primer3_config/tstack.dh +256 -0
- data/conf/primer3_config/tstack2.dh +256 -0
- data/conf/primer3_config/tstack2.ds +256 -0
- data/conf/primer3_config/tstack_tm_inf.ds +256 -0
- data/lib/bio/BFRTools.rb +465 -0
- data/lib/bio/BIOExtensions.rb +153 -0
- data/lib/bio/PolyploidTools/ChromosomeArm.rb +63 -0
- data/lib/bio/PolyploidTools/ExonContainer.rb +245 -0
- data/lib/bio/PolyploidTools/Marker.rb +175 -0
- data/lib/bio/PolyploidTools/Mask.rb +116 -0
- data/lib/bio/PolyploidTools/NoSNPSequence.rb +292 -0
- data/lib/bio/PolyploidTools/PrimerRegion.rb +30 -0
- data/lib/bio/PolyploidTools/SNP.rb +804 -0
- data/lib/bio/PolyploidTools/SNPMutant.rb +86 -0
- data/lib/bio/PolyploidTools/SNPSequence.rb +55 -0
- data/lib/bio/db/blast.rb +114 -0
- data/lib/bio/db/exonerate.rb +333 -0
- data/lib/bio/db/primer3.rb +820 -0
- data/lib/bio-polymarker.rb +28 -0
- data/test/data/7B_amplicon_test.fa +12 -0
- data/test/data/7B_amplicon_test.fa.fai +1 -0
- data/test/data/7B_amplicon_test_reference.fa +110 -0
- data/test/data/7B_amplicon_test_reference.fa.fai +3 -0
- data/test/data/7B_marker_test.txt +1 -0
- data/test/data/BS00068396_51.fa +2 -0
- data/test/data/BS00068396_51_blast.tab +4 -0
- data/test/data/BS00068396_51_contigs.aln +1412 -0
- data/test/data/BS00068396_51_contigs.dnd +7 -0
- data/test/data/BS00068396_51_contigs.fa +8 -0
- data/test/data/BS00068396_51_contigs.fa.fai +4 -0
- data/test/data/BS00068396_51_contigs.fa.nhr +0 -0
- data/test/data/BS00068396_51_contigs.fa.nin +0 -0
- data/test/data/BS00068396_51_contigs.fa.nsq +0 -0
- data/test/data/BS00068396_51_contigs.nhr +0 -0
- data/test/data/BS00068396_51_contigs.nin +0 -0
- data/test/data/BS00068396_51_contigs.nsq +0 -0
- data/test/data/BS00068396_51_exonerate.tab +6 -0
- data/test/data/BS00068396_51_for_polymarker.txt +1 -0
- data/test/data/BS00068396_51_genes.txt +14 -0
- data/test/data/IWGSC_CSS_1AL_scaff_1455974.fa +112 -0
- data/test/data/IWGSC_CSS_1AL_scaff_1455974_aln_contigs.fa +2304 -0
- data/test/data/IWGSC_CSS_1AL_scaff_1455974_aln_contigs.fa.fai +11 -0
- data/test/data/LIB1716.bam +0 -0
- data/test/data/LIB1716.bam.bai +0 -0
- data/test/data/LIB1719.bam +0 -0
- data/test/data/LIB1719.bam.bai +0 -0
- data/test/data/LIB1721.bam +0 -0
- data/test/data/LIB1721.bam.bai +0 -0
- data/test/data/LIB1722.bam +0 -0
- data/test/data/LIB1722.bam.bai +0 -0
- data/test/data/PST130_7067.csv +1 -0
- data/test/data/PST130_7067.fa +2 -0
- data/test/data/PST130_7067.fa.fai +1 -0
- data/test/data/PST130_7067.fa.ndb +0 -0
- data/test/data/PST130_7067.fa.nhr +0 -0
- data/test/data/PST130_7067.fa.nin +0 -0
- data/test/data/PST130_7067.fa.not +0 -0
- data/test/data/PST130_7067.fa.nsq +0 -0
- data/test/data/PST130_7067.fa.ntf +0 -0
- data/test/data/PST130_7067.fa.nto +0 -0
- data/test/data/PST130_reverse_primer.csv +1 -0
- data/test/data/S22380157.fa +16 -0
- data/test/data/S22380157.fa.fai +1 -0
- data/test/data/S22380157.vcf +67 -0
- data/test/data/S58861868/LIB1716.bam +0 -0
- data/test/data/S58861868/LIB1716.sam +651 -0
- data/test/data/S58861868/LIB1719.bam +0 -0
- data/test/data/S58861868/LIB1719.sam +805 -0
- data/test/data/S58861868/LIB1721.bam +0 -0
- data/test/data/S58861868/LIB1721.sam +1790 -0
- data/test/data/S58861868/LIB1722.bam +0 -0
- data/test/data/S58861868/LIB1722.sam +1271 -0
- data/test/data/S58861868/S58861868.fa +16 -0
- data/test/data/S58861868/S58861868.fa.fai +1 -0
- data/test/data/S58861868/S58861868.vcf +76 -0
- data/test/data/S58861868/header.txt +9 -0
- data/test/data/S58861868/merged.bam +0 -0
- data/test/data/S58861868/merged_reheader.bam +0 -0
- data/test/data/S58861868/merged_reheader.bam.bai +0 -0
- data/test/data/Test3Aspecific.csv +2 -0
- data/test/data/Test3Aspecific_contigs.fa +6 -0
- data/test/data/bfr_out_test.csv +5 -0
- data/test/data/chr1A_C1145499T/chr1A_C1145499T.csv +1 -0
- data/test/data/chr1A_G540414846C/chr1A_G540414846C.csv +1 -0
- data/test/data/chr1A_G540414846C/chr1A_G540414846C.fa +2 -0
- data/test/data/chr1A_T517634750C/chr1A_T517634750C.csv +1 -0
- data/test/data/chr2D_C112180134A/chr2D_C112180134A.csv +1 -0
- data/test/data/chr4D_C14473543T/chr4D_C14473543T.csv +1 -0
- data/test/data/chr4D_C14473543T/chr4D_C14473543T.fa +2 -0
- data/test/data/headerMergeed.txt +9 -0
- data/test/data/headerS2238015 +1 -0
- data/test/data/mergedLibs.bam +0 -0
- data/test/data/mergedLibsReheader.bam +0 -0
- data/test/data/mergedLibsSorted.bam +0 -0
- data/test/data/mergedLibsSorted.bam.bai +0 -0
- data/test/data/patological_cases5D.csv +1 -0
- data/test/data/primer_3_input_header_test +5 -0
- data/test/data/short_primer_design_test.csv +10 -0
- data/test/data/some_tests/some_tests.csv +201 -0
- data/test/data/test_from_mutant.csv +3 -0
- data/test/data/test_iselect.csv +196 -0
- data/test/data/test_iselect_reference.fa +1868 -0
- data/test/data/test_iselect_reference.fa.fai +934 -0
- data/test/data/test_primer3_error.csv +4 -0
- data/test/data/test_primer3_error_contigs.fa +10 -0
- data/test/test_bfr.rb +135 -0
- data/test/test_blast.rb +47 -0
- data/test/test_exon_container.rb +17 -0
- data/test/test_exonearate.rb +48 -0
- data/test/test_integration.rb +76 -0
- data/test/test_snp_parsing.rb +121 -0
- data/test/test_wrong_selection.sh +5 -0
- metadata +356 -0
@@ -0,0 +1,82 @@
|
|
1
|
+
#!/usr/bin/env ruby
|
2
|
+
|
3
|
+
require 'optparse'
|
4
|
+
|
5
|
+
require 'csv'
|
6
|
+
require 'bio'
|
7
|
+
require 'bio-samtools-wrapper'
|
8
|
+
|
9
|
+
$: << File.expand_path(File.dirname(__FILE__) + '/../lib')
|
10
|
+
$: << File.expand_path('.')
|
11
|
+
path= File.expand_path(File.dirname(__FILE__) + '/../lib/bio-polymarker.rb')
|
12
|
+
require path
|
13
|
+
|
14
|
+
options = {}
|
15
|
+
options[:arm_selection] = Bio::PolyploidTools::ChromosomeArm.getArmSelection("nrgene");
|
16
|
+
|
17
|
+
|
18
|
+
OptionParser.new do |opts|
|
19
|
+
opts.banner = "Usage: vcfToPolyMarker.rb [options]"
|
20
|
+
|
21
|
+
opts.on("-c", "--reference FILE", "File with genome reference to use as database") do |o|
|
22
|
+
options[:path_to_contigs] = o
|
23
|
+
end
|
24
|
+
|
25
|
+
opts.on("-a", "--arm_selection #{Bio::PolyploidTools::ChromosomeArm.getValidFunctions.join('|')}", "Function to decide the chromome arm") do |o|
|
26
|
+
tmp_str = o
|
27
|
+
arr = o.split(",")
|
28
|
+
if arr.size == 2
|
29
|
+
options[:arm_selection] = lambda do |contig_name|
|
30
|
+
separator, field = arr
|
31
|
+
field = field.to_i
|
32
|
+
ret = contig_name.split(separator)[field]
|
33
|
+
return ret
|
34
|
+
end
|
35
|
+
else
|
36
|
+
options[:arm_selection] = Bio::PolyploidTools::ChromosomeArm.getArmSelection(o)
|
37
|
+
end
|
38
|
+
end
|
39
|
+
|
40
|
+
|
41
|
+
end.parse!
|
42
|
+
|
43
|
+
def parseVCFheader(head_line="")
|
44
|
+
##INFO=<ID=NS,Number=1,Type=Integer,Description="Number of samples with data">
|
45
|
+
|
46
|
+
m=/##INFO=<ID=(.+),Number=(.+),Type=(.+),Description="(.+)">/.match(head_line)
|
47
|
+
{:id=>m[1],:number=>m[2],:type=>m[3],:desc=>m[4]}
|
48
|
+
|
49
|
+
end
|
50
|
+
|
51
|
+
|
52
|
+
|
53
|
+
|
54
|
+
header_info = Hash.new
|
55
|
+
ref=options[:path_to_contigs]
|
56
|
+
|
57
|
+
fasta_reference_db = Bio::DB::Fasta::FastaFile.new({:fasta=>ref})
|
58
|
+
fasta_reference_db.load_fai_entries
|
59
|
+
|
60
|
+
$stdin.each do |line|
|
61
|
+
|
62
|
+
h = nil
|
63
|
+
h = parseVCFheader(line) if line.start_with? "##INFO"
|
64
|
+
|
65
|
+
header_info[h[:id]] = h[:desc] if h
|
66
|
+
#puts header_info.inspect
|
67
|
+
next if line.start_with? "##"
|
68
|
+
if line.start_with? "#CHROM"
|
69
|
+
arr = line.split
|
70
|
+
arr = arr.drop(9)
|
71
|
+
arr2 = arr.map { |s| [s.clone().prepend('Cov'), s.clone().prepend('Hap') ]}
|
72
|
+
#header += arr2.join("\t")
|
73
|
+
#puts header
|
74
|
+
next
|
75
|
+
end
|
76
|
+
line.chomp!
|
77
|
+
#puts line
|
78
|
+
snp = Bio::PolyploidTools::SNP.parseVCF( line , chr_arm_parser: options[:arm_selection])
|
79
|
+
#puts snp.inspect
|
80
|
+
snp.setTemplateFromFastaFile(fasta_reference_db, flanking_size: 100)
|
81
|
+
puts [snp.gene, snp.chromosome ,snp.to_polymarker_sequence(100)].join(",")
|
82
|
+
end
|
@@ -0,0 +1,227 @@
|
|
1
|
+
# Generated by juwelier
|
2
|
+
# DO NOT EDIT THIS FILE DIRECTLY
|
3
|
+
# Instead, edit Juwelier::Tasks in Rakefile, and run 'rake gemspec'
|
4
|
+
# -*- encoding: utf-8 -*-
|
5
|
+
# stub: bio-polymarker 1.3.2 ruby lib
|
6
|
+
|
7
|
+
Gem::Specification.new do |s|
|
8
|
+
s.name = "bio-polymarker".freeze
|
9
|
+
s.version = "1.3.2"
|
10
|
+
|
11
|
+
s.required_rubygems_version = Gem::Requirement.new(">= 0".freeze) if s.respond_to? :required_rubygems_version=
|
12
|
+
s.require_paths = ["lib".freeze]
|
13
|
+
s.authors = ["Rob Ellis".freeze]
|
14
|
+
s.date = "2024-09-25"
|
15
|
+
s.description = "Repository of tools developed at Crop Genetics in JIC to work with polyploid wheat".freeze
|
16
|
+
s.email = "rob.ellis@jic.ac.uk".freeze
|
17
|
+
s.executables = ["bfr.rb".freeze, "blast_triads.rb".freeze, "blast_triads_promoters.rb".freeze, "count_variations.rb".freeze, "filter_blat_by_target_coverage.rb".freeze, "filter_exonerate_by_identity.rb".freeze, "find_best_blat_hit.rb".freeze, "find_best_exonerate.rb".freeze, "get_longest_hsp_blastx_triads.rb".freeze, "hexaploid_primers.rb".freeze, "homokaryot_primers.rb".freeze, "mafft_triads.rb".freeze, "mafft_triads_promoters.rb".freeze, "map_markers_to_contigs.rb".freeze, "marker_to_vcf.rb".freeze, "markers_in_region.rb".freeze, "mask_triads.rb".freeze, "polymarker.rb".freeze, "polymarker_capillary.rb".freeze, "polymarker_deletions.rb".freeze, "snp_position_to_polymarker.rb".freeze, "snps_between_bams.rb".freeze, "tag_stats.rb".freeze, "vcfLineToTable.rb".freeze, "vcfToPolyMarker.rb".freeze]
|
18
|
+
s.extra_rdoc_files = [
|
19
|
+
"README.md"
|
20
|
+
]
|
21
|
+
s.files = [
|
22
|
+
".travis.yml",
|
23
|
+
"Gemfile",
|
24
|
+
"README.md",
|
25
|
+
"Rakefile",
|
26
|
+
"SECURITY.md",
|
27
|
+
"VERSION",
|
28
|
+
"bin/bfr.rb",
|
29
|
+
"bin/blast_triads.rb",
|
30
|
+
"bin/blast_triads_promoters.rb",
|
31
|
+
"bin/count_variations.rb",
|
32
|
+
"bin/filter_blat_by_target_coverage.rb",
|
33
|
+
"bin/filter_exonerate_by_identity.rb",
|
34
|
+
"bin/find_best_blat_hit.rb",
|
35
|
+
"bin/find_best_exonerate.rb",
|
36
|
+
"bin/get_longest_hsp_blastx_triads.rb",
|
37
|
+
"bin/hexaploid_primers.rb",
|
38
|
+
"bin/homokaryot_primers.rb",
|
39
|
+
"bin/mafft_triads.rb",
|
40
|
+
"bin/mafft_triads_promoters.rb",
|
41
|
+
"bin/map_markers_to_contigs.rb",
|
42
|
+
"bin/marker_to_vcf.rb",
|
43
|
+
"bin/markers_in_region.rb",
|
44
|
+
"bin/mask_triads.rb",
|
45
|
+
"bin/polymarker.rb",
|
46
|
+
"bin/polymarker_capillary.rb",
|
47
|
+
"bin/polymarker_deletions.rb",
|
48
|
+
"bin/snp_position_to_polymarker.rb",
|
49
|
+
"bin/snps_between_bams.rb",
|
50
|
+
"bin/tag_stats.rb",
|
51
|
+
"bin/vcfLineToTable.rb",
|
52
|
+
"bin/vcfToPolyMarker.rb",
|
53
|
+
"bio-polymarker.gemspec",
|
54
|
+
"conf/defaults.rb",
|
55
|
+
"conf/primer3_config/dangle.dh",
|
56
|
+
"conf/primer3_config/dangle.ds",
|
57
|
+
"conf/primer3_config/interpretations/dangle_i.dh",
|
58
|
+
"conf/primer3_config/interpretations/dangle_i.ds",
|
59
|
+
"conf/primer3_config/interpretations/loops_i.dh",
|
60
|
+
"conf/primer3_config/interpretations/loops_i.ds",
|
61
|
+
"conf/primer3_config/interpretations/stack_i.dh",
|
62
|
+
"conf/primer3_config/interpretations/stack_i.ds",
|
63
|
+
"conf/primer3_config/interpretations/stackmm_i_mm.dh",
|
64
|
+
"conf/primer3_config/interpretations/stackmm_i_mm.ds",
|
65
|
+
"conf/primer3_config/interpretations/tetraloop_i.dh",
|
66
|
+
"conf/primer3_config/interpretations/tetraloop_i.ds",
|
67
|
+
"conf/primer3_config/interpretations/triloop_i.dh",
|
68
|
+
"conf/primer3_config/interpretations/triloop_i.ds",
|
69
|
+
"conf/primer3_config/interpretations/tstack2_i.dh",
|
70
|
+
"conf/primer3_config/interpretations/tstack2_i.ds",
|
71
|
+
"conf/primer3_config/interpretations/tstack_i.dh",
|
72
|
+
"conf/primer3_config/interpretations/tstack_i.ds",
|
73
|
+
"conf/primer3_config/interpretations/tstack_tm_inf_i.dh",
|
74
|
+
"conf/primer3_config/interpretations/tstack_tm_inf_i.ds",
|
75
|
+
"conf/primer3_config/loops.dh",
|
76
|
+
"conf/primer3_config/loops.ds",
|
77
|
+
"conf/primer3_config/stack.dh",
|
78
|
+
"conf/primer3_config/stack.ds",
|
79
|
+
"conf/primer3_config/stackmm.dh",
|
80
|
+
"conf/primer3_config/stackmm.ds",
|
81
|
+
"conf/primer3_config/tetraloop.dh",
|
82
|
+
"conf/primer3_config/tetraloop.ds",
|
83
|
+
"conf/primer3_config/triloop.dh",
|
84
|
+
"conf/primer3_config/triloop.ds",
|
85
|
+
"conf/primer3_config/tstack.dh",
|
86
|
+
"conf/primer3_config/tstack2.dh",
|
87
|
+
"conf/primer3_config/tstack2.ds",
|
88
|
+
"conf/primer3_config/tstack_tm_inf.ds",
|
89
|
+
"lib/bio/BFRTools.rb",
|
90
|
+
"lib/bio/BIOExtensions.rb",
|
91
|
+
"lib/bio/PolyploidTools/ChromosomeArm.rb",
|
92
|
+
"lib/bio/PolyploidTools/ExonContainer.rb",
|
93
|
+
"lib/bio/PolyploidTools/Marker.rb",
|
94
|
+
"lib/bio/PolyploidTools/Mask.rb",
|
95
|
+
"lib/bio/PolyploidTools/NoSNPSequence.rb",
|
96
|
+
"lib/bio/PolyploidTools/PrimerRegion.rb",
|
97
|
+
"lib/bio/PolyploidTools/SNP.rb",
|
98
|
+
"lib/bio/PolyploidTools/SNPMutant.rb",
|
99
|
+
"lib/bio/PolyploidTools/SNPSequence.rb",
|
100
|
+
"lib/bio/db/blast.rb",
|
101
|
+
"lib/bio/db/exonerate.rb",
|
102
|
+
"lib/bio/db/primer3.rb",
|
103
|
+
"lib/bio-polymarker.rb",
|
104
|
+
"test/data/7B_amplicon_test.fa",
|
105
|
+
"test/data/7B_amplicon_test.fa.fai",
|
106
|
+
"test/data/7B_amplicon_test_reference.fa",
|
107
|
+
"test/data/7B_amplicon_test_reference.fa.fai",
|
108
|
+
"test/data/7B_marker_test.txt",
|
109
|
+
"test/data/BS00068396_51.fa",
|
110
|
+
"test/data/BS00068396_51_blast.tab",
|
111
|
+
"test/data/BS00068396_51_contigs.aln",
|
112
|
+
"test/data/BS00068396_51_contigs.dnd",
|
113
|
+
"test/data/BS00068396_51_contigs.fa",
|
114
|
+
"test/data/BS00068396_51_contigs.fa.fai",
|
115
|
+
"test/data/BS00068396_51_contigs.fa.nhr",
|
116
|
+
"test/data/BS00068396_51_contigs.fa.nin",
|
117
|
+
"test/data/BS00068396_51_contigs.fa.nsq",
|
118
|
+
"test/data/BS00068396_51_contigs.nhr",
|
119
|
+
"test/data/BS00068396_51_contigs.nin",
|
120
|
+
"test/data/BS00068396_51_contigs.nsq",
|
121
|
+
"test/data/BS00068396_51_exonerate.tab",
|
122
|
+
"test/data/BS00068396_51_for_polymarker.txt",
|
123
|
+
"test/data/BS00068396_51_genes.txt",
|
124
|
+
"test/data/IWGSC_CSS_1AL_scaff_1455974.fa",
|
125
|
+
"test/data/IWGSC_CSS_1AL_scaff_1455974_aln_contigs.fa",
|
126
|
+
"test/data/IWGSC_CSS_1AL_scaff_1455974_aln_contigs.fa.fai",
|
127
|
+
"test/data/LIB1716.bam",
|
128
|
+
"test/data/LIB1716.bam.bai",
|
129
|
+
"test/data/LIB1719.bam",
|
130
|
+
"test/data/LIB1719.bam.bai",
|
131
|
+
"test/data/LIB1721.bam",
|
132
|
+
"test/data/LIB1721.bam.bai",
|
133
|
+
"test/data/LIB1722.bam",
|
134
|
+
"test/data/LIB1722.bam.bai",
|
135
|
+
"test/data/PST130_7067.csv",
|
136
|
+
"test/data/PST130_7067.fa",
|
137
|
+
"test/data/PST130_7067.fa.fai",
|
138
|
+
"test/data/PST130_7067.fa.ndb",
|
139
|
+
"test/data/PST130_7067.fa.nhr",
|
140
|
+
"test/data/PST130_7067.fa.nin",
|
141
|
+
"test/data/PST130_7067.fa.not",
|
142
|
+
"test/data/PST130_7067.fa.nsq",
|
143
|
+
"test/data/PST130_7067.fa.ntf",
|
144
|
+
"test/data/PST130_7067.fa.nto",
|
145
|
+
"test/data/PST130_reverse_primer.csv",
|
146
|
+
"test/data/S22380157.fa",
|
147
|
+
"test/data/S22380157.fa.fai",
|
148
|
+
"test/data/S22380157.vcf",
|
149
|
+
"test/data/S58861868/LIB1716.bam",
|
150
|
+
"test/data/S58861868/LIB1716.sam",
|
151
|
+
"test/data/S58861868/LIB1719.bam",
|
152
|
+
"test/data/S58861868/LIB1719.sam",
|
153
|
+
"test/data/S58861868/LIB1721.bam",
|
154
|
+
"test/data/S58861868/LIB1721.sam",
|
155
|
+
"test/data/S58861868/LIB1722.bam",
|
156
|
+
"test/data/S58861868/LIB1722.sam",
|
157
|
+
"test/data/S58861868/S58861868.fa",
|
158
|
+
"test/data/S58861868/S58861868.fa.fai",
|
159
|
+
"test/data/S58861868/S58861868.vcf",
|
160
|
+
"test/data/S58861868/header.txt",
|
161
|
+
"test/data/S58861868/merged.bam",
|
162
|
+
"test/data/S58861868/merged_reheader.bam",
|
163
|
+
"test/data/S58861868/merged_reheader.bam.bai",
|
164
|
+
"test/data/Test3Aspecific.csv",
|
165
|
+
"test/data/Test3Aspecific_contigs.fa",
|
166
|
+
"test/data/bfr_out_test.csv",
|
167
|
+
"test/data/chr1A_C1145499T/chr1A_C1145499T.csv",
|
168
|
+
"test/data/chr1A_G540414846C/chr1A_G540414846C.csv",
|
169
|
+
"test/data/chr1A_G540414846C/chr1A_G540414846C.fa",
|
170
|
+
"test/data/chr1A_T517634750C/chr1A_T517634750C.csv",
|
171
|
+
"test/data/chr2D_C112180134A/chr2D_C112180134A.csv",
|
172
|
+
"test/data/chr4D_C14473543T/chr4D_C14473543T.csv",
|
173
|
+
"test/data/chr4D_C14473543T/chr4D_C14473543T.fa",
|
174
|
+
"test/data/headerMergeed.txt",
|
175
|
+
"test/data/headerS2238015",
|
176
|
+
"test/data/mergedLibs.bam",
|
177
|
+
"test/data/mergedLibsReheader.bam",
|
178
|
+
"test/data/mergedLibsSorted.bam",
|
179
|
+
"test/data/mergedLibsSorted.bam.bai",
|
180
|
+
"test/data/patological_cases5D.csv",
|
181
|
+
"test/data/primer_3_input_header_test",
|
182
|
+
"test/data/short_primer_design_test.csv",
|
183
|
+
"test/data/some_tests/some_tests.csv",
|
184
|
+
"test/data/test_from_mutant.csv",
|
185
|
+
"test/data/test_iselect.csv",
|
186
|
+
"test/data/test_iselect_reference.fa",
|
187
|
+
"test/data/test_iselect_reference.fa.fai",
|
188
|
+
"test/data/test_primer3_error.csv",
|
189
|
+
"test/data/test_primer3_error_contigs.fa",
|
190
|
+
"test/test_bfr.rb",
|
191
|
+
"test/test_blast.rb",
|
192
|
+
"test/test_exon_container.rb",
|
193
|
+
"test/test_exonearate.rb",
|
194
|
+
"test/test_integration.rb",
|
195
|
+
"test/test_snp_parsing.rb",
|
196
|
+
"test/test_wrong_selection.sh"
|
197
|
+
]
|
198
|
+
s.homepage = "https://github.com/cb2e6f/bio-polymarker".freeze
|
199
|
+
s.licenses = ["MIT".freeze]
|
200
|
+
s.rubygems_version = "3.1.4".freeze
|
201
|
+
s.summary = "Tool to work with polyploids, NGS and molecular biology".freeze
|
202
|
+
|
203
|
+
if s.respond_to? :specification_version then
|
204
|
+
s.specification_version = 4
|
205
|
+
end
|
206
|
+
|
207
|
+
if s.respond_to? :add_runtime_dependency then
|
208
|
+
s.add_runtime_dependency(%q<bio>.freeze, [">= 1.5.1"])
|
209
|
+
s.add_runtime_dependency(%q<bio-samtools-wrapper>.freeze, [">= 2.7.0"])
|
210
|
+
s.add_runtime_dependency(%q<descriptive_statistics>.freeze, [">= 0"])
|
211
|
+
s.add_runtime_dependency(%q<systemu>.freeze, [">= 2.5.2"])
|
212
|
+
s.add_development_dependency(%q<shoulda>.freeze, [">= 2.10"])
|
213
|
+
s.add_development_dependency(%q<test-unit>.freeze, [">= 0"])
|
214
|
+
s.add_development_dependency(%q<juwelier>.freeze, [">= 0"])
|
215
|
+
s.add_development_dependency(%q<sorted_set>.freeze, [">= 0"])
|
216
|
+
else
|
217
|
+
s.add_dependency(%q<bio>.freeze, [">= 1.5.1"])
|
218
|
+
s.add_dependency(%q<bio-samtools-wrapper>.freeze, [">= 2.7.0"])
|
219
|
+
s.add_dependency(%q<descriptive_statistics>.freeze, [">= 0"])
|
220
|
+
s.add_dependency(%q<systemu>.freeze, [">= 2.5.2"])
|
221
|
+
s.add_dependency(%q<shoulda>.freeze, [">= 2.10"])
|
222
|
+
s.add_dependency(%q<test-unit>.freeze, [">= 0"])
|
223
|
+
s.add_dependency(%q<juwelier>.freeze, [">= 0"])
|
224
|
+
s.add_development_dependency(%q<sorted_set>.freeze, [">= 0"])
|
225
|
+
end
|
226
|
+
end
|
227
|
+
|
data/conf/defaults.rb
ADDED
@@ -0,0 +1 @@
|
|
1
|
+
path_to_chromosomes="/Users/ramirezr/Documents/PHD/201305_Databases/iwgcs"
|
@@ -0,0 +1,128 @@
|
|
1
|
+
0
|
2
|
+
0
|
3
|
+
0
|
4
|
+
0
|
5
|
+
0
|
6
|
+
0
|
7
|
+
0
|
8
|
+
0
|
9
|
+
0
|
10
|
+
0
|
11
|
+
0
|
12
|
+
0
|
13
|
+
-500
|
14
|
+
4700
|
15
|
+
-4100
|
16
|
+
-3800
|
17
|
+
0
|
18
|
+
0
|
19
|
+
0
|
20
|
+
0
|
21
|
+
0
|
22
|
+
0
|
23
|
+
0
|
24
|
+
0
|
25
|
+
-5900
|
26
|
+
-2600
|
27
|
+
-3200
|
28
|
+
-5200
|
29
|
+
0
|
30
|
+
0
|
31
|
+
0
|
32
|
+
0
|
33
|
+
0
|
34
|
+
0
|
35
|
+
0
|
36
|
+
0
|
37
|
+
-2100
|
38
|
+
-200
|
39
|
+
-3900
|
40
|
+
-4400
|
41
|
+
0
|
42
|
+
0
|
43
|
+
0
|
44
|
+
0
|
45
|
+
0
|
46
|
+
0
|
47
|
+
0
|
48
|
+
0
|
49
|
+
-700
|
50
|
+
4400
|
51
|
+
-1600
|
52
|
+
2900
|
53
|
+
0
|
54
|
+
0
|
55
|
+
0
|
56
|
+
0
|
57
|
+
0
|
58
|
+
0
|
59
|
+
0
|
60
|
+
0
|
61
|
+
0
|
62
|
+
0
|
63
|
+
0
|
64
|
+
0
|
65
|
+
0
|
66
|
+
0
|
67
|
+
0
|
68
|
+
0
|
69
|
+
0
|
70
|
+
0
|
71
|
+
0
|
72
|
+
0
|
73
|
+
0
|
74
|
+
0
|
75
|
+
0
|
76
|
+
0
|
77
|
+
-2900
|
78
|
+
-4100
|
79
|
+
-4200
|
80
|
+
-200
|
81
|
+
0
|
82
|
+
0
|
83
|
+
0
|
84
|
+
0
|
85
|
+
0
|
86
|
+
0
|
87
|
+
0
|
88
|
+
0
|
89
|
+
-3700
|
90
|
+
-4000
|
91
|
+
-3900
|
92
|
+
-4900
|
93
|
+
0
|
94
|
+
0
|
95
|
+
0
|
96
|
+
0
|
97
|
+
0
|
98
|
+
0
|
99
|
+
0
|
100
|
+
0
|
101
|
+
-6300
|
102
|
+
-4400
|
103
|
+
-5100
|
104
|
+
-4000
|
105
|
+
0
|
106
|
+
0
|
107
|
+
0
|
108
|
+
0
|
109
|
+
0
|
110
|
+
0
|
111
|
+
0
|
112
|
+
0
|
113
|
+
200
|
114
|
+
600
|
115
|
+
-1100
|
116
|
+
-6900
|
117
|
+
0
|
118
|
+
0
|
119
|
+
0
|
120
|
+
0
|
121
|
+
0
|
122
|
+
0
|
123
|
+
0
|
124
|
+
0
|
125
|
+
0
|
126
|
+
0
|
127
|
+
0
|
128
|
+
0
|
@@ -0,0 +1,128 @@
|
|
1
|
+
inf
|
2
|
+
inf
|
3
|
+
inf
|
4
|
+
inf
|
5
|
+
inf
|
6
|
+
inf
|
7
|
+
inf
|
8
|
+
inf
|
9
|
+
inf
|
10
|
+
inf
|
11
|
+
inf
|
12
|
+
inf
|
13
|
+
-1.1
|
14
|
+
14.2
|
15
|
+
-13.1
|
16
|
+
-12.6
|
17
|
+
inf
|
18
|
+
inf
|
19
|
+
inf
|
20
|
+
inf
|
21
|
+
inf
|
22
|
+
inf
|
23
|
+
inf
|
24
|
+
inf
|
25
|
+
-16.5
|
26
|
+
-7.4
|
27
|
+
-10.4
|
28
|
+
-15
|
29
|
+
inf
|
30
|
+
inf
|
31
|
+
inf
|
32
|
+
inf
|
33
|
+
inf
|
34
|
+
inf
|
35
|
+
inf
|
36
|
+
inf
|
37
|
+
-3.9
|
38
|
+
-0.1
|
39
|
+
-11.2
|
40
|
+
-13.1
|
41
|
+
inf
|
42
|
+
inf
|
43
|
+
inf
|
44
|
+
inf
|
45
|
+
inf
|
46
|
+
inf
|
47
|
+
inf
|
48
|
+
inf
|
49
|
+
-0.8
|
50
|
+
14.9
|
51
|
+
-3.6
|
52
|
+
10.4
|
53
|
+
inf
|
54
|
+
inf
|
55
|
+
inf
|
56
|
+
inf
|
57
|
+
inf
|
58
|
+
inf
|
59
|
+
inf
|
60
|
+
inf
|
61
|
+
inf
|
62
|
+
inf
|
63
|
+
inf
|
64
|
+
inf
|
65
|
+
inf
|
66
|
+
inf
|
67
|
+
inf
|
68
|
+
inf
|
69
|
+
inf
|
70
|
+
inf
|
71
|
+
inf
|
72
|
+
inf
|
73
|
+
inf
|
74
|
+
inf
|
75
|
+
inf
|
76
|
+
inf
|
77
|
+
-7.6
|
78
|
+
-13
|
79
|
+
-15
|
80
|
+
-0.5
|
81
|
+
inf
|
82
|
+
inf
|
83
|
+
inf
|
84
|
+
inf
|
85
|
+
inf
|
86
|
+
inf
|
87
|
+
inf
|
88
|
+
inf
|
89
|
+
-10
|
90
|
+
-11.9
|
91
|
+
-10.9
|
92
|
+
-13.8
|
93
|
+
inf
|
94
|
+
inf
|
95
|
+
inf
|
96
|
+
inf
|
97
|
+
inf
|
98
|
+
inf
|
99
|
+
inf
|
100
|
+
inf
|
101
|
+
-17.1
|
102
|
+
-12.6
|
103
|
+
-14
|
104
|
+
-10.9
|
105
|
+
inf
|
106
|
+
inf
|
107
|
+
inf
|
108
|
+
inf
|
109
|
+
inf
|
110
|
+
inf
|
111
|
+
inf
|
112
|
+
inf
|
113
|
+
2.3
|
114
|
+
3.3
|
115
|
+
-1.6
|
116
|
+
-20
|
117
|
+
inf
|
118
|
+
inf
|
119
|
+
inf
|
120
|
+
inf
|
121
|
+
inf
|
122
|
+
inf
|
123
|
+
inf
|
124
|
+
inf
|
125
|
+
inf
|
126
|
+
inf
|
127
|
+
inf
|
128
|
+
inf
|
@@ -0,0 +1,131 @@
|
|
1
|
+
/* Enthalpy of dangling end */
|
2
|
+
/* 3' dangling */
|
3
|
+
AA_A 0
|
4
|
+
AC_A 0
|
5
|
+
AG_A 0
|
6
|
+
AT_A 0
|
7
|
+
AA_C 0
|
8
|
+
AC_C 0
|
9
|
+
AG_C 0
|
10
|
+
AT_C 0
|
11
|
+
AA_G 0
|
12
|
+
AC_G 0
|
13
|
+
AG_G 0
|
14
|
+
AT_G 0
|
15
|
+
AA_T 5
|
16
|
+
AC_T -47
|
17
|
+
AG_T 41
|
18
|
+
AT_T 38
|
19
|
+
CA_A 0
|
20
|
+
CC_A 0
|
21
|
+
CG_A 0
|
22
|
+
CT_A 0
|
23
|
+
CA_C 0
|
24
|
+
CC_C 0
|
25
|
+
CG_C 0
|
26
|
+
CT_C 0
|
27
|
+
CA_G 59
|
28
|
+
CC_G 26
|
29
|
+
CG_G 32
|
30
|
+
CT_G 52
|
31
|
+
CA_T 0
|
32
|
+
CC_T 0
|
33
|
+
CG_T 0
|
34
|
+
CT_T 0
|
35
|
+
GA_A 0
|
36
|
+
GC_A 0
|
37
|
+
GG_A 0
|
38
|
+
GT_A 0
|
39
|
+
GA_C 21
|
40
|
+
GC_C 2
|
41
|
+
GG_C 39
|
42
|
+
GT_C 44
|
43
|
+
GA_G 0
|
44
|
+
GC_G 0
|
45
|
+
GG_G 0
|
46
|
+
GT_G 0
|
47
|
+
GA_T 0
|
48
|
+
GC_T 0
|
49
|
+
GG_T 0
|
50
|
+
GT_T 0
|
51
|
+
TA_A 7
|
52
|
+
TC_A -44
|
53
|
+
TG_A 16
|
54
|
+
TT_A -29
|
55
|
+
TA_C 0
|
56
|
+
TC_C 0
|
57
|
+
TG_C 0
|
58
|
+
TT_C 0
|
59
|
+
TA_G 0
|
60
|
+
TC_G 0
|
61
|
+
TG_G 0
|
62
|
+
TT_G 0
|
63
|
+
TA_T 0
|
64
|
+
TC_T 0
|
65
|
+
TG_T 0
|
66
|
+
TT_T 0
|
67
|
+
/* 5' dangling */
|
68
|
+
A_AA 0
|
69
|
+
A_AC 0
|
70
|
+
A_AG 0
|
71
|
+
A_AT 0
|
72
|
+
A_CA 0
|
73
|
+
A_CC 0
|
74
|
+
A_CG 0
|
75
|
+
A_CT 0
|
76
|
+
A_GA 0
|
77
|
+
A_GC 0
|
78
|
+
A_GG 0
|
79
|
+
A_GT 0
|
80
|
+
A_TA 29
|
81
|
+
A_TC 41
|
82
|
+
A_TG 42
|
83
|
+
A_TT 2
|
84
|
+
C_AA 0
|
85
|
+
C_AC 0
|
86
|
+
C_AG 0
|
87
|
+
C_AT 0
|
88
|
+
C_CA 0
|
89
|
+
C_CC 0
|
90
|
+
C_CG 0
|
91
|
+
C_CT 0
|
92
|
+
C_GA 37
|
93
|
+
C_GC 40
|
94
|
+
C_GG 39
|
95
|
+
C_GT 49
|
96
|
+
C_TA 0
|
97
|
+
C_TC 0
|
98
|
+
C_TG 0
|
99
|
+
C_TT 0
|
100
|
+
G_AA 0
|
101
|
+
G_AC 0
|
102
|
+
G_AG 0
|
103
|
+
G_AT 0
|
104
|
+
G_CA 63
|
105
|
+
G_CC 44
|
106
|
+
G_CG 51
|
107
|
+
G_CT 40
|
108
|
+
G_GA 0
|
109
|
+
G_GC 0
|
110
|
+
G_GG 0
|
111
|
+
G_GT 0
|
112
|
+
G_TA 0
|
113
|
+
G_TC 0
|
114
|
+
G_TG 0
|
115
|
+
G_TT 0
|
116
|
+
T_AA -2
|
117
|
+
T_AC -6
|
118
|
+
T_AG 11
|
119
|
+
T_AT 69
|
120
|
+
T_CA 0
|
121
|
+
T_CC 0
|
122
|
+
T_CG 0
|
123
|
+
T_CT 0
|
124
|
+
T_GA 0
|
125
|
+
T_GC 0
|
126
|
+
T_GG 0
|
127
|
+
T_GT 0
|
128
|
+
T_TA 0
|
129
|
+
T_TC 0
|
130
|
+
T_TG 0
|
131
|
+
T_TT 0
|