viral_seq 1.6.3 → 1.6.4

Sign up to get free protection for your applications and to get access to all the features.
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA256:
3
- metadata.gz: ed86467ec77cdce9b1175604528937233fb2d3e91081a294b8a9aed2e5ca2b68
4
- data.tar.gz: 3c9eef94e3252e5f486ee82b69b45e584810281d50c7d7ceaad0d51ec87ba890
3
+ metadata.gz: 02d26d720fef0501d70b012d9919f932b23a21b1caabbf508a56fffa162c311b
4
+ data.tar.gz: '0681add2b2fa2ca7dedffeaaf43bd8b0e2b6200dd38633e2eeda58946ced8238'
5
5
  SHA512:
6
- metadata.gz: cf23bedc3bc4be082eeb1e1a512fa5ae4777ca2d7b7d425348e2f95cc934fe6a1aed5875998fd5236f1485ed86797d3b2fed1d416a4cca6442e4dfa35967dd3b
7
- data.tar.gz: 4958b976b7d97d1c7f052b0341bdbf9eee66db86cabf6aada972afb081a4766d20af3cc0c13e0c14a01b4a1e831c62c49e03ffd6131a21f8215b66fc19cee61b
6
+ metadata.gz: 301c188d736c9812006d30db8995fa7df683cc63443c1370de3d487dae77b88cfc60c8b674abc93b35f7457ced536a6e374433e5fbe0f423e4a7993ea4240ebc
7
+ data.tar.gz: 1118ab7b586da98bb2c3533f81c35a02f0efb1978c0b91e15b56218b05342ad83e73f96bd2df53f75e2e6cdd16c591582ebe864562a02d3dd78997678b706233
data/README.md CHANGED
@@ -179,6 +179,12 @@ qc_seqhash.sdrm_hiv_pr(cut_off)
179
179
 
180
180
  ## Updates
181
181
 
182
+ ### Version-1.6.4-07182022
183
+
184
+ 1. Included region "P17" in the default `tcs -d` pipeline setting. `tcs` pipeline updated to version 2.5.1.
185
+ 2. Loosen the locator params for the "V1V3" end region for rare alignment issues. Now the default "V1V3" region end with position 7205 to 7210 instead of 7208.
186
+ 3. `tcs_sdrm` now analyse "P17" region for pairwise diversity.
187
+
182
188
  ### Version-1.6.3-02052022
183
189
 
184
190
  1. Updated on `ViralSeq::Muscle` module along with the update of `muscle` from version 3.8.1 to 5.1.
data/bin/tcs_sdrm CHANGED
@@ -172,6 +172,25 @@ libs.each do |lib|
172
172
  linkage_list += sdrm[1]
173
173
  aa_report_list += sdrm[2]
174
174
 
175
+ elsif seq_basename =~/P17/i
176
+ a3g_check = seqs.a3g
177
+ a3g_seqs = a3g_check[:a3g_seq]
178
+ a3g_filtered_seqs = a3g_check[:filtered_seq]
179
+ stop_codon_check = a3g_filtered_seqs.stop_codon(2)
180
+ stop_codon_seqs = stop_codon_check[:with_stop_codon]
181
+ filtered_seqs = stop_codon_check[:without_stop_codon]
182
+ poisson_minority_cutoff = filtered_seqs.pm
183
+ fdr_hash = filtered_seqs.fdr
184
+ summary_hash[:P17] = [
185
+ seqs.size.to_s,
186
+ a3g_seqs.size.to_s,
187
+ stop_codon_seqs.size.to_s,
188
+ filtered_seqs.size.to_s,
189
+ poisson_minority_cutoff.to_s
190
+ ].join(',')
191
+ next if filtered_seqs.size < 3
192
+ filtered_seqs.write_nt_fa(File.join(filtered_seq_dir,seq_basename))
193
+
175
194
  elsif seq_basename =~/RT/i
176
195
  rt_seq1 = {}
177
196
  rt_seq2 = {}
@@ -231,7 +250,6 @@ libs.each do |lib|
231
250
  next if filtered_sh.size < 3
232
251
  aligned_sh = filtered_sh.random_select(1000).align(:Super5)
233
252
  aligned_sh.write_nt_fa(File.join(aln_seq_dir, File.basename(seq_file)))
234
- puts 'aligned sequence written.'
235
253
  end
236
254
 
237
255
  r_script.gsub!(/PATH_TO_FASTA/,aln_seq_dir)
@@ -250,7 +268,7 @@ libs.each do |lib|
250
268
  tag = data[0].split("_")[-1].gsub(/\W/,"").to_sym
251
269
  summary_hash[tag] += "," + data[1].to_f.round(4).to_s + "," + data[2].to_f.round(4).to_s
252
270
  end
253
- [:PR, :RT, :IN, :V1V3].each do |regions|
271
+ [:PR, :RT, :IN, :V1V3, :P17].each do |regions|
254
272
  next unless summary_hash[regions]
255
273
  seq_summary_out.puts regions.to_s + "," + summary_hash[regions]
256
274
  end
@@ -271,10 +289,13 @@ libs.each do |lib|
271
289
  tcs_RT = 0
272
290
  tcs_IN = 0
273
291
  tcs_V1V3 = 0
292
+ tcs_P17 = 0
274
293
  pi_RT = 0.0
275
294
  pi_V1V3 = 0.0
295
+ pi_P17 = 0.0
276
296
  dist20_RT = 0.0
277
297
  dist20_V1V3 = 0.0
298
+ dist20_P17 = 0.0
278
299
  summary_lines.each do |line|
279
300
  data = line.chomp.split(",")
280
301
  if data[0] == "PR"
@@ -289,6 +310,10 @@ libs.each do |lib|
289
310
  tcs_V1V3 = data[1].to_i
290
311
  pi_V1V3 = data[6].to_f
291
312
  dist20_V1V3 = data[7].to_f
313
+ elsif data[0] == "P17"
314
+ tcs_P17 = data[4].to_i
315
+ pi_P17 = data[6].to_f
316
+ dist20_P17 = data[7].to_f
292
317
  end
293
318
  end
294
319
 
@@ -324,9 +349,13 @@ libs.each do |lib|
324
349
  tcs_RT: tcs_RT,
325
350
  tcs_IN: tcs_IN,
326
351
  tcs_V1V3: tcs_V1V3,
352
+ tcs_P17: tcs_P17,
327
353
  pi_RT: pi_RT,
354
+ pi_V1V3: pi_V1V3,
355
+ pi_P17: pi_P17,
328
356
  dist20_RT: dist20_RT,
329
357
  dist20_V1V3: dist20_V1V3,
358
+ dist20_P17: dist20_P17,
330
359
  recency: recency,
331
360
  sdrm_PR: sdrm_PR,
332
361
  sdrm_RT: sdrm_RT,
data/docs/dr.json CHANGED
@@ -62,6 +62,21 @@
62
62
  "ref_end": 7208,
63
63
  "indel": true,
64
64
  "trim": false
65
+ },
66
+ {
67
+ "region": "P17",
68
+ "cdna": "GTGACTGGAGTTCAGACGTGTGCTCTTCCGATCTNNNNNNNNNNNCAGTCAACAAGGTTTCTGTCATCCAATTTTTTAC",
69
+ "forward": "GCCTCCCTCGCGCCATCAGAGATGTGTATAAGAGACAGNNNNGTCAGCCAAAATTACCCTATAGTGC",
70
+ "majority": 0.5,
71
+ "end_join": true,
72
+ "end_join_option": 1,
73
+ "overlap": 0,
74
+ "TCS_QC": true,
75
+ "ref_genome": "HXB2",
76
+ "ref_start": 1196,
77
+ "ref_end": 1725,
78
+ "indel": true,
79
+ "trim": false
65
80
  }
66
81
  ]
67
82
  }
@@ -5,7 +5,7 @@ module ViralSeq
5
5
  # functions to identify SDRMs from a ViralSeq::SeqHash object at HIV PR region.
6
6
  # works for MPID-DR protocol (dx.doi.org/10.17504/protocols.io.useewbe)
7
7
  # PR codon 1-99
8
- # RT codon 34-122 (HXB2 2650-2914) and 152-236(3001-3257)
8
+ # RT codon 34-122 (HXB2 2649-2914) and 152-236(3001-3257)
9
9
  # IN codon 53-174 (HXB2 4384-4751)
10
10
  # @param cutoff [Integer] cut-off for minimal abundance of a mutation to be called as valid mutation,
11
11
  # can be obtained using ViralSeq::SeqHash#poisson_minority_cutoff function
@@ -61,11 +61,26 @@ module ViralSeq
61
61
  :TCS_QC=>true,
62
62
  :ref_genome=>"HXB2",
63
63
  :ref_start=>6585,
64
- :ref_end=>7208,
64
+ :ref_end=>7205..7210,
65
65
  :indel=>true,
66
- :trim=>false}
66
+ :trim=>false},
67
+ {:region=>"P17",
68
+ :cdna=>
69
+ "GTGACTGGAGTTCAGACGTGTGCTCTTCCGATCTNNNNNNNNNNNCAGTCAACAAGGTTTCTGTCATCCAATTTTTTAC",
70
+ :forward=>
71
+ "GCCTCCCTCGCGCCATCAGAGATGTGTATAAGAGACAGNNNNGTCAGCCAAAATTACCCTATAGTGC",
72
+ :majority=>0,
73
+ :end_join=>true,
74
+ :end_join_option=>1,
75
+ :overlap=>0,
76
+ :TCS_QC=>true,
77
+ :ref_genome=>"HXB2",
78
+ :ref_start=>1196,
79
+ :ref_end=>1725,
80
+ :indel=>true,
81
+ :trim=>false}
67
82
  ]
68
- }
83
+ }
69
84
  end
70
85
 
71
86
  end
@@ -2,6 +2,6 @@
2
2
  # version info and histroy
3
3
 
4
4
  module ViralSeq
5
- VERSION = "1.6.3"
6
- TCS_VERSION = "2.5.0"
5
+ VERSION = "1.6.4"
6
+ TCS_VERSION = "2.5.1"
7
7
  end
Binary file
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: viral_seq
3
3
  version: !ruby/object:Gem::Version
4
- version: 1.6.3
4
+ version: 1.6.4
5
5
  platform: ruby
6
6
  authors:
7
7
  - Shuntai Zhou
@@ -9,7 +9,7 @@ authors:
9
9
  autorequire:
10
10
  bindir: bin
11
11
  cert_chain: []
12
- date: 2022-02-05 00:00:00.000000000 Z
12
+ date: 2022-07-19 00:00:00.000000000 Z
13
13
  dependencies:
14
14
  - !ruby/object:Gem::Dependency
15
15
  name: bundler
@@ -193,6 +193,7 @@ files:
193
193
  - lib/viral_seq/tcs_dr.rb
194
194
  - lib/viral_seq/tcs_json.rb
195
195
  - lib/viral_seq/version.rb
196
+ - rc_swans.svc@longleaf.unc.edu
196
197
  - viral_seq.gemspec
197
198
  homepage: https://github.com/ViralSeq/viral_seq
198
199
  licenses: