RubyGems - viral_seq - Versions diffs - 1.0.4 → 1.0.5 - Mend

viral_seq 1.0.4 → 1.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7) hide show

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA256:
-  metadata.gz: 7f54bac7de0e2ffe1b4eac99b6f325b039a3be19d832926ebf1b280154cd0ad2
-  data.tar.gz: f5c5fe62299ec5253c4b8b395816a9158e8d60f428b757161daf209da70b0c0e
+  metadata.gz: a13ba7912ee87511c2ecf19f07256d3a129661c6d7e180d57ecd1e34978386e6
+  data.tar.gz: 61e5ed6b423f0b64c53a6bb8e8ec3801bf7e093e4d0741bd71bf9fbfa24f1b55
 SHA512:
-  metadata.gz: 5c9b7767cbd000c253c7a6f98432e6230adfb6736cf39ced62815443f82f1cee7f446ebabf7791c67675bf37e664f7f4ac9570350894a871ac0310c36844213e
-  data.tar.gz: '049d8b2fc82f09ab618d777a2dc6d20922dd6e4c9af8f6c47ca734b8caa46c4fcee10617247404b6ac85c3e31e3d47353c7162b7c6f1df17ec6ce9efb94829a5'
+  metadata.gz: f18d03220190bf1479ed29bd4d4b83777ffe5216951d38a91dd2afdc6c07b516883a8694291106b6fee2693a246b8a3c6a824786527cd03730f28f6777fa3231
+  data.tar.gz: 7fe146b081a7b633de963ed632bdcb548c71d1f401e227109d8745d23ad770d2099a2aa50bc4553a9450b260b7206892ed2a898d9154764aebe4094f38faeb44

data/Gemfile.lock CHANGED

@@ -1,7 +1,7 @@
 PATH
   remote: .
   specs:
-    viral_seq (1.0.2)
+    viral_seq (1.0.5)
       muscle_bio (~> 0.4)
 GEM

data/README.md CHANGED

@@ -17,36 +17,46 @@ Load all ViralSeq classes by requiring 'viral_seq.rb'
 ## Some Examples
-Load nucleotide sequences from a FASTA format sequence file
+### Load nucleotide sequences from a FASTA format sequence file
     my_seqhash = ViralSeq::SeqHash.fa('my_seq_file.fasta')
-Make an alignment (using MUSCLE)
+### Make an alignment (using MUSCLE)
     aligned_seqhash = my_seqhash.align
-Filter nucleotide sequences with the reference coordinates (HIV Protease)
+### Filter nucleotide sequences with the reference coordinates (HIV Protease)
     qc_seqhash = aligned_seqhash.hiv_seq_qc(2253, 2549, false, :HXB2)
-Further filter out sequences with Apobec3g/f hypermutations
+### Further filter out sequences with Apobec3g/f hypermutations
     qc_seqhash = qc_seqhash.a3g
-Calculate nucleotide diversity π
+### Calculate nucleotide diversity π
     qc_seqhash.pi
-Calculate cut-off for minority variants based on Poisson model
+### Calculate cut-off for minority variants based on Poisson model
     cut_off = qc_seqhash.pm
-Examine for drug resistance mutations for HIV PR region
+### Examine for drug resistance mutations for HIV PR region
     qc_seqhash.sdrm_hiv_pr(cut_off)
+### Use executable `locator` to get the coordinates of the sequences on HIV/SIV reference genome from a FASTA file through a terminal
+    $ locator -i sequence.fasta -o sequence.fasta.csv
 ## Updates
+Version 1.0.5-07112019:
+    1. Update ViralSeq::SeqHash#sequence_locator.
+       Program will try to determine the direction (`+` or `-`) of the query sequence.
+    2. Update executable `locator` to have a column of `direction` in output .csv file.
 Version 1.0.4-07102019:
     1. Use home directory (Dir.home) instead of the directory of the script file for temp MUSCLE file.

data/bin/locator CHANGED

@@ -4,29 +4,6 @@ require 'viral_seq'
 require 'csv'
 require 'optparse'
-module ViralSeq
-  class SeqHash
-    def sequence_locator(ref_option = :HXB2)
-      out_array = []
-      dna_seq = self.dna_hash
-      title = self.title
-      uniq_dna = dna_seq.uniq_hash
-      uniq_dna.each do |seq,names|
-        s = ViralSeq::Sequence.new('',seq)
-        loc = s.locator(ref_option)
-        names.each do |name|
-          out_array << ([title, name, ref_option.to_s] + loc)
-        end
-      end
-      return out_array
-    end # end of locator
-    alias_method :loc, :sequence_locator
-  end
-end
 def myparser
   options = {}
   OptionParser.new do |opts|
@@ -36,7 +13,7 @@ def myparser
       options[:infile] = i
     end
-    opts.on('-o', '--outfile CSV_FILE', 'output .csv file for locator info') do |o|
+    opts.on('-o', '--outfile CSV_FILE', "output .csv file for locator info, default as \#\{infile\}.csv") do |o|
       options[:outfile] = o
     end
@@ -48,11 +25,17 @@ def myparser
       puts opts
       exit
     end
+    opts.on("-v", "--version", "Version number of RubyGem::ViralSeq") do
+      puts opts
+      exit
+    end
   end.parse!
   return options
 end
-puts "\nSequence Locator (RubyGem::ViralSeq) #{ViralSeq::VERSION} by Shuntai Zhou"
+puts "\nSequence Locator (RubyGem::ViralSeq Version #{ViralSeq::VERSION}) by Shuntai Zhou"
 puts "See details at https://github.com/ViralSeq/viral_seq\n"
 puts "Resembling Sequence Locator from LANL (https://www.hiv.lanl.gov/content/sequence/LOCATE/locate.html)\n\n"
@@ -70,7 +53,7 @@ begin
   if options[:outfile]
     csv_file = options[:outfile]
   else
-    raise StandardError.new("Please provide path to output csv file")
+    csv_file = seq_file + ".csv"
   end
   unless File.exist?(seq_file)
@@ -86,7 +69,7 @@ begin
   end
   locs = seqs.loc(opt)
-  head = ["title", "sequence", "ref", "start", "end", "similarity", "indel", "aligned_input", "aligned_ref"]
+  head = ["title", "sequence", "ref", "direction", "start", "end", "similarity", "indel", "aligned_input", "aligned_ref"]
   locs.unshift(head)
   data = CSV.generate do |csv|
     locs.each {|loc| csv << loc}

data/lib/viral_seq/seq_hash.rb CHANGED

@@ -729,6 +729,8 @@ module ViralSeq
     #
     #     containing_indel? (Boolean)
     #
+    #     direction ('+' or '-')
+    #
     #     aligned_input_sequence (String)
     #
     #     aligned_reference_sequence (String)
@@ -742,9 +744,13 @@ module ViralSeq
       uniq_dna.each do |seq,names|
         s = ViralSeq::Sequence.new('',seq)
-        loc = s.locator(ref_option)
+        loc1 = s.locator(ref_option)
+        s.rc!
+        loc2 = s.locator(ref_option)
+        loc1[2] >= loc2[2] ? (direction = :+; loc = loc1): (direction = :-; loc = loc2)
         names.each do |name|
-          out_array << ([title, name, ref_option.to_s] + loc)
+          out_array << ([title, name, ref_option.to_s, direction.to_s] + loc)
         end
       end
       return out_array

data/lib/viral_seq/version.rb CHANGED

@@ -2,5 +2,5 @@
 # version info and history
 module ViralSeq
-  VERSION = "1.0.4"
+  VERSION = "1.0.5"
 end

metadata CHANGED

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: viral_seq
 version: !ruby/object:Gem::Version
-  version: 1.0.4
+  version: 1.0.5
 platform: ruby
 authors:
 - Shuntai Zhou
@@ -9,7 +9,7 @@ authors:
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2019-07-10 00:00:00.000000000 Z
+date: 2019-07-11 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: bundler