RubyGems - smarter_csv - Versions diffs - 1.1.3 → 1.1.4 - Mend

smarter_csv 1.1.3 → 1.1.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10)

checksums.yaml +4 -4
data/README.md +4 -0
data/lib/extensions/hash.rb +1 -3
data/lib/smarter_csv/smarter_csv.rb +2 -3
data/lib/smarter_csv/version.rb +1 -1
data/spec/fixtures/valid_unicode.csv +5 -0
data/spec/smarter_csv/extenstions_spec.rb +17 -0
data/spec/smarter_csv/quoted_spec.rb +11 -1
data/spec/smarter_csv/valid_unicode_spec.rb +94 -0
metadata +8 -2

checksums.yaml CHANGED

@@ -1,7 +1,7 @@
 ---
 SHA1:
-  metadata.gz: cbd937d958dbb95653e9368a6b10075162f122e7
-  data.tar.gz: eaf5a03e4a209900189f035d2b5b876cc1c08e51
+  metadata.gz: cb1216b85e197c77005a95ab4c3bc46896b7719f
+  data.tar.gz: 7539e858a39825e5fac1dc27e51f53f1e3f20c2c
 SHA512:
-  metadata.gz: 7abffcc904a90122851159a5d241ad0f5944c0b3c67a288c5f91f93c86667f3ce0293cbb14dbe5d8c507a8ed955d8583d39099431ec929ba0d822b163a3e0ff1
-  data.tar.gz: a96735123fb0c8f5dae9eeea4b7606feba984d6daa6f347125a2cd6a810cb5a3eecf3af733277f4ee8143077b08fffbca4ce9a83c0eecccc7972e3a0ce43ef77
+  metadata.gz: 2669d2f524e138bdcd8e9ded254a8dee1996589d56eabe4ac2f4480be7ebc88c1360600d26e109d3eba7e1e91075aa52629663ef4fd32489a7fd7e809f8b587c
+  data.tar.gz: 39cf42229ab96f15e860472ea138e04ba18c6c717e0860eaa87e9fd2e0c8ca516a8070ee6333f96a6cbc8a40662b509fef492eaefc72b95ecb1ccf5d8c1b1faa

data/README.md CHANGED

@@ -293,6 +293,9 @@ Planned in the next releases:
 ## Changes
+#### 1.1.4 (2017-01-16)
+ * fixing UTF-8 related bug which was introduced in 1.1.2 (thanks to Tirdad C.)
 #### 1.1.3 (2016-12-30)
  * added warning when options indicate UTF-8 processing, but input filehandle is not opened with r:UTF-8 option
@@ -445,6 +448,7 @@ And a special thanks to those who contributed pull requests:
  * [Jordan Graft](https://github.com/jordangraft)
  * [Michael](https://github.com/polycarpou)
  * [Kevin Coleman](https://github.com/KevinColemanInc)
+ * [Tirdad C.](https://github.com/tridadc)
 ## Contributing

data/lib/extensions/hash.rb CHANGED

@@ -2,8 +2,6 @@
 class Hash
   def self.zip(keys,values) # from Facets of Ruby library
-    h = {}
-    keys.size.times{ |i| h[ keys[i] ] = values[i] }
-    h
+    (keys.zip(values)).to_h
   end
 end

data/lib/smarter_csv/smarter_csv.rb CHANGED

@@ -40,7 +40,7 @@ module SmarterCSV
         # process the header line in the CSV file..
         # the first line of a CSV file contains the header .. it might be commented out, so we need to read it anyhow
         header = f.readline.sub(options[:comment_regexp],'').chomp(options[:row_sep])
-        header = header.encode!('UTF-8', 'binary', invalid: :replace, undef: :replace, replace: options[:invalid_byte_sequence]) if options[:force_utf8] || options[:file_encoding] =~ /utf-8/i
+        header = header.force_encoding('utf-8').encode('utf-8', invalid: :replace, undef: :replace, replace: options[:invalid_byte_sequence]) if options[:force_utf8] || options[:file_encoding] !~ /utf-8/i
         file_line_count += 1
         csv_line_count += 1
@@ -104,10 +104,9 @@ module SmarterCSV
       # now on to processing all the rest of the lines in the CSV file:
       while ! f.eof?    # we can't use f.readlines() here, because this would read the whole file into memory at once, and eof => true
         line = f.readline  # read one line.. this uses the input_record_separator $/ which we set previously!
-        line = line.encode!('UTF-8', 'binary', invalid: :replace, undef: :replace, replace: '') if options[:force_utf8]
         # replace invalid byte sequence in UTF-8 with question mark to avoid errors
-        line = line.encode('UTF-8', 'binary', invalid: :replace, undef: :replace, replace: options[:invalid_byte_sequence]) if options[:force_utf8] || options[:file_encoding] =~ /utf-8/i
+        line = line.force_encoding('utf-8').encode('utf-8', invalid: :replace, undef: :replace, replace: options[:invalid_byte_sequence]) if options[:force_utf8] || options[:file_encoding] !~ /utf-8/i
         file_line_count += 1
         csv_line_count += 1

data/lib/smarter_csv/version.rb CHANGED

@@ -1,3 +1,3 @@
 module SmarterCSV
-  VERSION = "1.1.3"
+  VERSION = "1.1.4"
 end

data/spec/fixtures/valid_unicode.csv ADDED

@@ -0,0 +1,5 @@
+"Artist","Track","Album","Label","Year"
+Кино,"Мама, мы все сошли с ума",Группа Крови,Moroz Records,1998
+"Кино","Мама, мы все сошли с ума","Группа Крови","Moroz Records",1998
+Rammstein,Frühling in Paris,Liebe ist für alle da,Vagrant,2009
+"Rammstein","Frühling in Paris","Liebe ist für alle da","Vagrant",2009

data/spec/smarter_csv/extenstions_spec.rb ADDED

@@ -0,0 +1,17 @@
+require 'spec_helper'
+describe "Hash.zip" do
+  it "constructs a new Hash from two Arrays" do
+    Hash.zip(["a", "b"], [1, 2]).should == { "a" => 1, "b" => 2 }
+  end
+  it "constructs an empty Hash if given no keys" do
+    Hash.zip([], []).should == {}
+    Hash.zip([], [1]).should == {}
+  end
+  it "uses nil values if there are more keys than values" do
+    Hash.zip(["a"], []).should == { "a" => nil }
+    Hash.zip(["a", "b"], [1]).should == { "a" => 1, "b" => nil }
+  end
+end

data/spec/smarter_csv/quoted_spec.rb CHANGED

@@ -3,11 +3,21 @@ require 'spec_helper'
 fixture_path = 'spec/fixtures'
 describe 'be_able_to' do
-  it 'loads_file_with_quoted_fields' do
+  it 'loads_file_with_quoted_fields' do
     options = {}
     data = SmarterCSV.process("#{fixture_path}/quoted.csv", options)
     data.flatten.size.should == 4
+    data[1][:model].should eq 'Venture "Extended Edition"'
     data[1][:description].should be_nil
+    data[2][:model].should eq 'Venture "Extended Edition, Very Large"'
     data[2][:description].should be_nil
+    data.each do |h|
+      h[:year].class.should eq Fixnum
+      h[:make].should_not be_nil
+      h[:model].should_not be_nil
+      h[:price].class.should eq Float
+    end
   end
 end

data/spec/smarter_csv/valid_unicode_spec.rb ADDED

@@ -0,0 +1,94 @@
+require 'spec_helper'
+fixture_path = 'spec/fixtures'
+describe 'be_able_to' do
+  it 'loads file with unicode strings' do
+    options = {}
+    data = SmarterCSV.process("#{fixture_path}/valid_unicode.csv", options)
+    data.flatten.size.should == 4
+    data[0][:artist].should eq 'Кино'
+    data[0][:track].should eq 'Мама, мы все сошли с ума'
+    data[0][:album].should eq 'Группа Крови'
+    data[0][:label].should eq 'Moroz Records'
+    data[0][:year].should eq 1998
+    data[0].should eq  data[1]
+    data[2][:artist].should eq 'Rammstein'
+    data[2][:track].should eq 'Frühling in Paris'
+    data[2][:album].should eq 'Liebe ist für alle da'
+    data[2][:label].should eq 'Vagrant'
+    data[2][:year].should eq 2009
+    data[2].should eq  data[3]
+  end
+  it 'loads file with unicode strings, when forcing utf8' do
+    options = {:force_utf8 => true}
+    data = SmarterCSV.process("#{fixture_path}/valid_unicode.csv", options)
+    data.flatten.size.should == 4
+    data[0][:artist].should eq 'Кино'
+    data[0][:track].should eq 'Мама, мы все сошли с ума'
+    data[0][:album].should eq 'Группа Крови'
+    data[0][:label].should eq 'Moroz Records'
+    data[0][:year].should eq 1998
+    data[0].should eq  data[1]
+    data[2][:artist].should eq 'Rammstein'
+    data[2][:track].should eq 'Frühling in Paris'
+    data[2][:album].should eq 'Liebe ist für alle da'
+    data[2][:label].should eq 'Vagrant'
+    data[2][:year].should eq 2009
+    data[2].should eq  data[3]
+  end
+  it 'loads file with unicode strings, when loading from binary input' do
+    options = {:file_encoding => 'binary'}
+    data = SmarterCSV.process("#{fixture_path}/valid_unicode.csv", options)
+    data.flatten.size.should == 4
+    data[0][:artist].should eq 'Кино'
+    data[0][:track].should eq 'Мама, мы все сошли с ума'
+    data[0][:album].should eq 'Группа Крови'
+    data[0][:label].should eq 'Moroz Records'
+    data[0][:year].should eq 1998
+    data[0].should eq  data[1]
+    data[2][:artist].should eq 'Rammstein'
+    data[2][:track].should eq 'Frühling in Paris'
+    data[2][:album].should eq 'Liebe ist für alle da'
+    data[2][:label].should eq 'Vagrant'
+    data[2][:year].should eq 2009
+    data[2].should eq  data[3]
+  end
+  it 'loads file with unicode strings, when forcing utf8 with binary input' do
+    options = {:file_encoding => 'binary', :force_utf8 => true}
+    data = SmarterCSV.process("#{fixture_path}/valid_unicode.csv", options)
+    data.flatten.size.should == 4
+    data[0][:artist].should eq 'Кино'
+    data[0][:track].should eq 'Мама, мы все сошли с ума'
+    data[0][:album].should eq 'Группа Крови'
+    data[0][:label].should eq 'Moroz Records'
+    data[0][:year].should eq 1998
+    data[0].should eq  data[1]
+    data[2][:artist].should eq 'Rammstein'
+    data[2][:track].should eq 'Frühling in Paris'
+    data[2][:album].should eq 'Liebe ist für alle da'
+    data[2][:label].should eq 'Vagrant'
+    data[2][:year].should eq 2009
+    data[2].should eq  data[3]
+  end
+end

metadata CHANGED

@@ -1,7 +1,7 @@
 --- !ruby/object:Gem::Specification
 name: smarter_csv
 version: !ruby/object:Gem::Version
-  version: 1.1.3
+  version: 1.1.4
 platform: ruby
 authors:
 - |
@@ -9,7 +9,7 @@ authors:
 autorequire:
 bindir: bin
 cert_chain: []
-date: 2016-12-30 00:00:00.000000000 Z
+date: 2017-01-17 00:00:00.000000000 Z
 dependencies:
 - !ruby/object:Gem::Dependency
   name: rspec
@@ -68,6 +68,7 @@ files:
 - spec/fixtures/quoted.csv
 - spec/fixtures/separator.csv
 - spec/fixtures/skip_lines.csv
+- spec/fixtures/valid_unicode.csv
 - spec/fixtures/with_dashes.csv
 - spec/fixtures/with_dates.csv
 - spec/smarter_csv/binary_file2_spec.rb
@@ -77,6 +78,7 @@ files:
 - spec/smarter_csv/close_file_spec.rb
 - spec/smarter_csv/column_separator_spec.rb
 - spec/smarter_csv/convert_values_to_numeric_spec.rb
+- spec/smarter_csv/extenstions_spec.rb
 - spec/smarter_csv/header_transformation_spec.rb
 - spec/smarter_csv/keep_headers_spec.rb
 - spec/smarter_csv/key_mapping_spec.rb
@@ -94,6 +96,7 @@ files:
 - spec/smarter_csv/skip_lines_spec.rb
 - spec/smarter_csv/strings_as_keys_spec.rb
 - spec/smarter_csv/strip_chars_from_headers_spec.rb
+- spec/smarter_csv/valid_unicode_spec.rb
 - spec/smarter_csv/value_converters_spec.rb
 - spec/spec.opts
 - spec/spec/spec_helper.rb
@@ -147,6 +150,7 @@ test_files:
 - spec/fixtures/quoted.csv
 - spec/fixtures/separator.csv
 - spec/fixtures/skip_lines.csv
+- spec/fixtures/valid_unicode.csv
 - spec/fixtures/with_dashes.csv
 - spec/fixtures/with_dates.csv
 - spec/smarter_csv/binary_file2_spec.rb
@@ -156,6 +160,7 @@ test_files:
 - spec/smarter_csv/close_file_spec.rb
 - spec/smarter_csv/column_separator_spec.rb
 - spec/smarter_csv/convert_values_to_numeric_spec.rb
+- spec/smarter_csv/extenstions_spec.rb
 - spec/smarter_csv/header_transformation_spec.rb
 - spec/smarter_csv/keep_headers_spec.rb
 - spec/smarter_csv/key_mapping_spec.rb
@@ -173,6 +178,7 @@ test_files:
 - spec/smarter_csv/skip_lines_spec.rb
 - spec/smarter_csv/strings_as_keys_spec.rb
 - spec/smarter_csv/strip_chars_from_headers_spec.rb
+- spec/smarter_csv/valid_unicode_spec.rb
 - spec/smarter_csv/value_converters_spec.rb
 - spec/spec.opts
 - spec/spec/spec_helper.rb