RubyGems - rubysl-iconv - Versions diffs - 1.0.1 - Mend

rubysl-iconv 1.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27)

checksums.yaml +7 -0
data/.gitignore +17 -0
data/.travis.yml +7 -0
data/Gemfile +4 -0
data/LICENSE +25 -0
data/README.md +29 -0
data/Rakefile +1 -0
data/ext/rubysl/iconv/extconf.rb +51 -0
data/ext/rubysl/iconv/iconv.c +927 -0
data/lib/iconv.rb +1 -0
data/lib/rubysl/iconv.rb +2 -0
data/lib/rubysl/iconv/version.rb +5 -0
data/rubysl-iconv.gemspec +23 -0
data/spec/charset_map_spec.rb +20 -0
data/spec/close_spec.rb +24 -0
data/spec/conv_spec.rb +32 -0
data/spec/failure/failed_spec.rb +53 -0
data/spec/failure/inspect_spec.rb +22 -0
data/spec/failure/success_spec.rb +51 -0
data/spec/failure_spec.rb +30 -0
data/spec/fixtures/classes.rb +11 -0
data/spec/iconv_spec.rb +211 -0
data/spec/new_spec.rb +8 -0
data/spec/open_spec.rb +29 -0
data/spec/shared/initialize_exceptions.rb +13 -0
data/spec/shared/new.rb +33 -0
metadata +125 -0

data/lib/iconv.rb ADDED

	@@ -0,0 +1 @@
1	+ require "rubysl/iconv"

data/lib/rubysl/iconv.rb ADDED

	@@ -0,0 +1,2 @@
1	+ require "iconv/iconv"
2	+ require "rubysl/iconv/version"

data/lib/rubysl/iconv/version.rb ADDED

@@ -0,0 +1,5 @@
+module RubySL
+  module Iconv
+    VERSION = "1.0.1"
+  end
+end

data/rubysl-iconv.gemspec ADDED

@@ -0,0 +1,23 @@
+# coding: utf-8
+require './lib/rubysl/iconv/version'
+Gem::Specification.new do |spec|
+  spec.name          = "rubysl-iconv"
+  spec.version       = RubySL::Iconv::VERSION
+  spec.authors       = ["Brian Shirai"]
+  spec.email         = ["brixen@gmail.com"]
+  spec.description   = %q{Ruby standard library iconv.}
+  spec.summary       = %q{Ruby standard library iconv.}
+  spec.homepage      = "https://github.com/rubysl/rubysl-iconv"
+  spec.license       = "BSD"
+  spec.files         = `git ls-files`.split($/)
+  spec.executables   = spec.files.grep(%r{^bin/}) { |f| File.basename(f) }
+  spec.extensions    = ["ext/rubysl/iconv/extconf.rb"]
+  spec.test_files    = spec.files.grep(%r{^(test|spec|features)/})
+  spec.require_paths = ["lib"]
+  spec.add_development_dependency "bundler", "~> 1.3"
+  spec.add_development_dependency "rake", "~> 10.0"
+  spec.add_development_dependency "mspec", "~> 1.5"
+end

data/spec/charset_map_spec.rb ADDED

@@ -0,0 +1,20 @@
+require File.expand_path('../fixtures/classes.rb', __FILE__)
+ruby_version_is ''...'2.0' do
+  describe "Iconv.charset_map" do
+    it "acts as a map" do
+      Iconv.charset_map.respond_to?(:[]).should be_true
+      Iconv.charset_map.respond_to?(:include?).should be_true
+      Iconv.charset_map.respond_to?(:to_hash).should be_true
+      Iconv.charset_map.include?("x-nonexistent-encoding").should be_false
+    end
+    #  it "maps from canonical name to system dependent name" do
+    #  end
+    it "returns nil when given an unknown encoding name" do
+      Iconv.charset_map["x-nonexistent-encoding"].should be_nil
+    end
+  end
+end

data/spec/close_spec.rb ADDED

@@ -0,0 +1,24 @@
+require File.expand_path('../fixtures/classes.rb', __FILE__)
+ruby_version_is ''...'2.0' do
+  describe "Iconv#close" do
+    it "ignores multiple calls" do
+      conv1 = Iconv.new("us-ascii", "us-ascii")
+      conv1.close.should == ""
+      conv1.close.should be_nil
+    end
+    it "does not raise an exception if called inside an .open block" do
+      Iconv.open "us-ascii", "us-ascii" do |conv2|
+        conv2.close.should == ""
+      end
+    end
+    it "returns a string containing the byte sequence to change the output buffer to its initial shift state" do
+      Iconv.open "ISO-2022-JP", "UTF-8" do |cd|
+        cd.iconv("\343\201\262")
+        cd.close.should == encode("\e(B", "iso-2022-jp")
+      end
+    end
+  end
+end

data/spec/conv_spec.rb ADDED

@@ -0,0 +1,32 @@
+require File.expand_path('../shared/initialize_exceptions', __FILE__)
+require File.expand_path('../fixtures/classes.rb', __FILE__)
+ruby_version_is ''...'2.0' do
+  describe "Iconv.conv" do
+    it_behaves_like :iconv_initialize_exceptions, :conv, "test"
+    it "acts exactly as if opening a converter and invoking #iconv once" do
+      Iconv.conv("utf-8", "iso-8859-1", "expos\xe9").should == encode("expos\xc3\xa9", "utf-8")
+      str = mock("string-like")
+      str.should_receive(:to_str).and_return("cacha\xc3\xa7a")
+      Iconv.conv("iso-8859-1", "utf-8", str).should == encode("cacha\xe7a", "iso-8859-1")
+      Iconv.conv("utf-16", "us-ascii", "a").should equal_utf16("\xfe\xff\0a")
+      # each call is completely independent; never retain context!
+      Iconv.conv("utf-16", "us-ascii", "b").should equal_utf16("\xfe\xff\0b")
+      Iconv.conv("us-ascii", "iso-8859-1", nil).should == ""
+      Iconv.conv("utf-16", "utf-8", "").should == ""
+      lambda do
+        Iconv.conv("utf-8", "utf-8", "test\xff")
+      end.should raise_error(Iconv::IllegalSequence)
+      lambda do
+        Iconv.conv("utf-8", "utf-8", "euro \xe2")
+      end.should raise_error(Iconv::InvalidCharacter)
+    end
+  end
+end

data/spec/failure/failed_spec.rb ADDED

@@ -0,0 +1,53 @@
+require File.expand_path('../../fixtures/classes.rb', __FILE__)
+ruby_version_is ''...'2.0' do
+  describe "Iconv::Failure#failed" do
+    it "returns a substring of the original string passed to Iconv that starts at the character which caused the exception" do
+      lambda {
+        begin
+          Iconv.open "utf-8", "utf-8" do |conv|
+            conv.iconv "test \xff test \xff"
+          end
+        rescue Iconv::Failure => e
+          @ex = e
+          raise e
+        end
+      }.should raise_error(Iconv::Failure)
+      @ex.failed.should == "\xff test \xff"
+      lambda {
+        begin
+          Iconv.open "utf-8", "utf-8" do |conv|
+            conv.iconv "test \xe2\x82"
+          end
+        rescue Iconv::Failure => e
+          @ex = e
+          raise e
+        end
+      }.should raise_error(Iconv::Failure)
+      @ex.failed.should == "\xe2\x82"
+    end
+    it "for Iconv.iconv and Iconv.conv returns an array containing a single element when instantiated" do
+      lambda {
+        begin
+          Iconv.iconv("utf-8", "utf-8", "test \xff test")
+        rescue Iconv::Failure => e
+          @ex = e
+          raise e
+        end
+      }.should raise_error(Iconv::Failure)
+      @ex.failed.should == ["\xff test"]
+      lambda {
+        begin
+          Iconv.conv("utf-8", "utf-8", "test \xff test")
+        rescue Iconv::Failure => e
+          @ex = e
+          raise e
+        end
+      }.should raise_error(Iconv::Failure)
+      @ex.failed.should == ["\xff test"]
+    end
+  end
+end

data/spec/failure/inspect_spec.rb ADDED

@@ -0,0 +1,22 @@
+require File.expand_path('../../fixtures/classes.rb', __FILE__)
+ruby_version_is ''...'2.0' do
+  describe "Iconv::Failure#inspect" do
+    it "includes information on the exception class name, #succes and #failed" do
+      lambda {
+        begin
+          Iconv.open "utf-8", "utf-8" do |conv|
+            conv.iconv "testing string \x80 until an error occurred"
+          end
+        rescue Iconv::Failure => e
+          @ex = e
+          raise e
+        end
+      }.should raise_error(Iconv::Failure)
+      inspection = @ex.inspect
+      inspection.should include(@ex.class.to_s)
+      inspection.should include(@ex.success.inspect)
+      inspection.should include(@ex.failed.inspect)
+    end
+  end
+end

data/spec/failure/success_spec.rb ADDED

@@ -0,0 +1,51 @@
+require File.expand_path('../../fixtures/classes.rb', __FILE__)
+ruby_version_is ''...'2.0' do
+  describe "Iconv::Failure#success" do
+    it "for Iconv#iconv and Iconv.conv returns the substring of the original string passed which was translated successfully until the exception ocurred" do
+      lambda {
+        begin
+          Iconv.open "utf-8", "utf-8" do |conv|
+            conv.iconv "test \xff test \xff"
+          end
+        rescue Iconv::Failure => e
+          @ex = e
+          raise e
+        end
+      }.should raise_error(Iconv::Failure)
+      @ex.success.should == "test "
+      lambda {
+        begin
+          Iconv.conv "utf-8", "utf-8", "\xe2\x82"
+        rescue Iconv::Failure => e
+          @ex = e
+          raise e
+        end
+      }.should raise_error(Iconv::Failure)
+      @ex.success.should == ""
+    end
+    it "for Iconv.iconv returns an array containing all the strings that were translated successfully until the exception ocurred, in order" do
+      lambda {
+        begin
+          Iconv.iconv("utf-8", "utf-8", "\xfferror")
+        rescue Iconv::Failure => e
+          @ex = e
+          raise e
+        end
+      }.should raise_error(Iconv::Failure)
+      @ex.success.should == [""]
+      lambda {
+        begin
+          Iconv.iconv("utf-8", "utf-8", "test", "testing", "until\xfferror")
+        rescue Iconv::Failure => e
+          @ex = e
+          raise e
+        end
+      }.should raise_error(Iconv::Failure)
+      @ex.success.should == ["test", "testing", "until"]
+    end
+  end
+end

data/spec/failure_spec.rb ADDED

@@ -0,0 +1,30 @@
+require File.expand_path('../fixtures/classes.rb', __FILE__)
+ruby_version_is ''...'2.0' do
+  describe "Iconv::Failure" do
+    it "is a module" do
+      Iconv::Failure.should be_kind_of(Module)
+      Iconv::Failure.should_not be_kind_of(Class)
+    end
+    it "is included by Iconv::InvalidEncoding" do
+      Iconv::Failure.should be_ancestor_of(Iconv::InvalidEncoding)
+    end
+    it "is included by Iconv::IllegalSequence" do
+      Iconv::Failure.should be_ancestor_of(Iconv::IllegalSequence)
+    end
+    it "is included by Iconv::InvalidCharacter" do
+      Iconv::Failure.should be_ancestor_of(Iconv::InvalidCharacter)
+    end
+    it "is included by Iconv::OutOfRange" do
+      Iconv::Failure.should be_ancestor_of(Iconv::OutOfRange)
+    end
+    it "is included by Iconv::BrokenLibrary" do
+      Iconv::Failure.should be_ancestor_of(Iconv::BrokenLibrary)
+    end
+  end
+end

data/spec/fixtures/classes.rb ADDED

@@ -0,0 +1,11 @@
+begin
+  require 'iconv'
+  module IconvSpecs
+    class IconvSubclass < Iconv
+    end
+  end
+rescue LoadError
+  # do nothing
+end

data/spec/iconv_spec.rb ADDED

@@ -0,0 +1,211 @@
+# -*- encoding: utf-8 -*-
+require File.expand_path('../shared/initialize_exceptions', __FILE__)
+require File.expand_path('../fixtures/classes.rb', __FILE__)
+# These specs assume the Iconv implementation supports at least
+# the following encodings:
+#   us-ascii, utf-8, utf-16, utf-16be, utf-16le, iso-8859-1
+ruby_version_is ''...'2.0' do
+  describe "Iconv#iconv" do
+    it "raises an ArgumentError when called on a closed converter" do
+      conv = Iconv.new("us-ascii", "us-ascii")
+      conv.close
+      lambda { conv.iconv("test") }.should raise_error(ArgumentError)
+    end
+    it "when given a string or string-like parameter returns a converted version of it" do
+      Iconv.open "utf-8", "iso-8859-1" do |conv|
+        conv.iconv("expos\xe9").should == "expos\xc3\xa9"
+        stringlike = mock("string-like")
+        stringlike.should_receive(:to_str).and_return("r\xe9sum\xe9")
+        conv.iconv(stringlike).should == "r\xc3\xa9sum\xc3\xa9"
+      end
+    end
+    it "keeps context between calls" do
+      Iconv.open "utf-16", "us-ascii" do |conv|
+        # BOM for first call of utf-16
+        conv.iconv("a").should equal_utf16("\xfe\xff\0a")
+        # no BOM for consecutive calls
+        conv.iconv("a").should equal_utf16("\0a")
+      end
+    end
+    it "when given a start and end position returns the substring" do
+      Iconv.open "us-ascii", "us-ascii" do |conv|
+        conv.iconv("testing", 1, 4).should == "esti"
+        conv.iconv("testing", 2, 1).should == "s"
+      end
+    end
+    it "when given a negative start position counts from the end of string" do
+      Iconv.open "us-ascii", "us-ascii" do |conv|
+        conv.iconv("testing", -7, 4).should == "test"
+        conv.iconv("testing", -3, 7).should == "ing"
+      end
+    end
+    it "when the end parameter is omitted or nil goes until the end of the string" do
+      Iconv.open "us-ascii", "us-ascii" do |conv|
+        conv.iconv("testing", 0).should == "testing"
+        conv.iconv("testing", 4).should == "ing"
+        conv.iconv("testing", 4, nil).should == "ing"
+        conv.iconv("testing", -3).should == "ing"
+        conv.iconv("testing", -4, nil).should == "ting"
+      end
+    end
+    ruby_bug "[ruby-core:17092]", "1.8.6.258" do
+      it "when given a positive length" do
+        Iconv.open "us-ascii", "us-ascii" do |conv|
+          conv.iconv("testing", 0, 4).should == "test"
+          conv.iconv("testing", 4, 6).should == "ing"
+          conv.iconv("substring", -6, 6).should == "string"
+        end
+      end
+      it "when given a negative length" do
+        Iconv.open "us-ascii", "us-ascii" do |conv|
+          conv.iconv("testing", 0, -1).should == "testing"
+          conv.iconv("testing", 2, -4).should == "sting"
+          conv.iconv("substring", -6, -4).should == "string"
+        end
+      end
+    end
+    it "raises Iconv::IllegalSequence when faced with an invalid byte for the source encoding" do
+      Iconv.open "utf-8", "utf-8" do |conv|
+        lambda { conv.iconv("test\x80") }.should raise_error(Iconv::IllegalSequence)
+      end
+    end
+    platform_is :linux, :darwin, :freebsd do
+      # glibc iconv and GNU libiconv wrongly raise EILSEQ.
+      # Linux, Darwin, and FreeBSD usually use them.
+      # NetBSD's libc iconv, Citrus iconv, correctly follows POSIX,
+      # but on NetBSD users may install GNU libiconv and use it.
+      it "raises Iconv::IllegalSequence when a character cannot be represented on the target encoding" do
+        Iconv.open "us-ascii", "utf-8" do |conv|
+          lambda { conv.iconv("euro \xe2\x82\xac") }.should raise_error(Iconv::IllegalSequence)
+        end
+      end
+    end
+    it "raises Iconv::InvalidCharacter when an incomplete character or shift sequence happens at the end of the input buffer" do
+      Iconv.open "utf-8", "utf-8" do |conv|
+        lambda { conv.iconv("euro \xe2") }.should raise_error(Iconv::InvalidCharacter)
+        lambda { conv.iconv("euro \xe2\x82") }.should raise_error(Iconv::InvalidCharacter)
+      end
+      Iconv.open "utf-16be", "utf-16be" do |conv|
+        lambda { conv.iconv("a") }.should raise_error(Iconv::InvalidCharacter)
+      end
+    end
+    ruby_bug "#17910", "1.8.6.114" do
+      it "sanitizes invalid upper bounds" do
+        Iconv.open "us-ascii", "us-ascii" do |conv|
+          conv.iconv("testing", 0, 99).should == "testing"
+          conv.iconv("testing", 10, 12).should == ""
+        end
+      end
+    end
+    it "returns a blank string on invalid lower bounds" do
+      Iconv.open "us-ascii", "us-ascii" do |conv|
+        conv.iconv("testing", -10, -8).should == ""
+        conv.iconv("testing", -8).should == ""
+        conv.iconv("testing", -9, 5).should == ""
+      end
+    end
+  end
+  describe "Iconv.iconv" do
+    it "converts a series of strings with a single converter" do
+      ary = [encode("\0a\0b\0c", "utf-16be"), encode("\0d\0e", "utf-16be")]
+      Iconv.iconv("utf-16be", "us-ascii", "abc", "de").should == ary
+      # BOM only on first string
+      Iconv.iconv("utf-16", "utf-8", "abc", "de").should equal_utf16(["\xfe\xff\0a\0b\0c", "\0d\0e"])
+    end
+    it "returns an empty array when given no strings to convert" do
+      Iconv.iconv("us-ascii", "utf-8").should == []
+    end
+    it_behaves_like :iconv_initialize_exceptions, :iconv, "test"
+    platform_is :linux, :darwin, :freebsd do
+      # //ignore is glibc iconv and GNU libiconv specific behavior, not POSIX
+      describe "using the ignore option" do
+        # This spec exists because some implementations of libiconv return
+        # an error for this sequence even though they consume all of the
+        # input and write the proper output. We want to be sure that those
+        # platforms ignore the error and give us the data back.
+        #
+        it "causes unknown bytes to be ignored" do
+          str = "f\303\266\303\266 bar" # this is "foo bar" with umlauts on the o's
+          Iconv.iconv('ascii//ignore', 'utf-8', str)[0].should == "f bar"
+        end
+      end
+    end
+  end
+  describe "The 'utf-8' encoder" do
+    it "emits proper representations for characters outside the Basic Multilingual Plane" do
+      Iconv.iconv("utf-8", "utf-16be", "\xd8\x40\xdc\x00").should == ["\xf0\xa0\x80\x80"]
+    end
+  end
+  describe "The 'utf-16' encoder" do
+    ruby_version_is "".."1.8.6p230" do
+      it "emits an empty string when the source input is empty" do
+        Iconv.iconv("utf-16", "us-ascii", "", "").should == ["", ""]
+        Iconv.open "utf-16", "utf-8" do |conv|
+          conv.iconv("").should == ""
+          conv.iconv("test", 1, 1).should == ""
+          conv.iconv("test", 3, -3).should == ""
+          conv.iconv("test", 1, -4).should == ""
+        end
+      end
+    end
+    ruby_version_is "1.8.6p238".."1.9" do
+      it "emits an empty string when the source input is empty" do
+        Iconv.iconv("utf-16", "us-ascii", "", "").should == ["", ""]
+        Iconv.open "utf-16", "utf-8" do |conv|
+          conv.iconv("").should == ""
+          conv.iconv("test", 1, 0).should == ""
+        end
+      end
+    end
+    it "emits a byte-order mark on first non-empty output" do
+      Iconv.iconv("utf-16", "us-ascii", "a").should equal_utf16(["\xfe\xff\0a"])
+      Iconv.iconv("utf-16", "utf-16", "\x80\x80", "\x81\x81").should equal_utf16(["\xfe\xff\x80\x80", "\x81\x81"])
+    end
+  end
+  describe "The 'utf-16be' decoder" do
+    it "does not emit a byte-order mark" do
+      Iconv.iconv("utf-16be", "utf-8", "ab").should == [encode("\0a\0b", "utf-16be")]
+    end
+    it "treats possible byte-order marks as regular characters" do
+      Iconv.iconv("utf-8", "utf-16be", "\xfe\xff\0a").should == ["\xef\xbb\xbfa"]
+      Iconv.iconv("utf-8", "utf-16be", "\xff\xfe\0a").should == ["\xef\xbf\xbea"]
+    end
+  end
+  describe "The 'utf-16le' decoder" do
+    it "does not emit a byte-order mark" do
+      Iconv.iconv("utf-16le", "utf-8", "ab").should == [encode("a\0b\0", "utf-16le")]
+    end
+    it "treats possible byte-order marks as regular characters" do
+      Iconv.iconv("utf-8", "utf-16le", "\xfe\xff\0a").should == ["\xef\xbf\xbe\xe6\x84\x80"]
+      Iconv.iconv("utf-8", "utf-16le", "\xff\xfe\0a").should == ["\xef\xbb\xbf\xe6\x84\x80"]
+    end
+  end
+end