RubyGems - twitter_cldr - Versions diffs - 1.0.1 → 1.1.0 - Mend

twitter_cldr 1.0.1 → 1.1.0

Files changed (303) hide show

data/NOTICE +95 -1
data/README.md +4 -4
data/Rakefile +18 -28
data/lib/ext/calendars/date.rb +3 -0
data/lib/ext/calendars/datetime.rb +3 -0
data/lib/ext/calendars/time.rb +3 -0
data/lib/ext/localized_object.rb +3 -0
data/lib/ext/numbers/bignum.rb +3 -0
data/lib/ext/numbers/fixnum.rb +3 -0
data/lib/ext/numbers/float.rb +3 -0
data/lib/ext/numbers/localized_number.rb +3 -0
data/lib/ext/strings/string.rb +31 -0
data/lib/ext/strings/symbol.rb +3 -0
data/lib/formatters/base.rb +3 -0
data/lib/formatters/calendars/date_formatter.rb +3 -0
data/lib/formatters/calendars/datetime_formatter.rb +3 -0
data/lib/formatters/calendars/time_formatter.rb +3 -0
data/lib/formatters/numbers/currency_formatter.rb +3 -0
data/lib/formatters/numbers/decimal_formatter.rb +3 -0
data/lib/formatters/numbers/helpers/base.rb +3 -0
data/lib/formatters/numbers/helpers/fraction.rb +3 -0
data/lib/formatters/numbers/helpers/integer.rb +3 -0
data/lib/formatters/numbers/number_formatter.rb +3 -0
data/lib/formatters/numbers/percent_formatter.rb +3 -0
data/lib/formatters/plurals/plural_formatter.rb +141 -0
data/lib/formatters/plurals/rules.rb +4 -1
data/lib/normalizers/base.rb +17 -0
data/lib/normalizers/canonical/nfd.rb +81 -0
data/lib/shared/currencies.rb +4 -1
data/lib/shared/languages.rb +4 -1
data/lib/shared/resources.rb +8 -28
data/lib/shared/timezones.rb +3 -0
data/lib/shared/unicode_data.rb +44 -0
data/lib/tokenizers/base.rb +3 -0
data/lib/tokenizers/calendars/date_tokenizer.rb +3 -0
data/lib/tokenizers/calendars/datetime_tokenizer.rb +4 -1
data/lib/tokenizers/calendars/time_tokenizer.rb +3 -0
data/lib/tokenizers/key_path.rb +3 -0
data/lib/tokenizers/numbers/number_tokenizer.rb +4 -1
data/lib/tokenizers/token.rb +3 -0
data/lib/twitter_cldr.rb +52 -29
data/lib/utils/interpolation.rb +105 -0
data/lib/utils.rb +28 -0
data/lib/version.rb +6 -1
data/resources/unicode_data/aegean_numbers.yml +913 -0
data/resources/unicode_data/alchemical_symbols.yml +1857 -0
data/resources/unicode_data/alphabetic_presentation_forms.yml +929 -0
data/resources/unicode_data/ancient_greek_musical_notation.yml +1121 -0
data/resources/unicode_data/ancient_greek_numbers.yml +1201 -0
data/resources/unicode_data/ancient_symbols.yml +193 -0
data/resources/unicode_data/arabic.yml +4049 -0
data/resources/unicode_data/arabic_extended_a.yml +625 -0
data/resources/unicode_data/arabic_mathematical_alphabetic_symbols.yml +2289 -0
data/resources/unicode_data/arabic_presentation_forms_a.yml +9777 -0
data/resources/unicode_data/arabic_presentation_forms_b.yml +2257 -0
data/resources/unicode_data/arabic_supplement.yml +769 -0
data/resources/unicode_data/armenian.yml +1393 -0
data/resources/unicode_data/arrows.yml +1793 -0
data/resources/unicode_data/avestan.yml +977 -0
data/resources/unicode_data/balinese.yml +1937 -0
data/resources/unicode_data/bamum.yml +1409 -0
data/resources/unicode_data/bamum_supplement.yml +9105 -0
data/resources/unicode_data/basic_latin.yml +2049 -0
data/resources/unicode_data/batak.yml +897 -0
data/resources/unicode_data/bengali.yml +1473 -0
data/resources/unicode_data/block_elements.yml +513 -0
data/resources/unicode_data/blocks.yml +881 -0
data/resources/unicode_data/bopomofo.yml +657 -0
data/resources/unicode_data/bopomofo_extended.yml +433 -0
data/resources/unicode_data/box_drawing.yml +2049 -0
data/resources/unicode_data/brahmi.yml +1729 -0
data/resources/unicode_data/braille_patterns.yml +4097 -0
data/resources/unicode_data/buginese.yml +481 -0
data/resources/unicode_data/buhid.yml +321 -0
data/resources/unicode_data/byzantine_musical_symbols.yml +3937 -0
data/resources/unicode_data/carian.yml +785 -0
data/resources/unicode_data/chakma.yml +1073 -0
data/resources/unicode_data/cham.yml +1329 -0
data/resources/unicode_data/cherokee.yml +1361 -0
data/resources/unicode_data/cjk_compatibility.yml +4097 -0
data/resources/unicode_data/cjk_compatibility_forms.yml +513 -0
data/resources/unicode_data/cjk_compatibility_ideographs.yml +7553 -0
data/resources/unicode_data/cjk_compatibility_ideographs_supplement.yml +8673 -0
data/resources/unicode_data/cjk_radicals_supplement.yml +1841 -0
data/resources/unicode_data/cjk_strokes.yml +577 -0
data/resources/unicode_data/cjk_symbols_and_punctuation.yml +1025 -0
data/resources/unicode_data/cjk_unified_ideographs.yml +33 -0
data/resources/unicode_data/cjk_unified_ideographs_extension_a.yml +33 -0
data/resources/unicode_data/cjk_unified_ideographs_extension_b.yml +33 -0
data/resources/unicode_data/cjk_unified_ideographs_extension_c.yml +33 -0
data/resources/unicode_data/cjk_unified_ideographs_extension_d.yml +33 -0
data/resources/unicode_data/combining_diacritical_marks.yml +1793 -0
data/resources/unicode_data/combining_diacritical_marks_for_symbols.yml +529 -0
data/resources/unicode_data/combining_diacritical_marks_supplement.yml +689 -0
data/resources/unicode_data/combining_half_marks.yml +113 -0
data/resources/unicode_data/common_indic_number_forms.yml +161 -0
data/resources/unicode_data/control_pictures.yml +625 -0
data/resources/unicode_data/coptic.yml +1969 -0
data/resources/unicode_data/counting_rod_numerals.yml +289 -0
data/resources/unicode_data/cuneiform.yml +14065 -0
data/resources/unicode_data/cuneiform_numbers_and_punctuation.yml +1649 -0
data/resources/unicode_data/currency_symbols.yml +417 -0
data/resources/unicode_data/cypriot_syllabary.yml +881 -0
data/resources/unicode_data/cyrillic.yml +4097 -0
data/resources/unicode_data/cyrillic_extended_a.yml +513 -0
data/resources/unicode_data/cyrillic_extended_b.yml +1425 -0
data/resources/unicode_data/cyrillic_supplement.yml +641 -0
data/resources/unicode_data/deseret.yml +1281 -0
data/resources/unicode_data/devanagari.yml +2033 -0
data/resources/unicode_data/devanagari_extended.yml +449 -0
data/resources/unicode_data/dingbats.yml +3057 -0
data/resources/unicode_data/domino_tiles.yml +1601 -0
data/resources/unicode_data/egyptian_hieroglyphs.yml +17137 -0
data/resources/unicode_data/emoticons.yml +1217 -0
data/resources/unicode_data/enclosed_alphanumeric_supplement.yml +2737 -0
data/resources/unicode_data/enclosed_alphanumerics.yml +2561 -0
data/resources/unicode_data/enclosed_cjk_letters_and_months.yml +4065 -0
data/resources/unicode_data/enclosed_ideographic_supplement.yml +913 -0
data/resources/unicode_data/ethiopic.yml +5729 -0
data/resources/unicode_data/ethiopic_extended.yml +1265 -0
data/resources/unicode_data/ethiopic_extended_a.yml +513 -0
data/resources/unicode_data/ethiopic_supplement.yml +417 -0
data/resources/unicode_data/general_punctuation.yml +1713 -0
data/resources/unicode_data/geometric_shapes.yml +1537 -0
data/resources/unicode_data/georgian.yml +1409 -0
data/resources/unicode_data/georgian_supplement.yml +641 -0
data/resources/unicode_data/glagolitic.yml +1505 -0
data/resources/unicode_data/gothic.yml +433 -0
data/resources/unicode_data/greek_and_coptic.yml +2145 -0
data/resources/unicode_data/greek_extended.yml +3729 -0
data/resources/unicode_data/gujarati.yml +1345 -0
data/resources/unicode_data/gurmukhi.yml +1265 -0
data/resources/unicode_data/halfwidth_and_fullwidth_forms.yml +3601 -0
data/resources/unicode_data/hangul_compatibility_jamo.yml +1505 -0
data/resources/unicode_data/hangul_jamo.yml +4097 -0
data/resources/unicode_data/hangul_jamo_extended_a.yml +465 -0
data/resources/unicode_data/hangul_jamo_extended_b.yml +1153 -0
data/resources/unicode_data/hangul_syllables.yml +33 -0
data/resources/unicode_data/hanunoo.yml +369 -0
data/resources/unicode_data/hebrew.yml +1393 -0
data/resources/unicode_data/high_private_use_surrogates.yml +33 -0
data/resources/unicode_data/high_surrogates.yml +33 -0
data/resources/unicode_data/hiragana.yml +1489 -0
data/resources/unicode_data/ideographic_description_characters.yml +193 -0
data/resources/unicode_data/imperial_aramaic.yml +497 -0
data/resources/unicode_data/inscriptional_pahlavi.yml +433 -0
data/resources/unicode_data/inscriptional_parthian.yml +481 -0
data/resources/unicode_data/ipa_extensions.yml +1537 -0
data/resources/unicode_data/javanese.yml +1457 -0
data/resources/unicode_data/kaithi.yml +1057 -0
data/resources/unicode_data/kana_supplement.yml +33 -0
data/resources/unicode_data/kanbun.yml +257 -0
data/resources/unicode_data/kangxi_radicals.yml +3425 -0
data/resources/unicode_data/kannada.yml +1377 -0
data/resources/unicode_data/katakana.yml +1537 -0
data/resources/unicode_data/katakana_phonetic_extensions.yml +257 -0
data/resources/unicode_data/kayah_li.yml +769 -0
data/resources/unicode_data/kharoshthi.yml +1041 -0
data/resources/unicode_data/khmer.yml +1825 -0
data/resources/unicode_data/khmer_symbols.yml +513 -0
data/resources/unicode_data/lao.yml +1073 -0
data/resources/unicode_data/latin_1_supplement.yml +2049 -0
data/resources/unicode_data/latin_extended_a.yml +2049 -0
data/resources/unicode_data/latin_extended_additional.yml +4097 -0
data/resources/unicode_data/latin_extended_b.yml +3329 -0
data/resources/unicode_data/latin_extended_c.yml +513 -0
data/resources/unicode_data/latin_extended_d.yml +2145 -0
data/resources/unicode_data/lepcha.yml +1185 -0
data/resources/unicode_data/letterlike_symbols.yml +1281 -0
data/resources/unicode_data/limbu.yml +1057 -0
data/resources/unicode_data/linear_b_ideograms.yml +1969 -0
data/resources/unicode_data/linear_b_syllabary.yml +1409 -0
data/resources/unicode_data/lisu.yml +769 -0
data/resources/unicode_data/low_surrogates.yml +33 -0
data/resources/unicode_data/lycian.yml +465 -0
data/resources/unicode_data/lydian.yml +433 -0
data/resources/unicode_data/mahjong_tiles.yml +705 -0
data/resources/unicode_data/malayalam.yml +1569 -0
data/resources/unicode_data/mandaic.yml +465 -0
data/resources/unicode_data/mathematical_alphanumeric_symbols.yml +15937 -0
data/resources/unicode_data/mathematical_operators.yml +4097 -0
data/resources/unicode_data/meetei_mayek.yml +897 -0
data/resources/unicode_data/meetei_mayek_extensions.yml +369 -0
data/resources/unicode_data/meroitic_cursive.yml +417 -0
data/resources/unicode_data/meroitic_hieroglyphs.yml +513 -0
data/resources/unicode_data/miao.yml +2129 -0
data/resources/unicode_data/miscellaneous_mathematical_symbols_a.yml +769 -0
data/resources/unicode_data/miscellaneous_mathematical_symbols_b.yml +2049 -0
data/resources/unicode_data/miscellaneous_symbols.yml +4097 -0
data/resources/unicode_data/miscellaneous_symbols_and_arrows.yml +1393 -0
data/resources/unicode_data/miscellaneous_symbols_and_pictographs.yml +8529 -0
data/resources/unicode_data/miscellaneous_technical.yml +3905 -0
data/resources/unicode_data/modifier_tone_letters.yml +513 -0
data/resources/unicode_data/mongolian.yml +2497 -0
data/resources/unicode_data/musical_symbols.yml +3521 -0
data/resources/unicode_data/myanmar.yml +2561 -0
data/resources/unicode_data/myanmar_extended_a.yml +449 -0
data/resources/unicode_data/new_tai_lue.yml +1329 -0
data/resources/unicode_data/nko.yml +945 -0
data/resources/unicode_data/number_forms.yml +929 -0
data/resources/unicode_data/ogham.yml +465 -0
data/resources/unicode_data/ol_chiki.yml +769 -0
data/resources/unicode_data/old_italic.yml +561 -0
data/resources/unicode_data/old_persian.yml +801 -0
data/resources/unicode_data/old_south_arabian.yml +513 -0
data/resources/unicode_data/old_turkic.yml +1169 -0
data/resources/unicode_data/optical_character_recognition.yml +177 -0
data/resources/unicode_data/oriya.yml +1441 -0
data/resources/unicode_data/osmanya.yml +641 -0
data/resources/unicode_data/phags_pa.yml +897 -0
data/resources/unicode_data/phaistos_disc.yml +737 -0
data/resources/unicode_data/phoenician.yml +465 -0
data/resources/unicode_data/phonetic_extensions.yml +2049 -0
data/resources/unicode_data/phonetic_extensions_supplement.yml +1025 -0
data/resources/unicode_data/playing_cards.yml +945 -0
data/resources/unicode_data/private_use_area.yml +33 -0
data/resources/unicode_data/rejang.yml +593 -0
data/resources/unicode_data/rumi_numeral_symbols.yml +497 -0
data/resources/unicode_data/runic.yml +1297 -0
data/resources/unicode_data/samaritan.yml +977 -0
data/resources/unicode_data/saurashtra.yml +1297 -0
data/resources/unicode_data/sharada.yml +1329 -0
data/resources/unicode_data/shavian.yml +769 -0
data/resources/unicode_data/sinhala.yml +1281 -0
data/resources/unicode_data/small_form_variants.yml +417 -0
data/resources/unicode_data/sora_sompeng.yml +561 -0
data/resources/unicode_data/spacing_modifier_letters.yml +1281 -0
data/resources/unicode_data/specials.yml +81 -0
data/resources/unicode_data/sundanese.yml +1025 -0
data/resources/unicode_data/sundanese_supplement.yml +129 -0
data/resources/unicode_data/superscripts_and_subscripts.yml +673 -0
data/resources/unicode_data/supplemental_arrows_a.yml +257 -0
data/resources/unicode_data/supplemental_arrows_b.yml +2049 -0
data/resources/unicode_data/supplemental_mathematical_operators.yml +4097 -0
data/resources/unicode_data/supplemental_punctuation.yml +961 -0
data/resources/unicode_data/supplementary_private_use_area_a.yml +33 -0
data/resources/unicode_data/supplementary_private_use_area_b.yml +33 -0
data/resources/unicode_data/syloti_nagri.yml +705 -0
data/resources/unicode_data/syriac.yml +1233 -0
data/resources/unicode_data/tagalog.yml +321 -0
data/resources/unicode_data/tagbanwa.yml +289 -0
data/resources/unicode_data/tags.yml +1553 -0
data/resources/unicode_data/tai_le.yml +561 -0
data/resources/unicode_data/tai_tham.yml +2033 -0
data/resources/unicode_data/tai_viet.yml +1153 -0
data/resources/unicode_data/tai_xuan_jing_symbols.yml +1393 -0
data/resources/unicode_data/takri.yml +1057 -0
data/resources/unicode_data/tamil.yml +1153 -0
data/resources/unicode_data/telugu.yml +1489 -0
data/resources/unicode_data/thaana.yml +801 -0
data/resources/unicode_data/thai.yml +1393 -0
data/resources/unicode_data/tibetan.yml +3377 -0
data/resources/unicode_data/tifinagh.yml +945 -0
data/resources/unicode_data/transport_and_map_symbols.yml +1121 -0
data/resources/unicode_data/ugaritic.yml +497 -0
data/resources/unicode_data/unified_canadian_aboriginal_syllabics.yml +10241 -0
data/resources/unicode_data/unified_canadian_aboriginal_syllabics_extended.yml +1121 -0
data/resources/unicode_data/vai.yml +4801 -0
data/resources/unicode_data/variation_selectors.yml +257 -0
data/resources/unicode_data/variation_selectors_supplement.yml +3841 -0
data/resources/unicode_data/vedic_extensions.yml +625 -0
data/resources/unicode_data/vertical_forms.yml +161 -0
data/resources/unicode_data/yi_radicals.yml +881 -0
data/resources/unicode_data/yi_syllables.yml +18641 -0
data/resources/unicode_data/yijing_hexagram_symbols.yml +1025 -0
data/spec/ext/calendars/date_spec.rb +5 -1
data/spec/ext/calendars/datetime_spec.rb +5 -1
data/spec/ext/calendars/time_spec.rb +5 -1
data/spec/ext/numbers/bignum_spec.rb +5 -1
data/spec/ext/numbers/fixnum_spec.rb +5 -1
data/spec/ext/numbers/float_spec.rb +5 -1
data/spec/ext/numbers/localized_number_spec.rb +5 -1
data/spec/ext/strings/string_spec.rb +102 -0
data/spec/ext/strings/symbol_spec.rb +5 -1
data/spec/formatters/base_spec.rb +5 -1
data/spec/formatters/calendars/datetime_formatter_spec.rb +5 -1
data/spec/formatters/numbers/currency_formatter_spec.rb +5 -1
data/spec/formatters/numbers/decimal_formatter_spec.rb +5 -1
data/spec/formatters/numbers/helpers/fraction_spec.rb +5 -1
data/spec/formatters/numbers/helpers/integer_spec.rb +5 -1
data/spec/formatters/numbers/number_formatter_spec.rb +6 -2
data/spec/formatters/numbers/percent_formatter_spec.rb +5 -1
data/spec/formatters/plurals/plural_formatter_spec.rb +205 -0
data/spec/formatters/plurals/rules_spec.rb +28 -28
data/spec/normalizers/NormalizationTest.txt +602 -0
data/spec/normalizers/base_spec.rb +16 -0
data/spec/normalizers/canonical/nfd_spec.rb +50 -0
data/spec/shared/currencies_spec.rb +5 -1
data/spec/shared/languages_spec.rb +5 -1
data/spec/shared/resources_spec.rb +5 -18
data/spec/shared/unicode_data_spec.rb +51 -0
data/spec/spec_helper.rb +6 -3
data/spec/tokenizers/base_spec.rb +3 -0
data/spec/tokenizers/calendars/date_tokenizer_spec.rb +5 -1
data/spec/tokenizers/calendars/datetime_tokenizer_spec.rb +5 -1
data/spec/tokenizers/calendars/time_tokenizer_spec.rb +5 -1
data/spec/tokenizers/key_path_spec.rb +3 -0
data/spec/tokenizers/numbers/number_tokenizer_spec.rb +5 -1
data/spec/tokenizers/token_spec.rb +5 -1
data/spec/twitter_cldr_spec.rb +23 -1
data/spec/utils/interpolation_spec.rb +124 -0
data/spec/utils_spec.rb +32 -0
metadata +285 -21

data/spec/normalizers/base_spec.rb ADDED Viewed

@@ -0,0 +1,16 @@
+# encoding: UTF-8
+require 'spec_helper'
+describe Base do
+  describe "#code_point_to_char" do
+    it "converts unicode code points to the actual character" do
+      TwitterCldr::Normalizers::Base.code_point_to_char("221E").should == "∞"
+    end
+  end
+  describe "#char_to_code_point" do
+    it "converts a character to a unicode code point" do
+      TwitterCldr::Normalizers::Base.char_to_code_point("∞").should == "221E"
+    end
+  end
+end

data/spec/normalizers/canonical/nfd_spec.rb ADDED Viewed

@@ -0,0 +1,50 @@
+# encoding: UTF-8
+require 'spec_helper'
+include TwitterCldr::Normalizers
+describe NFD do
+  describe "#normalize" do
+    NFD.normalize("庠摪饢鼢豦樄澸脧鱵礩翜艰").should == "庠摪饢鼢豦樄澸脧鱵礩翜艰"
+    NFD.normalize("䷙䷿").should == "䷙䷿"
+    NFD.normalize("ᎿᎲᎪᏨᎨᏪᎧᎵᏥ").should == "ᎿᎲᎪᏨᎨᏪᎧᎵᏥ"
+    NFD.normalize("ᆙᅓᆼᄋᇶ").should == "ᆙᅓᆼᄋᇶ"
+    NFD.normalize("…‾⁋ ⁒⁯‒′‾⁖").should == "…‾⁋ ⁒⁯‒′‾⁖"
+    NFD.normalize("ⶾⷕⶱⷀ").should == "ⶾⷕⶱⷀ"
+  end
+  describe "#decompose" do
+    it "does not decompose a character with no decomposition mapping" do
+      code_points = ["0EB8", "041F", "0066", "1F52C", "A2D6"]
+      code_points.each do |code_point|
+        NFD.decompose(code_point).should == code_point
+      end
+    end
+    it "does not decompose a character with compatibility decomposition mapping" do
+      code_points = ["A770", "FB02", "FC35", "FD20", "00BC"]
+      code_points.each do |code_point|
+        NFD.decompose(code_point).should == code_point
+      end
+    end
+  end
+  describe "#normalize_code_points" do
+    it "passes all the tests in NormalizersTest.txt" do
+      normalization_test_file = File.join(File.dirname(File.dirname(__FILE__)), "NormalizationTest.txt")
+      File.open(normalization_test_file, "r:UTF-8") do |file|
+        while line = file.gets
+          unless line[0,1] =~ /(@|#)/ || line.empty?
+            c1, c2, c3, c4, c5 = line.split(';')[0...5].map { |cps| cps.split }
+            NFD.normalize_code_points(c1).should == c3
+            NFD.normalize_code_points(c2).should == c3
+            NFD.normalize_code_points(c3).should == c3
+            NFD.normalize_code_points(c4).should == c5
+            NFD.normalize_code_points(c5).should == c5
+          end
+        end
+      end
+    end
+  end
+end

data/spec/shared/currencies_spec.rb CHANGED Viewed

@@ -1,6 +1,10 @@
 # encoding: UTF-8
-require File.join(File.dirname(__FILE__), %w[.. spec_helper])
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
 include TwitterCldr::Shared
 TEST_COUNTRIES = ["Australia", "Thailand", "Russia", "China", "Japan", "Peru", "South Africa", "India", "South Korea", "United Kingdom"]

data/spec/shared/languages_spec.rb CHANGED Viewed

@@ -1,6 +1,10 @@
 # encoding: UTF-8
-require File.join(File.dirname(__FILE__), %w[.. spec_helper])
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
 include TwitterCldr::Shared
 describe Languages do

data/spec/shared/resources_spec.rb CHANGED Viewed

@@ -1,6 +1,10 @@
 # encoding: UTF-8
-require File.join(File.dirname(__FILE__), %w[.. spec_helper])
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
 include TwitterCldr::Shared
 describe Resources do
@@ -26,21 +30,4 @@ describe Resources do
       @resource.resource_for("de", "racehorse").should == { :key => "value" }
     end
   end
-  describe "#deep_symbolize_keys" do
-    it "should work with a regular hash" do
-      result = @resource.send(:deep_symbolize_keys, { "twitter" => "rocks", "my" => "socks" })
-      result.should == { :twitter => "rocks", :my => "socks"}
-    end
-    it "should work with nested hashes" do
-      result = @resource.send(:deep_symbolize_keys, { "twitter" => { "rocks" => "my socks" } })
-      result.should == { :twitter => { :rocks => "my socks" } }
-    end
-    it "should work with nested hashes and arrays" do
-      result = @resource.send(:deep_symbolize_keys, { "twitter" => { "rocks_my" => [{ "socks" => "and mind" }, { "hard" => "core" }] } })
-      result.should == { :twitter => { :rocks_my => [{ :socks => "and mind" }, { :hard => "core" }] } }
-    end
-  end
 end

data/spec/shared/unicode_data_spec.rb ADDED Viewed

@@ -0,0 +1,51 @@
+# encoding: UTF-8
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
+include TwitterCldr::Shared
+describe UnicodeData do
+  describe "#for_code_point" do
+    it "should retrieve information for any valid code point" do
+      data = UnicodeData.for_code_point('0301')
+      data.should be_a(Struct)
+      data.length.should == 15
+    end
+    it "should return nil for invalid code points" do
+      UnicodeData.for_code_point('abcd').should be_nil
+      UnicodeData.for_code_point('FFFFFFF').should be_nil
+      UnicodeData.for_code_point('uytukhil123').should be_nil
+    end
+    it "fetches valid information for the specified code point" do
+      test_data = {
+        '17D1' => ['17D1','KHMER SIGN VIRIAM','Mn','0','NSM',"","","","",'N',"","","","",""],
+        'FE91' => ['FE91','ARABIC LETTER BEH INITIAL FORM','Lo','0','AL','<initial> 0628',"","","",'N','GLYPH FOR INITIAL ARABIC BAA',"","","",""],
+        '24B5' => ['24B5','PARENTHESIZED LATIN SMALL LETTER Z','So','0','L','<compat> 0028 007A 0029',"","","",'N',"","","","",""],
+        '2128' => ['2128','BLACK-LETTER CAPITAL Z','Lu','0','L','<font> 005A',"","","",'N','BLACK-LETTER Z',"","","",""],
+        '1F241'=> ['1F241','TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-4E09','So','0','L','<compat> 3014 4E09 3015',"","","",'N',"","","","",""]
+      }
+      test_data.each_pair do |code_point, data|
+        UnicodeData.for_code_point(code_point).values.should == data
+      end
+    end
+    it "fetches valid information for a code point within a range" do
+      test_data = {
+        '4E11' => ["4E11","<CJK Ideograph>","Lo","0","L","","","","","N","","","","",""],
+        'AC55' => ["AC55","<Hangul Syllable>","Lo","0","L","","","","","N","","","","",""],
+        'D7A1' => ["D7A1","<Hangul Syllable>","Lo","0","L","","","","","N","","","","",""],
+        'DAAA' => ["DAAA","<Non Private Use High Surrogate>","Cs","0","L","","","","","N","","","","",""],
+        'F8FE' => ["F8FE","<Private Use>","Co","0","L","","","","","N","","","","",""]
+      }
+      test_data.each_pair do |code_point, data|
+        UnicodeData.for_code_point(code_point).values.should == data
+      end
+    end
+  end
+end

data/spec/spec_helper.rb CHANGED Viewed

@@ -1,7 +1,10 @@
 # encoding: UTF-8
-require File.expand_path(File.join(File.dirname(__FILE__), %w[.. lib twitter_cldr]))
-FIXTURE_DIR = File.expand_path(File.join(File.dirname(__FILE__), %w[fixtures]))
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'rspec'
+require 'twitter_cldr'
 class FastGettext
   class << self
@@ -15,7 +18,7 @@ class FastGettext
   end
 end
-Spec::Runner.configure do |config|
+RSpec.configure do |config|
   config.mock_with :rr
   config.before(:each) do

data/spec/tokenizers/base_spec.rb CHANGED Viewed

@@ -1,5 +1,8 @@
 # encoding: UTF-8
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
 require File.join(File.dirname(File.dirname(__FILE__)), "spec_helper")
 include TwitterCldr::Tokenizers

data/spec/tokenizers/calendars/date_tokenizer_spec.rb CHANGED Viewed

@@ -1,6 +1,10 @@
 # encoding: UTF-8
-require File.join(File.dirname(File.dirname(File.dirname(__FILE__))), "spec_helper")
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
 include TwitterCldr::Tokenizers
 describe DateTokenizer do

data/spec/tokenizers/calendars/datetime_tokenizer_spec.rb CHANGED Viewed

@@ -1,6 +1,10 @@
 # encoding: UTF-8
-require File.join(File.dirname(File.dirname(File.dirname(__FILE__))), "spec_helper")
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
 include TwitterCldr::Tokenizers
 describe DateTimeTokenizer do

data/spec/tokenizers/calendars/time_tokenizer_spec.rb CHANGED Viewed

@@ -1,6 +1,10 @@
 # encoding: UTF-8
-require File.join(File.dirname(File.dirname(File.dirname(__FILE__))), "spec_helper")
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
 include TwitterCldr::Tokenizers
 describe DateTokenizer do

data/spec/tokenizers/key_path_spec.rb CHANGED Viewed

@@ -1,5 +1,8 @@
 # encoding: UTF-8
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
 require File.join(File.dirname(File.dirname(__FILE__)), "spec_helper")
 include TwitterCldr::Tokenizers

data/spec/tokenizers/numbers/number_tokenizer_spec.rb CHANGED Viewed

@@ -1,6 +1,10 @@
 # encoding: UTF-8
-require File.join(File.dirname(File.dirname(File.dirname(__FILE__))), "spec_helper")
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
 include TwitterCldr::Tokenizers
 describe NumberTokenizer do

data/spec/tokenizers/token_spec.rb CHANGED Viewed

@@ -1,6 +1,10 @@
 # encoding: UTF-8
-require File.join(File.dirname(File.dirname(__FILE__)), "spec_helper")
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
 include TwitterCldr::Tokenizers
 describe Token do

data/spec/twitter_cldr_spec.rb CHANGED Viewed

@@ -1,6 +1,9 @@
 # encoding: UTF-8
-require File.join(File.dirname(__FILE__), "spec_helper")
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
 describe TwitterCldr do
   describe "#supported_locale?" do
@@ -52,4 +55,23 @@ describe TwitterCldr do
       end
     end
   end
+  describe '#resources' do
+    it 'returns @@resources' do
+      resources = TwitterCldr::Shared::Resources.new
+      TwitterCldr.send :class_variable_set, :@@resources, resources
+      TwitterCldr.resources.should == resources
+    end
+  end
+  describe '#get_resource' do
+    it 'delegates to @@resources' do
+      resources = TwitterCldr::Shared::Resources.new
+      mock(resources).resource_for('locale', 'resource') { 'result' }
+      TwitterCldr.send :class_variable_set, :@@resources, resources
+      TwitterCldr.get_resource('locale', 'resource').should == 'result'
+    end
+  end
 end

data/spec/utils/interpolation_spec.rb ADDED Viewed

@@ -0,0 +1,124 @@
+# encoding: UTF-8
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+# Some test cases were taken from i18n (https://github.com/svenfuchs/i18n/blob/89ea337f48562370988421e50caa7c2fe89452c7/test/core_ext/string/interpolate_test.rb)
+# and gettext (https://github.com/mutoh/gettext/blob/11b8c1525ba9f00afb1942f7ebf34bec12f7558b/test/test_string.rb) gems.
+#
+# See NOTICE file for corresponding license agreements.
+require 'spec_helper'
+describe TwitterCldr::Utils do
+  describe '#interpolate' do
+    context 'when argument is a Hash' do
+      it 'does nothing if no placeholder give' do
+        TwitterCldr::Utils.interpolate('foo', :foo => 'bar').should == 'foo'
+      end
+      it 'interpolates named placeholders' do
+        TwitterCldr::Utils.interpolate('%{digit} %{sign} %{digit}', :digit => 2, :sign => '+').should == '2 + 2'
+      end
+      it 'interpolates named placeholders with formatting' do
+        TwitterCldr::Utils.interpolate(
+            '%<as_integer>d %<as_float>.2f', :as_integer => 3.14, :as_float => 15
+        ).should == '3 15.00'
+      end
+      it 'interpolates mixed placeholders' do
+        TwitterCldr::Utils.interpolate(
+            '%{regular} is approx. %<pi>.4f', :regular => 'pi', :pi => 3.141592
+        ).should == 'pi is approx. 3.1416'
+      end
+      it 'does not recurse' do
+        TwitterCldr::Utils.interpolate(
+            '%{top_level}', :top_level => '%<second_level>', :second_level => 'unexpected'
+        ).should == '%<second_level>'
+      end
+      it 'treats % before placeholder as escape character' do
+        TwitterCldr::Utils.interpolate(
+            '%%{foo} = %{foo}, %%<bar>d = %<bar>d', :foo => 1, :bar => 2.3
+        ).should == '%{foo} = 1, %<bar>d = 2'
+      end
+      it 'interpolates formatted placeholders as Ruby 1.9' do
+        TwitterCldr::Utils.interpolate('%<msg>s',    :msg => 'foo').should == 'foo'
+        TwitterCldr::Utils.interpolate('%<num>d',    :num => 1    ).should == '1'
+        TwitterCldr::Utils.interpolate('%<num>f',    :num => 1.0  ).should == '1.000000'
+        TwitterCldr::Utils.interpolate('%<num>3.0f', :num => 1.0  ).should == '  1'
+        TwitterCldr::Utils.interpolate('%<num>2.2f', :num => 100.0).should == '100.00'
+        TwitterCldr::Utils.interpolate('%<num>#b',   :num => 1    ).should == '0b1'
+        TwitterCldr::Utils.interpolate('%<num>#x',   :num => 100.0).should == '0x64'
+      end
+      it 'ignores extra values' do
+        TwitterCldr::Utils.interpolate('%{msg}', :msg => 'hello', :extra => 'extra').should == 'hello'
+      end
+      it 'raises ArgumentError if formatted placeholder is malformed' do
+        lambda { TwitterCldr::Utils.interpolate('%<num>,d', :num => 100) }.should raise_error(ArgumentError)
+        lambda { TwitterCldr::Utils.interpolate('%<num>/d', :num => 100) }.should raise_error(ArgumentError)
+      end
+      it 'raises KeyError when the value is missing' do
+        lambda { TwitterCldr::Utils.interpolate('%{msg}', {}) }.should raise_error(KeyError)
+      end
+    end
+    context 'when argument is an Array' do
+      it 'does nothing if no placeholder give' do
+        TwitterCldr::Utils.interpolate('foo', [111]).should == 'foo'
+      end
+      it 'interpolates all placeholders' do
+        TwitterCldr::Utils.interpolate('%d %s', [12, 'monkeys']).should == '12 monkeys'
+      end
+      it 'interpolates all placeholders with formatting' do
+        TwitterCldr::Utils.interpolate('%d %.3f %#b', [3.1415, 92, 6]).should == '3 92.000 0b110'
+      end
+      it 'formats positional arguments' do
+        TwitterCldr::Utils.interpolate('%1$*2$s %2$d %1$s', ['hello', 8]).should == '   hello 8 hello'
+      end
+      it 'treats % as escape character' do
+        TwitterCldr::Utils.interpolate('%s: %+.2f±%.2f%%', ['total', 3.14159, 2.6535]).should == 'total: +3.14±2.65%'
+      end
+      it 'ignores extra values' do
+        TwitterCldr::Utils.interpolate('%d', [2, 1]).should == '2'
+      end
+      it 'raises ArgumentError when given not enough values' do
+        lambda { TwitterCldr::Utils.interpolate('%d %d', [1]) }.should raise_error(ArgumentError)
+      end
+      it 'raises ArgumentError if the string contains named placeholders' do
+        lambda { TwitterCldr::Utils.interpolate('%{name} %d', [1, 2]) }.should raise_error(ArgumentError)
+      end
+    end
+    context 'when argument is a single value' do
+      it 'formats a string' do
+        TwitterCldr::Utils.interpolate('a string: %s', 'string').should == 'a string: string'
+      end
+      it 'formats a number' do
+        TwitterCldr::Utils.interpolate('a number: %4.1f', 3.1415).should == 'a number:  3.1'
+      end
+      it 'raises ArgumentError if the string contains named placeholders' do
+        lambda { TwitterCldr::Utils.interpolate('%{name}', 'must be hash') }.should raise_error(ArgumentError)
+      end
+    end
+  end
+end

data/spec/utils_spec.rb ADDED Viewed

@@ -0,0 +1,32 @@
+# encoding: UTF-8
+# Copyright 2012 Twitter, Inc
+# http://www.apache.org/licenses/LICENSE-2.0
+require 'spec_helper'
+describe TwitterCldr::Utils do
+  describe '#deep_symbolize_keys' do
+    let(:hash) { { 'foo' => { 'bar' => { 'baz' => 'woot' }, :ar => [1, 2] }, 42 => { 'baz' => 'wat' } } }
+    let(:symbolized_hash) { { :foo => { :bar => { :baz => 'woot' }, :ar => [1, 2] }, 42 => { :baz => 'wat' } } }
+    it 'symbolizes string keys of a hash' do
+      TwitterCldr::Utils.deep_symbolize_keys(hash).should == symbolized_hash
+    end
+    it 'deeply symbolizes elements of an array' do
+      TwitterCldr::Utils.deep_symbolize_keys([1, hash, 'foo', :bar]).should == [1, symbolized_hash, 'foo', :bar]
+    end
+    it 'deeply symbolizes elements of an array nested in a hash' do
+      TwitterCldr::Utils.deep_symbolize_keys({ 'foo' => [1, hash] }).should == { :foo => [1, symbolized_hash] }
+    end
+    it 'leaves arguments of other types alone' do
+      ['foo', :bar, 42].each { |arg| TwitterCldr::Utils.deep_symbolize_keys(arg).should == arg }
+    end
+  end
+end