twitter_cldr 3.2.1 → 3.3.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/Gemfile +9 -4
- data/History.txt +11 -0
- data/README.md +40 -3
- data/Rakefile +26 -21
- data/lib/twitter_cldr/collation/collator.rb +3 -3
- data/lib/twitter_cldr/collation/sort_key_builder.rb +10 -10
- data/lib/twitter_cldr/data_readers/calendar_data_reader.rb +8 -8
- data/lib/twitter_cldr/data_readers/date_time_data_reader.rb +2 -2
- data/lib/twitter_cldr/data_readers/number_data_reader.rb +10 -10
- data/lib/twitter_cldr/data_readers/timespan_data_reader.rb +27 -27
- data/lib/twitter_cldr/formatters/list_formatter.rb +1 -1
- data/lib/twitter_cldr/formatters/numbers/currency_formatter.rb +3 -3
- data/lib/twitter_cldr/formatters/numbers/helpers/integer.rb +7 -5
- data/lib/twitter_cldr/formatters/numbers/rbnf/formatters.rb +1 -1
- data/lib/twitter_cldr/formatters/numbers/rbnf/rule.rb +1 -1
- data/lib/twitter_cldr/formatters/numbers/rbnf/rule_set.rb +3 -2
- data/lib/twitter_cldr/formatters/numbers/rbnf.rb +2 -2
- data/lib/twitter_cldr/formatters/plurals/rules.rb +1 -1
- data/lib/twitter_cldr/localized/localized_date.rb +2 -2
- data/lib/twitter_cldr/localized/localized_datetime.rb +8 -8
- data/lib/twitter_cldr/localized/localized_number.rb +7 -7
- data/lib/twitter_cldr/localized/localized_string.rb +33 -1
- data/lib/twitter_cldr/localized/localized_symbol.rb +9 -1
- data/lib/twitter_cldr/localized/localized_time.rb +2 -2
- data/lib/twitter_cldr/localized/localized_timespan.rb +10 -10
- data/lib/twitter_cldr/parsers/number_parser.rb +1 -1
- data/lib/twitter_cldr/parsers/parser.rb +5 -1
- data/lib/twitter_cldr/parsers/unicode_regex/character_class.rb +41 -2
- data/lib/twitter_cldr/parsers/unicode_regex/character_range.rb +8 -0
- data/lib/twitter_cldr/parsers/unicode_regex/character_set.rb +66 -23
- data/lib/twitter_cldr/parsers/unicode_regex/literal.rb +4 -0
- data/lib/twitter_cldr/parsers/unicode_regex/unicode_string.rb +6 -3
- data/lib/twitter_cldr/parsers/unicode_regex_parser.rb +65 -32
- data/lib/twitter_cldr/parsers.rb +1 -2
- data/lib/twitter_cldr/resources/custom_locales_resources_importer.rb +4 -4
- data/lib/twitter_cldr/resources/download.rb +13 -6
- data/lib/twitter_cldr/resources/language_codes_importer.rb +7 -7
- data/lib/twitter_cldr/resources/loader.rb +4 -1
- data/lib/twitter_cldr/resources/locales_resources_importer.rb +30 -12
- data/lib/twitter_cldr/resources/postal_codes_importer.rb +32 -22
- data/lib/twitter_cldr/resources/properties/age_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/arabic_shaping_property_importer.rb +42 -0
- data/lib/twitter_cldr/resources/properties/bidi_brackets_property_importer.rb +41 -0
- data/lib/twitter_cldr/resources/properties/blocks_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/derived_core_properties_importer.rb +36 -0
- data/lib/twitter_cldr/resources/properties/east_asian_width_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/grapheme_break_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/hangul_syllable_type_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/indic_positional_category_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/indic_syllabic_category_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/jamo_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/line_break_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/prop_list_importer.rb +36 -0
- data/lib/twitter_cldr/resources/properties/properties_importer.rb +59 -0
- data/lib/twitter_cldr/resources/properties/property_importer.rb +83 -0
- data/lib/twitter_cldr/resources/properties/script_extensions_property_importer.rb +40 -0
- data/lib/twitter_cldr/resources/properties/script_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/sentence_break_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties/unicode_data_properties_importer.rb +60 -0
- data/lib/twitter_cldr/resources/properties/word_break_property_importer.rb +27 -0
- data/lib/twitter_cldr/resources/properties.rb +36 -0
- data/lib/twitter_cldr/resources/readme_renderer.rb +2 -2
- data/lib/twitter_cldr/resources/segment_tests_importer.rb +66 -0
- data/lib/twitter_cldr/resources/tailoring_importer.rb +7 -7
- data/lib/twitter_cldr/resources/uli/segment_exceptions_importer.rb +1 -1
- data/lib/twitter_cldr/resources/unicode_data_importer.rb +19 -60
- data/lib/twitter_cldr/resources/unicode_property_aliases_importer.rb +97 -0
- data/lib/twitter_cldr/resources.rb +21 -22
- data/lib/twitter_cldr/segmentation/break_iterator.rb +54 -0
- data/lib/twitter_cldr/segmentation/cursor.rb +34 -0
- data/lib/twitter_cldr/segmentation/parser.rb +71 -0
- data/lib/twitter_cldr/segmentation/rule.rb +79 -0
- data/lib/twitter_cldr/segmentation/rule_set.rb +116 -0
- data/lib/twitter_cldr/segmentation/rule_set_builder.rb +142 -0
- data/lib/twitter_cldr/segmentation.rb +17 -0
- data/lib/twitter_cldr/shared/bidi.rb +4 -4
- data/lib/twitter_cldr/shared/calendar.rb +11 -11
- data/lib/twitter_cldr/shared/caser.rb +84 -0
- data/lib/twitter_cldr/shared/code_point.rb +101 -139
- data/lib/twitter_cldr/shared/currencies.rb +5 -5
- data/lib/twitter_cldr/shared/language_codes.rb +2 -2
- data/lib/twitter_cldr/shared/languages.rb +1 -1
- data/lib/twitter_cldr/shared/likely_subtags.rb +104 -0
- data/lib/twitter_cldr/shared/locale.rb +252 -0
- data/lib/twitter_cldr/shared/postal_codes.rb +21 -9
- data/lib/twitter_cldr/shared/properties/arabic_shaping.rb +40 -0
- data/lib/twitter_cldr/shared/properties/bidi_brackets.rb +28 -0
- data/lib/twitter_cldr/shared/properties.rb +13 -0
- data/lib/twitter_cldr/shared/properties_database.rb +180 -0
- data/lib/twitter_cldr/shared/property_name_aliases.rb +48 -0
- data/lib/twitter_cldr/shared/property_normalizer.rb +108 -0
- data/lib/twitter_cldr/shared/property_set.rb +113 -0
- data/lib/twitter_cldr/shared/property_value_aliases.rb +99 -0
- data/lib/twitter_cldr/shared/unicode_regex.rb +29 -3
- data/lib/twitter_cldr/shared.rb +9 -1
- data/lib/twitter_cldr/tokenizers/numbers/number_tokenizer.rb +1 -1
- data/lib/twitter_cldr/tokenizers/token.rb +1 -1
- data/lib/twitter_cldr/tokenizers/tokenizer.rb +15 -13
- data/lib/twitter_cldr/tokenizers/unicode_regex/unicode_regex_tokenizer.rb +4 -4
- data/lib/twitter_cldr/utils/file_system_trie.rb +145 -0
- data/lib/twitter_cldr/utils/range_set.rb +131 -31
- data/lib/twitter_cldr/utils/regexp_sampler.rb +0 -1
- data/lib/twitter_cldr/utils/script_detector.rb +75 -0
- data/lib/twitter_cldr/utils/yaml.rb +3 -3
- data/lib/twitter_cldr/utils.rb +8 -5
- data/lib/twitter_cldr/version.rb +1 -1
- data/lib/twitter_cldr/versions.rb +30 -0
- data/lib/twitter_cldr.rb +8 -10
- data/resources/locales/af/calendars.yml +8 -8
- data/resources/locales/af/lists.yml +8 -4
- data/resources/locales/af/numbers.yml +54 -30
- data/resources/locales/ar/lists.yml +8 -4
- data/resources/locales/ar/numbers.yml +48 -24
- data/resources/locales/be/calendars.yml +4 -4
- data/resources/locales/be/lists.yml +2 -1
- data/resources/locales/be/numbers.yml +24 -12
- data/resources/locales/bg/calendars.yml +8 -8
- data/resources/locales/bg/lists.yml +8 -4
- data/resources/locales/bg/numbers.yml +48 -24
- data/resources/locales/bn/lists.yml +8 -4
- data/resources/locales/bn/numbers.yml +48 -24
- data/resources/locales/ca/calendars.yml +8 -8
- data/resources/locales/ca/lists.yml +8 -4
- data/resources/locales/ca/numbers.yml +48 -24
- data/resources/locales/cs/calendars.yml +32 -32
- data/resources/locales/cs/lists.yml +8 -4
- data/resources/locales/cs/numbers.yml +48 -24
- data/resources/locales/cy/calendars.yml +8 -8
- data/resources/locales/cy/lists.yml +6 -3
- data/resources/locales/cy/numbers.yml +48 -24
- data/resources/locales/da/calendars.yml +10 -10
- data/resources/locales/da/lists.yml +8 -4
- data/resources/locales/da/numbers.yml +48 -24
- data/resources/locales/de/calendars.yml +8 -8
- data/resources/locales/de/lists.yml +8 -4
- data/resources/locales/de/numbers.yml +48 -24
- data/resources/locales/de-CH/calendars.yml +8 -8
- data/resources/locales/de-CH/lists.yml +8 -4
- data/resources/locales/de-CH/numbers.yml +48 -24
- data/resources/locales/el/calendars.yml +8 -8
- data/resources/locales/el/lists.yml +8 -4
- data/resources/locales/el/numbers.yml +48 -24
- data/resources/locales/en/calendars.yml +4 -4
- data/resources/locales/en/lists.yml +8 -4
- data/resources/locales/en/numbers.yml +48 -24
- data/resources/locales/en-150/calendars.yml +4 -4
- data/resources/locales/en-150/lists.yml +8 -4
- data/resources/locales/en-150/numbers.yml +48 -24
- data/resources/locales/en-AU/calendars.yml +4 -4
- data/resources/locales/en-AU/lists.yml +8 -4
- data/resources/locales/en-AU/numbers.yml +48 -24
- data/resources/locales/en-CA/calendars.yml +4 -4
- data/resources/locales/en-CA/lists.yml +8 -4
- data/resources/locales/en-CA/numbers.yml +48 -24
- data/resources/locales/en-GB/calendars.yml +4 -4
- data/resources/locales/en-GB/lists.yml +8 -4
- data/resources/locales/en-GB/numbers.yml +48 -24
- data/resources/locales/en-IE/calendars.yml +4 -4
- data/resources/locales/en-IE/lists.yml +8 -4
- data/resources/locales/en-IE/numbers.yml +48 -24
- data/resources/locales/en-SG/calendars.yml +4 -4
- data/resources/locales/en-SG/lists.yml +8 -4
- data/resources/locales/en-SG/numbers.yml +48 -24
- data/resources/locales/en-ZA/calendars.yml +4 -4
- data/resources/locales/en-ZA/lists.yml +8 -4
- data/resources/locales/en-ZA/numbers.yml +48 -24
- data/resources/locales/es/lists.yml +8 -4
- data/resources/locales/es/numbers.yml +48 -24
- data/resources/locales/es-419/calendars.yml +8 -8
- data/resources/locales/es-419/lists.yml +8 -4
- data/resources/locales/es-419/numbers.yml +50 -26
- data/resources/locales/es-CO/lists.yml +8 -4
- data/resources/locales/es-CO/numbers.yml +48 -24
- data/resources/locales/es-MX/lists.yml +8 -4
- data/resources/locales/es-MX/numbers.yml +48 -24
- data/resources/locales/es-US/lists.yml +8 -4
- data/resources/locales/es-US/numbers.yml +48 -24
- data/resources/locales/eu/calendars.yml +8 -8
- data/resources/locales/eu/lists.yml +8 -4
- data/resources/locales/eu/numbers.yml +48 -24
- data/resources/locales/fa/lists.yml +8 -4
- data/resources/locales/fa/numbers.yml +48 -24
- data/resources/locales/fi/calendars.yml +8 -8
- data/resources/locales/fi/lists.yml +8 -4
- data/resources/locales/fi/numbers.yml +48 -24
- data/resources/locales/fil/calendars.yml +8 -8
- data/resources/locales/fil/lists.yml +8 -4
- data/resources/locales/fil/numbers.yml +48 -24
- data/resources/locales/fr/calendars.yml +8 -8
- data/resources/locales/fr/lists.yml +8 -4
- data/resources/locales/fr/numbers.yml +48 -24
- data/resources/locales/fr-BE/calendars.yml +8 -8
- data/resources/locales/fr-BE/lists.yml +8 -4
- data/resources/locales/fr-BE/numbers.yml +48 -24
- data/resources/locales/fr-CA/calendars.yml +8 -8
- data/resources/locales/fr-CA/lists.yml +8 -4
- data/resources/locales/fr-CA/numbers.yml +48 -24
- data/resources/locales/fr-CH/calendars.yml +8 -8
- data/resources/locales/fr-CH/lists.yml +8 -4
- data/resources/locales/fr-CH/numbers.yml +48 -24
- data/resources/locales/ga/calendars.yml +8 -8
- data/resources/locales/ga/lists.yml +8 -4
- data/resources/locales/ga/numbers.yml +48 -24
- data/resources/locales/gl/calendars.yml +8 -8
- data/resources/locales/gl/lists.yml +8 -4
- data/resources/locales/gl/numbers.yml +48 -24
- data/resources/locales/he/calendars.yml +28 -28
- data/resources/locales/he/lists.yml +8 -4
- data/resources/locales/he/numbers.yml +48 -24
- data/resources/locales/hi/calendars.yml +8 -8
- data/resources/locales/hi/lists.yml +8 -4
- data/resources/locales/hi/numbers.yml +48 -24
- data/resources/locales/hr/lists.yml +8 -4
- data/resources/locales/hr/numbers.yml +48 -24
- data/resources/locales/hu/lists.yml +8 -4
- data/resources/locales/hu/numbers.yml +48 -24
- data/resources/locales/id/calendars.yml +8 -8
- data/resources/locales/id/lists.yml +8 -4
- data/resources/locales/id/numbers.yml +49 -25
- data/resources/locales/is/calendars.yml +8 -8
- data/resources/locales/is/lists.yml +8 -4
- data/resources/locales/is/numbers.yml +48 -24
- data/resources/locales/it/calendars.yml +8 -8
- data/resources/locales/it/lists.yml +8 -4
- data/resources/locales/it/numbers.yml +54 -30
- data/resources/locales/it-CH/calendars.yml +8 -8
- data/resources/locales/it-CH/lists.yml +8 -4
- data/resources/locales/it-CH/numbers.yml +54 -30
- data/resources/locales/ja/calendars.yml +32 -32
- data/resources/locales/ja/lists.yml +8 -4
- data/resources/locales/ja/numbers.yml +48 -24
- data/resources/locales/ko/calendars.yml +8 -8
- data/resources/locales/ko/lists.yml +8 -4
- data/resources/locales/ko/numbers.yml +48 -24
- data/resources/locales/lv/lists.yml +8 -4
- data/resources/locales/lv/numbers.yml +48 -24
- data/resources/locales/ms/calendars.yml +8 -8
- data/resources/locales/ms/lists.yml +8 -4
- data/resources/locales/ms/numbers.yml +48 -24
- data/resources/locales/nb/calendars.yml +9 -9
- data/resources/locales/nb/lists.yml +8 -4
- data/resources/locales/nb/numbers.yml +48 -24
- data/resources/locales/nl/calendars.yml +8 -8
- data/resources/locales/nl/lists.yml +8 -4
- data/resources/locales/nl/numbers.yml +48 -24
- data/resources/locales/pl/calendars.yml +8 -8
- data/resources/locales/pl/lists.yml +8 -4
- data/resources/locales/pl/numbers.yml +48 -24
- data/resources/locales/pt/calendars.yml +8 -8
- data/resources/locales/pt/lists.yml +8 -4
- data/resources/locales/pt/numbers.yml +48 -24
- data/resources/locales/ro/calendars.yml +8 -8
- data/resources/locales/ro/lists.yml +8 -4
- data/resources/locales/ro/numbers.yml +48 -24
- data/resources/locales/ru/calendars.yml +8 -8
- data/resources/locales/ru/lists.yml +8 -4
- data/resources/locales/ru/numbers.yml +48 -24
- data/resources/locales/sk/calendars.yml +8 -8
- data/resources/locales/sk/lists.yml +8 -4
- data/resources/locales/sk/numbers.yml +48 -24
- data/resources/locales/sq/calendars.yml +8 -8
- data/resources/locales/sq/lists.yml +8 -4
- data/resources/locales/sq/numbers.yml +48 -24
- data/resources/locales/sr/lists.yml +8 -4
- data/resources/locales/sr/numbers.yml +48 -24
- data/resources/locales/sv/calendars.yml +10 -10
- data/resources/locales/sv/lists.yml +8 -4
- data/resources/locales/sv/numbers.yml +48 -24
- data/resources/locales/ta/calendars.yml +8 -8
- data/resources/locales/ta/lists.yml +8 -4
- data/resources/locales/ta/numbers.yml +48 -24
- data/resources/locales/th/calendars.yml +8 -8
- data/resources/locales/th/lists.yml +8 -4
- data/resources/locales/th/numbers.yml +48 -24
- data/resources/locales/tr/lists.yml +8 -4
- data/resources/locales/tr/numbers.yml +50 -26
- data/resources/locales/uk/calendars.yml +8 -8
- data/resources/locales/uk/lists.yml +8 -4
- data/resources/locales/uk/numbers.yml +48 -24
- data/resources/locales/ur/calendars.yml +8 -8
- data/resources/locales/ur/lists.yml +8 -4
- data/resources/locales/ur/numbers.yml +48 -24
- data/resources/locales/vi/calendars.yml +32 -32
- data/resources/locales/vi/lists.yml +8 -4
- data/resources/locales/vi/numbers.yml +48 -24
- data/resources/locales/zh/calendars.yml +32 -32
- data/resources/locales/zh/lists.yml +8 -4
- data/resources/locales/zh/numbers.yml +48 -24
- data/resources/locales/zh-Hant/calendars.yml +32 -32
- data/resources/locales/zh-Hant/lists.yml +8 -4
- data/resources/locales/zh-Hant/numbers.yml +48 -24
- data/resources/shared/aliases.yml +1351 -0
- data/resources/shared/likely_subtags.yml +1149 -0
- data/resources/shared/postal_codes.yml +486 -289
- data/resources/shared/segments/segments_root.yml +57 -57
- data/resources/shared/segments/tests/sentence_break_test.yml +527 -0
- data/resources/shared/segments/tests/word_break_test.yml +1379 -0
- data/resources/shared/territories_containment.yml +25 -17
- data/resources/shared/variables.yml +1194 -0
- data/resources/unicode_data/blocks/ahom.yml +913 -0
- data/resources/unicode_data/blocks/anatolian_hieroglyphs.yml +9329 -0
- data/resources/unicode_data/blocks/arabic.yml +16 -0
- data/resources/unicode_data/blocks/arabic_presentation_forms_a.yml +2 -2
- data/resources/unicode_data/blocks/bassa_vah.yml +577 -0
- data/resources/unicode_data/blocks/buginese.yml +2 -2
- data/resources/unicode_data/blocks/caucasian_albanian.yml +849 -0
- data/resources/unicode_data/blocks/cherokee_supplement.yml +1281 -0
- data/resources/unicode_data/blocks/cjk_unified_ideographs_extension_e.yml +33 -0
- data/resources/unicode_data/blocks/combining_diacritical_marks_extended.yml +241 -0
- data/resources/unicode_data/blocks/coptic_epact_numbers.yml +449 -0
- data/resources/unicode_data/blocks/cuneiform_numbers_and_punctuation.yml +2 -2
- data/resources/unicode_data/blocks/duployan.yml +2289 -0
- data/resources/unicode_data/blocks/early_dynastic_cuneiform.yml +3137 -0
- data/resources/unicode_data/blocks/elbasan.yml +641 -0
- data/resources/unicode_data/blocks/general_punctuation.yml +64 -0
- data/resources/unicode_data/blocks/geometric_shapes_extended.yml +1361 -0
- data/resources/unicode_data/blocks/grantha.yml +1361 -0
- data/resources/unicode_data/blocks/gujarati.yml +0 -16
- data/resources/unicode_data/blocks/hatran.yml +417 -0
- data/resources/unicode_data/blocks/kannada.yml +0 -16
- data/resources/unicode_data/blocks/khojki.yml +977 -0
- data/resources/unicode_data/blocks/khudawadi.yml +1105 -0
- data/resources/unicode_data/blocks/latin_extended_e.yml +865 -0
- data/resources/unicode_data/blocks/linear_a.yml +5457 -0
- data/resources/unicode_data/blocks/mahajani.yml +625 -0
- data/resources/unicode_data/blocks/manichaean.yml +817 -0
- data/resources/unicode_data/blocks/mende_kikakui.yml +3409 -0
- data/resources/unicode_data/blocks/miscellaneous_technical.yml +4 -4
- data/resources/unicode_data/blocks/modi.yml +1265 -0
- data/resources/unicode_data/blocks/mongolian.yml +2 -2
- data/resources/unicode_data/blocks/mro.yml +689 -0
- data/resources/unicode_data/blocks/multani.yml +609 -0
- data/resources/unicode_data/blocks/myanmar_extended_b.yml +497 -0
- data/resources/unicode_data/blocks/nabataean.yml +641 -0
- data/resources/unicode_data/blocks/old_hungarian.yml +1729 -0
- data/resources/unicode_data/blocks/old_north_arabian.yml +513 -0
- data/resources/unicode_data/blocks/old_permic.yml +689 -0
- data/resources/unicode_data/blocks/ornamental_dingbats.yml +769 -0
- data/resources/unicode_data/blocks/pahawh_hmong.yml +2033 -0
- data/resources/unicode_data/blocks/palmyrene.yml +513 -0
- data/resources/unicode_data/blocks/pau_cin_hau.yml +913 -0
- data/resources/unicode_data/blocks/psalter_pahlavi.yml +465 -0
- data/resources/unicode_data/blocks/shorthand_format_controls.yml +65 -0
- data/resources/unicode_data/blocks/siddham.yml +1473 -0
- data/resources/unicode_data/blocks/sinhala_archaic_numbers.yml +321 -0
- data/resources/unicode_data/blocks/supplemental_arrows_c.yml +2369 -0
- data/resources/unicode_data/blocks/supplemental_symbols_and_pictographs.yml +241 -0
- data/resources/unicode_data/blocks/sutton_signwriting.yml +10753 -0
- data/resources/unicode_data/blocks/tirhuta.yml +1313 -0
- data/resources/unicode_data/blocks/warang_citi.yml +1345 -0
- data/resources/unicode_data/properties/ASCII_Hex_Digit/value.dump +5 -0
- data/resources/unicode_data/properties/Age/1.1/value.dump +0 -0
- data/resources/unicode_data/properties/Age/2.0/value.dump +0 -0
- data/resources/unicode_data/properties/Age/2.1/value.dump +4 -0
- data/resources/unicode_data/properties/Age/3.0/value.dump +0 -0
- data/resources/unicode_data/properties/Age/3.1/value.dump +0 -0
- data/resources/unicode_data/properties/Age/3.2/value.dump +0 -0
- data/resources/unicode_data/properties/Age/4.0/value.dump +0 -0
- data/resources/unicode_data/properties/Age/4.1/value.dump +0 -0
- data/resources/unicode_data/properties/Age/5.0/value.dump +0 -0
- data/resources/unicode_data/properties/Age/5.1/value.dump +0 -0
- data/resources/unicode_data/properties/Age/5.2/value.dump +0 -0
- data/resources/unicode_data/properties/Age/6.0/value.dump +0 -0
- data/resources/unicode_data/properties/Age/6.1/value.dump +0 -0
- data/resources/unicode_data/properties/Age/6.2/value.dump +3 -0
- data/resources/unicode_data/properties/Age/6.3/value.dump +4 -0
- data/resources/unicode_data/properties/Alphabetic/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Class/AL/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Class/AN/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Class/B/value.dump +8 -0
- data/resources/unicode_data/properties/Bidi_Class/BN/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Class/CS/value.dump +15 -0
- data/resources/unicode_data/properties/Bidi_Class/EN/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Class/ES/value.dump +11 -0
- data/resources/unicode_data/properties/Bidi_Class/ET/value.dump +27 -0
- data/resources/unicode_data/properties/Bidi_Class/FSI/value.dump +3 -0
- data/resources/unicode_data/properties/Bidi_Class/L/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Class/LRE/value.dump +3 -0
- data/resources/unicode_data/properties/Bidi_Class/LRI/value.dump +3 -0
- data/resources/unicode_data/properties/Bidi_Class/LRO/value.dump +3 -0
- data/resources/unicode_data/properties/Bidi_Class/NSM/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Class/ON/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Class/PDF/value.dump +3 -0
- data/resources/unicode_data/properties/Bidi_Class/PDI/value.dump +3 -0
- data/resources/unicode_data/properties/Bidi_Class/R/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Class/RLE/value.dump +3 -0
- data/resources/unicode_data/properties/Bidi_Class/RLI/value.dump +3 -0
- data/resources/unicode_data/properties/Bidi_Class/RLO/value.dump +3 -0
- data/resources/unicode_data/properties/Bidi_Class/S/value.dump +5 -0
- data/resources/unicode_data/properties/Bidi_Class/WS/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Control/value.dump +4 -0
- data/resources/unicode_data/properties/Bidi_Mirrored/N/value.dump +0 -0
- data/resources/unicode_data/properties/Bidi_Mirrored/Y/value.dump +115 -0
- data/resources/unicode_data/properties/Block/Aegean Numbers/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Alchemical Symbols/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Alphabetic Presentation Forms/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Ancient Greek Musical Notation/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Ancient Greek Numbers/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Ancient Symbols/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Arabic/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Arabic Extended-A/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Arabic Mathematical Alphabetic Symbols/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Arabic Presentation Forms-A/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Arabic Presentation Forms-B/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Arabic Supplement/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Armenian/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Arrows/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Avestan/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Balinese/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Bamum/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Bamum Supplement/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Basic Latin/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Batak/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Bengali/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Block Elements/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Bopomofo/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Bopomofo Extended/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Box Drawing/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Brahmi/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Braille Patterns/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Buginese/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Buhid/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Byzantine Musical Symbols/value.dump +0 -0
- data/resources/unicode_data/properties/Block/CJK Compatibility/value.dump +0 -0
- data/resources/unicode_data/properties/Block/CJK Compatibility Forms/value.dump +3 -0
- data/resources/unicode_data/properties/Block/CJK Compatibility Ideographs/value.dump +0 -0
- data/resources/unicode_data/properties/Block/CJK Compatibility Ideographs Supplement/value.dump +0 -0
- data/resources/unicode_data/properties/Block/CJK Radicals Supplement/value.dump +3 -0
- data/resources/unicode_data/properties/Block/CJK Strokes/value.dump +3 -0
- data/resources/unicode_data/properties/Block/CJK Symbols and Punctuation/value.dump +0 -0
- data/resources/unicode_data/properties/Block/CJK Unified Ideographs/value.dump +0 -0
- data/resources/unicode_data/properties/Block/CJK Unified Ideographs Extension A/value.dump +0 -0
- data/resources/unicode_data/properties/Block/CJK Unified Ideographs Extension B/value.dump +0 -0
- data/resources/unicode_data/properties/Block/CJK Unified Ideographs Extension C/value.dump +0 -0
- data/resources/unicode_data/properties/Block/CJK Unified Ideographs Extension D/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Carian/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Chakma/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Cham/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Cherokee/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Combining Diacritical Marks/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Combining Diacritical Marks Supplement/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Combining Diacritical Marks for Symbols/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Combining Half Marks/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Common Indic Number Forms/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Control Pictures/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Coptic/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Counting Rod Numerals/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Cuneiform/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Cuneiform Numbers and Punctuation/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Currency Symbols/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Cypriot Syllabary/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Cyrillic/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Cyrillic Extended-A/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Cyrillic Extended-B/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Cyrillic Supplement/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Deseret/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Devanagari/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Devanagari Extended/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Dingbats/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Domino Tiles/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Egyptian Hieroglyphs/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Emoticons/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Enclosed Alphanumeric Supplement/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Enclosed Alphanumerics/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Enclosed CJK Letters and Months/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Enclosed Ideographic Supplement/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Ethiopic/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Ethiopic Extended/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Ethiopic Extended-A/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Ethiopic Supplement/value.dump +3 -0
- data/resources/unicode_data/properties/Block/General Punctuation/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Geometric Shapes/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Georgian/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Georgian Supplement/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Glagolitic/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Gothic/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Greek Extended/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Greek and Coptic/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Gujarati/value.dump +4 -0
- data/resources/unicode_data/properties/Block/Gurmukhi/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Halfwidth and Fullwidth Forms/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Hangul Compatibility Jamo/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Hangul Jamo/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Hangul Jamo Extended-A/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Hangul Jamo Extended-B/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Hangul Syllables/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Hanunoo/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Hebrew/value.dump +3 -0
- data/resources/unicode_data/properties/Block/High Private Use Surrogates/value.dump +3 -0
- data/resources/unicode_data/properties/Block/High Surrogates/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Hiragana/value.dump +3 -0
- data/resources/unicode_data/properties/Block/IPA Extensions/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Ideographic Description Characters/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Imperial Aramaic/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Inscriptional Pahlavi/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Inscriptional Parthian/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Javanese/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Kaithi/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Kana Supplement/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Kanbun/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Kangxi Radicals/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Kannada/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Katakana/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Katakana Phonetic Extensions/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Kayah Li/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Kharoshthi/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Khmer/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Khmer Symbols/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Lao/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Latin Extended Additional/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Latin Extended-A/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Latin Extended-B/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Latin Extended-C/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Latin Extended-D/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Latin-1 Supplement/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Lepcha/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Letterlike Symbols/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Limbu/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Linear B Ideograms/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Linear B Syllabary/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Lisu/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Low Surrogates/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Lycian/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Lydian/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Mahjong Tiles/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Malayalam/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Mandaic/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Mathematical Alphanumeric Symbols/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Mathematical Operators/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Meetei Mayek/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Meetei Mayek Extensions/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Meroitic Cursive/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Meroitic Hieroglyphs/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Miao/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Miscellaneous Mathematical Symbols-A/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Miscellaneous Mathematical Symbols-B/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Miscellaneous Symbols/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Miscellaneous Symbols And Pictographs/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Miscellaneous Symbols and Arrows/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Miscellaneous Technical/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Modifier Tone Letters/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Mongolian/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Musical Symbols/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Myanmar/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Myanmar Extended-A/value.dump +3 -0
- data/resources/unicode_data/properties/Block/NKo/value.dump +3 -0
- data/resources/unicode_data/properties/Block/New Tai Lue/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Number Forms/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Ogham/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Ol Chiki/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Old Italic/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Old Persian/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Old South Arabian/value.dump +5 -0
- data/resources/unicode_data/properties/Block/Old Turkic/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Optical Character Recognition/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Oriya/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Osmanya/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Phags-pa/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Phaistos Disc/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Phoenician/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Phonetic Extensions/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Phonetic Extensions Supplement/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Playing Cards/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Private Use Area/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Rejang/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Rumi Numeral Symbols/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Runic/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Samaritan/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Saurashtra/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Sharada/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Shavian/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Sinhala/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Small Form Variants/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Sora Sompeng/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Spacing Modifier Letters/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Specials/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Sundanese/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Sundanese Supplement/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Superscripts and Subscripts/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Supplemental Arrows-A/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Supplemental Arrows-B/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Supplemental Mathematical Operators/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Supplemental Punctuation/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Supplementary Private Use Area-A/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Supplementary Private Use Area-B/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Syloti Nagri/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Syriac/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Tagalog/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Tagbanwa/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Tags/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Tai Le/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Tai Tham/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Tai Viet/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Tai Xuan Jing Symbols/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Takri/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Tamil/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Telugu/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Thaana/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Thai/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Tibetan/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Tifinagh/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Transport And Map Symbols/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Ugaritic/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Unified Canadian Aboriginal Syllabics/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Unified Canadian Aboriginal Syllabics Extended/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Vai/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Variation Selectors/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Variation Selectors Supplement/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Vedic Extensions/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Vertical Forms/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Yi Radicals/value.dump +3 -0
- data/resources/unicode_data/properties/Block/Yi Syllables/value.dump +0 -0
- data/resources/unicode_data/properties/Block/Yijing Hexagram Symbols/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/0/value.dump +0 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/1/value.dump +13 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/10/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/103/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/107/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/11/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/118/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/12/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/122/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/129/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/13/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/130/value.dump +5 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/132/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/14/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/15/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/16/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/17/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/18/value.dump +4 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/19/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/20/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/202/value.dump +5 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/21/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/214/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/216/value.dump +6 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/218/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/22/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/220/value.dump +70 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/222/value.dump +6 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/224/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/226/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/228/value.dump +5 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/23/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/230/value.dump +0 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/232/value.dump +6 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/233/value.dump +6 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/234/value.dump +5 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/24/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/240/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/25/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/26/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/27/value.dump +4 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/28/value.dump +4 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/29/value.dump +4 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/30/value.dump +4 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/31/value.dump +4 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/32/value.dump +4 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/33/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/34/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/35/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/36/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/7/value.dump +19 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/8/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/84/value.dump +3 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/9/value.dump +41 -0
- data/resources/unicode_data/properties/Canonical_Combining_Class/91/value.dump +3 -0
- data/resources/unicode_data/properties/Case_Ignorable/value.dump +0 -0
- data/resources/unicode_data/properties/Cased/value.dump +0 -0
- data/resources/unicode_data/properties/Changes_When_Casefolded/value.dump +0 -0
- data/resources/unicode_data/properties/Changes_When_Casemapped/value.dump +0 -0
- data/resources/unicode_data/properties/Changes_When_Lowercased/value.dump +0 -0
- data/resources/unicode_data/properties/Changes_When_Titlecased/value.dump +589 -0
- data/resources/unicode_data/properties/Changes_When_Uppercased/value.dump +588 -0
- data/resources/unicode_data/properties/Dash/value.dump +0 -0
- data/resources/unicode_data/properties/Default_Ignorable_Code_Point/value.dump +0 -0
- data/resources/unicode_data/properties/Deprecated/value.dump +0 -0
- data/resources/unicode_data/properties/Diacritic/value.dump +135 -0
- data/resources/unicode_data/properties/East_Asian_Width/A/value.dump +0 -0
- data/resources/unicode_data/properties/East_Asian_Width/F/value.dump +0 -0
- data/resources/unicode_data/properties/East_Asian_Width/H/value.dump +9 -0
- data/resources/unicode_data/properties/East_Asian_Width/N/value.dump +0 -0
- data/resources/unicode_data/properties/East_Asian_Width/Na/value.dump +9 -0
- data/resources/unicode_data/properties/East_Asian_Width/W/value.dump +0 -0
- data/resources/unicode_data/properties/Extender/value.dump +26 -0
- data/resources/unicode_data/properties/General_Category/C/c/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/C/f/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/C/o/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/C/s/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/L/l/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/L/m/value.dump +54 -0
- data/resources/unicode_data/properties/General_Category/L/o/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/L/t/value.dump +12 -0
- data/resources/unicode_data/properties/General_Category/L/u/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/M/c/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/M/e/value.dump +6 -0
- data/resources/unicode_data/properties/General_Category/M/n/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/N/d/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/N/l/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/N/o/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/P/c/value.dump +8 -0
- data/resources/unicode_data/properties/General_Category/P/d/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/P/e/value.dump +72 -0
- data/resources/unicode_data/properties/General_Category/P/f/value.dump +14 -0
- data/resources/unicode_data/properties/General_Category/P/i/value.dump +13 -0
- data/resources/unicode_data/properties/General_Category/P/o/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/P/s/value.dump +76 -0
- data/resources/unicode_data/properties/General_Category/S/c/value.dump +21 -0
- data/resources/unicode_data/properties/General_Category/S/k/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/S/m/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/S/o/value.dump +0 -0
- data/resources/unicode_data/properties/General_Category/Z/l/value.dump +3 -0
- data/resources/unicode_data/properties/General_Category/Z/p/value.dump +3 -0
- data/resources/unicode_data/properties/General_Category/Z/s/value.dump +0 -0
- data/resources/unicode_data/properties/Grapheme_Base/value.dump +0 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/CR/value.dump +3 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/Control/value.dump +0 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/Extend/value.dump +0 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/L/value.dump +0 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/LF/value.dump +3 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/LV/value.dump +0 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/LVT/value.dump +401 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/Regional_Indicator/value.dump +3 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/SpacingMark/value.dump +0 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/T/value.dump +4 -0
- data/resources/unicode_data/properties/Grapheme_Cluster_Break/V/value.dump +4 -0
- data/resources/unicode_data/properties/Grapheme_Extend/value.dump +0 -0
- data/resources/unicode_data/properties/Grapheme_Link/value.dump +41 -0
- data/resources/unicode_data/properties/Hangul_Syllable_Type/L/value.dump +0 -0
- data/resources/unicode_data/properties/Hangul_Syllable_Type/LV/value.dump +0 -0
- data/resources/unicode_data/properties/Hangul_Syllable_Type/LVT/value.dump +401 -0
- data/resources/unicode_data/properties/Hangul_Syllable_Type/T/value.dump +4 -0
- data/resources/unicode_data/properties/Hangul_Syllable_Type/V/value.dump +4 -0
- data/resources/unicode_data/properties/Hex_Digit/value.dump +8 -0
- data/resources/unicode_data/properties/Hyphen/value.dump +12 -0
- data/resources/unicode_data/properties/IDS_Binary_Operator/value.dump +4 -0
- data/resources/unicode_data/properties/IDS_Trinary_Operator/value.dump +3 -0
- data/resources/unicode_data/properties/ID_Continue/value.dump +0 -0
- data/resources/unicode_data/properties/ID_Start/value.dump +0 -0
- data/resources/unicode_data/properties/Ideographic/value.dump +0 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Bottom/value.dump +78 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Bottom_And_Right/value.dump +4 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Invisible/value.dump +10 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Left/value.dump +36 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Left_And_Right/value.dump +10 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Overstruck/value.dump +8 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Right/value.dump +86 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Top/value.dump +91 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Top_And_Bottom/value.dump +8 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Top_And_Bottom_And_Right/value.dump +3 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Top_And_Left/value.dump +6 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Top_And_Left_And_Right/value.dump +4 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Top_And_Right/value.dump +12 -0
- data/resources/unicode_data/properties/Indic_Positional_Category/Visual_Order_Left/value.dump +8 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Avagraha/value.dump +15 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Bindu/value.dump +0 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Consonant/value.dump +0 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Consonant_Dead/value.dump +4 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Consonant_Final/value.dump +13 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Consonant_Head_Letter/value.dump +3 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Consonant_Medial/value.dump +12 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Consonant_Placeholder/value.dump +0 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Consonant_Repha/value.dump +8 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Consonant_Subjoined/value.dump +11 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Modifying_Letter/value.dump +3 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Nukta/value.dump +18 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Register_Shifter/value.dump +3 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Tone_Letter/value.dump +5 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Tone_Mark/value.dump +17 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Virama/value.dump +41 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Visarga/value.dump +32 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Vowel/value.dump +6 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Vowel_Dependent/value.dump +112 -0
- data/resources/unicode_data/properties/Indic_Syllabic_Category/Vowel_Independent/value.dump +0 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/A/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/AE/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/B/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/BB/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/BS/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/C/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/D/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/DD/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/E/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/EO/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/EU/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/G/value.dump +0 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/GG/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/GS/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/H/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/I/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/J/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/JJ/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/K/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/L/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/LB/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/LG/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/LH/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/LM/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/LP/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/LS/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/LT/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/M/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/N/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/NG/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/NH/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/NJ/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/O/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/OE/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/P/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/R/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/S/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/SS/value.dump +6 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/T/value.dump +4 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/U/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/WA/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/WAE/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/WE/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/WEO/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/WI/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/YA/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/YAE/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/YE/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/YEO/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/YI/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/YO/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/YU/value.dump +3 -0
- data/resources/unicode_data/properties/Jamo_Short_Name/value.dump +3 -0
- data/resources/unicode_data/properties/Join_Control/value.dump +3 -0
- data/resources/unicode_data/properties/Line_Break/AI/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/AL/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/B2/value.dump +4 -0
- data/resources/unicode_data/properties/Line_Break/BA/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/BB/value.dump +15 -0
- data/resources/unicode_data/properties/Line_Break/BK/value.dump +4 -0
- data/resources/unicode_data/properties/Line_Break/CB/value.dump +3 -0
- data/resources/unicode_data/properties/Line_Break/CJ/value.dump +27 -0
- data/resources/unicode_data/properties/Line_Break/CL/value.dump +81 -0
- data/resources/unicode_data/properties/Line_Break/CM/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/CP/value.dump +4 -0
- data/resources/unicode_data/properties/Line_Break/CR/value.dump +3 -0
- data/resources/unicode_data/properties/Line_Break/EX/value.dump +24 -0
- data/resources/unicode_data/properties/Line_Break/GL/value.dump +13 -0
- data/resources/unicode_data/properties/Line_Break/H2/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/H3/value.dump +401 -0
- data/resources/unicode_data/properties/Line_Break/HL/value.dump +12 -0
- data/resources/unicode_data/properties/Line_Break/HY/value.dump +3 -0
- data/resources/unicode_data/properties/Line_Break/ID/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/IN/value.dump +4 -0
- data/resources/unicode_data/properties/Line_Break/IS/value.dump +12 -0
- data/resources/unicode_data/properties/Line_Break/JL/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/JT/value.dump +4 -0
- data/resources/unicode_data/properties/Line_Break/JV/value.dump +4 -0
- data/resources/unicode_data/properties/Line_Break/LF/value.dump +3 -0
- data/resources/unicode_data/properties/Line_Break/NL/value.dump +3 -0
- data/resources/unicode_data/properties/Line_Break/NS/value.dump +17 -0
- data/resources/unicode_data/properties/Line_Break/NU/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/OP/value.dump +83 -0
- data/resources/unicode_data/properties/Line_Break/PO/value.dump +20 -0
- data/resources/unicode_data/properties/Line_Break/PR/value.dump +24 -0
- data/resources/unicode_data/properties/Line_Break/QU/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/RI/value.dump +3 -0
- data/resources/unicode_data/properties/Line_Break/SA/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/SG/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/SP/value.dump +3 -0
- data/resources/unicode_data/properties/Line_Break/SY/value.dump +3 -0
- data/resources/unicode_data/properties/Line_Break/WJ/value.dump +4 -0
- data/resources/unicode_data/properties/Line_Break/XX/value.dump +0 -0
- data/resources/unicode_data/properties/Line_Break/ZW/value.dump +3 -0
- data/resources/unicode_data/properties/Logical_Order_Exception/value.dump +8 -0
- data/resources/unicode_data/properties/Lowercase/value.dump +0 -0
- data/resources/unicode_data/properties/Math/value.dump +0 -0
- data/resources/unicode_data/properties/Noncharacter_Code_Point/value.dump +22 -0
- data/resources/unicode_data/properties/Numeric_Type/0/value.dump +0 -0
- data/resources/unicode_data/properties/Numeric_Type/1/value.dump +69 -0
- data/resources/unicode_data/properties/Numeric_Type/2/value.dump +68 -0
- data/resources/unicode_data/properties/Numeric_Type/3/value.dump +68 -0
- data/resources/unicode_data/properties/Numeric_Type/4/value.dump +68 -0
- data/resources/unicode_data/properties/Numeric_Type/5/value.dump +65 -0
- data/resources/unicode_data/properties/Numeric_Type/6/value.dump +65 -0
- data/resources/unicode_data/properties/Numeric_Type/7/value.dump +65 -0
- data/resources/unicode_data/properties/Numeric_Type/8/value.dump +65 -0
- data/resources/unicode_data/properties/Numeric_Type/9/value.dump +67 -0
- data/resources/unicode_data/properties/Numeric_Type/value.dump +0 -0
- data/resources/unicode_data/properties/Other_Alphabetic/value.dump +0 -0
- data/resources/unicode_data/properties/Other_Default_Ignorable_Code_Point/value.dump +0 -0
- data/resources/unicode_data/properties/Other_Grapheme_Extend/value.dump +19 -0
- data/resources/unicode_data/properties/Other_ID_Continue/value.dump +6 -0
- data/resources/unicode_data/properties/Other_ID_Start/value.dump +5 -0
- data/resources/unicode_data/properties/Other_Lowercase/value.dump +20 -0
- data/resources/unicode_data/properties/Other_Math/value.dump +0 -0
- data/resources/unicode_data/properties/Other_Uppercase/value.dump +4 -0
- data/resources/unicode_data/properties/Pattern_Syntax/value.dump +0 -0
- data/resources/unicode_data/properties/Pattern_White_Space/value.dump +8 -0
- data/resources/unicode_data/properties/Quotation_Mark/value.dump +14 -0
- data/resources/unicode_data/properties/Radical/value.dump +0 -0
- data/resources/unicode_data/properties/STerm/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Arabic/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Armenian/value.dump +8 -0
- data/resources/unicode_data/properties/Script/Avestan/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Balinese/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Bamum/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Batak/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Bengali/value.dump +16 -0
- data/resources/unicode_data/properties/Script/Bopomofo/value.dump +5 -0
- data/resources/unicode_data/properties/Script/Brahmi/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Braille/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Buginese/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Buhid/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Canadian_Aboriginal/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Carian/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Chakma/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Cham/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Cherokee/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Common/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Coptic/value.dump +5 -0
- data/resources/unicode_data/properties/Script/Cuneiform/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Cypriot/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Cyrillic/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Deseret/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Devanagari/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Egyptian_Hieroglyphs/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Ethiopic/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Georgian/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Glagolitic/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Gothic/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Greek/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Gujarati/value.dump +40 -0
- data/resources/unicode_data/properties/Script/Gurmukhi/value.dump +50 -0
- data/resources/unicode_data/properties/Script/Han/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Hangul/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Hanunoo/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Hebrew/value.dump +11 -0
- data/resources/unicode_data/properties/Script/Hiragana/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Imperial_Aramaic/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Inherited/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Inscriptional_Pahlavi/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Inscriptional_Parthian/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Javanese/value.dump +5 -0
- data/resources/unicode_data/properties/Script/Kaithi/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Kannada/value.dump +16 -0
- data/resources/unicode_data/properties/Script/Katakana/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Kayah_Li/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Kharoshthi/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Khmer/value.dump +6 -0
- data/resources/unicode_data/properties/Script/Lao/value.dump +20 -0
- data/resources/unicode_data/properties/Script/Latin/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Lepcha/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Limbu/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Linear_B/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Lisu/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Lycian/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Lydian/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Malayalam/value.dump +13 -0
- data/resources/unicode_data/properties/Script/Mandaic/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Meetei_Mayek/value.dump +5 -0
- data/resources/unicode_data/properties/Script/Meroitic_Cursive/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Meroitic_Hieroglyphs/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Miao/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Mongolian/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Myanmar/value.dump +0 -0
- data/resources/unicode_data/properties/Script/New_Tai_Lue/value.dump +6 -0
- data/resources/unicode_data/properties/Script/Nko/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Ogham/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Ol_Chiki/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Old_Italic/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Old_Persian/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Old_South_Arabian/value.dump +5 -0
- data/resources/unicode_data/properties/Script/Old_Turkic/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Oriya/value.dump +16 -0
- data/resources/unicode_data/properties/Script/Osmanya/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Phags_Pa/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Phoenician/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Rejang/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Runic/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Samaritan/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Saurashtra/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Sharada/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Shavian/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Sinhala/value.dump +13 -0
- data/resources/unicode_data/properties/Script/Sora_Sompeng/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Sundanese/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Syloti_Nagri/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Syriac/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Tagalog/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Tagbanwa/value.dump +5 -0
- data/resources/unicode_data/properties/Script/Tai_Le/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Tai_Tham/value.dump +8 -0
- data/resources/unicode_data/properties/Script/Tai_Viet/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Takri/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Tamil/value.dump +18 -0
- data/resources/unicode_data/properties/Script/Telugu/value.dump +16 -0
- data/resources/unicode_data/properties/Script/Thaana/value.dump +3 -0
- data/resources/unicode_data/properties/Script/Thai/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Tibetan/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Tifinagh/value.dump +5 -0
- data/resources/unicode_data/properties/Script/Ugaritic/value.dump +4 -0
- data/resources/unicode_data/properties/Script/Vai/value.dump +0 -0
- data/resources/unicode_data/properties/Script/Yi/value.dump +0 -0
- data/resources/unicode_data/properties/Script_Extensions/Arab/value.dump +11 -0
- data/resources/unicode_data/properties/Script_Extensions/Armn/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Beng/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Bopo/value.dump +19 -0
- data/resources/unicode_data/properties/Script_Extensions/Bugi/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Buhd/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Cakm/value.dump +4 -0
- data/resources/unicode_data/properties/Script_Extensions/Cprt/value.dump +0 -0
- data/resources/unicode_data/properties/Script_Extensions/Cyrl/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Deva/value.dump +4 -0
- data/resources/unicode_data/properties/Script_Extensions/Geor/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Grek/value.dump +5 -0
- data/resources/unicode_data/properties/Script_Extensions/Gujr/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Guru/value.dump +4 -0
- data/resources/unicode_data/properties/Script_Extensions/Hang/value.dump +18 -0
- data/resources/unicode_data/properties/Script_Extensions/Hani/value.dump +21 -0
- data/resources/unicode_data/properties/Script_Extensions/Hano/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Hira/value.dump +24 -0
- data/resources/unicode_data/properties/Script_Extensions/Java/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Kana/value.dump +24 -0
- data/resources/unicode_data/properties/Script_Extensions/Kthi/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Latn/value.dump +5 -0
- data/resources/unicode_data/properties/Script_Extensions/Linb/value.dump +0 -0
- data/resources/unicode_data/properties/Script_Extensions/Mand/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Mong/value.dump +4 -0
- data/resources/unicode_data/properties/Script_Extensions/Mymr/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Orya/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Phag/value.dump +4 -0
- data/resources/unicode_data/properties/Script_Extensions/Sylo/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Syrc/value.dump +8 -0
- data/resources/unicode_data/properties/Script_Extensions/Tagb/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Takr/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Tale/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Tglg/value.dump +3 -0
- data/resources/unicode_data/properties/Script_Extensions/Thaa/value.dump +8 -0
- data/resources/unicode_data/properties/Script_Extensions/Yiii/value.dump +8 -0
- data/resources/unicode_data/properties/Sentence_Break/ATerm/value.dump +6 -0
- data/resources/unicode_data/properties/Sentence_Break/CR/value.dump +3 -0
- data/resources/unicode_data/properties/Sentence_Break/Close/value.dump +0 -0
- data/resources/unicode_data/properties/Sentence_Break/Extend/value.dump +0 -0
- data/resources/unicode_data/properties/Sentence_Break/Format/value.dump +0 -0
- data/resources/unicode_data/properties/Sentence_Break/LF/value.dump +3 -0
- data/resources/unicode_data/properties/Sentence_Break/Lower/value.dump +0 -0
- data/resources/unicode_data/properties/Sentence_Break/Numeric/value.dump +0 -0
- data/resources/unicode_data/properties/Sentence_Break/OLetter/value.dump +0 -0
- data/resources/unicode_data/properties/Sentence_Break/SContinue/value.dump +21 -0
- data/resources/unicode_data/properties/Sentence_Break/STerm/value.dump +0 -0
- data/resources/unicode_data/properties/Sentence_Break/Sep/value.dump +4 -0
- data/resources/unicode_data/properties/Sentence_Break/Sp/value.dump +0 -0
- data/resources/unicode_data/properties/Sentence_Break/Upper/value.dump +0 -0
- data/resources/unicode_data/properties/Soft_Dotted/value.dump +33 -0
- data/resources/unicode_data/properties/Terminal_Punctuation/value.dump +0 -0
- data/resources/unicode_data/properties/Unified_Ideograph/value.dump +0 -0
- data/resources/unicode_data/properties/Uppercase/value.dump +0 -0
- data/resources/unicode_data/properties/Variation_Selector/value.dump +0 -0
- data/resources/unicode_data/properties/White_Space/value.dump +0 -0
- data/resources/unicode_data/properties/Word_Break/ALetter/value.dump +0 -0
- data/resources/unicode_data/properties/Word_Break/CR/value.dump +3 -0
- data/resources/unicode_data/properties/Word_Break/Double_Quote/value.dump +3 -0
- data/resources/unicode_data/properties/Word_Break/Extend/value.dump +0 -0
- data/resources/unicode_data/properties/Word_Break/ExtendNumLet/value.dump +8 -0
- data/resources/unicode_data/properties/Word_Break/Format/value.dump +0 -0
- data/resources/unicode_data/properties/Word_Break/Hebrew_Letter/value.dump +12 -0
- data/resources/unicode_data/properties/Word_Break/Katakana/value.dump +0 -0
- data/resources/unicode_data/properties/Word_Break/LF/value.dump +3 -0
- data/resources/unicode_data/properties/Word_Break/MidLetter/value.dump +10 -0
- data/resources/unicode_data/properties/Word_Break/MidNum/value.dump +16 -0
- data/resources/unicode_data/properties/Word_Break/MidNumLet/value.dump +9 -0
- data/resources/unicode_data/properties/Word_Break/Newline/value.dump +5 -0
- data/resources/unicode_data/properties/Word_Break/Numeric/value.dump +0 -0
- data/resources/unicode_data/properties/Word_Break/Regional_Indicator/value.dump +3 -0
- data/resources/unicode_data/properties/Word_Break/Single_Quote/value.dump +3 -0
- data/resources/unicode_data/properties/XID_Continue/value.dump +0 -0
- data/resources/unicode_data/properties/XID_Start/value.dump +0 -0
- data/resources/unicode_data/property_aliases.yml +350 -0
- data/resources/unicode_data/property_value_aliases.yml +1829 -0
- data/spec/bidi/bidi_spec.rb +2 -2
- data/spec/collation/collation_spec.rb +1 -1
- data/spec/collation/collator_spec.rb +6 -6
- data/spec/collation/sort_key_builder_spec.rb +11 -11
- data/spec/collation/tailoring_spec.rb +1 -1
- data/spec/collation/trie_dumps_spec.rb +1 -1
- data/spec/data_readers/date_time_data_reader_spec.rb +1 -1
- data/spec/data_readers/number_data_reader_spec.rb +19 -6
- data/spec/formatters/calendars/datetime_formatter_spec.rb +1 -1
- data/spec/formatters/numbers/abbreviated/abbreviated_number_formatter_spec.rb +1 -1
- data/spec/formatters/numbers/abbreviated/long_decimal_formatter_spec.rb +5 -5
- data/spec/formatters/numbers/abbreviated/short_decimal_formatter_spec.rb +4 -4
- data/spec/formatters/numbers/currency_formatter_spec.rb +10 -10
- data/spec/formatters/numbers/decimal_formatter_spec.rb +2 -2
- data/spec/formatters/numbers/helpers/fraction_spec.rb +4 -4
- data/spec/formatters/numbers/helpers/integer_spec.rb +21 -16
- data/spec/formatters/numbers/number_formatter_spec.rb +9 -9
- data/spec/formatters/numbers/percent_formatter_spec.rb +2 -2
- data/spec/formatters/numbers/rbnf/rbnf_spec.rb +5 -5
- data/spec/formatters/plurals/plural_formatter_spec.rb +25 -25
- data/spec/formatters/plurals/rules_spec.rb +4 -4
- data/spec/localized/localized_date_spec.rb +25 -25
- data/spec/localized/localized_datetime_spec.rb +7 -7
- data/spec/localized/localized_hash_spec.rb +1 -1
- data/spec/localized/localized_number_spec.rb +23 -23
- data/spec/localized/localized_object_spec.rb +2 -2
- data/spec/localized/localized_string_spec.rb +43 -16
- data/spec/localized/localized_symbol_spec.rb +31 -4
- data/spec/localized/localized_time_spec.rb +3 -3
- data/spec/localized/localized_timespan_spec.rb +42 -42
- data/spec/normalization_spec.rb +4 -4
- data/spec/parsers/number_parser_spec.rb +10 -10
- data/spec/parsers/parser_spec.rb +19 -3
- data/spec/parsers/symbol_table_spec.rb +1 -1
- data/spec/parsers/unicode_regex/character_class_spec.rb +12 -0
- data/spec/parsers/unicode_regex/character_range_spec.rb +24 -5
- data/spec/parsers/unicode_regex/character_set_spec.rb +9 -1
- data/spec/parsers/unicode_regex_parser_spec.rb +1 -1
- data/spec/resources/loader_spec.rb +6 -6
- data/spec/{shared → segmentation}/break_iterator_spec.rb +45 -16
- data/spec/segmentation/parser_spec.rb +107 -0
- data/spec/segmentation/rule_set_spec.rb +102 -0
- data/spec/shared/calendar_spec.rb +30 -30
- data/spec/shared/caser_spec.rb +79 -0
- data/spec/shared/code_point_spec.rb +52 -151
- data/spec/shared/currencies_spec.rb +8 -8
- data/spec/shared/language_codes_spec.rb +13 -13
- data/spec/shared/likely_subtags_spec.rb +58 -0
- data/spec/shared/locale_spec.rb +211 -0
- data/spec/shared/numbers_spec.rb +4 -4
- data/spec/shared/postal_codes_spec.rb +24 -4
- data/spec/shared/properties_database_spec.rb +157 -0
- data/spec/shared/property_name_aliases_spec.rb +56 -0
- data/spec/shared/property_normalizer_spec.rb +64 -0
- data/spec/shared/property_set_spec.rb +218 -0
- data/spec/shared/property_value_aliases_spec.rb +58 -0
- data/spec/shared/territories_spec.rb +1 -1
- data/spec/shared/unicode_regex_spec.rb +35 -2
- data/spec/spec_helper.rb +3 -3
- data/spec/tokenizers/calendars/date_tokenizer_spec.rb +23 -23
- data/spec/tokenizers/calendars/datetime_tokenizer_spec.rb +18 -18
- data/spec/tokenizers/calendars/time_tokenizer_spec.rb +19 -19
- data/spec/tokenizers/composite_token_spec.rb +4 -4
- data/spec/tokenizers/numbers/number_tokenizer_spec.rb +16 -16
- data/spec/tokenizers/token_spec.rb +2 -2
- data/spec/tokenizers/unicode_regex/unicode_regex_tokenizer_spec.rb +94 -94
- data/spec/utils/file_system_trie_spec.rb +98 -0
- data/spec/utils/range_set_spec.rb +53 -1
- data/spec/utils/script_detector_spec.rb +58 -0
- data/spec/utils/yaml/yaml_spec.rb +22 -22
- data/spec/utils_spec.rb +21 -21
- metadata +832 -28
- data/lib/twitter_cldr/parsers/segmentation_parser.rb +0 -137
- data/lib/twitter_cldr/resources/canonical_compositions_updater.rb +0 -51
- data/lib/twitter_cldr/resources/composition_exclusions_importer.rb +0 -62
- data/lib/twitter_cldr/resources/normalization_quick_check_importer.rb +0 -73
- data/lib/twitter_cldr/resources/unicode_properties_importer.rb +0 -79
- data/lib/twitter_cldr/shared/break_iterator.rb +0 -213
- data/lib/twitter_cldr/tokenizers/segmentation/segmentation_tokenizer.rb +0 -39
- data/resources/shared/segments/tailorings/en.yml +0 -8
- data/resources/unicode_data/canonical_compositions.yml +0 -4925
- data/resources/unicode_data/composition_exclusions.yml +0 -297
- data/resources/unicode_data/hangul_blocks.yml +0 -21
- data/resources/unicode_data/indices/bidi_class.yml +0 -4572
- data/resources/unicode_data/indices/bidi_mirrored.yml +0 -3087
- data/resources/unicode_data/indices/category.yml +0 -10918
- data/resources/unicode_data/indices/keys.yml +0 -101
- data/resources/unicode_data/nfc_quick_check.yml +0 -293
- data/resources/unicode_data/nfd_quick_check.yml +0 -909
- data/resources/unicode_data/nfkc_quick_check.yml +0 -989
- data/resources/unicode_data/nfkd_quick_check.yml +0 -1537
- data/resources/unicode_data/properties/line_break.yml +0 -9269
- data/resources/unicode_data/properties/sentence_break.yml +0 -8067
- data/resources/unicode_data/properties/word_break.yml +0 -3001
- data/spec/parsers/segmentation_parser_spec.rb +0 -100
- data/spec/tokenizers/segmentation/segmentation_tokenizer_spec.rb +0 -40
@@ -78,13 +78,33 @@ describe PostalCodes do
|
|
78
78
|
postal_code = PostalCodes.for_territory(territory)
|
79
79
|
|
80
80
|
it "returns samples that match #{territory}" do
|
81
|
-
postal_code.
|
82
|
-
|
83
|
-
|
84
|
-
|
81
|
+
if postal_code.has_generator?
|
82
|
+
postal_code.sample(10).each do |sample|
|
83
|
+
result = postal_code.valid?(sample)
|
84
|
+
puts "Failed with example #{sample}" unless result
|
85
|
+
result.should be_true
|
86
|
+
end
|
85
87
|
end
|
86
88
|
end
|
87
89
|
end
|
88
90
|
end
|
89
91
|
end
|
92
|
+
|
93
|
+
context 'with a postal code that has no AST' do
|
94
|
+
let(:postal_code) { PostalCodes.new(:xx, /\d{5}/, nil) }
|
95
|
+
|
96
|
+
describe '#sample' do
|
97
|
+
it 'raises an exception' do
|
98
|
+
expect { postal_code.sample }.to raise_error(
|
99
|
+
MissingPostcodeGeneratorError
|
100
|
+
)
|
101
|
+
end
|
102
|
+
end
|
103
|
+
|
104
|
+
describe '#has_generator?' do
|
105
|
+
it 'returns false' do
|
106
|
+
expect(postal_code).to_not have_generator
|
107
|
+
end
|
108
|
+
end
|
109
|
+
end
|
90
110
|
end
|
@@ -0,0 +1,157 @@
|
|
1
|
+
# encoding: UTF-8
|
2
|
+
|
3
|
+
# Copyright 2012 Twitter, Inc
|
4
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
5
|
+
|
6
|
+
require 'spec_helper'
|
7
|
+
|
8
|
+
require 'fileutils'
|
9
|
+
require 'securerandom'
|
10
|
+
require 'tmpdir'
|
11
|
+
|
12
|
+
include TwitterCldr::Shared
|
13
|
+
include TwitterCldr::Utils
|
14
|
+
|
15
|
+
describe PropertiesDatabase do
|
16
|
+
context 'with an empty database' do
|
17
|
+
let(:tmp_dir) do
|
18
|
+
File.join(Dir.tmpdir, SecureRandom.hex)
|
19
|
+
end
|
20
|
+
|
21
|
+
let(:database) { PropertiesDatabase.new(tmp_dir) }
|
22
|
+
|
23
|
+
before(:each) do
|
24
|
+
FileUtils.mkdir_p(tmp_dir)
|
25
|
+
end
|
26
|
+
|
27
|
+
after(:each) do
|
28
|
+
FileUtils.rm_rf(tmp_dir)
|
29
|
+
end
|
30
|
+
|
31
|
+
describe '#store' do
|
32
|
+
it 'associates the code points with the property name/value' do
|
33
|
+
database.store('foo', 'bar', RangeSet.new([1..4]))
|
34
|
+
result = database.code_points_for_property('foo', 'bar')
|
35
|
+
expect(result).to be_a(RangeSet)
|
36
|
+
expect(result.to_a).to eq([1..4])
|
37
|
+
end
|
38
|
+
end
|
39
|
+
end
|
40
|
+
|
41
|
+
context 'with a full database of properties' do
|
42
|
+
let(:database) { PropertiesDatabase.new }
|
43
|
+
|
44
|
+
describe '#code_points_for_property' do
|
45
|
+
it 'retrieves code points for the property name' do
|
46
|
+
code_points = database.code_points_for_property('Math')
|
47
|
+
[126, 172, 215, 1014, 9168, 10176].each do |cp|
|
48
|
+
expect(code_points).to include(cp)
|
49
|
+
end
|
50
|
+
end
|
51
|
+
|
52
|
+
it 'retrieves code points for the property name/value pair' do
|
53
|
+
code_points = database.code_points_for_property('Age', '1.1')
|
54
|
+
[501, 736, 890, 990, 1118, 1227, 1632].each do |cp|
|
55
|
+
expect(code_points).to include(cp)
|
56
|
+
end
|
57
|
+
end
|
58
|
+
|
59
|
+
it "returns an empty range set if the property name can't be found" do
|
60
|
+
code_points = database.code_points_for_property('foo')
|
61
|
+
expect(code_points.to_a).to eq([])
|
62
|
+
end
|
63
|
+
|
64
|
+
it "returns an empty range set if the property name/value pair can't be found" do
|
65
|
+
code_points = database.code_points_for_property('Age', 'foo')
|
66
|
+
expect(code_points.to_a).to eq([])
|
67
|
+
end
|
68
|
+
end
|
69
|
+
|
70
|
+
describe '#include?' do
|
71
|
+
it 'returns true if the database contains the property name' do
|
72
|
+
expect(database.include?('Age')).to be_true
|
73
|
+
end
|
74
|
+
|
75
|
+
it 'returns true if the database contains the property name/value pair' do
|
76
|
+
expect(database.include?('Age', '1.1')).to be_true
|
77
|
+
end
|
78
|
+
|
79
|
+
it "returns false if the database doesn't contain the property name" do
|
80
|
+
expect(database.include?('foo')).to be_false
|
81
|
+
end
|
82
|
+
|
83
|
+
it "returns false if the database doesn't contain the property name/value pair" do
|
84
|
+
expect(database.include?('Age', 'foo')).to be_false
|
85
|
+
end
|
86
|
+
end
|
87
|
+
|
88
|
+
describe '#properties_for_code_point' do
|
89
|
+
it 'returns a property set for the given code point' do
|
90
|
+
property_set = database.properties_for_code_point(65)
|
91
|
+
expect(property_set).to be_a(PropertySet)
|
92
|
+
expect(property_set.general_category).to eq(Set.new(%w(L Lu)))
|
93
|
+
expect(property_set.word_break).to eq(Set.new(%w(ALetter)))
|
94
|
+
end
|
95
|
+
end
|
96
|
+
|
97
|
+
describe '#property_names' do
|
98
|
+
it 'returns a list of all valid property names' do
|
99
|
+
%w(Radical Script Hex_Digit Diacritic).each do |property_name|
|
100
|
+
expect(database.property_names).to include(property_name)
|
101
|
+
end
|
102
|
+
end
|
103
|
+
end
|
104
|
+
|
105
|
+
describe '#property_values_for' do
|
106
|
+
it 'returns a list of all valid values for a property name' do
|
107
|
+
values = database.property_values_for('Script')
|
108
|
+
%w(Cyrillic Latin Hangul Han Bengali Tagalog Yi).each do |script|
|
109
|
+
expect(values).to include(script)
|
110
|
+
end
|
111
|
+
end
|
112
|
+
|
113
|
+
it 'correctly expands value prefixes for General_Category' do
|
114
|
+
values = database.property_values_for('General_Category')
|
115
|
+
expect(values).to include('Cc')
|
116
|
+
expect(values).to include('C')
|
117
|
+
|
118
|
+
expect(values).to include('Lo')
|
119
|
+
expect(values).to include('L')
|
120
|
+
|
121
|
+
expect(values).to include('Pd')
|
122
|
+
expect(values).to include('P')
|
123
|
+
|
124
|
+
expect(values).to include('Sm')
|
125
|
+
expect(values).to include('S')
|
126
|
+
end
|
127
|
+
end
|
128
|
+
|
129
|
+
describe '#each_property_pair' do
|
130
|
+
it 'yields each property name/value pair' do
|
131
|
+
pairs = database.each_property_pair.to_a
|
132
|
+
|
133
|
+
expected_pairs = [
|
134
|
+
%w(Script Thai), ['Radical', nil],
|
135
|
+
['Math', nil], %w(Line_Break HY),
|
136
|
+
%w(Jamo_Short_Name EU), ['Hyphen', nil]
|
137
|
+
]
|
138
|
+
|
139
|
+
expected_pairs.each do |expected_pair|
|
140
|
+
expect(pairs).to include(expected_pair)
|
141
|
+
end
|
142
|
+
end
|
143
|
+
end
|
144
|
+
|
145
|
+
describe '#normalize' do
|
146
|
+
let(:property_name) { 'foo' }
|
147
|
+
let(:property_value) { 'bar' }
|
148
|
+
|
149
|
+
it 'delegates normalization to a normalizer' do
|
150
|
+
normalizer = Object.new
|
151
|
+
stub(database).normalizer { normalizer }
|
152
|
+
mock(normalizer).normalize(property_name, property_value)
|
153
|
+
database.normalize(property_name, property_value)
|
154
|
+
end
|
155
|
+
end
|
156
|
+
end
|
157
|
+
end
|
@@ -0,0 +1,56 @@
|
|
1
|
+
# encoding: UTF-8
|
2
|
+
|
3
|
+
# Copyright 2012 Twitter, Inc
|
4
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
5
|
+
|
6
|
+
require 'spec_helper'
|
7
|
+
|
8
|
+
include TwitterCldr::Shared
|
9
|
+
|
10
|
+
describe PropertyNameAliases do
|
11
|
+
let(:alias_class) { PropertyNameAliases }
|
12
|
+
|
13
|
+
describe '#abbreviated_alias_for' do
|
14
|
+
it 'finds the abbreviated alias for a long property name' do
|
15
|
+
expect(alias_class.abbreviated_alias_for('Script')).to eq('sc')
|
16
|
+
expect(alias_class.abbreviated_alias_for('Age')).to eq('age')
|
17
|
+
expect(alias_class.abbreviated_alias_for('Uppercase_Mapping')).to eq('uc')
|
18
|
+
end
|
19
|
+
|
20
|
+
it 'returns nil if no alias can be found' do
|
21
|
+
expect(alias_class.abbreviated_alias_for('foo')).to be_nil
|
22
|
+
end
|
23
|
+
end
|
24
|
+
|
25
|
+
describe '#long_alias_for' do
|
26
|
+
it 'finds the long alias for an abbreviated property name' do
|
27
|
+
expect(alias_class.long_alias_for('sc')).to eq('Script')
|
28
|
+
expect(alias_class.long_alias_for('age')).to eq('Age')
|
29
|
+
expect(alias_class.long_alias_for('uc')).to eq('Uppercase_Mapping')
|
30
|
+
end
|
31
|
+
|
32
|
+
it 'returns nil if no alias can be found' do
|
33
|
+
expect(alias_class.long_alias_for('foo')).to be_nil
|
34
|
+
end
|
35
|
+
end
|
36
|
+
|
37
|
+
describe '#aliases_for' do
|
38
|
+
examples = {
|
39
|
+
'cjkRSUnicode' => %w(kRSUnicode Unicode_Radical_Stroke URS),
|
40
|
+
'WSpace' => %w(White_Space space),
|
41
|
+
'scf' => %w(Simple_Case_Folding sfc),
|
42
|
+
'IDS' => %w(ID_Start)
|
43
|
+
}
|
44
|
+
|
45
|
+
examples.each_pair do |property_name, aliases|
|
46
|
+
it "finds all the known aliases for the #{property_name} property name" do
|
47
|
+
found = alias_class.aliases_for(property_name)
|
48
|
+
expect(found).to match_array(aliases)
|
49
|
+
end
|
50
|
+
end
|
51
|
+
|
52
|
+
it 'returns an empty array if no aliases are found' do
|
53
|
+
expect(alias_class.aliases_for('foo')).to eq([])
|
54
|
+
end
|
55
|
+
end
|
56
|
+
end
|
@@ -0,0 +1,64 @@
|
|
1
|
+
# encoding: UTF-8
|
2
|
+
|
3
|
+
# Copyright 2012 Twitter, Inc
|
4
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
5
|
+
|
6
|
+
require 'spec_helper'
|
7
|
+
|
8
|
+
include TwitterCldr::Shared
|
9
|
+
|
10
|
+
describe PropertyNormalizer do
|
11
|
+
let(:database) { PropertiesDatabase.new }
|
12
|
+
let(:normalizer) { PropertyNormalizer.new(database) }
|
13
|
+
|
14
|
+
describe '#normalize' do
|
15
|
+
it 'correctly normalizes just property names' do
|
16
|
+
name, value = normalizer.normalize('IDS')
|
17
|
+
expect(name).to eq('ID_Start')
|
18
|
+
expect(value).to be_nil
|
19
|
+
end
|
20
|
+
|
21
|
+
it 'correctly normalizes property names and values' do
|
22
|
+
%w(age Age).each do |name|
|
23
|
+
%w(1.1 V1_1).each do |value|
|
24
|
+
cur_name, cur_value = normalizer.normalize(name, value)
|
25
|
+
expect(cur_name).to eq('Age')
|
26
|
+
expect(cur_value).to eq('1.1')
|
27
|
+
end
|
28
|
+
end
|
29
|
+
end
|
30
|
+
|
31
|
+
it 'correctly normalizes properties that support numeric values' do
|
32
|
+
%w(ccc Canonical_Combining_Class).each do |name|
|
33
|
+
%w(0 NR Not_Reordered).each do |value|
|
34
|
+
cur_name, cur_value = normalizer.normalize(name, value)
|
35
|
+
expect(cur_name).to eq('Canonical_Combining_Class')
|
36
|
+
expect(cur_value).to eq('0')
|
37
|
+
end
|
38
|
+
end
|
39
|
+
end
|
40
|
+
|
41
|
+
it "returns a blank property when the name and value can't be found" do
|
42
|
+
name, value = normalizer.normalize('foo', 'bar')
|
43
|
+
expect(name).to be_nil
|
44
|
+
expect(value).to be_nil
|
45
|
+
end
|
46
|
+
|
47
|
+
it 'handles valid name but invalid value' do
|
48
|
+
name, value = normalizer.normalize('ideographic', 'ideographic')
|
49
|
+
expect(name).to be_nil
|
50
|
+
expect(value).to be_nil
|
51
|
+
end
|
52
|
+
|
53
|
+
it 'fixes casing of property names' do
|
54
|
+
name, value = normalizer.normalize('ideographic')
|
55
|
+
expect(name).to eq('Ideographic')
|
56
|
+
end
|
57
|
+
|
58
|
+
it 'fixes casing of property names and values' do
|
59
|
+
name, value = normalizer.normalize('sc', 'han')
|
60
|
+
expect(name).to eq('Script')
|
61
|
+
expect(value).to eq('Han')
|
62
|
+
end
|
63
|
+
end
|
64
|
+
end
|
@@ -0,0 +1,218 @@
|
|
1
|
+
# encoding: UTF-8
|
2
|
+
|
3
|
+
# Copyright 2012 Twitter, Inc
|
4
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
5
|
+
|
6
|
+
require 'spec_helper'
|
7
|
+
|
8
|
+
include TwitterCldr::Shared
|
9
|
+
|
10
|
+
describe PropertySet do
|
11
|
+
let(:properties_hash) { {} }
|
12
|
+
let(:property_set) { PropertySet.new(properties_hash) }
|
13
|
+
|
14
|
+
describe '#age' do
|
15
|
+
it 'defaults to "Unassigned"' do
|
16
|
+
expect(property_set.age).to eq(['Unassigned'])
|
17
|
+
end
|
18
|
+
|
19
|
+
it 'returns the age when one is supplied' do
|
20
|
+
properties_hash.merge!('Age' => ['foo'])
|
21
|
+
expect(property_set.age).to eq(['foo'])
|
22
|
+
end
|
23
|
+
end
|
24
|
+
|
25
|
+
describe '#joining_type' do
|
26
|
+
it 'defaults to "Non_Joining"' do
|
27
|
+
expect(property_set.joining_type).to eq(['Non_Joining'])
|
28
|
+
end
|
29
|
+
|
30
|
+
it 'defaults to the joining type that corresponds to the general category (if set)' do
|
31
|
+
properties_hash.merge!('General_Category' => ['Mn'])
|
32
|
+
expect(property_set.joining_type).to eq(['Transparent'])
|
33
|
+
end
|
34
|
+
|
35
|
+
it 'returns the joining type when one is supplied' do
|
36
|
+
properties_hash.merge!('Joining_Type' => ['foo'])
|
37
|
+
expect(property_set.joining_type).to eq(['foo'])
|
38
|
+
end
|
39
|
+
end
|
40
|
+
|
41
|
+
describe '#bidi_paired_bracket_type' do
|
42
|
+
it 'defaults to "None"' do
|
43
|
+
expect(property_set.bidi_paired_bracket_type).to eq(['None'])
|
44
|
+
end
|
45
|
+
|
46
|
+
it 'returns the bracket type when one is supplied' do
|
47
|
+
properties_hash.merge!('Bidi_Paired_Bracket_Type' => ['foo'])
|
48
|
+
expect(property_set.bidi_paired_bracket_type).to eq(['foo'])
|
49
|
+
end
|
50
|
+
end
|
51
|
+
|
52
|
+
describe '#block' do
|
53
|
+
it 'defaults to "No_Block"' do
|
54
|
+
expect(property_set.block).to eq(['No_Block'])
|
55
|
+
end
|
56
|
+
|
57
|
+
it 'returns the block when one is supplied' do
|
58
|
+
properties_hash.merge!('Block' => ['foo'])
|
59
|
+
expect(property_set.block).to eq(['foo'])
|
60
|
+
end
|
61
|
+
end
|
62
|
+
|
63
|
+
describe '#east_asian_width' do
|
64
|
+
it 'defaults to "N"' do
|
65
|
+
expect(property_set.east_asian_width).to eq(['N'])
|
66
|
+
end
|
67
|
+
|
68
|
+
it 'returns the width when one is supplied' do
|
69
|
+
properties_hash.merge!('East_Asian_Width' => ['foo'])
|
70
|
+
expect(property_set.east_asian_width).to eq(['foo'])
|
71
|
+
end
|
72
|
+
end
|
73
|
+
|
74
|
+
describe '#grapheme_cluster_break' do
|
75
|
+
it 'defaults to "Other"' do
|
76
|
+
expect(property_set.grapheme_cluster_break).to eq(['Other'])
|
77
|
+
end
|
78
|
+
|
79
|
+
it 'returns the break when one is supplied' do
|
80
|
+
properties_hash.merge!('Grapheme_Cluster_Break' => ['foo'])
|
81
|
+
expect(property_set.grapheme_cluster_break).to eq(['foo'])
|
82
|
+
end
|
83
|
+
end
|
84
|
+
|
85
|
+
describe '#hangul_syllable_type' do
|
86
|
+
it 'defaults to "Not_Applicable"' do
|
87
|
+
expect(property_set.hangul_syllable_type).to eq(['Not_Applicable'])
|
88
|
+
end
|
89
|
+
|
90
|
+
it 'returns the syllable type when one is supplied' do
|
91
|
+
properties_hash.merge!('Hangul_Syllable_Type' => ['foo'])
|
92
|
+
expect(property_set.hangul_syllable_type).to eq(['foo'])
|
93
|
+
end
|
94
|
+
end
|
95
|
+
|
96
|
+
describe '#indic_positional_category' do
|
97
|
+
it 'defaults to "NA"' do
|
98
|
+
expect(property_set.indic_positional_category).to eq(['NA'])
|
99
|
+
end
|
100
|
+
|
101
|
+
it 'returns the positional category if one is supplied' do
|
102
|
+
properties_hash.merge!('Indic_Positional_Category' => ['foo'])
|
103
|
+
expect(property_set.indic_positional_category).to eq(['foo'])
|
104
|
+
end
|
105
|
+
end
|
106
|
+
|
107
|
+
describe '#indic_syllabic_category' do
|
108
|
+
it 'defaults to "Other"' do
|
109
|
+
expect(property_set.indic_syllabic_category).to eq(['Other'])
|
110
|
+
end
|
111
|
+
|
112
|
+
it 'returns the syllabic category if one is supplied' do
|
113
|
+
properties_hash.merge!('Indic_Syllabic_Category' => ['foo'])
|
114
|
+
expect(property_set.indic_syllabic_category).to eq(['foo'])
|
115
|
+
end
|
116
|
+
end
|
117
|
+
|
118
|
+
describe '#jamo_short_name' do
|
119
|
+
it 'defaults to "<none>"' do
|
120
|
+
expect(property_set.jamo_short_name).to eq(['<none>'])
|
121
|
+
end
|
122
|
+
|
123
|
+
it 'returns the short name if one is supplied' do
|
124
|
+
properties_hash.merge!('Jamo_Short_Name' => ['foo'])
|
125
|
+
expect(property_set.jamo_short_name).to eq(['foo'])
|
126
|
+
end
|
127
|
+
end
|
128
|
+
|
129
|
+
describe '#line_break' do
|
130
|
+
it 'defaults to XX' do
|
131
|
+
expect(property_set.line_break).to eq(['XX'])
|
132
|
+
end
|
133
|
+
|
134
|
+
it 'returns the line break category if one is supplied' do
|
135
|
+
properties_hash.merge!('Line_Break' => ['foo'])
|
136
|
+
expect(property_set.line_break).to eq(['foo'])
|
137
|
+
end
|
138
|
+
end
|
139
|
+
|
140
|
+
describe '#general_category' do
|
141
|
+
it 'defaults to nil' do
|
142
|
+
expect(property_set.general_category).to eq([])
|
143
|
+
end
|
144
|
+
|
145
|
+
it 'returns the general category if one is supplied' do
|
146
|
+
properties_hash.merge!('General_Category' => ['foo'])
|
147
|
+
expect(property_set.general_category).to eq(['foo'])
|
148
|
+
end
|
149
|
+
end
|
150
|
+
|
151
|
+
describe '#script_extensions' do
|
152
|
+
it 'defaults to "<script>"' do
|
153
|
+
expect(property_set.script_extensions).to eq(['<script>'])
|
154
|
+
end
|
155
|
+
|
156
|
+
it 'returns the script extension if one is supplied' do
|
157
|
+
properties_hash.merge!('Script_Extensions' => ['foo'])
|
158
|
+
expect(property_set.script_extensions).to eq(['foo'])
|
159
|
+
end
|
160
|
+
end
|
161
|
+
|
162
|
+
describe '#script' do
|
163
|
+
it 'defaults to "Unknown"' do
|
164
|
+
expect(property_set.script).to eq(['Unknown'])
|
165
|
+
end
|
166
|
+
|
167
|
+
it 'returns the script if one is supplied' do
|
168
|
+
properties_hash.merge!('Script' => ['foo'])
|
169
|
+
expect(property_set.script).to eq(['foo'])
|
170
|
+
end
|
171
|
+
end
|
172
|
+
|
173
|
+
describe '#sentence_break' do
|
174
|
+
it 'defaults to "Other"' do
|
175
|
+
expect(property_set.sentence_break).to eq(['Other'])
|
176
|
+
end
|
177
|
+
|
178
|
+
it 'returns the sentence break category if one is supplied' do
|
179
|
+
properties_hash.merge!('Sentence_Break' => ['foo'])
|
180
|
+
expect(property_set.sentence_break).to eq(['foo'])
|
181
|
+
end
|
182
|
+
end
|
183
|
+
|
184
|
+
describe '#word_break' do
|
185
|
+
it 'defaults to "Other"' do
|
186
|
+
expect(property_set.word_break).to eq(['Other'])
|
187
|
+
end
|
188
|
+
|
189
|
+
it 'returns the word break category if one is supplied' do
|
190
|
+
properties_hash.merge!('Word_Break' => ['foo'])
|
191
|
+
expect(property_set.word_break).to eq(['foo'])
|
192
|
+
end
|
193
|
+
end
|
194
|
+
|
195
|
+
describe 'properties without defaults' do
|
196
|
+
CodePoint.properties.property_names.each do |property_name|
|
197
|
+
method_name = property_name.downcase
|
198
|
+
|
199
|
+
if PropertySet::AdditionalPropertyMethods.method_defined?(method_name)
|
200
|
+
describe "##{method_name}" do
|
201
|
+
it 'returns true if the property has been set but has no value' do
|
202
|
+
properties_hash.merge!(property_name => nil)
|
203
|
+
expect(property_set.send(method_name)).to eq(true)
|
204
|
+
end
|
205
|
+
|
206
|
+
it 'returns false if the property has not been set' do
|
207
|
+
expect(property_set.send(method_name)).to eq(false)
|
208
|
+
end
|
209
|
+
|
210
|
+
it 'returns the property value if it has been set' do
|
211
|
+
properties_hash.merge!(property_name => ['foo'])
|
212
|
+
expect(property_set.send(method_name)).to eq(['foo'])
|
213
|
+
end
|
214
|
+
end
|
215
|
+
end
|
216
|
+
end
|
217
|
+
end
|
218
|
+
end
|
@@ -0,0 +1,58 @@
|
|
1
|
+
# encoding: UTF-8
|
2
|
+
|
3
|
+
# Copyright 2012 Twitter, Inc
|
4
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
5
|
+
|
6
|
+
require 'spec_helper'
|
7
|
+
|
8
|
+
include TwitterCldr::Shared
|
9
|
+
|
10
|
+
describe PropertyValueAliases do
|
11
|
+
let(:alias_class) { PropertyValueAliases }
|
12
|
+
|
13
|
+
describe '#abbreviated_alias_for' do
|
14
|
+
it 'finds the abbreviated alias for a long property value' do
|
15
|
+
expect(alias_class.abbreviated_alias_for('AHex', 'No')).to eq('N')
|
16
|
+
expect(alias_class.abbreviated_alias_for('AHex', 'Yes')).to eq('Y')
|
17
|
+
|
18
|
+
expect(alias_class.abbreviated_alias_for('dt', 'Canonical')).to eq('Can')
|
19
|
+
expect(alias_class.abbreviated_alias_for('dt', 'Circle')).to eq('Enc')
|
20
|
+
expect(alias_class.abbreviated_alias_for('dt', 'Final')).to eq('Fin')
|
21
|
+
end
|
22
|
+
|
23
|
+
it 'returns nil if no alias can be found' do
|
24
|
+
expect(alias_class.abbreviated_alias_for('AHex', 'foo')).to be_nil
|
25
|
+
end
|
26
|
+
end
|
27
|
+
|
28
|
+
describe '#long_alias_for' do
|
29
|
+
it 'finds the long alias for an abbreviated property value' do
|
30
|
+
expect(alias_class.long_alias_for('AHex', 'N')).to eq('No')
|
31
|
+
expect(alias_class.long_alias_for('AHex', 'Y')).to eq('Yes')
|
32
|
+
|
33
|
+
expect(alias_class.long_alias_for('dt', 'Can')).to eq('Canonical')
|
34
|
+
expect(alias_class.long_alias_for('dt', 'Enc')).to eq('Circle')
|
35
|
+
expect(alias_class.long_alias_for('dt', 'Fin')).to eq('Final')
|
36
|
+
end
|
37
|
+
|
38
|
+
it 'returns nil if no alias can be found' do
|
39
|
+
expect(alias_class.long_alias_for('AHex', 'foo')).to be_nil
|
40
|
+
end
|
41
|
+
end
|
42
|
+
|
43
|
+
describe '#numeric_alias_for' do
|
44
|
+
it 'finds the numeric alias (if one exists) for a long or abbreviated property value' do
|
45
|
+
%w(0 NR Not_Reordered).each do |value|
|
46
|
+
expect(alias_class.numeric_alias_for('ccc', value)).to eq('0')
|
47
|
+
end
|
48
|
+
end
|
49
|
+
end
|
50
|
+
|
51
|
+
describe '#aliases_for' do
|
52
|
+
it 'compiles a list of value aliases for the given property name' do
|
53
|
+
expect(alias_class.aliases_for('ccc', 'NR')).to match_array(%w(0 Not_Reordered))
|
54
|
+
expect(alias_class.aliases_for('ccc', 'Not_Reordered')).to match_array(%w(0 NR))
|
55
|
+
expect(alias_class.aliases_for('ccc', '0')).to match_array(%w(NR Not_Reordered))
|
56
|
+
end
|
57
|
+
end
|
58
|
+
end
|
@@ -121,7 +121,7 @@ describe Territories do
|
|
121
121
|
{ "is" => [ { "US" => "United States",
|
122
122
|
5 => "Suður-Ameríka" },
|
123
123
|
{ "009" => "Eyjaálfa" } ] }
|
124
|
-
).should == { :is => [ { :us => "United States" }, { } ] }
|
124
|
+
).should == { is: [ { us: "United States" }, { } ] }
|
125
125
|
end
|
126
126
|
|
127
127
|
end
|
@@ -60,6 +60,18 @@ describe UnicodeRegex do
|
|
60
60
|
"(?:[\\u{0067}-\\u{006b}])(?:[\\u{0070}-\\u{0073}])"
|
61
61
|
)
|
62
62
|
end
|
63
|
+
|
64
|
+
it "supports modifiers" do
|
65
|
+
regex = UnicodeRegex.compile('abc', 'm').to_regexp
|
66
|
+
expect(regex.options).to eq(Regexp::MULTILINE)
|
67
|
+
end
|
68
|
+
|
69
|
+
it "supports multiple modifiers at once" do
|
70
|
+
regex = UnicodeRegex.compile('abc', 'mi').to_regexp
|
71
|
+
expect(regex.options).to eq(
|
72
|
+
Regexp::MULTILINE | Regexp::IGNORECASE
|
73
|
+
)
|
74
|
+
end
|
63
75
|
end
|
64
76
|
end
|
65
77
|
|
@@ -160,6 +172,20 @@ describe UnicodeRegex do
|
|
160
172
|
expect(regex).not_to exactly_match("a")
|
161
173
|
end
|
162
174
|
|
175
|
+
it "should match a regex containing a unioned character set" do
|
176
|
+
regex = compile("[[:L:][:White_Space:]]*")
|
177
|
+
expect(regex).to exactly_match("abc")
|
178
|
+
expect(regex).to exactly_match("くøß")
|
179
|
+
expect("a b c _ d".gsub(regex.to_regexp, "")).to eq("_")
|
180
|
+
end
|
181
|
+
|
182
|
+
it "should match a regex containing a negated unioned character set" do
|
183
|
+
regex = compile("[^[:L:][:White_Space:]]*")
|
184
|
+
expect(regex).to exactly_match(".,/")
|
185
|
+
expect(regex).to_not exactly_match("a b c")
|
186
|
+
expect("a b c _ d".gsub(regex.to_regexp, "")).to eq("a b c d")
|
187
|
+
end
|
188
|
+
|
163
189
|
it "should match a regex containing a negated character set (alternate syntax)" do
|
164
190
|
regex = compile("[[:^Zs:]]")
|
165
191
|
expect(regex).to exactly_match("a")
|
@@ -192,12 +218,19 @@ describe UnicodeRegex do
|
|
192
218
|
end
|
193
219
|
|
194
220
|
it "should match a regex with a complicated expression inside the char class" do
|
195
|
-
#
|
196
|
-
regex = compile("[
|
221
|
+
# [separators U space-tilde] diff [letters diff numbers] (diff is commutative)
|
222
|
+
regex = compile("[[\\p{Z}\\u0020-\\u007f]-[\\p{L}]-[\\p{N}]]")
|
197
223
|
expect(regex).to exactly_match(" ")
|
198
224
|
expect(regex).to exactly_match(",")
|
199
225
|
expect(regex).not_to exactly_match("a")
|
200
226
|
end
|
227
|
+
|
228
|
+
it "should treat a dash that is the first character of a character class as a literal dash instead of a range" do
|
229
|
+
regex = compile("[-abc]*")
|
230
|
+
expect(regex).to exactly_match("a-b-c")
|
231
|
+
expect(regex).to exactly_match("--a")
|
232
|
+
expect(regex).not_to exactly_match("def")
|
233
|
+
end
|
201
234
|
end
|
202
235
|
end
|
203
236
|
end
|
data/spec/spec_helper.rb
CHANGED
@@ -48,9 +48,9 @@ end
|
|
48
48
|
RSpec.configure do |config|
|
49
49
|
config.mock_with :rr
|
50
50
|
|
51
|
-
config.filter_run(:focus => true)
|
51
|
+
config.filter_run(focus: true)
|
52
52
|
config.run_all_when_everything_filtered = true
|
53
|
-
config.filter_run_excluding(:slow => true) unless ENV['FULL_SPEC']
|
53
|
+
config.filter_run_excluding(slow: true) unless ENV['FULL_SPEC']
|
54
54
|
|
55
55
|
config.before(:each) do
|
56
56
|
TwitterCldr.reset_locale_fallbacks
|
@@ -62,7 +62,7 @@ end
|
|
62
62
|
|
63
63
|
RSpec::Matchers.define :match_normalized do |expected|
|
64
64
|
match do |actual|
|
65
|
-
expected.localize.normalize(:using => :NFKC).to_s == actual.localize.normalize(:using => :NFKC).to_s
|
65
|
+
expected.localize.normalize(using: :NFKC).to_s == actual.localize.normalize(using: :NFKC).to_s
|
66
66
|
end
|
67
67
|
end
|
68
68
|
|