cldr-transforms 46.0.0-BETA2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +41 -0
- package/README.md +27 -0
- package/bower.json +13 -0
- package/package.json +29 -0
- package/transforms/Amharic-Latin-BGN.json +9 -0
- package/transforms/Amharic-Latin-BGN.txt +441 -0
- package/transforms/Any-Accents.json +9 -0
- package/transforms/Any-Accents.txt +270 -0
- package/transforms/Any-Publishing.json +9 -0
- package/transforms/Any-Publishing.txt +63 -0
- package/transforms/Arabic-Latin-BGN.json +9 -0
- package/transforms/Arabic-Latin-BGN.txt +205 -0
- package/transforms/Arabic-Latin.json +11 -0
- package/transforms/Arabic-Latin.txt +181 -0
- package/transforms/Armenian-Latin-BGN.json +9 -0
- package/transforms/Armenian-Latin-BGN.txt +165 -0
- package/transforms/Azerbaijani-Latin-BGN.json +9 -0
- package/transforms/Azerbaijani-Latin-BGN.txt +183 -0
- package/transforms/Belarusian-Latin-BGN.json +9 -0
- package/transforms/Belarusian-Latin-BGN.txt +194 -0
- package/transforms/Bengali-Arabic.json +9 -0
- package/transforms/Bengali-Arabic.txt +7 -0
- package/transforms/Bengali-Devanagari.json +9 -0
- package/transforms/Bengali-Devanagari.txt +7 -0
- package/transforms/Bengali-Gujarati.json +9 -0
- package/transforms/Bengali-Gujarati.txt +7 -0
- package/transforms/Bengali-Gurmukhi.json +9 -0
- package/transforms/Bengali-Gurmukhi.txt +7 -0
- package/transforms/Bengali-InterIndic.json +7 -0
- package/transforms/Bengali-InterIndic.txt +99 -0
- package/transforms/Bengali-Kannada.json +9 -0
- package/transforms/Bengali-Kannada.txt +7 -0
- package/transforms/Bengali-Latin.json +9 -0
- package/transforms/Bengali-Latin.txt +7 -0
- package/transforms/Bengali-Malayalam.json +9 -0
- package/transforms/Bengali-Malayalam.txt +7 -0
- package/transforms/Bengali-Oriya.json +9 -0
- package/transforms/Bengali-Oriya.txt +7 -0
- package/transforms/Bengali-Tamil.json +9 -0
- package/transforms/Bengali-Tamil.txt +7 -0
- package/transforms/Bengali-Telugu.json +9 -0
- package/transforms/Bengali-Telugu.txt +7 -0
- package/transforms/Bengali-ur.json +8 -0
- package/transforms/Bengali-ur.txt +7 -0
- package/transforms/Bulgarian-Latin-BGN.json +9 -0
- package/transforms/Bulgarian-Latin-BGN.txt +237 -0
- package/transforms/CanadianAboriginal-Latin.json +11 -0
- package/transforms/CanadianAboriginal-Latin.txt +184 -0
- package/transforms/Cyrillic-Latin.json +11 -0
- package/transforms/Cyrillic-Latin.txt +280 -0
- package/transforms/Devanagari-Arabic.json +9 -0
- package/transforms/Devanagari-Arabic.txt +7 -0
- package/transforms/Devanagari-Bengali.json +9 -0
- package/transforms/Devanagari-Bengali.txt +7 -0
- package/transforms/Devanagari-Gujarati.json +9 -0
- package/transforms/Devanagari-Gujarati.txt +7 -0
- package/transforms/Devanagari-Gurmukhi.json +9 -0
- package/transforms/Devanagari-Gurmukhi.txt +7 -0
- package/transforms/Devanagari-InterIndic.json +7 -0
- package/transforms/Devanagari-InterIndic.txt +113 -0
- package/transforms/Devanagari-Kannada.json +9 -0
- package/transforms/Devanagari-Kannada.txt +7 -0
- package/transforms/Devanagari-Latin.json +9 -0
- package/transforms/Devanagari-Latin.txt +7 -0
- package/transforms/Devanagari-Malayalam.json +9 -0
- package/transforms/Devanagari-Malayalam.txt +7 -0
- package/transforms/Devanagari-Oriya.json +9 -0
- package/transforms/Devanagari-Oriya.txt +7 -0
- package/transforms/Devanagari-Tamil.json +9 -0
- package/transforms/Devanagari-Tamil.txt +7 -0
- package/transforms/Devanagari-Telugu.json +9 -0
- package/transforms/Devanagari-Telugu.txt +7 -0
- package/transforms/Devanagari-ur.json +8 -0
- package/transforms/Devanagari-ur.txt +7 -0
- package/transforms/Fullwidth-Halfwidth.json +9 -0
- package/transforms/Fullwidth-Halfwidth.txt +261 -0
- package/transforms/Georgian-Latin-BGN.json +9 -0
- package/transforms/Georgian-Latin-BGN.txt +43 -0
- package/transforms/Georgian-Latin-BGN_1981.json +8 -0
- package/transforms/Georgian-Latin-BGN_1981.txt +54 -0
- package/transforms/Georgian-Latin.json +11 -0
- package/transforms/Georgian-Latin.txt +53 -0
- package/transforms/Greek-Latin-BGN.json +9 -0
- package/transforms/Greek-Latin-BGN.txt +419 -0
- package/transforms/Greek-Latin.json +11 -0
- package/transforms/Greek-Latin.txt +251 -0
- package/transforms/Greek_Latin_UNGEGN.json +11 -0
- package/transforms/Greek_Latin_UNGEGN.txt +179 -0
- package/transforms/Gujarati-Arabic.json +9 -0
- package/transforms/Gujarati-Arabic.txt +7 -0
- package/transforms/Gujarati-Bengali.json +9 -0
- package/transforms/Gujarati-Bengali.txt +7 -0
- package/transforms/Gujarati-Devanagari.json +9 -0
- package/transforms/Gujarati-Devanagari.txt +7 -0
- package/transforms/Gujarati-Gurmukhi.json +9 -0
- package/transforms/Gujarati-Gurmukhi.txt +7 -0
- package/transforms/Gujarati-InterIndic.json +7 -0
- package/transforms/Gujarati-InterIndic.txt +89 -0
- package/transforms/Gujarati-Kannada.json +9 -0
- package/transforms/Gujarati-Kannada.txt +7 -0
- package/transforms/Gujarati-Latin.json +9 -0
- package/transforms/Gujarati-Latin.txt +7 -0
- package/transforms/Gujarati-Malayalam.json +9 -0
- package/transforms/Gujarati-Malayalam.txt +7 -0
- package/transforms/Gujarati-Oriya.json +9 -0
- package/transforms/Gujarati-Oriya.txt +7 -0
- package/transforms/Gujarati-Tamil.json +9 -0
- package/transforms/Gujarati-Tamil.txt +7 -0
- package/transforms/Gujarati-Telugu.json +9 -0
- package/transforms/Gujarati-Telugu.txt +7 -0
- package/transforms/Gujarati-ur.json +8 -0
- package/transforms/Gujarati-ur.txt +7 -0
- package/transforms/Gurmukhi-Arabic.json +9 -0
- package/transforms/Gurmukhi-Arabic.txt +7 -0
- package/transforms/Gurmukhi-Bengali.json +9 -0
- package/transforms/Gurmukhi-Bengali.txt +7 -0
- package/transforms/Gurmukhi-Devanagari.json +9 -0
- package/transforms/Gurmukhi-Devanagari.txt +7 -0
- package/transforms/Gurmukhi-Gujarati.json +9 -0
- package/transforms/Gurmukhi-Gujarati.txt +7 -0
- package/transforms/Gurmukhi-InterIndic.json +7 -0
- package/transforms/Gurmukhi-InterIndic.txt +88 -0
- package/transforms/Gurmukhi-Kannada.json +9 -0
- package/transforms/Gurmukhi-Kannada.txt +7 -0
- package/transforms/Gurmukhi-Latin.json +9 -0
- package/transforms/Gurmukhi-Latin.txt +7 -0
- package/transforms/Gurmukhi-Malayalam.json +9 -0
- package/transforms/Gurmukhi-Malayalam.txt +7 -0
- package/transforms/Gurmukhi-Oriya.json +9 -0
- package/transforms/Gurmukhi-Oriya.txt +7 -0
- package/transforms/Gurmukhi-Tamil.json +9 -0
- package/transforms/Gurmukhi-Tamil.txt +7 -0
- package/transforms/Gurmukhi-Telugu.json +9 -0
- package/transforms/Gurmukhi-Telugu.txt +7 -0
- package/transforms/Gurmukhi-ur.json +8 -0
- package/transforms/Gurmukhi-ur.txt +7 -0
- package/transforms/Han-Latin-Names.json +8 -0
- package/transforms/Han-Latin-Names.txt +65 -0
- package/transforms/Han-Latin.json +9 -0
- package/transforms/Han-Latin.txt +1501 -0
- package/transforms/Han-Spacedhan.json +7 -0
- package/transforms/Han-Spacedhan.txt +35 -0
- package/transforms/Hangul-Latin.json +9 -0
- package/transforms/Hangul-Latin.txt +6 -0
- package/transforms/Hebrew-Latin-BGN.json +9 -0
- package/transforms/Hebrew-Latin-BGN.txt +113 -0
- package/transforms/Hebrew-Latin.json +11 -0
- package/transforms/Hebrew-Latin.txt +91 -0
- package/transforms/Hiragana-Katakana.json +11 -0
- package/transforms/Hiragana-Katakana.txt +179 -0
- package/transforms/Hiragana-Latin.json +11 -0
- package/transforms/Hiragana-Latin.txt +9 -0
- package/transforms/IPA-XSampa.json +11 -0
- package/transforms/IPA-XSampa.txt +228 -0
- package/transforms/InterIndic-Arabic.json +7 -0
- package/transforms/InterIndic-Arabic.txt +128 -0
- package/transforms/InterIndic-Bengali.json +7 -0
- package/transforms/InterIndic-Bengali.txt +135 -0
- package/transforms/InterIndic-Devanagari.json +7 -0
- package/transforms/InterIndic-Devanagari.txt +151 -0
- package/transforms/InterIndic-Gujarati.json +7 -0
- package/transforms/InterIndic-Gujarati.txt +136 -0
- package/transforms/InterIndic-Gurmukhi.json +7 -0
- package/transforms/InterIndic-Gurmukhi.txt +142 -0
- package/transforms/InterIndic-Kannada.json +7 -0
- package/transforms/InterIndic-Kannada.txt +137 -0
- package/transforms/InterIndic-Latin.json +7 -0
- package/transforms/InterIndic-Latin.txt +492 -0
- package/transforms/InterIndic-Malayalam.json +7 -0
- package/transforms/InterIndic-Malayalam.txt +137 -0
- package/transforms/InterIndic-Oriya.json +7 -0
- package/transforms/InterIndic-Oriya.txt +135 -0
- package/transforms/InterIndic-Tamil.json +7 -0
- package/transforms/InterIndic-Tamil.txt +136 -0
- package/transforms/InterIndic-Telugu.json +7 -0
- package/transforms/InterIndic-Telugu.txt +136 -0
- package/transforms/InterIndic-ur.json +7 -0
- package/transforms/InterIndic-ur.txt +119 -0
- package/transforms/Jamo-Latin.json +9 -0
- package/transforms/Jamo-Latin.txt +6 -0
- package/transforms/Kannada-Arabic.json +9 -0
- package/transforms/Kannada-Arabic.txt +7 -0
- package/transforms/Kannada-Bengali.json +9 -0
- package/transforms/Kannada-Bengali.txt +7 -0
- package/transforms/Kannada-Devanagari.json +9 -0
- package/transforms/Kannada-Devanagari.txt +7 -0
- package/transforms/Kannada-Gujarati.json +9 -0
- package/transforms/Kannada-Gujarati.txt +7 -0
- package/transforms/Kannada-Gurmukhi.json +9 -0
- package/transforms/Kannada-Gurmukhi.txt +7 -0
- package/transforms/Kannada-InterIndic.json +7 -0
- package/transforms/Kannada-InterIndic.txt +87 -0
- package/transforms/Kannada-Latin.json +9 -0
- package/transforms/Kannada-Latin.txt +7 -0
- package/transforms/Kannada-Malayalam.json +9 -0
- package/transforms/Kannada-Malayalam.txt +7 -0
- package/transforms/Kannada-Oriya.json +9 -0
- package/transforms/Kannada-Oriya.txt +7 -0
- package/transforms/Kannada-Tamil.json +9 -0
- package/transforms/Kannada-Tamil.txt +7 -0
- package/transforms/Kannada-Telugu.json +9 -0
- package/transforms/Kannada-Telugu.txt +7 -0
- package/transforms/Kannada-ur.json +8 -0
- package/transforms/Kannada-ur.txt +7 -0
- package/transforms/Katakana-Latin-BGN.json +9 -0
- package/transforms/Katakana-Latin-BGN.txt +335 -0
- package/transforms/Kazakh-Latin-BGN.json +9 -0
- package/transforms/Kazakh-Latin-BGN.txt +332 -0
- package/transforms/Kirghiz-Latin-BGN.json +9 -0
- package/transforms/Kirghiz-Latin-BGN.txt +211 -0
- package/transforms/Korean-Latin-BGN.json +9 -0
- package/transforms/Korean-Latin-BGN.txt +345 -0
- package/transforms/Latin-ASCII.json +9 -0
- package/transforms/Latin-ASCII.txt +909 -0
- package/transforms/Latin-Armenian.json +11 -0
- package/transforms/Latin-Armenian.txt +88 -0
- package/transforms/Latin-Bengali.json +9 -0
- package/transforms/Latin-Bengali.txt +8 -0
- package/transforms/Latin-Bopomofo.json +11 -0
- package/transforms/Latin-Bopomofo.txt +1445 -0
- package/transforms/Latin-ConjoiningJamo.json +7 -0
- package/transforms/Latin-ConjoiningJamo.txt +477 -0
- package/transforms/Latin-Devanagari.json +9 -0
- package/transforms/Latin-Devanagari.txt +8 -0
- package/transforms/Latin-Ethiopic.json +11 -0
- package/transforms/Latin-Ethiopic.txt +277 -0
- package/transforms/Latin-Gujarati.json +9 -0
- package/transforms/Latin-Gujarati.txt +8 -0
- package/transforms/Latin-Gurmukhi.json +9 -0
- package/transforms/Latin-Gurmukhi.txt +8 -0
- package/transforms/Latin-Hangul.json +9 -0
- package/transforms/Latin-Hangul.txt +7 -0
- package/transforms/Latin-InterIndic.json +7 -0
- package/transforms/Latin-InterIndic.txt +377 -0
- package/transforms/Latin-Jamo.json +9 -0
- package/transforms/Latin-Jamo.txt +7 -0
- package/transforms/Latin-Kannada.json +9 -0
- package/transforms/Latin-Kannada.txt +8 -0
- package/transforms/Latin-Katakana.json +11 -0
- package/transforms/Latin-Katakana.txt +382 -0
- package/transforms/Latin-Malayalam.json +9 -0
- package/transforms/Latin-Malayalam.txt +8 -0
- package/transforms/Latin-NumericPinyin.json +9 -0
- package/transforms/Latin-NumericPinyin.txt +29 -0
- package/transforms/Latin-Oriya.json +9 -0
- package/transforms/Latin-Oriya.txt +8 -0
- package/transforms/Latin-Tamil.json +9 -0
- package/transforms/Latin-Tamil.txt +8 -0
- package/transforms/Latin-Telugu.json +9 -0
- package/transforms/Latin-Telugu.txt +8 -0
- package/transforms/Latin-Thai.json +9 -0
- package/transforms/Latin-Thai.txt +7 -0
- package/transforms/Macedonian-Latin-BGN.json +9 -0
- package/transforms/Macedonian-Latin-BGN.txt +176 -0
- package/transforms/Malayalam-Arabic.json +9 -0
- package/transforms/Malayalam-Arabic.txt +7 -0
- package/transforms/Malayalam-Bengali.json +9 -0
- package/transforms/Malayalam-Bengali.txt +7 -0
- package/transforms/Malayalam-Devanagari.json +9 -0
- package/transforms/Malayalam-Devanagari.txt +7 -0
- package/transforms/Malayalam-Gujarati.json +9 -0
- package/transforms/Malayalam-Gujarati.txt +7 -0
- package/transforms/Malayalam-Gurmukhi.json +9 -0
- package/transforms/Malayalam-Gurmukhi.txt +7 -0
- package/transforms/Malayalam-InterIndic.json +7 -0
- package/transforms/Malayalam-InterIndic.txt +87 -0
- package/transforms/Malayalam-Kannada.json +9 -0
- package/transforms/Malayalam-Kannada.txt +7 -0
- package/transforms/Malayalam-Latin.json +9 -0
- package/transforms/Malayalam-Latin.txt +7 -0
- package/transforms/Malayalam-Oriya.json +9 -0
- package/transforms/Malayalam-Oriya.txt +7 -0
- package/transforms/Malayalam-Tamil.json +9 -0
- package/transforms/Malayalam-Tamil.txt +7 -0
- package/transforms/Malayalam-Telugu.json +9 -0
- package/transforms/Malayalam-Telugu.txt +7 -0
- package/transforms/Malayalam-ur.json +8 -0
- package/transforms/Malayalam-ur.txt +7 -0
- package/transforms/Maldivian-Latin-BGN.json +9 -0
- package/transforms/Maldivian-Latin-BGN.txt +171 -0
- package/transforms/Mongolian-Latin-BGN.json +9 -0
- package/transforms/Mongolian-Latin-BGN.txt +151 -0
- package/transforms/Myanmar-Latin.json +9 -0
- package/transforms/Myanmar-Latin.txt +367 -0
- package/transforms/Oriya-Arabic.json +9 -0
- package/transforms/Oriya-Arabic.txt +7 -0
- package/transforms/Oriya-Bengali.json +9 -0
- package/transforms/Oriya-Bengali.txt +7 -0
- package/transforms/Oriya-Devanagari.json +9 -0
- package/transforms/Oriya-Devanagari.txt +7 -0
- package/transforms/Oriya-Gujarati.json +9 -0
- package/transforms/Oriya-Gujarati.txt +7 -0
- package/transforms/Oriya-Gurmukhi.json +9 -0
- package/transforms/Oriya-Gurmukhi.txt +7 -0
- package/transforms/Oriya-InterIndic.json +7 -0
- package/transforms/Oriya-InterIndic.txt +91 -0
- package/transforms/Oriya-Kannada.json +9 -0
- package/transforms/Oriya-Kannada.txt +7 -0
- package/transforms/Oriya-Latin.json +9 -0
- package/transforms/Oriya-Latin.txt +7 -0
- package/transforms/Oriya-Malayalam.json +9 -0
- package/transforms/Oriya-Malayalam.txt +7 -0
- package/transforms/Oriya-Tamil.json +9 -0
- package/transforms/Oriya-Tamil.txt +7 -0
- package/transforms/Oriya-Telugu.json +9 -0
- package/transforms/Oriya-Telugu.txt +7 -0
- package/transforms/Oriya-ur.json +8 -0
- package/transforms/Oriya-ur.txt +7 -0
- package/transforms/Pashto-Latin-BGN.json +9 -0
- package/transforms/Pashto-Latin-BGN.txt +231 -0
- package/transforms/Persian-Latin-BGN.json +9 -0
- package/transforms/Persian-Latin-BGN.txt +203 -0
- package/transforms/Pinyin-NumericPinyin.json +7 -0
- package/transforms/Pinyin-NumericPinyin.txt +8 -0
- package/transforms/Russian-Latin-BGN.json +9 -0
- package/transforms/Russian-Latin-BGN.txt +235 -0
- package/transforms/Serbian-Latin-BGN.json +9 -0
- package/transforms/Serbian-Latin-BGN.txt +119 -0
- package/transforms/Simplified-Traditional.json +11 -0
- package/transforms/Simplified-Traditional.txt +4393 -0
- package/transforms/Syriac-Latin.json +11 -0
- package/transforms/Syriac-Latin.txt +52 -0
- package/transforms/Tamil-Arabic.json +9 -0
- package/transforms/Tamil-Arabic.txt +7 -0
- package/transforms/Tamil-Bengali.json +9 -0
- package/transforms/Tamil-Bengali.txt +7 -0
- package/transforms/Tamil-Devanagari.json +9 -0
- package/transforms/Tamil-Devanagari.txt +7 -0
- package/transforms/Tamil-Gujarati.json +9 -0
- package/transforms/Tamil-Gujarati.txt +7 -0
- package/transforms/Tamil-Gurmukhi.json +9 -0
- package/transforms/Tamil-Gurmukhi.txt +7 -0
- package/transforms/Tamil-InterIndic.json +7 -0
- package/transforms/Tamil-InterIndic.txt +70 -0
- package/transforms/Tamil-Kannada.json +9 -0
- package/transforms/Tamil-Kannada.txt +7 -0
- package/transforms/Tamil-Latin.json +9 -0
- package/transforms/Tamil-Latin.txt +7 -0
- package/transforms/Tamil-Malayalam.json +9 -0
- package/transforms/Tamil-Malayalam.txt +7 -0
- package/transforms/Tamil-Oriya.json +9 -0
- package/transforms/Tamil-Oriya.txt +7 -0
- package/transforms/Tamil-Telugu.json +9 -0
- package/transforms/Tamil-Telugu.txt +7 -0
- package/transforms/Tamil-ur.json +8 -0
- package/transforms/Tamil-ur.txt +7 -0
- package/transforms/Telugu-Arabic.json +9 -0
- package/transforms/Telugu-Arabic.txt +7 -0
- package/transforms/Telugu-Bengali.json +9 -0
- package/transforms/Telugu-Bengali.txt +7 -0
- package/transforms/Telugu-Devanagari.json +9 -0
- package/transforms/Telugu-Devanagari.txt +7 -0
- package/transforms/Telugu-Gujarati.json +9 -0
- package/transforms/Telugu-Gujarati.txt +7 -0
- package/transforms/Telugu-Gurmukhi.json +9 -0
- package/transforms/Telugu-Gurmukhi.txt +7 -0
- package/transforms/Telugu-InterIndic.json +7 -0
- package/transforms/Telugu-InterIndic.txt +87 -0
- package/transforms/Telugu-Kannada.json +9 -0
- package/transforms/Telugu-Kannada.txt +7 -0
- package/transforms/Telugu-Latin.json +9 -0
- package/transforms/Telugu-Latin.txt +7 -0
- package/transforms/Telugu-Malayalam.json +9 -0
- package/transforms/Telugu-Malayalam.txt +7 -0
- package/transforms/Telugu-Oriya.json +9 -0
- package/transforms/Telugu-Oriya.txt +7 -0
- package/transforms/Telugu-Tamil.json +9 -0
- package/transforms/Telugu-Tamil.txt +7 -0
- package/transforms/Telugu-ur.json +8 -0
- package/transforms/Telugu-ur.txt +7 -0
- package/transforms/Thaana-Latin.json +11 -0
- package/transforms/Thaana-Latin.txt +433 -0
- package/transforms/Thai-Latin.json +9 -0
- package/transforms/Thai-Latin.txt +9 -0
- package/transforms/Thai-ThaiLogical.json +7 -0
- package/transforms/Thai-ThaiLogical.txt +16 -0
- package/transforms/Thai-ThaiSemi.json +7 -0
- package/transforms/Thai-ThaiSemi.txt +6 -0
- package/transforms/ThaiLogical-Latin.json +7 -0
- package/transforms/ThaiLogical-Latin.txt +147 -0
- package/transforms/Turkmen-Latin-BGN.json +9 -0
- package/transforms/Turkmen-Latin-BGN.txt +302 -0
- package/transforms/Ukrainian-Latin-BGN.json +9 -0
- package/transforms/Ukrainian-Latin-BGN.txt +283 -0
- package/transforms/Uzbek-Latin-BGN.json +9 -0
- package/transforms/Uzbek-Latin-BGN.txt +261 -0
- package/transforms/am-Ethi-t-am-brai.json +11 -0
- package/transforms/am-Ethi-t-am-brai.txt +652 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.json +9 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.txt +6925 -0
- package/transforms/am-Ethi-t-d0-morse.json +9 -0
- package/transforms/am-Ethi-t-d0-morse.txt +657 -0
- package/transforms/am-am_FONIPA.json +9 -0
- package/transforms/am-am_FONIPA.txt +694 -0
- package/transforms/am-ar.json +8 -0
- package/transforms/am-ar.txt +5 -0
- package/transforms/am-chr.json +8 -0
- package/transforms/am-chr.txt +4 -0
- package/transforms/am-fa.json +8 -0
- package/transforms/am-fa.txt +4 -0
- package/transforms/az-Lower.json +8 -0
- package/transforms/az-Lower.txt +13 -0
- package/transforms/az-Title.json +8 -0
- package/transforms/az-Title.txt +11 -0
- package/transforms/az-Upper.json +8 -0
- package/transforms/az-Upper.txt +5 -0
- package/transforms/blt-fonipa-t-blt.json +8 -0
- package/transforms/blt-fonipa-t-blt.txt +132 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.txt +537 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.txt +773 -0
- package/transforms/ch-am.json +8 -0
- package/transforms/ch-am.txt +4 -0
- package/transforms/ch-ar.json +8 -0
- package/transforms/ch-ar.txt +4 -0
- package/transforms/ch-ch_FONIPA.json +8 -0
- package/transforms/ch-ch_FONIPA.txt +79 -0
- package/transforms/ch-chr.json +8 -0
- package/transforms/ch-chr.txt +4 -0
- package/transforms/ch-fa.json +8 -0
- package/transforms/ch-fa.txt +4 -0
- package/transforms/chr-chr_FONIPA.json +8 -0
- package/transforms/chr-chr_FONIPA.txt +111 -0
- package/transforms/cs-am.json +8 -0
- package/transforms/cs-am.txt +4 -0
- package/transforms/cs-ar.json +8 -0
- package/transforms/cs-ar.txt +4 -0
- package/transforms/cs-chr.json +8 -0
- package/transforms/cs-chr.txt +4 -0
- package/transforms/cs-cs_FONIPA.json +8 -0
- package/transforms/cs-cs_FONIPA.txt +74 -0
- package/transforms/cs-fa.json +8 -0
- package/transforms/cs-fa.txt +4 -0
- package/transforms/cs-ja.json +8 -0
- package/transforms/cs-ja.txt +4 -0
- package/transforms/cs-ko.json +8 -0
- package/transforms/cs-ko.txt +4 -0
- package/transforms/cs_FONIPA-ja.json +8 -0
- package/transforms/cs_FONIPA-ja.txt +228 -0
- package/transforms/cs_FONIPA-ko.json +8 -0
- package/transforms/cs_FONIPA-ko.txt +88 -0
- package/transforms/cy-fonipa-t-cy.json +8 -0
- package/transforms/cy-fonipa-t-cy.txt +189 -0
- package/transforms/de-ASCII.json +8 -0
- package/transforms/de-ASCII.txt +15 -0
- package/transforms/dsb-dsb_FONIPA.json +8 -0
- package/transforms/dsb-dsb_FONIPA.txt +67 -0
- package/transforms/el-Lower.json +8 -0
- package/transforms/el-Lower.txt +12 -0
- package/transforms/el-Title.json +8 -0
- package/transforms/el-Title.txt +12 -0
- package/transforms/el-Upper.json +8 -0
- package/transforms/el-Upper.txt +11 -0
- package/transforms/eo-am.json +8 -0
- package/transforms/eo-am.txt +4 -0
- package/transforms/eo-ar.json +8 -0
- package/transforms/eo-ar.txt +4 -0
- package/transforms/eo-chr.json +8 -0
- package/transforms/eo-chr.txt +4 -0
- package/transforms/eo-eo_FONIPA.json +8 -0
- package/transforms/eo-eo_FONIPA.txt +47 -0
- package/transforms/eo-fa.json +8 -0
- package/transforms/eo-fa.txt +4 -0
- package/transforms/es-am.json +8 -0
- package/transforms/es-am.txt +4 -0
- package/transforms/es-ar.json +8 -0
- package/transforms/es-ar.txt +13 -0
- package/transforms/es-chr.json +8 -0
- package/transforms/es-chr.txt +4 -0
- package/transforms/es-es_FONIPA.json +8 -0
- package/transforms/es-es_FONIPA.txt +139 -0
- package/transforms/es-fa.json +8 -0
- package/transforms/es-fa.txt +13 -0
- package/transforms/es-ja.json +8 -0
- package/transforms/es-ja.txt +4 -0
- package/transforms/es-zh.json +8 -0
- package/transforms/es-zh.txt +4 -0
- package/transforms/es_419-am.json +8 -0
- package/transforms/es_419-am.txt +5 -0
- package/transforms/es_419-ar.json +8 -0
- package/transforms/es_419-ar.txt +14 -0
- package/transforms/es_419-chr.json +8 -0
- package/transforms/es_419-chr.txt +5 -0
- package/transforms/es_419-fa.json +8 -0
- package/transforms/es_419-fa.txt +14 -0
- package/transforms/es_419-ja.json +8 -0
- package/transforms/es_419-ja.txt +5 -0
- package/transforms/es_419-zh.json +8 -0
- package/transforms/es_419-zh.txt +5 -0
- package/transforms/es_FONIPA-am.json +8 -0
- package/transforms/es_FONIPA-am.txt +230 -0
- package/transforms/es_FONIPA-es_419_FONIPA.json +8 -0
- package/transforms/es_FONIPA-es_419_FONIPA.txt +6 -0
- package/transforms/es_FONIPA-ja.json +8 -0
- package/transforms/es_FONIPA-ja.txt +155 -0
- package/transforms/es_FONIPA-zh.json +8 -0
- package/transforms/es_FONIPA-zh.txt +522 -0
- package/transforms/fa-fa_FONIPA.json +8 -0
- package/transforms/fa-fa_FONIPA.txt +107 -0
- package/transforms/gz-Ethi-t-und-sarb.json +11 -0
- package/transforms/gz-Ethi-t-und-sarb.txt +180 -0
- package/transforms/ha-ha_NE.json +8 -0
- package/transforms/ha-ha_NE.txt +6 -0
- package/transforms/hy-am.json +8 -0
- package/transforms/hy-am.txt +4 -0
- package/transforms/hy-ar.json +8 -0
- package/transforms/hy-ar.txt +4 -0
- package/transforms/hy-chr.json +8 -0
- package/transforms/hy-chr.txt +4 -0
- package/transforms/hy-fa.json +8 -0
- package/transforms/hy-fa.txt +4 -0
- package/transforms/hy-hy_FONIPA.json +8 -0
- package/transforms/hy-hy_FONIPA.txt +52 -0
- package/transforms/hy_AREVMDA-am.json +8 -0
- package/transforms/hy_AREVMDA-am.txt +4 -0
- package/transforms/hy_AREVMDA-ar.json +8 -0
- package/transforms/hy_AREVMDA-ar.txt +4 -0
- package/transforms/hy_AREVMDA-chr.json +8 -0
- package/transforms/hy_AREVMDA-chr.txt +4 -0
- package/transforms/hy_AREVMDA-fa.json +8 -0
- package/transforms/hy_AREVMDA-fa.txt +4 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.json +8 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.txt +80 -0
- package/transforms/ia-am.json +8 -0
- package/transforms/ia-am.txt +4 -0
- package/transforms/ia-ar.json +8 -0
- package/transforms/ia-ar.txt +4 -0
- package/transforms/ia-chr.json +8 -0
- package/transforms/ia-chr.txt +4 -0
- package/transforms/ia-fa.json +8 -0
- package/transforms/ia-fa.txt +4 -0
- package/transforms/ia-ia_FONIPA.json +8 -0
- package/transforms/ia-ia_FONIPA.txt +71 -0
- package/transforms/it-am.json +8 -0
- package/transforms/it-am.txt +257 -0
- package/transforms/it-ja.json +8 -0
- package/transforms/it-ja.txt +259 -0
- package/transforms/ja_Latn-ko.json +8 -0
- package/transforms/ja_Latn-ko.txt +141 -0
- package/transforms/ja_Latn-ru.json +8 -0
- package/transforms/ja_Latn-ru.txt +123 -0
- package/transforms/kk-am.json +8 -0
- package/transforms/kk-am.txt +4 -0
- package/transforms/kk-ar.json +8 -0
- package/transforms/kk-ar.txt +4 -0
- package/transforms/kk-chr.json +8 -0
- package/transforms/kk-chr.txt +4 -0
- package/transforms/kk-fa.json +8 -0
- package/transforms/kk-fa.txt +4 -0
- package/transforms/kk-kk_FONIPA.json +8 -0
- package/transforms/kk-kk_FONIPA.txt +59 -0
- package/transforms/ky-am.json +8 -0
- package/transforms/ky-am.txt +4 -0
- package/transforms/ky-ar.json +8 -0
- package/transforms/ky-ar.txt +4 -0
- package/transforms/ky-chr.json +8 -0
- package/transforms/ky-chr.txt +4 -0
- package/transforms/ky-fa.json +8 -0
- package/transforms/ky-fa.txt +4 -0
- package/transforms/ky-ky_FONIPA.json +8 -0
- package/transforms/ky-ky_FONIPA.txt +71 -0
- package/transforms/la-la_FONIPA.json +8 -0
- package/transforms/la-la_FONIPA.txt +79 -0
- package/transforms/lt-Lower.json +8 -0
- package/transforms/lt-Lower.txt +20 -0
- package/transforms/lt-Title.json +8 -0
- package/transforms/lt-Title.txt +15 -0
- package/transforms/lt-Upper.json +8 -0
- package/transforms/lt-Upper.txt +8 -0
- package/transforms/mn-mn_Latn-MNS.json +8 -0
- package/transforms/mn-mn_Latn-MNS.txt +86 -0
- package/transforms/my-am.json +8 -0
- package/transforms/my-am.txt +4 -0
- package/transforms/my-ar.json +8 -0
- package/transforms/my-ar.txt +4 -0
- package/transforms/my-chr.json +8 -0
- package/transforms/my-chr.txt +4 -0
- package/transforms/my-fa.json +8 -0
- package/transforms/my-fa.txt +4 -0
- package/transforms/my-my_FONIPA.json +8 -0
- package/transforms/my-my_FONIPA.txt +325 -0
- package/transforms/my-t-my-d0-zawgyi.json +8 -0
- package/transforms/my-t-my-d0-zawgyi.txt +222 -0
- package/transforms/my-t-my-s0-zawgyi.json +8 -0
- package/transforms/my-t-my-s0-zawgyi.txt +231 -0
- package/transforms/nl-Title.json +8 -0
- package/transforms/nl-Title.txt +7 -0
- package/transforms/nv-nv_FONIPA.json +8 -0
- package/transforms/nv-nv_FONIPA.txt +74 -0
- package/transforms/pl-am.json +8 -0
- package/transforms/pl-am.txt +4 -0
- package/transforms/pl-ar.json +8 -0
- package/transforms/pl-ar.txt +4 -0
- package/transforms/pl-chr.json +8 -0
- package/transforms/pl-chr.txt +4 -0
- package/transforms/pl-fa.json +8 -0
- package/transforms/pl-fa.txt +4 -0
- package/transforms/pl-ja.json +8 -0
- package/transforms/pl-ja.txt +4 -0
- package/transforms/pl-pl_FONIPA.json +8 -0
- package/transforms/pl-pl_FONIPA.txt +113 -0
- package/transforms/pl_FONIPA-ja.json +8 -0
- package/transforms/pl_FONIPA-ja.txt +301 -0
- package/transforms/rm_SURSILV-am.json +8 -0
- package/transforms/rm_SURSILV-am.txt +4 -0
- package/transforms/rm_SURSILV-ar.json +8 -0
- package/transforms/rm_SURSILV-ar.txt +4 -0
- package/transforms/rm_SURSILV-chr.json +8 -0
- package/transforms/rm_SURSILV-chr.txt +4 -0
- package/transforms/rm_SURSILV-fa.json +8 -0
- package/transforms/rm_SURSILV-fa.txt +4 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.json +8 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.txt +96 -0
- package/transforms/ro-am.json +8 -0
- package/transforms/ro-am.txt +4 -0
- package/transforms/ro-ar.json +8 -0
- package/transforms/ro-ar.txt +4 -0
- package/transforms/ro-chr.json +8 -0
- package/transforms/ro-chr.txt +4 -0
- package/transforms/ro-fa.json +8 -0
- package/transforms/ro-fa.txt +4 -0
- package/transforms/ro-ja.json +8 -0
- package/transforms/ro-ja.txt +4 -0
- package/transforms/ro-ro_FONIPA.json +8 -0
- package/transforms/ro-ro_FONIPA.txt +121 -0
- package/transforms/ro_FONIPA-ja.json +8 -0
- package/transforms/ro_FONIPA-ja.txt +211 -0
- package/transforms/ru-ja.json +8 -0
- package/transforms/ru-ja.txt +444 -0
- package/transforms/ru-zh.json +8 -0
- package/transforms/ru-zh.txt +996 -0
- package/transforms/ru_Latn-ru-BGN.json +9 -0
- package/transforms/ru_Latn-ru-BGN.txt +97 -0
- package/transforms/sat-am.json +8 -0
- package/transforms/sat-am.txt +6 -0
- package/transforms/sat-ar.json +8 -0
- package/transforms/sat-ar.txt +6 -0
- package/transforms/sat-chr.json +8 -0
- package/transforms/sat-chr.txt +6 -0
- package/transforms/sat-fa.json +8 -0
- package/transforms/sat-fa.txt +6 -0
- package/transforms/sat_Olck-sat_FONIPA.json +8 -0
- package/transforms/sat_Olck-sat_FONIPA.txt +174 -0
- package/transforms/sgw-Ethi-t-und-ethi.json +11 -0
- package/transforms/sgw-Ethi-t-und-ethi.txt +138 -0
- package/transforms/si-am.json +8 -0
- package/transforms/si-am.txt +4 -0
- package/transforms/si-ar.json +8 -0
- package/transforms/si-ar.txt +4 -0
- package/transforms/si-chr.json +8 -0
- package/transforms/si-chr.txt +4 -0
- package/transforms/si-fa.json +8 -0
- package/transforms/si-fa.txt +4 -0
- package/transforms/si-si_FONIPA.json +8 -0
- package/transforms/si-si_FONIPA.txt +157 -0
- package/transforms/si-si_Latn.json +8 -0
- package/transforms/si-si_Latn.txt +94 -0
- package/transforms/sk-am.json +8 -0
- package/transforms/sk-am.txt +4 -0
- package/transforms/sk-ar.json +8 -0
- package/transforms/sk-ar.txt +4 -0
- package/transforms/sk-chr.json +8 -0
- package/transforms/sk-chr.txt +4 -0
- package/transforms/sk-fa.json +8 -0
- package/transforms/sk-fa.txt +4 -0
- package/transforms/sk-ja.json +8 -0
- package/transforms/sk-ja.txt +4 -0
- package/transforms/sk-sk_FONIPA.json +8 -0
- package/transforms/sk-sk_FONIPA.txt +101 -0
- package/transforms/sk_FONIPA-ja.json +8 -0
- package/transforms/sk_FONIPA-ja.txt +252 -0
- package/transforms/ta-ta_FONIPA.json +8 -0
- package/transforms/ta-ta_FONIPA.txt +73 -0
- package/transforms/tlh-am.json +8 -0
- package/transforms/tlh-am.txt +4 -0
- package/transforms/tlh-ar.json +8 -0
- package/transforms/tlh-ar.txt +4 -0
- package/transforms/tlh-chr.json +8 -0
- package/transforms/tlh-chr.txt +4 -0
- package/transforms/tlh-fa.json +8 -0
- package/transforms/tlh-fa.txt +4 -0
- package/transforms/tlh-tlh_FONIPA.json +8 -0
- package/transforms/tlh-tlh_FONIPA.txt +46 -0
- package/transforms/tr-Lower.json +8 -0
- package/transforms/tr-Lower.txt +13 -0
- package/transforms/tr-Title.json +8 -0
- package/transforms/tr-Title.txt +11 -0
- package/transforms/tr-Upper.json +8 -0
- package/transforms/tr-Upper.txt +8 -0
- package/transforms/ug-ug_FONIPA.json +8 -0
- package/transforms/ug-ug_FONIPA.txt +69 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.json +11 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.txt +747 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.txt +633 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.txt +757 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.txt +585 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.txt +640 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.txt +619 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.txt +627 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.txt +695 -0
- package/transforms/und-Ethi-t-und-latn.json +11 -0
- package/transforms/und-Ethi-t-und-latn.txt +16 -0
- package/transforms/und_FONIPA-ar.json +8 -0
- package/transforms/und_FONIPA-ar.txt +114 -0
- package/transforms/und_FONIPA-chr.json +8 -0
- package/transforms/und_FONIPA-chr.txt +172 -0
- package/transforms/und_FONIPA-fa.json +8 -0
- package/transforms/und_FONIPA-fa.txt +109 -0
- package/transforms/uz_Cyrl-uz_Latn.json +9 -0
- package/transforms/uz_Cyrl-uz_Latn.txt +103 -0
- package/transforms/vec-vec_FONIPA.json +8 -0
- package/transforms/vec-vec_FONIPA.txt +85 -0
- package/transforms/xh-am.json +8 -0
- package/transforms/xh-am.txt +4 -0
- package/transforms/xh-ar.json +8 -0
- package/transforms/xh-ar.txt +4 -0
- package/transforms/xh-chr.json +8 -0
- package/transforms/xh-chr.txt +4 -0
- package/transforms/xh-fa.json +8 -0
- package/transforms/xh-fa.txt +4 -0
- package/transforms/xh-xh_FONIPA.json +8 -0
- package/transforms/xh-xh_FONIPA.txt +85 -0
- package/transforms/yo-yo_BJ.json +8 -0
- package/transforms/yo-yo_BJ.txt +36 -0
- package/transforms/zh_Latn_PINYIN-ru.json +8 -0
- package/transforms/zh_Latn_PINYIN-ru.txt +148 -0
- package/transforms/zu-am.json +8 -0
- package/transforms/zu-am.txt +4 -0
- package/transforms/zu-ar.json +8 -0
- package/transforms/zu-ar.txt +4 -0
- package/transforms/zu-chr.json +8 -0
- package/transforms/zu-chr.txt +4 -0
- package/transforms/zu-fa.json +8 -0
- package/transforms/zu-fa.txt +4 -0
- package/transforms/zu-zu_FONIPA.json +8 -0
- package/transforms/zu-zu_FONIPA.txt +72 -0
- package/transforms.json +385 -0
|
@@ -0,0 +1,35 @@
|
|
|
1
|
+
|
|
2
|
+
# Only intended for internal use
|
|
3
|
+
# Make sure Han are normalized, including characters that contain them.
|
|
4
|
+
# The first set in the filter is computed with http://unicode.org/cldr/utility/list-unicodeset.jsp?a=[:tonfkd:/XXX/:]-[:ideographic:]-[:sc=han:]
|
|
5
|
+
# Where XXX is the resolved [:ideographic:][:sc=han:]. It needs updating with each Unicode release!
|
|
6
|
+
:: [[、。々《-』〜・㆒-㆟㈠-㉇㊀-㊰㋀-㋋ ㍘-㍰㍻-㍿㏠-㏾🈐-🈒🈔-🈺🉀-🉈🉐🉑][:ideographic:][:sc=han:]] nfkc;
|
|
7
|
+
:: fullwidth-halfwidth;
|
|
8
|
+
。 → '.';
|
|
9
|
+
。→ '.';
|
|
10
|
+
、→ ',';
|
|
11
|
+
、→ ',';
|
|
12
|
+
《→ '«';
|
|
13
|
+
》→ '»';
|
|
14
|
+
〈 → '‹';
|
|
15
|
+
〉→ '›';
|
|
16
|
+
「→ '‘';
|
|
17
|
+
」→ '’';
|
|
18
|
+
「→ '‘';
|
|
19
|
+
」→ '’';
|
|
20
|
+
『→ '“';
|
|
21
|
+
』→ '”';
|
|
22
|
+
・→ '‧';
|
|
23
|
+
・ → '‧';
|
|
24
|
+
々→ '⓶';
|
|
25
|
+
〜→ '~';
|
|
26
|
+
$terminalPunct = [\.\,\:\;\?\!.,:?!。、;[:Pe:][:Pf:]];
|
|
27
|
+
$initialPunct = [[:Ps:][:Pi:]]; # one opening-bracket or initial-quote character (a single set, like $terminalPunct)
|
|
28
|
+
# add space between any Han or terminal punctuation and letters, and
|
|
29
|
+
# between letters and Han or initial punct
|
|
30
|
+
[[:Ideographic:] $terminalPunct] {} [:Letter:] → ' ' ;
|
|
31
|
+
[:Letter:] [:Mark:]* {} [[:Ideographic:] $initialPunct] → ' ' ;
|
|
32
|
+
# remove spacing between ideographs and other letters
|
|
33
|
+
← [:Ideographic:] { ' ' } [:Letter:] ;
|
|
34
|
+
← [:Letter:] [:Mark:]* { ' ' } [:Ideographic:] ;
|
|
35
|
+
|
|
@@ -0,0 +1,113 @@
|
|
|
1
|
+
|
|
2
|
+
#
|
|
3
|
+
########################################################################
|
|
4
|
+
# BGN/PCGN 1981 System
|
|
5
|
+
#
|
|
6
|
+
# The BGN/PCGN system for Hebrew was designed for use in romanizing
|
|
7
|
+
# names written in the Hebrew alphabet. The Roman letters and letter
|
|
8
|
+
# combinations shown as equivalents to the Hebrew characters reflect
|
|
9
|
+
# the pronunciation of Hebrew. (The previous wording, which named the
|
|
10
|
+
# Republic of Armenia, was left over from the Armenian BGN table.)
|
|
11
|
+
#
|
|
12
|
+
# The Hebrew Alphabet as defined by the BGN (Page 33-35):
|
|
13
|
+
#
|
|
14
|
+
# אבגדהוזחטיכךלמםנןסעפףצץקרששת
|
|
15
|
+
#
|
|
16
|
+
# Originally prepared by Michael Everson <everson@evertype.com>
|
|
17
|
+
########################################################################
|
|
18
|
+
#
|
|
19
|
+
# MINIMAL FILTER: Hebrew-Latin
|
|
20
|
+
#
|
|
21
|
+
:: [ ְֱֲֳִֵֶַָֹֻּׁׂאבגדהוזחטיךכלםמןנסעףפץצקרשת׳] ;
|
|
22
|
+
:: NFD (NFC) ;
|
|
23
|
+
#
|
|
24
|
+
#
|
|
25
|
+
########################################################################
|
|
26
|
+
#
|
|
27
|
+
########################################################################
|
|
28
|
+
#
|
|
29
|
+
# Define All Transformation Variables
|
|
30
|
+
#
|
|
31
|
+
########################################################################
|
|
32
|
+
#
|
|
33
|
+
$alef = ’;
|
|
34
|
+
$ayin = ‘;
|
|
35
|
+
#
|
|
36
|
+
#
|
|
37
|
+
# Use this $wordBoundary until bug 2034 is fixed in ICU:
|
|
38
|
+
# http://bugs.icu-project.org/cgi-bin/icu-bugs/transliterate?id=2034;expression=boundary;user=guest
|
|
39
|
+
#
|
|
40
|
+
$wordBoundary = [^[:L:][:M:][:N:]] ;
|
|
41
|
+
#
|
|
42
|
+
#
|
|
43
|
+
########################################################################
|
|
44
|
+
#
|
|
45
|
+
########################################################################
|
|
46
|
+
#
|
|
47
|
+
# Rules moved to front to avoid masking
|
|
48
|
+
#
|
|
49
|
+
########################################################################
|
|
50
|
+
#
|
|
51
|
+
בּ → b ; # HEBREW LETTER BET + DAGESH
|
|
52
|
+
פּ → p ; # HEBREW LETTER PE + DAGESH (lowercase, like every other rule output)
|
|
53
|
+
גּ → g ; # HEBREW LETTER GIMEL + DAGESH
|
|
54
|
+
ג׳ → ǧ ; # HEBREW LETTER GIMEL + GERESH
|
|
55
|
+
וּ → u ; # HEBREW LETTER VAV + POINT DAGESH
|
|
56
|
+
וֹ → o ; # HEBREW LETTER VAV + POINT HOLAM
|
|
57
|
+
צ׳ → č ; # HEBREW LETTER TSADI + GERESH
|
|
58
|
+
ז׳ → ž ; # HEBREW LETTER ZAYIN + GERESH
|
|
59
|
+
דּ → d ; # HEBREW LETTER DALET + DAGESH
|
|
60
|
+
הּ → h ; # HEBREW LETTER HE + DAGESH
|
|
61
|
+
ךּ → k ; # HEBREW LETTER FINAL KAF + DAGESH
|
|
62
|
+
כּ → k ; # HEBREW LETTER KAF + DAGESH
|
|
63
|
+
ךְ → kh ; # HEBREW LETTER FINAL KAF + SHEVA
|
|
64
|
+
תּ → t ; # HEBREW LETTER TAV + DAGESH
|
|
65
|
+
#
|
|
66
|
+
#
|
|
67
|
+
########################################################################
|
|
68
|
+
#
|
|
69
|
+
########################################################################
|
|
70
|
+
#
|
|
71
|
+
# Start of Alphabetic Transformations
|
|
72
|
+
#
|
|
73
|
+
########################################################################
|
|
74
|
+
#
|
|
75
|
+
א → $alef ; # HEBREW LETTER ALEF
|
|
76
|
+
ב → v ; # HEBREW LETTER BET
|
|
77
|
+
ג → g ; # HEBREW LETTER GIMEL
|
|
78
|
+
ד → d ; # HEBREW LETTER DALET
|
|
79
|
+
ה → h ; # HEBREW LETTER HE
|
|
80
|
+
ח → ẖ ; # HEBREW LETTER HET
|
|
81
|
+
ו → w ; # HEBREW LETTER VAV
|
|
82
|
+
ז → z ; # HEBREW LETTER ZAYIN
|
|
83
|
+
[טת] → t ; # HEBREW LETTER TET and TAV
|
|
84
|
+
י → y ; # HEBREW LETTER YOD
|
|
85
|
+
[כך] → kh ; # HEBREW LETTER KAF and FINAL KAF
|
|
86
|
+
ל → l ; # HEBREW LETTER LAMED
|
|
87
|
+
[מם] → m ; # HEBREW LETTER MEM and FINAL MEM
|
|
88
|
+
[נן] → n ; # HEBREW LETTER NUN and FINAL NUN
|
|
89
|
+
ס → s ; # HEBREW LETTER SAMEKH
|
|
90
|
+
ע → $ayin ; # HEBREW LETTER AYIN
|
|
91
|
+
[פף] → f ; # HEBREW LETTER PE and FINAL PE
|
|
92
|
+
[צץ] → ẕ ; # HEBREW LETTER TSADI and FINAL TSADI
|
|
93
|
+
ק → q ; # HEBREW LETTER QOF
|
|
94
|
+
ר → r ; # HEBREW LETTER RESH
|
|
95
|
+
שׁ → sh ; # HEBREW LETTER SHIN + POINT SHIN DOT
|
|
96
|
+
שׂ → s ; # HEBREW LETTER SHIN + POINT SIN DOT
|
|
97
|
+
ַ → a ; # HEBREW POINT PATAH
|
|
98
|
+
ֲ → a ; # HEBREW POINT HATAF PATAH
|
|
99
|
+
ָ → o ; # HEBREW POINT QAMATS
|
|
100
|
+
ֶ → e ; # HEBREW POINT SEGOL
|
|
101
|
+
ֱ → e ; # HEBREW POINT HATAF SEGOL
|
|
102
|
+
ֵי → e ; # HEBREW POINT TSERE + LETTER YOD
|
|
103
|
+
ֵ → e ; # HEBREW POINT TSERE
|
|
104
|
+
ְ → e ; # HEBREW POINT SHEVA
|
|
105
|
+
ִי → i ; # HEBREW POINT HIRIQ + LETTER YOD
|
|
106
|
+
ִ → i ; # HEBREW POINT HIRIQ
|
|
107
|
+
ֳ → o ; # HEBREW POINT HATAF QAMATS
|
|
108
|
+
ֹ → o ; # HEBREW POINT HOLAM
|
|
109
|
+
ֻ → u ; # HEBREW POINT QUBUTS
|
|
110
|
+
#
|
|
111
|
+
#
|
|
112
|
+
########################################################################
|
|
113
|
+
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
{
|
|
2
|
+
"_backwardAlias": "Latin-Hebrew",
|
|
3
|
+
"_visibility": "external",
|
|
4
|
+
"_backwardAliasBcp47": "und-Hebr-t-und-latn",
|
|
5
|
+
"_alias": "Hebrew-Latin",
|
|
6
|
+
"_aliasBcp47": "und-Latn-t-und-hebr",
|
|
7
|
+
"_source": "Hebr",
|
|
8
|
+
"_direction": "both",
|
|
9
|
+
"_target": "Latn",
|
|
10
|
+
"_rulesFile": "Hebrew-Latin.txt"
|
|
11
|
+
}
|
|
@@ -0,0 +1,91 @@
|
|
|
1
|
+
|
|
2
|
+
# Transliteration table for Hebrew
|
|
3
|
+
# Based on the UNGEGN table at:
|
|
4
|
+
# http://www.eki.ee/wgrs/rom1_he.pdf
|
|
5
|
+
#
|
|
6
|
+
# Exceptions:
|
|
7
|
+
# - Accents are added to disambiguate letters
|
|
8
|
+
# - Combinations of dagesh, shin/sin dot that produce different
|
|
9
|
+
# letters are not yet encoded.
|
|
10
|
+
#
|
|
11
|
+
# To test, open:
|
|
12
|
+
# http://www.ibm.com/software/globalization/icu/demo/transform
|
|
13
|
+
# Click Edit, paste in this file, Save As hebrew-latin/XXX
|
|
14
|
+
# (where XXX is a username)
|
|
15
|
+
# Now go back to the main window, and try it out.
|
|
16
|
+
# Use hebrew-latin/XXX for Output 1, and (Inverse) for Output 2
|
|
17
|
+
# Paste in hebrew text in Input, and hit Transliterate.
|
|
18
|
+
#
|
|
19
|
+
# For more information, see:
|
|
20
|
+
# http://icu.sourceforge.net/userguide/Transform.html
|
|
21
|
+
:: [[־׳״][:Hebrew:] [:^ccc=0:] [ְ-ֹֻ-ּׁ-ׂℵ-ℸֿ̄] - [ֽ]] ;
|
|
22
|
+
:: nfkd (nfc) ;
|
|
23
|
+
׳ ↔ '′';
|
|
24
|
+
״ ↔ '″';
|
|
25
|
+
־ ↔ '-';
|
|
26
|
+
$letterAfter = [:M:]* [:L:] ;
|
|
27
|
+
# move longer items here to avoid masking
|
|
28
|
+
ח ↔ ẖ ;
|
|
29
|
+
צ ↔ ẕ } $letterAfter;
|
|
30
|
+
ץ ↔ ẕ ;
|
|
31
|
+
ש ↔ ş ;
|
|
32
|
+
ת ↔ ţ ;
|
|
33
|
+
א ↔ ʼ ;
|
|
34
|
+
ב ↔ b ;
|
|
35
|
+
ג ↔ g ;
|
|
36
|
+
ד ↔ d ;
|
|
37
|
+
ה ↔ h ;
|
|
38
|
+
ו ↔ w ;
|
|
39
|
+
ז ↔ z ;
|
|
40
|
+
ט ↔ t ;
|
|
41
|
+
י ↔ y ;
|
|
42
|
+
כ ↔ k } $letterAfter;
|
|
43
|
+
ך ↔ k ;
|
|
44
|
+
ל ↔ l ;
|
|
45
|
+
מ ↔ m } $letterAfter;
|
|
46
|
+
ם ↔ m ;
|
|
47
|
+
נ ↔ n } $letterAfter;
|
|
48
|
+
ן ↔ n ;
|
|
49
|
+
ס ↔ s ;
|
|
50
|
+
ע ↔ ʻ ;
|
|
51
|
+
פ ↔ p } $letterAfter;
|
|
52
|
+
ף ↔ p ;
|
|
53
|
+
ק ↔ q ;
|
|
54
|
+
ר ↔ r ;
|
|
55
|
+
װ → | וו; # HEBREW LIGATURE YIDDISH DOUBLE VAV
|
|
56
|
+
ױ → | וי; # HEBREW LIGATURE YIDDISH VAV YOD
|
|
57
|
+
ײ → | יי ; # HEBREW LIGATURE YIDDISH DOUBLE YOD
|
|
58
|
+
ּ ↔ ̇ ; # dagesh just goes to overdot for now
|
|
59
|
+
ׁ ↔ ̌ ; # shin dot -→ sh
|
|
60
|
+
ׂ ↔ ̂ ; # sin dot -→ s
|
|
61
|
+
# points
|
|
62
|
+
$above = [^[:ccc=0:][:ccc=230:]]*;
|
|
63
|
+
ֲ → à ;
|
|
64
|
+
ֲ $1← a ($above) ̀;
|
|
65
|
+
ָ → á ;
|
|
66
|
+
ָ $1 ← a ($above) ́;
|
|
67
|
+
ֱ → è ;
|
|
68
|
+
ֱ $1 ← e ($above) ̀;
|
|
69
|
+
ֵ → é ;
|
|
70
|
+
ֵ $1 ← e ($above) ́;
|
|
71
|
+
ְ → e ̆ ;
|
|
72
|
+
ְ $1 ← e ($above) ̆;
|
|
73
|
+
ֹ → ò ;
|
|
74
|
+
ֹ $1 ← o ($above) ̀;
|
|
75
|
+
ִ ↔ i ;
|
|
76
|
+
ֻ ↔ u ;
|
|
77
|
+
ַ ↔ a ;
|
|
78
|
+
ֶ ↔ e ;
|
|
79
|
+
ֳ ↔ o ;
|
|
80
|
+
ֿ ↔ ̄ ;
|
|
81
|
+
# fallbacks
|
|
82
|
+
ק ← c ;
|
|
83
|
+
פ ← f } $letterAfter;
|
|
84
|
+
ף ← f ;
|
|
85
|
+
ז ← j ;
|
|
86
|
+
ו ← v ;
|
|
87
|
+
כס ← x ;
|
|
88
|
+
:: (lower);
|
|
89
|
+
:: nfc (nfd) ;
|
|
90
|
+
:: ([[-′″][:Latin:] [:^ccc=0:] [ʻ-ʼ̀-̧̱̂̇̌̀-́ ̄ ]]);
|
|
91
|
+
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
{
|
|
2
|
+
"_backwardAlias": "Katakana-Hiragana",
|
|
3
|
+
"_visibility": "external",
|
|
4
|
+
"_backwardAliasBcp47": "und-Hira-t-und-kana",
|
|
5
|
+
"_alias": "Hiragana-Katakana",
|
|
6
|
+
"_aliasBcp47": "und-Kana-t-und-hira",
|
|
7
|
+
"_source": "Hira",
|
|
8
|
+
"_direction": "both",
|
|
9
|
+
"_target": "Kana",
|
|
10
|
+
"_rulesFile": "Hiragana-Katakana.txt"
|
|
11
|
+
}
|
|
@@ -0,0 +1,179 @@
|
|
|
1
|
+
|
|
2
|
+
# note: a global filter is more efficient, but MUST include all source chars
|
|
3
|
+
:: [[\u0000-\u007E 、。 ゙-゜ ァ-ー 。-゚ー[:Hiragana:] [:Katakana:] [:nonspacing mark:]]-[\u309B \u309C]];
|
|
4
|
+
:: NFKC (NFC);
|
|
5
|
+
# Hiragana-Katakana
|
|
6
|
+
# This is largely a one-to-one mapping, but it has a
|
|
7
|
+
# few kinks:
|
|
8
|
+
# 1. The Katakana va/vi/ve/vo (30F7-30FA) have no
|
|
9
|
+
# Hiragana equivalents. We use Hiragana wa/wi/we/wo
|
|
10
|
+
# (308F-3092) with a voicing mark (3099), which is
|
|
11
|
+
# semantically equivalent. However, this is a non-
|
|
12
|
+
# roundtripping transformation.
|
|
13
|
+
# 2. The Katakana small ka/ke (30F5,30F6) have no
|
|
14
|
+
# Hiragana equivalents. We convert them to normal
|
|
15
|
+
# Hiragana ka/ke (304B,3051). This is a one-way
|
|
16
|
+
# information-losing transformation and precludes
|
|
17
|
+
# round-tripping of 30F5 and 30F6.
|
|
18
|
+
# 3. The combining marks 3099-309C are in the Hiragana
|
|
19
|
+
# block, but they apply to Katakana as well, so we
|
|
20
|
+
# leave them untouched.
|
|
21
|
+
# 4. The Katakana prolonged sound mark 30FC doubles the
|
|
22
|
+
# preceding vowel. This is a one-way information-
|
|
23
|
+
# losing transformation from Katakana to Hiragana.
|
|
24
|
+
# 5. The Katakana middle dot separates words in foreign
|
|
25
|
+
# expressions; we leave this unmodified.
|
|
26
|
+
# The above points preclude successful round-trip
|
|
27
|
+
# transformations of arbitrary input text. However,
|
|
28
|
+
# they provide naturalistic results that should conform
|
|
29
|
+
# to user expectations.
|
|
30
|
+
# Combining equivalents va/vi/ve/vo
|
|
31
|
+
わ゙ ↔ ヷ;
|
|
32
|
+
ゐ゙ ↔ ヸ;
|
|
33
|
+
ゑ゙ ↔ ヹ;
|
|
34
|
+
を゙ ↔ ヺ;
|
|
35
|
+
# One-to-one mappings, main block
|
|
36
|
+
# 3041:3094 ↔ 30A1:30F4
|
|
37
|
+
# 309D,E ↔ 30FD,E
|
|
38
|
+
ぁ ↔ ァ;
|
|
39
|
+
あ ↔ ア;
|
|
40
|
+
ぃ ↔ ィ;
|
|
41
|
+
い ↔ イ;
|
|
42
|
+
ぅ ↔ ゥ;
|
|
43
|
+
う ↔ ウ;
|
|
44
|
+
ぇ ↔ ェ;
|
|
45
|
+
え ↔ エ;
|
|
46
|
+
ぉ ↔ ォ;
|
|
47
|
+
お ↔ オ;
|
|
48
|
+
か ↔ カ;
|
|
49
|
+
が ↔ ガ;
|
|
50
|
+
き ↔ キ;
|
|
51
|
+
ぎ ↔ ギ;
|
|
52
|
+
く ↔ ク;
|
|
53
|
+
ぐ ↔ グ;
|
|
54
|
+
け ↔ ケ;
|
|
55
|
+
げ ↔ ゲ;
|
|
56
|
+
こ ↔ コ;
|
|
57
|
+
ご ↔ ゴ;
|
|
58
|
+
さ ↔ サ;
|
|
59
|
+
ざ ↔ ザ;
|
|
60
|
+
し ↔ シ;
|
|
61
|
+
じ ↔ ジ;
|
|
62
|
+
す ↔ ス;
|
|
63
|
+
ず ↔ ズ;
|
|
64
|
+
せ ↔ セ;
|
|
65
|
+
ぜ ↔ ゼ;
|
|
66
|
+
そ ↔ ソ;
|
|
67
|
+
ぞ ↔ ゾ;
|
|
68
|
+
た ↔ タ;
|
|
69
|
+
だ ↔ ダ;
|
|
70
|
+
ち ↔ チ;
|
|
71
|
+
ぢ ↔ ヂ;
|
|
72
|
+
っ ↔ ッ;
|
|
73
|
+
つ ↔ ツ;
|
|
74
|
+
づ ↔ ヅ;
|
|
75
|
+
て ↔ テ;
|
|
76
|
+
で ↔ デ;
|
|
77
|
+
と ↔ ト;
|
|
78
|
+
ど ↔ ド;
|
|
79
|
+
な ↔ ナ;
|
|
80
|
+
に ↔ ニ;
|
|
81
|
+
ぬ ↔ ヌ;
|
|
82
|
+
ね ↔ ネ;
|
|
83
|
+
の ↔ ノ;
|
|
84
|
+
は ↔ ハ;
|
|
85
|
+
ば ↔ バ;
|
|
86
|
+
ぱ ↔ パ;
|
|
87
|
+
ひ ↔ ヒ;
|
|
88
|
+
び ↔ ビ;
|
|
89
|
+
ぴ ↔ ピ;
|
|
90
|
+
ふ ↔ フ;
|
|
91
|
+
ぶ ↔ ブ;
|
|
92
|
+
ぷ ↔ プ;
|
|
93
|
+
へ ↔ ヘ;
|
|
94
|
+
べ ↔ ベ;
|
|
95
|
+
ぺ ↔ ペ;
|
|
96
|
+
ほ ↔ ホ;
|
|
97
|
+
ぼ ↔ ボ;
|
|
98
|
+
ぽ ↔ ポ;
|
|
99
|
+
ま ↔ マ;
|
|
100
|
+
み ↔ ミ;
|
|
101
|
+
む ↔ ム;
|
|
102
|
+
め ↔ メ;
|
|
103
|
+
も ↔ モ;
|
|
104
|
+
ゃ ↔ ャ;
|
|
105
|
+
や ↔ ヤ;
|
|
106
|
+
ゅ ↔ ュ;
|
|
107
|
+
ゆ ↔ ユ;
|
|
108
|
+
ょ ↔ ョ;
|
|
109
|
+
よ ↔ ヨ;
|
|
110
|
+
ら ↔ ラ;
|
|
111
|
+
り ↔ リ;
|
|
112
|
+
る ↔ ル;
|
|
113
|
+
れ ↔ レ;
|
|
114
|
+
ろ ↔ ロ;
|
|
115
|
+
ゎ ↔ ヮ;
|
|
116
|
+
わ ↔ ワ;
|
|
117
|
+
ゐ ↔ ヰ;
|
|
118
|
+
ゑ ↔ ヱ;
|
|
119
|
+
を ↔ ヲ;
|
|
120
|
+
ん ↔ ン;
|
|
121
|
+
ゔ ↔ ヴ;
|
|
122
|
+
ゝ ↔ ヽ;
|
|
123
|
+
ゞ ↔ ヾ;
|
|
124
|
+
# One-way Katakana-Hiragana xform of small K ka/ke to
|
|
125
|
+
# normal H ka/ke.
|
|
126
|
+
か ← ヵ;
|
|
127
|
+
け ← ヶ;
|
|
128
|
+
# Katakana followed by a prolonged sound mark 30FC has
|
|
129
|
+
# its final vowel doubled. This is a Katakana-Hiragana
|
|
130
|
+
# one-way information-losing transformation. We
|
|
131
|
+
# include the small kana (e.g., Hiragana small A 3041) and
|
|
132
|
+
# do not distinguish them from their large
|
|
133
|
+
# counterparts. It doesn't make sense to double a
|
|
134
|
+
# small counterpart vowel as a small Hiragana vowel, so
|
|
135
|
+
# we don't do so. In natural text this should never
|
|
136
|
+
# occur anyway. If a 30FC is seen without a preceding
|
|
137
|
+
# vowel sound (e.g., after n 30F3) we do not change it.
|
|
138
|
+
### $long = ー;
|
|
139
|
+
# The following categories are Hiragana, not Katakana
|
|
140
|
+
# as might be expected, since by the time we get to the
|
|
141
|
+
# 30FC, the preceding character will have already been
|
|
142
|
+
# transformed to Hiragana.
|
|
143
|
+
# {The following mechanically generated from the
|
|
144
|
+
# Unicode 3.0 data:}
|
|
145
|
+
$xa = [
|
|
146
|
+
ぁ あ か が さ ざ
|
|
147
|
+
た だ な は ば ぱ
|
|
148
|
+
ま ゃ や ら ゎ わ
|
|
149
|
+
];
|
|
150
|
+
$xi = [
|
|
151
|
+
ぃ い き ぎ し じ
|
|
152
|
+
ち ぢ に ひ び ぴ
|
|
153
|
+
み り ゐ
|
|
154
|
+
];
|
|
155
|
+
$xu = [
|
|
156
|
+
ぅ う く ぐ す ず
|
|
157
|
+
っ つ づ ぬ ふ ぶ
|
|
158
|
+
ぷ む ゅ ゆ る ゔ
|
|
159
|
+
];
|
|
160
|
+
$xe = [
|
|
161
|
+
ぇ え け げ せ ぜ
|
|
162
|
+
て で ね へ べ ぺ
|
|
163
|
+
め れ ゑ
|
|
164
|
+
];
|
|
165
|
+
$xo = [
|
|
166
|
+
ぉ お こ ご そ ぞ
|
|
167
|
+
と ど の ほ ぼ ぽ
|
|
168
|
+
も ょ よ ろ を
|
|
169
|
+
];
|
|
170
|
+
あ ← $xa {ー};
|
|
171
|
+
い ← $xi {ー};
|
|
172
|
+
う ← $xu {ー};
|
|
173
|
+
え ← $xe {ー};
|
|
174
|
+
お ← $xo {ー};
|
|
175
|
+
:: NFC (NFKC) ;
|
|
176
|
+
# note: a global filter is more efficient, but MUST include all source chars!!
|
|
177
|
+
:: ([[\u0000-\u007E 、。 ゙-゜ ァ-ー 。-゚ー[:Hiragana:] [:Katakana:] [:nonspacing mark:]]-[\u309B \u309C]]);
|
|
178
|
+
# eof
|
|
179
|
+
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
{
|
|
2
|
+
"_backwardAlias": "Latin-Hiragana",
|
|
3
|
+
"_visibility": "external",
|
|
4
|
+
"_backwardAliasBcp47": "und-Hira-t-und-latn",
|
|
5
|
+
"_alias": "Hiragana-Latin",
|
|
6
|
+
"_aliasBcp47": "und-Latn-t-und-hira",
|
|
7
|
+
"_source": "Hira",
|
|
8
|
+
"_direction": "both",
|
|
9
|
+
"_target": "Latn",
|
|
10
|
+
"_rulesFile": "Hiragana-Latin.txt"
|
|
11
|
+
}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
{
|
|
2
|
+
"_backwardAlias": "XSampa-IPA",
|
|
3
|
+
"_visibility": "external",
|
|
4
|
+
"_backwardAliasBcp47": "und-fonipa-t-und-fonxsamp",
|
|
5
|
+
"_alias": "IPA-XSampa",
|
|
6
|
+
"_aliasBcp47": "und-fonxsamp-t-und-fonipa",
|
|
7
|
+
"_source": "und_FONIPA",
|
|
8
|
+
"_direction": "both",
|
|
9
|
+
"_target": "und_FONXSAMP",
|
|
10
|
+
"_rulesFile": "IPA-XSampa.txt"
|
|
11
|
+
}
|