cldr-transforms 46.0.0-BETA2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +41 -0
- package/README.md +27 -0
- package/bower.json +13 -0
- package/package.json +29 -0
- package/transforms/Amharic-Latin-BGN.json +9 -0
- package/transforms/Amharic-Latin-BGN.txt +441 -0
- package/transforms/Any-Accents.json +9 -0
- package/transforms/Any-Accents.txt +270 -0
- package/transforms/Any-Publishing.json +9 -0
- package/transforms/Any-Publishing.txt +63 -0
- package/transforms/Arabic-Latin-BGN.json +9 -0
- package/transforms/Arabic-Latin-BGN.txt +205 -0
- package/transforms/Arabic-Latin.json +11 -0
- package/transforms/Arabic-Latin.txt +181 -0
- package/transforms/Armenian-Latin-BGN.json +9 -0
- package/transforms/Armenian-Latin-BGN.txt +165 -0
- package/transforms/Azerbaijani-Latin-BGN.json +9 -0
- package/transforms/Azerbaijani-Latin-BGN.txt +183 -0
- package/transforms/Belarusian-Latin-BGN.json +9 -0
- package/transforms/Belarusian-Latin-BGN.txt +194 -0
- package/transforms/Bengali-Arabic.json +9 -0
- package/transforms/Bengali-Arabic.txt +7 -0
- package/transforms/Bengali-Devanagari.json +9 -0
- package/transforms/Bengali-Devanagari.txt +7 -0
- package/transforms/Bengali-Gujarati.json +9 -0
- package/transforms/Bengali-Gujarati.txt +7 -0
- package/transforms/Bengali-Gurmukhi.json +9 -0
- package/transforms/Bengali-Gurmukhi.txt +7 -0
- package/transforms/Bengali-InterIndic.json +7 -0
- package/transforms/Bengali-InterIndic.txt +99 -0
- package/transforms/Bengali-Kannada.json +9 -0
- package/transforms/Bengali-Kannada.txt +7 -0
- package/transforms/Bengali-Latin.json +9 -0
- package/transforms/Bengali-Latin.txt +7 -0
- package/transforms/Bengali-Malayalam.json +9 -0
- package/transforms/Bengali-Malayalam.txt +7 -0
- package/transforms/Bengali-Oriya.json +9 -0
- package/transforms/Bengali-Oriya.txt +7 -0
- package/transforms/Bengali-Tamil.json +9 -0
- package/transforms/Bengali-Tamil.txt +7 -0
- package/transforms/Bengali-Telugu.json +9 -0
- package/transforms/Bengali-Telugu.txt +7 -0
- package/transforms/Bengali-ur.json +8 -0
- package/transforms/Bengali-ur.txt +7 -0
- package/transforms/Bulgarian-Latin-BGN.json +9 -0
- package/transforms/Bulgarian-Latin-BGN.txt +237 -0
- package/transforms/CanadianAboriginal-Latin.json +11 -0
- package/transforms/CanadianAboriginal-Latin.txt +184 -0
- package/transforms/Cyrillic-Latin.json +11 -0
- package/transforms/Cyrillic-Latin.txt +280 -0
- package/transforms/Devanagari-Arabic.json +9 -0
- package/transforms/Devanagari-Arabic.txt +7 -0
- package/transforms/Devanagari-Bengali.json +9 -0
- package/transforms/Devanagari-Bengali.txt +7 -0
- package/transforms/Devanagari-Gujarati.json +9 -0
- package/transforms/Devanagari-Gujarati.txt +7 -0
- package/transforms/Devanagari-Gurmukhi.json +9 -0
- package/transforms/Devanagari-Gurmukhi.txt +7 -0
- package/transforms/Devanagari-InterIndic.json +7 -0
- package/transforms/Devanagari-InterIndic.txt +113 -0
- package/transforms/Devanagari-Kannada.json +9 -0
- package/transforms/Devanagari-Kannada.txt +7 -0
- package/transforms/Devanagari-Latin.json +9 -0
- package/transforms/Devanagari-Latin.txt +7 -0
- package/transforms/Devanagari-Malayalam.json +9 -0
- package/transforms/Devanagari-Malayalam.txt +7 -0
- package/transforms/Devanagari-Oriya.json +9 -0
- package/transforms/Devanagari-Oriya.txt +7 -0
- package/transforms/Devanagari-Tamil.json +9 -0
- package/transforms/Devanagari-Tamil.txt +7 -0
- package/transforms/Devanagari-Telugu.json +9 -0
- package/transforms/Devanagari-Telugu.txt +7 -0
- package/transforms/Devanagari-ur.json +8 -0
- package/transforms/Devanagari-ur.txt +7 -0
- package/transforms/Fullwidth-Halfwidth.json +9 -0
- package/transforms/Fullwidth-Halfwidth.txt +261 -0
- package/transforms/Georgian-Latin-BGN.json +9 -0
- package/transforms/Georgian-Latin-BGN.txt +43 -0
- package/transforms/Georgian-Latin-BGN_1981.json +8 -0
- package/transforms/Georgian-Latin-BGN_1981.txt +54 -0
- package/transforms/Georgian-Latin.json +11 -0
- package/transforms/Georgian-Latin.txt +53 -0
- package/transforms/Greek-Latin-BGN.json +9 -0
- package/transforms/Greek-Latin-BGN.txt +419 -0
- package/transforms/Greek-Latin.json +11 -0
- package/transforms/Greek-Latin.txt +251 -0
- package/transforms/Greek_Latin_UNGEGN.json +11 -0
- package/transforms/Greek_Latin_UNGEGN.txt +179 -0
- package/transforms/Gujarati-Arabic.json +9 -0
- package/transforms/Gujarati-Arabic.txt +7 -0
- package/transforms/Gujarati-Bengali.json +9 -0
- package/transforms/Gujarati-Bengali.txt +7 -0
- package/transforms/Gujarati-Devanagari.json +9 -0
- package/transforms/Gujarati-Devanagari.txt +7 -0
- package/transforms/Gujarati-Gurmukhi.json +9 -0
- package/transforms/Gujarati-Gurmukhi.txt +7 -0
- package/transforms/Gujarati-InterIndic.json +7 -0
- package/transforms/Gujarati-InterIndic.txt +89 -0
- package/transforms/Gujarati-Kannada.json +9 -0
- package/transforms/Gujarati-Kannada.txt +7 -0
- package/transforms/Gujarati-Latin.json +9 -0
- package/transforms/Gujarati-Latin.txt +7 -0
- package/transforms/Gujarati-Malayalam.json +9 -0
- package/transforms/Gujarati-Malayalam.txt +7 -0
- package/transforms/Gujarati-Oriya.json +9 -0
- package/transforms/Gujarati-Oriya.txt +7 -0
- package/transforms/Gujarati-Tamil.json +9 -0
- package/transforms/Gujarati-Tamil.txt +7 -0
- package/transforms/Gujarati-Telugu.json +9 -0
- package/transforms/Gujarati-Telugu.txt +7 -0
- package/transforms/Gujarati-ur.json +8 -0
- package/transforms/Gujarati-ur.txt +7 -0
- package/transforms/Gurmukhi-Arabic.json +9 -0
- package/transforms/Gurmukhi-Arabic.txt +7 -0
- package/transforms/Gurmukhi-Bengali.json +9 -0
- package/transforms/Gurmukhi-Bengali.txt +7 -0
- package/transforms/Gurmukhi-Devanagari.json +9 -0
- package/transforms/Gurmukhi-Devanagari.txt +7 -0
- package/transforms/Gurmukhi-Gujarati.json +9 -0
- package/transforms/Gurmukhi-Gujarati.txt +7 -0
- package/transforms/Gurmukhi-InterIndic.json +7 -0
- package/transforms/Gurmukhi-InterIndic.txt +88 -0
- package/transforms/Gurmukhi-Kannada.json +9 -0
- package/transforms/Gurmukhi-Kannada.txt +7 -0
- package/transforms/Gurmukhi-Latin.json +9 -0
- package/transforms/Gurmukhi-Latin.txt +7 -0
- package/transforms/Gurmukhi-Malayalam.json +9 -0
- package/transforms/Gurmukhi-Malayalam.txt +7 -0
- package/transforms/Gurmukhi-Oriya.json +9 -0
- package/transforms/Gurmukhi-Oriya.txt +7 -0
- package/transforms/Gurmukhi-Tamil.json +9 -0
- package/transforms/Gurmukhi-Tamil.txt +7 -0
- package/transforms/Gurmukhi-Telugu.json +9 -0
- package/transforms/Gurmukhi-Telugu.txt +7 -0
- package/transforms/Gurmukhi-ur.json +8 -0
- package/transforms/Gurmukhi-ur.txt +7 -0
- package/transforms/Han-Latin-Names.json +8 -0
- package/transforms/Han-Latin-Names.txt +65 -0
- package/transforms/Han-Latin.json +9 -0
- package/transforms/Han-Latin.txt +1501 -0
- package/transforms/Han-Spacedhan.json +7 -0
- package/transforms/Han-Spacedhan.txt +35 -0
- package/transforms/Hangul-Latin.json +9 -0
- package/transforms/Hangul-Latin.txt +6 -0
- package/transforms/Hebrew-Latin-BGN.json +9 -0
- package/transforms/Hebrew-Latin-BGN.txt +113 -0
- package/transforms/Hebrew-Latin.json +11 -0
- package/transforms/Hebrew-Latin.txt +91 -0
- package/transforms/Hiragana-Katakana.json +11 -0
- package/transforms/Hiragana-Katakana.txt +179 -0
- package/transforms/Hiragana-Latin.json +11 -0
- package/transforms/Hiragana-Latin.txt +9 -0
- package/transforms/IPA-XSampa.json +11 -0
- package/transforms/IPA-XSampa.txt +228 -0
- package/transforms/InterIndic-Arabic.json +7 -0
- package/transforms/InterIndic-Arabic.txt +128 -0
- package/transforms/InterIndic-Bengali.json +7 -0
- package/transforms/InterIndic-Bengali.txt +135 -0
- package/transforms/InterIndic-Devanagari.json +7 -0
- package/transforms/InterIndic-Devanagari.txt +151 -0
- package/transforms/InterIndic-Gujarati.json +7 -0
- package/transforms/InterIndic-Gujarati.txt +136 -0
- package/transforms/InterIndic-Gurmukhi.json +7 -0
- package/transforms/InterIndic-Gurmukhi.txt +142 -0
- package/transforms/InterIndic-Kannada.json +7 -0
- package/transforms/InterIndic-Kannada.txt +137 -0
- package/transforms/InterIndic-Latin.json +7 -0
- package/transforms/InterIndic-Latin.txt +492 -0
- package/transforms/InterIndic-Malayalam.json +7 -0
- package/transforms/InterIndic-Malayalam.txt +137 -0
- package/transforms/InterIndic-Oriya.json +7 -0
- package/transforms/InterIndic-Oriya.txt +135 -0
- package/transforms/InterIndic-Tamil.json +7 -0
- package/transforms/InterIndic-Tamil.txt +136 -0
- package/transforms/InterIndic-Telugu.json +7 -0
- package/transforms/InterIndic-Telugu.txt +136 -0
- package/transforms/InterIndic-ur.json +7 -0
- package/transforms/InterIndic-ur.txt +119 -0
- package/transforms/Jamo-Latin.json +9 -0
- package/transforms/Jamo-Latin.txt +6 -0
- package/transforms/Kannada-Arabic.json +9 -0
- package/transforms/Kannada-Arabic.txt +7 -0
- package/transforms/Kannada-Bengali.json +9 -0
- package/transforms/Kannada-Bengali.txt +7 -0
- package/transforms/Kannada-Devanagari.json +9 -0
- package/transforms/Kannada-Devanagari.txt +7 -0
- package/transforms/Kannada-Gujarati.json +9 -0
- package/transforms/Kannada-Gujarati.txt +7 -0
- package/transforms/Kannada-Gurmukhi.json +9 -0
- package/transforms/Kannada-Gurmukhi.txt +7 -0
- package/transforms/Kannada-InterIndic.json +7 -0
- package/transforms/Kannada-InterIndic.txt +87 -0
- package/transforms/Kannada-Latin.json +9 -0
- package/transforms/Kannada-Latin.txt +7 -0
- package/transforms/Kannada-Malayalam.json +9 -0
- package/transforms/Kannada-Malayalam.txt +7 -0
- package/transforms/Kannada-Oriya.json +9 -0
- package/transforms/Kannada-Oriya.txt +7 -0
- package/transforms/Kannada-Tamil.json +9 -0
- package/transforms/Kannada-Tamil.txt +7 -0
- package/transforms/Kannada-Telugu.json +9 -0
- package/transforms/Kannada-Telugu.txt +7 -0
- package/transforms/Kannada-ur.json +8 -0
- package/transforms/Kannada-ur.txt +7 -0
- package/transforms/Katakana-Latin-BGN.json +9 -0
- package/transforms/Katakana-Latin-BGN.txt +335 -0
- package/transforms/Kazakh-Latin-BGN.json +9 -0
- package/transforms/Kazakh-Latin-BGN.txt +332 -0
- package/transforms/Kirghiz-Latin-BGN.json +9 -0
- package/transforms/Kirghiz-Latin-BGN.txt +211 -0
- package/transforms/Korean-Latin-BGN.json +9 -0
- package/transforms/Korean-Latin-BGN.txt +345 -0
- package/transforms/Latin-ASCII.json +9 -0
- package/transforms/Latin-ASCII.txt +909 -0
- package/transforms/Latin-Armenian.json +11 -0
- package/transforms/Latin-Armenian.txt +88 -0
- package/transforms/Latin-Bengali.json +9 -0
- package/transforms/Latin-Bengali.txt +8 -0
- package/transforms/Latin-Bopomofo.json +11 -0
- package/transforms/Latin-Bopomofo.txt +1445 -0
- package/transforms/Latin-ConjoiningJamo.json +7 -0
- package/transforms/Latin-ConjoiningJamo.txt +477 -0
- package/transforms/Latin-Devanagari.json +9 -0
- package/transforms/Latin-Devanagari.txt +8 -0
- package/transforms/Latin-Ethiopic.json +11 -0
- package/transforms/Latin-Ethiopic.txt +277 -0
- package/transforms/Latin-Gujarati.json +9 -0
- package/transforms/Latin-Gujarati.txt +8 -0
- package/transforms/Latin-Gurmukhi.json +9 -0
- package/transforms/Latin-Gurmukhi.txt +8 -0
- package/transforms/Latin-Hangul.json +9 -0
- package/transforms/Latin-Hangul.txt +7 -0
- package/transforms/Latin-InterIndic.json +7 -0
- package/transforms/Latin-InterIndic.txt +377 -0
- package/transforms/Latin-Jamo.json +9 -0
- package/transforms/Latin-Jamo.txt +7 -0
- package/transforms/Latin-Kannada.json +9 -0
- package/transforms/Latin-Kannada.txt +8 -0
- package/transforms/Latin-Katakana.json +11 -0
- package/transforms/Latin-Katakana.txt +382 -0
- package/transforms/Latin-Malayalam.json +9 -0
- package/transforms/Latin-Malayalam.txt +8 -0
- package/transforms/Latin-NumericPinyin.json +9 -0
- package/transforms/Latin-NumericPinyin.txt +29 -0
- package/transforms/Latin-Oriya.json +9 -0
- package/transforms/Latin-Oriya.txt +8 -0
- package/transforms/Latin-Tamil.json +9 -0
- package/transforms/Latin-Tamil.txt +8 -0
- package/transforms/Latin-Telugu.json +9 -0
- package/transforms/Latin-Telugu.txt +8 -0
- package/transforms/Latin-Thai.json +9 -0
- package/transforms/Latin-Thai.txt +7 -0
- package/transforms/Macedonian-Latin-BGN.json +9 -0
- package/transforms/Macedonian-Latin-BGN.txt +176 -0
- package/transforms/Malayalam-Arabic.json +9 -0
- package/transforms/Malayalam-Arabic.txt +7 -0
- package/transforms/Malayalam-Bengali.json +9 -0
- package/transforms/Malayalam-Bengali.txt +7 -0
- package/transforms/Malayalam-Devanagari.json +9 -0
- package/transforms/Malayalam-Devanagari.txt +7 -0
- package/transforms/Malayalam-Gujarati.json +9 -0
- package/transforms/Malayalam-Gujarati.txt +7 -0
- package/transforms/Malayalam-Gurmukhi.json +9 -0
- package/transforms/Malayalam-Gurmukhi.txt +7 -0
- package/transforms/Malayalam-InterIndic.json +7 -0
- package/transforms/Malayalam-InterIndic.txt +87 -0
- package/transforms/Malayalam-Kannada.json +9 -0
- package/transforms/Malayalam-Kannada.txt +7 -0
- package/transforms/Malayalam-Latin.json +9 -0
- package/transforms/Malayalam-Latin.txt +7 -0
- package/transforms/Malayalam-Oriya.json +9 -0
- package/transforms/Malayalam-Oriya.txt +7 -0
- package/transforms/Malayalam-Tamil.json +9 -0
- package/transforms/Malayalam-Tamil.txt +7 -0
- package/transforms/Malayalam-Telugu.json +9 -0
- package/transforms/Malayalam-Telugu.txt +7 -0
- package/transforms/Malayalam-ur.json +8 -0
- package/transforms/Malayalam-ur.txt +7 -0
- package/transforms/Maldivian-Latin-BGN.json +9 -0
- package/transforms/Maldivian-Latin-BGN.txt +171 -0
- package/transforms/Mongolian-Latin-BGN.json +9 -0
- package/transforms/Mongolian-Latin-BGN.txt +151 -0
- package/transforms/Myanmar-Latin.json +9 -0
- package/transforms/Myanmar-Latin.txt +367 -0
- package/transforms/Oriya-Arabic.json +9 -0
- package/transforms/Oriya-Arabic.txt +7 -0
- package/transforms/Oriya-Bengali.json +9 -0
- package/transforms/Oriya-Bengali.txt +7 -0
- package/transforms/Oriya-Devanagari.json +9 -0
- package/transforms/Oriya-Devanagari.txt +7 -0
- package/transforms/Oriya-Gujarati.json +9 -0
- package/transforms/Oriya-Gujarati.txt +7 -0
- package/transforms/Oriya-Gurmukhi.json +9 -0
- package/transforms/Oriya-Gurmukhi.txt +7 -0
- package/transforms/Oriya-InterIndic.json +7 -0
- package/transforms/Oriya-InterIndic.txt +91 -0
- package/transforms/Oriya-Kannada.json +9 -0
- package/transforms/Oriya-Kannada.txt +7 -0
- package/transforms/Oriya-Latin.json +9 -0
- package/transforms/Oriya-Latin.txt +7 -0
- package/transforms/Oriya-Malayalam.json +9 -0
- package/transforms/Oriya-Malayalam.txt +7 -0
- package/transforms/Oriya-Tamil.json +9 -0
- package/transforms/Oriya-Tamil.txt +7 -0
- package/transforms/Oriya-Telugu.json +9 -0
- package/transforms/Oriya-Telugu.txt +7 -0
- package/transforms/Oriya-ur.json +8 -0
- package/transforms/Oriya-ur.txt +7 -0
- package/transforms/Pashto-Latin-BGN.json +9 -0
- package/transforms/Pashto-Latin-BGN.txt +231 -0
- package/transforms/Persian-Latin-BGN.json +9 -0
- package/transforms/Persian-Latin-BGN.txt +203 -0
- package/transforms/Pinyin-NumericPinyin.json +7 -0
- package/transforms/Pinyin-NumericPinyin.txt +8 -0
- package/transforms/Russian-Latin-BGN.json +9 -0
- package/transforms/Russian-Latin-BGN.txt +235 -0
- package/transforms/Serbian-Latin-BGN.json +9 -0
- package/transforms/Serbian-Latin-BGN.txt +119 -0
- package/transforms/Simplified-Traditional.json +11 -0
- package/transforms/Simplified-Traditional.txt +4393 -0
- package/transforms/Syriac-Latin.json +11 -0
- package/transforms/Syriac-Latin.txt +52 -0
- package/transforms/Tamil-Arabic.json +9 -0
- package/transforms/Tamil-Arabic.txt +7 -0
- package/transforms/Tamil-Bengali.json +9 -0
- package/transforms/Tamil-Bengali.txt +7 -0
- package/transforms/Tamil-Devanagari.json +9 -0
- package/transforms/Tamil-Devanagari.txt +7 -0
- package/transforms/Tamil-Gujarati.json +9 -0
- package/transforms/Tamil-Gujarati.txt +7 -0
- package/transforms/Tamil-Gurmukhi.json +9 -0
- package/transforms/Tamil-Gurmukhi.txt +7 -0
- package/transforms/Tamil-InterIndic.json +7 -0
- package/transforms/Tamil-InterIndic.txt +70 -0
- package/transforms/Tamil-Kannada.json +9 -0
- package/transforms/Tamil-Kannada.txt +7 -0
- package/transforms/Tamil-Latin.json +9 -0
- package/transforms/Tamil-Latin.txt +7 -0
- package/transforms/Tamil-Malayalam.json +9 -0
- package/transforms/Tamil-Malayalam.txt +7 -0
- package/transforms/Tamil-Oriya.json +9 -0
- package/transforms/Tamil-Oriya.txt +7 -0
- package/transforms/Tamil-Telugu.json +9 -0
- package/transforms/Tamil-Telugu.txt +7 -0
- package/transforms/Tamil-ur.json +8 -0
- package/transforms/Tamil-ur.txt +7 -0
- package/transforms/Telugu-Arabic.json +9 -0
- package/transforms/Telugu-Arabic.txt +7 -0
- package/transforms/Telugu-Bengali.json +9 -0
- package/transforms/Telugu-Bengali.txt +7 -0
- package/transforms/Telugu-Devanagari.json +9 -0
- package/transforms/Telugu-Devanagari.txt +7 -0
- package/transforms/Telugu-Gujarati.json +9 -0
- package/transforms/Telugu-Gujarati.txt +7 -0
- package/transforms/Telugu-Gurmukhi.json +9 -0
- package/transforms/Telugu-Gurmukhi.txt +7 -0
- package/transforms/Telugu-InterIndic.json +7 -0
- package/transforms/Telugu-InterIndic.txt +87 -0
- package/transforms/Telugu-Kannada.json +9 -0
- package/transforms/Telugu-Kannada.txt +7 -0
- package/transforms/Telugu-Latin.json +9 -0
- package/transforms/Telugu-Latin.txt +7 -0
- package/transforms/Telugu-Malayalam.json +9 -0
- package/transforms/Telugu-Malayalam.txt +7 -0
- package/transforms/Telugu-Oriya.json +9 -0
- package/transforms/Telugu-Oriya.txt +7 -0
- package/transforms/Telugu-Tamil.json +9 -0
- package/transforms/Telugu-Tamil.txt +7 -0
- package/transforms/Telugu-ur.json +8 -0
- package/transforms/Telugu-ur.txt +7 -0
- package/transforms/Thaana-Latin.json +11 -0
- package/transforms/Thaana-Latin.txt +433 -0
- package/transforms/Thai-Latin.json +9 -0
- package/transforms/Thai-Latin.txt +9 -0
- package/transforms/Thai-ThaiLogical.json +7 -0
- package/transforms/Thai-ThaiLogical.txt +16 -0
- package/transforms/Thai-ThaiSemi.json +7 -0
- package/transforms/Thai-ThaiSemi.txt +6 -0
- package/transforms/ThaiLogical-Latin.json +7 -0
- package/transforms/ThaiLogical-Latin.txt +147 -0
- package/transforms/Turkmen-Latin-BGN.json +9 -0
- package/transforms/Turkmen-Latin-BGN.txt +302 -0
- package/transforms/Ukrainian-Latin-BGN.json +9 -0
- package/transforms/Ukrainian-Latin-BGN.txt +283 -0
- package/transforms/Uzbek-Latin-BGN.json +9 -0
- package/transforms/Uzbek-Latin-BGN.txt +261 -0
- package/transforms/am-Ethi-t-am-brai.json +11 -0
- package/transforms/am-Ethi-t-am-brai.txt +652 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.json +9 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.txt +6925 -0
- package/transforms/am-Ethi-t-d0-morse.json +9 -0
- package/transforms/am-Ethi-t-d0-morse.txt +657 -0
- package/transforms/am-am_FONIPA.json +9 -0
- package/transforms/am-am_FONIPA.txt +694 -0
- package/transforms/am-ar.json +8 -0
- package/transforms/am-ar.txt +5 -0
- package/transforms/am-chr.json +8 -0
- package/transforms/am-chr.txt +4 -0
- package/transforms/am-fa.json +8 -0
- package/transforms/am-fa.txt +4 -0
- package/transforms/az-Lower.json +8 -0
- package/transforms/az-Lower.txt +13 -0
- package/transforms/az-Title.json +8 -0
- package/transforms/az-Title.txt +11 -0
- package/transforms/az-Upper.json +8 -0
- package/transforms/az-Upper.txt +5 -0
- package/transforms/blt-fonipa-t-blt.json +8 -0
- package/transforms/blt-fonipa-t-blt.txt +132 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.txt +537 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.txt +773 -0
- package/transforms/ch-am.json +8 -0
- package/transforms/ch-am.txt +4 -0
- package/transforms/ch-ar.json +8 -0
- package/transforms/ch-ar.txt +4 -0
- package/transforms/ch-ch_FONIPA.json +8 -0
- package/transforms/ch-ch_FONIPA.txt +79 -0
- package/transforms/ch-chr.json +8 -0
- package/transforms/ch-chr.txt +4 -0
- package/transforms/ch-fa.json +8 -0
- package/transforms/ch-fa.txt +4 -0
- package/transforms/chr-chr_FONIPA.json +8 -0
- package/transforms/chr-chr_FONIPA.txt +111 -0
- package/transforms/cs-am.json +8 -0
- package/transforms/cs-am.txt +4 -0
- package/transforms/cs-ar.json +8 -0
- package/transforms/cs-ar.txt +4 -0
- package/transforms/cs-chr.json +8 -0
- package/transforms/cs-chr.txt +4 -0
- package/transforms/cs-cs_FONIPA.json +8 -0
- package/transforms/cs-cs_FONIPA.txt +74 -0
- package/transforms/cs-fa.json +8 -0
- package/transforms/cs-fa.txt +4 -0
- package/transforms/cs-ja.json +8 -0
- package/transforms/cs-ja.txt +4 -0
- package/transforms/cs-ko.json +8 -0
- package/transforms/cs-ko.txt +4 -0
- package/transforms/cs_FONIPA-ja.json +8 -0
- package/transforms/cs_FONIPA-ja.txt +228 -0
- package/transforms/cs_FONIPA-ko.json +8 -0
- package/transforms/cs_FONIPA-ko.txt +88 -0
- package/transforms/cy-fonipa-t-cy.json +8 -0
- package/transforms/cy-fonipa-t-cy.txt +189 -0
- package/transforms/de-ASCII.json +8 -0
- package/transforms/de-ASCII.txt +15 -0
- package/transforms/dsb-dsb_FONIPA.json +8 -0
- package/transforms/dsb-dsb_FONIPA.txt +67 -0
- package/transforms/el-Lower.json +8 -0
- package/transforms/el-Lower.txt +12 -0
- package/transforms/el-Title.json +8 -0
- package/transforms/el-Title.txt +12 -0
- package/transforms/el-Upper.json +8 -0
- package/transforms/el-Upper.txt +11 -0
- package/transforms/eo-am.json +8 -0
- package/transforms/eo-am.txt +4 -0
- package/transforms/eo-ar.json +8 -0
- package/transforms/eo-ar.txt +4 -0
- package/transforms/eo-chr.json +8 -0
- package/transforms/eo-chr.txt +4 -0
- package/transforms/eo-eo_FONIPA.json +8 -0
- package/transforms/eo-eo_FONIPA.txt +47 -0
- package/transforms/eo-fa.json +8 -0
- package/transforms/eo-fa.txt +4 -0
- package/transforms/es-am.json +8 -0
- package/transforms/es-am.txt +4 -0
- package/transforms/es-ar.json +8 -0
- package/transforms/es-ar.txt +13 -0
- package/transforms/es-chr.json +8 -0
- package/transforms/es-chr.txt +4 -0
- package/transforms/es-es_FONIPA.json +8 -0
- package/transforms/es-es_FONIPA.txt +139 -0
- package/transforms/es-fa.json +8 -0
- package/transforms/es-fa.txt +13 -0
- package/transforms/es-ja.json +8 -0
- package/transforms/es-ja.txt +4 -0
- package/transforms/es-zh.json +8 -0
- package/transforms/es-zh.txt +4 -0
- package/transforms/es_419-am.json +8 -0
- package/transforms/es_419-am.txt +5 -0
- package/transforms/es_419-ar.json +8 -0
- package/transforms/es_419-ar.txt +14 -0
- package/transforms/es_419-chr.json +8 -0
- package/transforms/es_419-chr.txt +5 -0
- package/transforms/es_419-fa.json +8 -0
- package/transforms/es_419-fa.txt +14 -0
- package/transforms/es_419-ja.json +8 -0
- package/transforms/es_419-ja.txt +5 -0
- package/transforms/es_419-zh.json +8 -0
- package/transforms/es_419-zh.txt +5 -0
- package/transforms/es_FONIPA-am.json +8 -0
- package/transforms/es_FONIPA-am.txt +230 -0
- package/transforms/es_FONIPA-es_419_FONIPA.json +8 -0
- package/transforms/es_FONIPA-es_419_FONIPA.txt +6 -0
- package/transforms/es_FONIPA-ja.json +8 -0
- package/transforms/es_FONIPA-ja.txt +155 -0
- package/transforms/es_FONIPA-zh.json +8 -0
- package/transforms/es_FONIPA-zh.txt +522 -0
- package/transforms/fa-fa_FONIPA.json +8 -0
- package/transforms/fa-fa_FONIPA.txt +107 -0
- package/transforms/gz-Ethi-t-und-sarb.json +11 -0
- package/transforms/gz-Ethi-t-und-sarb.txt +180 -0
- package/transforms/ha-ha_NE.json +8 -0
- package/transforms/ha-ha_NE.txt +6 -0
- package/transforms/hy-am.json +8 -0
- package/transforms/hy-am.txt +4 -0
- package/transforms/hy-ar.json +8 -0
- package/transforms/hy-ar.txt +4 -0
- package/transforms/hy-chr.json +8 -0
- package/transforms/hy-chr.txt +4 -0
- package/transforms/hy-fa.json +8 -0
- package/transforms/hy-fa.txt +4 -0
- package/transforms/hy-hy_FONIPA.json +8 -0
- package/transforms/hy-hy_FONIPA.txt +52 -0
- package/transforms/hy_AREVMDA-am.json +8 -0
- package/transforms/hy_AREVMDA-am.txt +4 -0
- package/transforms/hy_AREVMDA-ar.json +8 -0
- package/transforms/hy_AREVMDA-ar.txt +4 -0
- package/transforms/hy_AREVMDA-chr.json +8 -0
- package/transforms/hy_AREVMDA-chr.txt +4 -0
- package/transforms/hy_AREVMDA-fa.json +8 -0
- package/transforms/hy_AREVMDA-fa.txt +4 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.json +8 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.txt +80 -0
- package/transforms/ia-am.json +8 -0
- package/transforms/ia-am.txt +4 -0
- package/transforms/ia-ar.json +8 -0
- package/transforms/ia-ar.txt +4 -0
- package/transforms/ia-chr.json +8 -0
- package/transforms/ia-chr.txt +4 -0
- package/transforms/ia-fa.json +8 -0
- package/transforms/ia-fa.txt +4 -0
- package/transforms/ia-ia_FONIPA.json +8 -0
- package/transforms/ia-ia_FONIPA.txt +71 -0
- package/transforms/it-am.json +8 -0
- package/transforms/it-am.txt +257 -0
- package/transforms/it-ja.json +8 -0
- package/transforms/it-ja.txt +259 -0
- package/transforms/ja_Latn-ko.json +8 -0
- package/transforms/ja_Latn-ko.txt +141 -0
- package/transforms/ja_Latn-ru.json +8 -0
- package/transforms/ja_Latn-ru.txt +123 -0
- package/transforms/kk-am.json +8 -0
- package/transforms/kk-am.txt +4 -0
- package/transforms/kk-ar.json +8 -0
- package/transforms/kk-ar.txt +4 -0
- package/transforms/kk-chr.json +8 -0
- package/transforms/kk-chr.txt +4 -0
- package/transforms/kk-fa.json +8 -0
- package/transforms/kk-fa.txt +4 -0
- package/transforms/kk-kk_FONIPA.json +8 -0
- package/transforms/kk-kk_FONIPA.txt +59 -0
- package/transforms/ky-am.json +8 -0
- package/transforms/ky-am.txt +4 -0
- package/transforms/ky-ar.json +8 -0
- package/transforms/ky-ar.txt +4 -0
- package/transforms/ky-chr.json +8 -0
- package/transforms/ky-chr.txt +4 -0
- package/transforms/ky-fa.json +8 -0
- package/transforms/ky-fa.txt +4 -0
- package/transforms/ky-ky_FONIPA.json +8 -0
- package/transforms/ky-ky_FONIPA.txt +71 -0
- package/transforms/la-la_FONIPA.json +8 -0
- package/transforms/la-la_FONIPA.txt +79 -0
- package/transforms/lt-Lower.json +8 -0
- package/transforms/lt-Lower.txt +20 -0
- package/transforms/lt-Title.json +8 -0
- package/transforms/lt-Title.txt +15 -0
- package/transforms/lt-Upper.json +8 -0
- package/transforms/lt-Upper.txt +8 -0
- package/transforms/mn-mn_Latn-MNS.json +8 -0
- package/transforms/mn-mn_Latn-MNS.txt +86 -0
- package/transforms/my-am.json +8 -0
- package/transforms/my-am.txt +4 -0
- package/transforms/my-ar.json +8 -0
- package/transforms/my-ar.txt +4 -0
- package/transforms/my-chr.json +8 -0
- package/transforms/my-chr.txt +4 -0
- package/transforms/my-fa.json +8 -0
- package/transforms/my-fa.txt +4 -0
- package/transforms/my-my_FONIPA.json +8 -0
- package/transforms/my-my_FONIPA.txt +325 -0
- package/transforms/my-t-my-d0-zawgyi.json +8 -0
- package/transforms/my-t-my-d0-zawgyi.txt +222 -0
- package/transforms/my-t-my-s0-zawgyi.json +8 -0
- package/transforms/my-t-my-s0-zawgyi.txt +231 -0
- package/transforms/nl-Title.json +8 -0
- package/transforms/nl-Title.txt +7 -0
- package/transforms/nv-nv_FONIPA.json +8 -0
- package/transforms/nv-nv_FONIPA.txt +74 -0
- package/transforms/pl-am.json +8 -0
- package/transforms/pl-am.txt +4 -0
- package/transforms/pl-ar.json +8 -0
- package/transforms/pl-ar.txt +4 -0
- package/transforms/pl-chr.json +8 -0
- package/transforms/pl-chr.txt +4 -0
- package/transforms/pl-fa.json +8 -0
- package/transforms/pl-fa.txt +4 -0
- package/transforms/pl-ja.json +8 -0
- package/transforms/pl-ja.txt +4 -0
- package/transforms/pl-pl_FONIPA.json +8 -0
- package/transforms/pl-pl_FONIPA.txt +113 -0
- package/transforms/pl_FONIPA-ja.json +8 -0
- package/transforms/pl_FONIPA-ja.txt +301 -0
- package/transforms/rm_SURSILV-am.json +8 -0
- package/transforms/rm_SURSILV-am.txt +4 -0
- package/transforms/rm_SURSILV-ar.json +8 -0
- package/transforms/rm_SURSILV-ar.txt +4 -0
- package/transforms/rm_SURSILV-chr.json +8 -0
- package/transforms/rm_SURSILV-chr.txt +4 -0
- package/transforms/rm_SURSILV-fa.json +8 -0
- package/transforms/rm_SURSILV-fa.txt +4 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.json +8 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.txt +96 -0
- package/transforms/ro-am.json +8 -0
- package/transforms/ro-am.txt +4 -0
- package/transforms/ro-ar.json +8 -0
- package/transforms/ro-ar.txt +4 -0
- package/transforms/ro-chr.json +8 -0
- package/transforms/ro-chr.txt +4 -0
- package/transforms/ro-fa.json +8 -0
- package/transforms/ro-fa.txt +4 -0
- package/transforms/ro-ja.json +8 -0
- package/transforms/ro-ja.txt +4 -0
- package/transforms/ro-ro_FONIPA.json +8 -0
- package/transforms/ro-ro_FONIPA.txt +121 -0
- package/transforms/ro_FONIPA-ja.json +8 -0
- package/transforms/ro_FONIPA-ja.txt +211 -0
- package/transforms/ru-ja.json +8 -0
- package/transforms/ru-ja.txt +444 -0
- package/transforms/ru-zh.json +8 -0
- package/transforms/ru-zh.txt +996 -0
- package/transforms/ru_Latn-ru-BGN.json +9 -0
- package/transforms/ru_Latn-ru-BGN.txt +97 -0
- package/transforms/sat-am.json +8 -0
- package/transforms/sat-am.txt +6 -0
- package/transforms/sat-ar.json +8 -0
- package/transforms/sat-ar.txt +6 -0
- package/transforms/sat-chr.json +8 -0
- package/transforms/sat-chr.txt +6 -0
- package/transforms/sat-fa.json +8 -0
- package/transforms/sat-fa.txt +6 -0
- package/transforms/sat_Olck-sat_FONIPA.json +8 -0
- package/transforms/sat_Olck-sat_FONIPA.txt +174 -0
- package/transforms/sgw-Ethi-t-und-ethi.json +11 -0
- package/transforms/sgw-Ethi-t-und-ethi.txt +138 -0
- package/transforms/si-am.json +8 -0
- package/transforms/si-am.txt +4 -0
- package/transforms/si-ar.json +8 -0
- package/transforms/si-ar.txt +4 -0
- package/transforms/si-chr.json +8 -0
- package/transforms/si-chr.txt +4 -0
- package/transforms/si-fa.json +8 -0
- package/transforms/si-fa.txt +4 -0
- package/transforms/si-si_FONIPA.json +8 -0
- package/transforms/si-si_FONIPA.txt +157 -0
- package/transforms/si-si_Latn.json +8 -0
- package/transforms/si-si_Latn.txt +94 -0
- package/transforms/sk-am.json +8 -0
- package/transforms/sk-am.txt +4 -0
- package/transforms/sk-ar.json +8 -0
- package/transforms/sk-ar.txt +4 -0
- package/transforms/sk-chr.json +8 -0
- package/transforms/sk-chr.txt +4 -0
- package/transforms/sk-fa.json +8 -0
- package/transforms/sk-fa.txt +4 -0
- package/transforms/sk-ja.json +8 -0
- package/transforms/sk-ja.txt +4 -0
- package/transforms/sk-sk_FONIPA.json +8 -0
- package/transforms/sk-sk_FONIPA.txt +101 -0
- package/transforms/sk_FONIPA-ja.json +8 -0
- package/transforms/sk_FONIPA-ja.txt +252 -0
- package/transforms/ta-ta_FONIPA.json +8 -0
- package/transforms/ta-ta_FONIPA.txt +73 -0
- package/transforms/tlh-am.json +8 -0
- package/transforms/tlh-am.txt +4 -0
- package/transforms/tlh-ar.json +8 -0
- package/transforms/tlh-ar.txt +4 -0
- package/transforms/tlh-chr.json +8 -0
- package/transforms/tlh-chr.txt +4 -0
- package/transforms/tlh-fa.json +8 -0
- package/transforms/tlh-fa.txt +4 -0
- package/transforms/tlh-tlh_FONIPA.json +8 -0
- package/transforms/tlh-tlh_FONIPA.txt +46 -0
- package/transforms/tr-Lower.json +8 -0
- package/transforms/tr-Lower.txt +13 -0
- package/transforms/tr-Title.json +8 -0
- package/transforms/tr-Title.txt +11 -0
- package/transforms/tr-Upper.json +8 -0
- package/transforms/tr-Upper.txt +8 -0
- package/transforms/ug-ug_FONIPA.json +8 -0
- package/transforms/ug-ug_FONIPA.txt +69 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.json +11 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.txt +747 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.txt +633 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.txt +757 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.txt +585 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.txt +640 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.txt +619 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.txt +627 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.txt +695 -0
- package/transforms/und-Ethi-t-und-latn.json +11 -0
- package/transforms/und-Ethi-t-und-latn.txt +16 -0
- package/transforms/und_FONIPA-ar.json +8 -0
- package/transforms/und_FONIPA-ar.txt +114 -0
- package/transforms/und_FONIPA-chr.json +8 -0
- package/transforms/und_FONIPA-chr.txt +172 -0
- package/transforms/und_FONIPA-fa.json +8 -0
- package/transforms/und_FONIPA-fa.txt +109 -0
- package/transforms/uz_Cyrl-uz_Latn.json +9 -0
- package/transforms/uz_Cyrl-uz_Latn.txt +103 -0
- package/transforms/vec-vec_FONIPA.json +8 -0
- package/transforms/vec-vec_FONIPA.txt +85 -0
- package/transforms/xh-am.json +8 -0
- package/transforms/xh-am.txt +4 -0
- package/transforms/xh-ar.json +8 -0
- package/transforms/xh-ar.txt +4 -0
- package/transforms/xh-chr.json +8 -0
- package/transforms/xh-chr.txt +4 -0
- package/transforms/xh-fa.json +8 -0
- package/transforms/xh-fa.txt +4 -0
- package/transforms/xh-xh_FONIPA.json +8 -0
- package/transforms/xh-xh_FONIPA.txt +85 -0
- package/transforms/yo-yo_BJ.json +8 -0
- package/transforms/yo-yo_BJ.txt +36 -0
- package/transforms/zh_Latn_PINYIN-ru.json +8 -0
- package/transforms/zh_Latn_PINYIN-ru.txt +148 -0
- package/transforms/zu-am.json +8 -0
- package/transforms/zu-am.txt +4 -0
- package/transforms/zu-ar.json +8 -0
- package/transforms/zu-ar.txt +4 -0
- package/transforms/zu-chr.json +8 -0
- package/transforms/zu-chr.txt +4 -0
- package/transforms/zu-fa.json +8 -0
- package/transforms/zu-fa.txt +4 -0
- package/transforms/zu-zu_FONIPA.json +8 -0
- package/transforms/zu-zu_FONIPA.txt +72 -0
- package/transforms.json +385 -0
|
@@ -0,0 +1,141 @@
|
|
|
1
|
+
|
|
2
|
+
# Japanese (Rōmaji) to Korean (Hangul) transliteration table for ICU.
|
|
3
|
+
# Can be run in sequence after e.g. Katakana-Latin.
|
|
4
|
+
#
|
|
5
|
+
# Based on 문교부 고시 제85-11호 (1986. 1. 7.) 외래어 표기법
|
|
6
|
+
# For background info, see http://ko.wikisource.org/wiki/문교부_고시_제85-11호
|
|
7
|
+
# and http://ko.wikipedia.org/wiki/외래어_표기법 (外來語表記法)
|
|
8
|
+
::NFD(NFC);
|
|
9
|
+
::[:Latin:] Lower();
|
|
10
|
+
$consonant = [ᄀᄁᄂᄃᄄᄅᄆᄇᄈᄉᄊᄋᄌᄍᄎᄏᄐᄑᄒ];
|
|
11
|
+
$lengthMarker = [̂̄];
|
|
12
|
+
#
|
|
13
|
+
#
|
|
14
|
+
# Drop hyphens and apostrophes.
|
|
15
|
+
[\-\'] → ;
|
|
16
|
+
#
|
|
17
|
+
#
|
|
18
|
+
# Turn long /e:/ into diphthong /ei/.
|
|
19
|
+
e $lengthMarker → | e i ;
|
|
20
|
+
#
|
|
21
|
+
#
|
|
22
|
+
# Ignore vowel length everywhere else.
|
|
23
|
+
$lengthMarker → ;
|
|
24
|
+
#
|
|
25
|
+
#
|
|
26
|
+
# Vowels.
|
|
27
|
+
#
|
|
28
|
+
[^$consonant] { ( [aiueoyw] ) → ᄋ | $1 ; # Supply a required null initial.
|
|
29
|
+
a → ᅡ ;
|
|
30
|
+
i\~e → | ie ; # イェ
|
|
31
|
+
i → ᅵ ;
|
|
32
|
+
u\~a → | wa ; # クァ, グァ
|
|
33
|
+
u\~i → ᅱ ; # ウィ, クィ, etc.
|
|
34
|
+
u\~e → ᅰ ; # ウェ
|
|
35
|
+
u\~o → ᅯ ; # ウォ
|
|
36
|
+
u → ᅮ ;
|
|
37
|
+
e → ᅦ ;
|
|
38
|
+
o → ᅩ ;
|
|
39
|
+
#
|
|
40
|
+
#
|
|
41
|
+
# Geminates.
|
|
42
|
+
#
|
|
43
|
+
kk → ᆺ | k ;
|
|
44
|
+
ss → ᆺ | s ;
|
|
45
|
+
tt → ᆺ | t ;
|
|
46
|
+
tc → ᆺ | c ;
|
|
47
|
+
cc → ᆺ | c ;
|
|
48
|
+
hh → ᆺ | h ;
|
|
49
|
+
ff → ᆺ | f ;
|
|
50
|
+
rr → ᆺ | r ;
|
|
51
|
+
gg → ᆺ | g ;
|
|
52
|
+
zz → ᆺ | z ;
|
|
53
|
+
jj → ᆺ | j ;
|
|
54
|
+
dd → ᆺ | d ;
|
|
55
|
+
bb → ᆺ | b ;
|
|
56
|
+
vv → ᆺ | v ;
|
|
57
|
+
pp → ᆺ | p ;
|
|
58
|
+
#
|
|
59
|
+
#
|
|
60
|
+
# Consonants.
|
|
61
|
+
#
|
|
62
|
+
' ' { k → | g ; # Beginning of a word (after space).
|
|
63
|
+
^k → | g ; # Beginning of the string.
|
|
64
|
+
k → ᄏ ;
|
|
65
|
+
#
|
|
66
|
+
#
|
|
67
|
+
sh → | sy ;
|
|
68
|
+
su → 스 ;
|
|
69
|
+
s → ᄉ ;
|
|
70
|
+
#
|
|
71
|
+
#
|
|
72
|
+
te\~ → | t ; # テュ
|
|
73
|
+
to\~ → | t ; # トゥ
|
|
74
|
+
tsu\~ → | ch ; # ツァ, ツィ, etc.
|
|
75
|
+
tsu → 쓰 ;
|
|
76
|
+
ts → | ch ;
|
|
77
|
+
' ' { t → | d ;
|
|
78
|
+
^t → | d ;
|
|
79
|
+
t → ᄐ ;
|
|
80
|
+
' ' { ch → | j ;
|
|
81
|
+
^ch → | j ;
|
|
82
|
+
ch → ᄎ ;
|
|
83
|
+
#
|
|
84
|
+
#
|
|
85
|
+
n } [\ \'bcdfghjkmnprstwz] → ᆫ ;
|
|
86
|
+
n$ → ᆫ ;
|
|
87
|
+
n → ᄂ ;
|
|
88
|
+
#
|
|
89
|
+
#
|
|
90
|
+
h → ᄒ ;
|
|
91
|
+
fu\~ → | p ; # フュ
|
|
92
|
+
fu → | hu ;
|
|
93
|
+
f → | p ;
|
|
94
|
+
#
|
|
95
|
+
#
|
|
96
|
+
m } [bmp] → ᆫ ;
|
|
97
|
+
m → ᄆ ;
|
|
98
|
+
#
|
|
99
|
+
#
|
|
100
|
+
ya → ᅣ ;
|
|
101
|
+
yi → ᅵ ; # Added for convenience, after shi.
|
|
102
|
+
yu → ᅲ ;
|
|
103
|
+
ye → ᅨ ;
|
|
104
|
+
yo → ᅭ ;
|
|
105
|
+
#
|
|
106
|
+
#
|
|
107
|
+
r → ᄅ ;
|
|
108
|
+
#
|
|
109
|
+
#
|
|
110
|
+
wa → ᅪ ;
|
|
111
|
+
w → ;
|
|
112
|
+
#
|
|
113
|
+
#
|
|
114
|
+
g → ᄀ ;
|
|
115
|
+
#
|
|
116
|
+
#
|
|
117
|
+
zu → 즈 ;
|
|
118
|
+
z → | j ;
|
|
119
|
+
j → ᄌ ;
|
|
120
|
+
#
|
|
121
|
+
#
|
|
122
|
+
de\~ → | d ; # デュ
|
|
123
|
+
dji\~ → | j ; # ヂァ, ヂゥ, etc.
|
|
124
|
+
dji → | ji ; # ヂ
|
|
125
|
+
do\~ → | d ; # ドゥ
|
|
126
|
+
dzu\~ → | j ; # ヅァ, ヅィ, etc.
|
|
127
|
+
dzu → | zu ; # ヅ
|
|
128
|
+
dz → | j ;
|
|
129
|
+
d → ᄃ ;
|
|
130
|
+
#
|
|
131
|
+
#
|
|
132
|
+
b → ᄇ ;
|
|
133
|
+
vu\~ → | b ; # ヴァ, etc.
|
|
134
|
+
v → | b ;
|
|
135
|
+
#
|
|
136
|
+
#
|
|
137
|
+
p → ᄑ ;
|
|
138
|
+
#
|
|
139
|
+
#
|
|
140
|
+
::NFC(NFD);
|
|
141
|
+
|
|
@@ -0,0 +1,123 @@
|
|
|
1
|
+
|
|
2
|
+
# Japanese (Rōmaji) to Russian (Cyrillic) Polivanov transliteration for ICU.
|
|
3
|
+
# Can be run in sequence after e.g. Katakana-Latin.
|
|
4
|
+
#
|
|
5
|
+
# These rules cannot be used to target Bulgarian, Serbian, Tajik, or Ukrainian.
|
|
6
|
+
#
|
|
7
|
+
# TODO: Cyrillization needs to respect morpheme/Kanji boundaries.
|
|
8
|
+
# 中井 becomes Накаи, but 北海道 becomes Хоккайдо. We need boundary
|
|
9
|
+
# markup in the input in order to do that properly.
|
|
10
|
+
#
|
|
11
|
+
::NFD(NFC);
|
|
12
|
+
::[:Latin:] Lower();
|
|
13
|
+
#
|
|
14
|
+
#
|
|
15
|
+
$lengthMarker = [̂̄];
|
|
16
|
+
#
|
|
17
|
+
#
|
|
18
|
+
# Delete apostrophes. Apostrophes after "n" are consumed below.
|
|
19
|
+
\' → ;
|
|
20
|
+
#
|
|
21
|
+
#
|
|
22
|
+
# Turn long /e:/ into diphthong /ei/.
|
|
23
|
+
# Note that /ei/ across a morpheme boundary (e.g. 武井 Takei) becomes эи.
|
|
24
|
+
e $lengthMarker → эй ;
|
|
25
|
+
#
|
|
26
|
+
#
|
|
27
|
+
# Turn long /i:/ into two vowels /ii/.
|
|
28
|
+
i $lengthMarker → | i i ;
|
|
29
|
+
#
|
|
30
|
+
#
|
|
31
|
+
# Ignore vowel length everywhere else.
|
|
32
|
+
$lengthMarker → ;
|
|
33
|
+
#
|
|
34
|
+
#
|
|
35
|
+
# Vowels.
|
|
36
|
+
#
|
|
37
|
+
# TODO(mjansche): Enable diphthongs once we have Kanji boundaries.
|
|
38
|
+
## ai → ай ;
|
|
39
|
+
a → а ;
|
|
40
|
+
i\~e → | ye ;
|
|
41
|
+
i → и ;
|
|
42
|
+
u\~ → в ; # ウィ etc.
|
|
43
|
+
#
|
|
44
|
+
## ui → уй ;
|
|
45
|
+
u → у ;
|
|
46
|
+
e → э ;
|
|
47
|
+
o → о ;
|
|
48
|
+
#
|
|
49
|
+
#
|
|
50
|
+
# Consonants.
|
|
51
|
+
#
|
|
52
|
+
k → к ;
|
|
53
|
+
#
|
|
54
|
+
#
|
|
55
|
+
sh → | sy ;
|
|
56
|
+
s → с ;
|
|
57
|
+
#
|
|
58
|
+
#
|
|
59
|
+
ch → | ty ;
|
|
60
|
+
c } ch → t ;
|
|
61
|
+
te\~ → | t ; # テュ
|
|
62
|
+
to\~ → | t ; # トゥ
|
|
63
|
+
tsu\~ → | ts ; # ツァ, ツィ, etc.
|
|
64
|
+
ts → ц ;
|
|
65
|
+
t → т ;
|
|
66
|
+
#
|
|
67
|
+
#
|
|
68
|
+
\~tsu → | tsu ;
|
|
69
|
+
#
|
|
70
|
+
#
|
|
71
|
+
n } [bpm] → м ; # 群馬 → Гумма
|
|
72
|
+
n\' → нъ ;
|
|
73
|
+
n → н ;
|
|
74
|
+
#
|
|
75
|
+
#
|
|
76
|
+
h → х ;
|
|
77
|
+
fu\~ → | f ; # フュ
|
|
78
|
+
f → ф ;
|
|
79
|
+
#
|
|
80
|
+
#
|
|
81
|
+
m → м ;
|
|
82
|
+
#
|
|
83
|
+
#
|
|
84
|
+
ya → я ;
|
|
85
|
+
yi → и ; # Added for convenience, after sh, ch, j.
|
|
86
|
+
yu → ю ;
|
|
87
|
+
ye → е ; # ?? unobserved
|
|
88
|
+
yo → ё ;
|
|
89
|
+
#
|
|
90
|
+
#
|
|
91
|
+
r → р ;
|
|
92
|
+
#
|
|
93
|
+
#
|
|
94
|
+
wa → ва ;
|
|
95
|
+
w → ;
|
|
96
|
+
#
|
|
97
|
+
#
|
|
98
|
+
g → г ;
|
|
99
|
+
#
|
|
100
|
+
#
|
|
101
|
+
j → | zy ;
|
|
102
|
+
z → дз ;
|
|
103
|
+
#
|
|
104
|
+
#
|
|
105
|
+
de\~ → | d ; # デュ
|
|
106
|
+
dji\~ → | z ; # ヂャ, ヂュ, etc.
|
|
107
|
+
dj → | j ; # ヂ
|
|
108
|
+
do\~ → | d ; # ドゥ
|
|
109
|
+
dzu\~ → | z ; # ヅァ, ヅィ, etc.
|
|
110
|
+
dz → | z ; # ヅ
|
|
111
|
+
d → д ;
|
|
112
|
+
#
|
|
113
|
+
#
|
|
114
|
+
b → б ;
|
|
115
|
+
vu\~ → | v ; # ヴァ, etc.
|
|
116
|
+
v → в ; # ?? unobserved
|
|
117
|
+
#
|
|
118
|
+
#
|
|
119
|
+
p → п ;
|
|
120
|
+
#
|
|
121
|
+
#
|
|
122
|
+
::NFC(NFD);
|
|
123
|
+
|
|
@@ -0,0 +1,59 @@
|
|
|
1
|
+
|
|
2
|
+
# http://en.wikipedia.org/wiki/Kazakh_language#Phonology
|
|
3
|
+
#
|
|
4
|
+
# Output:
|
|
5
|
+
# m n ŋ
|
|
6
|
+
# p b t d k ɡ q ɢ
|
|
7
|
+
# f v x h
|
|
8
|
+
# s z ʃ ʒ ɕ t͡s t͡ɕ
|
|
9
|
+
# j w l ɾ
|
|
10
|
+
# ʉ ʊ ɘ ə ɛ æ ɑ
|
|
11
|
+
# i̯ɘ y̯ʉ u̯ʊ
|
|
12
|
+
::NFC;
|
|
13
|
+
::Lower;
|
|
14
|
+
ә → æ;
|
|
15
|
+
а → ɑ;
|
|
16
|
+
п → p;
|
|
17
|
+
б → b;
|
|
18
|
+
д → d;
|
|
19
|
+
е → i̯ɘ;
|
|
20
|
+
г → ɡ;
|
|
21
|
+
ғ → ɢ;
|
|
22
|
+
һ → h;
|
|
23
|
+
і → ɘ;
|
|
24
|
+
й → j;
|
|
25
|
+
к → k;
|
|
26
|
+
қ → q;
|
|
27
|
+
л → l;
|
|
28
|
+
м → m;
|
|
29
|
+
н → n;
|
|
30
|
+
ң → ŋ;
|
|
31
|
+
р → ɾ;
|
|
32
|
+
с → s;
|
|
33
|
+
т → t;
|
|
34
|
+
у → w;
|
|
35
|
+
з → z;
|
|
36
|
+
ш → ʃ;
|
|
37
|
+
ж → ʒ;
|
|
38
|
+
ы → ə;
|
|
39
|
+
ө → y̯ʉ;
|
|
40
|
+
о → u̯ʊ;
|
|
41
|
+
ү → ʉ;
|
|
42
|
+
ұ → ʊ;
|
|
43
|
+
# Some characters that are not really Kazakh, but appear frequently
|
|
44
|
+
# in Kazakh-language text as part of loanwords.
|
|
45
|
+
в → v;
|
|
46
|
+
и → i;
|
|
47
|
+
ц → t͡s;
|
|
48
|
+
ч → t͡ɕ;
|
|
49
|
+
щ → ɕ;
|
|
50
|
+
х → x;
|
|
51
|
+
ф → f;
|
|
52
|
+
э → ɛ;
|
|
53
|
+
ю → ju;
|
|
54
|
+
я → jɑ;
|
|
55
|
+
ё → jo;
|
|
56
|
+
ъ →;
|
|
57
|
+
ь →;
|
|
58
|
+
\- → ' ';
|
|
59
|
+
|
|
@@ -0,0 +1,71 @@
|
|
|
1
|
+
|
|
2
|
+
# Transformation from Kyrgyz (ky) to its IPA transcription (ky_FONIPA).
|
|
3
|
+
# http://en.wikipedia.org/wiki/Kyrgyz_alphabet#Correspondence_chart
|
|
4
|
+
::Lower;
|
|
5
|
+
::NFC;
|
|
6
|
+
$consonant_sound = [bdfɡklmnŋpqrʁsʃtvzʒχ];
|
|
7
|
+
аа → ɑː;
|
|
8
|
+
а → ɑ;
|
|
9
|
+
б → b;
|
|
10
|
+
в → v;
|
|
11
|
+
{г} [аоуы] → ʁ;
|
|
12
|
+
г → ɡ;
|
|
13
|
+
дж → d͡ʒ; # eg. Джамадан
|
|
14
|
+
дд → dː;
|
|
15
|
+
д → d;
|
|
16
|
+
[$] {е} → je; # at the beginning of a word
|
|
17
|
+
е → e;
|
|
18
|
+
ё → jo; # appears only in loanwords
|
|
19
|
+
ж → d͡ʒ;
|
|
20
|
+
з → z;
|
|
21
|
+
ии → iː;
|
|
22
|
+
и → i;
|
|
23
|
+
й → j;
|
|
24
|
+
кк → kː;
|
|
25
|
+
[$] {к} [еёиɵүю] → ɡ; # eg. кирет, кишиден, келди
|
|
26
|
+
{к} [аоуы] → q; # eg. чокусу, факультетин, нукура
|
|
27
|
+
[ɑouɯ] ː? {к} → q; # eg. Исак, Бирок, Кутлук, Ферганалык
|
|
28
|
+
[y] $consonant_sound+ ː? {к} [$] → k; # eg. мүлк, түрк
|
|
29
|
+
$consonant_sound {к} [$] → q; # eg. даңк, калк, кырк
|
|
30
|
+
[ŋ] {к} → q;
|
|
31
|
+
к → k;
|
|
32
|
+
# TODO(sascha): Verify whether /lʲ/ is really phonemic in Kyrgyz;
|
|
33
|
+
# is there really a minimal pair with /l/ versus /lʲ/?
|
|
34
|
+
[eøy] ː? {л}к → lʲ; # eg. мүлк, күлкү, өлкө, эзелки
|
|
35
|
+
лл → lː;
|
|
36
|
+
л → l;
|
|
37
|
+
мм → mː;
|
|
38
|
+
м → m;
|
|
39
|
+
нн → nː;
|
|
40
|
+
н → n;
|
|
41
|
+
ң → ŋ;
|
|
42
|
+
оо → oː;
|
|
43
|
+
о → o;
|
|
44
|
+
өө → øː;
|
|
45
|
+
ө → ø;
|
|
46
|
+
п → p;
|
|
47
|
+
р → r;
|
|
48
|
+
сс → sː;
|
|
49
|
+
с → s;
|
|
50
|
+
тт → tː;
|
|
51
|
+
тч → t͡ʃ; # eg. екетчилерден
|
|
52
|
+
т → t;
|
|
53
|
+
уу → uː;
|
|
54
|
+
у → u;
|
|
55
|
+
үү → yː;
|
|
56
|
+
ү → y;
|
|
57
|
+
ф → f; # only in loanwords
|
|
58
|
+
х → χ;
|
|
59
|
+
ц → t͡s; # only in loanwords
|
|
60
|
+
ч → t͡ʃ;
|
|
61
|
+
ш → ʃ;
|
|
62
|
+
щ → ʃ t͡ʃ; # only in loanwords
|
|
63
|
+
ъ → ; # no phonemic value; appears only in loanwords
|
|
64
|
+
ы → ɯ;
|
|
65
|
+
ь → ; # no phonemic value; appears only in loanwords
|
|
66
|
+
ээ → eː;
|
|
67
|
+
э → e;
|
|
68
|
+
ю → ju;
|
|
69
|
+
я → jɑ;
|
|
70
|
+
\- → ' ';
|
|
71
|
+
|
|
@@ -0,0 +1,79 @@
|
|
|
1
|
+
|
|
2
|
+
# Transformation from Latin (la) to its IPA transcription (la_FONIPA).
|
|
3
|
+
# http://en.wikipedia.org/wiki/Latin_spelling_and_pronunciation
|
|
4
|
+
# http://en.wikipedia.org/wiki/Wikipedia:IPA_for_Latin
|
|
5
|
+
#
|
|
6
|
+
# These rules follow the Wikipedia description of the presumed pronunciation
|
|
7
|
+
# of Classical Latin. This is different from Medieval Latin, and it is also
|
|
8
|
+
# different from the ecclesiastical pronunciation used by the Roman Catholic
|
|
9
|
+
# church.
|
|
10
|
+
::Lower;
|
|
11
|
+
::NFC;
|
|
12
|
+
$vowel = [aáàăāeéèĕēiíìĭīoóòŏōuúùŭūæœ];
|
|
13
|
+
$end_of_word = [$ ];
|
|
14
|
+
ae → aj;
|
|
15
|
+
av → aw;
|
|
16
|
+
æ → aj; # 19th century English orthography
|
|
17
|
+
ā → aː;
|
|
18
|
+
[aáàă] → a;
|
|
19
|
+
b → b;
|
|
20
|
+
ch → kʰ; # Greek loanwords
|
|
21
|
+
c → k;
|
|
22
|
+
d → d;
|
|
23
|
+
ev → ew;
|
|
24
|
+
ē → eː;
|
|
25
|
+
[eéèĕ] → ɛ;
|
|
26
|
+
f → f;
|
|
27
|
+
{g} n → ŋ; # eg. agnus
|
|
28
|
+
g → ɡ;
|
|
29
|
+
h → h;
|
|
30
|
+
ī → iː;
|
|
31
|
+
{[iíìĭ]} $vowel → j; # eg. cuius
|
|
32
|
+
[iíìĭ] → ɪ;
|
|
33
|
+
k → k;
|
|
34
|
+
l → l;
|
|
35
|
+
m → m;
|
|
36
|
+
{n} [bpfm] → m; # eg. infirmus
|
|
37
|
+
{n} [gckq] → ŋ; # eg. quinque
|
|
38
|
+
n → n;
|
|
39
|
+
œ → oj; # 19th century English orthography
|
|
40
|
+
oe → oj;
|
|
41
|
+
ō → oː;
|
|
42
|
+
[oóòŏ] → ɔ;
|
|
43
|
+
ph → pʰ; # Greek loanwords
|
|
44
|
+
p → p;
|
|
45
|
+
qu → kʷ;
|
|
46
|
+
qv → kʷ;
|
|
47
|
+
rh → rʰ; # Greek loanwords
|
|
48
|
+
r → r;
|
|
49
|
+
s → s;
|
|
50
|
+
th → tʰ; # Greek loanwords
|
|
51
|
+
t → t;
|
|
52
|
+
ū → uː;
|
|
53
|
+
[uúùŭ] → ʊ;
|
|
54
|
+
{v} $vowel → w;
|
|
55
|
+
v → u;
|
|
56
|
+
xs → ks; # Old Latin spelling
|
|
57
|
+
x → ks;
|
|
58
|
+
y → y; # Greek loanwords
|
|
59
|
+
z → d͡z; # eg. zerum
|
|
60
|
+
::Null;
|
|
61
|
+
# Gemination of double consonants.
|
|
62
|
+
# http://en.wikipedia.org/wiki/Latin_spelling_and_pronunciation#Double_consonants
|
|
63
|
+
bb → bː;
|
|
64
|
+
dd → dː;
|
|
65
|
+
ɡɡ → ɡː;
|
|
66
|
+
hh → hː;
|
|
67
|
+
kk → kː;
|
|
68
|
+
ll → lː;
|
|
69
|
+
mm → mː;
|
|
70
|
+
nn → nː;
|
|
71
|
+
pp → pː;
|
|
72
|
+
rr → rː;
|
|
73
|
+
ss → sː;
|
|
74
|
+
tt → tː;
|
|
75
|
+
# Velarization of [l].
|
|
76
|
+
# http://en.wikipedia.org/wiki/Latin_spelling_and_pronunciation#cite_note-20
|
|
77
|
+
{l} [^aeɛiouː] → ɫ;
|
|
78
|
+
::NFC;
|
|
79
|
+
|
|
@@ -0,0 +1,20 @@
|
|
|
1
|
+
|
|
2
|
+
# Introduce an explicit dot above when lowercasing capital Is and Js
|
|
3
|
+
# whenever there are more accents above.
|
|
4
|
+
# (of the accents used in Lithuanian: grave, acute, tilde above, and ogonek)
|
|
5
|
+
# 0049; 0069 0307; 0049; 0049; lt More_Above; # LATIN CAPITAL LETTER I
|
|
6
|
+
# 004A; 006A 0307; 004A; 004A; lt More_Above; # LATIN CAPITAL LETTER J
|
|
7
|
+
# 012E; 012F 0307; 012E; 012E; lt More_Above; # LATIN CAPITAL LETTER I WITH OGONEK
|
|
8
|
+
# 00CC; 0069 0307 0300; 00CC; 00CC; lt; # LATIN CAPITAL LETTER I WITH GRAVE
|
|
9
|
+
# 00CD; 0069 0307 0301; 00CD; 00CD; lt; # LATIN CAPITAL LETTER I WITH ACUTE
|
|
10
|
+
# 0128; 0069 0307 0303; 0128; 0128; lt; # LATIN CAPITAL LETTER I WITH TILDE
|
|
11
|
+
::NFD();
|
|
12
|
+
I } [^[:ccc=Not_Reordered:][:ccc=Above:]]* [:ccc=Above:] → i \u0307;
|
|
13
|
+
J } [^[:ccc=Not_Reordered:][:ccc=Above:]]* [:ccc=Above:] → j \u0307;
|
|
14
|
+
I \u0328 } [^[:ccc=Not_Reordered:][:ccc=Above:]]* [:ccc=Above:] → i \u0328 \u0307;
|
|
15
|
+
I \u0300 → i \u0307 \u0300;
|
|
16
|
+
I \u0301 → i \u0307 \u0301;
|
|
17
|
+
I \u0303 → i \u0307 \u0303;
|
|
18
|
+
::Any-Lower();
|
|
19
|
+
::NFC();
|
|
20
|
+
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
|
|
2
|
+
# Make any string of letters after a cased letter lowercase.
|
|
3
|
+
::NFD();
|
|
4
|
+
[:cased:] [:case-ignorable:]* {I } [^[:ccc=Not_Reordered:][:ccc=Above:]]* [:ccc=Above:] → i \u0307;
|
|
5
|
+
[:cased:] [:case-ignorable:]* {J } [^[:ccc=Not_Reordered:][:ccc=Above:]]* [:ccc=Above:] → j \u0307;
|
|
6
|
+
[:cased:] [:case-ignorable:]* {I \u0328 } [^[:ccc=Not_Reordered:][:ccc=Above:]]* [:ccc=Above:] → i \u0328 \u0307;
|
|
7
|
+
[:cased:] [:case-ignorable:]* {I \u0300 → i \u0307 \u0300;
|
|
8
|
+
[:cased:] [:case-ignorable:]* {I \u0301 → i \u0307 \u0301;
|
|
9
|
+
[:cased:] [:case-ignorable:]* {I \u0303 → i \u0307 \u0303;
|
|
10
|
+
[:cased:] [:case-ignorable:]* { (.) → &Any-Lower($1) ;
|
|
11
|
+
# Otherwise all lowercase letters go to uppercase (titlecase letters stay as is).
|
|
12
|
+
[:Soft_Dotted:] [^[:ccc=Not_Reordered:][:ccc=Above:]]* { \u0307 → ;
|
|
13
|
+
([:Lowercase:]) → &Any-Upper($1) ;
|
|
14
|
+
::NFC();
|
|
15
|
+
|