cldr-transforms 46.0.0-BETA2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +41 -0
- package/README.md +27 -0
- package/bower.json +13 -0
- package/package.json +29 -0
- package/transforms/Amharic-Latin-BGN.json +9 -0
- package/transforms/Amharic-Latin-BGN.txt +441 -0
- package/transforms/Any-Accents.json +9 -0
- package/transforms/Any-Accents.txt +270 -0
- package/transforms/Any-Publishing.json +9 -0
- package/transforms/Any-Publishing.txt +63 -0
- package/transforms/Arabic-Latin-BGN.json +9 -0
- package/transforms/Arabic-Latin-BGN.txt +205 -0
- package/transforms/Arabic-Latin.json +11 -0
- package/transforms/Arabic-Latin.txt +181 -0
- package/transforms/Armenian-Latin-BGN.json +9 -0
- package/transforms/Armenian-Latin-BGN.txt +165 -0
- package/transforms/Azerbaijani-Latin-BGN.json +9 -0
- package/transforms/Azerbaijani-Latin-BGN.txt +183 -0
- package/transforms/Belarusian-Latin-BGN.json +9 -0
- package/transforms/Belarusian-Latin-BGN.txt +194 -0
- package/transforms/Bengali-Arabic.json +9 -0
- package/transforms/Bengali-Arabic.txt +7 -0
- package/transforms/Bengali-Devanagari.json +9 -0
- package/transforms/Bengali-Devanagari.txt +7 -0
- package/transforms/Bengali-Gujarati.json +9 -0
- package/transforms/Bengali-Gujarati.txt +7 -0
- package/transforms/Bengali-Gurmukhi.json +9 -0
- package/transforms/Bengali-Gurmukhi.txt +7 -0
- package/transforms/Bengali-InterIndic.json +7 -0
- package/transforms/Bengali-InterIndic.txt +99 -0
- package/transforms/Bengali-Kannada.json +9 -0
- package/transforms/Bengali-Kannada.txt +7 -0
- package/transforms/Bengali-Latin.json +9 -0
- package/transforms/Bengali-Latin.txt +7 -0
- package/transforms/Bengali-Malayalam.json +9 -0
- package/transforms/Bengali-Malayalam.txt +7 -0
- package/transforms/Bengali-Oriya.json +9 -0
- package/transforms/Bengali-Oriya.txt +7 -0
- package/transforms/Bengali-Tamil.json +9 -0
- package/transforms/Bengali-Tamil.txt +7 -0
- package/transforms/Bengali-Telugu.json +9 -0
- package/transforms/Bengali-Telugu.txt +7 -0
- package/transforms/Bengali-ur.json +8 -0
- package/transforms/Bengali-ur.txt +7 -0
- package/transforms/Bulgarian-Latin-BGN.json +9 -0
- package/transforms/Bulgarian-Latin-BGN.txt +237 -0
- package/transforms/CanadianAboriginal-Latin.json +11 -0
- package/transforms/CanadianAboriginal-Latin.txt +184 -0
- package/transforms/Cyrillic-Latin.json +11 -0
- package/transforms/Cyrillic-Latin.txt +280 -0
- package/transforms/Devanagari-Arabic.json +9 -0
- package/transforms/Devanagari-Arabic.txt +7 -0
- package/transforms/Devanagari-Bengali.json +9 -0
- package/transforms/Devanagari-Bengali.txt +7 -0
- package/transforms/Devanagari-Gujarati.json +9 -0
- package/transforms/Devanagari-Gujarati.txt +7 -0
- package/transforms/Devanagari-Gurmukhi.json +9 -0
- package/transforms/Devanagari-Gurmukhi.txt +7 -0
- package/transforms/Devanagari-InterIndic.json +7 -0
- package/transforms/Devanagari-InterIndic.txt +113 -0
- package/transforms/Devanagari-Kannada.json +9 -0
- package/transforms/Devanagari-Kannada.txt +7 -0
- package/transforms/Devanagari-Latin.json +9 -0
- package/transforms/Devanagari-Latin.txt +7 -0
- package/transforms/Devanagari-Malayalam.json +9 -0
- package/transforms/Devanagari-Malayalam.txt +7 -0
- package/transforms/Devanagari-Oriya.json +9 -0
- package/transforms/Devanagari-Oriya.txt +7 -0
- package/transforms/Devanagari-Tamil.json +9 -0
- package/transforms/Devanagari-Tamil.txt +7 -0
- package/transforms/Devanagari-Telugu.json +9 -0
- package/transforms/Devanagari-Telugu.txt +7 -0
- package/transforms/Devanagari-ur.json +8 -0
- package/transforms/Devanagari-ur.txt +7 -0
- package/transforms/Fullwidth-Halfwidth.json +9 -0
- package/transforms/Fullwidth-Halfwidth.txt +261 -0
- package/transforms/Georgian-Latin-BGN.json +9 -0
- package/transforms/Georgian-Latin-BGN.txt +43 -0
- package/transforms/Georgian-Latin-BGN_1981.json +8 -0
- package/transforms/Georgian-Latin-BGN_1981.txt +54 -0
- package/transforms/Georgian-Latin.json +11 -0
- package/transforms/Georgian-Latin.txt +53 -0
- package/transforms/Greek-Latin-BGN.json +9 -0
- package/transforms/Greek-Latin-BGN.txt +419 -0
- package/transforms/Greek-Latin.json +11 -0
- package/transforms/Greek-Latin.txt +251 -0
- package/transforms/Greek_Latin_UNGEGN.json +11 -0
- package/transforms/Greek_Latin_UNGEGN.txt +179 -0
- package/transforms/Gujarati-Arabic.json +9 -0
- package/transforms/Gujarati-Arabic.txt +7 -0
- package/transforms/Gujarati-Bengali.json +9 -0
- package/transforms/Gujarati-Bengali.txt +7 -0
- package/transforms/Gujarati-Devanagari.json +9 -0
- package/transforms/Gujarati-Devanagari.txt +7 -0
- package/transforms/Gujarati-Gurmukhi.json +9 -0
- package/transforms/Gujarati-Gurmukhi.txt +7 -0
- package/transforms/Gujarati-InterIndic.json +7 -0
- package/transforms/Gujarati-InterIndic.txt +89 -0
- package/transforms/Gujarati-Kannada.json +9 -0
- package/transforms/Gujarati-Kannada.txt +7 -0
- package/transforms/Gujarati-Latin.json +9 -0
- package/transforms/Gujarati-Latin.txt +7 -0
- package/transforms/Gujarati-Malayalam.json +9 -0
- package/transforms/Gujarati-Malayalam.txt +7 -0
- package/transforms/Gujarati-Oriya.json +9 -0
- package/transforms/Gujarati-Oriya.txt +7 -0
- package/transforms/Gujarati-Tamil.json +9 -0
- package/transforms/Gujarati-Tamil.txt +7 -0
- package/transforms/Gujarati-Telugu.json +9 -0
- package/transforms/Gujarati-Telugu.txt +7 -0
- package/transforms/Gujarati-ur.json +8 -0
- package/transforms/Gujarati-ur.txt +7 -0
- package/transforms/Gurmukhi-Arabic.json +9 -0
- package/transforms/Gurmukhi-Arabic.txt +7 -0
- package/transforms/Gurmukhi-Bengali.json +9 -0
- package/transforms/Gurmukhi-Bengali.txt +7 -0
- package/transforms/Gurmukhi-Devanagari.json +9 -0
- package/transforms/Gurmukhi-Devanagari.txt +7 -0
- package/transforms/Gurmukhi-Gujarati.json +9 -0
- package/transforms/Gurmukhi-Gujarati.txt +7 -0
- package/transforms/Gurmukhi-InterIndic.json +7 -0
- package/transforms/Gurmukhi-InterIndic.txt +88 -0
- package/transforms/Gurmukhi-Kannada.json +9 -0
- package/transforms/Gurmukhi-Kannada.txt +7 -0
- package/transforms/Gurmukhi-Latin.json +9 -0
- package/transforms/Gurmukhi-Latin.txt +7 -0
- package/transforms/Gurmukhi-Malayalam.json +9 -0
- package/transforms/Gurmukhi-Malayalam.txt +7 -0
- package/transforms/Gurmukhi-Oriya.json +9 -0
- package/transforms/Gurmukhi-Oriya.txt +7 -0
- package/transforms/Gurmukhi-Tamil.json +9 -0
- package/transforms/Gurmukhi-Tamil.txt +7 -0
- package/transforms/Gurmukhi-Telugu.json +9 -0
- package/transforms/Gurmukhi-Telugu.txt +7 -0
- package/transforms/Gurmukhi-ur.json +8 -0
- package/transforms/Gurmukhi-ur.txt +7 -0
- package/transforms/Han-Latin-Names.json +8 -0
- package/transforms/Han-Latin-Names.txt +65 -0
- package/transforms/Han-Latin.json +9 -0
- package/transforms/Han-Latin.txt +1501 -0
- package/transforms/Han-Spacedhan.json +7 -0
- package/transforms/Han-Spacedhan.txt +35 -0
- package/transforms/Hangul-Latin.json +9 -0
- package/transforms/Hangul-Latin.txt +6 -0
- package/transforms/Hebrew-Latin-BGN.json +9 -0
- package/transforms/Hebrew-Latin-BGN.txt +113 -0
- package/transforms/Hebrew-Latin.json +11 -0
- package/transforms/Hebrew-Latin.txt +91 -0
- package/transforms/Hiragana-Katakana.json +11 -0
- package/transforms/Hiragana-Katakana.txt +179 -0
- package/transforms/Hiragana-Latin.json +11 -0
- package/transforms/Hiragana-Latin.txt +9 -0
- package/transforms/IPA-XSampa.json +11 -0
- package/transforms/IPA-XSampa.txt +228 -0
- package/transforms/InterIndic-Arabic.json +7 -0
- package/transforms/InterIndic-Arabic.txt +128 -0
- package/transforms/InterIndic-Bengali.json +7 -0
- package/transforms/InterIndic-Bengali.txt +135 -0
- package/transforms/InterIndic-Devanagari.json +7 -0
- package/transforms/InterIndic-Devanagari.txt +151 -0
- package/transforms/InterIndic-Gujarati.json +7 -0
- package/transforms/InterIndic-Gujarati.txt +136 -0
- package/transforms/InterIndic-Gurmukhi.json +7 -0
- package/transforms/InterIndic-Gurmukhi.txt +142 -0
- package/transforms/InterIndic-Kannada.json +7 -0
- package/transforms/InterIndic-Kannada.txt +137 -0
- package/transforms/InterIndic-Latin.json +7 -0
- package/transforms/InterIndic-Latin.txt +492 -0
- package/transforms/InterIndic-Malayalam.json +7 -0
- package/transforms/InterIndic-Malayalam.txt +137 -0
- package/transforms/InterIndic-Oriya.json +7 -0
- package/transforms/InterIndic-Oriya.txt +135 -0
- package/transforms/InterIndic-Tamil.json +7 -0
- package/transforms/InterIndic-Tamil.txt +136 -0
- package/transforms/InterIndic-Telugu.json +7 -0
- package/transforms/InterIndic-Telugu.txt +136 -0
- package/transforms/InterIndic-ur.json +7 -0
- package/transforms/InterIndic-ur.txt +119 -0
- package/transforms/Jamo-Latin.json +9 -0
- package/transforms/Jamo-Latin.txt +6 -0
- package/transforms/Kannada-Arabic.json +9 -0
- package/transforms/Kannada-Arabic.txt +7 -0
- package/transforms/Kannada-Bengali.json +9 -0
- package/transforms/Kannada-Bengali.txt +7 -0
- package/transforms/Kannada-Devanagari.json +9 -0
- package/transforms/Kannada-Devanagari.txt +7 -0
- package/transforms/Kannada-Gujarati.json +9 -0
- package/transforms/Kannada-Gujarati.txt +7 -0
- package/transforms/Kannada-Gurmukhi.json +9 -0
- package/transforms/Kannada-Gurmukhi.txt +7 -0
- package/transforms/Kannada-InterIndic.json +7 -0
- package/transforms/Kannada-InterIndic.txt +87 -0
- package/transforms/Kannada-Latin.json +9 -0
- package/transforms/Kannada-Latin.txt +7 -0
- package/transforms/Kannada-Malayalam.json +9 -0
- package/transforms/Kannada-Malayalam.txt +7 -0
- package/transforms/Kannada-Oriya.json +9 -0
- package/transforms/Kannada-Oriya.txt +7 -0
- package/transforms/Kannada-Tamil.json +9 -0
- package/transforms/Kannada-Tamil.txt +7 -0
- package/transforms/Kannada-Telugu.json +9 -0
- package/transforms/Kannada-Telugu.txt +7 -0
- package/transforms/Kannada-ur.json +8 -0
- package/transforms/Kannada-ur.txt +7 -0
- package/transforms/Katakana-Latin-BGN.json +9 -0
- package/transforms/Katakana-Latin-BGN.txt +335 -0
- package/transforms/Kazakh-Latin-BGN.json +9 -0
- package/transforms/Kazakh-Latin-BGN.txt +332 -0
- package/transforms/Kirghiz-Latin-BGN.json +9 -0
- package/transforms/Kirghiz-Latin-BGN.txt +211 -0
- package/transforms/Korean-Latin-BGN.json +9 -0
- package/transforms/Korean-Latin-BGN.txt +345 -0
- package/transforms/Latin-ASCII.json +9 -0
- package/transforms/Latin-ASCII.txt +909 -0
- package/transforms/Latin-Armenian.json +11 -0
- package/transforms/Latin-Armenian.txt +88 -0
- package/transforms/Latin-Bengali.json +9 -0
- package/transforms/Latin-Bengali.txt +8 -0
- package/transforms/Latin-Bopomofo.json +11 -0
- package/transforms/Latin-Bopomofo.txt +1445 -0
- package/transforms/Latin-ConjoiningJamo.json +7 -0
- package/transforms/Latin-ConjoiningJamo.txt +477 -0
- package/transforms/Latin-Devanagari.json +9 -0
- package/transforms/Latin-Devanagari.txt +8 -0
- package/transforms/Latin-Ethiopic.json +11 -0
- package/transforms/Latin-Ethiopic.txt +277 -0
- package/transforms/Latin-Gujarati.json +9 -0
- package/transforms/Latin-Gujarati.txt +8 -0
- package/transforms/Latin-Gurmukhi.json +9 -0
- package/transforms/Latin-Gurmukhi.txt +8 -0
- package/transforms/Latin-Hangul.json +9 -0
- package/transforms/Latin-Hangul.txt +7 -0
- package/transforms/Latin-InterIndic.json +7 -0
- package/transforms/Latin-InterIndic.txt +377 -0
- package/transforms/Latin-Jamo.json +9 -0
- package/transforms/Latin-Jamo.txt +7 -0
- package/transforms/Latin-Kannada.json +9 -0
- package/transforms/Latin-Kannada.txt +8 -0
- package/transforms/Latin-Katakana.json +11 -0
- package/transforms/Latin-Katakana.txt +382 -0
- package/transforms/Latin-Malayalam.json +9 -0
- package/transforms/Latin-Malayalam.txt +8 -0
- package/transforms/Latin-NumericPinyin.json +9 -0
- package/transforms/Latin-NumericPinyin.txt +29 -0
- package/transforms/Latin-Oriya.json +9 -0
- package/transforms/Latin-Oriya.txt +8 -0
- package/transforms/Latin-Tamil.json +9 -0
- package/transforms/Latin-Tamil.txt +8 -0
- package/transforms/Latin-Telugu.json +9 -0
- package/transforms/Latin-Telugu.txt +8 -0
- package/transforms/Latin-Thai.json +9 -0
- package/transforms/Latin-Thai.txt +7 -0
- package/transforms/Macedonian-Latin-BGN.json +9 -0
- package/transforms/Macedonian-Latin-BGN.txt +176 -0
- package/transforms/Malayalam-Arabic.json +9 -0
- package/transforms/Malayalam-Arabic.txt +7 -0
- package/transforms/Malayalam-Bengali.json +9 -0
- package/transforms/Malayalam-Bengali.txt +7 -0
- package/transforms/Malayalam-Devanagari.json +9 -0
- package/transforms/Malayalam-Devanagari.txt +7 -0
- package/transforms/Malayalam-Gujarati.json +9 -0
- package/transforms/Malayalam-Gujarati.txt +7 -0
- package/transforms/Malayalam-Gurmukhi.json +9 -0
- package/transforms/Malayalam-Gurmukhi.txt +7 -0
- package/transforms/Malayalam-InterIndic.json +7 -0
- package/transforms/Malayalam-InterIndic.txt +87 -0
- package/transforms/Malayalam-Kannada.json +9 -0
- package/transforms/Malayalam-Kannada.txt +7 -0
- package/transforms/Malayalam-Latin.json +9 -0
- package/transforms/Malayalam-Latin.txt +7 -0
- package/transforms/Malayalam-Oriya.json +9 -0
- package/transforms/Malayalam-Oriya.txt +7 -0
- package/transforms/Malayalam-Tamil.json +9 -0
- package/transforms/Malayalam-Tamil.txt +7 -0
- package/transforms/Malayalam-Telugu.json +9 -0
- package/transforms/Malayalam-Telugu.txt +7 -0
- package/transforms/Malayalam-ur.json +8 -0
- package/transforms/Malayalam-ur.txt +7 -0
- package/transforms/Maldivian-Latin-BGN.json +9 -0
- package/transforms/Maldivian-Latin-BGN.txt +171 -0
- package/transforms/Mongolian-Latin-BGN.json +9 -0
- package/transforms/Mongolian-Latin-BGN.txt +151 -0
- package/transforms/Myanmar-Latin.json +9 -0
- package/transforms/Myanmar-Latin.txt +367 -0
- package/transforms/Oriya-Arabic.json +9 -0
- package/transforms/Oriya-Arabic.txt +7 -0
- package/transforms/Oriya-Bengali.json +9 -0
- package/transforms/Oriya-Bengali.txt +7 -0
- package/transforms/Oriya-Devanagari.json +9 -0
- package/transforms/Oriya-Devanagari.txt +7 -0
- package/transforms/Oriya-Gujarati.json +9 -0
- package/transforms/Oriya-Gujarati.txt +7 -0
- package/transforms/Oriya-Gurmukhi.json +9 -0
- package/transforms/Oriya-Gurmukhi.txt +7 -0
- package/transforms/Oriya-InterIndic.json +7 -0
- package/transforms/Oriya-InterIndic.txt +91 -0
- package/transforms/Oriya-Kannada.json +9 -0
- package/transforms/Oriya-Kannada.txt +7 -0
- package/transforms/Oriya-Latin.json +9 -0
- package/transforms/Oriya-Latin.txt +7 -0
- package/transforms/Oriya-Malayalam.json +9 -0
- package/transforms/Oriya-Malayalam.txt +7 -0
- package/transforms/Oriya-Tamil.json +9 -0
- package/transforms/Oriya-Tamil.txt +7 -0
- package/transforms/Oriya-Telugu.json +9 -0
- package/transforms/Oriya-Telugu.txt +7 -0
- package/transforms/Oriya-ur.json +8 -0
- package/transforms/Oriya-ur.txt +7 -0
- package/transforms/Pashto-Latin-BGN.json +9 -0
- package/transforms/Pashto-Latin-BGN.txt +231 -0
- package/transforms/Persian-Latin-BGN.json +9 -0
- package/transforms/Persian-Latin-BGN.txt +203 -0
- package/transforms/Pinyin-NumericPinyin.json +7 -0
- package/transforms/Pinyin-NumericPinyin.txt +8 -0
- package/transforms/Russian-Latin-BGN.json +9 -0
- package/transforms/Russian-Latin-BGN.txt +235 -0
- package/transforms/Serbian-Latin-BGN.json +9 -0
- package/transforms/Serbian-Latin-BGN.txt +119 -0
- package/transforms/Simplified-Traditional.json +11 -0
- package/transforms/Simplified-Traditional.txt +4393 -0
- package/transforms/Syriac-Latin.json +11 -0
- package/transforms/Syriac-Latin.txt +52 -0
- package/transforms/Tamil-Arabic.json +9 -0
- package/transforms/Tamil-Arabic.txt +7 -0
- package/transforms/Tamil-Bengali.json +9 -0
- package/transforms/Tamil-Bengali.txt +7 -0
- package/transforms/Tamil-Devanagari.json +9 -0
- package/transforms/Tamil-Devanagari.txt +7 -0
- package/transforms/Tamil-Gujarati.json +9 -0
- package/transforms/Tamil-Gujarati.txt +7 -0
- package/transforms/Tamil-Gurmukhi.json +9 -0
- package/transforms/Tamil-Gurmukhi.txt +7 -0
- package/transforms/Tamil-InterIndic.json +7 -0
- package/transforms/Tamil-InterIndic.txt +70 -0
- package/transforms/Tamil-Kannada.json +9 -0
- package/transforms/Tamil-Kannada.txt +7 -0
- package/transforms/Tamil-Latin.json +9 -0
- package/transforms/Tamil-Latin.txt +7 -0
- package/transforms/Tamil-Malayalam.json +9 -0
- package/transforms/Tamil-Malayalam.txt +7 -0
- package/transforms/Tamil-Oriya.json +9 -0
- package/transforms/Tamil-Oriya.txt +7 -0
- package/transforms/Tamil-Telugu.json +9 -0
- package/transforms/Tamil-Telugu.txt +7 -0
- package/transforms/Tamil-ur.json +8 -0
- package/transforms/Tamil-ur.txt +7 -0
- package/transforms/Telugu-Arabic.json +9 -0
- package/transforms/Telugu-Arabic.txt +7 -0
- package/transforms/Telugu-Bengali.json +9 -0
- package/transforms/Telugu-Bengali.txt +7 -0
- package/transforms/Telugu-Devanagari.json +9 -0
- package/transforms/Telugu-Devanagari.txt +7 -0
- package/transforms/Telugu-Gujarati.json +9 -0
- package/transforms/Telugu-Gujarati.txt +7 -0
- package/transforms/Telugu-Gurmukhi.json +9 -0
- package/transforms/Telugu-Gurmukhi.txt +7 -0
- package/transforms/Telugu-InterIndic.json +7 -0
- package/transforms/Telugu-InterIndic.txt +87 -0
- package/transforms/Telugu-Kannada.json +9 -0
- package/transforms/Telugu-Kannada.txt +7 -0
- package/transforms/Telugu-Latin.json +9 -0
- package/transforms/Telugu-Latin.txt +7 -0
- package/transforms/Telugu-Malayalam.json +9 -0
- package/transforms/Telugu-Malayalam.txt +7 -0
- package/transforms/Telugu-Oriya.json +9 -0
- package/transforms/Telugu-Oriya.txt +7 -0
- package/transforms/Telugu-Tamil.json +9 -0
- package/transforms/Telugu-Tamil.txt +7 -0
- package/transforms/Telugu-ur.json +8 -0
- package/transforms/Telugu-ur.txt +7 -0
- package/transforms/Thaana-Latin.json +11 -0
- package/transforms/Thaana-Latin.txt +433 -0
- package/transforms/Thai-Latin.json +9 -0
- package/transforms/Thai-Latin.txt +9 -0
- package/transforms/Thai-ThaiLogical.json +7 -0
- package/transforms/Thai-ThaiLogical.txt +16 -0
- package/transforms/Thai-ThaiSemi.json +7 -0
- package/transforms/Thai-ThaiSemi.txt +6 -0
- package/transforms/ThaiLogical-Latin.json +7 -0
- package/transforms/ThaiLogical-Latin.txt +147 -0
- package/transforms/Turkmen-Latin-BGN.json +9 -0
- package/transforms/Turkmen-Latin-BGN.txt +302 -0
- package/transforms/Ukrainian-Latin-BGN.json +9 -0
- package/transforms/Ukrainian-Latin-BGN.txt +283 -0
- package/transforms/Uzbek-Latin-BGN.json +9 -0
- package/transforms/Uzbek-Latin-BGN.txt +261 -0
- package/transforms/am-Ethi-t-am-brai.json +11 -0
- package/transforms/am-Ethi-t-am-brai.txt +652 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.json +9 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.txt +6925 -0
- package/transforms/am-Ethi-t-d0-morse.json +9 -0
- package/transforms/am-Ethi-t-d0-morse.txt +657 -0
- package/transforms/am-am_FONIPA.json +9 -0
- package/transforms/am-am_FONIPA.txt +694 -0
- package/transforms/am-ar.json +8 -0
- package/transforms/am-ar.txt +5 -0
- package/transforms/am-chr.json +8 -0
- package/transforms/am-chr.txt +4 -0
- package/transforms/am-fa.json +8 -0
- package/transforms/am-fa.txt +4 -0
- package/transforms/az-Lower.json +8 -0
- package/transforms/az-Lower.txt +13 -0
- package/transforms/az-Title.json +8 -0
- package/transforms/az-Title.txt +11 -0
- package/transforms/az-Upper.json +8 -0
- package/transforms/az-Upper.txt +5 -0
- package/transforms/blt-fonipa-t-blt.json +8 -0
- package/transforms/blt-fonipa-t-blt.txt +132 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.txt +537 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.txt +773 -0
- package/transforms/ch-am.json +8 -0
- package/transforms/ch-am.txt +4 -0
- package/transforms/ch-ar.json +8 -0
- package/transforms/ch-ar.txt +4 -0
- package/transforms/ch-ch_FONIPA.json +8 -0
- package/transforms/ch-ch_FONIPA.txt +79 -0
- package/transforms/ch-chr.json +8 -0
- package/transforms/ch-chr.txt +4 -0
- package/transforms/ch-fa.json +8 -0
- package/transforms/ch-fa.txt +4 -0
- package/transforms/chr-chr_FONIPA.json +8 -0
- package/transforms/chr-chr_FONIPA.txt +111 -0
- package/transforms/cs-am.json +8 -0
- package/transforms/cs-am.txt +4 -0
- package/transforms/cs-ar.json +8 -0
- package/transforms/cs-ar.txt +4 -0
- package/transforms/cs-chr.json +8 -0
- package/transforms/cs-chr.txt +4 -0
- package/transforms/cs-cs_FONIPA.json +8 -0
- package/transforms/cs-cs_FONIPA.txt +74 -0
- package/transforms/cs-fa.json +8 -0
- package/transforms/cs-fa.txt +4 -0
- package/transforms/cs-ja.json +8 -0
- package/transforms/cs-ja.txt +4 -0
- package/transforms/cs-ko.json +8 -0
- package/transforms/cs-ko.txt +4 -0
- package/transforms/cs_FONIPA-ja.json +8 -0
- package/transforms/cs_FONIPA-ja.txt +228 -0
- package/transforms/cs_FONIPA-ko.json +8 -0
- package/transforms/cs_FONIPA-ko.txt +88 -0
- package/transforms/cy-fonipa-t-cy.json +8 -0
- package/transforms/cy-fonipa-t-cy.txt +189 -0
- package/transforms/de-ASCII.json +8 -0
- package/transforms/de-ASCII.txt +15 -0
- package/transforms/dsb-dsb_FONIPA.json +8 -0
- package/transforms/dsb-dsb_FONIPA.txt +67 -0
- package/transforms/el-Lower.json +8 -0
- package/transforms/el-Lower.txt +12 -0
- package/transforms/el-Title.json +8 -0
- package/transforms/el-Title.txt +12 -0
- package/transforms/el-Upper.json +8 -0
- package/transforms/el-Upper.txt +11 -0
- package/transforms/eo-am.json +8 -0
- package/transforms/eo-am.txt +4 -0
- package/transforms/eo-ar.json +8 -0
- package/transforms/eo-ar.txt +4 -0
- package/transforms/eo-chr.json +8 -0
- package/transforms/eo-chr.txt +4 -0
- package/transforms/eo-eo_FONIPA.json +8 -0
- package/transforms/eo-eo_FONIPA.txt +47 -0
- package/transforms/eo-fa.json +8 -0
- package/transforms/eo-fa.txt +4 -0
- package/transforms/es-am.json +8 -0
- package/transforms/es-am.txt +4 -0
- package/transforms/es-ar.json +8 -0
- package/transforms/es-ar.txt +13 -0
- package/transforms/es-chr.json +8 -0
- package/transforms/es-chr.txt +4 -0
- package/transforms/es-es_FONIPA.json +8 -0
- package/transforms/es-es_FONIPA.txt +139 -0
- package/transforms/es-fa.json +8 -0
- package/transforms/es-fa.txt +13 -0
- package/transforms/es-ja.json +8 -0
- package/transforms/es-ja.txt +4 -0
- package/transforms/es-zh.json +8 -0
- package/transforms/es-zh.txt +4 -0
- package/transforms/es_419-am.json +8 -0
- package/transforms/es_419-am.txt +5 -0
- package/transforms/es_419-ar.json +8 -0
- package/transforms/es_419-ar.txt +14 -0
- package/transforms/es_419-chr.json +8 -0
- package/transforms/es_419-chr.txt +5 -0
- package/transforms/es_419-fa.json +8 -0
- package/transforms/es_419-fa.txt +14 -0
- package/transforms/es_419-ja.json +8 -0
- package/transforms/es_419-ja.txt +5 -0
- package/transforms/es_419-zh.json +8 -0
- package/transforms/es_419-zh.txt +5 -0
- package/transforms/es_FONIPA-am.json +8 -0
- package/transforms/es_FONIPA-am.txt +230 -0
- package/transforms/es_FONIPA-es_419_FONIPA.json +8 -0
- package/transforms/es_FONIPA-es_419_FONIPA.txt +6 -0
- package/transforms/es_FONIPA-ja.json +8 -0
- package/transforms/es_FONIPA-ja.txt +155 -0
- package/transforms/es_FONIPA-zh.json +8 -0
- package/transforms/es_FONIPA-zh.txt +522 -0
- package/transforms/fa-fa_FONIPA.json +8 -0
- package/transforms/fa-fa_FONIPA.txt +107 -0
- package/transforms/gz-Ethi-t-und-sarb.json +11 -0
- package/transforms/gz-Ethi-t-und-sarb.txt +180 -0
- package/transforms/ha-ha_NE.json +8 -0
- package/transforms/ha-ha_NE.txt +6 -0
- package/transforms/hy-am.json +8 -0
- package/transforms/hy-am.txt +4 -0
- package/transforms/hy-ar.json +8 -0
- package/transforms/hy-ar.txt +4 -0
- package/transforms/hy-chr.json +8 -0
- package/transforms/hy-chr.txt +4 -0
- package/transforms/hy-fa.json +8 -0
- package/transforms/hy-fa.txt +4 -0
- package/transforms/hy-hy_FONIPA.json +8 -0
- package/transforms/hy-hy_FONIPA.txt +52 -0
- package/transforms/hy_AREVMDA-am.json +8 -0
- package/transforms/hy_AREVMDA-am.txt +4 -0
- package/transforms/hy_AREVMDA-ar.json +8 -0
- package/transforms/hy_AREVMDA-ar.txt +4 -0
- package/transforms/hy_AREVMDA-chr.json +8 -0
- package/transforms/hy_AREVMDA-chr.txt +4 -0
- package/transforms/hy_AREVMDA-fa.json +8 -0
- package/transforms/hy_AREVMDA-fa.txt +4 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.json +8 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.txt +80 -0
- package/transforms/ia-am.json +8 -0
- package/transforms/ia-am.txt +4 -0
- package/transforms/ia-ar.json +8 -0
- package/transforms/ia-ar.txt +4 -0
- package/transforms/ia-chr.json +8 -0
- package/transforms/ia-chr.txt +4 -0
- package/transforms/ia-fa.json +8 -0
- package/transforms/ia-fa.txt +4 -0
- package/transforms/ia-ia_FONIPA.json +8 -0
- package/transforms/ia-ia_FONIPA.txt +71 -0
- package/transforms/it-am.json +8 -0
- package/transforms/it-am.txt +257 -0
- package/transforms/it-ja.json +8 -0
- package/transforms/it-ja.txt +259 -0
- package/transforms/ja_Latn-ko.json +8 -0
- package/transforms/ja_Latn-ko.txt +141 -0
- package/transforms/ja_Latn-ru.json +8 -0
- package/transforms/ja_Latn-ru.txt +123 -0
- package/transforms/kk-am.json +8 -0
- package/transforms/kk-am.txt +4 -0
- package/transforms/kk-ar.json +8 -0
- package/transforms/kk-ar.txt +4 -0
- package/transforms/kk-chr.json +8 -0
- package/transforms/kk-chr.txt +4 -0
- package/transforms/kk-fa.json +8 -0
- package/transforms/kk-fa.txt +4 -0
- package/transforms/kk-kk_FONIPA.json +8 -0
- package/transforms/kk-kk_FONIPA.txt +59 -0
- package/transforms/ky-am.json +8 -0
- package/transforms/ky-am.txt +4 -0
- package/transforms/ky-ar.json +8 -0
- package/transforms/ky-ar.txt +4 -0
- package/transforms/ky-chr.json +8 -0
- package/transforms/ky-chr.txt +4 -0
- package/transforms/ky-fa.json +8 -0
- package/transforms/ky-fa.txt +4 -0
- package/transforms/ky-ky_FONIPA.json +8 -0
- package/transforms/ky-ky_FONIPA.txt +71 -0
- package/transforms/la-la_FONIPA.json +8 -0
- package/transforms/la-la_FONIPA.txt +79 -0
- package/transforms/lt-Lower.json +8 -0
- package/transforms/lt-Lower.txt +20 -0
- package/transforms/lt-Title.json +8 -0
- package/transforms/lt-Title.txt +15 -0
- package/transforms/lt-Upper.json +8 -0
- package/transforms/lt-Upper.txt +8 -0
- package/transforms/mn-mn_Latn-MNS.json +8 -0
- package/transforms/mn-mn_Latn-MNS.txt +86 -0
- package/transforms/my-am.json +8 -0
- package/transforms/my-am.txt +4 -0
- package/transforms/my-ar.json +8 -0
- package/transforms/my-ar.txt +4 -0
- package/transforms/my-chr.json +8 -0
- package/transforms/my-chr.txt +4 -0
- package/transforms/my-fa.json +8 -0
- package/transforms/my-fa.txt +4 -0
- package/transforms/my-my_FONIPA.json +8 -0
- package/transforms/my-my_FONIPA.txt +325 -0
- package/transforms/my-t-my-d0-zawgyi.json +8 -0
- package/transforms/my-t-my-d0-zawgyi.txt +222 -0
- package/transforms/my-t-my-s0-zawgyi.json +8 -0
- package/transforms/my-t-my-s0-zawgyi.txt +231 -0
- package/transforms/nl-Title.json +8 -0
- package/transforms/nl-Title.txt +7 -0
- package/transforms/nv-nv_FONIPA.json +8 -0
- package/transforms/nv-nv_FONIPA.txt +74 -0
- package/transforms/pl-am.json +8 -0
- package/transforms/pl-am.txt +4 -0
- package/transforms/pl-ar.json +8 -0
- package/transforms/pl-ar.txt +4 -0
- package/transforms/pl-chr.json +8 -0
- package/transforms/pl-chr.txt +4 -0
- package/transforms/pl-fa.json +8 -0
- package/transforms/pl-fa.txt +4 -0
- package/transforms/pl-ja.json +8 -0
- package/transforms/pl-ja.txt +4 -0
- package/transforms/pl-pl_FONIPA.json +8 -0
- package/transforms/pl-pl_FONIPA.txt +113 -0
- package/transforms/pl_FONIPA-ja.json +8 -0
- package/transforms/pl_FONIPA-ja.txt +301 -0
- package/transforms/rm_SURSILV-am.json +8 -0
- package/transforms/rm_SURSILV-am.txt +4 -0
- package/transforms/rm_SURSILV-ar.json +8 -0
- package/transforms/rm_SURSILV-ar.txt +4 -0
- package/transforms/rm_SURSILV-chr.json +8 -0
- package/transforms/rm_SURSILV-chr.txt +4 -0
- package/transforms/rm_SURSILV-fa.json +8 -0
- package/transforms/rm_SURSILV-fa.txt +4 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.json +8 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.txt +96 -0
- package/transforms/ro-am.json +8 -0
- package/transforms/ro-am.txt +4 -0
- package/transforms/ro-ar.json +8 -0
- package/transforms/ro-ar.txt +4 -0
- package/transforms/ro-chr.json +8 -0
- package/transforms/ro-chr.txt +4 -0
- package/transforms/ro-fa.json +8 -0
- package/transforms/ro-fa.txt +4 -0
- package/transforms/ro-ja.json +8 -0
- package/transforms/ro-ja.txt +4 -0
- package/transforms/ro-ro_FONIPA.json +8 -0
- package/transforms/ro-ro_FONIPA.txt +121 -0
- package/transforms/ro_FONIPA-ja.json +8 -0
- package/transforms/ro_FONIPA-ja.txt +211 -0
- package/transforms/ru-ja.json +8 -0
- package/transforms/ru-ja.txt +444 -0
- package/transforms/ru-zh.json +8 -0
- package/transforms/ru-zh.txt +996 -0
- package/transforms/ru_Latn-ru-BGN.json +9 -0
- package/transforms/ru_Latn-ru-BGN.txt +97 -0
- package/transforms/sat-am.json +8 -0
- package/transforms/sat-am.txt +6 -0
- package/transforms/sat-ar.json +8 -0
- package/transforms/sat-ar.txt +6 -0
- package/transforms/sat-chr.json +8 -0
- package/transforms/sat-chr.txt +6 -0
- package/transforms/sat-fa.json +8 -0
- package/transforms/sat-fa.txt +6 -0
- package/transforms/sat_Olck-sat_FONIPA.json +8 -0
- package/transforms/sat_Olck-sat_FONIPA.txt +174 -0
- package/transforms/sgw-Ethi-t-und-ethi.json +11 -0
- package/transforms/sgw-Ethi-t-und-ethi.txt +138 -0
- package/transforms/si-am.json +8 -0
- package/transforms/si-am.txt +4 -0
- package/transforms/si-ar.json +8 -0
- package/transforms/si-ar.txt +4 -0
- package/transforms/si-chr.json +8 -0
- package/transforms/si-chr.txt +4 -0
- package/transforms/si-fa.json +8 -0
- package/transforms/si-fa.txt +4 -0
- package/transforms/si-si_FONIPA.json +8 -0
- package/transforms/si-si_FONIPA.txt +157 -0
- package/transforms/si-si_Latn.json +8 -0
- package/transforms/si-si_Latn.txt +94 -0
- package/transforms/sk-am.json +8 -0
- package/transforms/sk-am.txt +4 -0
- package/transforms/sk-ar.json +8 -0
- package/transforms/sk-ar.txt +4 -0
- package/transforms/sk-chr.json +8 -0
- package/transforms/sk-chr.txt +4 -0
- package/transforms/sk-fa.json +8 -0
- package/transforms/sk-fa.txt +4 -0
- package/transforms/sk-ja.json +8 -0
- package/transforms/sk-ja.txt +4 -0
- package/transforms/sk-sk_FONIPA.json +8 -0
- package/transforms/sk-sk_FONIPA.txt +101 -0
- package/transforms/sk_FONIPA-ja.json +8 -0
- package/transforms/sk_FONIPA-ja.txt +252 -0
- package/transforms/ta-ta_FONIPA.json +8 -0
- package/transforms/ta-ta_FONIPA.txt +73 -0
- package/transforms/tlh-am.json +8 -0
- package/transforms/tlh-am.txt +4 -0
- package/transforms/tlh-ar.json +8 -0
- package/transforms/tlh-ar.txt +4 -0
- package/transforms/tlh-chr.json +8 -0
- package/transforms/tlh-chr.txt +4 -0
- package/transforms/tlh-fa.json +8 -0
- package/transforms/tlh-fa.txt +4 -0
- package/transforms/tlh-tlh_FONIPA.json +8 -0
- package/transforms/tlh-tlh_FONIPA.txt +46 -0
- package/transforms/tr-Lower.json +8 -0
- package/transforms/tr-Lower.txt +13 -0
- package/transforms/tr-Title.json +8 -0
- package/transforms/tr-Title.txt +11 -0
- package/transforms/tr-Upper.json +8 -0
- package/transforms/tr-Upper.txt +8 -0
- package/transforms/ug-ug_FONIPA.json +8 -0
- package/transforms/ug-ug_FONIPA.txt +69 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.json +11 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.txt +747 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.txt +633 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.txt +757 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.txt +585 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.txt +640 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.txt +619 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.txt +627 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.txt +695 -0
- package/transforms/und-Ethi-t-und-latn.json +11 -0
- package/transforms/und-Ethi-t-und-latn.txt +16 -0
- package/transforms/und_FONIPA-ar.json +8 -0
- package/transforms/und_FONIPA-ar.txt +114 -0
- package/transforms/und_FONIPA-chr.json +8 -0
- package/transforms/und_FONIPA-chr.txt +172 -0
- package/transforms/und_FONIPA-fa.json +8 -0
- package/transforms/und_FONIPA-fa.txt +109 -0
- package/transforms/uz_Cyrl-uz_Latn.json +9 -0
- package/transforms/uz_Cyrl-uz_Latn.txt +103 -0
- package/transforms/vec-vec_FONIPA.json +8 -0
- package/transforms/vec-vec_FONIPA.txt +85 -0
- package/transforms/xh-am.json +8 -0
- package/transforms/xh-am.txt +4 -0
- package/transforms/xh-ar.json +8 -0
- package/transforms/xh-ar.txt +4 -0
- package/transforms/xh-chr.json +8 -0
- package/transforms/xh-chr.txt +4 -0
- package/transforms/xh-fa.json +8 -0
- package/transforms/xh-fa.txt +4 -0
- package/transforms/xh-xh_FONIPA.json +8 -0
- package/transforms/xh-xh_FONIPA.txt +85 -0
- package/transforms/yo-yo_BJ.json +8 -0
- package/transforms/yo-yo_BJ.txt +36 -0
- package/transforms/zh_Latn_PINYIN-ru.json +8 -0
- package/transforms/zh_Latn_PINYIN-ru.txt +148 -0
- package/transforms/zu-am.json +8 -0
- package/transforms/zu-am.txt +4 -0
- package/transforms/zu-ar.json +8 -0
- package/transforms/zu-ar.txt +4 -0
- package/transforms/zu-chr.json +8 -0
- package/transforms/zu-chr.txt +4 -0
- package/transforms/zu-fa.json +8 -0
- package/transforms/zu-fa.txt +4 -0
- package/transforms/zu-zu_FONIPA.json +8 -0
- package/transforms/zu-zu_FONIPA.txt +72 -0
- package/transforms.json +385 -0
|
@@ -0,0 +1,88 @@
|
|
|
1
|
+
|
|
2
|
+
# Transliteration of Phonemic Czech (cs_FONIPA) to Korean (ko).
|
|
3
|
+
#
|
|
4
|
+
# First pass: Phonemic Czech (cs_FONIPA) to Latinized Korean (ko_Latn).
|
|
5
|
+
$vowel = [aeɛiɪoux];
|
|
6
|
+
$start = [\u0020$];
|
|
7
|
+
$end = [\u0020$];
|
|
8
|
+
b } $end → peu ;
|
|
9
|
+
b } $vowel → b ;
|
|
10
|
+
bj } $vowel → b ; # objɛc → obeti
|
|
11
|
+
b → beu ;
|
|
12
|
+
c } $end → ti ;
|
|
13
|
+
c → t ;
|
|
14
|
+
d͡z → deuj ;
|
|
15
|
+
d } $end → teu ;
|
|
16
|
+
d } $vowel → d ;
|
|
17
|
+
d → deu ;
|
|
18
|
+
ɛ → e ;
|
|
19
|
+
f } $vowel → p ;
|
|
20
|
+
f → peu ;
|
|
21
|
+
ɡ } $vowel → g ;
|
|
22
|
+
ɡ → geu ;
|
|
23
|
+
ɦ } $vowel → h ;
|
|
24
|
+
ɦ → heu ;
|
|
25
|
+
h } $vowel → h ;
|
|
26
|
+
h → heu ;
|
|
27
|
+
i → i ;
|
|
28
|
+
ɪ → i ;
|
|
29
|
+
j } $end → i ; # pokoj → pokoi
|
|
30
|
+
j → y ;
|
|
31
|
+
kvu → keub ; # kvuasɪ → keubasi
|
|
32
|
+
ks } $end → gseu ; # ksɛroks → jelogseu
|
|
33
|
+
$start { ks → j ; # ksɛroks → jelogseu
|
|
34
|
+
ks → gs ; # saksofoːn → sagsopon
|
|
35
|
+
k } $vowel → k ;
|
|
36
|
+
k → keu ;
|
|
37
|
+
$vowel { l } $vowel → ll ;
|
|
38
|
+
lz → lj ;
|
|
39
|
+
m } $end → m ;
|
|
40
|
+
m } $vowel → m ;
|
|
41
|
+
m } [l] → m ;
|
|
42
|
+
m → meu ;
|
|
43
|
+
ɲ → n ;
|
|
44
|
+
ŋ → n ;
|
|
45
|
+
p } $vowel → p ;
|
|
46
|
+
p } t → b ; # koroptɛv
|
|
47
|
+
p → peu ;
|
|
48
|
+
r̝ } $end → leusi ; # kour̝ → kouleusi
|
|
49
|
+
r̝ } $vowel → leuj ;
|
|
50
|
+
r̝ } k → leusyu ; # ɦor̝kiː → holeusyuki
|
|
51
|
+
r̝ → leuju ;
|
|
52
|
+
r } $vowel → l ;
|
|
53
|
+
r → leu ;
|
|
54
|
+
s } $vowel → s ;
|
|
55
|
+
s → seu ;
|
|
56
|
+
ʃ } $end → si ;
|
|
57
|
+
ʃ } $vowel → sy ;
|
|
58
|
+
ʃ → syu ;
|
|
59
|
+
t͡s} $vowel → ch ;
|
|
60
|
+
t͡s → cheu ;
|
|
61
|
+
t͡ʃ} $vowel → ch ;
|
|
62
|
+
t͡ʃ → chi ;
|
|
63
|
+
t } $vowel → t ;
|
|
64
|
+
t → teu ;
|
|
65
|
+
vj → b ; # ʒvjɛr̝ɪna → jubeleujina
|
|
66
|
+
v } $end → peu ;
|
|
67
|
+
v } $vowel → b ;
|
|
68
|
+
v → beu ;
|
|
69
|
+
x } $vowel → h ;
|
|
70
|
+
x → heu ;
|
|
71
|
+
ɣ } $vowel → h ;
|
|
72
|
+
ɣ → heu ;
|
|
73
|
+
z } $vowel → j ; # zaːmɛk → jamekeu
|
|
74
|
+
z } $end → seu ; # ɦmɪz → heumiseu
|
|
75
|
+
z → jeu ; # pozdniː → pojeudeuni
|
|
76
|
+
ʒ } $vowel → j ; # ʒɪʒka → jisyuka (first ʒ)
|
|
77
|
+
ʒ } v → ju ; # ʒvjɛr̝ɪna → jubeleujina
|
|
78
|
+
ʒ } $end → si ; # broʒ → beulosi
|
|
79
|
+
ʒ → syu ; # ʒɪʒka → jisyuka (second ʒ)
|
|
80
|
+
ɟ } $vowel → dy ;
|
|
81
|
+
ɟ → ti ;
|
|
82
|
+
ː → ;
|
|
83
|
+
\u0020 → ; # space
|
|
84
|
+
#
|
|
85
|
+
#
|
|
86
|
+
# Second pass.
|
|
87
|
+
:: Latin-Hangul ();
|
|
88
|
+
|
|
@@ -0,0 +1,189 @@
|
|
|
1
|
+
|
|
2
|
+
# Transformation from Welsh (cy) to its IPA transcription (cy_FONIPA).
|
|
3
|
+
# Based on description of Northern Welsh in:
|
|
4
|
+
#
|
|
5
|
+
# http://en.wikipedia.org/wiki/Welsh_orthography
|
|
6
|
+
# http://en.wikipedia.org/wiki/Welsh_phonology
|
|
7
|
+
#
|
|
8
|
+
# Note that these rules are NOT complete: to be complete we would have to know
|
|
9
|
+
# the morphological analysis of the word. For example, final ‹au› is pronounced
|
|
10
|
+
# /a/ if it is the noun plural marker, otherwise it is /aɨ/. Similarly in
|
|
11
|
+
# “llongyfarch” (‘congratulating’), the morphological decomposition — “llon +
|
|
12
|
+
# cyfarch” — is needed to know that the ‹ng› is pronounced as /ŋg/, not as
|
|
13
|
+
# /ŋ/.
|
|
14
|
+
#
|
|
15
|
+
# Author: Richard Sproat
|
|
16
|
+
::Lower;
|
|
17
|
+
::NFC;
|
|
18
|
+
[’ [:P:]] → ;
|
|
19
|
+
# Class definitions
|
|
20
|
+
$end = [$ ];  # NOTE(review): unescaped whitespace inside a set is presumably ignored by the rule parser, so this likely matches only the text boundary and not a literal space; confirm whether an escaped space was intended
|
|
21
|
+
# Both orthographic and phonetic vowels
|
|
22
|
+
$vowel = [aeiouwyâêîôûŵŷɑɨəɛɪɔʊ];
|
|
23
|
+
# W is a placeholder for the glide -- see below
|
|
24
|
+
$cons = [
|
|
25
|
+
m {m̥} n {n̥} ŋ {ŋ̊}
|
|
26
|
+
p b t d k ɡ
|
|
27
|
+
f v θ ð s ʃ h χ
|
|
28
|
+
l ɬ r {r̥}
|
|
29
|
+
{d͡ʒ} g W w j
|
|
30
|
+
];
|
|
31
|
+
# Preprocessing of letters that sometimes occur
|
|
32
|
+
k → c;
|
|
33
|
+
v → f;
|
|
34
|
+
x → s;
|
|
35
|
+
z → s;
|
|
36
|
+
::Null;
|
|
37
|
+
# Consonant transductions:
|
|
38
|
+
# Trigraphs
|
|
39
|
+
ngh → ŋ̊;
|
|
40
|
+
# Digraphs
|
|
41
|
+
ch → χ;
|
|
42
|
+
dd → ð;
|
|
43
|
+
ff → f;
|
|
44
|
+
ll → ɬ;
|
|
45
|
+
mh → m̥;
|
|
46
|
+
nh → n̥;
|
|
47
|
+
ng → ŋ;
|
|
48
|
+
ph → f;
|
|
49
|
+
rh → r̥;
|
|
50
|
+
th → θ;
|
|
51
|
+
# Monographs
|
|
52
|
+
b → b;
|
|
53
|
+
c → k;
|
|
54
|
+
d → d;
|
|
55
|
+
f → v;
|
|
56
|
+
g → ɡ;
|
|
57
|
+
h → h;
|
|
58
|
+
j → d͡ʒ; # Loan words
|
|
59
|
+
l → l;
|
|
60
|
+
m → m;
|
|
61
|
+
n → n;
|
|
62
|
+
p → p;
|
|
63
|
+
r → r;
|
|
64
|
+
s → s;
|
|
65
|
+
t → t;
|
|
66
|
+
::Null;
|
|
67
|
+
# Transduce ‹si› to /ʃ/ before vowels
|
|
68
|
+
si} $vowel → ʃ;
|
|
69
|
+
::Null;
|
|
70
|
+
# Treatment of glides.
|
|
71
|
+
# First transduce ‹i›, ‹w› to glides prior to vowels. With ‹w› we want to
|
|
72
|
+
# do this also before /r,l/ after /ɡ/ (from Proto-Celtic *w) e.g. “gwlad”,
|
|
73
|
+
# “gwraig”. However the “after g” environment must allow for the following
|
|
74
|
+
# possibilities:
|
|
75
|
+
#
|
|
76
|
+
# ɡ → ŋ via nasal mutation
|
|
77
|
+
# ɡ → 0 via soft mutation
|
|
78
|
+
{i} $vowel → j;
|
|
79
|
+
{w} $vowel → W; # Temporary register
|
|
80
|
+
[ɡŋ] {w} [rl] $vowel → W; # Plain or nasal mutation environment
|
|
81
|
+
^ {w} [rl] $vowel → W; # Soft mutation at the beginning of a word
|
|
82
|
+
# Transduce accented ‹ẃ› to ‹w›: this is used to indicate when a ‹w› that would
|
|
83
|
+
# normally be expected to be a glide, is instead a vowel:
|
|
84
|
+
ẃ → w;
|
|
85
|
+
::Null;
|
|
86
|
+
# Stress placement, needed for vowel quality/quantity prediction
|
|
87
|
+
# Basic rule of stress in Welsh is to place it on the penult,
|
|
88
|
+
# except of course in monosyllables.
|
|
89
|
+
{($vowel+ $cons+ $vowel+ $cons*)} $end → ˈ $1; ## Polysyllabic words
|
|
90
|
+
$end $cons* {($vowel+ $cons*)} $end → ˈ $1; ## Monosyllabic words
|
|
91
|
+
::Null;
|
|
92
|
+
# Transduction of vowels
|
|
93
|
+
# The first rule above overgenerates streams of stress marks. The rule below
|
|
94
|
+
# cleans that up.
|
|
95
|
+
ˈ+ → ˈ;
|
|
96
|
+
# Diphthongs
|
|
97
|
+
# Deal with ‹y› first since we also need to lengthen the /ɨ/ if that is in the
|
|
98
|
+
# correct environment for lengthening.
|
|
99
|
+
# ‹y› is /ɨ/ in final syllable, otherwise /ə/
|
|
100
|
+
yw } $cons* $end → ɨu;
|
|
101
|
+
yw → əu;
|
|
102
|
+
y} $cons* $end → ɨ;
|
|
103
|
+
y → ə;
|
|
104
|
+
::Null;
|
|
105
|
+
# Diphthongs in long environment
|
|
106
|
+
# Final, or before word-final s
|
|
107
|
+
ˈ { ɨu } s? $end → ɨːu;
|
|
108
|
+
ˈ { aw } s? $end → ɑːu;
|
|
109
|
+
ˈ { ew } s? $end → eːu;
|
|
110
|
+
ˈ { oe } s? $end → ɔːɨ;
|
|
111
|
+
ˈ { ou } s? $end → ɔːɨ;
|
|
112
|
+
ˈ { wy } s? $end → uːɨ;
|
|
113
|
+
# before b, ch, d, dd, g, f, ff, th followed by the end of a word
|
|
114
|
+
# or a vowel
|
|
115
|
+
ˈ { ɨu } [bχdðɡvfθ] $end → ɨːu;
|
|
116
|
+
ˈ { aw } [bχdðɡvfθ] $end → ɑːu;
|
|
117
|
+
ˈ { ew } [bχdðɡvfθ] $end → eːu;
|
|
118
|
+
ˈ { oe } [bχdðɡvfθ] $end → ɔːɨ;
|
|
119
|
+
ˈ { ou } [bχdðɡvfθ] $end → ɔːɨ;
|
|
120
|
+
ˈ { wy } [bχdðɡvfθ] $end → uːɨ;
|
|
121
|
+
ˈ { ɨu } [bχdðɡvfθ] $vowel → ɨːu;
|
|
122
|
+
ˈ { aw } [bχdðɡvfθ] $vowel → ɑːu;
|
|
123
|
+
ˈ { ew } [bχdðɡvfθ] $vowel → eːu;
|
|
124
|
+
ˈ { oe } [bχdðɡvfθ] $vowel → ɔːɨ;
|
|
125
|
+
ˈ { ou } [bχdðɡvfθ] $vowel → ɔːɨ;
|
|
126
|
+
ˈ { wy } [bχdðɡvfθ] $vowel → uːɨ;
|
|
127
|
+
# Diphthongs in other environments
|
|
128
|
+
ae → ɑːɨ;
|
|
129
|
+
ai → ai;
|
|
130
|
+
au → aɨ; ## As plural ending /a/, but we can't predict this
|
|
131
|
+
aw → au;
|
|
132
|
+
ei → əi;
|
|
133
|
+
eu → əɨ;
|
|
134
|
+
ew → ɛu;
|
|
135
|
+
ey → əɨ;
|
|
136
|
+
iw → ɪu;
|
|
137
|
+
oe → ɔɨ;
|
|
138
|
+
oi → ɔi;
|
|
139
|
+
ou → ɔɨ;
|
|
140
|
+
uw → ɨu;
|
|
141
|
+
wy → ʊɨ;
|
|
142
|
+
# Long environments
|
|
143
|
+
# Final, or before word-final s
|
|
144
|
+
ˈ { ɨ } s? $end → ɨː;
|
|
145
|
+
ˈ { a } s? $end → ɑː;
|
|
146
|
+
ˈ { e } s? $end → eː;
|
|
147
|
+
ˈ { i } s? $end → iː;
|
|
148
|
+
ˈ { o } s? $end → oː;
|
|
149
|
+
ˈ { u } s? $end → ɨː;
|
|
150
|
+
ˈ { w } s? $end → uː;
|
|
151
|
+
# before b, ch, d, dd, g, f, ff, th followed by the end of a word
|
|
152
|
+
# or a vowel
|
|
153
|
+
ˈ { ɨ } [bχdðɡvfθ] $end → ɨː;
|
|
154
|
+
ˈ { a } [bχdðɡvfθ] $end → ɑː;
|
|
155
|
+
ˈ { e } [bχdðɡvfθ] $end → eː;
|
|
156
|
+
ˈ { i } [bχdðɡvfθ] $end → iː;
|
|
157
|
+
ˈ { o } [bχdðɡvfθ] $end → oː;
|
|
158
|
+
ˈ { u } [bχdðɡvfθ] $end → ɨː;
|
|
159
|
+
ˈ { w } [bχdðɡvfθ] $end → uː;
|
|
160
|
+
ˈ { ɨ } [bχdðɡvfθ] $vowel → ɨː;
|
|
161
|
+
ˈ { a } [bχdðɡvfθ] $vowel → ɑː;
|
|
162
|
+
ˈ { e } [bχdðɡvfθ] $vowel → eː;
|
|
163
|
+
ˈ { i } [bχdðɡvfθ] $vowel → iː;
|
|
164
|
+
ˈ { o } [bχdðɡvfθ] $vowel → oː;
|
|
165
|
+
ˈ { u } [bχdðɡvfθ] $vowel → ɨː;
|
|
166
|
+
ˈ { w } [bχdðɡvfθ] $vowel → uː;
|
|
167
|
+
# Short environments
|
|
168
|
+
a → a;
|
|
169
|
+
e → ɛ;
|
|
170
|
+
i → ɪ;
|
|
171
|
+
o → ɔ;
|
|
172
|
+
u → ɨ̞;
|
|
173
|
+
w → ʊ;
|
|
174
|
+
::Null;
|
|
175
|
+
W → w;
|
|
176
|
+
# Finally, deal with vowels that are marked as long with a circumflex
|
|
177
|
+
# (“to bach”). Do this last because we don't want the other vowel
|
|
178
|
+
# changes messing this up.
|
|
179
|
+
â → ɑː;
|
|
180
|
+
ê → eː;
|
|
181
|
+
î → iː;
|
|
182
|
+
ô → oː;
|
|
183
|
+
û → ɨː;
|
|
184
|
+
ŵ → uː;
|
|
185
|
+
ŷ → ɨː;
|
|
186
|
+
::Null;
|
|
187
|
+
# Move IPA stress marker to start of syllable.
|
|
188
|
+
([$cons w] [l ɬ r {r̥}]? j? w?) ˈ → ˈ $1;
|
|
189
|
+
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
|
|
2
|
+
$AE = [Ä {A \u0308}];
|
|
3
|
+
$OE = [Ö {O \u0308}];
|
|
4
|
+
$UE = [Ü {U \u0308}];
|
|
5
|
+
[ä {a \u0308}] → ae;
|
|
6
|
+
[ö {o \u0308}] → oe;
|
|
7
|
+
[ü {u \u0308}] → ue;
|
|
8
|
+
{$AE} [:Lowercase:] → Ae;  # capital Ä directly before a lowercase letter becomes mixed-case "Ae"; other capital Ä falls through to the later all-caps rule
|
|
9
|
+
{$OE} [:Lowercase:] → Oe;
|
|
10
|
+
{$UE} [:Lowercase:] → Ue;
|
|
11
|
+
$AE → AE;
|
|
12
|
+
$OE → OE;
|
|
13
|
+
$UE → UE;
|
|
14
|
+
::Any-ASCII;
|
|
15
|
+
|
|
@@ -0,0 +1,67 @@
|
|
|
1
|
+
|
|
2
|
+
# Transforms Lower Sorbian (dsb) to its IPA transcription (dsb_FONIPA).
|
|
3
|
+
# http://en.wikipedia.org/wiki/Sorbian_alphabet
|
|
4
|
+
# Transform input to normalized form NFC, and to lowercase.
|
|
5
|
+
::NFC;
|
|
6
|
+
::Lower;
|
|
7
|
+
a → a ;
|
|
8
|
+
b́ → bʲ ; # old spelling
|
|
9
|
+
bj → bʲ ; # modern spelling
|
|
10
|
+
b → b ;
|
|
11
|
+
ch → x ;
|
|
12
|
+
č → t \u0361 ʃ ; # affricate indicated by ligature tie
|
|
13
|
+
ć → t \u0361 ɕ ; # affricate indicated by ligature tie
|
|
14
|
+
c → t \u0361 s ; # affricate indicated by ligature tie
|
|
15
|
+
dź → d \u0361 ʑ ; # affricate indicated by ligature tie
|
|
16
|
+
d → d ;
|
|
17
|
+
ě → iɪ̯;
|
|
18
|
+
e → ɛ ;
|
|
19
|
+
f → f ;
|
|
20
|
+
g → ɡ ;
|
|
21
|
+
h → h ;
|
|
22
|
+
i → i ;
|
|
23
|
+
j → j ;
|
|
24
|
+
k → k ;
|
|
25
|
+
ł → v ;
|
|
26
|
+
l → l ;
|
|
27
|
+
ḿ → mʲ ; # old spelling
|
|
28
|
+
mj → mʲ ; # modern spelling
|
|
29
|
+
m → m ;
|
|
30
|
+
ń → ɲ ;
|
|
31
|
+
n → n ;
|
|
32
|
+
ó → ɛ ;
|
|
33
|
+
o → ɔ ;
|
|
34
|
+
ṕ → pʲ ; # old spelling
|
|
35
|
+
pj → pʲ ; # modern spelling
|
|
36
|
+
p → p ;
|
|
37
|
+
ř → ʃ ;
|
|
38
|
+
ŕ → rʲ ;
|
|
39
|
+
r → r ;
|
|
40
|
+
š → ʃ ;
|
|
41
|
+
ś → ɕ ;
|
|
42
|
+
s → s ;
|
|
43
|
+
t → t ;
|
|
44
|
+
u → u ;
|
|
45
|
+
ẃ → wʲ ; # old spelling
|
|
46
|
+
wj → wʲ ; # modern spelling
|
|
47
|
+
w → w ;
|
|
48
|
+
y → ɨ ;
|
|
49
|
+
ž → ʒ ;
|
|
50
|
+
ź → ʑ ;
|
|
51
|
+
z → z ;
|
|
52
|
+
::NFC;
|
|
53
|
+
# Assimilation.
|
|
54
|
+
b } [k] → p ;
|
|
55
|
+
d } [k] → t ;
|
|
56
|
+
ʃt͡ɕ → ɕt͡ɕ ;
|
|
57
|
+
# Final de-voicing.
|
|
58
|
+
b } [$] → p ;
|
|
59
|
+
d \u0361 z } [$] → t \u0361 s ;
|
|
60
|
+
d } [$] → t ;
|
|
61
|
+
ɡ } [$] → k ;
|
|
62
|
+
v } [$] → f ;
|
|
63
|
+
w } [$] → f ;
|
|
64
|
+
ʑ } [$] → ɕ ;
|
|
65
|
+
z } [$] → s ;
|
|
66
|
+
ʒ } [$] → ʃ ;
|
|
67
|
+
|
|
@@ -0,0 +1,12 @@
|
|
|
1
|
+
|
|
2
|
+
# Special case for final form of sigma.
|
|
3
|
+
::NFD();
|
|
4
|
+
# C is preceded by a sequence consisting of a cased letter and then zero or more case-ignorable characters,
|
|
5
|
+
# and C is not followed by a sequence consisting of zero or more case-ignorable characters and then a cased letter.
|
|
6
|
+
# 03A3; 03C2; 03A3; 03A3; Final_Sigma; # GREEK CAPITAL LETTER SIGMA
|
|
7
|
+
# With translit rules, easiest is to handle the negative condition first, mapping in that case to the regular sigma.
|
|
8
|
+
Σ } [:case-ignorable:]* [:cased:] → σ;
|
|
9
|
+
[:cased:] [:case-ignorable:]* { Σ → ς;
|
|
10
|
+
::Any-Lower;
|
|
11
|
+
::NFC();
|
|
12
|
+
|
|
@@ -0,0 +1,12 @@
|
|
|
1
|
+
|
|
2
|
+
::NFD();
|
|
3
|
+
# Remove \0301 following Greek, with possible intervening 0308 marks.
|
|
4
|
+
# [[:Greek:] & [:Ll:]] [\u0308]? { \u0301 → ;
|
|
5
|
+
# Make any string of letters after a cased letter be lower, with rules for sigma
|
|
6
|
+
[:cased:] [:case-ignorable:]* { Σ } [:case-ignorable:]* [:cased:] → σ;
|
|
7
|
+
[:cased:] [:case-ignorable:]* { Σ → ς;
|
|
8
|
+
[:cased:] [:case-ignorable:]* { (.) → &Any-Lower($1) ;
|
|
9
|
+
# Otherwise all lowercase go to upper (titlecase stay as is)
|
|
10
|
+
([:Lowercase:]) → &Any-Title($1) ;
|
|
11
|
+
::NFC();
|
|
12
|
+
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
|
|
2
|
+
# Copyright (C) 2011-2013, Apple Inc. and others. All Rights Reserved.
|
|
3
|
+
# Remove \0301 following Greek, with possible intervening 0308 marks.
|
|
4
|
+
::NFD();
|
|
5
|
+
# For uppercasing (not titlecasing!) remove all greek accents from greek letters.
|
|
6
|
+
# This is done in two groups, to account for canonical ordering.
|
|
7
|
+
[:Greek:] [^[:ccc=Not_Reordered:][:ccc=Above:]]*? { [\u0313\u0314\u0301\u0300\u0306\u0342\u0308\u0304] → ;
|
|
8
|
+
[:Greek:] [^[:ccc=Not_Reordered:][:ccc=Iota_Subscript:]]*? { \u0345 → ;
|
|
9
|
+
::NFC();
|
|
10
|
+
::Any-Upper();
|
|
11
|
+
|
|
@@ -0,0 +1,47 @@
|
|
|
1
|
+
|
|
2
|
+
# https://en.wikipedia.org/wiki/Esperanto_phonology
|
|
3
|
+
::NFC;
|
|
4
|
+
::Lower;
|
|
5
|
+
[\-\'’] → ; # eg. vorto-provizo, famili’
|
|
6
|
+
aj → ai̯;
|
|
7
|
+
aŭ → au̯;
|
|
8
|
+
á → a;
|
|
9
|
+
a → a;
|
|
10
|
+
b → b;
|
|
11
|
+
ĉ → t͡ʃ;
|
|
12
|
+
c → t͡s;
|
|
13
|
+
dz → d͡z;
|
|
14
|
+
d → d;
|
|
15
|
+
ej → ei̯;
|
|
16
|
+
eŭ → eu̯;
|
|
17
|
+
é → e;
|
|
18
|
+
e → e;
|
|
19
|
+
f → f;
|
|
20
|
+
ĝ → d͡ʒ;
|
|
21
|
+
g → ɡ;
|
|
22
|
+
ĥ → x;
|
|
23
|
+
h → h;
|
|
24
|
+
í → i;
|
|
25
|
+
i → i;
|
|
26
|
+
ĵ → ʒ;
|
|
27
|
+
j → j;
|
|
28
|
+
k → k;
|
|
29
|
+
l → l;
|
|
30
|
+
m → m;
|
|
31
|
+
n → n;
|
|
32
|
+
oj → oi̯;
|
|
33
|
+
ó → o;
|
|
34
|
+
o → o;
|
|
35
|
+
p → p;
|
|
36
|
+
r → r;
|
|
37
|
+
ŝ → ʃ;
|
|
38
|
+
s → s;
|
|
39
|
+
t → t;
|
|
40
|
+
uj → ui̯;
|
|
41
|
+
ŭ → w; # eg. ŭa!
|
|
42
|
+
ú → u;
|
|
43
|
+
u → u;
|
|
44
|
+
v → v;
|
|
45
|
+
z → z;
|
|
46
|
+
::NFC;
|
|
47
|
+
|
|
@@ -0,0 +1,13 @@
|
|
|
1
|
+
|
|
2
|
+
$Boundary = [^[:L:][:M:][:N:]];
|
|
3
|
+
$Vowel = [i e o u a];
|
|
4
|
+
::es-es_FONIPA;
|
|
5
|
+
# In Arabic transcription of Spanish, unstressed [e] should be treated
|
|
6
|
+
# like [ə], which gets stripped off. However, we currently do not
|
|
7
|
+
# have a good way of finding stress in Spanish words. In the long term,
|
|
8
|
+
# it would be _much_ better to look at stress markers, but for now
|
|
9
|
+
# we use this trivial heuristic to find unstressed [e] in the first
|
|
10
|
+
# syllable.
|
|
11
|
+
$Boundary [^$Vowel] {e} [^$Vowel]* $Vowel → ə;  # first-syllable [e]: after a boundary and one non-vowel, followed by any non-vowels and then a vowel
|
|
12
|
+
::und_FONIPA-ar;
|
|
13
|
+
|