cldr-transforms 46.0.0-BETA2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +41 -0
- package/README.md +27 -0
- package/bower.json +13 -0
- package/package.json +29 -0
- package/transforms/Amharic-Latin-BGN.json +9 -0
- package/transforms/Amharic-Latin-BGN.txt +441 -0
- package/transforms/Any-Accents.json +9 -0
- package/transforms/Any-Accents.txt +270 -0
- package/transforms/Any-Publishing.json +9 -0
- package/transforms/Any-Publishing.txt +63 -0
- package/transforms/Arabic-Latin-BGN.json +9 -0
- package/transforms/Arabic-Latin-BGN.txt +205 -0
- package/transforms/Arabic-Latin.json +11 -0
- package/transforms/Arabic-Latin.txt +181 -0
- package/transforms/Armenian-Latin-BGN.json +9 -0
- package/transforms/Armenian-Latin-BGN.txt +165 -0
- package/transforms/Azerbaijani-Latin-BGN.json +9 -0
- package/transforms/Azerbaijani-Latin-BGN.txt +183 -0
- package/transforms/Belarusian-Latin-BGN.json +9 -0
- package/transforms/Belarusian-Latin-BGN.txt +194 -0
- package/transforms/Bengali-Arabic.json +9 -0
- package/transforms/Bengali-Arabic.txt +7 -0
- package/transforms/Bengali-Devanagari.json +9 -0
- package/transforms/Bengali-Devanagari.txt +7 -0
- package/transforms/Bengali-Gujarati.json +9 -0
- package/transforms/Bengali-Gujarati.txt +7 -0
- package/transforms/Bengali-Gurmukhi.json +9 -0
- package/transforms/Bengali-Gurmukhi.txt +7 -0
- package/transforms/Bengali-InterIndic.json +7 -0
- package/transforms/Bengali-InterIndic.txt +99 -0
- package/transforms/Bengali-Kannada.json +9 -0
- package/transforms/Bengali-Kannada.txt +7 -0
- package/transforms/Bengali-Latin.json +9 -0
- package/transforms/Bengali-Latin.txt +7 -0
- package/transforms/Bengali-Malayalam.json +9 -0
- package/transforms/Bengali-Malayalam.txt +7 -0
- package/transforms/Bengali-Oriya.json +9 -0
- package/transforms/Bengali-Oriya.txt +7 -0
- package/transforms/Bengali-Tamil.json +9 -0
- package/transforms/Bengali-Tamil.txt +7 -0
- package/transforms/Bengali-Telugu.json +9 -0
- package/transforms/Bengali-Telugu.txt +7 -0
- package/transforms/Bengali-ur.json +8 -0
- package/transforms/Bengali-ur.txt +7 -0
- package/transforms/Bulgarian-Latin-BGN.json +9 -0
- package/transforms/Bulgarian-Latin-BGN.txt +237 -0
- package/transforms/CanadianAboriginal-Latin.json +11 -0
- package/transforms/CanadianAboriginal-Latin.txt +184 -0
- package/transforms/Cyrillic-Latin.json +11 -0
- package/transforms/Cyrillic-Latin.txt +280 -0
- package/transforms/Devanagari-Arabic.json +9 -0
- package/transforms/Devanagari-Arabic.txt +7 -0
- package/transforms/Devanagari-Bengali.json +9 -0
- package/transforms/Devanagari-Bengali.txt +7 -0
- package/transforms/Devanagari-Gujarati.json +9 -0
- package/transforms/Devanagari-Gujarati.txt +7 -0
- package/transforms/Devanagari-Gurmukhi.json +9 -0
- package/transforms/Devanagari-Gurmukhi.txt +7 -0
- package/transforms/Devanagari-InterIndic.json +7 -0
- package/transforms/Devanagari-InterIndic.txt +113 -0
- package/transforms/Devanagari-Kannada.json +9 -0
- package/transforms/Devanagari-Kannada.txt +7 -0
- package/transforms/Devanagari-Latin.json +9 -0
- package/transforms/Devanagari-Latin.txt +7 -0
- package/transforms/Devanagari-Malayalam.json +9 -0
- package/transforms/Devanagari-Malayalam.txt +7 -0
- package/transforms/Devanagari-Oriya.json +9 -0
- package/transforms/Devanagari-Oriya.txt +7 -0
- package/transforms/Devanagari-Tamil.json +9 -0
- package/transforms/Devanagari-Tamil.txt +7 -0
- package/transforms/Devanagari-Telugu.json +9 -0
- package/transforms/Devanagari-Telugu.txt +7 -0
- package/transforms/Devanagari-ur.json +8 -0
- package/transforms/Devanagari-ur.txt +7 -0
- package/transforms/Fullwidth-Halfwidth.json +9 -0
- package/transforms/Fullwidth-Halfwidth.txt +261 -0
- package/transforms/Georgian-Latin-BGN.json +9 -0
- package/transforms/Georgian-Latin-BGN.txt +43 -0
- package/transforms/Georgian-Latin-BGN_1981.json +8 -0
- package/transforms/Georgian-Latin-BGN_1981.txt +54 -0
- package/transforms/Georgian-Latin.json +11 -0
- package/transforms/Georgian-Latin.txt +53 -0
- package/transforms/Greek-Latin-BGN.json +9 -0
- package/transforms/Greek-Latin-BGN.txt +419 -0
- package/transforms/Greek-Latin.json +11 -0
- package/transforms/Greek-Latin.txt +251 -0
- package/transforms/Greek_Latin_UNGEGN.json +11 -0
- package/transforms/Greek_Latin_UNGEGN.txt +179 -0
- package/transforms/Gujarati-Arabic.json +9 -0
- package/transforms/Gujarati-Arabic.txt +7 -0
- package/transforms/Gujarati-Bengali.json +9 -0
- package/transforms/Gujarati-Bengali.txt +7 -0
- package/transforms/Gujarati-Devanagari.json +9 -0
- package/transforms/Gujarati-Devanagari.txt +7 -0
- package/transforms/Gujarati-Gurmukhi.json +9 -0
- package/transforms/Gujarati-Gurmukhi.txt +7 -0
- package/transforms/Gujarati-InterIndic.json +7 -0
- package/transforms/Gujarati-InterIndic.txt +89 -0
- package/transforms/Gujarati-Kannada.json +9 -0
- package/transforms/Gujarati-Kannada.txt +7 -0
- package/transforms/Gujarati-Latin.json +9 -0
- package/transforms/Gujarati-Latin.txt +7 -0
- package/transforms/Gujarati-Malayalam.json +9 -0
- package/transforms/Gujarati-Malayalam.txt +7 -0
- package/transforms/Gujarati-Oriya.json +9 -0
- package/transforms/Gujarati-Oriya.txt +7 -0
- package/transforms/Gujarati-Tamil.json +9 -0
- package/transforms/Gujarati-Tamil.txt +7 -0
- package/transforms/Gujarati-Telugu.json +9 -0
- package/transforms/Gujarati-Telugu.txt +7 -0
- package/transforms/Gujarati-ur.json +8 -0
- package/transforms/Gujarati-ur.txt +7 -0
- package/transforms/Gurmukhi-Arabic.json +9 -0
- package/transforms/Gurmukhi-Arabic.txt +7 -0
- package/transforms/Gurmukhi-Bengali.json +9 -0
- package/transforms/Gurmukhi-Bengali.txt +7 -0
- package/transforms/Gurmukhi-Devanagari.json +9 -0
- package/transforms/Gurmukhi-Devanagari.txt +7 -0
- package/transforms/Gurmukhi-Gujarati.json +9 -0
- package/transforms/Gurmukhi-Gujarati.txt +7 -0
- package/transforms/Gurmukhi-InterIndic.json +7 -0
- package/transforms/Gurmukhi-InterIndic.txt +88 -0
- package/transforms/Gurmukhi-Kannada.json +9 -0
- package/transforms/Gurmukhi-Kannada.txt +7 -0
- package/transforms/Gurmukhi-Latin.json +9 -0
- package/transforms/Gurmukhi-Latin.txt +7 -0
- package/transforms/Gurmukhi-Malayalam.json +9 -0
- package/transforms/Gurmukhi-Malayalam.txt +7 -0
- package/transforms/Gurmukhi-Oriya.json +9 -0
- package/transforms/Gurmukhi-Oriya.txt +7 -0
- package/transforms/Gurmukhi-Tamil.json +9 -0
- package/transforms/Gurmukhi-Tamil.txt +7 -0
- package/transforms/Gurmukhi-Telugu.json +9 -0
- package/transforms/Gurmukhi-Telugu.txt +7 -0
- package/transforms/Gurmukhi-ur.json +8 -0
- package/transforms/Gurmukhi-ur.txt +7 -0
- package/transforms/Han-Latin-Names.json +8 -0
- package/transforms/Han-Latin-Names.txt +65 -0
- package/transforms/Han-Latin.json +9 -0
- package/transforms/Han-Latin.txt +1501 -0
- package/transforms/Han-Spacedhan.json +7 -0
- package/transforms/Han-Spacedhan.txt +35 -0
- package/transforms/Hangul-Latin.json +9 -0
- package/transforms/Hangul-Latin.txt +6 -0
- package/transforms/Hebrew-Latin-BGN.json +9 -0
- package/transforms/Hebrew-Latin-BGN.txt +113 -0
- package/transforms/Hebrew-Latin.json +11 -0
- package/transforms/Hebrew-Latin.txt +91 -0
- package/transforms/Hiragana-Katakana.json +11 -0
- package/transforms/Hiragana-Katakana.txt +179 -0
- package/transforms/Hiragana-Latin.json +11 -0
- package/transforms/Hiragana-Latin.txt +9 -0
- package/transforms/IPA-XSampa.json +11 -0
- package/transforms/IPA-XSampa.txt +228 -0
- package/transforms/InterIndic-Arabic.json +7 -0
- package/transforms/InterIndic-Arabic.txt +128 -0
- package/transforms/InterIndic-Bengali.json +7 -0
- package/transforms/InterIndic-Bengali.txt +135 -0
- package/transforms/InterIndic-Devanagari.json +7 -0
- package/transforms/InterIndic-Devanagari.txt +151 -0
- package/transforms/InterIndic-Gujarati.json +7 -0
- package/transforms/InterIndic-Gujarati.txt +136 -0
- package/transforms/InterIndic-Gurmukhi.json +7 -0
- package/transforms/InterIndic-Gurmukhi.txt +142 -0
- package/transforms/InterIndic-Kannada.json +7 -0
- package/transforms/InterIndic-Kannada.txt +137 -0
- package/transforms/InterIndic-Latin.json +7 -0
- package/transforms/InterIndic-Latin.txt +492 -0
- package/transforms/InterIndic-Malayalam.json +7 -0
- package/transforms/InterIndic-Malayalam.txt +137 -0
- package/transforms/InterIndic-Oriya.json +7 -0
- package/transforms/InterIndic-Oriya.txt +135 -0
- package/transforms/InterIndic-Tamil.json +7 -0
- package/transforms/InterIndic-Tamil.txt +136 -0
- package/transforms/InterIndic-Telugu.json +7 -0
- package/transforms/InterIndic-Telugu.txt +136 -0
- package/transforms/InterIndic-ur.json +7 -0
- package/transforms/InterIndic-ur.txt +119 -0
- package/transforms/Jamo-Latin.json +9 -0
- package/transforms/Jamo-Latin.txt +6 -0
- package/transforms/Kannada-Arabic.json +9 -0
- package/transforms/Kannada-Arabic.txt +7 -0
- package/transforms/Kannada-Bengali.json +9 -0
- package/transforms/Kannada-Bengali.txt +7 -0
- package/transforms/Kannada-Devanagari.json +9 -0
- package/transforms/Kannada-Devanagari.txt +7 -0
- package/transforms/Kannada-Gujarati.json +9 -0
- package/transforms/Kannada-Gujarati.txt +7 -0
- package/transforms/Kannada-Gurmukhi.json +9 -0
- package/transforms/Kannada-Gurmukhi.txt +7 -0
- package/transforms/Kannada-InterIndic.json +7 -0
- package/transforms/Kannada-InterIndic.txt +87 -0
- package/transforms/Kannada-Latin.json +9 -0
- package/transforms/Kannada-Latin.txt +7 -0
- package/transforms/Kannada-Malayalam.json +9 -0
- package/transforms/Kannada-Malayalam.txt +7 -0
- package/transforms/Kannada-Oriya.json +9 -0
- package/transforms/Kannada-Oriya.txt +7 -0
- package/transforms/Kannada-Tamil.json +9 -0
- package/transforms/Kannada-Tamil.txt +7 -0
- package/transforms/Kannada-Telugu.json +9 -0
- package/transforms/Kannada-Telugu.txt +7 -0
- package/transforms/Kannada-ur.json +8 -0
- package/transforms/Kannada-ur.txt +7 -0
- package/transforms/Katakana-Latin-BGN.json +9 -0
- package/transforms/Katakana-Latin-BGN.txt +335 -0
- package/transforms/Kazakh-Latin-BGN.json +9 -0
- package/transforms/Kazakh-Latin-BGN.txt +332 -0
- package/transforms/Kirghiz-Latin-BGN.json +9 -0
- package/transforms/Kirghiz-Latin-BGN.txt +211 -0
- package/transforms/Korean-Latin-BGN.json +9 -0
- package/transforms/Korean-Latin-BGN.txt +345 -0
- package/transforms/Latin-ASCII.json +9 -0
- package/transforms/Latin-ASCII.txt +909 -0
- package/transforms/Latin-Armenian.json +11 -0
- package/transforms/Latin-Armenian.txt +88 -0
- package/transforms/Latin-Bengali.json +9 -0
- package/transforms/Latin-Bengali.txt +8 -0
- package/transforms/Latin-Bopomofo.json +11 -0
- package/transforms/Latin-Bopomofo.txt +1445 -0
- package/transforms/Latin-ConjoiningJamo.json +7 -0
- package/transforms/Latin-ConjoiningJamo.txt +477 -0
- package/transforms/Latin-Devanagari.json +9 -0
- package/transforms/Latin-Devanagari.txt +8 -0
- package/transforms/Latin-Ethiopic.json +11 -0
- package/transforms/Latin-Ethiopic.txt +277 -0
- package/transforms/Latin-Gujarati.json +9 -0
- package/transforms/Latin-Gujarati.txt +8 -0
- package/transforms/Latin-Gurmukhi.json +9 -0
- package/transforms/Latin-Gurmukhi.txt +8 -0
- package/transforms/Latin-Hangul.json +9 -0
- package/transforms/Latin-Hangul.txt +7 -0
- package/transforms/Latin-InterIndic.json +7 -0
- package/transforms/Latin-InterIndic.txt +377 -0
- package/transforms/Latin-Jamo.json +9 -0
- package/transforms/Latin-Jamo.txt +7 -0
- package/transforms/Latin-Kannada.json +9 -0
- package/transforms/Latin-Kannada.txt +8 -0
- package/transforms/Latin-Katakana.json +11 -0
- package/transforms/Latin-Katakana.txt +382 -0
- package/transforms/Latin-Malayalam.json +9 -0
- package/transforms/Latin-Malayalam.txt +8 -0
- package/transforms/Latin-NumericPinyin.json +9 -0
- package/transforms/Latin-NumericPinyin.txt +29 -0
- package/transforms/Latin-Oriya.json +9 -0
- package/transforms/Latin-Oriya.txt +8 -0
- package/transforms/Latin-Tamil.json +9 -0
- package/transforms/Latin-Tamil.txt +8 -0
- package/transforms/Latin-Telugu.json +9 -0
- package/transforms/Latin-Telugu.txt +8 -0
- package/transforms/Latin-Thai.json +9 -0
- package/transforms/Latin-Thai.txt +7 -0
- package/transforms/Macedonian-Latin-BGN.json +9 -0
- package/transforms/Macedonian-Latin-BGN.txt +176 -0
- package/transforms/Malayalam-Arabic.json +9 -0
- package/transforms/Malayalam-Arabic.txt +7 -0
- package/transforms/Malayalam-Bengali.json +9 -0
- package/transforms/Malayalam-Bengali.txt +7 -0
- package/transforms/Malayalam-Devanagari.json +9 -0
- package/transforms/Malayalam-Devanagari.txt +7 -0
- package/transforms/Malayalam-Gujarati.json +9 -0
- package/transforms/Malayalam-Gujarati.txt +7 -0
- package/transforms/Malayalam-Gurmukhi.json +9 -0
- package/transforms/Malayalam-Gurmukhi.txt +7 -0
- package/transforms/Malayalam-InterIndic.json +7 -0
- package/transforms/Malayalam-InterIndic.txt +87 -0
- package/transforms/Malayalam-Kannada.json +9 -0
- package/transforms/Malayalam-Kannada.txt +7 -0
- package/transforms/Malayalam-Latin.json +9 -0
- package/transforms/Malayalam-Latin.txt +7 -0
- package/transforms/Malayalam-Oriya.json +9 -0
- package/transforms/Malayalam-Oriya.txt +7 -0
- package/transforms/Malayalam-Tamil.json +9 -0
- package/transforms/Malayalam-Tamil.txt +7 -0
- package/transforms/Malayalam-Telugu.json +9 -0
- package/transforms/Malayalam-Telugu.txt +7 -0
- package/transforms/Malayalam-ur.json +8 -0
- package/transforms/Malayalam-ur.txt +7 -0
- package/transforms/Maldivian-Latin-BGN.json +9 -0
- package/transforms/Maldivian-Latin-BGN.txt +171 -0
- package/transforms/Mongolian-Latin-BGN.json +9 -0
- package/transforms/Mongolian-Latin-BGN.txt +151 -0
- package/transforms/Myanmar-Latin.json +9 -0
- package/transforms/Myanmar-Latin.txt +367 -0
- package/transforms/Oriya-Arabic.json +9 -0
- package/transforms/Oriya-Arabic.txt +7 -0
- package/transforms/Oriya-Bengali.json +9 -0
- package/transforms/Oriya-Bengali.txt +7 -0
- package/transforms/Oriya-Devanagari.json +9 -0
- package/transforms/Oriya-Devanagari.txt +7 -0
- package/transforms/Oriya-Gujarati.json +9 -0
- package/transforms/Oriya-Gujarati.txt +7 -0
- package/transforms/Oriya-Gurmukhi.json +9 -0
- package/transforms/Oriya-Gurmukhi.txt +7 -0
- package/transforms/Oriya-InterIndic.json +7 -0
- package/transforms/Oriya-InterIndic.txt +91 -0
- package/transforms/Oriya-Kannada.json +9 -0
- package/transforms/Oriya-Kannada.txt +7 -0
- package/transforms/Oriya-Latin.json +9 -0
- package/transforms/Oriya-Latin.txt +7 -0
- package/transforms/Oriya-Malayalam.json +9 -0
- package/transforms/Oriya-Malayalam.txt +7 -0
- package/transforms/Oriya-Tamil.json +9 -0
- package/transforms/Oriya-Tamil.txt +7 -0
- package/transforms/Oriya-Telugu.json +9 -0
- package/transforms/Oriya-Telugu.txt +7 -0
- package/transforms/Oriya-ur.json +8 -0
- package/transforms/Oriya-ur.txt +7 -0
- package/transforms/Pashto-Latin-BGN.json +9 -0
- package/transforms/Pashto-Latin-BGN.txt +231 -0
- package/transforms/Persian-Latin-BGN.json +9 -0
- package/transforms/Persian-Latin-BGN.txt +203 -0
- package/transforms/Pinyin-NumericPinyin.json +7 -0
- package/transforms/Pinyin-NumericPinyin.txt +8 -0
- package/transforms/Russian-Latin-BGN.json +9 -0
- package/transforms/Russian-Latin-BGN.txt +235 -0
- package/transforms/Serbian-Latin-BGN.json +9 -0
- package/transforms/Serbian-Latin-BGN.txt +119 -0
- package/transforms/Simplified-Traditional.json +11 -0
- package/transforms/Simplified-Traditional.txt +4393 -0
- package/transforms/Syriac-Latin.json +11 -0
- package/transforms/Syriac-Latin.txt +52 -0
- package/transforms/Tamil-Arabic.json +9 -0
- package/transforms/Tamil-Arabic.txt +7 -0
- package/transforms/Tamil-Bengali.json +9 -0
- package/transforms/Tamil-Bengali.txt +7 -0
- package/transforms/Tamil-Devanagari.json +9 -0
- package/transforms/Tamil-Devanagari.txt +7 -0
- package/transforms/Tamil-Gujarati.json +9 -0
- package/transforms/Tamil-Gujarati.txt +7 -0
- package/transforms/Tamil-Gurmukhi.json +9 -0
- package/transforms/Tamil-Gurmukhi.txt +7 -0
- package/transforms/Tamil-InterIndic.json +7 -0
- package/transforms/Tamil-InterIndic.txt +70 -0
- package/transforms/Tamil-Kannada.json +9 -0
- package/transforms/Tamil-Kannada.txt +7 -0
- package/transforms/Tamil-Latin.json +9 -0
- package/transforms/Tamil-Latin.txt +7 -0
- package/transforms/Tamil-Malayalam.json +9 -0
- package/transforms/Tamil-Malayalam.txt +7 -0
- package/transforms/Tamil-Oriya.json +9 -0
- package/transforms/Tamil-Oriya.txt +7 -0
- package/transforms/Tamil-Telugu.json +9 -0
- package/transforms/Tamil-Telugu.txt +7 -0
- package/transforms/Tamil-ur.json +8 -0
- package/transforms/Tamil-ur.txt +7 -0
- package/transforms/Telugu-Arabic.json +9 -0
- package/transforms/Telugu-Arabic.txt +7 -0
- package/transforms/Telugu-Bengali.json +9 -0
- package/transforms/Telugu-Bengali.txt +7 -0
- package/transforms/Telugu-Devanagari.json +9 -0
- package/transforms/Telugu-Devanagari.txt +7 -0
- package/transforms/Telugu-Gujarati.json +9 -0
- package/transforms/Telugu-Gujarati.txt +7 -0
- package/transforms/Telugu-Gurmukhi.json +9 -0
- package/transforms/Telugu-Gurmukhi.txt +7 -0
- package/transforms/Telugu-InterIndic.json +7 -0
- package/transforms/Telugu-InterIndic.txt +87 -0
- package/transforms/Telugu-Kannada.json +9 -0
- package/transforms/Telugu-Kannada.txt +7 -0
- package/transforms/Telugu-Latin.json +9 -0
- package/transforms/Telugu-Latin.txt +7 -0
- package/transforms/Telugu-Malayalam.json +9 -0
- package/transforms/Telugu-Malayalam.txt +7 -0
- package/transforms/Telugu-Oriya.json +9 -0
- package/transforms/Telugu-Oriya.txt +7 -0
- package/transforms/Telugu-Tamil.json +9 -0
- package/transforms/Telugu-Tamil.txt +7 -0
- package/transforms/Telugu-ur.json +8 -0
- package/transforms/Telugu-ur.txt +7 -0
- package/transforms/Thaana-Latin.json +11 -0
- package/transforms/Thaana-Latin.txt +433 -0
- package/transforms/Thai-Latin.json +9 -0
- package/transforms/Thai-Latin.txt +9 -0
- package/transforms/Thai-ThaiLogical.json +7 -0
- package/transforms/Thai-ThaiLogical.txt +16 -0
- package/transforms/Thai-ThaiSemi.json +7 -0
- package/transforms/Thai-ThaiSemi.txt +6 -0
- package/transforms/ThaiLogical-Latin.json +7 -0
- package/transforms/ThaiLogical-Latin.txt +147 -0
- package/transforms/Turkmen-Latin-BGN.json +9 -0
- package/transforms/Turkmen-Latin-BGN.txt +302 -0
- package/transforms/Ukrainian-Latin-BGN.json +9 -0
- package/transforms/Ukrainian-Latin-BGN.txt +283 -0
- package/transforms/Uzbek-Latin-BGN.json +9 -0
- package/transforms/Uzbek-Latin-BGN.txt +261 -0
- package/transforms/am-Ethi-t-am-brai.json +11 -0
- package/transforms/am-Ethi-t-am-brai.txt +652 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.json +9 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.txt +6925 -0
- package/transforms/am-Ethi-t-d0-morse.json +9 -0
- package/transforms/am-Ethi-t-d0-morse.txt +657 -0
- package/transforms/am-am_FONIPA.json +9 -0
- package/transforms/am-am_FONIPA.txt +694 -0
- package/transforms/am-ar.json +8 -0
- package/transforms/am-ar.txt +5 -0
- package/transforms/am-chr.json +8 -0
- package/transforms/am-chr.txt +4 -0
- package/transforms/am-fa.json +8 -0
- package/transforms/am-fa.txt +4 -0
- package/transforms/az-Lower.json +8 -0
- package/transforms/az-Lower.txt +13 -0
- package/transforms/az-Title.json +8 -0
- package/transforms/az-Title.txt +11 -0
- package/transforms/az-Upper.json +8 -0
- package/transforms/az-Upper.txt +5 -0
- package/transforms/blt-fonipa-t-blt.json +8 -0
- package/transforms/blt-fonipa-t-blt.txt +132 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.txt +537 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.txt +773 -0
- package/transforms/ch-am.json +8 -0
- package/transforms/ch-am.txt +4 -0
- package/transforms/ch-ar.json +8 -0
- package/transforms/ch-ar.txt +4 -0
- package/transforms/ch-ch_FONIPA.json +8 -0
- package/transforms/ch-ch_FONIPA.txt +79 -0
- package/transforms/ch-chr.json +8 -0
- package/transforms/ch-chr.txt +4 -0
- package/transforms/ch-fa.json +8 -0
- package/transforms/ch-fa.txt +4 -0
- package/transforms/chr-chr_FONIPA.json +8 -0
- package/transforms/chr-chr_FONIPA.txt +111 -0
- package/transforms/cs-am.json +8 -0
- package/transforms/cs-am.txt +4 -0
- package/transforms/cs-ar.json +8 -0
- package/transforms/cs-ar.txt +4 -0
- package/transforms/cs-chr.json +8 -0
- package/transforms/cs-chr.txt +4 -0
- package/transforms/cs-cs_FONIPA.json +8 -0
- package/transforms/cs-cs_FONIPA.txt +74 -0
- package/transforms/cs-fa.json +8 -0
- package/transforms/cs-fa.txt +4 -0
- package/transforms/cs-ja.json +8 -0
- package/transforms/cs-ja.txt +4 -0
- package/transforms/cs-ko.json +8 -0
- package/transforms/cs-ko.txt +4 -0
- package/transforms/cs_FONIPA-ja.json +8 -0
- package/transforms/cs_FONIPA-ja.txt +228 -0
- package/transforms/cs_FONIPA-ko.json +8 -0
- package/transforms/cs_FONIPA-ko.txt +88 -0
- package/transforms/cy-fonipa-t-cy.json +8 -0
- package/transforms/cy-fonipa-t-cy.txt +189 -0
- package/transforms/de-ASCII.json +8 -0
- package/transforms/de-ASCII.txt +15 -0
- package/transforms/dsb-dsb_FONIPA.json +8 -0
- package/transforms/dsb-dsb_FONIPA.txt +67 -0
- package/transforms/el-Lower.json +8 -0
- package/transforms/el-Lower.txt +12 -0
- package/transforms/el-Title.json +8 -0
- package/transforms/el-Title.txt +12 -0
- package/transforms/el-Upper.json +8 -0
- package/transforms/el-Upper.txt +11 -0
- package/transforms/eo-am.json +8 -0
- package/transforms/eo-am.txt +4 -0
- package/transforms/eo-ar.json +8 -0
- package/transforms/eo-ar.txt +4 -0
- package/transforms/eo-chr.json +8 -0
- package/transforms/eo-chr.txt +4 -0
- package/transforms/eo-eo_FONIPA.json +8 -0
- package/transforms/eo-eo_FONIPA.txt +47 -0
- package/transforms/eo-fa.json +8 -0
- package/transforms/eo-fa.txt +4 -0
- package/transforms/es-am.json +8 -0
- package/transforms/es-am.txt +4 -0
- package/transforms/es-ar.json +8 -0
- package/transforms/es-ar.txt +13 -0
- package/transforms/es-chr.json +8 -0
- package/transforms/es-chr.txt +4 -0
- package/transforms/es-es_FONIPA.json +8 -0
- package/transforms/es-es_FONIPA.txt +139 -0
- package/transforms/es-fa.json +8 -0
- package/transforms/es-fa.txt +13 -0
- package/transforms/es-ja.json +8 -0
- package/transforms/es-ja.txt +4 -0
- package/transforms/es-zh.json +8 -0
- package/transforms/es-zh.txt +4 -0
- package/transforms/es_419-am.json +8 -0
- package/transforms/es_419-am.txt +5 -0
- package/transforms/es_419-ar.json +8 -0
- package/transforms/es_419-ar.txt +14 -0
- package/transforms/es_419-chr.json +8 -0
- package/transforms/es_419-chr.txt +5 -0
- package/transforms/es_419-fa.json +8 -0
- package/transforms/es_419-fa.txt +14 -0
- package/transforms/es_419-ja.json +8 -0
- package/transforms/es_419-ja.txt +5 -0
- package/transforms/es_419-zh.json +8 -0
- package/transforms/es_419-zh.txt +5 -0
- package/transforms/es_FONIPA-am.json +8 -0
- package/transforms/es_FONIPA-am.txt +230 -0
- package/transforms/es_FONIPA-es_419_FONIPA.json +8 -0
- package/transforms/es_FONIPA-es_419_FONIPA.txt +6 -0
- package/transforms/es_FONIPA-ja.json +8 -0
- package/transforms/es_FONIPA-ja.txt +155 -0
- package/transforms/es_FONIPA-zh.json +8 -0
- package/transforms/es_FONIPA-zh.txt +522 -0
- package/transforms/fa-fa_FONIPA.json +8 -0
- package/transforms/fa-fa_FONIPA.txt +107 -0
- package/transforms/gz-Ethi-t-und-sarb.json +11 -0
- package/transforms/gz-Ethi-t-und-sarb.txt +180 -0
- package/transforms/ha-ha_NE.json +8 -0
- package/transforms/ha-ha_NE.txt +6 -0
- package/transforms/hy-am.json +8 -0
- package/transforms/hy-am.txt +4 -0
- package/transforms/hy-ar.json +8 -0
- package/transforms/hy-ar.txt +4 -0
- package/transforms/hy-chr.json +8 -0
- package/transforms/hy-chr.txt +4 -0
- package/transforms/hy-fa.json +8 -0
- package/transforms/hy-fa.txt +4 -0
- package/transforms/hy-hy_FONIPA.json +8 -0
- package/transforms/hy-hy_FONIPA.txt +52 -0
- package/transforms/hy_AREVMDA-am.json +8 -0
- package/transforms/hy_AREVMDA-am.txt +4 -0
- package/transforms/hy_AREVMDA-ar.json +8 -0
- package/transforms/hy_AREVMDA-ar.txt +4 -0
- package/transforms/hy_AREVMDA-chr.json +8 -0
- package/transforms/hy_AREVMDA-chr.txt +4 -0
- package/transforms/hy_AREVMDA-fa.json +8 -0
- package/transforms/hy_AREVMDA-fa.txt +4 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.json +8 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.txt +80 -0
- package/transforms/ia-am.json +8 -0
- package/transforms/ia-am.txt +4 -0
- package/transforms/ia-ar.json +8 -0
- package/transforms/ia-ar.txt +4 -0
- package/transforms/ia-chr.json +8 -0
- package/transforms/ia-chr.txt +4 -0
- package/transforms/ia-fa.json +8 -0
- package/transforms/ia-fa.txt +4 -0
- package/transforms/ia-ia_FONIPA.json +8 -0
- package/transforms/ia-ia_FONIPA.txt +71 -0
- package/transforms/it-am.json +8 -0
- package/transforms/it-am.txt +257 -0
- package/transforms/it-ja.json +8 -0
- package/transforms/it-ja.txt +259 -0
- package/transforms/ja_Latn-ko.json +8 -0
- package/transforms/ja_Latn-ko.txt +141 -0
- package/transforms/ja_Latn-ru.json +8 -0
- package/transforms/ja_Latn-ru.txt +123 -0
- package/transforms/kk-am.json +8 -0
- package/transforms/kk-am.txt +4 -0
- package/transforms/kk-ar.json +8 -0
- package/transforms/kk-ar.txt +4 -0
- package/transforms/kk-chr.json +8 -0
- package/transforms/kk-chr.txt +4 -0
- package/transforms/kk-fa.json +8 -0
- package/transforms/kk-fa.txt +4 -0
- package/transforms/kk-kk_FONIPA.json +8 -0
- package/transforms/kk-kk_FONIPA.txt +59 -0
- package/transforms/ky-am.json +8 -0
- package/transforms/ky-am.txt +4 -0
- package/transforms/ky-ar.json +8 -0
- package/transforms/ky-ar.txt +4 -0
- package/transforms/ky-chr.json +8 -0
- package/transforms/ky-chr.txt +4 -0
- package/transforms/ky-fa.json +8 -0
- package/transforms/ky-fa.txt +4 -0
- package/transforms/ky-ky_FONIPA.json +8 -0
- package/transforms/ky-ky_FONIPA.txt +71 -0
- package/transforms/la-la_FONIPA.json +8 -0
- package/transforms/la-la_FONIPA.txt +79 -0
- package/transforms/lt-Lower.json +8 -0
- package/transforms/lt-Lower.txt +20 -0
- package/transforms/lt-Title.json +8 -0
- package/transforms/lt-Title.txt +15 -0
- package/transforms/lt-Upper.json +8 -0
- package/transforms/lt-Upper.txt +8 -0
- package/transforms/mn-mn_Latn-MNS.json +8 -0
- package/transforms/mn-mn_Latn-MNS.txt +86 -0
- package/transforms/my-am.json +8 -0
- package/transforms/my-am.txt +4 -0
- package/transforms/my-ar.json +8 -0
- package/transforms/my-ar.txt +4 -0
- package/transforms/my-chr.json +8 -0
- package/transforms/my-chr.txt +4 -0
- package/transforms/my-fa.json +8 -0
- package/transforms/my-fa.txt +4 -0
- package/transforms/my-my_FONIPA.json +8 -0
- package/transforms/my-my_FONIPA.txt +325 -0
- package/transforms/my-t-my-d0-zawgyi.json +8 -0
- package/transforms/my-t-my-d0-zawgyi.txt +222 -0
- package/transforms/my-t-my-s0-zawgyi.json +8 -0
- package/transforms/my-t-my-s0-zawgyi.txt +231 -0
- package/transforms/nl-Title.json +8 -0
- package/transforms/nl-Title.txt +7 -0
- package/transforms/nv-nv_FONIPA.json +8 -0
- package/transforms/nv-nv_FONIPA.txt +74 -0
- package/transforms/pl-am.json +8 -0
- package/transforms/pl-am.txt +4 -0
- package/transforms/pl-ar.json +8 -0
- package/transforms/pl-ar.txt +4 -0
- package/transforms/pl-chr.json +8 -0
- package/transforms/pl-chr.txt +4 -0
- package/transforms/pl-fa.json +8 -0
- package/transforms/pl-fa.txt +4 -0
- package/transforms/pl-ja.json +8 -0
- package/transforms/pl-ja.txt +4 -0
- package/transforms/pl-pl_FONIPA.json +8 -0
- package/transforms/pl-pl_FONIPA.txt +113 -0
- package/transforms/pl_FONIPA-ja.json +8 -0
- package/transforms/pl_FONIPA-ja.txt +301 -0
- package/transforms/rm_SURSILV-am.json +8 -0
- package/transforms/rm_SURSILV-am.txt +4 -0
- package/transforms/rm_SURSILV-ar.json +8 -0
- package/transforms/rm_SURSILV-ar.txt +4 -0
- package/transforms/rm_SURSILV-chr.json +8 -0
- package/transforms/rm_SURSILV-chr.txt +4 -0
- package/transforms/rm_SURSILV-fa.json +8 -0
- package/transforms/rm_SURSILV-fa.txt +4 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.json +8 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.txt +96 -0
- package/transforms/ro-am.json +8 -0
- package/transforms/ro-am.txt +4 -0
- package/transforms/ro-ar.json +8 -0
- package/transforms/ro-ar.txt +4 -0
- package/transforms/ro-chr.json +8 -0
- package/transforms/ro-chr.txt +4 -0
- package/transforms/ro-fa.json +8 -0
- package/transforms/ro-fa.txt +4 -0
- package/transforms/ro-ja.json +8 -0
- package/transforms/ro-ja.txt +4 -0
- package/transforms/ro-ro_FONIPA.json +8 -0
- package/transforms/ro-ro_FONIPA.txt +121 -0
- package/transforms/ro_FONIPA-ja.json +8 -0
- package/transforms/ro_FONIPA-ja.txt +211 -0
- package/transforms/ru-ja.json +8 -0
- package/transforms/ru-ja.txt +444 -0
- package/transforms/ru-zh.json +8 -0
- package/transforms/ru-zh.txt +996 -0
- package/transforms/ru_Latn-ru-BGN.json +9 -0
- package/transforms/ru_Latn-ru-BGN.txt +97 -0
- package/transforms/sat-am.json +8 -0
- package/transforms/sat-am.txt +6 -0
- package/transforms/sat-ar.json +8 -0
- package/transforms/sat-ar.txt +6 -0
- package/transforms/sat-chr.json +8 -0
- package/transforms/sat-chr.txt +6 -0
- package/transforms/sat-fa.json +8 -0
- package/transforms/sat-fa.txt +6 -0
- package/transforms/sat_Olck-sat_FONIPA.json +8 -0
- package/transforms/sat_Olck-sat_FONIPA.txt +174 -0
- package/transforms/sgw-Ethi-t-und-ethi.json +11 -0
- package/transforms/sgw-Ethi-t-und-ethi.txt +138 -0
- package/transforms/si-am.json +8 -0
- package/transforms/si-am.txt +4 -0
- package/transforms/si-ar.json +8 -0
- package/transforms/si-ar.txt +4 -0
- package/transforms/si-chr.json +8 -0
- package/transforms/si-chr.txt +4 -0
- package/transforms/si-fa.json +8 -0
- package/transforms/si-fa.txt +4 -0
- package/transforms/si-si_FONIPA.json +8 -0
- package/transforms/si-si_FONIPA.txt +157 -0
- package/transforms/si-si_Latn.json +8 -0
- package/transforms/si-si_Latn.txt +94 -0
- package/transforms/sk-am.json +8 -0
- package/transforms/sk-am.txt +4 -0
- package/transforms/sk-ar.json +8 -0
- package/transforms/sk-ar.txt +4 -0
- package/transforms/sk-chr.json +8 -0
- package/transforms/sk-chr.txt +4 -0
- package/transforms/sk-fa.json +8 -0
- package/transforms/sk-fa.txt +4 -0
- package/transforms/sk-ja.json +8 -0
- package/transforms/sk-ja.txt +4 -0
- package/transforms/sk-sk_FONIPA.json +8 -0
- package/transforms/sk-sk_FONIPA.txt +101 -0
- package/transforms/sk_FONIPA-ja.json +8 -0
- package/transforms/sk_FONIPA-ja.txt +252 -0
- package/transforms/ta-ta_FONIPA.json +8 -0
- package/transforms/ta-ta_FONIPA.txt +73 -0
- package/transforms/tlh-am.json +8 -0
- package/transforms/tlh-am.txt +4 -0
- package/transforms/tlh-ar.json +8 -0
- package/transforms/tlh-ar.txt +4 -0
- package/transforms/tlh-chr.json +8 -0
- package/transforms/tlh-chr.txt +4 -0
- package/transforms/tlh-fa.json +8 -0
- package/transforms/tlh-fa.txt +4 -0
- package/transforms/tlh-tlh_FONIPA.json +8 -0
- package/transforms/tlh-tlh_FONIPA.txt +46 -0
- package/transforms/tr-Lower.json +8 -0
- package/transforms/tr-Lower.txt +13 -0
- package/transforms/tr-Title.json +8 -0
- package/transforms/tr-Title.txt +11 -0
- package/transforms/tr-Upper.json +8 -0
- package/transforms/tr-Upper.txt +8 -0
- package/transforms/ug-ug_FONIPA.json +8 -0
- package/transforms/ug-ug_FONIPA.txt +69 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.json +11 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.txt +747 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.txt +633 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.txt +757 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.txt +585 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.txt +640 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.txt +619 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.txt +627 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.txt +695 -0
- package/transforms/und-Ethi-t-und-latn.json +11 -0
- package/transforms/und-Ethi-t-und-latn.txt +16 -0
- package/transforms/und_FONIPA-ar.json +8 -0
- package/transforms/und_FONIPA-ar.txt +114 -0
- package/transforms/und_FONIPA-chr.json +8 -0
- package/transforms/und_FONIPA-chr.txt +172 -0
- package/transforms/und_FONIPA-fa.json +8 -0
- package/transforms/und_FONIPA-fa.txt +109 -0
- package/transforms/uz_Cyrl-uz_Latn.json +9 -0
- package/transforms/uz_Cyrl-uz_Latn.txt +103 -0
- package/transforms/vec-vec_FONIPA.json +8 -0
- package/transforms/vec-vec_FONIPA.txt +85 -0
- package/transforms/xh-am.json +8 -0
- package/transforms/xh-am.txt +4 -0
- package/transforms/xh-ar.json +8 -0
- package/transforms/xh-ar.txt +4 -0
- package/transforms/xh-chr.json +8 -0
- package/transforms/xh-chr.txt +4 -0
- package/transforms/xh-fa.json +8 -0
- package/transforms/xh-fa.txt +4 -0
- package/transforms/xh-xh_FONIPA.json +8 -0
- package/transforms/xh-xh_FONIPA.txt +85 -0
- package/transforms/yo-yo_BJ.json +8 -0
- package/transforms/yo-yo_BJ.txt +36 -0
- package/transforms/zh_Latn_PINYIN-ru.json +8 -0
- package/transforms/zh_Latn_PINYIN-ru.txt +148 -0
- package/transforms/zu-am.json +8 -0
- package/transforms/zu-am.txt +4 -0
- package/transforms/zu-ar.json +8 -0
- package/transforms/zu-ar.txt +4 -0
- package/transforms/zu-chr.json +8 -0
- package/transforms/zu-chr.txt +4 -0
- package/transforms/zu-fa.json +8 -0
- package/transforms/zu-fa.txt +4 -0
- package/transforms/zu-zu_FONIPA.json +8 -0
- package/transforms/zu-zu_FONIPA.txt +72 -0
- package/transforms.json +385 -0
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
{
|
|
2
|
+
"_backwardAlias": "Latin-Ethiopic",
|
|
3
|
+
"_visibility": "external",
|
|
4
|
+
"_backwardAliasBcp47": "und-Ethi-t-und-latn",
|
|
5
|
+
"_alias": "Ethiopic-Latin",
|
|
6
|
+
"_aliasBcp47": "und-Latn-t-und-ethi",
|
|
7
|
+
"_source": "Ethi",
|
|
8
|
+
"_direction": "both",
|
|
9
|
+
"_target": "Latn",
|
|
10
|
+
"_rulesFile": "und-Ethi-t-und-latn.txt"
|
|
11
|
+
}
|
|
@@ -0,0 +1,16 @@
|
|
|
1
|
+
|
|
2
|
+
########################################################################
|
|
3
|
+
#
|
|
4
|
+
# This transformation is introduced to serve as a fallback for a
|
|
5
|
+
# language and variant agnostic conversion between Ethiopic-Latin,
|
|
6
|
+
# and Latin-Ethiopic. In principle, it should act like an alias
|
|
7
|
+
# to the most widely used transliteration system in the present day,
|
|
8
|
+
# which in turn is believed to be the "Beta Maṣāḥǝft" system
|
|
9
|
+
# maintained by the Hiob Ludolf Centre for Ethiopian Studies.
|
|
10
|
+
#
|
|
11
|
+
########################################################################
|
|
12
|
+
#
|
|
13
|
+
:: Ethiopic-Latin/Beta_Metsehaf ;
|
|
14
|
+
#
|
|
15
|
+
########################################################################
|
|
16
|
+
|
|
@@ -0,0 +1,114 @@
|
|
|
1
|
+
|
|
2
|
+
# Vowels
|
|
3
|
+
# ------
|
|
4
|
+
# In these rules, we produce ي و ا both for short and for long vowels.
|
|
5
|
+
# This would be wrong for writing Arabic, but when transliterating
|
|
6
|
+
# foreign words and names, it is strongly preferred to vowel marks.
|
|
7
|
+
# However, we omit short schwa [ə] and a few other, schwa-like vowels.
|
|
8
|
+
$IVowel = [i ɪ e {e̞}];
|
|
9
|
+
$UVowel = [y {ɨ} {ʉ} ɯ u ʏ {ɪ̈} {ʊ̈} {ɯ̽} {ʊ} ø ɤ o {ø̞} {ɤ̞} {o̞} ɞ ɔ w {w̥} ʍ ʷ];
|
|
10
|
+
$AVowel = [ɛ œ ɜ ʌ æ ɐ a ɶ {ä} {ɒ̈} ɑ ɒ];
|
|
11
|
+
$SchwaVowel = [ɘ ɵ ə {ɵ̞}];
|
|
12
|
+
$Vowel = [$IVowel $UVowel $AVowel $SchwaVowel];
|
|
13
|
+
$Click = [ʘ ɋ ǀ ʇ ǃ ʗ ǂ ʄ ǁ ʖ];
|
|
14
|
+
$Boundary = [^[:L:][:M:][:N:]];
|
|
15
|
+
::NFD;
|
|
16
|
+
[ʰ ʱ ʼ ̃ ̰ ̋ ́ ̄ ̀ ̏ ̌ ̂ ˥ ˦ ˧ ˨ ˩ ꜜ ꜛ ↗ ↘ ͡ ͜ ̯] → ;
|
|
17
|
+
ʲ → j;
|
|
18
|
+
ᵐ → m;
|
|
19
|
+
ⁿ → n;
|
|
20
|
+
ᵑ → ŋ;
|
|
21
|
+
::NFC;
|
|
22
|
+
# TODO: Diphthongs probably need more work.
|
|
23
|
+
# Romanian [sekujesk] → [sekujask], for emitting سيكوياسك not سيكويسك
|
|
24
|
+
$UVowel [j $IVowel] [e {e̞} $SchwaVowel] → uia;
|
|
25
|
+
# Kazakh Аягөз [ɑjɑɡy̯ʉz] → [ɑjɑɡiuz], to emit TODO
|
|
26
|
+
yʉ → iu;
|
|
27
|
+
::NULL;
|
|
28
|
+
# Vowels
|
|
29
|
+
$Boundary {ʔ? $IVowel ː} → إِي;
|
|
30
|
+
$Boundary {ʔ? $IVowel} → إِ;
|
|
31
|
+
{$IVowel ʔ} $Boundary → ئ;
|
|
32
|
+
{$IVowel ː ʔ} $Boundary → يء;
|
|
33
|
+
{$IVowel ː ʔ} [$Vowel] → ئ;
|
|
34
|
+
$IVowel ː? → ي;
|
|
35
|
+
$Boundary {ʔ? $UVowel ː} → أو;
|
|
36
|
+
$Boundary {ʔ? $UVowel} → أ;
|
|
37
|
+
{$UVowel ʔ} $Boundary → ؤ;
|
|
38
|
+
{$UVowel ː ʔ} $Boundary → وء;
|
|
39
|
+
$UVowel ː? → و;
|
|
40
|
+
$Boundary {ʔ? $AVowel ː} → آ;
|
|
41
|
+
$Boundary {ʔ? $AVowel} → أ;
|
|
42
|
+
{$AVowel ʔ} $Boundary → أ;
|
|
43
|
+
{$AVowel ː ʔ} $Boundary → اء;
|
|
44
|
+
$AVowel ː? ʔ $AVowel ː? → اءا;
|
|
45
|
+
$AVowel ː? → ا;
|
|
46
|
+
$Boundary {ʔ? $SchwaVowel ː} → إِي;
|
|
47
|
+
$Boundary {ʔ? $SchwaVowel} → أ;
|
|
48
|
+
$SchwaVowel ː → ي;
|
|
49
|
+
$SchwaVowel → ;
|
|
50
|
+
# TODO: Handle glottal stop.
|
|
51
|
+
ʔ → ;
|
|
52
|
+
# Shadda for long (geminated) consonants
|
|
53
|
+
ː → ّ;
|
|
54
|
+
# Affricates
|
|
55
|
+
[{t͡ʃ} ʧ] → تْش;
|
|
56
|
+
# Clicks
|
|
57
|
+
[ɡ g ɠ k] $Click → كْش;
|
|
58
|
+
$Click → تْش;
|
|
59
|
+
# Nasal stops
|
|
60
|
+
[{m̥} m ɱ] → م;
|
|
61
|
+
[{n̼̊} {n̼} {n̥} n {ɳ̊} ɳ {ɲ̊} {ɲ̥} ɲ] → ن;
|
|
62
|
+
[{ŋ̊} ŋ {ɴ̥} ɴ] k → نك;
|
|
63
|
+
[{ŋ̊} ŋ {ɴ̥} ɴ] [ɡ g ɠ]? → نْغ;
|
|
64
|
+
# Non-nasal stops
|
|
65
|
+
[p b {p̪} {b̪} ɓ] → ب;
|
|
66
|
+
[{d̼} d ɗ ᶑ] → د;
|
|
67
|
+
[{t̼} t] → ت;
|
|
68
|
+
[ʈ] → ط;
|
|
69
|
+
[ɖ] → ض;
|
|
70
|
+
c → تْش;
|
|
71
|
+
ɟ → دج;
|
|
72
|
+
k → ك;
|
|
73
|
+
[ɡ g ɠ] → غ;
|
|
74
|
+
[q ɢ ʡ ʛ] → ق;
|
|
75
|
+
# Sibilant fricatives
|
|
76
|
+
s → س;
|
|
77
|
+
z → ز;
|
|
78
|
+
[ʃ ʂ ɕ ʄ] → ش;
|
|
79
|
+
[ʒ ʐ ʑ] → ج;
|
|
80
|
+
# Non-sibilant fricatives
|
|
81
|
+
[ɸ f v] → ف;
|
|
82
|
+
β → ب;
|
|
83
|
+
[{θ̼} θ {θ̱}] → ث;
|
|
84
|
+
[{ð̼} ð {ð̠}] → ذ;
|
|
85
|
+
ç → ش;
|
|
86
|
+
ʝ $IVowel? ː? → ي;
|
|
87
|
+
[x χ] → خ;
|
|
88
|
+
[ɣ ʁ] → غ;
|
|
89
|
+
ħ → ح;
|
|
90
|
+
ʕ → ع;
|
|
91
|
+
[h ɦ {ʔ̞}] → ه;
|
|
92
|
+
# Approximants, trills, flaps
|
|
93
|
+
ʋ → و;
|
|
94
|
+
ʙ → بر;
|
|
95
|
+
{r̝} → رش;
|
|
96
|
+
[{ɹ̥} {ɹ} {ɻ̊} {ɻ} {ɾ̥} ɾ {ɽ̊} ɽ {r̼} {r̥} r] → ر;
|
|
97
|
+
[{ʀ̥} ʀ] → غ;
|
|
98
|
+
ʜ → ح;
|
|
99
|
+
ʢ → ع;
|
|
100
|
+
j $IVowel? ː? → ي;
|
|
101
|
+
# Laterals
|
|
102
|
+
ɬ → شْل;
|
|
103
|
+
ɮ → جْل;
|
|
104
|
+
{[{ʎ̥} ʎ]} [^ $IVowel j ʝ] → لي;
|
|
105
|
+
[{l̼} {l̥} l {ɭ̊} ɭ {ʎ̥} ʎ] → ل;
|
|
106
|
+
[ʟ {ʟ̠}] → غ;
|
|
107
|
+
# Independent pass for misc cleanup.
|
|
108
|
+
::NULL;
|
|
109
|
+
# Strip off syllable markers
|
|
110
|
+
\. → ;
|
|
111
|
+
# Sequences of three or more ووو look very confusing; we shorten them.
|
|
112
|
+
# Polish Darłowo [darwɔvɔ] → داروو → داروووو
|
|
113
|
+
ووو+ → وو;
|
|
114
|
+
|
|
@@ -0,0 +1,172 @@
|
|
|
1
|
+
|
|
2
|
+
::NFD;
|
|
3
|
+
̋ → ˥;
|
|
4
|
+
́ → ˦;
|
|
5
|
+
̄ → ˧;
|
|
6
|
+
[ ̀ ̏ ] → ˧˩;
|
|
7
|
+
̌ → ˨˦;
|
|
8
|
+
̂ → ˥˧;
|
|
9
|
+
ə̃ → ə̃;
|
|
10
|
+
[ ̃ ̰ ꜜ ꜛ ↗ ↘ ] → ;
|
|
11
|
+
[{ŋɡ͡} {ŋg͡}] [k q ǃ ʗ ] → nk;
|
|
12
|
+
[{ŋɡ͡} {ŋg͡}] → nɡ;
|
|
13
|
+
{k͡x} → kh;
|
|
14
|
+
{k͡ɬ} → kl;
|
|
15
|
+
[{ɡ͡ǀ} {g͡ǀ}] → t͡ɬ;
|
|
16
|
+
[{l͡ʒ} ɮ] → ls;
|
|
17
|
+
[{n̼} {n̼̊} {m̺} {n̊} {n̥} ⁿ ᵑ {ɳ̊} {ɳ̥} ɳ {ɲ̊} {ɲ̥} ɲ {ɴ̊} {ɴ̥} ɴ {ŋ̊} {ŋ̥} ŋ] → n;
|
|
18
|
+
[ɱ {m̥} {m̪} ᵐ] → m;
|
|
19
|
+
[b {d̼} {b̺} {ɾ̼} ɓ p {t̼} {p̺} pʼ ʘ ɋ] ʰ? → kʷ; # Bolivia → ᏉᎵᏫᎠ [kʷoliwia], Bahamas → ᏆᎭᎹᏍ [kʷahamas]
|
|
20
|
+
[{t̪} ʈ ǁ ʖ] → t;
|
|
21
|
+
[ɖ ɗ ᶑ ð {ð̠} {ð̼} {β̺}] → d;
|
|
22
|
+
[q ǃ ʗ {q͡χ} {ɡ͡ǃ}] → k;
|
|
23
|
+
[g ɢ ɣ ɠ ʛ] → ɡ;
|
|
24
|
+
[f v β] → w; # Fiji → ᏫᏥ [wit͡si]
|
|
25
|
+
[θ {θ̱} {θ̞} {θ̼} {ɸ̺} z ʃ ʒ ʂ ʐ ʑ] → s;
|
|
26
|
+
[ɦ {ç} x χ ʕ ʡ ʔ ʰ] → h;
|
|
27
|
+
[r ɾ ɽ ʁ {r̝} ɾ ɽ ʁ {l̥}] → l;
|
|
28
|
+
[ʝ ʲ] → j;
|
|
29
|
+
[ʎ {ʎ̥˔} {ʎ̝} {ʟ̝̊} {ʟ̝}] [y i ɨ ɪ ʉ]? [ʝ ʲ]? → lj;
|
|
30
|
+
[{t͡ʃ} {t͜ʃ} {ʧ} {t͡ɕ} {t͜ɕ} {ʨ} {ʈ͡ʂ} c ɕ {t͡ʃʼ} ǀ ʇ ǂ ʄ] → t͡ɬ;
|
|
31
|
+
[{d͡ʒ} ʤ ʣ {d͡z} {d͜z} {d͡ɕ} ʥ {d͡ʑ} {d͜ʑ} {ɖ͡ʐ} {d͡ʐ} ɟ] → t͡s;
|
|
32
|
+
[y i ɨ ɪ ʉ] → i;
|
|
33
|
+
[ə ɛ æ ɘ] → ə̃;
|
|
34
|
+
[ʊ ɯ] → u;
|
|
35
|
+
[ɔ ø] → o;
|
|
36
|
+
[ɑ] → a;
|
|
37
|
+
[ʼ \. ̯ ] → ;
|
|
38
|
+
::NULL;
|
|
39
|
+
aː → aa;
|
|
40
|
+
eː → ee;
|
|
41
|
+
iː → ii;
|
|
42
|
+
oː → oo;
|
|
43
|
+
uː → uu;
|
|
44
|
+
ə̃ː → ə̃ə̃;
|
|
45
|
+
hh+ → h;
|
|
46
|
+
ː → ;
|
|
47
|
+
::NULL;
|
|
48
|
+
t͡sa → Ꮳ;
|
|
49
|
+
t͡se → Ꮴ;
|
|
50
|
+
t͡si → Ꮵ;
|
|
51
|
+
t͡so → Ꮶ;
|
|
52
|
+
t͡su → Ꮷ;
|
|
53
|
+
t͡sə̃ → Ꮸ;
|
|
54
|
+
t͡s → Ꮵ;
|
|
55
|
+
t͡ɬa → Ꮭ;
|
|
56
|
+
t͡ɬe → Ꮮ;
|
|
57
|
+
t͡ɬi → Ꮯ;
|
|
58
|
+
t͡ɬo → Ꮰ;
|
|
59
|
+
t͡ɬu → Ꮱ;
|
|
60
|
+
t͡ɬə̃ → Ꮲ;
|
|
61
|
+
t͡ɬ → Ꮯ;
|
|
62
|
+
d͡la → Ꮬ;
|
|
63
|
+
d͡le → Ꮮ;
|
|
64
|
+
d͡li → Ꮯ;
|
|
65
|
+
d͡lo → Ꮰ;
|
|
66
|
+
d͡lu → Ꮱ;
|
|
67
|
+
d͡lə̃ → Ꮲ;
|
|
68
|
+
d͡l → Ꮯ;
|
|
69
|
+
ɬa → Ꮭ;
|
|
70
|
+
ɬe → Ꮮ;
|
|
71
|
+
ɬi → Ꮯ;
|
|
72
|
+
ɬo → Ꮰ;
|
|
73
|
+
ɬu → Ꮱ;
|
|
74
|
+
ɬə̃ → Ꮲ;
|
|
75
|
+
ɬ → Ꮯ;
|
|
76
|
+
ma → Ꮉ;
|
|
77
|
+
me → Ꮊ;
|
|
78
|
+
mi → Ꮋ;
|
|
79
|
+
mo → Ꮌ;
|
|
80
|
+
mu → Ꮍ;
|
|
81
|
+
mə̃ → Ᏽ;
|
|
82
|
+
m → Ꮋ;
|
|
83
|
+
nah → Ꮐ;
|
|
84
|
+
na → Ꮎ;
|
|
85
|
+
ne → Ꮑ;
|
|
86
|
+
ni → Ꮒ;
|
|
87
|
+
no → Ꮓ;
|
|
88
|
+
nu → Ꮔ;
|
|
89
|
+
nə̃ → Ꮕ;
|
|
90
|
+
n → Ꮒ;
|
|
91
|
+
ta → Ꮤ;
|
|
92
|
+
te → Ꮦ;
|
|
93
|
+
ti → Ꮨ;
|
|
94
|
+
to → Ꮩ;
|
|
95
|
+
tu → Ꮪ;
|
|
96
|
+
tə̃ → Ꮫ;
|
|
97
|
+
t → Ꮨ;
|
|
98
|
+
da → Ꮣ;
|
|
99
|
+
de → Ꮥ;
|
|
100
|
+
di → Ꮧ;
|
|
101
|
+
do → Ꮩ;
|
|
102
|
+
du → Ꮪ;
|
|
103
|
+
də̃ → Ꮫ;
|
|
104
|
+
d → Ꮧ;
|
|
105
|
+
[kɡ][wʷ]a → Ꮖ;
|
|
106
|
+
[kɡ][wʷ]e → Ꮗ;
|
|
107
|
+
[kɡ][wʷ]i → Ꮘ;
|
|
108
|
+
[kɡ][wʷ]o → Ꮙ;
|
|
109
|
+
[kɡ][wʷ]u → Ꮚ;
|
|
110
|
+
[kɡ][wʷ]ə̃ → Ꮛ;
|
|
111
|
+
[kɡ][wʷ] → Ꮘ;
|
|
112
|
+
ɡa → Ꭶ;
|
|
113
|
+
ka → Ꭷ;
|
|
114
|
+
[kɡ]e → Ꭸ;
|
|
115
|
+
[kɡ]i → Ꭹ;
|
|
116
|
+
[kɡ]o → Ꭺ;
|
|
117
|
+
[kɡ]u → Ꭻ;
|
|
118
|
+
[kɡ]ə̃ → Ꭼ;
|
|
119
|
+
[kɡ] → Ꭹ;
|
|
120
|
+
sa → Ꮜ;
|
|
121
|
+
se → Ꮞ;
|
|
122
|
+
si → Ꮟ;
|
|
123
|
+
so → Ꮠ;
|
|
124
|
+
su → Ꮡ;
|
|
125
|
+
sə̃ → Ꮢ;
|
|
126
|
+
s → Ꮝ;
|
|
127
|
+
ha → Ꭽ;
|
|
128
|
+
he → Ꭾ;
|
|
129
|
+
hi → Ꭿ;
|
|
130
|
+
ho → Ꮀ;
|
|
131
|
+
hu → Ꮁ;
|
|
132
|
+
hə̃ → Ꮂ;
|
|
133
|
+
hna → Ꮏ;
|
|
134
|
+
h → Ꭿ;
|
|
135
|
+
la → Ꮃ;
|
|
136
|
+
le → Ꮄ;
|
|
137
|
+
li → Ꮅ;
|
|
138
|
+
lo → Ꮆ;
|
|
139
|
+
lu → Ꮇ;
|
|
140
|
+
lə̃ → Ꮈ;
|
|
141
|
+
l → Ꮅ;
|
|
142
|
+
wa → Ꮹ;
|
|
143
|
+
we → Ꮺ;
|
|
144
|
+
wi → Ꮻ;
|
|
145
|
+
wo → Ꮼ;
|
|
146
|
+
wu → Ꮽ;
|
|
147
|
+
wə̃ → Ꮾ;
|
|
148
|
+
w → Ꮻ;
|
|
149
|
+
ja → Ꮿ;
|
|
150
|
+
je → Ᏸ;
|
|
151
|
+
ji → Ᏹ;
|
|
152
|
+
jo → Ᏺ;
|
|
153
|
+
ju → Ᏻ;
|
|
154
|
+
jə̃ → Ᏼ;
|
|
155
|
+
j → Ᏹ;
|
|
156
|
+
a → Ꭰ;
|
|
157
|
+
e → Ꭱ;
|
|
158
|
+
i → Ꭲ;
|
|
159
|
+
o → Ꭳ;
|
|
160
|
+
u → Ꭴ;
|
|
161
|
+
ə̃ → Ꭵ;
|
|
162
|
+
˥˧ → ̂;
|
|
163
|
+
˧˩ → ̀;
|
|
164
|
+
˨˦ → ̌;
|
|
165
|
+
˥ → ̋;
|
|
166
|
+
˦ → ́;
|
|
167
|
+
˧ → ̄;
|
|
168
|
+
::NULL;
|
|
169
|
+
[:Zs:]+ → ' ';
|
|
170
|
+
[^[:sc=Cher:][ ̋ ́ ̄ ̀ ̂ ̌ ]] → ;
|
|
171
|
+
::NFC;
|
|
172
|
+
|
|
@@ -0,0 +1,109 @@
|
|
|
1
|
+
|
|
2
|
+
# Vowels
|
|
3
|
+
# ------
|
|
4
|
+
# In these rules, we produce ی و ا both for short and for long vowels.
|
|
5
|
+
# This would be wrong for writing Farsi or Arabic, but when transliterating
|
|
6
|
+
# foreign words and names, it is strongly preferred to vowel marks.
|
|
7
|
+
# Short schwa [ə] and a few other, schwa-like vowels get omitted entirely
|
|
8
|
+
# unless at the end of the word, in which case we emit ه whose Farsi
|
|
9
|
+
# word-final pronunciation comes close to [ə]. At the beginning of words,
|
|
10
|
+
# Farsi speakers prefer to see آ for [ɑ] and a few other similar-sounding
|
|
11
|
+
# dark vowels; note that this use of آ is quite different from Arabic.
|
|
12
|
+
$IVowel = [i ɪ e {e̞}];
|
|
13
|
+
$UVowel = [y {ɨ} {ʉ} ɯ u ʏ {ɪ̈} {ʊ̈} {ɯ̽} {ʊ} ø ɤ o {ø̞} {ɤ̞} {o̞} ɔ w {w̥} ʍ ʷ];
|
|
14
|
+
$AVowel = [ɛ œ ɜ æ ɶ];
|
|
15
|
+
$DarkAVowel = [ʌ a ɑ ɒ ɐ ɞ {ä} {ɒ̈}]; # آ instead of ا at beginning of words
|
|
16
|
+
$SchwaVowel = [ɘ ɵ ə {ɵ̞}];
|
|
17
|
+
$Click = [ʘ ɋ ǀ ʇ ǃ ʗ ǂ ʄ ǁ ʖ];
|
|
18
|
+
$Boundary = [^[:L:][:M:][:N:]];
|
|
19
|
+
::NFD;
|
|
20
|
+
[ʰ ʱ ʼ ̃ ̰ ̋ ́ ̄ ̀ ̏ ̌ ̂ ˥ ˦ ˧ ˨ ˩ ꜜ ꜛ ↗ ↘ ͡ ͜ ̯] → ;
|
|
21
|
+
ʲ → j;
|
|
22
|
+
ᵐ → m;
|
|
23
|
+
ⁿ → n;
|
|
24
|
+
ᵑ → ŋ;
|
|
25
|
+
::NFC;
|
|
26
|
+
# TODO: Diphthongs probably need more work.
|
|
27
|
+
# Romanian [sekujesk] → [sekujask], for emitting سیکویاسک not سیکویسک
|
|
28
|
+
$UVowel [j $IVowel] [e {e̞} $SchwaVowel] → uia;
|
|
29
|
+
# Kazakh Аягөз [ɑjɑɡy̯ʉz] → [ɑjɑɡiuz], to emit آیاگیوز not آیاگووز
|
|
30
|
+
yʉ → iu;
|
|
31
|
+
::NULL;
|
|
32
|
+
# Vowels
|
|
33
|
+
$Boundary {$SchwaVowel ː?} → ای;
|
|
34
|
+
$SchwaVowel ː → ی;
|
|
35
|
+
{[$SchwaVowel e {e̞}]} [^[:L:][:M:][:N:][\.]] → ه;
|
|
36
|
+
$SchwaVowel → ;
|
|
37
|
+
$Boundary {$IVowel ː?} → ای;
|
|
38
|
+
$IVowel ː? j? → ی;
|
|
39
|
+
$Boundary {$UVowel ː?} → او;
|
|
40
|
+
$UVowel ː? → و;
|
|
41
|
+
$Boundary {$AVowel ː?} → ا;
|
|
42
|
+
$AVowel ː? → ا;
|
|
43
|
+
$Boundary {$DarkAVowel ː?} → آ;
|
|
44
|
+
$DarkAVowel ː? → ا;
|
|
45
|
+
# Shadda for long (geminated) consonants
|
|
46
|
+
ː → ّ;
|
|
47
|
+
# Affricates
|
|
48
|
+
[{t͡ʃ} ʧ] → چ;
|
|
49
|
+
# Clicks
|
|
50
|
+
[ɡ g ɠ k] $Click → کچ;
|
|
51
|
+
[n ɲ]? $Click → نچ;
|
|
52
|
+
# Nasal stops
|
|
53
|
+
[{m̥} m ɱ] → م;
|
|
54
|
+
[{n̼̊} {n̼} {n̥} n {ɳ̊} ɳ {ɲ̊} {ɲ̥} ɲ] → ن;
|
|
55
|
+
[{ŋ̊} ŋ {ɴ̥} ɴ] k → نک;
|
|
56
|
+
[{ŋ̊} ŋ {ɴ̥} ɴ] [ɡ g]? → نگ;
|
|
57
|
+
# Non-nasal stops
|
|
58
|
+
[p {p̪}] → پ;
|
|
59
|
+
[b {b̪} ɓ] → ب;
|
|
60
|
+
[{d̼} d ɗ ᶑ] → د;
|
|
61
|
+
[{t̼} t] → ت;
|
|
62
|
+
[ʈ] → ط;
|
|
63
|
+
[ɖ] → ض;
|
|
64
|
+
c → چ;
|
|
65
|
+
ɟ → دج;
|
|
66
|
+
k → ک;
|
|
67
|
+
[ɡ g ɠ] → گ;
|
|
68
|
+
[q ɢ ʡ ʛ] → ق;
|
|
69
|
+
ʔ → ;
|
|
70
|
+
# Sibilant fricatives
|
|
71
|
+
s → س;
|
|
72
|
+
z → ز;
|
|
73
|
+
[ʃ ʂ ɕ ʄ] → ش;
|
|
74
|
+
[ʒ ʐ ʑ] → ژ;
|
|
75
|
+
# Non-sibilant fricatives
|
|
76
|
+
[ɸ f] → ف;
|
|
77
|
+
[β v] → و;
|
|
78
|
+
[{θ̼} θ {θ̱}] → ث;
|
|
79
|
+
[{ð̼} ð {ð̠}] → ذ;
|
|
80
|
+
ç → ش;
|
|
81
|
+
ʝ $IVowel? ː? → ی;
|
|
82
|
+
[x χ] → خ;
|
|
83
|
+
[ɣ ʁ] → غ;
|
|
84
|
+
ħ → ح;
|
|
85
|
+
ʕ → ع;
|
|
86
|
+
[h ɦ {ʔ̞}] → ه;
|
|
87
|
+
# Approximants, trills, flaps
|
|
88
|
+
ʋ → و;
|
|
89
|
+
ʙ → بر;
|
|
90
|
+
{r̝} → رژ;
|
|
91
|
+
[{ɹ̥} {ɹ} {ɻ̊} {ɻ} {ɾ̥} ɾ {ɽ̊} ɽ {r̼} {r̥} r] → ر;
|
|
92
|
+
[{ʀ̥} ʀ] → غ;
|
|
93
|
+
ʜ → ح;
|
|
94
|
+
ʢ → ع;
|
|
95
|
+
j $IVowel? ː? → ی;
|
|
96
|
+
# Laterals
|
|
97
|
+
ɬ → شل;
|
|
98
|
+
ɮ → ژل;
|
|
99
|
+
{[{ʎ̥} ʎ]} [^ $IVowel j ʝ] → لی;
|
|
100
|
+
[{l̼} {l̥} l {ɭ̊} ɭ {ʎ̥} ʎ] → ل;
|
|
101
|
+
[ʟ {ʟ̠}] → غ;
|
|
102
|
+
# Independent pass for misc cleanup.
|
|
103
|
+
::NULL;
|
|
104
|
+
# Strip off syllable markers
|
|
105
|
+
\. → ;
|
|
106
|
+
# Sequences of three or more ووو look very confusing; we shorten them.
|
|
107
|
+
# Polish Darłowo [darwɔvɔ] → داروو → داروووو
|
|
108
|
+
ووو+ → وو;
|
|
109
|
+
|
|
@@ -0,0 +1,103 @@
|
|
|
1
|
+
|
|
2
|
+
# Rules are predicated on running NFD first, and NFC afterwards
|
|
3
|
+
:: NFD (NFC) ;
|
|
4
|
+
$letters = [[:sc=Latn:][:sc=Cyrl:] & [:L:]] ;
|
|
5
|
+
$latinVowel = [AEIOUaeiouĬĭʼËë{oʻ}{Oʻ}] ;
|
|
6
|
+
$lower = [$letters & [:Ll:]] ;
|
|
7
|
+
у \u0306 ↔ oʻ ;
|
|
8
|
+
У \u0306 ↔ Oʻ ;
|
|
9
|
+
ғ ↔ gʻ ;
|
|
10
|
+
Ғ ↔ Gʻ ;
|
|
11
|
+
# For many cases, use a following character to determine the difference between XY and Xy
|
|
12
|
+
ш ↔ sh ;
|
|
13
|
+
{ Ш } $lower ↔ Sh ;
|
|
14
|
+
Ш ↔ SH ;
|
|
15
|
+
ч ↔ ch ;
|
|
16
|
+
{ Ч } $lower ↔ Ch ;
|
|
17
|
+
Ч ↔ CH ;
|
|
18
|
+
# нг ↔ ng ; as separate letters works
|
|
19
|
+
# Нг ↔ Ng ; as separate letters works
|
|
20
|
+
# If we have a lowercase letter on either side, use the lowercase hard sign
|
|
21
|
+
ъ ↔ { ʼ } $lower ;
|
|
22
|
+
ъ ← $lower { ʼ } ;
|
|
23
|
+
Ъ ↔ ʼ ;
|
|
24
|
+
е\u0308 ↔ yo ;
|
|
25
|
+
Е\u0308 } $lower ↔ Yo ;
|
|
26
|
+
Е\u0308 ↔ YO ;
|
|
27
|
+
# е → 'ye' at the beginning of a syllable, after a vowel, ъ or ь, otherwise 'e'
|
|
28
|
+
[:^L:] { е ↔ ye ;
|
|
29
|
+
[:^L:] { Е } $lower ↔ Ye ;
|
|
30
|
+
[:^L:] {Е ↔ YE ;
|
|
31
|
+
$latinVowel { е → ye ;
|
|
32
|
+
$latinVowel { Е } $lower → Ye ;
|
|
33
|
+
$latinVowel { Е → YE ;
|
|
34
|
+
# handle these specially, since ьЬ otherwise disappear.
|
|
35
|
+
ье → ye ;
|
|
36
|
+
{ ьЕ } $lower → Ye ;
|
|
37
|
+
ьЕ → YE ;
|
|
38
|
+
Ье → ye ;
|
|
39
|
+
{ ЬЕ } $lower → Ye ;
|
|
40
|
+
ЬЕ → YE ;
|
|
41
|
+
е → e ;
|
|
42
|
+
Е → E ;
|
|
43
|
+
ю ↔ yu ;
|
|
44
|
+
{ Ю } $lower ↔ Yu ;
|
|
45
|
+
Ю ↔ YU ;
|
|
46
|
+
я ↔ ya ;
|
|
47
|
+
{ Я } $lower ↔ Ya ;
|
|
48
|
+
Я ↔ YA ;
|
|
49
|
+
ц ↔ ts ;
|
|
50
|
+
{ Ц } $lower ↔ Ts ;
|
|
51
|
+
Ц ↔ TS ;
|
|
52
|
+
а ↔ a ;
|
|
53
|
+
А ↔ A ;
|
|
54
|
+
б ↔ b ;
|
|
55
|
+
Б ↔ B ;
|
|
56
|
+
д ↔ d ;
|
|
57
|
+
Д ↔ D ;
|
|
58
|
+
э ↔ e ;
|
|
59
|
+
Э ↔ E ;
|
|
60
|
+
ф ↔ f ;
|
|
61
|
+
Ф ↔ F ;
|
|
62
|
+
г ↔ g ;
|
|
63
|
+
Г ↔ G ;
|
|
64
|
+
ҳ ↔ h ;
|
|
65
|
+
Ҳ ↔ H ;
|
|
66
|
+
и\u0306 ↔ y ;
|
|
67
|
+
И\u0306 ↔ Y ;
|
|
68
|
+
и ↔ i ;
|
|
69
|
+
И ↔ I ;
|
|
70
|
+
ж ↔ j ;
|
|
71
|
+
Ж ↔ J ;
|
|
72
|
+
к ↔ k ;
|
|
73
|
+
К ↔ K ;
|
|
74
|
+
л ↔ l ;
|
|
75
|
+
Л ↔ L ;
|
|
76
|
+
м ↔ m ;
|
|
77
|
+
М ↔ M ;
|
|
78
|
+
н ↔ n ;
|
|
79
|
+
Н ↔ N ;
|
|
80
|
+
о ↔ o ;
|
|
81
|
+
О ↔ O ;
|
|
82
|
+
п ↔ p ;
|
|
83
|
+
П ↔ P ;
|
|
84
|
+
қ ↔ q ;
|
|
85
|
+
Қ ↔ Q ;
|
|
86
|
+
р ↔ r ;
|
|
87
|
+
Р ↔ R ;
|
|
88
|
+
с ↔ s ;
|
|
89
|
+
С ↔ S ;
|
|
90
|
+
т ↔ t ;
|
|
91
|
+
Т ↔ T ;
|
|
92
|
+
у ↔ u ;
|
|
93
|
+
У ↔ U ;
|
|
94
|
+
в ↔ v ;
|
|
95
|
+
В ↔ V ;
|
|
96
|
+
х ↔ x ;
|
|
97
|
+
Х ↔ X ;
|
|
98
|
+
з ↔ z ;
|
|
99
|
+
З ↔ Z ;
|
|
100
|
+
ь → ;
|
|
101
|
+
Ь → ;
|
|
102
|
+
::NFC (NFD) ;
|
|
103
|
+
|
|
@@ -0,0 +1,85 @@
|
|
|
1
|
+
|
|
2
|
+
# References
|
|
3
|
+
# ----------
|
|
4
|
+
# [1] Personal communication with Academia de ła Bona Creansa, Venice
|
|
5
|
+
# [2] https://en.wikipedia.org/wiki/Venetian_language#Phonology
|
|
6
|
+
# [3] https://en.wikipedia.org/wiki/Help:IPA/Venetian (mixed with Ladin)
|
|
7
|
+
#
|
|
8
|
+
# Output phonemes
|
|
9
|
+
# ---------------
|
|
10
|
+
# m n ɲ ŋ
|
|
11
|
+
# p b t d k ɡ
|
|
12
|
+
# f v ɾ s z
|
|
13
|
+
# l ʎ j w
|
|
14
|
+
# t͡ʃ d͡ʒ d͡z
|
|
15
|
+
# i u e e̯ o ɛ ɔ a
|
|
16
|
+
$boundary = [^[:L:][:M:][:N:]];
|
|
17
|
+
$e = [e é è];
|
|
18
|
+
$i = [i í ì];
|
|
19
|
+
$ei = [$e $i];
|
|
20
|
+
$vowel = [a á à $ei o ó ò u ú ù];
|
|
21
|
+
$onset = [
|
|
22
|
+
j w m n ɲ ŋ p b t d k ɡ f v ɾ s z h l ʎ {e̯}
|
|
23
|
+
{t͡ʃ} {d͡ʒ} {d͡z} {mj} {mw} {nj} {nw}
|
|
24
|
+
{ps} {pɾ} {pɾw} {pl} {pj} {pw} {bɾ} {bɾw} {bw} {bj} {bl}
|
|
25
|
+
{ts} {tɾ} {tɾw} {tl} {tj} {tw} {dɾ} {dɾw} {dw} {dj} {dl}
|
|
26
|
+
{kɾ} {kw} {kɾw} {kl} {kj} {kw} {ɡɾ} {ɡɾw} {ɡw} {ɡj} {ɡl}
|
|
27
|
+
{fɾ} {fj} {fl} {fw} {fɾw} {vɾ} {vj} {vw} {ɾw} {ɾj}
|
|
28
|
+
{zm} {zn} {zɲ} {zj} {zl} {zb} {zbɾ} {zbj} {zbw} {zd} {zdɾ} {zdj} {zdw}
|
|
29
|
+
{zɡ} {zɡɾ} {zɡj} {zɡw} {zv} {zvɾ} {zɾ} {zvj} {zd͡ʒ} {zw}
|
|
30
|
+
{sp} {spɾ} {spw} {st} {stɾ} {stw} {sk} {skɾ} {skw}
|
|
31
|
+
{sf} {sfɾ} {sɾ} {st͡ʃ} {sj} {sw} {lj} {lw}
|
|
32
|
+
];
|
|
33
|
+
::Lower;
|
|
34
|
+
::NFC;
|
|
35
|
+
([abefjklmoptvw]) → $1;
|
|
36
|
+
[á à] → ˈa;
|
|
37
|
+
{c [$ei \' ’]} $vowel → t͡ʃ;
|
|
38
|
+
cé [\' ’]? → t͡ʃˈe;
|
|
39
|
+
cè [\' ’]? → t͡ʃˈɛ;
|
|
40
|
+
c e [\' ’]? → t͡ʃe;
|
|
41
|
+
c [íì] [\' ’]? → t͡ʃˈi;
|
|
42
|
+
c i [\' ’]? → t͡ʃi;
|
|
43
|
+
[c {ch} k q {qu}] → k;
|
|
44
|
+
é → ˈe;
|
|
45
|
+
è → ˈɛ;
|
|
46
|
+
{g l $ei} $vowel → ʎ;
|
|
47
|
+
g l → ʎ;
|
|
48
|
+
ġ → d͡ʒ;
|
|
49
|
+
gé [\' ’]? → d͡ʒˈe;
|
|
50
|
+
gè [\' ’]? → d͡ʒˈɛ;
|
|
51
|
+
g [íì] [\' ’]? → d͡ʒˈi;
|
|
52
|
+
{g [$ei \' ’]} $vowel → d͡ʒ;
|
|
53
|
+
{g} $ei → d͡ʒ;
|
|
54
|
+
gn → ɲ;
|
|
55
|
+
[g {gh}] → ɡ;
|
|
56
|
+
[í ì] → ˈi;
|
|
57
|
+
{i} $vowel → j;
|
|
58
|
+
ł → ɰ;
|
|
59
|
+
ṅ → ŋ;
|
|
60
|
+
ñ → ɲ;
|
|
61
|
+
nj → ɲ;
|
|
62
|
+
ó → ˈo;
|
|
63
|
+
ò → ˈɔ;
|
|
64
|
+
r → ɾ;
|
|
65
|
+
[ṡ x z] → z;
|
|
66
|
+
{s}[bdg] → z;
|
|
67
|
+
s → s;
|
|
68
|
+
{u} $vowel → w;
|
|
69
|
+
[ú ù] → ˈu;
|
|
70
|
+
u → u;
|
|
71
|
+
y → j;
|
|
72
|
+
[ż đ {dh}] → d͡z;
|
|
73
|
+
d → d;
|
|
74
|
+
[[:P:][:Z:]]+ → ' ';
|
|
75
|
+
::NULL;
|
|
76
|
+
{n} [p b t d k ɡ f v ɾ s z $boundary] → ŋ;
|
|
77
|
+
{ɰ} ˈ? [ei] → ;
|
|
78
|
+
eɰ → e;
|
|
79
|
+
iɰ → i;
|
|
80
|
+
ɰ → e̯;
|
|
81
|
+
::NULL;
|
|
82
|
+
# Move stress marker before syllable onset: [zɡɾaŋfiɲˈae] → [zɡɾaŋfiˈɲae]
|
|
83
|
+
($onset) ˈ → ˈ $1;
|
|
84
|
+
::NULL;
|
|
85
|
+
|