cldr-transforms 46.0.0-BETA2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +41 -0
- package/README.md +27 -0
- package/bower.json +13 -0
- package/package.json +29 -0
- package/transforms/Amharic-Latin-BGN.json +9 -0
- package/transforms/Amharic-Latin-BGN.txt +441 -0
- package/transforms/Any-Accents.json +9 -0
- package/transforms/Any-Accents.txt +270 -0
- package/transforms/Any-Publishing.json +9 -0
- package/transforms/Any-Publishing.txt +63 -0
- package/transforms/Arabic-Latin-BGN.json +9 -0
- package/transforms/Arabic-Latin-BGN.txt +205 -0
- package/transforms/Arabic-Latin.json +11 -0
- package/transforms/Arabic-Latin.txt +181 -0
- package/transforms/Armenian-Latin-BGN.json +9 -0
- package/transforms/Armenian-Latin-BGN.txt +165 -0
- package/transforms/Azerbaijani-Latin-BGN.json +9 -0
- package/transforms/Azerbaijani-Latin-BGN.txt +183 -0
- package/transforms/Belarusian-Latin-BGN.json +9 -0
- package/transforms/Belarusian-Latin-BGN.txt +194 -0
- package/transforms/Bengali-Arabic.json +9 -0
- package/transforms/Bengali-Arabic.txt +7 -0
- package/transforms/Bengali-Devanagari.json +9 -0
- package/transforms/Bengali-Devanagari.txt +7 -0
- package/transforms/Bengali-Gujarati.json +9 -0
- package/transforms/Bengali-Gujarati.txt +7 -0
- package/transforms/Bengali-Gurmukhi.json +9 -0
- package/transforms/Bengali-Gurmukhi.txt +7 -0
- package/transforms/Bengali-InterIndic.json +7 -0
- package/transforms/Bengali-InterIndic.txt +99 -0
- package/transforms/Bengali-Kannada.json +9 -0
- package/transforms/Bengali-Kannada.txt +7 -0
- package/transforms/Bengali-Latin.json +9 -0
- package/transforms/Bengali-Latin.txt +7 -0
- package/transforms/Bengali-Malayalam.json +9 -0
- package/transforms/Bengali-Malayalam.txt +7 -0
- package/transforms/Bengali-Oriya.json +9 -0
- package/transforms/Bengali-Oriya.txt +7 -0
- package/transforms/Bengali-Tamil.json +9 -0
- package/transforms/Bengali-Tamil.txt +7 -0
- package/transforms/Bengali-Telugu.json +9 -0
- package/transforms/Bengali-Telugu.txt +7 -0
- package/transforms/Bengali-ur.json +8 -0
- package/transforms/Bengali-ur.txt +7 -0
- package/transforms/Bulgarian-Latin-BGN.json +9 -0
- package/transforms/Bulgarian-Latin-BGN.txt +237 -0
- package/transforms/CanadianAboriginal-Latin.json +11 -0
- package/transforms/CanadianAboriginal-Latin.txt +184 -0
- package/transforms/Cyrillic-Latin.json +11 -0
- package/transforms/Cyrillic-Latin.txt +280 -0
- package/transforms/Devanagari-Arabic.json +9 -0
- package/transforms/Devanagari-Arabic.txt +7 -0
- package/transforms/Devanagari-Bengali.json +9 -0
- package/transforms/Devanagari-Bengali.txt +7 -0
- package/transforms/Devanagari-Gujarati.json +9 -0
- package/transforms/Devanagari-Gujarati.txt +7 -0
- package/transforms/Devanagari-Gurmukhi.json +9 -0
- package/transforms/Devanagari-Gurmukhi.txt +7 -0
- package/transforms/Devanagari-InterIndic.json +7 -0
- package/transforms/Devanagari-InterIndic.txt +113 -0
- package/transforms/Devanagari-Kannada.json +9 -0
- package/transforms/Devanagari-Kannada.txt +7 -0
- package/transforms/Devanagari-Latin.json +9 -0
- package/transforms/Devanagari-Latin.txt +7 -0
- package/transforms/Devanagari-Malayalam.json +9 -0
- package/transforms/Devanagari-Malayalam.txt +7 -0
- package/transforms/Devanagari-Oriya.json +9 -0
- package/transforms/Devanagari-Oriya.txt +7 -0
- package/transforms/Devanagari-Tamil.json +9 -0
- package/transforms/Devanagari-Tamil.txt +7 -0
- package/transforms/Devanagari-Telugu.json +9 -0
- package/transforms/Devanagari-Telugu.txt +7 -0
- package/transforms/Devanagari-ur.json +8 -0
- package/transforms/Devanagari-ur.txt +7 -0
- package/transforms/Fullwidth-Halfwidth.json +9 -0
- package/transforms/Fullwidth-Halfwidth.txt +261 -0
- package/transforms/Georgian-Latin-BGN.json +9 -0
- package/transforms/Georgian-Latin-BGN.txt +43 -0
- package/transforms/Georgian-Latin-BGN_1981.json +8 -0
- package/transforms/Georgian-Latin-BGN_1981.txt +54 -0
- package/transforms/Georgian-Latin.json +11 -0
- package/transforms/Georgian-Latin.txt +53 -0
- package/transforms/Greek-Latin-BGN.json +9 -0
- package/transforms/Greek-Latin-BGN.txt +419 -0
- package/transforms/Greek-Latin.json +11 -0
- package/transforms/Greek-Latin.txt +251 -0
- package/transforms/Greek_Latin_UNGEGN.json +11 -0
- package/transforms/Greek_Latin_UNGEGN.txt +179 -0
- package/transforms/Gujarati-Arabic.json +9 -0
- package/transforms/Gujarati-Arabic.txt +7 -0
- package/transforms/Gujarati-Bengali.json +9 -0
- package/transforms/Gujarati-Bengali.txt +7 -0
- package/transforms/Gujarati-Devanagari.json +9 -0
- package/transforms/Gujarati-Devanagari.txt +7 -0
- package/transforms/Gujarati-Gurmukhi.json +9 -0
- package/transforms/Gujarati-Gurmukhi.txt +7 -0
- package/transforms/Gujarati-InterIndic.json +7 -0
- package/transforms/Gujarati-InterIndic.txt +89 -0
- package/transforms/Gujarati-Kannada.json +9 -0
- package/transforms/Gujarati-Kannada.txt +7 -0
- package/transforms/Gujarati-Latin.json +9 -0
- package/transforms/Gujarati-Latin.txt +7 -0
- package/transforms/Gujarati-Malayalam.json +9 -0
- package/transforms/Gujarati-Malayalam.txt +7 -0
- package/transforms/Gujarati-Oriya.json +9 -0
- package/transforms/Gujarati-Oriya.txt +7 -0
- package/transforms/Gujarati-Tamil.json +9 -0
- package/transforms/Gujarati-Tamil.txt +7 -0
- package/transforms/Gujarati-Telugu.json +9 -0
- package/transforms/Gujarati-Telugu.txt +7 -0
- package/transforms/Gujarati-ur.json +8 -0
- package/transforms/Gujarati-ur.txt +7 -0
- package/transforms/Gurmukhi-Arabic.json +9 -0
- package/transforms/Gurmukhi-Arabic.txt +7 -0
- package/transforms/Gurmukhi-Bengali.json +9 -0
- package/transforms/Gurmukhi-Bengali.txt +7 -0
- package/transforms/Gurmukhi-Devanagari.json +9 -0
- package/transforms/Gurmukhi-Devanagari.txt +7 -0
- package/transforms/Gurmukhi-Gujarati.json +9 -0
- package/transforms/Gurmukhi-Gujarati.txt +7 -0
- package/transforms/Gurmukhi-InterIndic.json +7 -0
- package/transforms/Gurmukhi-InterIndic.txt +88 -0
- package/transforms/Gurmukhi-Kannada.json +9 -0
- package/transforms/Gurmukhi-Kannada.txt +7 -0
- package/transforms/Gurmukhi-Latin.json +9 -0
- package/transforms/Gurmukhi-Latin.txt +7 -0
- package/transforms/Gurmukhi-Malayalam.json +9 -0
- package/transforms/Gurmukhi-Malayalam.txt +7 -0
- package/transforms/Gurmukhi-Oriya.json +9 -0
- package/transforms/Gurmukhi-Oriya.txt +7 -0
- package/transforms/Gurmukhi-Tamil.json +9 -0
- package/transforms/Gurmukhi-Tamil.txt +7 -0
- package/transforms/Gurmukhi-Telugu.json +9 -0
- package/transforms/Gurmukhi-Telugu.txt +7 -0
- package/transforms/Gurmukhi-ur.json +8 -0
- package/transforms/Gurmukhi-ur.txt +7 -0
- package/transforms/Han-Latin-Names.json +8 -0
- package/transforms/Han-Latin-Names.txt +65 -0
- package/transforms/Han-Latin.json +9 -0
- package/transforms/Han-Latin.txt +1501 -0
- package/transforms/Han-Spacedhan.json +7 -0
- package/transforms/Han-Spacedhan.txt +35 -0
- package/transforms/Hangul-Latin.json +9 -0
- package/transforms/Hangul-Latin.txt +6 -0
- package/transforms/Hebrew-Latin-BGN.json +9 -0
- package/transforms/Hebrew-Latin-BGN.txt +113 -0
- package/transforms/Hebrew-Latin.json +11 -0
- package/transforms/Hebrew-Latin.txt +91 -0
- package/transforms/Hiragana-Katakana.json +11 -0
- package/transforms/Hiragana-Katakana.txt +179 -0
- package/transforms/Hiragana-Latin.json +11 -0
- package/transforms/Hiragana-Latin.txt +9 -0
- package/transforms/IPA-XSampa.json +11 -0
- package/transforms/IPA-XSampa.txt +228 -0
- package/transforms/InterIndic-Arabic.json +7 -0
- package/transforms/InterIndic-Arabic.txt +128 -0
- package/transforms/InterIndic-Bengali.json +7 -0
- package/transforms/InterIndic-Bengali.txt +135 -0
- package/transforms/InterIndic-Devanagari.json +7 -0
- package/transforms/InterIndic-Devanagari.txt +151 -0
- package/transforms/InterIndic-Gujarati.json +7 -0
- package/transforms/InterIndic-Gujarati.txt +136 -0
- package/transforms/InterIndic-Gurmukhi.json +7 -0
- package/transforms/InterIndic-Gurmukhi.txt +142 -0
- package/transforms/InterIndic-Kannada.json +7 -0
- package/transforms/InterIndic-Kannada.txt +137 -0
- package/transforms/InterIndic-Latin.json +7 -0
- package/transforms/InterIndic-Latin.txt +492 -0
- package/transforms/InterIndic-Malayalam.json +7 -0
- package/transforms/InterIndic-Malayalam.txt +137 -0
- package/transforms/InterIndic-Oriya.json +7 -0
- package/transforms/InterIndic-Oriya.txt +135 -0
- package/transforms/InterIndic-Tamil.json +7 -0
- package/transforms/InterIndic-Tamil.txt +136 -0
- package/transforms/InterIndic-Telugu.json +7 -0
- package/transforms/InterIndic-Telugu.txt +136 -0
- package/transforms/InterIndic-ur.json +7 -0
- package/transforms/InterIndic-ur.txt +119 -0
- package/transforms/Jamo-Latin.json +9 -0
- package/transforms/Jamo-Latin.txt +6 -0
- package/transforms/Kannada-Arabic.json +9 -0
- package/transforms/Kannada-Arabic.txt +7 -0
- package/transforms/Kannada-Bengali.json +9 -0
- package/transforms/Kannada-Bengali.txt +7 -0
- package/transforms/Kannada-Devanagari.json +9 -0
- package/transforms/Kannada-Devanagari.txt +7 -0
- package/transforms/Kannada-Gujarati.json +9 -0
- package/transforms/Kannada-Gujarati.txt +7 -0
- package/transforms/Kannada-Gurmukhi.json +9 -0
- package/transforms/Kannada-Gurmukhi.txt +7 -0
- package/transforms/Kannada-InterIndic.json +7 -0
- package/transforms/Kannada-InterIndic.txt +87 -0
- package/transforms/Kannada-Latin.json +9 -0
- package/transforms/Kannada-Latin.txt +7 -0
- package/transforms/Kannada-Malayalam.json +9 -0
- package/transforms/Kannada-Malayalam.txt +7 -0
- package/transforms/Kannada-Oriya.json +9 -0
- package/transforms/Kannada-Oriya.txt +7 -0
- package/transforms/Kannada-Tamil.json +9 -0
- package/transforms/Kannada-Tamil.txt +7 -0
- package/transforms/Kannada-Telugu.json +9 -0
- package/transforms/Kannada-Telugu.txt +7 -0
- package/transforms/Kannada-ur.json +8 -0
- package/transforms/Kannada-ur.txt +7 -0
- package/transforms/Katakana-Latin-BGN.json +9 -0
- package/transforms/Katakana-Latin-BGN.txt +335 -0
- package/transforms/Kazakh-Latin-BGN.json +9 -0
- package/transforms/Kazakh-Latin-BGN.txt +332 -0
- package/transforms/Kirghiz-Latin-BGN.json +9 -0
- package/transforms/Kirghiz-Latin-BGN.txt +211 -0
- package/transforms/Korean-Latin-BGN.json +9 -0
- package/transforms/Korean-Latin-BGN.txt +345 -0
- package/transforms/Latin-ASCII.json +9 -0
- package/transforms/Latin-ASCII.txt +909 -0
- package/transforms/Latin-Armenian.json +11 -0
- package/transforms/Latin-Armenian.txt +88 -0
- package/transforms/Latin-Bengali.json +9 -0
- package/transforms/Latin-Bengali.txt +8 -0
- package/transforms/Latin-Bopomofo.json +11 -0
- package/transforms/Latin-Bopomofo.txt +1445 -0
- package/transforms/Latin-ConjoiningJamo.json +7 -0
- package/transforms/Latin-ConjoiningJamo.txt +477 -0
- package/transforms/Latin-Devanagari.json +9 -0
- package/transforms/Latin-Devanagari.txt +8 -0
- package/transforms/Latin-Ethiopic.json +11 -0
- package/transforms/Latin-Ethiopic.txt +277 -0
- package/transforms/Latin-Gujarati.json +9 -0
- package/transforms/Latin-Gujarati.txt +8 -0
- package/transforms/Latin-Gurmukhi.json +9 -0
- package/transforms/Latin-Gurmukhi.txt +8 -0
- package/transforms/Latin-Hangul.json +9 -0
- package/transforms/Latin-Hangul.txt +7 -0
- package/transforms/Latin-InterIndic.json +7 -0
- package/transforms/Latin-InterIndic.txt +377 -0
- package/transforms/Latin-Jamo.json +9 -0
- package/transforms/Latin-Jamo.txt +7 -0
- package/transforms/Latin-Kannada.json +9 -0
- package/transforms/Latin-Kannada.txt +8 -0
- package/transforms/Latin-Katakana.json +11 -0
- package/transforms/Latin-Katakana.txt +382 -0
- package/transforms/Latin-Malayalam.json +9 -0
- package/transforms/Latin-Malayalam.txt +8 -0
- package/transforms/Latin-NumericPinyin.json +9 -0
- package/transforms/Latin-NumericPinyin.txt +29 -0
- package/transforms/Latin-Oriya.json +9 -0
- package/transforms/Latin-Oriya.txt +8 -0
- package/transforms/Latin-Tamil.json +9 -0
- package/transforms/Latin-Tamil.txt +8 -0
- package/transforms/Latin-Telugu.json +9 -0
- package/transforms/Latin-Telugu.txt +8 -0
- package/transforms/Latin-Thai.json +9 -0
- package/transforms/Latin-Thai.txt +7 -0
- package/transforms/Macedonian-Latin-BGN.json +9 -0
- package/transforms/Macedonian-Latin-BGN.txt +176 -0
- package/transforms/Malayalam-Arabic.json +9 -0
- package/transforms/Malayalam-Arabic.txt +7 -0
- package/transforms/Malayalam-Bengali.json +9 -0
- package/transforms/Malayalam-Bengali.txt +7 -0
- package/transforms/Malayalam-Devanagari.json +9 -0
- package/transforms/Malayalam-Devanagari.txt +7 -0
- package/transforms/Malayalam-Gujarati.json +9 -0
- package/transforms/Malayalam-Gujarati.txt +7 -0
- package/transforms/Malayalam-Gurmukhi.json +9 -0
- package/transforms/Malayalam-Gurmukhi.txt +7 -0
- package/transforms/Malayalam-InterIndic.json +7 -0
- package/transforms/Malayalam-InterIndic.txt +87 -0
- package/transforms/Malayalam-Kannada.json +9 -0
- package/transforms/Malayalam-Kannada.txt +7 -0
- package/transforms/Malayalam-Latin.json +9 -0
- package/transforms/Malayalam-Latin.txt +7 -0
- package/transforms/Malayalam-Oriya.json +9 -0
- package/transforms/Malayalam-Oriya.txt +7 -0
- package/transforms/Malayalam-Tamil.json +9 -0
- package/transforms/Malayalam-Tamil.txt +7 -0
- package/transforms/Malayalam-Telugu.json +9 -0
- package/transforms/Malayalam-Telugu.txt +7 -0
- package/transforms/Malayalam-ur.json +8 -0
- package/transforms/Malayalam-ur.txt +7 -0
- package/transforms/Maldivian-Latin-BGN.json +9 -0
- package/transforms/Maldivian-Latin-BGN.txt +171 -0
- package/transforms/Mongolian-Latin-BGN.json +9 -0
- package/transforms/Mongolian-Latin-BGN.txt +151 -0
- package/transforms/Myanmar-Latin.json +9 -0
- package/transforms/Myanmar-Latin.txt +367 -0
- package/transforms/Oriya-Arabic.json +9 -0
- package/transforms/Oriya-Arabic.txt +7 -0
- package/transforms/Oriya-Bengali.json +9 -0
- package/transforms/Oriya-Bengali.txt +7 -0
- package/transforms/Oriya-Devanagari.json +9 -0
- package/transforms/Oriya-Devanagari.txt +7 -0
- package/transforms/Oriya-Gujarati.json +9 -0
- package/transforms/Oriya-Gujarati.txt +7 -0
- package/transforms/Oriya-Gurmukhi.json +9 -0
- package/transforms/Oriya-Gurmukhi.txt +7 -0
- package/transforms/Oriya-InterIndic.json +7 -0
- package/transforms/Oriya-InterIndic.txt +91 -0
- package/transforms/Oriya-Kannada.json +9 -0
- package/transforms/Oriya-Kannada.txt +7 -0
- package/transforms/Oriya-Latin.json +9 -0
- package/transforms/Oriya-Latin.txt +7 -0
- package/transforms/Oriya-Malayalam.json +9 -0
- package/transforms/Oriya-Malayalam.txt +7 -0
- package/transforms/Oriya-Tamil.json +9 -0
- package/transforms/Oriya-Tamil.txt +7 -0
- package/transforms/Oriya-Telugu.json +9 -0
- package/transforms/Oriya-Telugu.txt +7 -0
- package/transforms/Oriya-ur.json +8 -0
- package/transforms/Oriya-ur.txt +7 -0
- package/transforms/Pashto-Latin-BGN.json +9 -0
- package/transforms/Pashto-Latin-BGN.txt +231 -0
- package/transforms/Persian-Latin-BGN.json +9 -0
- package/transforms/Persian-Latin-BGN.txt +203 -0
- package/transforms/Pinyin-NumericPinyin.json +7 -0
- package/transforms/Pinyin-NumericPinyin.txt +8 -0
- package/transforms/Russian-Latin-BGN.json +9 -0
- package/transforms/Russian-Latin-BGN.txt +235 -0
- package/transforms/Serbian-Latin-BGN.json +9 -0
- package/transforms/Serbian-Latin-BGN.txt +119 -0
- package/transforms/Simplified-Traditional.json +11 -0
- package/transforms/Simplified-Traditional.txt +4393 -0
- package/transforms/Syriac-Latin.json +11 -0
- package/transforms/Syriac-Latin.txt +52 -0
- package/transforms/Tamil-Arabic.json +9 -0
- package/transforms/Tamil-Arabic.txt +7 -0
- package/transforms/Tamil-Bengali.json +9 -0
- package/transforms/Tamil-Bengali.txt +7 -0
- package/transforms/Tamil-Devanagari.json +9 -0
- package/transforms/Tamil-Devanagari.txt +7 -0
- package/transforms/Tamil-Gujarati.json +9 -0
- package/transforms/Tamil-Gujarati.txt +7 -0
- package/transforms/Tamil-Gurmukhi.json +9 -0
- package/transforms/Tamil-Gurmukhi.txt +7 -0
- package/transforms/Tamil-InterIndic.json +7 -0
- package/transforms/Tamil-InterIndic.txt +70 -0
- package/transforms/Tamil-Kannada.json +9 -0
- package/transforms/Tamil-Kannada.txt +7 -0
- package/transforms/Tamil-Latin.json +9 -0
- package/transforms/Tamil-Latin.txt +7 -0
- package/transforms/Tamil-Malayalam.json +9 -0
- package/transforms/Tamil-Malayalam.txt +7 -0
- package/transforms/Tamil-Oriya.json +9 -0
- package/transforms/Tamil-Oriya.txt +7 -0
- package/transforms/Tamil-Telugu.json +9 -0
- package/transforms/Tamil-Telugu.txt +7 -0
- package/transforms/Tamil-ur.json +8 -0
- package/transforms/Tamil-ur.txt +7 -0
- package/transforms/Telugu-Arabic.json +9 -0
- package/transforms/Telugu-Arabic.txt +7 -0
- package/transforms/Telugu-Bengali.json +9 -0
- package/transforms/Telugu-Bengali.txt +7 -0
- package/transforms/Telugu-Devanagari.json +9 -0
- package/transforms/Telugu-Devanagari.txt +7 -0
- package/transforms/Telugu-Gujarati.json +9 -0
- package/transforms/Telugu-Gujarati.txt +7 -0
- package/transforms/Telugu-Gurmukhi.json +9 -0
- package/transforms/Telugu-Gurmukhi.txt +7 -0
- package/transforms/Telugu-InterIndic.json +7 -0
- package/transforms/Telugu-InterIndic.txt +87 -0
- package/transforms/Telugu-Kannada.json +9 -0
- package/transforms/Telugu-Kannada.txt +7 -0
- package/transforms/Telugu-Latin.json +9 -0
- package/transforms/Telugu-Latin.txt +7 -0
- package/transforms/Telugu-Malayalam.json +9 -0
- package/transforms/Telugu-Malayalam.txt +7 -0
- package/transforms/Telugu-Oriya.json +9 -0
- package/transforms/Telugu-Oriya.txt +7 -0
- package/transforms/Telugu-Tamil.json +9 -0
- package/transforms/Telugu-Tamil.txt +7 -0
- package/transforms/Telugu-ur.json +8 -0
- package/transforms/Telugu-ur.txt +7 -0
- package/transforms/Thaana-Latin.json +11 -0
- package/transforms/Thaana-Latin.txt +433 -0
- package/transforms/Thai-Latin.json +9 -0
- package/transforms/Thai-Latin.txt +9 -0
- package/transforms/Thai-ThaiLogical.json +7 -0
- package/transforms/Thai-ThaiLogical.txt +16 -0
- package/transforms/Thai-ThaiSemi.json +7 -0
- package/transforms/Thai-ThaiSemi.txt +6 -0
- package/transforms/ThaiLogical-Latin.json +7 -0
- package/transforms/ThaiLogical-Latin.txt +147 -0
- package/transforms/Turkmen-Latin-BGN.json +9 -0
- package/transforms/Turkmen-Latin-BGN.txt +302 -0
- package/transforms/Ukrainian-Latin-BGN.json +9 -0
- package/transforms/Ukrainian-Latin-BGN.txt +283 -0
- package/transforms/Uzbek-Latin-BGN.json +9 -0
- package/transforms/Uzbek-Latin-BGN.txt +261 -0
- package/transforms/am-Ethi-t-am-brai.json +11 -0
- package/transforms/am-Ethi-t-am-brai.txt +652 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.json +9 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.txt +6925 -0
- package/transforms/am-Ethi-t-d0-morse.json +9 -0
- package/transforms/am-Ethi-t-d0-morse.txt +657 -0
- package/transforms/am-am_FONIPA.json +9 -0
- package/transforms/am-am_FONIPA.txt +694 -0
- package/transforms/am-ar.json +8 -0
- package/transforms/am-ar.txt +5 -0
- package/transforms/am-chr.json +8 -0
- package/transforms/am-chr.txt +4 -0
- package/transforms/am-fa.json +8 -0
- package/transforms/am-fa.txt +4 -0
- package/transforms/az-Lower.json +8 -0
- package/transforms/az-Lower.txt +13 -0
- package/transforms/az-Title.json +8 -0
- package/transforms/az-Title.txt +11 -0
- package/transforms/az-Upper.json +8 -0
- package/transforms/az-Upper.txt +5 -0
- package/transforms/blt-fonipa-t-blt.json +8 -0
- package/transforms/blt-fonipa-t-blt.txt +132 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.txt +537 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.txt +773 -0
- package/transforms/ch-am.json +8 -0
- package/transforms/ch-am.txt +4 -0
- package/transforms/ch-ar.json +8 -0
- package/transforms/ch-ar.txt +4 -0
- package/transforms/ch-ch_FONIPA.json +8 -0
- package/transforms/ch-ch_FONIPA.txt +79 -0
- package/transforms/ch-chr.json +8 -0
- package/transforms/ch-chr.txt +4 -0
- package/transforms/ch-fa.json +8 -0
- package/transforms/ch-fa.txt +4 -0
- package/transforms/chr-chr_FONIPA.json +8 -0
- package/transforms/chr-chr_FONIPA.txt +111 -0
- package/transforms/cs-am.json +8 -0
- package/transforms/cs-am.txt +4 -0
- package/transforms/cs-ar.json +8 -0
- package/transforms/cs-ar.txt +4 -0
- package/transforms/cs-chr.json +8 -0
- package/transforms/cs-chr.txt +4 -0
- package/transforms/cs-cs_FONIPA.json +8 -0
- package/transforms/cs-cs_FONIPA.txt +74 -0
- package/transforms/cs-fa.json +8 -0
- package/transforms/cs-fa.txt +4 -0
- package/transforms/cs-ja.json +8 -0
- package/transforms/cs-ja.txt +4 -0
- package/transforms/cs-ko.json +8 -0
- package/transforms/cs-ko.txt +4 -0
- package/transforms/cs_FONIPA-ja.json +8 -0
- package/transforms/cs_FONIPA-ja.txt +228 -0
- package/transforms/cs_FONIPA-ko.json +8 -0
- package/transforms/cs_FONIPA-ko.txt +88 -0
- package/transforms/cy-fonipa-t-cy.json +8 -0
- package/transforms/cy-fonipa-t-cy.txt +189 -0
- package/transforms/de-ASCII.json +8 -0
- package/transforms/de-ASCII.txt +15 -0
- package/transforms/dsb-dsb_FONIPA.json +8 -0
- package/transforms/dsb-dsb_FONIPA.txt +67 -0
- package/transforms/el-Lower.json +8 -0
- package/transforms/el-Lower.txt +12 -0
- package/transforms/el-Title.json +8 -0
- package/transforms/el-Title.txt +12 -0
- package/transforms/el-Upper.json +8 -0
- package/transforms/el-Upper.txt +11 -0
- package/transforms/eo-am.json +8 -0
- package/transforms/eo-am.txt +4 -0
- package/transforms/eo-ar.json +8 -0
- package/transforms/eo-ar.txt +4 -0
- package/transforms/eo-chr.json +8 -0
- package/transforms/eo-chr.txt +4 -0
- package/transforms/eo-eo_FONIPA.json +8 -0
- package/transforms/eo-eo_FONIPA.txt +47 -0
- package/transforms/eo-fa.json +8 -0
- package/transforms/eo-fa.txt +4 -0
- package/transforms/es-am.json +8 -0
- package/transforms/es-am.txt +4 -0
- package/transforms/es-ar.json +8 -0
- package/transforms/es-ar.txt +13 -0
- package/transforms/es-chr.json +8 -0
- package/transforms/es-chr.txt +4 -0
- package/transforms/es-es_FONIPA.json +8 -0
- package/transforms/es-es_FONIPA.txt +139 -0
- package/transforms/es-fa.json +8 -0
- package/transforms/es-fa.txt +13 -0
- package/transforms/es-ja.json +8 -0
- package/transforms/es-ja.txt +4 -0
- package/transforms/es-zh.json +8 -0
- package/transforms/es-zh.txt +4 -0
- package/transforms/es_419-am.json +8 -0
- package/transforms/es_419-am.txt +5 -0
- package/transforms/es_419-ar.json +8 -0
- package/transforms/es_419-ar.txt +14 -0
- package/transforms/es_419-chr.json +8 -0
- package/transforms/es_419-chr.txt +5 -0
- package/transforms/es_419-fa.json +8 -0
- package/transforms/es_419-fa.txt +14 -0
- package/transforms/es_419-ja.json +8 -0
- package/transforms/es_419-ja.txt +5 -0
- package/transforms/es_419-zh.json +8 -0
- package/transforms/es_419-zh.txt +5 -0
- package/transforms/es_FONIPA-am.json +8 -0
- package/transforms/es_FONIPA-am.txt +230 -0
- package/transforms/es_FONIPA-es_419_FONIPA.json +8 -0
- package/transforms/es_FONIPA-es_419_FONIPA.txt +6 -0
- package/transforms/es_FONIPA-ja.json +8 -0
- package/transforms/es_FONIPA-ja.txt +155 -0
- package/transforms/es_FONIPA-zh.json +8 -0
- package/transforms/es_FONIPA-zh.txt +522 -0
- package/transforms/fa-fa_FONIPA.json +8 -0
- package/transforms/fa-fa_FONIPA.txt +107 -0
- package/transforms/gz-Ethi-t-und-sarb.json +11 -0
- package/transforms/gz-Ethi-t-und-sarb.txt +180 -0
- package/transforms/ha-ha_NE.json +8 -0
- package/transforms/ha-ha_NE.txt +6 -0
- package/transforms/hy-am.json +8 -0
- package/transforms/hy-am.txt +4 -0
- package/transforms/hy-ar.json +8 -0
- package/transforms/hy-ar.txt +4 -0
- package/transforms/hy-chr.json +8 -0
- package/transforms/hy-chr.txt +4 -0
- package/transforms/hy-fa.json +8 -0
- package/transforms/hy-fa.txt +4 -0
- package/transforms/hy-hy_FONIPA.json +8 -0
- package/transforms/hy-hy_FONIPA.txt +52 -0
- package/transforms/hy_AREVMDA-am.json +8 -0
- package/transforms/hy_AREVMDA-am.txt +4 -0
- package/transforms/hy_AREVMDA-ar.json +8 -0
- package/transforms/hy_AREVMDA-ar.txt +4 -0
- package/transforms/hy_AREVMDA-chr.json +8 -0
- package/transforms/hy_AREVMDA-chr.txt +4 -0
- package/transforms/hy_AREVMDA-fa.json +8 -0
- package/transforms/hy_AREVMDA-fa.txt +4 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.json +8 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.txt +80 -0
- package/transforms/ia-am.json +8 -0
- package/transforms/ia-am.txt +4 -0
- package/transforms/ia-ar.json +8 -0
- package/transforms/ia-ar.txt +4 -0
- package/transforms/ia-chr.json +8 -0
- package/transforms/ia-chr.txt +4 -0
- package/transforms/ia-fa.json +8 -0
- package/transforms/ia-fa.txt +4 -0
- package/transforms/ia-ia_FONIPA.json +8 -0
- package/transforms/ia-ia_FONIPA.txt +71 -0
- package/transforms/it-am.json +8 -0
- package/transforms/it-am.txt +257 -0
- package/transforms/it-ja.json +8 -0
- package/transforms/it-ja.txt +259 -0
- package/transforms/ja_Latn-ko.json +8 -0
- package/transforms/ja_Latn-ko.txt +141 -0
- package/transforms/ja_Latn-ru.json +8 -0
- package/transforms/ja_Latn-ru.txt +123 -0
- package/transforms/kk-am.json +8 -0
- package/transforms/kk-am.txt +4 -0
- package/transforms/kk-ar.json +8 -0
- package/transforms/kk-ar.txt +4 -0
- package/transforms/kk-chr.json +8 -0
- package/transforms/kk-chr.txt +4 -0
- package/transforms/kk-fa.json +8 -0
- package/transforms/kk-fa.txt +4 -0
- package/transforms/kk-kk_FONIPA.json +8 -0
- package/transforms/kk-kk_FONIPA.txt +59 -0
- package/transforms/ky-am.json +8 -0
- package/transforms/ky-am.txt +4 -0
- package/transforms/ky-ar.json +8 -0
- package/transforms/ky-ar.txt +4 -0
- package/transforms/ky-chr.json +8 -0
- package/transforms/ky-chr.txt +4 -0
- package/transforms/ky-fa.json +8 -0
- package/transforms/ky-fa.txt +4 -0
- package/transforms/ky-ky_FONIPA.json +8 -0
- package/transforms/ky-ky_FONIPA.txt +71 -0
- package/transforms/la-la_FONIPA.json +8 -0
- package/transforms/la-la_FONIPA.txt +79 -0
- package/transforms/lt-Lower.json +8 -0
- package/transforms/lt-Lower.txt +20 -0
- package/transforms/lt-Title.json +8 -0
- package/transforms/lt-Title.txt +15 -0
- package/transforms/lt-Upper.json +8 -0
- package/transforms/lt-Upper.txt +8 -0
- package/transforms/mn-mn_Latn-MNS.json +8 -0
- package/transforms/mn-mn_Latn-MNS.txt +86 -0
- package/transforms/my-am.json +8 -0
- package/transforms/my-am.txt +4 -0
- package/transforms/my-ar.json +8 -0
- package/transforms/my-ar.txt +4 -0
- package/transforms/my-chr.json +8 -0
- package/transforms/my-chr.txt +4 -0
- package/transforms/my-fa.json +8 -0
- package/transforms/my-fa.txt +4 -0
- package/transforms/my-my_FONIPA.json +8 -0
- package/transforms/my-my_FONIPA.txt +325 -0
- package/transforms/my-t-my-d0-zawgyi.json +8 -0
- package/transforms/my-t-my-d0-zawgyi.txt +222 -0
- package/transforms/my-t-my-s0-zawgyi.json +8 -0
- package/transforms/my-t-my-s0-zawgyi.txt +231 -0
- package/transforms/nl-Title.json +8 -0
- package/transforms/nl-Title.txt +7 -0
- package/transforms/nv-nv_FONIPA.json +8 -0
- package/transforms/nv-nv_FONIPA.txt +74 -0
- package/transforms/pl-am.json +8 -0
- package/transforms/pl-am.txt +4 -0
- package/transforms/pl-ar.json +8 -0
- package/transforms/pl-ar.txt +4 -0
- package/transforms/pl-chr.json +8 -0
- package/transforms/pl-chr.txt +4 -0
- package/transforms/pl-fa.json +8 -0
- package/transforms/pl-fa.txt +4 -0
- package/transforms/pl-ja.json +8 -0
- package/transforms/pl-ja.txt +4 -0
- package/transforms/pl-pl_FONIPA.json +8 -0
- package/transforms/pl-pl_FONIPA.txt +113 -0
- package/transforms/pl_FONIPA-ja.json +8 -0
- package/transforms/pl_FONIPA-ja.txt +301 -0
- package/transforms/rm_SURSILV-am.json +8 -0
- package/transforms/rm_SURSILV-am.txt +4 -0
- package/transforms/rm_SURSILV-ar.json +8 -0
- package/transforms/rm_SURSILV-ar.txt +4 -0
- package/transforms/rm_SURSILV-chr.json +8 -0
- package/transforms/rm_SURSILV-chr.txt +4 -0
- package/transforms/rm_SURSILV-fa.json +8 -0
- package/transforms/rm_SURSILV-fa.txt +4 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.json +8 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.txt +96 -0
- package/transforms/ro-am.json +8 -0
- package/transforms/ro-am.txt +4 -0
- package/transforms/ro-ar.json +8 -0
- package/transforms/ro-ar.txt +4 -0
- package/transforms/ro-chr.json +8 -0
- package/transforms/ro-chr.txt +4 -0
- package/transforms/ro-fa.json +8 -0
- package/transforms/ro-fa.txt +4 -0
- package/transforms/ro-ja.json +8 -0
- package/transforms/ro-ja.txt +4 -0
- package/transforms/ro-ro_FONIPA.json +8 -0
- package/transforms/ro-ro_FONIPA.txt +121 -0
- package/transforms/ro_FONIPA-ja.json +8 -0
- package/transforms/ro_FONIPA-ja.txt +211 -0
- package/transforms/ru-ja.json +8 -0
- package/transforms/ru-ja.txt +444 -0
- package/transforms/ru-zh.json +8 -0
- package/transforms/ru-zh.txt +996 -0
- package/transforms/ru_Latn-ru-BGN.json +9 -0
- package/transforms/ru_Latn-ru-BGN.txt +97 -0
- package/transforms/sat-am.json +8 -0
- package/transforms/sat-am.txt +6 -0
- package/transforms/sat-ar.json +8 -0
- package/transforms/sat-ar.txt +6 -0
- package/transforms/sat-chr.json +8 -0
- package/transforms/sat-chr.txt +6 -0
- package/transforms/sat-fa.json +8 -0
- package/transforms/sat-fa.txt +6 -0
- package/transforms/sat_Olck-sat_FONIPA.json +8 -0
- package/transforms/sat_Olck-sat_FONIPA.txt +174 -0
- package/transforms/sgw-Ethi-t-und-ethi.json +11 -0
- package/transforms/sgw-Ethi-t-und-ethi.txt +138 -0
- package/transforms/si-am.json +8 -0
- package/transforms/si-am.txt +4 -0
- package/transforms/si-ar.json +8 -0
- package/transforms/si-ar.txt +4 -0
- package/transforms/si-chr.json +8 -0
- package/transforms/si-chr.txt +4 -0
- package/transforms/si-fa.json +8 -0
- package/transforms/si-fa.txt +4 -0
- package/transforms/si-si_FONIPA.json +8 -0
- package/transforms/si-si_FONIPA.txt +157 -0
- package/transforms/si-si_Latn.json +8 -0
- package/transforms/si-si_Latn.txt +94 -0
- package/transforms/sk-am.json +8 -0
- package/transforms/sk-am.txt +4 -0
- package/transforms/sk-ar.json +8 -0
- package/transforms/sk-ar.txt +4 -0
- package/transforms/sk-chr.json +8 -0
- package/transforms/sk-chr.txt +4 -0
- package/transforms/sk-fa.json +8 -0
- package/transforms/sk-fa.txt +4 -0
- package/transforms/sk-ja.json +8 -0
- package/transforms/sk-ja.txt +4 -0
- package/transforms/sk-sk_FONIPA.json +8 -0
- package/transforms/sk-sk_FONIPA.txt +101 -0
- package/transforms/sk_FONIPA-ja.json +8 -0
- package/transforms/sk_FONIPA-ja.txt +252 -0
- package/transforms/ta-ta_FONIPA.json +8 -0
- package/transforms/ta-ta_FONIPA.txt +73 -0
- package/transforms/tlh-am.json +8 -0
- package/transforms/tlh-am.txt +4 -0
- package/transforms/tlh-ar.json +8 -0
- package/transforms/tlh-ar.txt +4 -0
- package/transforms/tlh-chr.json +8 -0
- package/transforms/tlh-chr.txt +4 -0
- package/transforms/tlh-fa.json +8 -0
- package/transforms/tlh-fa.txt +4 -0
- package/transforms/tlh-tlh_FONIPA.json +8 -0
- package/transforms/tlh-tlh_FONIPA.txt +46 -0
- package/transforms/tr-Lower.json +8 -0
- package/transforms/tr-Lower.txt +13 -0
- package/transforms/tr-Title.json +8 -0
- package/transforms/tr-Title.txt +11 -0
- package/transforms/tr-Upper.json +8 -0
- package/transforms/tr-Upper.txt +8 -0
- package/transforms/ug-ug_FONIPA.json +8 -0
- package/transforms/ug-ug_FONIPA.txt +69 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.json +11 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.txt +747 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.txt +633 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.txt +757 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.txt +585 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.txt +640 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.txt +619 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.txt +627 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.txt +695 -0
- package/transforms/und-Ethi-t-und-latn.json +11 -0
- package/transforms/und-Ethi-t-und-latn.txt +16 -0
- package/transforms/und_FONIPA-ar.json +8 -0
- package/transforms/und_FONIPA-ar.txt +114 -0
- package/transforms/und_FONIPA-chr.json +8 -0
- package/transforms/und_FONIPA-chr.txt +172 -0
- package/transforms/und_FONIPA-fa.json +8 -0
- package/transforms/und_FONIPA-fa.txt +109 -0
- package/transforms/uz_Cyrl-uz_Latn.json +9 -0
- package/transforms/uz_Cyrl-uz_Latn.txt +103 -0
- package/transforms/vec-vec_FONIPA.json +8 -0
- package/transforms/vec-vec_FONIPA.txt +85 -0
- package/transforms/xh-am.json +8 -0
- package/transforms/xh-am.txt +4 -0
- package/transforms/xh-ar.json +8 -0
- package/transforms/xh-ar.txt +4 -0
- package/transforms/xh-chr.json +8 -0
- package/transforms/xh-chr.txt +4 -0
- package/transforms/xh-fa.json +8 -0
- package/transforms/xh-fa.txt +4 -0
- package/transforms/xh-xh_FONIPA.json +8 -0
- package/transforms/xh-xh_FONIPA.txt +85 -0
- package/transforms/yo-yo_BJ.json +8 -0
- package/transforms/yo-yo_BJ.txt +36 -0
- package/transforms/zh_Latn_PINYIN-ru.json +8 -0
- package/transforms/zh_Latn_PINYIN-ru.txt +148 -0
- package/transforms/zu-am.json +8 -0
- package/transforms/zu-am.txt +4 -0
- package/transforms/zu-ar.json +8 -0
- package/transforms/zu-ar.txt +4 -0
- package/transforms/zu-chr.json +8 -0
- package/transforms/zu-chr.txt +4 -0
- package/transforms/zu-fa.json +8 -0
- package/transforms/zu-fa.txt +4 -0
- package/transforms/zu-zu_FONIPA.json +8 -0
- package/transforms/zu-zu_FONIPA.txt +72 -0
- package/transforms.json +385 -0
|
@@ -0,0 +1,155 @@
|
|
|
1
|
+
|
|
2
|
+
# Phonemic transcription of Spanish into Katakana.
|
|
3
|
+
$word_boundary = [-\ $] ;
|
|
4
|
+
$vowel = [aeijouw] ; # Vowels and glides
|
|
5
|
+
$not_vowel = [^$vowel] ;
|
|
6
|
+
#
|
|
7
|
+
#
|
|
8
|
+
# First pass: Collapse phonetic distinctions not preserved in Katakana.
|
|
9
|
+
β → | b;
|
|
10
|
+
ð → | d;
|
|
11
|
+
ɣ → | g;
|
|
12
|
+
ŋ → | n;
|
|
13
|
+
θ → | s;
|
|
14
|
+
ɾ → | r;
|
|
15
|
+
[ij{i̯}]+ → i;
|
|
16
|
+
[uw{u̯}]+ → u;
|
|
17
|
+
#
|
|
18
|
+
#
|
|
19
|
+
nn → n ;
|
|
20
|
+
#
|
|
21
|
+
#
|
|
22
|
+
::Null;
|
|
23
|
+
#
|
|
24
|
+
#
|
|
25
|
+
# Main pass: Phoneme to Katakana conversion.
|
|
26
|
+
'.' → ;
|
|
27
|
+
a → ア;
|
|
28
|
+
ba → バ;
|
|
29
|
+
bb → ッ | b;
|
|
30
|
+
be → ベ;
|
|
31
|
+
bi → ビ;
|
|
32
|
+
bo → ボ;
|
|
33
|
+
bu → ブ;
|
|
34
|
+
b → ブ ;
|
|
35
|
+
da → ダ;
|
|
36
|
+
dd → ッ | d;
|
|
37
|
+
de → デ;
|
|
38
|
+
di → ディ;
|
|
39
|
+
do → ド;
|
|
40
|
+
du → ドゥ;
|
|
41
|
+
#
|
|
42
|
+
#
|
|
43
|
+
# 'd' at the end of a word is usually not pronounced; write it as a long-vowel mark (ー).
|
|
44
|
+
d } $word_boundary → ー;
|
|
45
|
+
d → ド;
|
|
46
|
+
e → エ;
|
|
47
|
+
fa → ファ;
|
|
48
|
+
fe → フェ;
|
|
49
|
+
ff → ッ | f;
|
|
50
|
+
fi → フィ;
|
|
51
|
+
fo → フォ;
|
|
52
|
+
fu → フ;
|
|
53
|
+
f → フ;
|
|
54
|
+
ga → ガ;
|
|
55
|
+
ge → グエ;
|
|
56
|
+
gi → グイ;
|
|
57
|
+
gg → ッ | g;
|
|
58
|
+
go → ゴ;
|
|
59
|
+
gu → グ;
|
|
60
|
+
g → グ;
|
|
61
|
+
i → イ ;
|
|
62
|
+
ʝa → ヤ ;
|
|
63
|
+
ʝe → イェ ;
|
|
64
|
+
ʝi → イ ;
|
|
65
|
+
ʝu → ユ ;
|
|
66
|
+
ʝo → ヨ ;
|
|
67
|
+
ʝ → イ ;
|
|
68
|
+
ka → カ;
|
|
69
|
+
ke → ケ;
|
|
70
|
+
ki → キ;
|
|
71
|
+
kk → ッ | k;
|
|
72
|
+
ko → コ;
|
|
73
|
+
ku → ク;
|
|
74
|
+
k → ク;
|
|
75
|
+
la → ラ ;
|
|
76
|
+
le → レ ;
|
|
77
|
+
li → リ ;
|
|
78
|
+
lo → ロ ;
|
|
79
|
+
lu → ル ;
|
|
80
|
+
l → ル ;
|
|
81
|
+
ʎa → リャ ;
|
|
82
|
+
ʎe → レ ;
|
|
83
|
+
ʎi → リ ;
|
|
84
|
+
ʎo → リョ ;
|
|
85
|
+
ʎu → リュ ;
|
|
86
|
+
ʎ → ル ;
|
|
87
|
+
ma → マ ;
|
|
88
|
+
me → メ ;
|
|
89
|
+
mi → ミ ;
|
|
90
|
+
mo → モ ;
|
|
91
|
+
mu → ム ;
|
|
92
|
+
m } $word_boundary → ム ;
|
|
93
|
+
m } $not_vowel → ン ;
|
|
94
|
+
m → ム ;
|
|
95
|
+
na → ナ ;
|
|
96
|
+
ne → ネ ;
|
|
97
|
+
ni → ニ ;
|
|
98
|
+
no → ノ ;
|
|
99
|
+
nu → ヌ ;
|
|
100
|
+
n → ン ;
|
|
101
|
+
ɲa → ニャ ;
|
|
102
|
+
ɲe → ニェ ;
|
|
103
|
+
ɲi → ニ ;
|
|
104
|
+
ɲo → ニョ ;
|
|
105
|
+
ɲu → ニュ ;
|
|
106
|
+
o → オ ;
|
|
107
|
+
pa → パ ;
|
|
108
|
+
pe → ペ ;
|
|
109
|
+
pi → ピ ;
|
|
110
|
+
po → ポ ;
|
|
111
|
+
pp → ッ | p;
|
|
112
|
+
pu → プ ;
|
|
113
|
+
p → プ ;
|
|
114
|
+
ra → ラ ;
|
|
115
|
+
re → レ ;
|
|
116
|
+
ri → リ ;
|
|
117
|
+
ro → ロ ;
|
|
118
|
+
ru → ル ;
|
|
119
|
+
r → ル;
|
|
120
|
+
sa → サ ;
|
|
121
|
+
se → セ ;
|
|
122
|
+
si → シ ;
|
|
123
|
+
so → ソ ;
|
|
124
|
+
su → ス ;
|
|
125
|
+
s → ス ;
|
|
126
|
+
ta → タ ;
|
|
127
|
+
te → テ ;
|
|
128
|
+
ti → ティ ;
|
|
129
|
+
to → ト ;
|
|
130
|
+
tsa → ツァ ;
|
|
131
|
+
tse → ツェ ;
|
|
132
|
+
tsi → ツィ ;
|
|
133
|
+
tso → ツォ ;
|
|
134
|
+
tsu → ツ ;
|
|
135
|
+
ts → ツ ;
|
|
136
|
+
tt → ッ | t;
|
|
137
|
+
tu → トゥ ;
|
|
138
|
+
t → ト ;
|
|
139
|
+
ʧa → チャ ;
|
|
140
|
+
ʧe → チェ ;
|
|
141
|
+
ʧi → チ ;
|
|
142
|
+
ʧo → チョ ;
|
|
143
|
+
ʧu → チュ ;
|
|
144
|
+
ʧ → チュ ;
|
|
145
|
+
u → ウ ;
|
|
146
|
+
xa → ハ ;
|
|
147
|
+
xe → ヘ ;
|
|
148
|
+
xi → ヒ ;
|
|
149
|
+
xo → ホ ;
|
|
150
|
+
xu → フ ;
|
|
151
|
+
x → フ ;
|
|
152
|
+
#
|
|
153
|
+
#
|
|
154
|
+
::NFC;
|
|
155
|
+
|
|
@@ -0,0 +1,522 @@
|
|
|
1
|
+
|
|
2
|
+
# Transforms Spanish to Mandarin Chinese. The input Spanish string must be in
|
|
3
|
+
# phonemic IPA transcription (es_FONIPA); the output is in Simplified Chinese.
|
|
4
|
+
$word_boundary = [-\ $];
|
|
5
|
+
$vowel = [aeijouw]; # Vowels and glides
|
|
6
|
+
$not_vowel = [^$vowel];
|
|
7
|
+
# First pass: Collapse phonetic distinctions not preserved in Mandarin.
|
|
8
|
+
ð → | d;
|
|
9
|
+
ɣ → | g;
|
|
10
|
+
ŋ → | n;
|
|
11
|
+
θ → | s;
|
|
12
|
+
ɾ → | r;
|
|
13
|
+
ff → f ;
|
|
14
|
+
kk → k ;
|
|
15
|
+
mm → m ;
|
|
16
|
+
nn → n ;
|
|
17
|
+
pp → p ;
|
|
18
|
+
tt → t ;
|
|
19
|
+
tʧ → ʧ ;
|
|
20
|
+
aa → a ;
|
|
21
|
+
oi̯ → oi ;
|
|
22
|
+
oo → o ;
|
|
23
|
+
uu → u ;
|
|
24
|
+
[^dgktx] { ei̯ → e ;
|
|
25
|
+
[^-\ .$] { eu̯ → eu ;
|
|
26
|
+
[^-\ .$] { ou̯ → o;
|
|
27
|
+
[^j] { ui → wi ;
|
|
28
|
+
[^$word_boundary] { m } [bp] → n; # GB/T 17693.5-2009, 5.3.2
|
|
29
|
+
s[θs] → s; # GB/T 17693.5-2009, 5.3.4
|
|
30
|
+
[^ʧ] { jo → io; # GB/T 17693.5-2009 表 1, 注 7
|
|
31
|
+
::Null;
|
|
32
|
+
j } an $not_vowel → i ; # GB/T 17693.5-2009 表 1, 注 8
|
|
33
|
+
# GB/T 17693.5-2009 表 1, 注 8 also says that <uai> should be treated as if
|
|
34
|
+
# it was <u> plus <ai>. This is not borne out by the observed data, which
|
|
35
|
+
# suggests that <ua> plus <i> is the more appropriate choice in some
|
|
36
|
+
# situations.
|
|
37
|
+
[g.$] { wai̯ → wai ;
|
|
38
|
+
wai̯ → uai̯ ;
|
|
39
|
+
[g.$] { wau̯ → wau ;
|
|
40
|
+
wau̯ → uau̯ ;
|
|
41
|
+
jau̯ → iau̯ ;
|
|
42
|
+
# Even though "ao" is not a diphthong in Spanish, Mandarin treats it as one.
|
|
43
|
+
[^jw] { ao } [^n] → au̯ ;
|
|
44
|
+
[^jw] { ao } n $vowel → au̯ ;
|
|
45
|
+
# Main pass: Phoneme to Hanzi conversion.
|
|
46
|
+
# This generally follows GB/T 17693.5-2009 表 1, unless otherwise noted.
|
|
47
|
+
::Null;
|
|
48
|
+
'.' → ;
|
|
49
|
+
ai̯ → 艾 ;
|
|
50
|
+
an } $not_vowel → 安 ;
|
|
51
|
+
au̯ → 奥 ;
|
|
52
|
+
a → 阿 ;
|
|
53
|
+
bai̯ → 拜 ;
|
|
54
|
+
ban } $not_vowel → 班 ;
|
|
55
|
+
bau̯ → 包 ;
|
|
56
|
+
ba → 巴 ;
|
|
57
|
+
ben } $not_vowel → 本 ;
|
|
58
|
+
be → 贝 ;
|
|
59
|
+
bin } $not_vowel → 宾 ;
|
|
60
|
+
bi → 比 ;
|
|
61
|
+
bja → 比亚 ;
|
|
62
|
+
bjen } $not_vowel → 比恩 ;
|
|
63
|
+
bje → 别 ;
|
|
64
|
+
bju → 比乌 ;
|
|
65
|
+
bon } $not_vowel → 邦 ;
|
|
66
|
+
bo → 博 ;
|
|
67
|
+
bun } $not_vowel → 本 ;
|
|
68
|
+
bu → 布 ;
|
|
69
|
+
bwan } $not_vowel → 布安 ;
|
|
70
|
+
bwa → 布阿 ;
|
|
71
|
+
bwen } $not_vowel → 布恩 ; # Should be 本, per GB/T 17693.5-2009 表 1.
|
|
72
|
+
bwe → 布埃 ;
|
|
73
|
+
bwin } $not_vowel → 布因 ; # Nonstandard, but fits observed data.
|
|
74
|
+
bwi → 布伊 ;
|
|
75
|
+
bwo → 博 ;
|
|
76
|
+
b → 布 ;
|
|
77
|
+
βai̯ → 瓦伊 ;
|
|
78
|
+
βan } $not_vowel → 万 ;
|
|
79
|
+
βau̯ → 沃 ;
|
|
80
|
+
βa → 瓦 ;
|
|
81
|
+
βen } $not_vowel → 文 ;
|
|
82
|
+
βe → 韦 ;
|
|
83
|
+
βin } $not_vowel → 温 ;
|
|
84
|
+
βi → 维 ;
|
|
85
|
+
βja → 维亚 ;
|
|
86
|
+
βjen } $not_vowel → 维恩 ;
|
|
87
|
+
βje → 维耶 ;
|
|
88
|
+
βju → 维乌 ;
|
|
89
|
+
βon } $not_vowel → 翁 ;
|
|
90
|
+
βo → 沃 ;
|
|
91
|
+
βun } $not_vowel → 文 ;
|
|
92
|
+
βu → 武 ;
|
|
93
|
+
βwan } $not_vowel → 万 ;
|
|
94
|
+
βwa → 瓦 ;
|
|
95
|
+
βwen } $not_vowel → 文 ;
|
|
96
|
+
βwe → 武埃 ;
|
|
97
|
+
βwi → 维 ;
|
|
98
|
+
βwo → 沃 ;
|
|
99
|
+
β → 夫 ;
|
|
100
|
+
dai̯ → 代 ;
|
|
101
|
+
dan } $not_vowel → 丹 ;
|
|
102
|
+
dau̯ → 道 ;
|
|
103
|
+
da → 达 ;
|
|
104
|
+
dei̯ → 代 ;
|
|
105
|
+
den } $not_vowel → 登 ;
|
|
106
|
+
de → 德 ;
|
|
107
|
+
din } $not_vowel → 丁 ;
|
|
108
|
+
di → 迪 ;
|
|
109
|
+
dja → 迪亚 ;
|
|
110
|
+
djen } $not_vowel → 迪恩 ;
|
|
111
|
+
dje → 迭 ;
|
|
112
|
+
dju → 迪乌 ;
|
|
113
|
+
don } $not_vowel → 东 ;
|
|
114
|
+
do → 多 ;
|
|
115
|
+
dun } $not_vowel → 敦 ;
|
|
116
|
+
du → 杜 ;
|
|
117
|
+
dwan } $not_vowel → 端 ;
|
|
118
|
+
dwa → 杜阿 ;
|
|
119
|
+
dwen } $not_vowel → 敦 ;
|
|
120
|
+
dwe → 杜埃 ;
|
|
121
|
+
dwi → 杜伊 ;
|
|
122
|
+
dwo → 多 ;
|
|
123
|
+
d } $word_boundary → ;
|
|
124
|
+
d → 德 ;
|
|
125
|
+
ei̯ → 埃 ;
|
|
126
|
+
en } $not_vowel → 恩 ;
|
|
127
|
+
eu̯ → 欧 ;
|
|
128
|
+
e → 埃 ;
|
|
129
|
+
fai̯ → 法伊 ;
|
|
130
|
+
fan } $not_vowel → 凡 ;
|
|
131
|
+
fau̯ → 福 ;
|
|
132
|
+
fa → 法 ;
|
|
133
|
+
fe → 费 ;
|
|
134
|
+
fin } $not_vowel → 芬 ;
|
|
135
|
+
fi → 菲 ;
|
|
136
|
+
fja → 菲亚 ;
|
|
137
|
+
fjen } $not_vowel → 菲恩 ;
|
|
138
|
+
fje → 菲耶 ;
|
|
139
|
+
fju → 菲乌 ;
|
|
140
|
+
fon } $not_vowel → 丰 ;
|
|
141
|
+
fo → 福 ;
|
|
142
|
+
fun } $not_vowel → 丰 ;
|
|
143
|
+
fu → 富 ;
|
|
144
|
+
fwan } $not_vowel → 富安 ;
|
|
145
|
+
fwa → 富阿 ;
|
|
146
|
+
fwen } $not_vowel → 丰 ;
|
|
147
|
+
fwe → 富埃 ;
|
|
148
|
+
fwi → 富伊 ;
|
|
149
|
+
fwo → 福 ;
|
|
150
|
+
# The choice of 弗 vs. 夫 sounds simple according to the GB/T standard, but the
|
|
151
|
+
# data suggest otherwise. Ideally, 弗 should occur at the beginning of a
|
|
152
|
+
# morpheme (e.g. in "villafranca" 比利亚弗兰卡) and 夫 everywhere else. Since
|
|
153
|
+
# we don't have morpheme boundaries, we'll fudge it by writing 夫 at the end of
|
|
154
|
+
# a word and 弗 everywhere else.
|
|
155
|
+
f } $word_boundary → 夫 ;
|
|
156
|
+
f → 弗 ;
|
|
157
|
+
gai̯ → 盖 ;
|
|
158
|
+
gan } $not_vowel → 甘 ;
|
|
159
|
+
gau̯ → 高 ;
|
|
160
|
+
ga → 加 ;
|
|
161
|
+
gei̯ → 盖 ;
|
|
162
|
+
gen } $not_vowel → 根 ;
|
|
163
|
+
ge → 格 ;
|
|
164
|
+
gin } $not_vowel → 金 ;
|
|
165
|
+
gi → 吉 ;
|
|
166
|
+
gja → 吉亚 ;
|
|
167
|
+
gjen } $not_vowel → 吉恩 ;
|
|
168
|
+
gje → 吉耶 ;
|
|
169
|
+
gju → 吉乌 ;
|
|
170
|
+
gon } $not_vowel → 贡 ;
|
|
171
|
+
go → 戈 ;
|
|
172
|
+
gun } $not_vowel → 贡 ;
|
|
173
|
+
gu → 古 ;
|
|
174
|
+
gwan } [$] → 古安 ; # Nonstandard, but fits observed data.
|
|
175
|
+
gwan } $not_vowel → 关 ;
|
|
176
|
+
gwa → 瓜 ;
|
|
177
|
+
gwen } $not_vowel → 古恩 ;
|
|
178
|
+
gwe → 圭 ;
|
|
179
|
+
gwi → 圭 ;
|
|
180
|
+
gwo → 果 ;
|
|
181
|
+
g → 格 ;
|
|
182
|
+
in } $not_vowel → 因 ;
|
|
183
|
+
i → 伊 ;
|
|
184
|
+
ʝai̯ → 亚伊 ;
|
|
185
|
+
ʝan } $not_vowel → 扬 ;
|
|
186
|
+
ʝau̯ → 尧 ;
|
|
187
|
+
ʝa → 亚 ;
|
|
188
|
+
ʝen } $not_vowel → 延 ;
|
|
189
|
+
ʝe → 耶 ;
|
|
190
|
+
ʝin } $not_vowel → 因 ;
|
|
191
|
+
ʝi → 伊 ;
|
|
192
|
+
ʝon } $not_vowel → 永 ;
|
|
193
|
+
ʝo → 约 ;
|
|
194
|
+
ʝun } $not_vowel → 云 ;
|
|
195
|
+
ʝu → 尤 ;
|
|
196
|
+
ʝwan } $not_vowel → 元 ;
|
|
197
|
+
ʝwa → 尤阿 ;
|
|
198
|
+
ʝwen } $not_vowel → 云 ;
|
|
199
|
+
ʝwe → 尤埃 ;
|
|
200
|
+
ʝwi → 尤伊 ;
|
|
201
|
+
ʝwo → 约 ;
|
|
202
|
+
ʝ → 伊 ;
|
|
203
|
+
kai̯ → 凯 ;
|
|
204
|
+
kan } $not_vowel → 坎 ;
|
|
205
|
+
kau̯ → 考 ;
|
|
206
|
+
ka → 卡 ;
|
|
207
|
+
kei̯ → 凯 ;
|
|
208
|
+
ken } $not_vowel → 肯 ;
|
|
209
|
+
ke → 克 ;
|
|
210
|
+
kin } $not_vowel → 金 ;
|
|
211
|
+
ki → 基 ;
|
|
212
|
+
kja → 基亚 ;
|
|
213
|
+
kjen } $not_vowel → 基恩 ;
|
|
214
|
+
kje → 基耶 ;
|
|
215
|
+
kju → 基乌 ;
|
|
216
|
+
kon } $not_vowel → 孔 ;
|
|
217
|
+
ko → 科 ;
|
|
218
|
+
kun } $not_vowel → 昆 ;
|
|
219
|
+
ku → 库 ;
|
|
220
|
+
kwan } $not_vowel → 宽 ;
|
|
221
|
+
kwa → 夸 ;
|
|
222
|
+
kwen } $not_vowel → 昆 ;
|
|
223
|
+
kwe → 库埃 ;
|
|
224
|
+
kwin } $not_vowel → 昆 ;
|
|
225
|
+
kwi → 奎 ;
|
|
226
|
+
kwo → 阔 ;
|
|
227
|
+
k → 克 ;
|
|
228
|
+
lae } [^n] → 莱 ;
|
|
229
|
+
lai̯ → 莱 ;
|
|
230
|
+
lan } $not_vowel → 兰 ;
|
|
231
|
+
lau̯ → 劳 ;
|
|
232
|
+
la → 拉 ;
|
|
233
|
+
len } $not_vowel → 伦 ;
|
|
234
|
+
le → 莱 ;
|
|
235
|
+
lin } $not_vowel → 林 ;
|
|
236
|
+
li → 利 ;
|
|
237
|
+
lja → 利亚 ;
|
|
238
|
+
ljen } $not_vowel → 连 ;
|
|
239
|
+
lje → 列 ;
|
|
240
|
+
lju → 柳 ;
|
|
241
|
+
lon } $not_vowel → 隆 ;
|
|
242
|
+
lo → 洛 ;
|
|
243
|
+
lun } $not_vowel → 伦 ;
|
|
244
|
+
lu → 卢 ;
|
|
245
|
+
lwan } $not_vowel → 卢安 ;
|
|
246
|
+
lwa → 卢阿 ;
|
|
247
|
+
lwen } $not_vowel → 伦 ;
|
|
248
|
+
lwe → 卢埃 ;
|
|
249
|
+
lwi → 卢伊 ;
|
|
250
|
+
lwo → 洛 ;
|
|
251
|
+
l → 尔 ;
|
|
252
|
+
ʎan } $not_vowel → 良 ;
|
|
253
|
+
ʎau̯ → 廖 ;
|
|
254
|
+
ʎa → 利亚 ;
|
|
255
|
+
ʎen } $not_vowel → 连 ;
|
|
256
|
+
ʎe → 列 ;
|
|
257
|
+
ʎin } $not_vowel → 林 ;
|
|
258
|
+
ʎi → 利 ;
|
|
259
|
+
ʎon } $not_vowel → 利翁 ;
|
|
260
|
+
ʎo → 略 ;
|
|
261
|
+
ʎu → 柳 ;
|
|
262
|
+
ʎwan } $not_vowel → 柳安 ;
|
|
263
|
+
ʎwa → 柳阿 ;
|
|
264
|
+
ʎwen } $not_vowel → 柳恩 ;
|
|
265
|
+
ʎwe → 柳埃 ;
|
|
266
|
+
ʎwi → 柳伊 ;
|
|
267
|
+
ʎwo → 略 ;
|
|
268
|
+
ʎ → 尔 ;
|
|
269
|
+
mai̯ → 迈 ;
|
|
270
|
+
man } $not_vowel → 曼 ;
|
|
271
|
+
martin → 马丁 ;
|
|
272
|
+
mau̯ → 毛 ;
|
|
273
|
+
ma → 马 ;
|
|
274
|
+
men } $not_vowel → 门 ;
|
|
275
|
+
me → 梅 ;
|
|
276
|
+
min } $not_vowel → 明 ;
|
|
277
|
+
mi → 米 ;
|
|
278
|
+
mja → 米亚 ;
|
|
279
|
+
mjen } $not_vowel → 缅 ;
|
|
280
|
+
mje → 米耶 ;
|
|
281
|
+
mju → 缪 ;
|
|
282
|
+
mon } $not_vowel → 蒙 ;
|
|
283
|
+
mo → 莫 ;
|
|
284
|
+
mun } $not_vowel → 蒙 ;
|
|
285
|
+
mu → 穆 ;
|
|
286
|
+
mwan } $not_vowel → 穆安 ;
|
|
287
|
+
mwa → 穆阿 ;
|
|
288
|
+
mwen } $not_vowel → 门 ;
|
|
289
|
+
mwe → 穆埃 ;
|
|
290
|
+
mwin } $not_vowel → 穆因 ; # Nonstandard, but fits observed data.
|
|
291
|
+
mwi → 穆伊 ;
|
|
292
|
+
mwo → 莫 ;
|
|
293
|
+
m → 姆 ;
|
|
294
|
+
nai̯ → 奈 ;
|
|
295
|
+
nan } $not_vowel → 南 ;
|
|
296
|
+
nau̯ → 瑙 ;
|
|
297
|
+
na → 纳 ;
|
|
298
|
+
nen } $not_vowel → 嫩 ;
|
|
299
|
+
ne → 内 ;
|
|
300
|
+
nin } $not_vowel → 宁 ;
|
|
301
|
+
ni → 尼 ;
|
|
302
|
+
nja → 尼亚 ;
|
|
303
|
+
njen } $not_vowel → 年 ;
|
|
304
|
+
nje → 涅 ;
|
|
305
|
+
nju → 纽 ;
|
|
306
|
+
non } $not_vowel → 农 ;
|
|
307
|
+
no → 诺 ;
|
|
308
|
+
nun } $not_vowel → 嫩 ;
|
|
309
|
+
nu → 努 ;
|
|
310
|
+
nwan } $not_vowel → 努安 ;
|
|
311
|
+
nwa → 努阿 ;
|
|
312
|
+
nwen } $not_vowel → 农 ;
|
|
313
|
+
nwe → 努埃 ;
|
|
314
|
+
nwi → 努伊 ;
|
|
315
|
+
nwo → 诺 ;
|
|
316
|
+
n → 恩 ;
|
|
317
|
+
ɲan } $not_vowel → 尼扬 ;
|
|
318
|
+
ɲau̯ → 尼奥 ;
|
|
319
|
+
ɲa → 尼亚 ;
|
|
320
|
+
ɲen } $not_vowel → 年 ;
|
|
321
|
+
ɲe → 涅 ;
|
|
322
|
+
ɲin } $not_vowel → 宁 ;
|
|
323
|
+
ɲi → 尼 ;
|
|
324
|
+
ɲon } $not_vowel → 尼翁 ;
|
|
325
|
+
ɲo → 尼奥 ;
|
|
326
|
+
ɲu → 纽 ;
|
|
327
|
+
ɲwan } $not_vowel → 纽安 ;
|
|
328
|
+
ɲwa → 纽阿 ;
|
|
329
|
+
ɲwen } $not_vowel → 纽恩 ;
|
|
330
|
+
ɲwe → 纽埃 ;
|
|
331
|
+
ɲwi → 纽伊 ;
|
|
332
|
+
ɲwo → 尼奥 ;
|
|
333
|
+
on } $not_vowel → 翁 ;
|
|
334
|
+
ou̯ → 欧 ;
|
|
335
|
+
o → 奥 ;
|
|
336
|
+
pai̯ → 派 ;
|
|
337
|
+
pan } $not_vowel → 潘 ;
|
|
338
|
+
pau̯ → 保 ;
|
|
339
|
+
pa → 帕 ;
|
|
340
|
+
pen } $not_vowel → 彭 ;
|
|
341
|
+
pe → 佩 ;
|
|
342
|
+
pin } $not_vowel → 平 ;
|
|
343
|
+
pi → 皮 ;
|
|
344
|
+
pja → 皮亚 ;
|
|
345
|
+
pjen } $not_vowel → 皮恩 ;
|
|
346
|
+
pje → 彼 ;
|
|
347
|
+
pju → 皮乌 ;
|
|
348
|
+
pon } $not_vowel → 蓬 ;
|
|
349
|
+
po → 波 ;
|
|
350
|
+
pun } $not_vowel → 蓬 ;
|
|
351
|
+
pu → 普 ;
|
|
352
|
+
pwan } $not_vowel → 普安 ;
|
|
353
|
+
pwa → 普阿 ;
|
|
354
|
+
pwen } $not_vowel → 蓬 ;
|
|
355
|
+
pwe → 普埃 ;
|
|
356
|
+
pwi → 普伊 ;
|
|
357
|
+
pwo → 波 ;
|
|
358
|
+
p → 普 ;
|
|
359
|
+
rai̯ → 赖 ;
|
|
360
|
+
ran } $not_vowel → 兰 ;
|
|
361
|
+
rau̯ → 劳 ;
|
|
362
|
+
ra → 拉 ;
|
|
363
|
+
ren } $not_vowel → 伦 ;
|
|
364
|
+
re → 雷 ;
|
|
365
|
+
rin } $not_vowel → 林 ;
|
|
366
|
+
ri → 里 ;
|
|
367
|
+
rja → 里亚 ;
|
|
368
|
+
rjen } $not_vowel → 连 ;
|
|
369
|
+
rje → 列 ;
|
|
370
|
+
rju → 留 ;
|
|
371
|
+
ron } $not_vowel → 龙 ;
|
|
372
|
+
ro → 罗 ;
|
|
373
|
+
run } $not_vowel → 伦 ;
|
|
374
|
+
ru → 鲁 ;
|
|
375
|
+
rwan } $not_vowel → 鲁安 ;
|
|
376
|
+
rwa → 鲁阿 ;
|
|
377
|
+
rwen } $not_vowel → 伦 ;
|
|
378
|
+
rwe → 鲁埃 ;
|
|
379
|
+
rwi → 鲁伊 ;
|
|
380
|
+
rwo → 罗 ;
|
|
381
|
+
r → R ;
|
|
382
|
+
sai̯ → 赛 ;
|
|
383
|
+
san } $not_vowel → 桑 ;
|
|
384
|
+
sau̯ → 绍 ;
|
|
385
|
+
sa → 萨 ;
|
|
386
|
+
sen } $not_vowel → 森 ;
|
|
387
|
+
se → 塞 ;
|
|
388
|
+
sin } $not_vowel → 辛 ;
|
|
389
|
+
si → 西 ;
|
|
390
|
+
sja → 西亚 ;
|
|
391
|
+
sjen } $not_vowel → 先 ;
|
|
392
|
+
sje → 谢 ;
|
|
393
|
+
sju → 休 ;
|
|
394
|
+
son } $not_vowel → 松 ;
|
|
395
|
+
so → 索 ;
|
|
396
|
+
sun } $not_vowel → 孙 ;
|
|
397
|
+
su → 苏 ;
|
|
398
|
+
swan } $not_vowel → 苏安 ;
|
|
399
|
+
swa → 苏阿 ;
|
|
400
|
+
swen } $not_vowel → 孙 ;
|
|
401
|
+
swe → 苏埃 ;
|
|
402
|
+
swi → 绥 ;
|
|
403
|
+
swo → 索 ;
|
|
404
|
+
s → 斯 ;
|
|
405
|
+
tai̯ → 泰 ;
|
|
406
|
+
tan } $not_vowel → 坦 ;
|
|
407
|
+
tau̯ → 陶 ;
|
|
408
|
+
ta → 塔 ;
|
|
409
|
+
tei̯ → 泰 ;
|
|
410
|
+
ten } $not_vowel → 滕 ;
|
|
411
|
+
te → 特 ;
|
|
412
|
+
tin } $not_vowel → 廷 ;
|
|
413
|
+
ti → 蒂 ;
|
|
414
|
+
tja → 蒂亚 ;
|
|
415
|
+
tjen } $not_vowel → 蒂恩 ;
|
|
416
|
+
tje → 铁 ;
|
|
417
|
+
tju → 蒂乌 ;
|
|
418
|
+
ton } $not_vowel → 通 ;
|
|
419
|
+
to → 托 ;
|
|
420
|
+
# The rules for /ts/ (tz in the orthography) are nonstandard and derived
|
|
421
|
+
# entirely from the observed data. They apply mostly to native toponyms
|
|
422
|
+
# in Mexico.
|
|
423
|
+
tsa → 察 ;
|
|
424
|
+
tsen } $not_vowel → 岑 ;
|
|
425
|
+
tse → 采 ;
|
|
426
|
+
tsin } $not_vowel → 钦 ;
|
|
427
|
+
tsi → 齐 ;
|
|
428
|
+
tso → 措 ;
|
|
429
|
+
tsun } $not_vowel → 聪 ;
|
|
430
|
+
tsu → 楚 ;
|
|
431
|
+
ts → 茨 ;
|
|
432
|
+
tun } $not_vowel → 通 ;
|
|
433
|
+
tu → 图 ;
|
|
434
|
+
twan } $not_vowel → 图安 ;
|
|
435
|
+
twa → 图阿 ;
|
|
436
|
+
twen } $not_vowel → 通 ;
|
|
437
|
+
twe → 图埃 ;
|
|
438
|
+
twi → 图伊 ;
|
|
439
|
+
two → 托 ;
|
|
440
|
+
t → 特 ;
|
|
441
|
+
ʧai̯ → 柴 ;
|
|
442
|
+
ʧan } $not_vowel → 钱 ;
|
|
443
|
+
ʧau̯ → 乔 ;
|
|
444
|
+
ʧa → 查 ;
|
|
445
|
+
ʧen } $not_vowel → 琴 ;
|
|
446
|
+
ʧe → 切 ;
|
|
447
|
+
ʧin } $not_vowel → 钦 ;
|
|
448
|
+
ʧi → 奇 ;
|
|
449
|
+
ʧjan } $not_vowel → 钱 ;
|
|
450
|
+
ʧja → 恰 ;
|
|
451
|
+
ʧjen } $not_vowel → 钱 ;
|
|
452
|
+
ʧje → 切 ;
|
|
453
|
+
ʧjon } $not_vowel → 琼 ;
|
|
454
|
+
ʧju → 丘 ;
|
|
455
|
+
ʧon } $not_vowel → 琼 ;
|
|
456
|
+
ʧo → 乔 ;
|
|
457
|
+
ʧun } $not_vowel → 琼 ; # Should be 春, per GB/T 17693.5-2009 表 1.
|
|
458
|
+
ʧu → 丘 ;
|
|
459
|
+
ʧwan } $not_vowel → 丘安 ;
|
|
460
|
+
ʧwa → 丘阿 ;
|
|
461
|
+
ʧwen } $not_vowel → 琼 ;
|
|
462
|
+
ʧwe → 丘埃 ;
|
|
463
|
+
ʧwi → 崔 ;
|
|
464
|
+
ʧwo → 乔 ;
|
|
465
|
+
ʧ → 奇 ;
|
|
466
|
+
un } $not_vowel → 温 ;
|
|
467
|
+
u → 乌 ;
|
|
468
|
+
wan } $not_vowel → 万 ;
|
|
469
|
+
wa → 瓦 ;
|
|
470
|
+
wen } $not_vowel → 温 ;
|
|
471
|
+
we → 韦 ;
|
|
472
|
+
win } $not_vowel → 温 ;
|
|
473
|
+
wi → 维 ;
|
|
474
|
+
won } $not_vowel → 翁 ; # Unseen.
|
|
475
|
+
wo → 沃 ;
|
|
476
|
+
xai̯ → 海 ;
|
|
477
|
+
xan } $not_vowel → 汉 ;
|
|
478
|
+
xau̯ → 豪 ;
|
|
479
|
+
xa → 哈 ;
|
|
480
|
+
xei̯ → 黑 ;
|
|
481
|
+
xen } $not_vowel → 亨 ;
|
|
482
|
+
xe → 赫 ;
|
|
483
|
+
xin } $not_vowel → 欣 ;
|
|
484
|
+
xi → 希 ;
|
|
485
|
+
xja → 希亚 ;
|
|
486
|
+
xjen } $not_vowel → 希恩 ;
|
|
487
|
+
xje → 希耶 ;
|
|
488
|
+
xju → 休 ;
|
|
489
|
+
xon } $not_vowel → 洪 ;
|
|
490
|
+
xo → 霍 ;
|
|
491
|
+
xun } $not_vowel → 洪 ;
|
|
492
|
+
xu → 胡 ;
|
|
493
|
+
xwan } $not_vowel → 胡安 ;
|
|
494
|
+
xwa → 华 ;
|
|
495
|
+
xwen } $not_vowel → 洪 ;
|
|
496
|
+
xwe → 胡埃 ;
|
|
497
|
+
xwi → 惠 ;
|
|
498
|
+
xwo → 霍 ;
|
|
499
|
+
x → 赫 ;
|
|
500
|
+
# 尔 simplification pass. The idea is to drop most occurrences of 尔
|
|
501
|
+
# corresponding to <r> (not to <l> or <ll>) from a word if there is another /l/
|
|
502
|
+
# sound nearby. There is a vague pattern like this in the data, but the details
|
|
503
|
+
# remain to be determined. At the moment, no 尔 is dropped; the pass just puts 尔 in
|
|
504
|
+
# for every <r> in a syllable coda.
|
|
505
|
+
::Null;
|
|
506
|
+
$r = [R利拉];
|
|
507
|
+
#
|
|
508
|
+
#
|
|
509
|
+
# R } . $r → ;
|
|
510
|
+
# R } .. $r → ;
|
|
511
|
+
# R } ... $r → ;
|
|
512
|
+
# R } .... $r → ;
|
|
513
|
+
R → 尔 ;
|
|
514
|
+
# Dong-nan-xi-hai pass. Per GB/T 17693.5-2009 表 1, 注 4, replace confusing
|
|
515
|
+
# characters at the beginning and end of a word.
|
|
516
|
+
::Null;
|
|
517
|
+
$word_boundary { 东 → 栋 ;
|
|
518
|
+
$word_boundary { 南 → 楠 ;
|
|
519
|
+
$word_boundary { 西 → 锡 ;
|
|
520
|
+
海 } $word_boundary → 亥 ;
|
|
521
|
+
::NFC;
|
|
522
|
+
|