cldr-transforms 46.0.0-BETA2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +41 -0
- package/README.md +27 -0
- package/bower.json +13 -0
- package/package.json +29 -0
- package/transforms/Amharic-Latin-BGN.json +9 -0
- package/transforms/Amharic-Latin-BGN.txt +441 -0
- package/transforms/Any-Accents.json +9 -0
- package/transforms/Any-Accents.txt +270 -0
- package/transforms/Any-Publishing.json +9 -0
- package/transforms/Any-Publishing.txt +63 -0
- package/transforms/Arabic-Latin-BGN.json +9 -0
- package/transforms/Arabic-Latin-BGN.txt +205 -0
- package/transforms/Arabic-Latin.json +11 -0
- package/transforms/Arabic-Latin.txt +181 -0
- package/transforms/Armenian-Latin-BGN.json +9 -0
- package/transforms/Armenian-Latin-BGN.txt +165 -0
- package/transforms/Azerbaijani-Latin-BGN.json +9 -0
- package/transforms/Azerbaijani-Latin-BGN.txt +183 -0
- package/transforms/Belarusian-Latin-BGN.json +9 -0
- package/transforms/Belarusian-Latin-BGN.txt +194 -0
- package/transforms/Bengali-Arabic.json +9 -0
- package/transforms/Bengali-Arabic.txt +7 -0
- package/transforms/Bengali-Devanagari.json +9 -0
- package/transforms/Bengali-Devanagari.txt +7 -0
- package/transforms/Bengali-Gujarati.json +9 -0
- package/transforms/Bengali-Gujarati.txt +7 -0
- package/transforms/Bengali-Gurmukhi.json +9 -0
- package/transforms/Bengali-Gurmukhi.txt +7 -0
- package/transforms/Bengali-InterIndic.json +7 -0
- package/transforms/Bengali-InterIndic.txt +99 -0
- package/transforms/Bengali-Kannada.json +9 -0
- package/transforms/Bengali-Kannada.txt +7 -0
- package/transforms/Bengali-Latin.json +9 -0
- package/transforms/Bengali-Latin.txt +7 -0
- package/transforms/Bengali-Malayalam.json +9 -0
- package/transforms/Bengali-Malayalam.txt +7 -0
- package/transforms/Bengali-Oriya.json +9 -0
- package/transforms/Bengali-Oriya.txt +7 -0
- package/transforms/Bengali-Tamil.json +9 -0
- package/transforms/Bengali-Tamil.txt +7 -0
- package/transforms/Bengali-Telugu.json +9 -0
- package/transforms/Bengali-Telugu.txt +7 -0
- package/transforms/Bengali-ur.json +8 -0
- package/transforms/Bengali-ur.txt +7 -0
- package/transforms/Bulgarian-Latin-BGN.json +9 -0
- package/transforms/Bulgarian-Latin-BGN.txt +237 -0
- package/transforms/CanadianAboriginal-Latin.json +11 -0
- package/transforms/CanadianAboriginal-Latin.txt +184 -0
- package/transforms/Cyrillic-Latin.json +11 -0
- package/transforms/Cyrillic-Latin.txt +280 -0
- package/transforms/Devanagari-Arabic.json +9 -0
- package/transforms/Devanagari-Arabic.txt +7 -0
- package/transforms/Devanagari-Bengali.json +9 -0
- package/transforms/Devanagari-Bengali.txt +7 -0
- package/transforms/Devanagari-Gujarati.json +9 -0
- package/transforms/Devanagari-Gujarati.txt +7 -0
- package/transforms/Devanagari-Gurmukhi.json +9 -0
- package/transforms/Devanagari-Gurmukhi.txt +7 -0
- package/transforms/Devanagari-InterIndic.json +7 -0
- package/transforms/Devanagari-InterIndic.txt +113 -0
- package/transforms/Devanagari-Kannada.json +9 -0
- package/transforms/Devanagari-Kannada.txt +7 -0
- package/transforms/Devanagari-Latin.json +9 -0
- package/transforms/Devanagari-Latin.txt +7 -0
- package/transforms/Devanagari-Malayalam.json +9 -0
- package/transforms/Devanagari-Malayalam.txt +7 -0
- package/transforms/Devanagari-Oriya.json +9 -0
- package/transforms/Devanagari-Oriya.txt +7 -0
- package/transforms/Devanagari-Tamil.json +9 -0
- package/transforms/Devanagari-Tamil.txt +7 -0
- package/transforms/Devanagari-Telugu.json +9 -0
- package/transforms/Devanagari-Telugu.txt +7 -0
- package/transforms/Devanagari-ur.json +8 -0
- package/transforms/Devanagari-ur.txt +7 -0
- package/transforms/Fullwidth-Halfwidth.json +9 -0
- package/transforms/Fullwidth-Halfwidth.txt +261 -0
- package/transforms/Georgian-Latin-BGN.json +9 -0
- package/transforms/Georgian-Latin-BGN.txt +43 -0
- package/transforms/Georgian-Latin-BGN_1981.json +8 -0
- package/transforms/Georgian-Latin-BGN_1981.txt +54 -0
- package/transforms/Georgian-Latin.json +11 -0
- package/transforms/Georgian-Latin.txt +53 -0
- package/transforms/Greek-Latin-BGN.json +9 -0
- package/transforms/Greek-Latin-BGN.txt +419 -0
- package/transforms/Greek-Latin.json +11 -0
- package/transforms/Greek-Latin.txt +251 -0
- package/transforms/Greek_Latin_UNGEGN.json +11 -0
- package/transforms/Greek_Latin_UNGEGN.txt +179 -0
- package/transforms/Gujarati-Arabic.json +9 -0
- package/transforms/Gujarati-Arabic.txt +7 -0
- package/transforms/Gujarati-Bengali.json +9 -0
- package/transforms/Gujarati-Bengali.txt +7 -0
- package/transforms/Gujarati-Devanagari.json +9 -0
- package/transforms/Gujarati-Devanagari.txt +7 -0
- package/transforms/Gujarati-Gurmukhi.json +9 -0
- package/transforms/Gujarati-Gurmukhi.txt +7 -0
- package/transforms/Gujarati-InterIndic.json +7 -0
- package/transforms/Gujarati-InterIndic.txt +89 -0
- package/transforms/Gujarati-Kannada.json +9 -0
- package/transforms/Gujarati-Kannada.txt +7 -0
- package/transforms/Gujarati-Latin.json +9 -0
- package/transforms/Gujarati-Latin.txt +7 -0
- package/transforms/Gujarati-Malayalam.json +9 -0
- package/transforms/Gujarati-Malayalam.txt +7 -0
- package/transforms/Gujarati-Oriya.json +9 -0
- package/transforms/Gujarati-Oriya.txt +7 -0
- package/transforms/Gujarati-Tamil.json +9 -0
- package/transforms/Gujarati-Tamil.txt +7 -0
- package/transforms/Gujarati-Telugu.json +9 -0
- package/transforms/Gujarati-Telugu.txt +7 -0
- package/transforms/Gujarati-ur.json +8 -0
- package/transforms/Gujarati-ur.txt +7 -0
- package/transforms/Gurmukhi-Arabic.json +9 -0
- package/transforms/Gurmukhi-Arabic.txt +7 -0
- package/transforms/Gurmukhi-Bengali.json +9 -0
- package/transforms/Gurmukhi-Bengali.txt +7 -0
- package/transforms/Gurmukhi-Devanagari.json +9 -0
- package/transforms/Gurmukhi-Devanagari.txt +7 -0
- package/transforms/Gurmukhi-Gujarati.json +9 -0
- package/transforms/Gurmukhi-Gujarati.txt +7 -0
- package/transforms/Gurmukhi-InterIndic.json +7 -0
- package/transforms/Gurmukhi-InterIndic.txt +88 -0
- package/transforms/Gurmukhi-Kannada.json +9 -0
- package/transforms/Gurmukhi-Kannada.txt +7 -0
- package/transforms/Gurmukhi-Latin.json +9 -0
- package/transforms/Gurmukhi-Latin.txt +7 -0
- package/transforms/Gurmukhi-Malayalam.json +9 -0
- package/transforms/Gurmukhi-Malayalam.txt +7 -0
- package/transforms/Gurmukhi-Oriya.json +9 -0
- package/transforms/Gurmukhi-Oriya.txt +7 -0
- package/transforms/Gurmukhi-Tamil.json +9 -0
- package/transforms/Gurmukhi-Tamil.txt +7 -0
- package/transforms/Gurmukhi-Telugu.json +9 -0
- package/transforms/Gurmukhi-Telugu.txt +7 -0
- package/transforms/Gurmukhi-ur.json +8 -0
- package/transforms/Gurmukhi-ur.txt +7 -0
- package/transforms/Han-Latin-Names.json +8 -0
- package/transforms/Han-Latin-Names.txt +65 -0
- package/transforms/Han-Latin.json +9 -0
- package/transforms/Han-Latin.txt +1501 -0
- package/transforms/Han-Spacedhan.json +7 -0
- package/transforms/Han-Spacedhan.txt +35 -0
- package/transforms/Hangul-Latin.json +9 -0
- package/transforms/Hangul-Latin.txt +6 -0
- package/transforms/Hebrew-Latin-BGN.json +9 -0
- package/transforms/Hebrew-Latin-BGN.txt +113 -0
- package/transforms/Hebrew-Latin.json +11 -0
- package/transforms/Hebrew-Latin.txt +91 -0
- package/transforms/Hiragana-Katakana.json +11 -0
- package/transforms/Hiragana-Katakana.txt +179 -0
- package/transforms/Hiragana-Latin.json +11 -0
- package/transforms/Hiragana-Latin.txt +9 -0
- package/transforms/IPA-XSampa.json +11 -0
- package/transforms/IPA-XSampa.txt +228 -0
- package/transforms/InterIndic-Arabic.json +7 -0
- package/transforms/InterIndic-Arabic.txt +128 -0
- package/transforms/InterIndic-Bengali.json +7 -0
- package/transforms/InterIndic-Bengali.txt +135 -0
- package/transforms/InterIndic-Devanagari.json +7 -0
- package/transforms/InterIndic-Devanagari.txt +151 -0
- package/transforms/InterIndic-Gujarati.json +7 -0
- package/transforms/InterIndic-Gujarati.txt +136 -0
- package/transforms/InterIndic-Gurmukhi.json +7 -0
- package/transforms/InterIndic-Gurmukhi.txt +142 -0
- package/transforms/InterIndic-Kannada.json +7 -0
- package/transforms/InterIndic-Kannada.txt +137 -0
- package/transforms/InterIndic-Latin.json +7 -0
- package/transforms/InterIndic-Latin.txt +492 -0
- package/transforms/InterIndic-Malayalam.json +7 -0
- package/transforms/InterIndic-Malayalam.txt +137 -0
- package/transforms/InterIndic-Oriya.json +7 -0
- package/transforms/InterIndic-Oriya.txt +135 -0
- package/transforms/InterIndic-Tamil.json +7 -0
- package/transforms/InterIndic-Tamil.txt +136 -0
- package/transforms/InterIndic-Telugu.json +7 -0
- package/transforms/InterIndic-Telugu.txt +136 -0
- package/transforms/InterIndic-ur.json +7 -0
- package/transforms/InterIndic-ur.txt +119 -0
- package/transforms/Jamo-Latin.json +9 -0
- package/transforms/Jamo-Latin.txt +6 -0
- package/transforms/Kannada-Arabic.json +9 -0
- package/transforms/Kannada-Arabic.txt +7 -0
- package/transforms/Kannada-Bengali.json +9 -0
- package/transforms/Kannada-Bengali.txt +7 -0
- package/transforms/Kannada-Devanagari.json +9 -0
- package/transforms/Kannada-Devanagari.txt +7 -0
- package/transforms/Kannada-Gujarati.json +9 -0
- package/transforms/Kannada-Gujarati.txt +7 -0
- package/transforms/Kannada-Gurmukhi.json +9 -0
- package/transforms/Kannada-Gurmukhi.txt +7 -0
- package/transforms/Kannada-InterIndic.json +7 -0
- package/transforms/Kannada-InterIndic.txt +87 -0
- package/transforms/Kannada-Latin.json +9 -0
- package/transforms/Kannada-Latin.txt +7 -0
- package/transforms/Kannada-Malayalam.json +9 -0
- package/transforms/Kannada-Malayalam.txt +7 -0
- package/transforms/Kannada-Oriya.json +9 -0
- package/transforms/Kannada-Oriya.txt +7 -0
- package/transforms/Kannada-Tamil.json +9 -0
- package/transforms/Kannada-Tamil.txt +7 -0
- package/transforms/Kannada-Telugu.json +9 -0
- package/transforms/Kannada-Telugu.txt +7 -0
- package/transforms/Kannada-ur.json +8 -0
- package/transforms/Kannada-ur.txt +7 -0
- package/transforms/Katakana-Latin-BGN.json +9 -0
- package/transforms/Katakana-Latin-BGN.txt +335 -0
- package/transforms/Kazakh-Latin-BGN.json +9 -0
- package/transforms/Kazakh-Latin-BGN.txt +332 -0
- package/transforms/Kirghiz-Latin-BGN.json +9 -0
- package/transforms/Kirghiz-Latin-BGN.txt +211 -0
- package/transforms/Korean-Latin-BGN.json +9 -0
- package/transforms/Korean-Latin-BGN.txt +345 -0
- package/transforms/Latin-ASCII.json +9 -0
- package/transforms/Latin-ASCII.txt +909 -0
- package/transforms/Latin-Armenian.json +11 -0
- package/transforms/Latin-Armenian.txt +88 -0
- package/transforms/Latin-Bengali.json +9 -0
- package/transforms/Latin-Bengali.txt +8 -0
- package/transforms/Latin-Bopomofo.json +11 -0
- package/transforms/Latin-Bopomofo.txt +1445 -0
- package/transforms/Latin-ConjoiningJamo.json +7 -0
- package/transforms/Latin-ConjoiningJamo.txt +477 -0
- package/transforms/Latin-Devanagari.json +9 -0
- package/transforms/Latin-Devanagari.txt +8 -0
- package/transforms/Latin-Ethiopic.json +11 -0
- package/transforms/Latin-Ethiopic.txt +277 -0
- package/transforms/Latin-Gujarati.json +9 -0
- package/transforms/Latin-Gujarati.txt +8 -0
- package/transforms/Latin-Gurmukhi.json +9 -0
- package/transforms/Latin-Gurmukhi.txt +8 -0
- package/transforms/Latin-Hangul.json +9 -0
- package/transforms/Latin-Hangul.txt +7 -0
- package/transforms/Latin-InterIndic.json +7 -0
- package/transforms/Latin-InterIndic.txt +377 -0
- package/transforms/Latin-Jamo.json +9 -0
- package/transforms/Latin-Jamo.txt +7 -0
- package/transforms/Latin-Kannada.json +9 -0
- package/transforms/Latin-Kannada.txt +8 -0
- package/transforms/Latin-Katakana.json +11 -0
- package/transforms/Latin-Katakana.txt +382 -0
- package/transforms/Latin-Malayalam.json +9 -0
- package/transforms/Latin-Malayalam.txt +8 -0
- package/transforms/Latin-NumericPinyin.json +9 -0
- package/transforms/Latin-NumericPinyin.txt +29 -0
- package/transforms/Latin-Oriya.json +9 -0
- package/transforms/Latin-Oriya.txt +8 -0
- package/transforms/Latin-Tamil.json +9 -0
- package/transforms/Latin-Tamil.txt +8 -0
- package/transforms/Latin-Telugu.json +9 -0
- package/transforms/Latin-Telugu.txt +8 -0
- package/transforms/Latin-Thai.json +9 -0
- package/transforms/Latin-Thai.txt +7 -0
- package/transforms/Macedonian-Latin-BGN.json +9 -0
- package/transforms/Macedonian-Latin-BGN.txt +176 -0
- package/transforms/Malayalam-Arabic.json +9 -0
- package/transforms/Malayalam-Arabic.txt +7 -0
- package/transforms/Malayalam-Bengali.json +9 -0
- package/transforms/Malayalam-Bengali.txt +7 -0
- package/transforms/Malayalam-Devanagari.json +9 -0
- package/transforms/Malayalam-Devanagari.txt +7 -0
- package/transforms/Malayalam-Gujarati.json +9 -0
- package/transforms/Malayalam-Gujarati.txt +7 -0
- package/transforms/Malayalam-Gurmukhi.json +9 -0
- package/transforms/Malayalam-Gurmukhi.txt +7 -0
- package/transforms/Malayalam-InterIndic.json +7 -0
- package/transforms/Malayalam-InterIndic.txt +87 -0
- package/transforms/Malayalam-Kannada.json +9 -0
- package/transforms/Malayalam-Kannada.txt +7 -0
- package/transforms/Malayalam-Latin.json +9 -0
- package/transforms/Malayalam-Latin.txt +7 -0
- package/transforms/Malayalam-Oriya.json +9 -0
- package/transforms/Malayalam-Oriya.txt +7 -0
- package/transforms/Malayalam-Tamil.json +9 -0
- package/transforms/Malayalam-Tamil.txt +7 -0
- package/transforms/Malayalam-Telugu.json +9 -0
- package/transforms/Malayalam-Telugu.txt +7 -0
- package/transforms/Malayalam-ur.json +8 -0
- package/transforms/Malayalam-ur.txt +7 -0
- package/transforms/Maldivian-Latin-BGN.json +9 -0
- package/transforms/Maldivian-Latin-BGN.txt +171 -0
- package/transforms/Mongolian-Latin-BGN.json +9 -0
- package/transforms/Mongolian-Latin-BGN.txt +151 -0
- package/transforms/Myanmar-Latin.json +9 -0
- package/transforms/Myanmar-Latin.txt +367 -0
- package/transforms/Oriya-Arabic.json +9 -0
- package/transforms/Oriya-Arabic.txt +7 -0
- package/transforms/Oriya-Bengali.json +9 -0
- package/transforms/Oriya-Bengali.txt +7 -0
- package/transforms/Oriya-Devanagari.json +9 -0
- package/transforms/Oriya-Devanagari.txt +7 -0
- package/transforms/Oriya-Gujarati.json +9 -0
- package/transforms/Oriya-Gujarati.txt +7 -0
- package/transforms/Oriya-Gurmukhi.json +9 -0
- package/transforms/Oriya-Gurmukhi.txt +7 -0
- package/transforms/Oriya-InterIndic.json +7 -0
- package/transforms/Oriya-InterIndic.txt +91 -0
- package/transforms/Oriya-Kannada.json +9 -0
- package/transforms/Oriya-Kannada.txt +7 -0
- package/transforms/Oriya-Latin.json +9 -0
- package/transforms/Oriya-Latin.txt +7 -0
- package/transforms/Oriya-Malayalam.json +9 -0
- package/transforms/Oriya-Malayalam.txt +7 -0
- package/transforms/Oriya-Tamil.json +9 -0
- package/transforms/Oriya-Tamil.txt +7 -0
- package/transforms/Oriya-Telugu.json +9 -0
- package/transforms/Oriya-Telugu.txt +7 -0
- package/transforms/Oriya-ur.json +8 -0
- package/transforms/Oriya-ur.txt +7 -0
- package/transforms/Pashto-Latin-BGN.json +9 -0
- package/transforms/Pashto-Latin-BGN.txt +231 -0
- package/transforms/Persian-Latin-BGN.json +9 -0
- package/transforms/Persian-Latin-BGN.txt +203 -0
- package/transforms/Pinyin-NumericPinyin.json +7 -0
- package/transforms/Pinyin-NumericPinyin.txt +8 -0
- package/transforms/Russian-Latin-BGN.json +9 -0
- package/transforms/Russian-Latin-BGN.txt +235 -0
- package/transforms/Serbian-Latin-BGN.json +9 -0
- package/transforms/Serbian-Latin-BGN.txt +119 -0
- package/transforms/Simplified-Traditional.json +11 -0
- package/transforms/Simplified-Traditional.txt +4393 -0
- package/transforms/Syriac-Latin.json +11 -0
- package/transforms/Syriac-Latin.txt +52 -0
- package/transforms/Tamil-Arabic.json +9 -0
- package/transforms/Tamil-Arabic.txt +7 -0
- package/transforms/Tamil-Bengali.json +9 -0
- package/transforms/Tamil-Bengali.txt +7 -0
- package/transforms/Tamil-Devanagari.json +9 -0
- package/transforms/Tamil-Devanagari.txt +7 -0
- package/transforms/Tamil-Gujarati.json +9 -0
- package/transforms/Tamil-Gujarati.txt +7 -0
- package/transforms/Tamil-Gurmukhi.json +9 -0
- package/transforms/Tamil-Gurmukhi.txt +7 -0
- package/transforms/Tamil-InterIndic.json +7 -0
- package/transforms/Tamil-InterIndic.txt +70 -0
- package/transforms/Tamil-Kannada.json +9 -0
- package/transforms/Tamil-Kannada.txt +7 -0
- package/transforms/Tamil-Latin.json +9 -0
- package/transforms/Tamil-Latin.txt +7 -0
- package/transforms/Tamil-Malayalam.json +9 -0
- package/transforms/Tamil-Malayalam.txt +7 -0
- package/transforms/Tamil-Oriya.json +9 -0
- package/transforms/Tamil-Oriya.txt +7 -0
- package/transforms/Tamil-Telugu.json +9 -0
- package/transforms/Tamil-Telugu.txt +7 -0
- package/transforms/Tamil-ur.json +8 -0
- package/transforms/Tamil-ur.txt +7 -0
- package/transforms/Telugu-Arabic.json +9 -0
- package/transforms/Telugu-Arabic.txt +7 -0
- package/transforms/Telugu-Bengali.json +9 -0
- package/transforms/Telugu-Bengali.txt +7 -0
- package/transforms/Telugu-Devanagari.json +9 -0
- package/transforms/Telugu-Devanagari.txt +7 -0
- package/transforms/Telugu-Gujarati.json +9 -0
- package/transforms/Telugu-Gujarati.txt +7 -0
- package/transforms/Telugu-Gurmukhi.json +9 -0
- package/transforms/Telugu-Gurmukhi.txt +7 -0
- package/transforms/Telugu-InterIndic.json +7 -0
- package/transforms/Telugu-InterIndic.txt +87 -0
- package/transforms/Telugu-Kannada.json +9 -0
- package/transforms/Telugu-Kannada.txt +7 -0
- package/transforms/Telugu-Latin.json +9 -0
- package/transforms/Telugu-Latin.txt +7 -0
- package/transforms/Telugu-Malayalam.json +9 -0
- package/transforms/Telugu-Malayalam.txt +7 -0
- package/transforms/Telugu-Oriya.json +9 -0
- package/transforms/Telugu-Oriya.txt +7 -0
- package/transforms/Telugu-Tamil.json +9 -0
- package/transforms/Telugu-Tamil.txt +7 -0
- package/transforms/Telugu-ur.json +8 -0
- package/transforms/Telugu-ur.txt +7 -0
- package/transforms/Thaana-Latin.json +11 -0
- package/transforms/Thaana-Latin.txt +433 -0
- package/transforms/Thai-Latin.json +9 -0
- package/transforms/Thai-Latin.txt +9 -0
- package/transforms/Thai-ThaiLogical.json +7 -0
- package/transforms/Thai-ThaiLogical.txt +16 -0
- package/transforms/Thai-ThaiSemi.json +7 -0
- package/transforms/Thai-ThaiSemi.txt +6 -0
- package/transforms/ThaiLogical-Latin.json +7 -0
- package/transforms/ThaiLogical-Latin.txt +147 -0
- package/transforms/Turkmen-Latin-BGN.json +9 -0
- package/transforms/Turkmen-Latin-BGN.txt +302 -0
- package/transforms/Ukrainian-Latin-BGN.json +9 -0
- package/transforms/Ukrainian-Latin-BGN.txt +283 -0
- package/transforms/Uzbek-Latin-BGN.json +9 -0
- package/transforms/Uzbek-Latin-BGN.txt +261 -0
- package/transforms/am-Ethi-t-am-brai.json +11 -0
- package/transforms/am-Ethi-t-am-brai.txt +652 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.json +9 -0
- package/transforms/am-Ethi-t-am-ethi-m0-geminate.txt +6925 -0
- package/transforms/am-Ethi-t-d0-morse.json +9 -0
- package/transforms/am-Ethi-t-d0-morse.txt +657 -0
- package/transforms/am-am_FONIPA.json +9 -0
- package/transforms/am-am_FONIPA.txt +694 -0
- package/transforms/am-ar.json +8 -0
- package/transforms/am-ar.txt +5 -0
- package/transforms/am-chr.json +8 -0
- package/transforms/am-chr.txt +4 -0
- package/transforms/am-fa.json +8 -0
- package/transforms/am-fa.txt +4 -0
- package/transforms/az-Lower.json +8 -0
- package/transforms/az-Lower.txt +13 -0
- package/transforms/az-Title.json +8 -0
- package/transforms/az-Title.txt +11 -0
- package/transforms/az-Upper.json +8 -0
- package/transforms/az-Upper.txt +5 -0
- package/transforms/blt-fonipa-t-blt.json +8 -0
- package/transforms/blt-fonipa-t-blt.txt +132 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-tekie-alibekit.txt +537 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.json +11 -0
- package/transforms/byn-Ethi-t-byn-latn-m0-xaleget.txt +773 -0
- package/transforms/ch-am.json +8 -0
- package/transforms/ch-am.txt +4 -0
- package/transforms/ch-ar.json +8 -0
- package/transforms/ch-ar.txt +4 -0
- package/transforms/ch-ch_FONIPA.json +8 -0
- package/transforms/ch-ch_FONIPA.txt +79 -0
- package/transforms/ch-chr.json +8 -0
- package/transforms/ch-chr.txt +4 -0
- package/transforms/ch-fa.json +8 -0
- package/transforms/ch-fa.txt +4 -0
- package/transforms/chr-chr_FONIPA.json +8 -0
- package/transforms/chr-chr_FONIPA.txt +111 -0
- package/transforms/cs-am.json +8 -0
- package/transforms/cs-am.txt +4 -0
- package/transforms/cs-ar.json +8 -0
- package/transforms/cs-ar.txt +4 -0
- package/transforms/cs-chr.json +8 -0
- package/transforms/cs-chr.txt +4 -0
- package/transforms/cs-cs_FONIPA.json +8 -0
- package/transforms/cs-cs_FONIPA.txt +74 -0
- package/transforms/cs-fa.json +8 -0
- package/transforms/cs-fa.txt +4 -0
- package/transforms/cs-ja.json +8 -0
- package/transforms/cs-ja.txt +4 -0
- package/transforms/cs-ko.json +8 -0
- package/transforms/cs-ko.txt +4 -0
- package/transforms/cs_FONIPA-ja.json +8 -0
- package/transforms/cs_FONIPA-ja.txt +228 -0
- package/transforms/cs_FONIPA-ko.json +8 -0
- package/transforms/cs_FONIPA-ko.txt +88 -0
- package/transforms/cy-fonipa-t-cy.json +8 -0
- package/transforms/cy-fonipa-t-cy.txt +189 -0
- package/transforms/de-ASCII.json +8 -0
- package/transforms/de-ASCII.txt +15 -0
- package/transforms/dsb-dsb_FONIPA.json +8 -0
- package/transforms/dsb-dsb_FONIPA.txt +67 -0
- package/transforms/el-Lower.json +8 -0
- package/transforms/el-Lower.txt +12 -0
- package/transforms/el-Title.json +8 -0
- package/transforms/el-Title.txt +12 -0
- package/transforms/el-Upper.json +8 -0
- package/transforms/el-Upper.txt +11 -0
- package/transforms/eo-am.json +8 -0
- package/transforms/eo-am.txt +4 -0
- package/transforms/eo-ar.json +8 -0
- package/transforms/eo-ar.txt +4 -0
- package/transforms/eo-chr.json +8 -0
- package/transforms/eo-chr.txt +4 -0
- package/transforms/eo-eo_FONIPA.json +8 -0
- package/transforms/eo-eo_FONIPA.txt +47 -0
- package/transforms/eo-fa.json +8 -0
- package/transforms/eo-fa.txt +4 -0
- package/transforms/es-am.json +8 -0
- package/transforms/es-am.txt +4 -0
- package/transforms/es-ar.json +8 -0
- package/transforms/es-ar.txt +13 -0
- package/transforms/es-chr.json +8 -0
- package/transforms/es-chr.txt +4 -0
- package/transforms/es-es_FONIPA.json +8 -0
- package/transforms/es-es_FONIPA.txt +139 -0
- package/transforms/es-fa.json +8 -0
- package/transforms/es-fa.txt +13 -0
- package/transforms/es-ja.json +8 -0
- package/transforms/es-ja.txt +4 -0
- package/transforms/es-zh.json +8 -0
- package/transforms/es-zh.txt +4 -0
- package/transforms/es_419-am.json +8 -0
- package/transforms/es_419-am.txt +5 -0
- package/transforms/es_419-ar.json +8 -0
- package/transforms/es_419-ar.txt +14 -0
- package/transforms/es_419-chr.json +8 -0
- package/transforms/es_419-chr.txt +5 -0
- package/transforms/es_419-fa.json +8 -0
- package/transforms/es_419-fa.txt +14 -0
- package/transforms/es_419-ja.json +8 -0
- package/transforms/es_419-ja.txt +5 -0
- package/transforms/es_419-zh.json +8 -0
- package/transforms/es_419-zh.txt +5 -0
- package/transforms/es_FONIPA-am.json +8 -0
- package/transforms/es_FONIPA-am.txt +230 -0
- package/transforms/es_FONIPA-es_419_FONIPA.json +8 -0
- package/transforms/es_FONIPA-es_419_FONIPA.txt +6 -0
- package/transforms/es_FONIPA-ja.json +8 -0
- package/transforms/es_FONIPA-ja.txt +155 -0
- package/transforms/es_FONIPA-zh.json +8 -0
- package/transforms/es_FONIPA-zh.txt +522 -0
- package/transforms/fa-fa_FONIPA.json +8 -0
- package/transforms/fa-fa_FONIPA.txt +107 -0
- package/transforms/gz-Ethi-t-und-sarb.json +11 -0
- package/transforms/gz-Ethi-t-und-sarb.txt +180 -0
- package/transforms/ha-ha_NE.json +8 -0
- package/transforms/ha-ha_NE.txt +6 -0
- package/transforms/hy-am.json +8 -0
- package/transforms/hy-am.txt +4 -0
- package/transforms/hy-ar.json +8 -0
- package/transforms/hy-ar.txt +4 -0
- package/transforms/hy-chr.json +8 -0
- package/transforms/hy-chr.txt +4 -0
- package/transforms/hy-fa.json +8 -0
- package/transforms/hy-fa.txt +4 -0
- package/transforms/hy-hy_FONIPA.json +8 -0
- package/transforms/hy-hy_FONIPA.txt +52 -0
- package/transforms/hy_AREVMDA-am.json +8 -0
- package/transforms/hy_AREVMDA-am.txt +4 -0
- package/transforms/hy_AREVMDA-ar.json +8 -0
- package/transforms/hy_AREVMDA-ar.txt +4 -0
- package/transforms/hy_AREVMDA-chr.json +8 -0
- package/transforms/hy_AREVMDA-chr.txt +4 -0
- package/transforms/hy_AREVMDA-fa.json +8 -0
- package/transforms/hy_AREVMDA-fa.txt +4 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.json +8 -0
- package/transforms/hy_AREVMDA-hy_AREVMDA_FONIPA.txt +80 -0
- package/transforms/ia-am.json +8 -0
- package/transforms/ia-am.txt +4 -0
- package/transforms/ia-ar.json +8 -0
- package/transforms/ia-ar.txt +4 -0
- package/transforms/ia-chr.json +8 -0
- package/transforms/ia-chr.txt +4 -0
- package/transforms/ia-fa.json +8 -0
- package/transforms/ia-fa.txt +4 -0
- package/transforms/ia-ia_FONIPA.json +8 -0
- package/transforms/ia-ia_FONIPA.txt +71 -0
- package/transforms/it-am.json +8 -0
- package/transforms/it-am.txt +257 -0
- package/transforms/it-ja.json +8 -0
- package/transforms/it-ja.txt +259 -0
- package/transforms/ja_Latn-ko.json +8 -0
- package/transforms/ja_Latn-ko.txt +141 -0
- package/transforms/ja_Latn-ru.json +8 -0
- package/transforms/ja_Latn-ru.txt +123 -0
- package/transforms/kk-am.json +8 -0
- package/transforms/kk-am.txt +4 -0
- package/transforms/kk-ar.json +8 -0
- package/transforms/kk-ar.txt +4 -0
- package/transforms/kk-chr.json +8 -0
- package/transforms/kk-chr.txt +4 -0
- package/transforms/kk-fa.json +8 -0
- package/transforms/kk-fa.txt +4 -0
- package/transforms/kk-kk_FONIPA.json +8 -0
- package/transforms/kk-kk_FONIPA.txt +59 -0
- package/transforms/ky-am.json +8 -0
- package/transforms/ky-am.txt +4 -0
- package/transforms/ky-ar.json +8 -0
- package/transforms/ky-ar.txt +4 -0
- package/transforms/ky-chr.json +8 -0
- package/transforms/ky-chr.txt +4 -0
- package/transforms/ky-fa.json +8 -0
- package/transforms/ky-fa.txt +4 -0
- package/transforms/ky-ky_FONIPA.json +8 -0
- package/transforms/ky-ky_FONIPA.txt +71 -0
- package/transforms/la-la_FONIPA.json +8 -0
- package/transforms/la-la_FONIPA.txt +79 -0
- package/transforms/lt-Lower.json +8 -0
- package/transforms/lt-Lower.txt +20 -0
- package/transforms/lt-Title.json +8 -0
- package/transforms/lt-Title.txt +15 -0
- package/transforms/lt-Upper.json +8 -0
- package/transforms/lt-Upper.txt +8 -0
- package/transforms/mn-mn_Latn-MNS.json +8 -0
- package/transforms/mn-mn_Latn-MNS.txt +86 -0
- package/transforms/my-am.json +8 -0
- package/transforms/my-am.txt +4 -0
- package/transforms/my-ar.json +8 -0
- package/transforms/my-ar.txt +4 -0
- package/transforms/my-chr.json +8 -0
- package/transforms/my-chr.txt +4 -0
- package/transforms/my-fa.json +8 -0
- package/transforms/my-fa.txt +4 -0
- package/transforms/my-my_FONIPA.json +8 -0
- package/transforms/my-my_FONIPA.txt +325 -0
- package/transforms/my-t-my-d0-zawgyi.json +8 -0
- package/transforms/my-t-my-d0-zawgyi.txt +222 -0
- package/transforms/my-t-my-s0-zawgyi.json +8 -0
- package/transforms/my-t-my-s0-zawgyi.txt +231 -0
- package/transforms/nl-Title.json +8 -0
- package/transforms/nl-Title.txt +7 -0
- package/transforms/nv-nv_FONIPA.json +8 -0
- package/transforms/nv-nv_FONIPA.txt +74 -0
- package/transforms/pl-am.json +8 -0
- package/transforms/pl-am.txt +4 -0
- package/transforms/pl-ar.json +8 -0
- package/transforms/pl-ar.txt +4 -0
- package/transforms/pl-chr.json +8 -0
- package/transforms/pl-chr.txt +4 -0
- package/transforms/pl-fa.json +8 -0
- package/transforms/pl-fa.txt +4 -0
- package/transforms/pl-ja.json +8 -0
- package/transforms/pl-ja.txt +4 -0
- package/transforms/pl-pl_FONIPA.json +8 -0
- package/transforms/pl-pl_FONIPA.txt +113 -0
- package/transforms/pl_FONIPA-ja.json +8 -0
- package/transforms/pl_FONIPA-ja.txt +301 -0
- package/transforms/rm_SURSILV-am.json +8 -0
- package/transforms/rm_SURSILV-am.txt +4 -0
- package/transforms/rm_SURSILV-ar.json +8 -0
- package/transforms/rm_SURSILV-ar.txt +4 -0
- package/transforms/rm_SURSILV-chr.json +8 -0
- package/transforms/rm_SURSILV-chr.txt +4 -0
- package/transforms/rm_SURSILV-fa.json +8 -0
- package/transforms/rm_SURSILV-fa.txt +4 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.json +8 -0
- package/transforms/rm_SURSILV-rm_FONIPA_SURSILV.txt +96 -0
- package/transforms/ro-am.json +8 -0
- package/transforms/ro-am.txt +4 -0
- package/transforms/ro-ar.json +8 -0
- package/transforms/ro-ar.txt +4 -0
- package/transforms/ro-chr.json +8 -0
- package/transforms/ro-chr.txt +4 -0
- package/transforms/ro-fa.json +8 -0
- package/transforms/ro-fa.txt +4 -0
- package/transforms/ro-ja.json +8 -0
- package/transforms/ro-ja.txt +4 -0
- package/transforms/ro-ro_FONIPA.json +8 -0
- package/transforms/ro-ro_FONIPA.txt +121 -0
- package/transforms/ro_FONIPA-ja.json +8 -0
- package/transforms/ro_FONIPA-ja.txt +211 -0
- package/transforms/ru-ja.json +8 -0
- package/transforms/ru-ja.txt +444 -0
- package/transforms/ru-zh.json +8 -0
- package/transforms/ru-zh.txt +996 -0
- package/transforms/ru_Latn-ru-BGN.json +9 -0
- package/transforms/ru_Latn-ru-BGN.txt +97 -0
- package/transforms/sat-am.json +8 -0
- package/transforms/sat-am.txt +6 -0
- package/transforms/sat-ar.json +8 -0
- package/transforms/sat-ar.txt +6 -0
- package/transforms/sat-chr.json +8 -0
- package/transforms/sat-chr.txt +6 -0
- package/transforms/sat-fa.json +8 -0
- package/transforms/sat-fa.txt +6 -0
- package/transforms/sat_Olck-sat_FONIPA.json +8 -0
- package/transforms/sat_Olck-sat_FONIPA.txt +174 -0
- package/transforms/sgw-Ethi-t-und-ethi.json +11 -0
- package/transforms/sgw-Ethi-t-und-ethi.txt +138 -0
- package/transforms/si-am.json +8 -0
- package/transforms/si-am.txt +4 -0
- package/transforms/si-ar.json +8 -0
- package/transforms/si-ar.txt +4 -0
- package/transforms/si-chr.json +8 -0
- package/transforms/si-chr.txt +4 -0
- package/transforms/si-fa.json +8 -0
- package/transforms/si-fa.txt +4 -0
- package/transforms/si-si_FONIPA.json +8 -0
- package/transforms/si-si_FONIPA.txt +157 -0
- package/transforms/si-si_Latn.json +8 -0
- package/transforms/si-si_Latn.txt +94 -0
- package/transforms/sk-am.json +8 -0
- package/transforms/sk-am.txt +4 -0
- package/transforms/sk-ar.json +8 -0
- package/transforms/sk-ar.txt +4 -0
- package/transforms/sk-chr.json +8 -0
- package/transforms/sk-chr.txt +4 -0
- package/transforms/sk-fa.json +8 -0
- package/transforms/sk-fa.txt +4 -0
- package/transforms/sk-ja.json +8 -0
- package/transforms/sk-ja.txt +4 -0
- package/transforms/sk-sk_FONIPA.json +8 -0
- package/transforms/sk-sk_FONIPA.txt +101 -0
- package/transforms/sk_FONIPA-ja.json +8 -0
- package/transforms/sk_FONIPA-ja.txt +252 -0
- package/transforms/ta-ta_FONIPA.json +8 -0
- package/transforms/ta-ta_FONIPA.txt +73 -0
- package/transforms/tlh-am.json +8 -0
- package/transforms/tlh-am.txt +4 -0
- package/transforms/tlh-ar.json +8 -0
- package/transforms/tlh-ar.txt +4 -0
- package/transforms/tlh-chr.json +8 -0
- package/transforms/tlh-chr.txt +4 -0
- package/transforms/tlh-fa.json +8 -0
- package/transforms/tlh-fa.txt +4 -0
- package/transforms/tlh-tlh_FONIPA.json +8 -0
- package/transforms/tlh-tlh_FONIPA.txt +46 -0
- package/transforms/tr-Lower.json +8 -0
- package/transforms/tr-Lower.txt +13 -0
- package/transforms/tr-Title.json +8 -0
- package/transforms/tr-Title.txt +11 -0
- package/transforms/tr-Upper.json +8 -0
- package/transforms/tr-Upper.txt +8 -0
- package/transforms/ug-ug_FONIPA.json +8 -0
- package/transforms/ug-ug_FONIPA.txt +69 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.json +11 -0
- package/transforms/und-Ethi-t-und-cyrl-m0-gutgarts.txt +747 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-aethiopi.txt +633 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-alaloc.txt +757 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-beta_metsehaf.txt +585 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-es3842.txt +640 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.json +9 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964-geminate.txt +19 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-ies-jes-1964.txt +619 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-lambdin.txt +627 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.json +11 -0
- package/transforms/und-Ethi-t-und-latn-m0-sera.txt +695 -0
- package/transforms/und-Ethi-t-und-latn.json +11 -0
- package/transforms/und-Ethi-t-und-latn.txt +16 -0
- package/transforms/und_FONIPA-ar.json +8 -0
- package/transforms/und_FONIPA-ar.txt +114 -0
- package/transforms/und_FONIPA-chr.json +8 -0
- package/transforms/und_FONIPA-chr.txt +172 -0
- package/transforms/und_FONIPA-fa.json +8 -0
- package/transforms/und_FONIPA-fa.txt +109 -0
- package/transforms/uz_Cyrl-uz_Latn.json +9 -0
- package/transforms/uz_Cyrl-uz_Latn.txt +103 -0
- package/transforms/vec-vec_FONIPA.json +8 -0
- package/transforms/vec-vec_FONIPA.txt +85 -0
- package/transforms/xh-am.json +8 -0
- package/transforms/xh-am.txt +4 -0
- package/transforms/xh-ar.json +8 -0
- package/transforms/xh-ar.txt +4 -0
- package/transforms/xh-chr.json +8 -0
- package/transforms/xh-chr.txt +4 -0
- package/transforms/xh-fa.json +8 -0
- package/transforms/xh-fa.txt +4 -0
- package/transforms/xh-xh_FONIPA.json +8 -0
- package/transforms/xh-xh_FONIPA.txt +85 -0
- package/transforms/yo-yo_BJ.json +8 -0
- package/transforms/yo-yo_BJ.txt +36 -0
- package/transforms/zh_Latn_PINYIN-ru.json +8 -0
- package/transforms/zh_Latn_PINYIN-ru.txt +148 -0
- package/transforms/zu-am.json +8 -0
- package/transforms/zu-am.txt +4 -0
- package/transforms/zu-ar.json +8 -0
- package/transforms/zu-ar.txt +4 -0
- package/transforms/zu-chr.json +8 -0
- package/transforms/zu-chr.txt +4 -0
- package/transforms/zu-fa.json +8 -0
- package/transforms/zu-fa.txt +4 -0
- package/transforms/zu-zu_FONIPA.json +8 -0
- package/transforms/zu-zu_FONIPA.txt +72 -0
- package/transforms.json +385 -0
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
|
|
2
|
+
::['.0-9A-Za-z~À-ÅÇ-ÏÑ-ÖÙ-Ýà-åç-ïñ-öù-ýÿ-ďĒ-ĥĨ-İĴ-ķĹ-ľŃ-ňŌ-őŔ-ťŨ-žƠ-ơƯ-ưǍ-ǜǞ-ǣǦ-ǭǰǴ-ǵǸ-țȞ-ȟȦ-ȳʔ́̃-̄̆-̇̐̔-̣̥̱́̈́̕΅-ΆΈ-ΊΌΎ-ΐά-ΰό-ώϓЃЌЎЙйѓќўӁ-ӂӐ-ӑӖ-ӗӢ-ӣӮ-ӯḀ-ẙẠ-ỹἁἃ-ἅἇἉἋ-ἍἏἑἓ-ἕἙἛ-Ἕἡἣ-ἥἧἩἫ-ἭἯἱἳ-ἵἷἹἻ-ἽἿὁὃ-ὅὉὋ-Ὅὑὓ-ὕὗὙὛὝὟὡὣ-ὥὧὩὫ-ὭὯάέήίόύώᾁᾃ-ᾅᾇᾉᾋ-ᾍᾏᾑᾓ-ᾕᾗᾙᾛ-ᾝᾟᾡᾣ-ᾥᾧᾩᾫ-ᾭᾯ-ᾱᾴᾸ-ᾹΆῄΈΉ῎ῐ-ῑΐῘ-ῙΊ῞ῠ-ῡΰῥῨ-ῩΎ-Ῥ΅ῴΌΏK-Å\uE04D\uE064];
|
|
3
|
+
::NFD;
|
|
4
|
+
::Lower;
|
|
5
|
+
::Latin-InterIndic;
|
|
6
|
+
::InterIndic-Kannada;
|
|
7
|
+
::NFC;
|
|
8
|
+
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
{
|
|
2
|
+
"_backwardAlias": "Katakana-Latin",
|
|
3
|
+
"_visibility": "external",
|
|
4
|
+
"_backwardAliasBcp47": "und-Latn-t-und-kana",
|
|
5
|
+
"_alias": "Latin-Katakana",
|
|
6
|
+
"_aliasBcp47": "und-Kana-t-und-latn",
|
|
7
|
+
"_source": "Latn",
|
|
8
|
+
"_direction": "both",
|
|
9
|
+
"_target": "Kana",
|
|
10
|
+
"_rulesFile": "Latin-Katakana.txt"
|
|
11
|
+
}
|
|
@@ -0,0 +1,382 @@
|
|
|
1
|
+
|
|
2
|
+
# note: a global filter is more efficient, but MUST include all source chars
|
|
3
|
+
#:: [\u0000-\u007E 、。 ゙-゜ ァ-ー 。-゚ [:Latin:][:Katakana:] [:nonspacing mark:]] ;
|
|
4
|
+
# MINIMAL FILTER GENERATED FOR: Latin-Katakana
|
|
5
|
+
### WARNING -- must add width filter, both here and below!!! ###
|
|
6
|
+
:: [[ᄀ-ᄒᄚᄡ\u1160-ᅵᆪᆬ-ᆭᆰ-ᆵ←-↓│■○\u3000-。「-」゙-゚ァ-ロワヲ-ヴヷヺ-ー!-~¢-₩][',.A-Za-z~À-ÖØ-öø-ďĒ-ĥĨ-İĴ-ķĹ-ľŃ-ňŌ-őŔ-ťŨ-žƠ-ơƯ-ưǍ-ǜǞ-ǣǦ-ǭǰǴ-ǵǸ-țȞ-ȟȦ-ȳ̄Ӣ-ӣӮ-ӯḀ-ẙẠ-ỹᾱᾹῑῙῡῩK-Å]] ;
|
|
7
|
+
:: [:Latin:] fullwidth-halfwidth ();
|
|
8
|
+
:: NFD (NFC);
|
|
9
|
+
:: Lower (); # whenever transliterating from cased to uncased script, include this
|
|
10
|
+
# :: NFD () ; # this would catch the odd cases where a lowercase is not in NFD, but none are important for Japanese
|
|
11
|
+
# Uses modified Hepburn. Small changes to make unambiguous.
|
|
12
|
+
# | Kunrei-shiki: Hepburn/MHepburn
|
|
13
|
+
# | ------------------------------
|
|
14
|
+
# | si: shi
|
|
15
|
+
# | si ~ya: sha
|
|
16
|
+
# | si ~yu: shu
|
|
17
|
+
# | si ~yo: sho
|
|
18
|
+
# | zi: ji
|
|
19
|
+
# | zi ~ya: ja
|
|
20
|
+
# | zi ~yu: ju
|
|
21
|
+
# | zi ~yo: jo
|
|
22
|
+
# | ti: chi
|
|
23
|
+
# | ti ~ya: cha
|
|
24
|
+
# | ti ~yu: chu
|
|
25
|
+
# | ti ~yo: cho
|
|
26
|
+
# | tu: tsu
|
|
27
|
+
# | di: ji/dji
|
|
28
|
+
# | du: zu/dzu
|
|
29
|
+
# | hu: fu
|
|
30
|
+
# | For foreign words:
|
|
31
|
+
# | -----------------
|
|
32
|
+
# | se ~i si
|
|
33
|
+
# | si ~e she
|
|
34
|
+
# |
|
|
35
|
+
# | ze ~i zi
|
|
36
|
+
# | zi ~e je
|
|
37
|
+
# |
|
|
38
|
+
# | te ~i ti
|
|
39
|
+
# | ti ~e che
|
|
40
|
+
# | te ~u tu
|
|
41
|
+
# |
|
|
42
|
+
# | de ~i di
|
|
43
|
+
# | de ~u du
|
|
44
|
+
# | de ~i di
|
|
45
|
+
# |
|
|
46
|
+
# | he ~u: hu
|
|
47
|
+
# | hu ~a fa
|
|
48
|
+
# | hu ~i fi
|
|
49
|
+
# | hu ~e fe
|
|
50
|
+
# | hu ~o fo
|
|
51
|
+
# Most small forms are generated, but if necessary
|
|
52
|
+
# explicit small forms are given with ~a, ~ya, etc.
|
|
53
|
+
#------------------------------------------------------
|
|
54
|
+
# Variables
|
|
55
|
+
$vowel = [aeiou] ;
|
|
56
|
+
$consonant = [bcdfghjklmnpqrstvwxyz] ;
|
|
57
|
+
$macron = ̄ ;
|
|
58
|
+
# Variables used for doubled-consonants with tsu
|
|
59
|
+
$kana = [ぁ-ゔ] ;
|
|
60
|
+
$voice = [゙゛];
|
|
61
|
+
$semivoice = [゚゜];
|
|
62
|
+
$k_start = [カキクケコかきくけこ] ;
|
|
63
|
+
$s_start = [サシスセソさしすせそ] ;
|
|
64
|
+
$j_start = [シし] $voice ;
|
|
65
|
+
$t_start = [タチツテトたちつてと] ;
|
|
66
|
+
$n_start = [ナニヌネノンなにぬねの] ;
|
|
67
|
+
$h_start = [ハヒヘホはひへほ] ;
|
|
68
|
+
$f_start = [フふ] ;
|
|
69
|
+
$m_start = [マミムメモまみむめも] ;
|
|
70
|
+
$y_start = [ヤユヨやゆよ] ;
|
|
71
|
+
$r_start = [ラリルレロらりるれろ] ;
|
|
72
|
+
$w_start = [ワヰヱヲわゐゑを] ;
|
|
73
|
+
$v_start = [ワヰヱヲ]゙ ;
|
|
74
|
+
$voweled_basekana = [ァ-オカキクケコサシスセソタチッツテトナ-ノハヒフヘホマ-ヲヵヶ] ;
|
|
75
|
+
# if ン is followed by $n_quoter, then it needs an
|
|
76
|
+
# apostrophe after its romaji form to disambiguate it.
|
|
77
|
+
# e.g., ン ア != ナ, so represent as "n'a", not "na".
|
|
78
|
+
$n_quoter = [ア イ ウ エ オ ナ ニ ヌ ネ ノ ヤ ユ ヨ ン] ;
|
|
79
|
+
$small_y = [ャィュェョ] ;
|
|
80
|
+
$iteration = ゝ ;
|
|
81
|
+
#------------------------------------------------------
|
|
82
|
+
# katakana rules
|
|
83
|
+
# Punctuation
|
|
84
|
+
'.' ↔ 。;
|
|
85
|
+
',' ↔ 、;
|
|
86
|
+
# ' ' } [a-z] → ; # delete spaces before latin
|
|
87
|
+
# ' ' ← [^' '゠-ヿ] {} ['゠-ヿ] ; # insert spaces before katakana
|
|
88
|
+
# Iteration Mark
|
|
89
|
+
# Copy previous letter § marks
|
|
90
|
+
# TODO
|
|
91
|
+
# | $1 $1 ← ($kana [[:M:]$voice$semivoice]?) $iteration
|
|
92
|
+
# Specials for katakana -- not shared with hiragana
|
|
93
|
+
va ↔ ヷ ;
|
|
94
|
+
vi ↔ ヸ ;
|
|
95
|
+
ve ↔ ヹ ;
|
|
96
|
+
vo ↔ ヺ ;
|
|
97
|
+
'~ka' ↔ ヵ ;
|
|
98
|
+
'~ke' ↔ ヶ ;
|
|
99
|
+
# ~~~ begin shared rules ~~~
|
|
100
|
+
#special
|
|
101
|
+
ya ← '~'ャ;
|
|
102
|
+
yi ← '~'ィ ;
|
|
103
|
+
yu ← '~'ュ;
|
|
104
|
+
ye ← '~'ェ;
|
|
105
|
+
yo ← '~'ョ;
|
|
106
|
+
#normal
|
|
107
|
+
a ↔ ア ;
|
|
108
|
+
b | '~' ← ヒ ゙} $small_y ;
|
|
109
|
+
by } $vowel → ビ | '~y' ;
|
|
110
|
+
ba ↔ バ ;
|
|
111
|
+
bi ↔ ビ ;
|
|
112
|
+
bu ↔ ブ ;
|
|
113
|
+
be ↔ ベ ;
|
|
114
|
+
bo ↔ ボ ;
|
|
115
|
+
c } i → | s ;
|
|
116
|
+
c } e → | s ;
|
|
117
|
+
da ↔ ダ ;
|
|
118
|
+
di ↔ ディ ;
|
|
119
|
+
du ↔ デゥ ;
|
|
120
|
+
de ↔ デ ;
|
|
121
|
+
do ↔ ド ;
|
|
122
|
+
dzu ↔ ヅ ;
|
|
123
|
+
dja ← ヂャ ;
|
|
124
|
+
dji'~i' ← ヂィ ; # liu
|
|
125
|
+
dju ← ヂュ ;
|
|
126
|
+
dje ← ヂェ ;
|
|
127
|
+
djo ← ヂョ ;
|
|
128
|
+
dji ↔ ヂ ;
|
|
129
|
+
dj } $vowel → ヂ | '~y' ;
|
|
130
|
+
# TODO: QUESTION: use ĵĴżŻ instead of dj, dz
|
|
131
|
+
cha ← チャ ;
|
|
132
|
+
chi'~i' ← チィ ; # liu
|
|
133
|
+
chu ← チュ ;
|
|
134
|
+
che ← チェ ;
|
|
135
|
+
cho ← チョ ;
|
|
136
|
+
chi ↔ チ ;
|
|
137
|
+
ch } $vowel → チ | '~y' ;
|
|
138
|
+
e ↔ エ ;
|
|
139
|
+
g | '~' ← ギ} $small_y ;
|
|
140
|
+
gy } $vowel → ギ | '~y' ;
|
|
141
|
+
ga ↔ ガ ;
|
|
142
|
+
gi ↔ ギ ;
|
|
143
|
+
gu ↔ グ ;
|
|
144
|
+
ge ↔ ゲ ;
|
|
145
|
+
go ↔ ゴ ;
|
|
146
|
+
i ↔ イ ;
|
|
147
|
+
# j } $vowel → ジ | '~y' ;
|
|
148
|
+
ja ↔ ジャ ;
|
|
149
|
+
ji'~i' ← ジィ ; # liu
|
|
150
|
+
ju ↔ ジュ ;
|
|
151
|
+
je ↔ ジェ ;
|
|
152
|
+
jo ↔ ジョ ;
|
|
153
|
+
ji ↔ ジ ;
|
|
154
|
+
k | '~' ← キ} $small_y ;
|
|
155
|
+
ky } $vowel → キ | '~y' ;
|
|
156
|
+
ka ↔ カ ;
|
|
157
|
+
ki ↔ キ ;
|
|
158
|
+
ku ↔ ク ;
|
|
159
|
+
ke ↔ ケ ;
|
|
160
|
+
ko ↔ コ ;
|
|
161
|
+
m | '~' ← ミ} $small_y ;
|
|
162
|
+
my } $vowel → ミ | '~y' ;
|
|
163
|
+
ma ↔ マ ;
|
|
164
|
+
mi ↔ ミ ;
|
|
165
|
+
mu ↔ ム ;
|
|
166
|
+
me ↔ メ ;
|
|
167
|
+
mo ↔ モ ;
|
|
168
|
+
m } [pbfv] → ン ;
|
|
169
|
+
n | '~' ← ニ } $small_y ;
|
|
170
|
+
ny } $vowel → ニ | '~y' ;
|
|
171
|
+
na ↔ ナ ;
|
|
172
|
+
ni ↔ ニ ;
|
|
173
|
+
nu ↔ ヌ ;
|
|
174
|
+
ne ↔ ネ ;
|
|
175
|
+
no ↔ ノ ;
|
|
176
|
+
o ↔ オ ;
|
|
177
|
+
p | '~' ← ピ } $small_y ;
|
|
178
|
+
py } $vowel → ピ | '~y' ;
|
|
179
|
+
pa ↔ パ ;
|
|
180
|
+
pi ↔ ピ ;
|
|
181
|
+
pu ↔ プ ;
|
|
182
|
+
pe ↔ ペ ;
|
|
183
|
+
po ↔ ポ ;
|
|
184
|
+
h | '~' ← ヒ } $small_y ;
|
|
185
|
+
hy } $vowel → ヒ | '~y' ;
|
|
186
|
+
ha ↔ ハ ;
|
|
187
|
+
hi ↔ ヒ ;
|
|
188
|
+
hu ↔ ヘゥ ;
|
|
189
|
+
he ↔ ヘ ;
|
|
190
|
+
ho ↔ ホ ;
|
|
191
|
+
# f | '~' ← フ } $small_y ;
|
|
192
|
+
# f } $vowel → フ | '~' ;
|
|
193
|
+
fa ↔ ファ ;
|
|
194
|
+
fi ↔ フィ ;
|
|
195
|
+
fe ↔ フェ ;
|
|
196
|
+
fo ↔ フォ ;
|
|
197
|
+
fu ↔ フ ;
|
|
198
|
+
r | '~' ← リ } $small_y ;
|
|
199
|
+
ry } $vowel → リ | '~y' ;
|
|
200
|
+
ra ↔ ラ ;
|
|
201
|
+
ri ↔ リ ;
|
|
202
|
+
ru ↔ ル ;
|
|
203
|
+
re ↔ レ ;
|
|
204
|
+
ro ↔ ロ ;
|
|
205
|
+
za ↔ ザ ;
|
|
206
|
+
zi ↔ ゼィ ;
|
|
207
|
+
zu ↔ ズ ;
|
|
208
|
+
ze ↔ ゼ ;
|
|
209
|
+
zo ↔ ゾ ;
|
|
210
|
+
sa ↔ サ ;
|
|
211
|
+
si ↔ セィ ;
|
|
212
|
+
su ↔ ス ;
|
|
213
|
+
se ↔ セ ;
|
|
214
|
+
so ↔ ソ ;
|
|
215
|
+
sha ← シャ ;
|
|
216
|
+
shi'~i' ← シィ ; # liu
|
|
217
|
+
shu ← シュ ;
|
|
218
|
+
she ← シェ ;
|
|
219
|
+
sho ← ショ ;
|
|
220
|
+
shi ↔ シ ;
|
|
221
|
+
sh } $vowel → シ | '~y' ;
|
|
222
|
+
ta ↔ タ ;
|
|
223
|
+
ti ↔ ティ ;
|
|
224
|
+
tu ↔ テゥ ;
|
|
225
|
+
te ↔ テ ;
|
|
226
|
+
to ↔ ト ;
|
|
227
|
+
tsu ↔ ツ ;
|
|
228
|
+
# v } $vowel → ヴ | '~' ;
|
|
229
|
+
#'v~a' ← ヴァ ; # liu
|
|
230
|
+
#'v~i' ← ヴィ ; # liu
|
|
231
|
+
#'v~e' ← ヴェ ; # liu
|
|
232
|
+
#'v~o' ← ヴォ ; # liu
|
|
233
|
+
vu ↔ ヴ ;
|
|
234
|
+
u ↔ ウ ;
|
|
235
|
+
# w } $vowel → ウ | '~' ;
|
|
236
|
+
wa ↔ ワ ;
|
|
237
|
+
wi ↔ ヰ ;
|
|
238
|
+
wu → ウ ;
|
|
239
|
+
we ↔ ヱ ;
|
|
240
|
+
wo ↔ ヲ ;
|
|
241
|
+
ya ↔ ヤ ;
|
|
242
|
+
yi → イ ;
|
|
243
|
+
yu ↔ ユ ;
|
|
244
|
+
ye → エ ;
|
|
245
|
+
yo ↔ ヨ ;
|
|
246
|
+
# double consonants
|
|
247
|
+
#specials
|
|
248
|
+
s } sh → ッ ;
|
|
249
|
+
t } ch → ッ ;
|
|
250
|
+
#voiced
|
|
251
|
+
j } j ↔ ッ } $j_start ;
|
|
252
|
+
b } b ↔ ッ } [$h_start$f_start] $voice;
|
|
253
|
+
d } d ↔ ッ } $t_start $voice;
|
|
254
|
+
g } g ↔ ッ } $k_start $voice;
|
|
255
|
+
p } p ↔ ッ } [$h_start$f_start] $semivoice;
|
|
256
|
+
# v } v ↔ ッ } [ワヰウヱヲう] $voice ;
|
|
257
|
+
z } z ↔ ッ } $s_start $voice;
|
|
258
|
+
v } v ↔ ッ } $v_start;
|
|
259
|
+
# normal
|
|
260
|
+
k } k ↔ ッ } $k_start ;
|
|
261
|
+
m } m ↔ ッ } $m_start ;
|
|
262
|
+
n } n ↔ ッ } $n_start ;
|
|
263
|
+
h } h ↔ ッ } $h_start ;
|
|
264
|
+
f } f ↔ ッ } $f_start ;
|
|
265
|
+
r } r ↔ ッ } $r_start ;
|
|
266
|
+
t } t ↔ ッ } $t_start ;
|
|
267
|
+
s } s ↔ ッ } $s_start ;
|
|
268
|
+
w } w ↔ ッ } $w_start;
|
|
269
|
+
y } y ↔ ッ } $y_start;
|
|
270
|
+
# completeness
|
|
271
|
+
x } x → ッ ;
|
|
272
|
+
c } k → ッ ;
|
|
273
|
+
c } c → ッ ;
|
|
274
|
+
c } q → ッ ;
|
|
275
|
+
l } l → ッ ;
|
|
276
|
+
q } q → ッ ;
|
|
277
|
+
# y } y → ッ ;
|
|
278
|
+
# w } w → ッ ;
|
|
279
|
+
# prolonged vowel mark. this indicates a doubling of
|
|
280
|
+
# the preceding vowel sound
|
|
281
|
+
#a ← a { ー ; # liu
|
|
282
|
+
#e ← e { ー ; # liu
|
|
283
|
+
#i ← i { ー ; # liu
|
|
284
|
+
#o ← o { ー ; # liu
|
|
285
|
+
#u ← u { ー ; # liu
|
|
286
|
+
$macron ↔ ー ;
|
|
287
|
+
# small forms
|
|
288
|
+
'~a' ↔ ァ ;
|
|
289
|
+
'~i' ↔ ィ ;
|
|
290
|
+
'~u' ↔ ゥ ;
|
|
291
|
+
'~e' ↔ ェ ;
|
|
292
|
+
'~o' ↔ ォ ;
|
|
293
|
+
'~tsu' ↔ ッ ;
|
|
294
|
+
'~wa' ↔ ヮ ;
|
|
295
|
+
'~ya' ↔ ャ ;
|
|
296
|
+
'~yi' → ィ ;
|
|
297
|
+
'~yu' ↔ ュ ;
|
|
298
|
+
'~ye' → ェ ;
|
|
299
|
+
'~yo' ↔ ョ ;
|
|
300
|
+
# iteration marks
|
|
301
|
+
# TODO: make more accurate
|
|
302
|
+
j $1 ← sh (y* $vowel) {ヽ$voice ;
|
|
303
|
+
dj $1 ← ch (y* $vowel) {ヽ$voice ;
|
|
304
|
+
dz $1 ← ts (y* $vowel) {ヽ$voice ;
|
|
305
|
+
g $1 ← k (y* $vowel) {ヽ$voice ;
|
|
306
|
+
z $1 ← s (y* $vowel) {ヽ$voice ;
|
|
307
|
+
d $1 ← t (y* $vowel) {ヽ$voice ;
|
|
308
|
+
b $1 ← h (y* $vowel) {ヽ$voice ; # voiced iteration mark after an h-row syllable repeats it voiced as b-row (e.g. ha + ヾ gives haba)
|
|
309
|
+
v $1 ← w (y* $vowel) {ヽ$voice ;
|
|
310
|
+
sh $1 ← sh (y* $vowel) {ヽ$voice ;
|
|
311
|
+
j $1 ← j (y* $vowel) {ヽ$voice ;
|
|
312
|
+
ch $1 ← ch (y* $vowel) {ヽ$voice ;
|
|
313
|
+
dj $1 ← dj(y* $vowel) {ヽ$voice ;
|
|
314
|
+
ts $1 ← ts (y* $vowel) {ヽ$voice ;
|
|
315
|
+
dz $1 ← dz (y* $vowel) {ヽ$voice ;
|
|
316
|
+
$1 ← ($consonant y* $vowel) {ヽ$voice? ;
|
|
317
|
+
$1 ← (.) {ヽ $voice? ; # otherwise repeat last character
|
|
318
|
+
← ヽ $voice? ; # delete if no characters found
|
|
319
|
+
# h- rule: lengthens vowel if not followed by a vowel.
|
|
320
|
+
# At the point this is applied, latin [cons]?vowel sequences
|
|
321
|
+
# have been converted to katakana in NFD form.
|
|
322
|
+
$voweled_basekana [\u3099 \u309A]? { h → ー ;
|
|
323
|
+
# one-way latin- → kana rules. these do not occur in
|
|
324
|
+
# well-formed romaji representing actual japanese text.
|
|
325
|
+
# their purpose is to make all romaji map to kana of
|
|
326
|
+
# some sort.
|
|
327
|
+
# the following are not really necessary, but produce
|
|
328
|
+
# slightly more natural results.
|
|
329
|
+
cy → セィ ;
|
|
330
|
+
dy → ディ ;
|
|
331
|
+
hy → ヒ ;
|
|
332
|
+
sy → セィ ;
|
|
333
|
+
ty → ティ ;
|
|
334
|
+
zy → ゼィ ;
|
|
335
|
+
h → ヘ ;
|
|
336
|
+
# isolated consonants listed here so as not to mask
|
|
337
|
+
# longer rules above.
|
|
338
|
+
ch → チ;
|
|
339
|
+
sh → シ ;
|
|
340
|
+
dz → ヅ ;
|
|
341
|
+
dj → ヂ;
|
|
342
|
+
b → ブ ;
|
|
343
|
+
d → デ ;
|
|
344
|
+
g → グ ;
|
|
345
|
+
k → ク ;
|
|
346
|
+
m → ム ;
|
|
347
|
+
n'' ← ン } $n_quoter ;
|
|
348
|
+
n ↔ ン ;
|
|
349
|
+
p → プ ;
|
|
350
|
+
r → ル ;
|
|
351
|
+
s → ス ;
|
|
352
|
+
t → テ ;
|
|
353
|
+
y → イ ;
|
|
354
|
+
z → ズ ;
|
|
355
|
+
v → ヴ ;
|
|
356
|
+
f → フ;
|
|
357
|
+
j → ジ;
|
|
358
|
+
w → ウ;
|
|
359
|
+
ß → | ss ;
|
|
360
|
+
æ → | e ;
|
|
361
|
+
ð → | d ;
|
|
362
|
+
ø → | u ;
|
|
363
|
+
þ → | th ;
|
|
364
|
+
# simple substitutions using backup
|
|
365
|
+
c → | k ;
|
|
366
|
+
l → | r ;
|
|
367
|
+
q → | k ;
|
|
368
|
+
x → | ks ;
|
|
369
|
+
# ~~~ END shared rules ~~~
|
|
370
|
+
#------------------------------------------------------
|
|
371
|
+
# Final cleanup
|
|
372
|
+
'~' → ; # delete stray tildes between letters
|
|
373
|
+
[:Katakana:] { '' } [:Latin:] → ; # delete stray quotes between letters
|
|
374
|
+
# [ʾ[:Nonspacing Mark:]-[゙-゜]] → ; # delete any non-spacing marks that we didn't use
|
|
375
|
+
:: NFC (NFD) ;
|
|
376
|
+
:: ([[:Katakana:][\u309B\u309C\u30A0\u30FC\uFF70\uFF9E\uFF9F]] halfwidth-fullwidth);
|
|
377
|
+
# note: a global filter is more efficient, but MUST include all source chars!!
|
|
378
|
+
#:: ([\u0000-\u007E 、。 ゙-゜ ァ-ー 。-゚ [:Latin:][:Katakana:] [:nonspacing mark:]]);
|
|
379
|
+
# MINIMAL FILTER GENERATED FOR: Latin-Katakana BACKWARD
|
|
380
|
+
:: ( [[\ -~¢-£¥-¦¬̄₩。-하-ᅦᅧ-ᅬᅭ-ᅲᅳ-ᅵ│-○][~、-。がぎぐげござじずぜぞだぢづでどば-ぱび-ぴぶ-ぷべ-ぺぼ-ぽゔ゙-゛ゞァ-ヺー-ヾ][\u309B\u309C\u30A0\u30FC\uFF70\uFF9E\uFF9F]] ) ;
|
|
381
|
+
# eof
|
|
382
|
+
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
|
|
2
|
+
::['.0-9A-Za-z~À-ÅÇ-ÏÑ-ÖÙ-Ýà-åç-ïñ-öù-ýÿ-ďĒ-ĥĨ-İĴ-ķĹ-ľŃ-ňŌ-őŔ-ťŨ-žƠ-ơƯ-ưǍ-ǜǞ-ǣǦ-ǭǰǴ-ǵǸ-țȞ-ȟȦ-ȳʔ́̃-̄̆-̇̐̔-̣̥̱́̈́̕΅-ΆΈ-ΊΌΎ-ΐά-ΰό-ώϓЃЌЎЙйѓќўӁ-ӂӐ-ӑӖ-ӗӢ-ӣӮ-ӯḀ-ẙẠ-ỹἁἃ-ἅἇἉἋ-ἍἏἑἓ-ἕἙἛ-Ἕἡἣ-ἥἧἩἫ-ἭἯἱἳ-ἵἷἹἻ-ἽἿὁὃ-ὅὉὋ-Ὅὑὓ-ὕὗὙὛὝὟὡὣ-ὥὧὩὫ-ὭὯάέήίόύώᾁᾃ-ᾅᾇᾉᾋ-ᾍᾏᾑᾓ-ᾕᾗᾙᾛ-ᾝᾟᾡᾣ-ᾥᾧᾩᾫ-ᾭᾯ-ᾱᾴᾸ-ᾹΆῄΈΉ῎ῐ-ῑΐῘ-ῙΊ῞ῠ-ῡΰῥῨ-ῩΎ-Ῥ΅ῴΌΏK-Å\uE04D\uE064];
|
|
3
|
+
::NFD;
|
|
4
|
+
::Lower;
|
|
5
|
+
::Latin-InterIndic;
|
|
6
|
+
::InterIndic-Malayalam;
|
|
7
|
+
::NFC;
|
|
8
|
+
|
|
@@ -0,0 +1,29 @@
|
|
|
1
|
+
|
|
2
|
+
# According to the pinyin definitions I've been able to find:
|
|
3
|
+
# 'a', 'e' are the preferred bases
|
|
4
|
+
# otherwise 'o'
|
|
5
|
+
# otherwise last vowel
|
|
6
|
+
# The trailing forms of syllables are the following:
|
|
7
|
+
# "a", "ai", "ao", "an", "ang",
|
|
8
|
+
# "o", "ou", "ong",
|
|
9
|
+
# "e", "ei", "er", "en", "eng",
|
|
10
|
+
# "i", "ia", "iao", "ie", "iu", "ian", "in", "iang", "ing", "iong",
|
|
11
|
+
# "u", "ua", "uo", "uai", "ui", "uan", "un", "uang", "ueng",
|
|
12
|
+
# "ü", "üe", "üan", "ün"
|
|
13
|
+
# so the letters the tone will 'hop' are:
|
|
14
|
+
::NFD (NFC);
|
|
15
|
+
$tone = [̄́̌̀̆] ;
|
|
16
|
+
# Move the tone to the end of a syllable, and convert to number
|
|
17
|
+
e {($tone) r} → r &Pinyin-NumericPinyin($1);
|
|
18
|
+
($tone) ( [i o n u {o n} {n g}]) → $2 &Pinyin-NumericPinyin($1);
|
|
19
|
+
($tone) → &Pinyin-NumericPinyin($1);
|
|
20
|
+
# The following backs up until it finds the right vowel, then deposits the tone
|
|
21
|
+
$vowel = [aAeEiIoOuU {ü} {Ü} vV];
|
|
22
|
+
$consonant = [[a-z A-Z] - [$vowel]];
|
|
23
|
+
$digit = [1-5];
|
|
24
|
+
$1 &NumericPinyin-Pinyin($3) $2 ← ([aAeE]) ($vowel* $consonant*) ($digit);
|
|
25
|
+
$1 &NumericPinyin-Pinyin($3) $2 ← ([oO]) ([$vowel-[aeAE]]* $consonant*) ($digit);
|
|
26
|
+
$1 &NumericPinyin-Pinyin($3) $2 ← ($vowel) ($consonant*) ($digit);
|
|
27
|
+
&NumericPinyin-Pinyin($1) ← [:letter:] {($digit)};
|
|
28
|
+
::NFC (NFD);
|
|
29
|
+
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
|
|
2
|
+
::['.0-9A-Za-z~À-ÅÇ-ÏÑ-ÖÙ-Ýà-åç-ïñ-öù-ýÿ-ďĒ-ĥĨ-İĴ-ķĹ-ľŃ-ňŌ-őŔ-ťŨ-žƠ-ơƯ-ưǍ-ǜǞ-ǣǦ-ǭǰǴ-ǵǸ-țȞ-ȟȦ-ȳʔ́̃-̄̆-̇̐̔-̣̥̱́̈́̕΅-ΆΈ-ΊΌΎ-ΐά-ΰό-ώϓЃЌЎЙйѓќўӁ-ӂӐ-ӑӖ-ӗӢ-ӣӮ-ӯḀ-ẙẠ-ỹἁἃ-ἅἇἉἋ-ἍἏἑἓ-ἕἙἛ-Ἕἡἣ-ἥἧἩἫ-ἭἯἱἳ-ἵἷἹἻ-ἽἿὁὃ-ὅὉὋ-Ὅὑὓ-ὕὗὙὛὝὟὡὣ-ὥὧὩὫ-ὭὯάέήίόύώᾁᾃ-ᾅᾇᾉᾋ-ᾍᾏᾑᾓ-ᾕᾗᾙᾛ-ᾝᾟᾡᾣ-ᾥᾧᾩᾫ-ᾭᾯ-ᾱᾴᾸ-ᾹΆῄΈΉ῎ῐ-ῑΐῘ-ῙΊ῞ῠ-ῡΰῥῨ-ῩΎ-Ῥ΅ῴΌΏK-Å\uE04D\uE064];
|
|
3
|
+
::NFD;
|
|
4
|
+
::Lower;
|
|
5
|
+
::Latin-InterIndic;
|
|
6
|
+
::InterIndic-Oriya;
|
|
7
|
+
::NFC;
|
|
8
|
+
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
|
|
2
|
+
::['.0-9A-Za-z~À-ÅÇ-ÏÑ-ÖÙ-Ýà-åç-ïñ-öù-ýÿ-ďĒ-ĥĨ-İĴ-ķĹ-ľŃ-ňŌ-őŔ-ťŨ-žƠ-ơƯ-ưǍ-ǜǞ-ǣǦ-ǭǰǴ-ǵǸ-țȞ-ȟȦ-ȳʔ́̃-̄̆-̇̐̔-̣̥̱́̈́̕΅-ΆΈ-ΊΌΎ-ΐά-ΰό-ώϓЃЌЎЙйѓќўӁ-ӂӐ-ӑӖ-ӗӢ-ӣӮ-ӯḀ-ẙẠ-ỹἁἃ-ἅἇἉἋ-ἍἏἑἓ-ἕἙἛ-Ἕἡἣ-ἥἧἩἫ-ἭἯἱἳ-ἵἷἹἻ-ἽἿὁὃ-ὅὉὋ-Ὅὑὓ-ὕὗὙὛὝὟὡὣ-ὥὧὩὫ-ὭὯάέήίόύώᾁᾃ-ᾅᾇᾉᾋ-ᾍᾏᾑᾓ-ᾕᾗᾙᾛ-ᾝᾟᾡᾣ-ᾥᾧᾩᾫ-ᾭᾯ-ᾱᾴᾸ-ᾹΆῄΈΉ῎ῐ-ῑΐῘ-ῙΊ῞ῠ-ῡΰῥῨ-ῩΎ-Ῥ΅ῴΌΏK-Å\uE04D\uE064];
|
|
3
|
+
::NFD;
|
|
4
|
+
::Lower;
|
|
5
|
+
::Latin-InterIndic;
|
|
6
|
+
::InterIndic-Tamil;
|
|
7
|
+
::NFC;
|
|
8
|
+
|
|
@@ -0,0 +1,8 @@
|
|
|
1
|
+
|
|
2
|
+
::['.0-9A-Za-z~À-ÅÇ-ÏÑ-ÖÙ-Ýà-åç-ïñ-öù-ýÿ-ďĒ-ĥĨ-İĴ-ķĹ-ľŃ-ňŌ-őŔ-ťŨ-žƠ-ơƯ-ưǍ-ǜǞ-ǣǦ-ǭǰǴ-ǵǸ-țȞ-ȟȦ-ȳʔ́̃-̄̆-̇̐̔-̣̥̱́̈́̕΅-ΆΈ-ΊΌΎ-ΐά-ΰό-ώϓЃЌЎЙйѓќўӁ-ӂӐ-ӑӖ-ӗӢ-ӣӮ-ӯḀ-ẙẠ-ỹἁἃ-ἅἇἉἋ-ἍἏἑἓ-ἕἙἛ-Ἕἡἣ-ἥἧἩἫ-ἭἯἱἳ-ἵἷἹἻ-ἽἿὁὃ-ὅὉὋ-Ὅὑὓ-ὕὗὙὛὝὟὡὣ-ὥὧὩὫ-ὭὯάέήίόύώᾁᾃ-ᾅᾇᾉᾋ-ᾍᾏᾑᾓ-ᾕᾗᾙᾛ-ᾝᾟᾡᾣ-ᾥᾧᾩᾫ-ᾭᾯ-ᾱᾴᾸ-ᾹΆῄΈΉ῎ῐ-ῑΐῘ-ῙΊ῞ῠ-ῡΰῥῨ-ῩΎ-Ῥ΅ῴΌΏK-Å\uE04D\uE064];
|
|
3
|
+
::NFD;
|
|
4
|
+
::Lower;
|
|
5
|
+
::Latin-InterIndic;
|
|
6
|
+
::InterIndic-Telugu;
|
|
7
|
+
::NFC;
|
|
8
|
+
|