interscript-maps 2.0.5
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/README.adoc +28 -0
- data/interscript-maps.gemspec +28 -0
- data/interscript-maps.yaml +235 -0
- data/libs/posix.iml +11 -0
- data/libs/unicode.iml +13 -0
- data/libs/var-Cyrl.iml +7 -0
- data/libs/var-kor.iml +17 -0
- data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
- data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
- data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
- data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
- data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
- data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
- data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
- data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
- data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
- data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
- data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
- data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
- data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
- data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
- data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
- data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
- data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
- data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
- data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
- data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
- data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
- data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
- data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
- data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
- data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
- data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
- data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
- data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
- data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
- data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
- data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
- data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
- data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
- data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
- data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
- data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
- data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
- data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
- data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
- data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
- data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
- data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
- data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
- data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
- data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
- data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
- data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
- data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
- data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
- data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
- data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
- data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
- data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
- data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
- data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
- data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
- data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
- data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
- data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
- data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
- data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
- data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
- data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
- data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
- data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
- data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
- data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
- data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
- data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
- data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
- data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
- data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
- data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
- data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
- data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
- data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
- data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
- data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
- data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
- data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
- data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
- data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
- data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
- data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
- data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
- data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
- data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
- data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
- data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
- data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
- data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
- data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
- data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
- data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
- data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
- data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
- data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
- data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
- data/maps/un-ara-Arab-Latn-1971.imp +137 -0
- data/maps/un-ara-Arab-Latn-1972.imp +155 -0
- data/maps/un-ara-Arab-Latn-2017.imp +375 -0
- data/maps/un-asm-Beng-Latn-1972.imp +188 -0
- data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
- data/maps/un-ben-Beng-Latn-2016.imp +516 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
- data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
- data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
- data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
- data/maps/un-hin-Deva-Latn-2016.imp +356 -0
- data/maps/un-kan-Kana-Latn-2016.imp +214 -0
- data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
- data/maps/un-mar-Deva-Latn-2016.imp +96 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
- data/maps/un-nep-Deva-Latn-1972.imp +295 -0
- data/maps/un-nep-Deva-Latn-2013.imp +62 -0
- data/maps/un-ori-Orya-Latn-1972.imp +208 -0
- data/maps/un-pan-Guru-Latn-1972.imp +321 -0
- data/maps/un-prs-Arab-Latn-1967.imp +214 -0
- data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
- data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
- data/maps/un-tam-Taml-Latn-1972.imp +173 -0
- data/maps/un-tel-Telu-Latn-1972.imp +229 -0
- data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
- data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
- data/maps/un-urd-Arab-Latn-1972.imp +290 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
- data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
- data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
- data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
- data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
- data/maps/var-mon-Mong-Latn-1930.imp +101 -0
- data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
- data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
- data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
- data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
- data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
- metadata +335 -0
@@ -0,0 +1,475 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: moct
|
3
|
+
id: 2000-viajamo
|
4
|
+
language: iso-639-2:kor
|
5
|
+
source_script: Hang
|
6
|
+
destination_script: Latn
|
7
|
+
name: Korean Ministry of Culture and Tourism 2000 System
|
8
|
+
url: https://www.korean.go.kr/front_eng/roman/roman_01.do
|
9
|
+
creation_date: 2000
|
10
|
+
adoption_date: 2002
|
11
|
+
description: |
|
12
|
+
Generation of Jamo from Hangul
|
13
|
+
|
14
|
+
This is how the Hangul-to-Jamo maps are generated. Please refer to this page
|
15
|
+
for details about Korean text handling in Unicode.
|
16
|
+
http://gernot-katzers-spice-pages.com/var/korean_hangul_unicode.html
|
17
|
+
|
18
|
+
This formula copied from the page above is used:
|
19
|
+
[stem]
|
20
|
+
====
|
21
|
+
tail = mod (Hangul codepoint − 44032, 28)
|
22
|
+
vowel = 1 + mod (Hangul codepoint − 44032 − tail, 588) / 28
|
23
|
+
lead = 1 + int [ (Hangul codepoint − 44032)/588 ]
|
24
|
+
====
|
25
|
+
|
26
|
+
[source,python]
|
27
|
+
----
|
28
|
+
import pandas as pd
|
29
|
+
import re
|
30
|
+
import math
|
31
|
+
|
32
|
+
leadjamo = [chr(0x1100+i) for i in range(0,19)]
|
33
|
+
# ᄀᄁᄂᄃᄄᄅᄆᄇᄈᄉᄊᄋᄌᄍᄎᄏᄐᄑᄒ
|
34
|
+
voweljamo = [chr(0x1161+i) for i in range(0,21)]
|
35
|
+
# ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ
|
36
|
+
tailjamo = ['']+[chr(0x11A8+i) for i in range(0,27)]
|
37
|
+
# ᆨᆩᆪᆫᆬᆭᆮᆯᆰᆱᆲᆳᆴᆵᆶᆷᆸᆹᆺᆻᆼᆽᆾᆿᇀᇁᇂ
|
38
|
+
|
39
|
+
hanguls = [chr(i) for i in range(44032,55204)]
|
40
|
+
tails = [tailjamo[(i-44032) % 28] for i in range(44032,55204)]
|
41
|
+
vowels = [voweljamo[((i-44032-((i-44032) % 28)) % 588) // 28] for i in range(44032,55204)]
|
42
|
+
leads = [leadjamo[math.floor((i-44032)// 588)] for i in range(44032,55204)]
|
43
|
+
|
44
|
+
kr_df = pd.DataFrame({'Hangul':hanguls, 'Lead':leads,'Vowel':vowels, 'Tail':tails})
|
45
|
+
----
|
46
|
+
|
47
|
+
Hangul Lead Vowel Tail
|
48
|
+
0 가 ᄀ ᅡ
|
49
|
+
1 각 ᄀ ᅡ ᆨ
|
50
|
+
2 갂 ᄀ ᅡ ᆩ
|
51
|
+
3 갃 ᄀ ᅡ ᆪ
|
52
|
+
4 간 ᄀ ᅡ ᆫ
|
53
|
+
5 갅 ᄀ ᅡ ᆬ
|
54
|
+
6 갆 ᄀ ᅡ ᆭ
|
55
|
+
7 갇 ᄀ ᅡ ᆮ
|
56
|
+
8 갈 ᄀ ᅡ ᆯ
|
57
|
+
9 갉 ᄀ ᅡ ᆰ
|
58
|
+
|
59
|
+
notes: []
|
60
|
+
}
|
61
|
+
|
62
|
+
tests {
|
63
|
+
test "불국사", "Bulguksa"
|
64
|
+
test "묵호", "Mukho"
|
65
|
+
test "울산", "Ulsan"
|
66
|
+
test "독립문", "Dongnimmun"
|
67
|
+
test "강남역", "Gangnamyeok"
|
68
|
+
test "남산리", "Namsan-ri" #Note: no assimilation for -ri even after nasals
|
69
|
+
test "내월리", "Naewol-ri"
|
70
|
+
test "울릉군", "Ulleung-gun"
|
71
|
+
test "설악산", "Seoraksan"
|
72
|
+
test "삼죽면", "Samjuk-myeon"
|
73
|
+
test "평리1동", "Pyeongni Il-dong"
|
74
|
+
test "평리2동", "Pyeongni I-dong"
|
75
|
+
test "탑안이", "Tabani"
|
76
|
+
}
|
77
|
+
|
78
|
+
dependency "var-kor", import: true
|
79
|
+
dependency "var-kor-Hang-Hang-jamo", as: hangjamo
|
80
|
+
|
81
|
+
# These aliases may eventually belong in a shared Korean library
|
82
|
+
aliases {
|
83
|
+
def_alias double_cons_jamo, any("ᄁᄄᄈᄍᄊ")
|
84
|
+
def_alias aspirated_cons_jamo, any("ᄏᄐᄑᄎ")
|
85
|
+
}
|
86
|
+
|
87
|
+
stage {
|
88
|
+
# convert numbers to space + Hangul
|
89
|
+
sub none, space, not_before: any([digit, space]), after: digit
|
90
|
+
sub "1", "일"
|
91
|
+
sub "2", "이"
|
92
|
+
sub "3", "삼"
|
93
|
+
sub "4", "사"
|
94
|
+
sub "5", "오"
|
95
|
+
sub "6", "육"
|
96
|
+
sub "7", "칠"
|
97
|
+
sub "8", "팔"
|
98
|
+
sub "9", "구"
|
99
|
+
|
100
|
+
# add hyphen in front of generics
|
101
|
+
sub none, "-", not_before: line_start, after: any("도시군구읍면리동가") + line_end
|
102
|
+
|
103
|
+
run map.hangjamo.stage.main
|
104
|
+
|
105
|
+
# Add space to the two ends of the string for easier word boundary handling
|
106
|
+
sub line_start, space
|
107
|
+
sub line_end, space
|
108
|
+
|
109
|
+
# HANGUL JONGSEONG SSANGKIYEOK
|
110
|
+
sub "ᆩᄋ", "ᆨᄁ"
|
111
|
+
sub "ᆩ", "ᆨ"
|
112
|
+
|
113
|
+
# HANGUL JONGSEONG KIYEOK-SIOS
|
114
|
+
sub "ᆪᄋ", "ᆨᄉ"
|
115
|
+
sub "ᆪ", "ᆨ"
|
116
|
+
|
117
|
+
# HANGUL JONGSEONG NIEUN-CIEUC
|
118
|
+
sub "ᆬᄋ", "ᆫᄌ"
|
119
|
+
sub "ᆬ", "ᆫ"
|
120
|
+
|
121
|
+
# HANGUL JONGSEONG NIEUN-HIEUH
|
122
|
+
sub "ᆭᄀ", "ᆫᄏ"
|
123
|
+
sub "ᆭᄃ", "ᆫᄐ"
|
124
|
+
sub "ᆭᄇ", "ᆫᄑ"
|
125
|
+
sub "ᆭᄌ", "ᆫᄎ"
|
126
|
+
sub "ᆭ", "ᆫ"
|
127
|
+
|
128
|
+
# HANGUL JONGSEONG TIEUT
|
129
|
+
sub "ᆮ", "ᆺ", after: any("ᄀᄁᄂᄃᄄᄅᄆᄇᄈᄉᄊᄌᄍᄎᄏᄐᄑᄒ")
|
130
|
+
|
131
|
+
# HANGUL JONGSEONG RIEUL-SIOS
|
132
|
+
sub "ᆳᄋ", "ᆯᄉ"
|
133
|
+
sub "ᆳ", "ᆯ"
|
134
|
+
|
135
|
+
# HANGUL JONGSEONG RIEUL-THIEUTH
|
136
|
+
sub "ᆴᄋ", "ᆯᄐ"
|
137
|
+
sub "ᆴ", "ᆯ"
|
138
|
+
|
139
|
+
# HANGUL JONGSEONG RIEUL-PHIEUPH
|
140
|
+
sub "ᆵᄋ", "ᆯᄑ"
|
141
|
+
sub "ᆵ", "ᆯ", after: any("ᄃᄄᄐ")
|
142
|
+
sub "ᆵ", "ᄇ"
|
143
|
+
|
144
|
+
parallel {
|
145
|
+
# HANGUL JONGSEONG RIEUL-HIEUH
|
146
|
+
sub "ᆶᄀ", "ᆯᄏ"
|
147
|
+
sub "ᆶᄃ", "ᆯᄐ"
|
148
|
+
sub "ᆶᄇ", "ᆯᄑ"
|
149
|
+
sub "ᆶᄌ", "ᆯᄎ"
|
150
|
+
sub "ᆶ", "ᆯ"
|
151
|
+
|
152
|
+
# HANGUL JONGSEONG PIEUP-SIOS
|
153
|
+
sub "ᆹᄋ", "ᄇᄉ"
|
154
|
+
sub "ᆹ", "ᄇ"
|
155
|
+
|
156
|
+
# HANGUL JONGSEONG SSANG-SIOS
|
157
|
+
sub "ᆻᄋ", "ᆺᄊ"
|
158
|
+
sub "ᆻ", "ᆺ"
|
159
|
+
|
160
|
+
# HANGUL JONGSEONG CIEUC
|
161
|
+
sub "ᆽᄋ", "ᆺᄌ"
|
162
|
+
sub "ᆽ", "ᆺ"
|
163
|
+
|
164
|
+
# HANGUL JONGSEONG CHIEUCH
|
165
|
+
sub "ᆾᄋ", "ᆺᄎ"
|
166
|
+
sub "ᆾ", "ᆺ"
|
167
|
+
|
168
|
+
# HANGUL JONGSEONG KHIEUKH
|
169
|
+
sub "ᆿᄋ", "ᆨᄏ"
|
170
|
+
sub "ᆿ", "ᆨ"
|
171
|
+
|
172
|
+
# HANGUL JONGSEONG THIEUTH
|
173
|
+
sub "ᇀᄋ", "ᆺᄐ"
|
174
|
+
sub "ᇀ", "ᆺ"
|
175
|
+
|
176
|
+
# HANGUL JONGSEONG PHIEUPH
|
177
|
+
sub "ᇁᄋ", "ᆸᄑ"
|
178
|
+
sub "ᇁ", "ᆸ"
|
179
|
+
|
180
|
+
# HANGUL JONGSEONG HIEUH
|
181
|
+
sub "ᇂᄀ", "ᄏ"
|
182
|
+
sub "ᇂᄃ", "ᄐ"
|
183
|
+
sub "ᇂᄇ", "ᄑ"
|
184
|
+
sub "ᇂᄌ", "ᄎ"
|
185
|
+
sub "ᇂ", ""
|
186
|
+
}
|
187
|
+
|
188
|
+
parallel {
|
189
|
+
# From Unicode Chart
|
190
|
+
# https://github.com/unicode-org/cldr/blob/master/common/transforms/Korean-Latin-BGN.xml
|
191
|
+
|
192
|
+
sub "ᆮᄋ", "d" # HANGUL JONGSEONG TIEUT + CHOSEONG IEUNG
|
193
|
+
|
194
|
+
sub "ᆨᄀ", "kg" # HANGUL JONGSEONG KIYEOK + CHOSEONG KIYEOK
|
195
|
+
sub "ᆨᄂ", "ngn" # HANGUL JONGSEONG KIYEOK + CHOSEONG NIEUN
|
196
|
+
sub "ᆨᄃ", "kd" # HANGUL JONGSEONG KIYEOK + CHOSEONG TIEUT
|
197
|
+
sub "ᆨᄅ", "ngn" # HANGUL JONGSEONG KIYEOK + CHOSEONG RIEUL
|
198
|
+
sub "ᆨᄆ", "ngm" # HANGUL JONGSEONG KIYEOK + CHOSEONG MIEUM
|
199
|
+
sub "ᆨᄇ", "kb" # HANGUL JONGSEONG KIYEOK + CHOSEONG PIEUP
|
200
|
+
sub "ᆨᄉ", "ks" # HANGUL JONGSEONG KIYEOK + CHOSEONG SIOS
|
201
|
+
sub "ᆨᄋ", "g" # HANGUL JONGSEONG KIYEOK + CHOSEONG IEUNG
|
202
|
+
sub "ᆨᄌ", "kj" # HANGUL JONGSEONG KIYEOK + CHOSEONG CIEUC
|
203
|
+
sub "ᆨᄎ", "kch" # HANGUL JONGSEONG KIYEOK + CHOSEONG CHIEUCH
|
204
|
+
sub "ᆨᄏ", "kk" # HANGUL JONGSEONG KIYEOK + CHOSEONG KHIEUKH # NOTE: the dash is always skipped
|
205
|
+
sub "ᆨᄐ", "kt" # HANGUL JONGSEONG KIYEOK + CHOSEONG THIEUTH
|
206
|
+
sub "ᆨᄑ", "kp" # HANGUL JONGSEONG KIYEOK + CHOSEONG PHIEUPH
|
207
|
+
sub "ᆨᄒ", "kh" # HANGUL JONGSEONG KIYEOK + CHOSEONG HIEUH
|
208
|
+
sub "ᆨᄁ", "kkk" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGKIYEOK
|
209
|
+
sub "ᆨᄄ", "ktt" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGTIEUT
|
210
|
+
sub "ᆨᄈ", "kpp" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGPIEUP
|
211
|
+
sub "ᆨᄊ", "kss" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGSIOS
|
212
|
+
sub "ᆨᄍ", "kjj" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGCIEUC
|
213
|
+
sub "ᆫᄀ", "ng" # HANGUL JONGSEONG NIEUN + CHOSEONG KIEUK
|
214
|
+
sub "ᆫᄂ", "nn" # HANGUL JONGSEONG NIEUN + CHOSEONG NIEUN
|
215
|
+
sub "ᆫᄃ", "nd" # HANGUL JONGSEONG NIEUN + CHOSEONG TIEUT
|
216
|
+
sub "ᆫᄅ", "ll" # HANGUL JONGSEONG NIEUN + CHOSEONG RIEUL
|
217
|
+
sub "ᆫᄆ", "nm" # HANGUL JONGSEONG NIEUN + CHOSEONG MIEUM
|
218
|
+
sub "ᆫᄇ", "nb" # HANGUL JONGSEONG NIEUN + CHOSEONG PIEUP
|
219
|
+
sub "ᆫᄉ", "ns" # HANGUL JONGSEONG NIEUN + CHOSEONG SIOS
|
220
|
+
sub "ᆫᄋ", "n" # HANGUL JONGSEONG NIEUN + CHOSEONG IEUNG
|
221
|
+
sub "ᆫᄌ", "nj" # HANGUL JONGSEONG NIEUN + CHOSEONG CIEUC
|
222
|
+
sub "ᆫᄎ", "nch" # HANGUL JONGSEONG NIEUN + CHOSEONG CHIEUCH
|
223
|
+
sub "ᆫᄏ", "nk" # HANGUL JONGSEONG NIEUN + CHOSEONG KHIEUKH
|
224
|
+
sub "ᆫᄐ", "nt" # HANGUL JONGSEONG NIEUN + CHOSEONG THIEUTH
|
225
|
+
sub "ᆫᄑ", "np" # HANGUL JONGSEONG NIEUN + CHOSEONG PHIEUPH
|
226
|
+
sub "ᆫᄒ", "nh" # HANGUL JONGSEONG NIEUN + CHOSEONG HIEUH
|
227
|
+
sub "ᆫᄁ", "nkk" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGKIYEOK
|
228
|
+
sub "ᆫᄄ", "ntt" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGTIEUT
|
229
|
+
sub "ᆫᄈ", "npp" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGPIEUP
|
230
|
+
sub "ᆫᄊ", "nss" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGSIOS
|
231
|
+
sub "ᆫᄍ", "njj" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGCIEUC
|
232
|
+
sub "ᆯᄀ", "lg" # HANGUL JONGSEONG RIEUL + CHOSEONG KIYEOK
|
233
|
+
sub "ᆯᄂ", "ll" # HANGUL JONGSEONG RIEUL + CHOSEONG NIEUN
|
234
|
+
sub "ᆯᄃ", "ld" # HANGUL JONGSEONG RIEUL + CHOSEONG TIEUT
|
235
|
+
sub "ᆯᄅ", "ll" # HANGUL JONGSEONG RIEUL + CHOSEONG RIEUL
|
236
|
+
sub "ᆯᄆ", "lm" # HANGUL JONGSEONG RIEUL + CHOSEONG MIEUM
|
237
|
+
sub "ᆯᄇ", "lb" # HANGUL JONGSEONG RIEUL + CHOSEONG PIEUP
|
238
|
+
sub "ᆯᄉ", "ls" # HANGUL JONGSEONG RIEUL + CHOSEONG SIOS
|
239
|
+
sub "ᆯᄋ", "r" # HANGUL JONGSEONG RIEUL + CHOSEONG IEUNG
|
240
|
+
sub "ᆯᄌ", "lj" # HANGUL JONGSEONG RIEUL + CHOSEONG CIEUC
|
241
|
+
sub "ᆯᄎ", "lch" # HANGUL JONGSEONG RIEUL + CHOSEONG CHIEUCH
|
242
|
+
sub "ᆯᄏ", "lk" # HANGUL JONGSEONG RIEUL + CHOSEONG KHIEUKH
|
243
|
+
sub "ᆯᄐ", "lt" # HANGUL JONGSEONG RIEUL + CHOSEONG THIEUTH
|
244
|
+
sub "ᆯᄑ", "lp" # HANGUL JONGSEONG RIEUL + CHOSEONG PHIEUPH
|
245
|
+
sub "ᆯᄒ", "rh" # HANGUL JONGSEONG RIEUL + CHOSEONG HIEUH
|
246
|
+
sub "ᆯᄁ", "lkk" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGKIYEOK
|
247
|
+
sub "ᆯᄄ", "ltt" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGTIEUT
|
248
|
+
sub "ᆯᄈ", "lpp" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGPIEUP
|
249
|
+
sub "ᆯᄊ", "lss" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGSIOS
|
250
|
+
sub "ᆯᄍ", "ljj" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGCIEUC
|
251
|
+
sub "ᆷᄀ", "mg" # HANGUL JONGSEONG MIEUM + CHOSEONG KIYEOK
|
252
|
+
sub "ᆷᄂ", "mn" # HANGUL JONGSEONG MIEUM + CHOSEONG NIEUN
|
253
|
+
sub "ᆷᄃ", "md" # HANGUL JONGSEONG MIEUM + CHOSEONG TIEUT
|
254
|
+
sub "ᆷᄅ", "mn" # HANGUL JONGSEONG MIEUM + CHOSEONG RIEUL
|
255
|
+
sub "ᆷᄆ", "mm" # HANGUL JONGSEONG MIEUM + CHOSEONG MIEUM
|
256
|
+
sub "ᆷᄇ", "mb" # HANGUL JONGSEONG MIEUM + CHOSEONG PIEUP
|
257
|
+
sub "ᆷᄉ", "ms" # HANGUL JONGSEONG MIEUM + CHOSEONG SIOS
|
258
|
+
sub "ᆷᄋ", "m" # HANGUL JONGSEONG MIEUM + CHOSEONG IEUNG
|
259
|
+
sub "ᆷᄌ", "mj" # HANGUL JONGSEONG MIEUM + CHOSEONG CIEUC
|
260
|
+
sub "ᆷᄎ", "mch" # HANGUL JONGSEONG MIEUM + CHOSEONG CHIEUCH
|
261
|
+
sub "ᆷᄏ", "mk" # HANGUL JONGSEONG MIEUM + CHOSEONG KHIEUKH
|
262
|
+
sub "ᆷᄐ", "mt" # HANGUL JONGSEONG MIEUM + CHOSEONG THIEUTH
|
263
|
+
sub "ᆷᄑ", "mp" # HANGUL JONGSEONG MIEUM + CHOSEONG PHIEUPH
|
264
|
+
sub "ᆷᄒ", "mh" # HANGUL JONGSEONG MIEUM + CHOSEONG HIEUH
|
265
|
+
sub "ᆷᄁ", "mkk" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGKIYEOK
|
266
|
+
sub "ᆷᄄ", "mtt" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGTIEUT
|
267
|
+
sub "ᆷᄈ", "mpp" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGPIEUP
|
268
|
+
sub "ᆷᄊ", "mss" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGSIOS
|
269
|
+
sub "ᆷᄍ", "mjj" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGCIEUC
|
270
|
+
sub "ᆸᄀ", "pg" # HANGUL JONGSEONG PIEUP + CHOSEONG KIYEOK
|
271
|
+
sub "ᆸᄂ", "mn" # HANGUL JONGSEONG PIEUP + CHOSEONG NIEUN
|
272
|
+
sub "ᆸᄃ", "pd" # HANGUL JONGSEONG PIEUP + CHOSEONG TIEUT
|
273
|
+
sub "ᆸᄅ", "mn" # HANGUL JONGSEONG PIEUP + CHOSEONG RIEUL
|
274
|
+
sub "ᆸᄆ", "mm" # HANGUL JONGSEONG PIEUP + CHOSEONG MIEUM
|
275
|
+
sub "ᆸᄇ", "pb" # HANGUL JONGSEONG PIEUP + CHOSEONG PIEUP
|
276
|
+
sub "ᆸᄉ", "ps" # HANGUL JONGSEONG PIEUP + CHOSEONG SIOS
|
277
|
+
sub "ᆸᄋ", "b" # HANGUL JONGSEONG PIEUP + CHOSEONG IEUNG
|
278
|
+
sub "ᆸᄌ", "pj" # HANGUL JONGSEONG PIEUP + CHOSEONG CIEUC
|
279
|
+
sub "ᆸᄎ", "pch" # HANGUL JONGSEONG PIEUP + CHOSEONG CHIEUCH
|
280
|
+
sub "ᆸᄏ", "pk" # HANGUL JONGSEONG PIEUP + CHOSEONG KHIEUKH
|
281
|
+
sub "ᆸᄐ", "pt" # HANGUL JONGSEONG PIEUP + CHOSEONG THIEUTH
|
282
|
+
sub "ᆸᄑ", "pp" # HANGUL JONGSEONG PIEUP + CHOSEONG PHIEUPH
|
283
|
+
sub "ᆸᄒ", "ph" # HANGUL JONGSEONG PIEUP + CHOSEONG HIEUH
|
284
|
+
sub "ᆸᄁ", "pkk" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGKIYEOK
|
285
|
+
sub "ᆸᄄ", "ptt" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGTIEUT
|
286
|
+
sub "ᆸᄈ", "ppp" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGPIEUP
|
287
|
+
sub "ᆸᄊ", "pss" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGSIOS
|
288
|
+
sub "ᆸᄍ", "pjj" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGCIEUC
|
289
|
+
sub "ᆺᄀ", "tg" # HANGUL JONGSEONG SIOS + CHOSEONG KIYEOK
|
290
|
+
sub "ᆺᄂ", "nn" # HANGUL JONGSEONG SIOS + CHOSEONG NIEUN
|
291
|
+
sub "ᆺᄃ", "td" # HANGUL JONGSEONG SIOS + CHOSEONG TIEUT
|
292
|
+
sub "ᆺᄅ", "nn" # HANGUL JONGSEONG SIOS + CHOSEONG RIEUL
|
293
|
+
sub "ᆺᄆ", "nm" # HANGUL JONGSEONG SIOS + CHOSEONG MIEUM
|
294
|
+
sub "ᆺᄇ", "tb" # HANGUL JONGSEONG SIOS + CHOSEONG PIEUP
|
295
|
+
sub "ᆺᄉ", "ts" # HANGUL JONGSEONG SIOS + CHOSEONG SIOS
|
296
|
+
sub "ᆺᄋ", "s" # HANGUL JONGSEONG SIOS + CHOSEONG IEUNG
|
297
|
+
sub "ᆺᄌ", "tj" # HANGUL JONGSEONG SIOS + CHOSEONG CIEUC
|
298
|
+
sub "ᆺᄎ", "tch" # HANGUL JONGSEONG SIOS + CHOSEONG CHIEUCH
|
299
|
+
sub "ᆺᄏ", "tk" # HANGUL JONGSEONG SIOS + CHOSEONG KHIEUKH
|
300
|
+
sub "ᆺᄐ", "tt" # HANGUL JONGSEONG SIOS + CHOSEONG THIEUTH
|
301
|
+
sub "ᆺᄑ", "tp" # HANGUL JONGSEONG SIOS + CHOSEONG PHIEUPH
|
302
|
+
sub "ᆺᄒ", "th" # HANGUL JONGSEONG SIOS + CHOSEONG HIEUH
|
303
|
+
sub "ᆺᄁ", "tkk" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGKIYEOK
|
304
|
+
sub "ᆺᄄ", "ttt" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGTIEUT
|
305
|
+
sub "ᆺᄈ", "tpp" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGPIEUP
|
306
|
+
sub "ᆺᄊ", "tss" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGSIOS
|
307
|
+
sub "ᆺᄍ", "tjj" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGCIEUC
|
308
|
+
sub "ᆼᄀ", "ngg" # HANGUL JONGSEONG IEUNG + CHOSEONG KIYEOK
|
309
|
+
sub "ᆼᄂ", "ngn" # HANGUL JONGSEONG IEUNG + CHOSEONG NIEUN
|
310
|
+
sub "ᆼᄃ", "ngd" # HANGUL JONGSEONG IEUNG + CHOSEONG TIEUT
|
311
|
+
sub "ᆼᄅ", "ngn" # HANGUL JONGSEONG IEUNG + CHOSEONG RIEUL
|
312
|
+
sub "ᆼᄆ", "ngm" # HANGUL JONGSEONG IEUNG + CHOSEONG MIEUM
|
313
|
+
sub "ᆼᄇ", "ngb" # HANGUL JONGSEONG IEUNG + CHOSEONG PIEUP
|
314
|
+
sub "ᆼᄉ", "ngs" # HANGUL JONGSEONG IEUNG + CHOSEONG SIOS
|
315
|
+
sub "ᆼᄋ", "ng" # HANGUL JONGSEONG IEUNG + CHOSEONG IEUNG
|
316
|
+
sub "ᆼᄌ", "ngj" # HANGUL JONGSEONG IEUNG + CHOSEONG CIEUC
|
317
|
+
sub "ᆼᄎ", "ngch" # HANGUL JONGSEONG IEUNG + CHOSEONG CHIEUCH
|
318
|
+
sub "ᆼᄏ", "ngk" # HANGUL JONGSEONG IEUNG + CHOSEONG KHIEUKH
|
319
|
+
sub "ᆼᄐ", "ngt" # HANGUL JONGSEONG IEUNG + CHOSEONG THIEUTH
|
320
|
+
sub "ᆼᄑ", "ngp" # HANGUL JONGSEONG IEUNG + CHOSEONG PHIEUPH
|
321
|
+
sub "ᆼᄒ", "ngh" # HANGUL JONGSEONG IEUNG + CHOSEONG HIEUH
|
322
|
+
sub "ᆼᄁ", "ngkk" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGKIYEOK
|
323
|
+
sub "ᆼᄄ", "ngtt" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGTIEUT
|
324
|
+
sub "ᆼᄈ", "ngpp" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGPIEUP
|
325
|
+
sub "ᆼᄊ", "ngss" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGSIOS
|
326
|
+
sub "ᆼᄍ", "ngjj" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGCIEUC
|
327
|
+
}
|
328
|
+
|
329
|
+
sub "ᄀ", "g", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG KIYEOK
|
330
|
+
sub "ᄂ", "n", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG NIEUN
|
331
|
+
sub "ᄃ", "d", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG TIEUT
|
332
|
+
sub "ᄅ", "r", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG RIEUL
|
333
|
+
sub "ᄆ", "m", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG MIEUM
|
334
|
+
sub "ᄇ", "b", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG PIEUP
|
335
|
+
sub "ᄉ", "s", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG SIOS
|
336
|
+
sub "ᄋ", "", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG IEUNG
|
337
|
+
sub "ᄌ", "j", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG CIEUC
|
338
|
+
sub "ᄎ", "ch", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG CHIEUCH
|
339
|
+
sub "ᄏ", "k", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG KHIEUKH
|
340
|
+
sub "ᄐ", "t", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG THIEUTH
|
341
|
+
sub "ᄑ", "p", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG PHIEUPH
|
342
|
+
sub "ᄒ", "h", before: any([alpha, digit, jamo_vowel, "-"]) # VOWEL + CHOSEONG HIEUH
|
343
|
+
sub "ᄁ", "kk", before: any([alpha, digit, jamo_vowel]) # VOWEL + CHOSEONG SSANGKIYEOK
|
344
|
+
sub "ᄄ", "tt", before: any([alpha, digit, jamo_vowel]) # VOWEL + CHOSEONG SSANGTIEUT
|
345
|
+
sub "ᄈ", "pp", before: any([alpha, digit, jamo_vowel]) # VOWEL + CHOSEONG SSANGPIEUP
|
346
|
+
sub "ᄊ", "ss", before: any([alpha, digit, jamo_vowel]) # VOWEL + CHOSEONG SSANGSIOS
|
347
|
+
sub "ᄍ", "jj", before: any([alpha, digit, jamo_vowel]) # VOWEL + CHOSEONG SSANGCIEUC
|
348
|
+
parallel {
|
349
|
+
sub "ᆰᄀ", "lg" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG KIYEOK
|
350
|
+
sub "ᆰᄂ", "ngn" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG NIEUN
|
351
|
+
sub "ᆰᄃ", "kd" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG TIEUT
|
352
|
+
sub "ᆰᄅ", "ngn" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG RIEUL
|
353
|
+
sub "ᆰᄆ", "ngm" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG MIEUM
|
354
|
+
sub "ᆰᄇ", "kb" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG PIEUP
|
355
|
+
sub "ᆰᄉ", "ks" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SIOS
|
356
|
+
sub "ᆰᄋ", "lg" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG IEUNG
|
357
|
+
sub "ᆰᄌ", "kj" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG CIEUC
|
358
|
+
sub "ᆰᄎ", "kch" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG CHIEUCH
|
359
|
+
sub "ᆰᄏ", "lk" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG KHIEUKH
|
360
|
+
sub "ᆰᄐ", "kt" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG THIEUTH
|
361
|
+
sub "ᆰᄑ", "kp" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG PHIEUPH
|
362
|
+
sub "ᆰᄒ", "lk" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG HIEUH
|
363
|
+
sub "ᆰᄁ", "lkk" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGKIYEOK
|
364
|
+
sub "ᆰᄄ", "ktt" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGTIEUT
|
365
|
+
sub "ᆰᄈ", "kpp" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGPIEUP
|
366
|
+
sub "ᆰᄊ", "kss" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGSIOS
|
367
|
+
sub "ᆰᄍ", "kjj" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGCIEUC
|
368
|
+
sub "ᆱᄀ", "mg" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG KIYEOK
|
369
|
+
sub "ᆱᄂ", "mn" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG NIEUN
|
370
|
+
sub "ᆱᄃ", "md" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG TIEUT
|
371
|
+
sub "ᆱᄅ", "mn" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG RIEUL
|
372
|
+
sub "ᆱᄆ", "lm" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG MIEUM
|
373
|
+
sub "ᆱᄇ", "mb" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG PIEUP
|
374
|
+
sub "ᆱᄉ", "ms" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SIOS
|
375
|
+
sub "ᆱᄋ", "lm" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG IEUNG
|
376
|
+
sub "ᆱᄌ", "mj" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG CIEUC
|
377
|
+
sub "ᆱᄎ", "mch" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG CHIEUCH
|
378
|
+
sub "ᆱᄏ", "mk" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG KHIEUKH
|
379
|
+
sub "ᆱᄐ", "mt" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG THIEUTH
|
380
|
+
sub "ᆱᄑ", "mp" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG PHIEUPH
|
381
|
+
sub "ᆱᄒ", "mh" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG HIEUH
|
382
|
+
sub "ᆱᄁ", "mkk" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGKIYEOK
|
383
|
+
sub "ᆱᄄ", "mtt" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGTIEUT
|
384
|
+
sub "ᆱᄈ", "mpp" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGPIEUP
|
385
|
+
sub "ᆱᄊ", "mss" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGSIOS
|
386
|
+
sub "ᆱᄍ", "mjj" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGCIEUC
|
387
|
+
sub "ᆲᄀ", "pg" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG KIYEOK
|
388
|
+
sub "ᆲᄂ", "mn" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG NIEUN
|
389
|
+
sub "ᆲᄃ", "pd" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG TIEUT
|
390
|
+
sub "ᆲᄅ", "mn" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG RIEUL
|
391
|
+
sub "ᆲᄆ", "mm" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG MIEUM
|
392
|
+
sub "ᆲᄇ", "lb" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG PIEUP
|
393
|
+
sub "ᆲᄉ", "ps" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SIOS
|
394
|
+
sub "ᆲᄋ", "lb" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG IEUNG
|
395
|
+
sub "ᆲᄌ", "pj" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG CIEUC
|
396
|
+
sub "ᆲᄎ", "pch" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG CHIEUCH
|
397
|
+
sub "ᆲᄏ", "pk" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG KHIEUKH
|
398
|
+
sub "ᆲᄐ", "pt" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG THIEUTH
|
399
|
+
sub "ᆲᄑ", "lp" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG PHIEUPH
|
400
|
+
sub "ᆲᄒ", "lp" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG HIEUH
|
401
|
+
sub "ᆲᄁ", "pkk" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGKIYEOK
|
402
|
+
sub "ᆲᄄ", "ptt" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGTIEUT
|
403
|
+
sub "ᆲᄈ", "lpp" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGPIEUP
|
404
|
+
sub "ᆲᄊ", "pss" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGSIOS
|
405
|
+
sub "ᆲᄍ", "pjj" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGCIEUC
|
406
|
+
}
|
407
|
+
sub "ᄀ", "g", before: space # HANGUL CHOSEONG KIYEOK
|
408
|
+
sub "ᄂ", "n", before: space # HANGUL CHOSEONG NIEUN
|
409
|
+
sub "ᄃ", "d", before: space # HANGUL CHOSEONG TIEUT
|
410
|
+
sub "ᄅ", "", before: space, after: any("ᅣᅤᅧᅨᅭᅲ") # HANGUL CHOSEONG RIEUL # R-onset rule
|
411
|
+
sub "ᄅ", "n", before: space # HANGUL CHOSEONG RIEUL
|
412
|
+
sub "ᄆ", "m", before: space # HANGUL CHOSEONG MIEUM
|
413
|
+
sub "ᄇ", "b", before: space # HANGUL CHOSEONG PIEUP
|
414
|
+
sub "ᄉ", "s", before: space # HANGUL CHOSEONG SIOS
|
415
|
+
sub "ᄋ", "", before: space # HANGUL CHOSEONG IEUNG
|
416
|
+
sub "ᄌ", "j", before: space # HANGUL CHOSEONG CIEUC
|
417
|
+
sub "ᄎ", "ch", before: space # HANGUL CHOSEONG CHIEUCH
|
418
|
+
sub "ᄏ", "k", before: space # HANGUL CHOSEONG KHIEUKH
|
419
|
+
sub "ᄐ", "t", before: space # HANGUL CHOSEONG THIEUTH
|
420
|
+
sub "ᄑ", "p", before: space # HANGUL CHOSEONG PHIEUPH
|
421
|
+
sub "ᄒ", "h", before: space # HANGUL CHOSEONG HIEUH
|
422
|
+
sub "ᄁ", "kk", before: space # HANGUL CHOSEONG SSANGKIYEOK
|
423
|
+
sub "ᄭ", "kk", before: space # HANGUL CHOSEONG SIOS-KIYEOK
|
424
|
+
sub "ᄄ", "tt", before: space # HANGUL CHOSEONG SSANGTIEUT
|
425
|
+
sub "ᄯ", "tt", before: space # HANGUL CHOSEONG SIOS-TIEUT
|
426
|
+
sub "ᄈ", "pp", before: space # HANGUL CHOSEONG SSANGPIEUP
|
427
|
+
sub "ᄲ", "pp", before: space # HANGUL CHOSEONG SIOS-PIEUP
|
428
|
+
sub "ᄊ", "ss", before: space # HANGUL CHOSEONG SSANGSIOS
|
429
|
+
sub "ᄍ", "jj", before: space # HANGUL CHOSEONG SSANGCIEUC
|
430
|
+
sub "ᄶ", "jj", before: space # HANGUL CHOSEONG SIOS-CIEUC
|
431
|
+
parallel {
|
432
|
+
sub "ᅡ", "a" # HANGUL JUNGSEONG A
|
433
|
+
sub "ᅣ", "ya" # HANGUL JUNGSEONG YA
|
434
|
+
sub "ᅥ", "eo" # HANGUL JUNGSEONG EO
|
435
|
+
sub "ᅧ", "yeo" # HANGUL JUNGSEONG YEO
|
436
|
+
sub "ᅩ", "o" # HANGUL JUNGSEONG O
|
437
|
+
sub "ᅭ", "yo" # HANGUL JUNGSEONG YO
|
438
|
+
sub "ᅮ", "u" # HANGUL JUNGSEONG U
|
439
|
+
sub "ᅲ", "yu" # HANGUL JUNGSEONG YU
|
440
|
+
sub "ᅳ", "eu" # HANGUL JUNGSEONG EU
|
441
|
+
sub "ᅵ", "i" # HANGUL JUNGSEONG I
|
442
|
+
sub "ᅢ", "ae" # HANGUL JUNGSEONG AE
|
443
|
+
sub "ᅤ", "yae" # HANGUL JUNGSEONG YAE
|
444
|
+
sub "ᅦ", "e" # HANGUL JUNGSEONG E
|
445
|
+
sub "ᅨ", "ye" # HANGUL JUNGSEONG YE
|
446
|
+
sub "ᅬ", "oe" # HANGUL JUNGSEONG OE
|
447
|
+
sub "ᅱ", "wi" # HANGUL JUNGSEONG WI
|
448
|
+
sub "ᅴ", "ui" # HANGUL JUNGSEONG YI
|
449
|
+
sub "ᅪ", "wa" # HANGUL JUNGSEONG WA
|
450
|
+
sub "ᅯ", "wo" # HANGUL JUNGSEONG WEO
|
451
|
+
sub "ᅫ", "wae" # HANGUL JUNGSEONG WAE
|
452
|
+
sub "ᅰ", "we" # HANGUL JUNGSEONG WE
|
453
|
+
}
|
454
|
+
sub "ᆨ", "k", after: any([space,"-"]) # HANGUL JONGSEONG KIYEOK
|
455
|
+
sub "ᆫ", "n", after: any([space,"-"]) # HANGUL JONGSEONG NIEUN
|
456
|
+
sub "ᆮ", "t", after: any([space,"-"]) # HANGUL JONGSEONG TIEUT
|
457
|
+
sub "ᆯ", "l", after: any([space,"-"]) # HANGUL JONGSEONG RIEUL
|
458
|
+
sub "ᆷ", "m", after: any([space,"-"]) # HANGUL JONGSEONG MIEUM
|
459
|
+
sub "ᆸ", "p", after: any([space,"-"]) # HANGUL JONGSEONG PIEUP
|
460
|
+
sub "ᆺ", "t", after: any([space,"-"]) # HANGUL JONGSEONG SIOS
|
461
|
+
sub "ᆼ", "ng", after: any([space,"-"]) # HANGUL JONGSEONG IEUNG
|
462
|
+
sub "ᆽ", "t", after: any([space,"-"]) # HANGUL JONGSEONG CIEUC
|
463
|
+
sub "ᆾ", "t", after: any([space,"-"]) # HANGUL JONGSEONG CHIEUCH
|
464
|
+
sub "ᆿ", "k", after: any([space,"-"]) # HANGUL JONGSEONG KHIEUKH
|
465
|
+
sub "ᇀ", "t", after: any([space,"-"]) # HANGUL JONGSEONG THIEUTH
|
466
|
+
sub "ᇁ", "p", after: any([space,"-"]) # HANGUL JONGSEONG PHIEUPH
|
467
|
+
sub "ᆰ", "k", after: any([space,"-"]) # HANGUL JONGSEONG RIEUL-KIYEOK
|
468
|
+
sub "ᆲ", "p", after: any([space,"-"]) # HANGUL JONGSEONG RIEUL-PIEUP
|
469
|
+
|
470
|
+
# Remove the spaces that were added at the start and end of the line
|
471
|
+
sub line_start + space, none
|
472
|
+
sub space + line_end, none
|
473
|
+
|
474
|
+
title_case
|
475
|
+
}
|