interscript-maps 2.0.5
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/README.adoc +28 -0
- data/interscript-maps.gemspec +28 -0
- data/interscript-maps.yaml +235 -0
- data/libs/posix.iml +11 -0
- data/libs/unicode.iml +13 -0
- data/libs/var-Cyrl.iml +7 -0
- data/libs/var-kor.iml +17 -0
- data/maps-staging/royin-tha-Thai-Latn-1939-generic.imp +98 -0
- data/maps-staging/royin-tha-Thai-Latn-1968.imp +156 -0
- data/maps-staging/royin-tha-Thai-Latn-1999-chained.imp +161 -0
- data/maps-staging/royin-tha-Thai-Latn-1999.imp +78 -0
- data/maps-staging/var-tha-Thai-Thai-phonemic.imp +53 -0
- data/maps-staging/var-tha-Thai-Zsym-ipa.imp +273 -0
- data/maps/acadsin-zho-Hani-Latn-2002.imp +27515 -0
- data/maps/alalc-amh-Ethi-Latn-1997.imp +392 -0
- data/maps/alalc-amh-Ethi-Latn-2011.imp +85 -0
- data/maps/alalc-ara-Arab-Latn-1997.imp +1171 -0
- data/maps/alalc-asm-Deva-Latn-1997.imp +214 -0
- data/maps/alalc-asm-Deva-Latn-2012.imp +53 -0
- data/maps/alalc-aze-Arab-Latn-1997.imp +321 -0
- data/maps/alalc-aze-Cyrl-Latn-1997.imp +101 -0
- data/maps/alalc-bel-Cyrl-Latn-1997.imp +118 -0
- data/maps/alalc-ben-Beng-Latn-1997.imp +225 -0
- data/maps/alalc-ben-Beng-Latn-2017.imp +135 -0
- data/maps/alalc-bul-Cyrl-Latn-1997.imp +110 -0
- data/maps/alalc-div-Thaa-Latn-1997.imp +171 -0
- data/maps/alalc-ell-Grek-Latn-1997.imp +381 -0
- data/maps/alalc-ell-Grek-Latn-2010.imp +382 -0
- data/maps/alalc-guj-Gujr-Latn-1997.imp +223 -0
- data/maps/alalc-guj-Gujr-Latn-2011.imp +57 -0
- data/maps/alalc-hin-Deva-Latn-1997.imp +248 -0
- data/maps/alalc-hin-Deva-Latn-2011.imp +63 -0
- data/maps/alalc-kan-Kana-Latn-1997.imp +233 -0
- data/maps/alalc-kan-Kana-Latn-2011.imp +58 -0
- data/maps/alalc-kat-Geok-Latn-1997.imp +109 -0
- data/maps/alalc-kat-Geor-Latn-1997.imp +104 -0
- data/maps/alalc-kor-Hang-Latn-1997.imp +68 -0
- data/maps/alalc-mal-Mlym-Latn-1997.imp +260 -0
- data/maps/alalc-mal-Mlym-Latn-2012.imp +65 -0
- data/maps/alalc-mar-Deva-Latn-1997.imp +178 -0
- data/maps/alalc-mar-Deva-Latn-2011.imp +51 -0
- data/maps/alalc-mkd-Cyrl-Latn-1997.imp +125 -0
- data/maps/alalc-mkd-Cyrl-Latn-2013.imp +113 -0
- data/maps/alalc-mon-Cyrl-Latn-1997.imp +161 -0
- data/maps/alalc-ori-Orya-Latn-1997.imp +234 -0
- data/maps/alalc-ori-Orya-Latn-2011.imp +59 -0
- data/maps/alalc-pan-Guru-Latn-1997.imp +241 -0
- data/maps/alalc-pan-Guru-Latn-2011.imp +71 -0
- data/maps/alalc-per-Arab-Latn-1997.imp +318 -0
- data/maps/alalc-pli-Deva-Latn-2012.imp +140 -0
- data/maps/alalc-pra-Deva-Latn-2012.imp +52 -0
- data/maps/alalc-rus-Cyrl-Latn-1997.imp +165 -0
- data/maps/alalc-rus-Cyrl-Latn-2012.imp +107 -0
- data/maps/alalc-san-Deva-Latn-2012.imp +207 -0
- data/maps/alalc-sin-Sinh-Latn-1997.imp +246 -0
- data/maps/alalc-sin-Sinh-Latn-2011.imp +63 -0
- data/maps/alalc-srp-Cyrl-Latn-1997.imp +124 -0
- data/maps/alalc-srp-Cyrl-Latn-2013.imp +115 -0
- data/maps/alalc-tam-Taml-Latn-1997.imp +52 -0
- data/maps/alalc-tam-Taml-Latn-2011.imp +49 -0
- data/maps/alalc-tel-Telu-Latn-1997.imp +237 -0
- data/maps/alalc-tel-Telu-Latn-2011.imp +58 -0
- data/maps/alalc-ukr-Cyrl-Latn-1997.imp +123 -0
- data/maps/alalc-ukr-Cyrl-Latn-2011.imp +32 -0
- data/maps/apcbg-bul-Cyrl-Latn-1995.imp +194 -0
- data/maps/az-aze-Cyrl-Latn-1939.imp +105 -0
- data/maps/az-aze-Cyrl-Latn-1958.imp +50 -0
- data/maps/bas-rus-Cyrl-Latn-2017-bss.imp +160 -0
- data/maps/bas-rus-Cyrl-Latn-2017-oss.imp +165 -0
- data/maps/bgn-jpn-Hrkt-Latn-1962.imp +288 -0
- data/maps/bgn-kor-Hang-Latn-1943.imp +31 -0
- data/maps/bgn-kor-Kore-Latn-1943.imp +33 -0
- data/maps/bgna-bul-Cyrl-Latn-2006.imp +119 -0
- data/maps/bgna-bul-Cyrl-Latn-2009.imp +119 -0
- data/maps/bgnpcgn-amh-Ethi-Latn-1967.imp +393 -0
- data/maps/bgnpcgn-ara-Arab-Latn-1956.imp +472 -0
- data/maps/bgnpcgn-arm-Armn-Latn-1981.imp +125 -0
- data/maps/bgnpcgn-aze-Cyrl-Latn-1993.imp +111 -0
- data/maps/bgnpcgn-bak-Cyrl-Latn-2007.imp +169 -0
- data/maps/bgnpcgn-bal-Arab-Latn-2008.imp +296 -0
- data/maps/bgnpcgn-bel-Cyrl-Latn-1979.imp +200 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-1952.imp +137 -0
- data/maps/bgnpcgn-bul-Cyrl-Latn-2013.imp +38 -0
- data/maps/bgnpcgn-che-Cyrl-Latn-2008.imp +176 -0
- data/maps/bgnpcgn-deu-Latn-Latn-2000.imp +56 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1972.imp +90 -0
- data/maps/bgnpcgn-div-Thaa-Latn-1988.imp +71 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1962.imp +443 -0
- data/maps/bgnpcgn-ell-Grek-Latn-1996.imp +269 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1964.imp +41 -0
- data/maps/bgnpcgn-fao-Latn-Latn-1968.imp +28 -0
- data/maps/bgnpcgn-fas-Arab-Latn-1956.imp +111 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1964.imp +42 -0
- data/maps/bgnpcgn-isl-Latn-Latn-1968.imp +32 -0
- data/maps/bgnpcgn-jpn-Hrkt-Latn-1976.imp +191 -0
- data/maps/bgnpcgn-kat-Geor-Latn-1981.imp +116 -0
- data/maps/bgnpcgn-kat-Geor-Latn-2009.imp +43 -0
- data/maps/bgnpcgn-kaz-Cyrl-Latn-1979.imp +193 -0
- data/maps/bgnpcgn-kir-Cyrl-Latn-1979.imp +170 -0
- data/maps/bgnpcgn-kor-Hang-Latn-kn-1945.imp +177 -0
- data/maps/bgnpcgn-kor-Hang-Latn-rok-2011.imp +40 -0
- data/maps/bgnpcgn-kor-Kore-Latn-rok-2011.imp +41 -0
- data/maps/bgnpcgn-kur-Arab-Latn-2007.imp +240 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-1981.imp +132 -0
- data/maps/bgnpcgn-mkd-Cyrl-Latn-2013.imp +174 -0
- data/maps/bgnpcgn-mon-Cyrl-Latn-1964.imp +168 -0
- data/maps/bgnpcgn-nep-Deva-Latn-2011.imp +208 -0
- data/maps/bgnpcgn-per-Arab-Latn-1958.imp +312 -0
- data/maps/bgnpcgn-prs-Arab-Latn-2007.imp +552 -0
- data/maps/bgnpcgn-prs-Arab-Latn-yaghoubi.imp +445 -0
- data/maps/bgnpcgn-pus-Arab-Latn-1968.imp +289 -0
- data/maps/bgnpcgn-ron-cyrl-latn-2002.imp +165 -0
- data/maps/bgnpcgn-rue-Cyrl-Latn-2016.imp +133 -0
- data/maps/bgnpcgn-rus-Cyrl-Latn-1947.imp +195 -0
- data/maps/bgnpcgn-sme-Latn-Latn-1984.imp +48 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-1962.imp +55 -0
- data/maps/bgnpcgn-srp-Cyrl-Latn-2005.imp +146 -0
- data/maps/bgnpcgn-tat-Cyrl-Latn-2007.imp +185 -0
- data/maps/bgnpcgn-tgk-Cyrl-Latn-1994.imp +188 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-1965.imp +136 -0
- data/maps/bgnpcgn-ukr-Cyrl-Latn-2019.imp +88 -0
- data/maps/bgnpcgn-urd-Arab-Latn-2007.imp +333 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-1979.imp +145 -0
- data/maps/bgnpcgn-uzb-Cyrl-Latn-2000.imp +74 -0
- data/maps/bgnpcgn-zho-Hans-Latn-1979.imp +7463 -0
- data/maps/bis-asm-Beng-Latn-13194-1991.imp +154 -0
- data/maps/bis-ben-Beng-Latn-13194-1991.imp +151 -0
- data/maps/bis-dev-Deva-Latn-13194-1991.imp +178 -0
- data/maps/bis-guj-Gujr-Latn-13194-1991.imp +172 -0
- data/maps/bis-kan-Kana-Latn-13194-1991.imp +166 -0
- data/maps/bis-mlm-Mlym-Latn-13194-1991.imp +170 -0
- data/maps/bis-ori-Orya-Latn-13194-1991.imp +168 -0
- data/maps/bis-pnj-Guru-Latn-13194-1991.imp +169 -0
- data/maps/bis-tel-Telu-Latn-13194-1991.imp +165 -0
- data/maps/bis-tml-Taml-Latn-13194-1991.imp +149 -0
- data/maps/by-bel-Cyrl-Latn-1998.imp +123 -0
- data/maps/by-bel-Cyrl-Latn-2007.imp +77 -0
- data/maps/din-grc-Grek-Latn-31634-2011-t1.imp +627 -0
- data/maps/din-hin-Deva-Latn-33904-2018.imp +101 -0
- data/maps/din-kat-Geor-Latn-32707-2010.imp +103 -0
- data/maps/din-mar-Deva-Latn-33904-2018.imp +83 -0
- data/maps/din-nep-Deva-Latn-33904-2018.imp +110 -0
- data/maps/din-pli-Deva-Latn-33904-2018.imp +72 -0
- data/maps/din-pra-Deva-Latn-33904-2018.imp +66 -0
- data/maps/din-san-Deva-Latn-33904-2018.imp +294 -0
- data/maps/din-tam-Taml-Latn-33903-2016.imp +187 -0
- data/maps/dos-nep-Deva-Latn-1997.imp +47 -0
- data/maps/elot-ell-Grek-Latn-743-1982-tl.imp +399 -0
- data/maps/elot-ell-Grek-Latn-743-1982-ts.imp +397 -0
- data/maps/elot-ell-Grek-Latn-743-2001-tl.imp +34 -0
- data/maps/elot-ell-Grek-Latn-743-2001-ts.imp +178 -0
- data/maps/ggg-kat-Geor-Latn-2002.imp +75 -0
- data/maps/gki-bel-Cyrl-Latn-1992.imp +44 -0
- data/maps/gki-bel-Cyrl-Latn-2000.imp +159 -0
- data/maps/gost-rus-Cyrl-Latn-16876-71-1983.imp +179 -0
- data/maps/gost-rus-Cyrl-Latn-7.79-2000-2002.imp +132 -0
- data/maps/hk-yue-Hani-Latn-1888.imp +29201 -0
- data/maps/icao-bel-Cyrl-Latn-9303.imp +136 -0
- data/maps/icao-bul-Cyrl-Latn-9303.imp +127 -0
- data/maps/icao-fas-Arab-Latn-9303.imp +112 -0
- data/maps/icao-heb-Hebr-Latn-9303.imp +160 -0
- data/maps/icao-mkd-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-rus-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-srp-Cyrl-Latn-9303.imp +126 -0
- data/maps/icao-ukr-Cyrl-Latn-9303.imp +127 -0
- data/maps/iso-ara-Arab-Latn-233-1984.imp +301 -0
- data/maps/iso-asm-Beng-Latn-15919-2001.imp +73 -0
- data/maps/iso-ben-Beng-Latn-15919-2001.imp +171 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t1.imp +365 -0
- data/maps/iso-ell-Grek-Latn-843-1997-t2.imp +43 -0
- data/maps/iso-guj-Gujr-Latn-15919-2001.imp +214 -0
- data/maps/iso-hin-Deva-Latn-15919-2001.imp +73 -0
- data/maps/iso-inc-Deva-Latn-15919-2001.imp +61 -0
- data/maps/iso-jpn-Hrkt-Latn-3602-1989.imp +59 -0
- data/maps/iso-kan-Kana-Latn-15919-2001.imp +212 -0
- data/maps/iso-kat-Geor-Latn-9984-1996.imp +103 -0
- data/maps/iso-kor-Hang-Latn-1996-method1.imp +140 -0
- data/maps/iso-kor-Hang-Latn-1996-method2.imp +132 -0
- data/maps/iso-mal-Mlym-Latn-15919-2001.imp +276 -0
- data/maps/iso-mar-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-nep-Deva-Latn-15919-2001.imp +75 -0
- data/maps/iso-ori-Orya-Latn-15919-2001.imp +188 -0
- data/maps/iso-pan-Guru-Latn-15919-2001.imp +217 -0
- data/maps/iso-pli-Beng-Latn-15919-2001.imp +66 -0
- data/maps/iso-pli-Deva-Latn-15919-2001.imp +68 -0
- data/maps/iso-pli-Sinh-Latn-15919-2001.imp +211 -0
- data/maps/iso-pli-Thai-Latn-15919-2001.imp +47 -0
- data/maps/iso-pra-Deva-Latn-15919-2001.imp +60 -0
- data/maps/iso-prs-Arab-Latn-233-3-1999.imp +352 -0
- data/maps/iso-rus-Cyrl-Latn-9-1995.imp +279 -0
- data/maps/iso-san-Deva-Latn-15919-2001.imp +215 -0
- data/maps/iso-tam-Taml-Latn-15919-2001.imp +153 -0
- data/maps/iso-tel-Telu-Latn-15919-2001.imp +214 -0
- data/maps/iso-tha-Thai-Latn-11940-1998.imp +114 -0
- data/maps/kp-kor-Hang-Latn-2002.imp +540 -0
- data/maps/lshk-yue-Hani-Latn-jyutping-1993.imp +29005 -0
- data/maps/masm-mon-Cyrl-Latn-5217-2012.imp +136 -0
- data/maps/masm-mon-Latn-Cyrl-5217-2012.imp +162 -0
- data/maps/mext-jpn-Hrkt-Latn-1954.imp +403 -0
- data/maps/moct-kor-Hang-Latn-2000.imp +475 -0
- data/maps/mofa-jpn-Hrkt-Latn-1989.imp +484 -0
- data/maps/mv-div-Thaa-Latn-1987.imp +144 -0
- data/maps/mvd-bel-Cyrl-Latn-2008.imp +224 -0
- data/maps/mvd-bel-Cyrl-Latn-2010.imp +64 -0
- data/maps/mvd-rus-Cyrl-Latn-2008.imp +110 -0
- data/maps/mvd-rus-Cyrl-Latn-2010.imp +40 -0
- data/maps/odni-ara-Arab-Latn-2004.imp +106 -0
- data/maps/odni-ara-Arab-Latn-2015.imp +281 -0
- data/maps/odni-aze-Cyrl-Latn-2015.imp +158 -0
- data/maps/odni-bel-Cyrl-Latn-2015.imp +138 -0
- data/maps/odni-bul-Cyrl-Latn-2005.imp +90 -0
- data/maps/odni-bul-Cyrl-Latn-2015.imp +103 -0
- data/maps/odni-che-Cyrl-Latn-2015.imp +165 -0
- data/maps/odni-fas-Arab-Latn-2004.imp +268 -0
- data/maps/odni-fas-Arab-Latn-2015.imp +398 -0
- data/maps/odni-hin-Deva-Latn-2004.imp +180 -0
- data/maps/odni-hin-Deva-Latn-2015.imp +256 -0
- data/maps/odni-kat-Geor-Latn-2015.imp +76 -0
- data/maps/odni-kaz-Cyrl-Latn-2015.imp +164 -0
- data/maps/odni-kir-Cyrl-Latn-2015.imp +149 -0
- data/maps/odni-kor-Hang-Latn-2015.imp +307 -0
- data/maps/odni-mkd-Cyrl-Latn-2005.imp +28 -0
- data/maps/odni-mkd-Cyrl-Latn-2015.imp +124 -0
- data/maps/odni-prs-Arab-Latn-2004.imp +120 -0
- data/maps/odni-prs-Arab-Latn-2015.imp +225 -0
- data/maps/odni-pus-Arab-Latn-2011.imp +327 -0
- data/maps/odni-rus-Cyrl-Latn-2015.imp +79 -0
- data/maps/odni-srp-Cyrl-Latn-2005.imp +35 -0
- data/maps/odni-srp-Cyrl-Latn-2015.imp +130 -0
- data/maps/odni-tat-Cyrl-Latn-2015.imp +157 -0
- data/maps/odni-tgk-Cyrl-Latn-2015.imp +161 -0
- data/maps/odni-tuk-Cyrl-Latn-2015.imp +159 -0
- data/maps/odni-uig-Cyrl-Latn-2015.imp +151 -0
- data/maps/odni-ukr-Cyrl-Latn-2015.imp +136 -0
- data/maps/odni-urd-Arab-Latn-2015.imp +220 -0
- data/maps/odni-uzb-Cyrl-Latn-2015.imp +165 -0
- data/maps/sac-zho-Hans-Latn-1979.imp +20940 -0
- data/maps/sasm-mon-Mong-Latn-general-1978.imp +294 -0
- data/maps/sasm-mon-Mong-Latn-phonetic-1978.imp +261 -0
- data/maps/ses-ara-Arab-Latn-1930.imp +225 -0
- data/maps/stategeocadastre-ukr-Cyrl-Latn-1993.imp +171 -0
- data/maps/ua-ukr-Cyrl-Latn-1996.imp +149 -0
- data/maps/ua-ukr-Cyrl-Latn-2007.imp +69 -0
- data/maps/ua-ukr-Cyrl-Latn-2010.imp +128 -0
- data/maps/un-amh-Ethi-Latn-2016.imp +483 -0
- data/maps/un-ara-Arab-Latn-1971.imp +137 -0
- data/maps/un-ara-Arab-Latn-1972.imp +155 -0
- data/maps/un-ara-Arab-Latn-2017.imp +375 -0
- data/maps/un-asm-Beng-Latn-1972.imp +188 -0
- data/maps/un-bel-Cyrl-Latn-2007.imp +78 -0
- data/maps/un-ben-Beng-Latn-2016.imp +516 -0
- data/maps/un-ell-Grek-Latn-1987-phonetic.imp +437 -0
- data/maps/un-ell-Grek-Latn-1987-tl.imp +27 -0
- data/maps/un-ell-Grek-Latn-1987-ts.imp +269 -0
- data/maps/un-guj-Gujr-Latn-1972.imp +196 -0
- data/maps/un-hin-Deva-Latn-2016.imp +356 -0
- data/maps/un-kan-Kana-Latn-2016.imp +214 -0
- data/maps/un-mal-Mlym-Latn-1972.imp +215 -0
- data/maps/un-mar-Deva-Latn-2016.imp +96 -0
- data/maps/un-mon-Mong-Latn-general-2013.imp +170 -0
- data/maps/un-mon-Mong-Latn-phonetic-2013.imp +170 -0
- data/maps/un-nep-Deva-Latn-1972.imp +295 -0
- data/maps/un-nep-Deva-Latn-2013.imp +62 -0
- data/maps/un-ori-Orya-Latn-1972.imp +208 -0
- data/maps/un-pan-Guru-Latn-1972.imp +321 -0
- data/maps/un-prs-Arab-Latn-1967.imp +214 -0
- data/maps/un-rus-Cyrl-Latn-1987.imp +96 -0
- data/maps/un-sin-Sinh-Latn-1972.imp +193 -0
- data/maps/un-tam-Taml-Latn-1972.imp +173 -0
- data/maps/un-tel-Telu-Latn-1972.imp +229 -0
- data/maps/un-ukr-Cyrl-Latn-1998.imp +58 -0
- data/maps/un-ukr-Cyrl-Latn-2012.imp +95 -0
- data/maps/un-urd-Arab-Latn-1972.imp +290 -0
- data/maps/var-amh-Ethi-Latn-eae-2003.imp +414 -0
- data/maps/var-gez-Ethi-Latn-eae-2003.imp +54 -0
- data/maps/var-hin-Deva-Latn-hunterian-1872.imp +212 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1886.imp +399 -0
- data/maps/var-jpn-Hrkt-Latn-hepburn-1954.imp +382 -0
- data/maps/var-kor-Hang-Hang-jamo.imp +11196 -0
- data/maps/var-kor-Hang-Latn-mr-1939.imp +574 -0
- data/maps/var-kor-Kore-Hang-2013.imp +59764 -0
- data/maps/var-kor-Kore-Latn-mr-1939.imp +36 -0
- data/maps/var-mar-Deva-Latn-hunterian-1872.imp +39 -0
- data/maps/var-mon-Mong-Latn-1930.imp +101 -0
- data/maps/var-mon-Mong-Latn-lessing.imp +181 -0
- data/maps/var-mon-Mong-Latn-vpmc.imp +182 -0
- data/maps/var-pra-Deva-Latn-iast-1912.imp +36 -0
- data/maps/var-san-Deva-Latn-iast-1912.imp +147 -0
- data/maps/var-zho-Hani-Latn-wd-1979.imp +27549 -0
- metadata +335 -0
@@ -0,0 +1,114 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: iso
|
3
|
+
id: 11940-1998
|
4
|
+
language: iso-639-2:tha
|
5
|
+
source_script: Thai
|
6
|
+
destination_script: Latn
|
7
|
+
name: ISO 11940:1998 Information and documentation -- Transliteration of Thai
|
8
|
+
url: https://www.iso.org/standard/20574.html
|
9
|
+
creation_date: 1998
|
10
|
+
adoption_date:
|
11
|
+
description:
|
12
|
+
|
13
|
+
notes:
|
14
|
+
}
|
15
|
+
|
16
|
+
tests {
|
17
|
+
test "ภาษาไทย", "p̣hās̛̄āịthy"
|
18
|
+
test "เชียงใหม่", "echīyngıh̄m̀"
|
19
|
+
}
|
20
|
+
|
21
|
+
|
22
|
+
stage {
|
23
|
+
|
24
|
+
# CHARACTERS
|
25
|
+
parallel {
|
26
|
+
sub "\u0e01", "k" # ก THAI CHARACTER KO KAI
|
27
|
+
sub "\u0e02", "k̄h" # ข THAI CHARACTER KHO KHAI
|
28
|
+
sub "\u0e03", "ḳ̄h" # ฃ THAI CHARACTER KHO KHUAT
|
29
|
+
sub "\u0e04", "kh" # ค THAI CHARACTER KHO KHWAI
|
30
|
+
sub "\u0e05", "k̛h" # ฅ THAI CHARACTER KHO KHON
|
31
|
+
sub "\u0e06", "ḳh" # ฆ THAI CHARACTER KHO RAKHANG
|
32
|
+
sub "\u0e07", "ng" # ง THAI CHARACTER NGO NGU
|
33
|
+
sub "\u0e08", "c" # จ THAI CHARACTER CHO CHAN
|
34
|
+
sub "\u0e09", "c̄h" # ฉ THAI CHARACTER CHO CHING
|
35
|
+
sub "\u0e0a", "ch" # ช THAI CHARACTER CHO CHANG
|
36
|
+
sub "\u0e0b", "s" # ซ THAI CHARACTER SO SO
|
37
|
+
sub "\u0e0c", "c̣h" # ฌ THAI CHARACTER CHO CHOE
|
38
|
+
sub "\u0e0d", "ỵ" # ญ THAI CHARACTER YO YING
|
39
|
+
sub "\u0e0e", "ḍ" # ฎ THAI CHARACTER DO CHADA
|
40
|
+
sub "\u0e0f", "ṭ" # ฏ THAI CHARACTER TO PATAK
|
41
|
+
sub "\u0e10", "ṭ̄h" # ฐ THAI CHARACTER THO THAN
|
42
|
+
sub "\u0e11", "ṯh" # ฑ THAI CHARACTER THO NANGMONTHO
|
43
|
+
sub "\u0e12", "t̛h" # ฒ THAI CHARACTER THO PHUTHAO
|
44
|
+
sub "\u0e13", "ṇ" # ณ THAI CHARACTER NO NEN
|
45
|
+
sub "\u0e14", "d" # ด THAI CHARACTER DO DEK
|
46
|
+
sub "\u0e15", "t" # ต THAI CHARACTER TO TAO
|
47
|
+
sub "\u0e16", "t̄h" # ถ THAI CHARACTER THO THUNG
|
48
|
+
sub "\u0e17", "th" # ท THAI CHARACTER THO THAHAN
|
49
|
+
sub "\u0e18", "ṭh" # ธ THAI CHARACTER THO THONG
|
50
|
+
sub "\u0e19", "n" # น THAI CHARACTER NO NU
|
51
|
+
sub "\u0e1a", "b" # บ THAI CHARACTER BO BAIMAI
|
52
|
+
sub "\u0e1b", "p" # ป THAI CHARACTER PO PLA
|
53
|
+
sub "\u0e1c", "p̄h" # ผ THAI CHARACTER PHO PHUNG
|
54
|
+
sub "\u0e1d", "f̄" # ฝ THAI CHARACTER FO FA
|
55
|
+
sub "\u0e1e", "ph" # พ THAI CHARACTER PHO PHAN
|
56
|
+
sub "\u0e1f", "f" # ฟ THAI CHARACTER FO FAN
|
57
|
+
sub "\u0e20", "p̣h" # ภ THAI CHARACTER PHO SAMPHAO
|
58
|
+
sub "\u0e21", "m" # ม THAI CHARACTER MO MA
|
59
|
+
sub "\u0e22", "y" # ย THAI CHARACTER YO YAK
|
60
|
+
sub "\u0e23", "r" # ร THAI CHARACTER RO RUA
|
61
|
+
sub "\u0e24", "v" # ฤ THAI CHARACTER RU
|
62
|
+
sub "\u0e25", "l" # ล THAI CHARACTER LO LING
|
63
|
+
sub "\u0e26", "ł" # ฦ THAI CHARACTER LU
|
64
|
+
sub "\u0e27", "w" # ว THAI CHARACTER WO WAEN
|
65
|
+
sub "\u0e28", "ṣ̄" # ศ THAI CHARACTER SO SALA
|
66
|
+
sub "\u0e29", "s̛̄" # ษ THAI CHARACTER SO RUSI
|
67
|
+
sub "\u0e2a", "s̄" # ส THAI CHARACTER SO SUA
|
68
|
+
sub "\u0e2b", "h̄" # ห THAI CHARACTER HO HIP
|
69
|
+
sub "\u0e2c", "ḷ" # ฬ THAI CHARACTER LO CHULA
|
70
|
+
sub "\u0e2d", "x" # อ THAI CHARACTER O ANG
|
71
|
+
sub "\u0e2e", "ḥ" # ฮ THAI CHARACTER HO NOKHUK
|
72
|
+
sub "\u0e2f", "ǂ" # ฯ THAI CHARACTER PAIYANNOI
|
73
|
+
sub "\u0e30", "a" # ะ THAI CHARACTER SARA A
|
74
|
+
sub "\u0e31", "ạ" # ั THAI CHARACTER MAI HAN-AKAT
|
75
|
+
sub "\u0e32", "ā" # า THAI CHARACTER SARA AA
|
76
|
+
sub "\u0e33", "å" # ำ THAI CHARACTER SARA AM
|
77
|
+
sub "\u0e34", "i" # ิ THAI CHARACTER SARA I
|
78
|
+
sub "\u0e35", "ī" # ี THAI CHARACTER SARA II
|
79
|
+
sub "\u0e36", "ụ" # ึ THAI CHARACTER SARA UE
|
80
|
+
sub "\u0e37", "ụ̄" # ื THAI CHARACTER SARA UEE
|
81
|
+
sub "\u0e38", "u" # ุ THAI CHARACTER SARA U
|
82
|
+
sub "\u0e39", "ū" # ู THAI CHARACTER SARA UU
|
83
|
+
sub "\u0e3a", "–̥" # ฺ THAI CHARACTER PHINTHU
|
84
|
+
sub "\u0e40", "e" # เ THAI CHARACTER SARA E
|
85
|
+
sub "\u0e41", "æ" # แ THAI CHARACTER SARA AE
|
86
|
+
sub "\u0e42", "o" # โ THAI CHARACTER SARA O
|
87
|
+
sub "\u0e43", "ı" # ใ THAI CHARACTER SARA AI MAIMUAN
|
88
|
+
sub "\u0e44", "ị" # ไ THAI CHARACTER SARA AI MAIMALAI
|
89
|
+
sub "\u0e45", "ɨ" # ๅ THAI CHARACTER LAKKHANGYAO
|
90
|
+
sub "\u0e46", "«" # ๆ THAI CHARACTER MAIYAMOK
|
91
|
+
sub "\u0e47", "̆" # ็ THAI CHARACTER MAITAIKHU
|
92
|
+
sub "\u0e48", "̀" # ่ THAI CHARACTER MAI EK
|
93
|
+
sub "\u0e49", "̂" # ้ THAI CHARACTER MAI THO
|
94
|
+
sub "\u0e4a", "́" # ๊ THAI CHARACTER MAI TRI
|
95
|
+
sub "\u0e4b", "̌" # ๋ THAI CHARACTER MAI CHATTAWA
|
96
|
+
sub "\u0e4c", "̒" # ์ THAI CHARACTER THANTHAKHAT
|
97
|
+
sub "\u0e4d", "̊" # ํ THAI CHARACTER NIKHAHIT
|
98
|
+
sub "\u0e4e", "~" # ๎ THAI CHARACTER YAMAKKAN
|
99
|
+
sub "\u0e4f", "§" # ๏ THAI CHARACTER FONGMAN
|
100
|
+
sub "\u0e50", "0" # ๐ THAI DIGIT ZERO
|
101
|
+
sub "\u0e51", "1" # ๑ THAI DIGIT ONE
|
102
|
+
sub "\u0e52", "2" # ๒ THAI DIGIT TWO
|
103
|
+
sub "\u0e53", "3" # ๓ THAI DIGIT THREE
|
104
|
+
sub "\u0e54", "4" # ๔ THAI DIGIT FOUR
|
105
|
+
sub "\u0e55", "5" # ๕ THAI DIGIT FIVE
|
106
|
+
sub "\u0e56", "6" # ๖ THAI DIGIT SIX
|
107
|
+
sub "\u0e57", "7" # ๗ THAI DIGIT SEVEN
|
108
|
+
sub "\u0e58", "8" # ๘ THAI DIGIT EIGHT
|
109
|
+
sub "\u0e59", "9" # ๙ THAI DIGIT NINE
|
110
|
+
sub "\u0e5a", "ǁ" # ๚ THAI CHARACTER ANGKHANKHU
|
111
|
+
sub "\u0e5b", "»" # ๛ THAI CHARACTER KHOMUT
|
112
|
+
}
|
113
|
+
compose
|
114
|
+
}
|
@@ -0,0 +1,540 @@
|
|
1
|
+
metadata {
|
2
|
+
authority_id: kp
|
3
|
+
id: 2002
|
4
|
+
language: iso-639-2:kor
|
5
|
+
source_script: Hang
|
6
|
+
destination_script: Latn
|
7
|
+
name: Korean Democratic People's Republic of Korea Korean System (2002)
|
8
|
+
url: https://unstats.un.org/unsd/geoinfo/UNGEGN/docs/8th-uncsgn-docs/inf/8th_UNCSGN_econf.94_INF.72.pdf
|
9
|
+
creation_date:
|
10
|
+
adoption_date:
|
11
|
+
description:
|
12
|
+
|
13
|
+
notes:
|
14
|
+
|
15
|
+
- Here is a list of features that are listed in the guideline but
|
16
|
+
not implemented in this map.
|
17
|
+
|
18
|
+
- Note 3.2
|
19
|
+
The combination n+r is romanized as -ll- only when it is "considered
|
20
|
+
to be longstanding". In this implementation, all n+r will be romanized as
|
21
|
+
-ll- for the sake of simplicity.
|
22
|
+
|
23
|
+
- Note 3.3
|
24
|
+
Sai-siot (Connective ㅅ) is not written out in DPRK Korean, but it is
|
25
|
+
supposed to be romanized. Sai-siot is not predictable.
|
26
|
+
This has not been implemented.
|
27
|
+
|
28
|
+
- Note 4.1
|
29
|
+
Hyphen "may be inserted in case of a possible confusion in pronunciation".
|
30
|
+
Except for the n-g combination, this has not been implemented.
|
31
|
+
|
32
|
+
- Note 4.4
|
33
|
+
Geographical names "may be transliterated or translated". In this map,
|
34
|
+
all names will be transliterated, not translated. Numerals will not be
|
35
|
+
transliterated.
|
36
|
+
|
37
|
+
- Note 4.5
|
38
|
+
Spacing rule for personal names has not been implemented.
|
39
|
+
|
40
|
+
- Note 4.7
|
41
|
+
Optional omission of diacritics and optional simplification of
|
42
|
+
KK, TT, PP, SS, JJ to single letter have not been implemented.
|
43
|
+
}
|
44
|
+
|
45
|
+
tests {
|
46
|
+
# Note1.5
|
47
|
+
test "우리산", "Urisan"
|
48
|
+
# Note2.1
|
49
|
+
test "교구동", "Kyogu-dong"
|
50
|
+
test "초도", "Chodo"
|
51
|
+
test "고비리", "Kobi-ri"
|
52
|
+
test "강동", "Kangdong"
|
53
|
+
test "금교", "Kümgyo"
|
54
|
+
test "칠보산", "Chilbosan"
|
55
|
+
# Note2.2
|
56
|
+
test "곡산", "Koksan"
|
57
|
+
test "갑산", "Kapsan"
|
58
|
+
test "앞산", "Apsan"
|
59
|
+
test "삿갓봉", "Satkatbong"
|
60
|
+
# Note2.3
|
61
|
+
test "울산", "Ulsan"
|
62
|
+
# - source: "은률"
|
63
|
+
# expected: "Ünryul" # This is an exception to note 3.1
|
64
|
+
# Note2.4
|
65
|
+
test "닭섬", "Taksŏm"
|
66
|
+
test "물곬", "Mulkol"
|
67
|
+
test "붉은바위", "Pulgünbawi"
|
68
|
+
test "앉은바위", "Anjünbawi"
|
69
|
+
# Note3.1
|
70
|
+
test "백마산", "Paengmasan"
|
71
|
+
test "꽃마을", "Kkonmaül"
|
72
|
+
test "압록강", "Amrokgang"
|
73
|
+
# Note3.2
|
74
|
+
test "천리마", "Chŏllima"
|
75
|
+
# - source: "한나산" # Typo in the original document
|
76
|
+
test "한라산", "Hallasan"
|
77
|
+
test "전라도", "Jŏlla-do"
|
78
|
+
# Note3.3
|
79
|
+
# - source: "기대산" # ROK: 깃대산
|
80
|
+
# expected: "Kittaesan"
|
81
|
+
# - source: "새별읍" # ROK: 샛별
|
82
|
+
# expected: "Saeppyŏl-üp" # hyphen
|
83
|
+
# - source: "뒤문" # ROK: 뒷문
|
84
|
+
# expected: "Twinmun"
|
85
|
+
# Note4.1 - Separator (OPTIONAL)
|
86
|
+
test "앞-언덕", "Ap-ŏndŏk"
|
87
|
+
test "부억-안골", "Puŏk-angol"
|
88
|
+
test "판교", "Phan-gyo"
|
89
|
+
# - source: "방어동"
|
90
|
+
# expected: "Pang-ŏ-dong"
|
91
|
+
# Note4.2
|
92
|
+
test "평안남도 평성시", "Phyŏngannam-do Phyŏngsŏng-si"
|
93
|
+
# Note4.3
|
94
|
+
test "3.1동", "3.1-dong"
|
95
|
+
# Note4.6
|
96
|
+
test "평양", "Pyongyang"
|
97
|
+
# Fix a problem with a trailing comma
|
98
|
+
test "구현, 글꼴, 문자 배열, 다국어 컴퓨팅.", "Kuhyŏn, Külkkol, Munja Paeyŏl, Tagugŏ Khŏmphyuthing."
|
99
|
+
}
|
100
|
+
|
101
|
+
dependency "unicode", import: true
|
102
|
+
dependency "var-kor-Hang-Hang-jamo", as: hanghang
|
103
|
+
|
104
|
+
|
105
|
+
stage {
|
106
|
+
|
107
|
+
|
108
|
+
# RULES
|
109
|
+
|
110
|
+
# This system does not require transliteration of numerals
|
111
|
+
# convert numbers to space + Hangul
|
112
|
+
# - pattern: "([^0-9 ])(?=[0-9])"
|
113
|
+
# result: "\\1 "
|
114
|
+
# - pattern: "1"
|
115
|
+
# result: "일"
|
116
|
+
# - pattern: "2"
|
117
|
+
# result: "이"
|
118
|
+
# - pattern: "3"
|
119
|
+
# result: "삼"
|
120
|
+
# - pattern: "4"
|
121
|
+
# result: "사"
|
122
|
+
# - pattern: "5"
|
123
|
+
# result: "오"
|
124
|
+
# - pattern: "6"
|
125
|
+
# result: "육"
|
126
|
+
# - pattern: "7"
|
127
|
+
# result: "칠"
|
128
|
+
# - pattern: "8"
|
129
|
+
# result: "팔"
|
130
|
+
# - pattern: "9"
|
131
|
+
# result: "구"
|
132
|
+
|
133
|
+
# Use voiced onset for geographical features
|
134
|
+
# Note 4.3.1
|
135
|
+
sub "산" + capture(any([" ", line_end])), "san" + ref( 1 ), before: any_character + any_character
|
136
|
+
sub "거리" + capture(any([" ", line_end])), "gŏri" + ref( 1 ), before: any_character + any_character
|
137
|
+
sub "고개" + capture(any([" ", line_end])), "gogae" + ref( 1 ), before: any_character + any_character
|
138
|
+
sub "대" + capture(any([" ", line_end])), "dae" + ref( 1 ), before: any_character + any_character
|
139
|
+
sub "봉" + capture(any([" ", line_end])), "bong" + ref( 1 ), before: any_character + any_character
|
140
|
+
sub "교" + capture(any([" ", line_end])), "gyo" + ref( 1 ), before: any_character + any_character
|
141
|
+
sub "골" + capture(any([" ", line_end])), "gol" + ref( 1 ), before: any_character + any_character
|
142
|
+
sub "각" + capture(any([" ", line_end])), "gak" + ref( 1 ), before: any_character + any_character
|
143
|
+
sub "벌" + capture(any([" ", line_end])), "bŏl" + ref( 1 ), before: any_character + any_character
|
144
|
+
sub "관" + capture(any([" ", line_end])), "gwan" + ref( 1 ), before: any_character + any_character
|
145
|
+
sub "곶" + capture(any([" ", line_end])), "got" + ref( 1 ), before: any_character + any_character
|
146
|
+
sub "강" + capture(any([" ", line_end])), "gang" + ref( 1 ), before: any_character + any_character
|
147
|
+
|
148
|
+
# add hyphen in front of generics
|
149
|
+
# Only add hyphen if the name is three syllables or longer
|
150
|
+
sub "도" + capture(any([" ", line_end])), "-do" + ref( 1 ), before: any_character + any_character
|
151
|
+
sub "시" + capture(any([" ", line_end])), "-si" + ref( 1 ), before: any_character + any_character
|
152
|
+
sub "군" + capture(any([" ", line_end])), "-gun" + ref( 1 ), before: any_character + any_character
|
153
|
+
sub "면" + capture(any([" ", line_end])), "-myŏn" + ref( 1 ), before: any_character + any_character
|
154
|
+
sub "리" + capture(any([" ", line_end])), "-ri" + ref( 1 ), before: any_character + any_character
|
155
|
+
sub "동" + capture(any([" ", line_end])), "-dong" + ref( 1 ), before: any_character + any_character
|
156
|
+
sub "구" + capture(any([" ", line_end])), "-gu" + ref( 1 ), before: any_character + any_character
|
157
|
+
sub "구역" + capture(any([" ", line_end])), "-guyŏk" + ref( 1 ), before: any_character + any_character
|
158
|
+
|
159
|
+
# The name Pyongyang will be an exception
|
160
|
+
# Not Phyŏngyang
|
161
|
+
|
162
|
+
sub "평양", "Pyongyang"
|
163
|
+
|
164
|
+
|
165
|
+
run map.hanghang.stage.main
|
166
|
+
|
167
|
+
|
168
|
+
# POSTRULES
|
169
|
+
|
170
|
+
# Add space to the two ends of the string for easier word boundary handling
|
171
|
+
sub line_start, " "
|
172
|
+
sub line_end, " "
|
173
|
+
|
174
|
+
# HANGUL JONGSEONG SSANGKIYEOK
|
175
|
+
sub "ᆩᄋ", "ᆨᄁ"
|
176
|
+
sub "ᆩ", "ᆨ"
|
177
|
+
|
178
|
+
# HANGUL JONGSEONG KIYEOK-SIOS
|
179
|
+
sub "ᆪᄋ", "ᆨᄉ"
|
180
|
+
sub "ᆪ", "ᆨ"
|
181
|
+
|
182
|
+
# HANGUL JONGSEONG NIEUN-CIEUC
|
183
|
+
sub "ᆬᄋ", "ᆫᄌ"
|
184
|
+
sub "ᆬ", "ᆫ"
|
185
|
+
|
186
|
+
# HANGUL JONGSEONG NIEUN-HIEUH
|
187
|
+
sub "ᆭᄀ", "ᆫᄏ"
|
188
|
+
sub "ᆭᄃ", "ᆫᄐ"
|
189
|
+
sub "ᆭᄇ", "ᆫᄑ"
|
190
|
+
sub "ᆭᄌ", "ᆫᄎ"
|
191
|
+
sub "ᆭ", "ᆫ"
|
192
|
+
|
193
|
+
# HANGUL JONGSEONG TIEUT
|
194
|
+
sub "ᆮ", "ᆺ", after: any("ᄀᄁᄂᄃᄄᄅᄆᄇᄈᄉᄊᄌᄍᄎᄏᄐᄑᄒ")
|
195
|
+
|
196
|
+
# HANGUL JONGSEONG RIEUL-SIOS
|
197
|
+
sub "ᆳᄋ", "ᆯᄉ"
|
198
|
+
sub "ᆳ", "ᆯ"
|
199
|
+
|
200
|
+
# HANGUL JONGSEONG RIEUL-THIEUTH
|
201
|
+
sub "ᆴᄋ", "ᆯᄐ"
|
202
|
+
sub "ᆴ", "ᆯ"
|
203
|
+
|
204
|
+
# HANGUL JONGSEONG RIEUL-PHIEUPH
|
205
|
+
sub "ᆵᄋ", "ᆯᄑ"
|
206
|
+
sub "ᆵ", "ᆯ", after: any("ᄃᄄᄐ")
|
207
|
+
sub "ᆵ", "ᄇ"
|
208
|
+
|
209
|
+
# HANGUL JONGSEONG RIEUL-HIEUH
|
210
|
+
sub "ᆶᄀ", "ᆯᄏ"
|
211
|
+
sub "ᆶᄃ", "ᆯᄐ"
|
212
|
+
sub "ᆶᄇ", "ᆯᄑ"
|
213
|
+
sub "ᆶᄌ", "ᆯᄎ"
|
214
|
+
sub "ᆶ", "ᆯ"
|
215
|
+
|
216
|
+
# HANGUL JONGSEONG PIEUP-SIOS
|
217
|
+
sub "ᆹᄋ", "ᄇᄉ"
|
218
|
+
sub "ᆹ", "ᄇ"
|
219
|
+
|
220
|
+
# HANGUL JONGSEONG SSANG-SIOS
|
221
|
+
sub "ᆻᄋ", "ᆺᄊ"
|
222
|
+
sub "ᆻ", "ᆺ"
|
223
|
+
|
224
|
+
# HANGUL JONGSEONG CIEUC
|
225
|
+
sub "ᆽᄋ", "ᆺᄌ"
|
226
|
+
sub "ᆽ", "ᆺ"
|
227
|
+
|
228
|
+
# HANGUL JONGSEONG CHIEUCH
|
229
|
+
sub "ᆾᄋ", "ᆺᄎ"
|
230
|
+
sub "ᆾ", "ᆺ"
|
231
|
+
|
232
|
+
# HANGUL JONGSEONG KHIEUKH
|
233
|
+
sub "ᆿᄋ", "ᆨᄏ"
|
234
|
+
sub "ᆿ", "ᆨ"
|
235
|
+
|
236
|
+
# HANGUL JONGSEONG THIEUTH
|
237
|
+
sub "ᇀᄋ", "ᆺᄐ"
|
238
|
+
sub "ᇀ", "ᆺ"
|
239
|
+
|
240
|
+
# HANGUL JONGSEONG PHIEUPH
|
241
|
+
sub "ᇁᄋ", "ᆸᄑ"
|
242
|
+
sub "ᇁ", "ᆸ"
|
243
|
+
|
244
|
+
# HANGUL JONGSEONG HIEUH
|
245
|
+
sub "ᇂᄀ", "ᄏ"
|
246
|
+
sub "ᇂᄃ", "ᄐ"
|
247
|
+
sub "ᇂᄇ", "ᄑ"
|
248
|
+
sub "ᇂᄌ", "ᄎ"
|
249
|
+
sub "ᇂ", ""
|
250
|
+
|
251
|
+
# CHARACTERS
|
252
|
+
# parallel {
|
253
|
+
# From Unicode Chart
|
254
|
+
# https://github.com/unicode-org/cldr/blob/master/common/transforms/Korean-Latin-BGN.xml
|
255
|
+
parallel {
|
256
|
+
sub "ᆨᄀ", "kk" # HANGUL JONGSEONG KIYEOK + CHOSEONG KIYEOK
|
257
|
+
sub "ᆨᄂ", "ngn" # HANGUL JONGSEONG KIYEOK + CHOSEONG NIEUN
|
258
|
+
sub "ᆨᄃ", "kt" # HANGUL JONGSEONG KIYEOK + CHOSEONG TIEUT
|
259
|
+
sub "ᆨᄅ", "ngn" # HANGUL JONGSEONG KIYEOK + CHOSEONG RIEUL
|
260
|
+
sub "ᆨᄆ", "ngm" # HANGUL JONGSEONG KIYEOK + CHOSEONG MIEUM
|
261
|
+
sub "ᆨᄇ", "kp" # HANGUL JONGSEONG KIYEOK + CHOSEONG PIEUP
|
262
|
+
sub "ᆨᄉ", "ks" # HANGUL JONGSEONG KIYEOK + CHOSEONG SIOS
|
263
|
+
sub "ᆨᄋ", "g" # HANGUL JONGSEONG KIYEOK + CHOSEONG IEUNG
|
264
|
+
sub "ᆨᄌ", "kj" # HANGUL JONGSEONG KIYEOK + CHOSEONG CIEUC
|
265
|
+
sub "ᆨᄎ", "kch" # HANGUL JONGSEONG KIYEOK + CHOSEONG CHIEUCH
|
266
|
+
sub "ᆨᄏ", "kkh" # HANGUL JONGSEONG KIYEOK + CHOSEONG KHIEUKH # NOTE: the dash is always skipped
|
267
|
+
sub "ᆨᄐ", "kth" # HANGUL JONGSEONG KIYEOK + CHOSEONG THIEUTH
|
268
|
+
sub "ᆨᄑ", "kp" # HANGUL JONGSEONG KIYEOK + CHOSEONG PHIEUPH
|
269
|
+
sub "ᆨᄒ", "kh" # HANGUL JONGSEONG KIYEOK + CHOSEONG HIEUH
|
270
|
+
sub "ᆨᄁ", "kkk" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGKIYEOK
|
271
|
+
sub "ᆨᄄ", "ktt" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGTIEUT
|
272
|
+
sub "ᆨᄈ", "kpp" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGPIEUP
|
273
|
+
sub "ᆨᄊ", "kss" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGSIOS
|
274
|
+
sub "ᆨᄍ", "kjj" # HANGUL JONGSEONG KIYEOK + CHOSEONG SSANGCIEUC
|
275
|
+
sub "ᆫᄀ", "n-g" # HANGUL JONGSEONG NIEUN + CHOSEONG KIYEOK
|
276
|
+
sub "ᆫᄂ", "nn" # HANGUL JONGSEONG NIEUN + CHOSEONG NIEUN
|
277
|
+
sub "ᆫᄃ", "nd" # HANGUL JONGSEONG NIEUN + CHOSEONG TIEUT
|
278
|
+
sub "ᆫᄅ", "ll" # HANGUL JONGSEONG NIEUN + CHOSEONG RIEUL
|
279
|
+
sub "ᆫᄆ", "nm" # HANGUL JONGSEONG NIEUN + CHOSEONG MIEUM
|
280
|
+
sub "ᆫᄇ", "nb" # HANGUL JONGSEONG NIEUN + CHOSEONG PIEUP
|
281
|
+
sub "ᆫᄉ", "ns" # HANGUL JONGSEONG NIEUN + CHOSEONG SIOS
|
282
|
+
sub "ᆫᄋ", "n" # HANGUL JONGSEONG NIEUN + CHOSEONG IEUNG
|
283
|
+
sub "ᆫᄌ", "nj" # HANGUL JONGSEONG NIEUN + CHOSEONG CIEUC
|
284
|
+
sub "ᆫᄎ", "nch" # HANGUL JONGSEONG NIEUN + CHOSEONG CHIEUCH
|
285
|
+
sub "ᆫᄏ", "nkh" # HANGUL JONGSEONG NIEUN + CHOSEONG KHIEUKH
|
286
|
+
sub "ᆫᄐ", "nth" # HANGUL JONGSEONG NIEUN + CHOSEONG THIEUTH
|
287
|
+
sub "ᆫᄑ", "nph" # HANGUL JONGSEONG NIEUN + CHOSEONG PHIEUPH
|
288
|
+
sub "ᆫᄒ", "nh" # HANGUL JONGSEONG NIEUN + CHOSEONG HIEUH
|
289
|
+
sub "ᆫᄁ", "nkk" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGKIYEOK
|
290
|
+
sub "ᆫᄄ", "ntt" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGTIEUT
|
291
|
+
sub "ᆫᄈ", "npp" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGPIEUP
|
292
|
+
sub "ᆫᄊ", "nss" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGSIOS
|
293
|
+
sub "ᆫᄍ", "njj" # HANGUL JONGSEONG NIEUN + CHOSEONG SSANGCIEUC
|
294
|
+
sub "ᆯᄀ", "lk" # HANGUL JONGSEONG RIEUL + CHOSEONG KIYEOK
|
295
|
+
sub "ᆯᄂ", "ll" # HANGUL JONGSEONG RIEUL + CHOSEONG NIEUN
|
296
|
+
sub "ᆯᄃ", "lt" # HANGUL JONGSEONG RIEUL + CHOSEONG TIEUT
|
297
|
+
sub "ᆯᄅ", "ll" # HANGUL JONGSEONG RIEUL + CHOSEONG RIEUL
|
298
|
+
sub "ᆯᄆ", "lm" # HANGUL JONGSEONG RIEUL + CHOSEONG MIEUM
|
299
|
+
sub "ᆯᄇ", "lb" # HANGUL JONGSEONG RIEUL + CHOSEONG PIEUP
|
300
|
+
sub "ᆯᄉ", "ls" # HANGUL JONGSEONG RIEUL + CHOSEONG SIOS
|
301
|
+
sub "ᆯᄋ", "r" # HANGUL JONGSEONG RIEUL + CHOSEONG IEUNG
|
302
|
+
sub "ᆯᄌ", "lj" # HANGUL JONGSEONG RIEUL + CHOSEONG CIEUC
|
303
|
+
sub "ᆯᄎ", "lch" # HANGUL JONGSEONG RIEUL + CHOSEONG CHIEUCH
|
304
|
+
sub "ᆯᄏ", "lkh" # HANGUL JONGSEONG RIEUL + CHOSEONG KHIEUKH
|
305
|
+
sub "ᆯᄐ", "lth" # HANGUL JONGSEONG RIEUL + CHOSEONG THIEUTH
|
306
|
+
sub "ᆯᄑ", "lph" # HANGUL JONGSEONG RIEUL + CHOSEONG PHIEUPH
|
307
|
+
sub "ᆯᄒ", "lh" # HANGUL JONGSEONG RIEUL + CHOSEONG HIEUH
|
308
|
+
sub "ᆯᄁ", "lkk" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGKIYEOK
|
309
|
+
sub "ᆯᄄ", "ltt" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGTIEUT
|
310
|
+
sub "ᆯᄈ", "lpp" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGPIEUP
|
311
|
+
sub "ᆯᄊ", "lss" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGSIOS
|
312
|
+
sub "ᆯᄍ", "ljj" # HANGUL JONGSEONG RIEUL + CHOSEONG SSANGCIEUC
|
313
|
+
sub "ᆷᄀ", "mg" # HANGUL JONGSEONG MIEUM + CHOSEONG KIYEOK
|
314
|
+
sub "ᆷᄂ", "mn" # HANGUL JONGSEONG MIEUM + CHOSEONG NIEUN
|
315
|
+
sub "ᆷᄃ", "md" # HANGUL JONGSEONG MIEUM + CHOSEONG TIEUT
|
316
|
+
sub "ᆷᄅ", "mr" # HANGUL JONGSEONG MIEUM + CHOSEONG RIEUL # Note 3.1
|
317
|
+
sub "ᆷᄆ", "mm" # HANGUL JONGSEONG MIEUM + CHOSEONG MIEUM
|
318
|
+
sub "ᆷᄇ", "mb" # HANGUL JONGSEONG MIEUM + CHOSEONG PIEUP
|
319
|
+
sub "ᆷᄉ", "ms" # HANGUL JONGSEONG MIEUM + CHOSEONG SIOS
|
320
|
+
sub "ᆷᄋ", "m" # HANGUL JONGSEONG MIEUM + CHOSEONG IEUNG
|
321
|
+
sub "ᆷᄌ", "mj" # HANGUL JONGSEONG MIEUM + CHOSEONG CIEUC
|
322
|
+
sub "ᆷᄎ", "mch" # HANGUL JONGSEONG MIEUM + CHOSEONG CHIEUCH
|
323
|
+
sub "ᆷᄏ", "mkh" # HANGUL JONGSEONG MIEUM + CHOSEONG KHIEUKH
|
324
|
+
sub "ᆷᄐ", "mth" # HANGUL JONGSEONG MIEUM + CHOSEONG THIEUTH
|
325
|
+
sub "ᆷᄑ", "mph" # HANGUL JONGSEONG MIEUM + CHOSEONG PHIEUPH
|
326
|
+
sub "ᆷᄒ", "mh" # HANGUL JONGSEONG MIEUM + CHOSEONG HIEUH
|
327
|
+
sub "ᆷᄁ", "mkk" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGKIYEOK
|
328
|
+
sub "ᆷᄄ", "mtt" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGTIEUT
|
329
|
+
sub "ᆷᄈ", "mpp" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGPIEUP
|
330
|
+
sub "ᆷᄊ", "mss" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGSIOS
|
331
|
+
sub "ᆷᄍ", "mjj" # HANGUL JONGSEONG MIEUM + CHOSEONG SSANGCIEUC
|
332
|
+
sub "ᆸᄀ", "pk" # HANGUL JONGSEONG PIEUP + CHOSEONG KIYEOK
|
333
|
+
sub "ᆸᄂ", "mn" # HANGUL JONGSEONG PIEUP + CHOSEONG NIEUN
|
334
|
+
sub "ᆸᄃ", "pt" # HANGUL JONGSEONG PIEUP + CHOSEONG TIEUT
|
335
|
+
sub "ᆸᄅ", "mr" # HANGUL JONGSEONG PIEUP + CHOSEONG RIEUL
|
336
|
+
sub "ᆸᄆ", "mm" # HANGUL JONGSEONG PIEUP + CHOSEONG MIEUM
|
337
|
+
sub "ᆸᄇ", "pp" # HANGUL JONGSEONG PIEUP + CHOSEONG PIEUP
|
338
|
+
sub "ᆸᄉ", "ps" # HANGUL JONGSEONG PIEUP + CHOSEONG SIOS
|
339
|
+
sub "ᆸᄋ", "b" # HANGUL JONGSEONG PIEUP + CHOSEONG IEUNG
|
340
|
+
sub "ᆸᄌ", "pj" # HANGUL JONGSEONG PIEUP + CHOSEONG CIEUC
|
341
|
+
sub "ᆸᄎ", "pch" # HANGUL JONGSEONG PIEUP + CHOSEONG CHIEUCH
|
342
|
+
sub "ᆸᄏ", "pkh" # HANGUL JONGSEONG PIEUP + CHOSEONG KHIEUKH
|
343
|
+
sub "ᆸᄐ", "pth" # HANGUL JONGSEONG PIEUP + CHOSEONG THIEUTH
|
344
|
+
sub "ᆸᄑ", "pph" # HANGUL JONGSEONG PIEUP + CHOSEONG PHIEUPH
|
345
|
+
sub "ᆸᄒ", "ph" # HANGUL JONGSEONG PIEUP + CHOSEONG HIEUH
|
346
|
+
sub "ᆸᄁ", "pkk" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGKIYEOK
|
347
|
+
sub "ᆸᄄ", "ptt" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGTIEUT
|
348
|
+
sub "ᆸᄈ", "ppp" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGPIEUP
|
349
|
+
sub "ᆸᄊ", "pss" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGSIOS
|
350
|
+
sub "ᆸᄍ", "pjj" # HANGUL JONGSEONG PIEUP + CHOSEONG SSANGCIEUC
|
351
|
+
sub "ᆺᄀ", "tk" # HANGUL JONGSEONG SIOS + CHOSEONG KIYEOK
|
352
|
+
sub "ᆺᄂ", "nn" # HANGUL JONGSEONG SIOS + CHOSEONG NIEUN
|
353
|
+
sub "ᆺᄃ", "tt" # HANGUL JONGSEONG SIOS + CHOSEONG TIEUT
|
354
|
+
sub "ᆺᄅ", "nr" # HANGUL JONGSEONG SIOS + CHOSEONG RIEUL # Note 3.1
|
355
|
+
sub "ᆺᄆ", "nm" # HANGUL JONGSEONG SIOS + CHOSEONG MIEUM
|
356
|
+
sub "ᆺᄇ", "tp" # HANGUL JONGSEONG SIOS + CHOSEONG PIEUP
|
357
|
+
sub "ᆺᄉ", "ts" # HANGUL JONGSEONG SIOS + CHOSEONG SIOS
|
358
|
+
sub "ᆺᄋ", "d" # HANGUL JONGSEONG SIOS + CHOSEONG IEUNG
|
359
|
+
sub "ᆺᄌ", "tj" # HANGUL JONGSEONG SIOS + CHOSEONG CIEUC
|
360
|
+
sub "ᆺᄎ", "tch" # HANGUL JONGSEONG SIOS + CHOSEONG CHIEUCH
|
361
|
+
sub "ᆺᄏ", "tkh" # HANGUL JONGSEONG SIOS + CHOSEONG KHIEUKH
|
362
|
+
sub "ᆺᄐ", "tth" # HANGUL JONGSEONG SIOS + CHOSEONG THIEUTH
|
363
|
+
sub "ᆺᄑ", "tph" # HANGUL JONGSEONG SIOS + CHOSEONG PHIEUPH
|
364
|
+
sub "ᆺᄒ", "th" # HANGUL JONGSEONG SIOS + CHOSEONG HIEUH
|
365
|
+
sub "ᆺᄁ", "tkk" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGKIYEOK
|
366
|
+
sub "ᆺᄄ", "ttt" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGTIEUT
|
367
|
+
sub "ᆺᄈ", "tpp" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGPIEUP
|
368
|
+
sub "ᆺᄊ", "tss" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGSIOS
|
369
|
+
sub "ᆺᄍ", "tjj" # HANGUL JONGSEONG SIOS + CHOSEONG SSANGCIEUC
|
370
|
+
sub "ᆼᄀ", "ngg" # HANGUL JONGSEONG IEUNG + CHOSEONG KIYEOK
|
371
|
+
sub "ᆼᄂ", "ngn" # HANGUL JONGSEONG IEUNG + CHOSEONG NIEUN
|
372
|
+
sub "ᆼᄃ", "ngd" # HANGUL JONGSEONG IEUNG + CHOSEONG TIEUT
|
373
|
+
sub "ᆼᄅ", "ngn" # HANGUL JONGSEONG IEUNG + CHOSEONG RIEUL
|
374
|
+
sub "ᆼᄆ", "ngm" # HANGUL JONGSEONG IEUNG + CHOSEONG MIEUM
|
375
|
+
sub "ᆼᄇ", "ngb" # HANGUL JONGSEONG IEUNG + CHOSEONG PIEUP
|
376
|
+
sub "ᆼᄉ", "ngs" # HANGUL JONGSEONG IEUNG + CHOSEONG SIOS
|
377
|
+
sub "ᆼᄋ", "ng" # HANGUL JONGSEONG IEUNG + CHOSEONG IEUNG
|
378
|
+
sub "ᆼᄌ", "ngj" # HANGUL JONGSEONG IEUNG + CHOSEONG CIEUC
|
379
|
+
sub "ᆼᄎ", "ngch" # HANGUL JONGSEONG IEUNG + CHOSEONG CHIEUCH
|
380
|
+
sub "ᆼᄏ", "ngkh" # HANGUL JONGSEONG IEUNG + CHOSEONG KHIEUKH
|
381
|
+
sub "ᆼᄐ", "ngth" # HANGUL JONGSEONG IEUNG + CHOSEONG THIEUTH
|
382
|
+
sub "ᆼᄑ", "ngph" # HANGUL JONGSEONG IEUNG + CHOSEONG PHIEUPH
|
383
|
+
sub "ᆼᄒ", "ngh" # HANGUL JONGSEONG IEUNG + CHOSEONG HIEUH
|
384
|
+
sub "ᆼᄁ", "ngkk" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGKIYEOK
|
385
|
+
sub "ᆼᄄ", "ngtt" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGTIEUT
|
386
|
+
sub "ᆼᄈ", "ngpp" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGPIEUP
|
387
|
+
sub "ᆼᄊ", "ngss" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGSIOS
|
388
|
+
sub "ᆼᄍ", "ngjj" # HANGUL JONGSEONG IEUNG + CHOSEONG SSANGCIEUC
|
389
|
+
sub "ᄀ", "g", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG KIYEOK # c.f. Note 3.3
|
390
|
+
sub "ᄂ", "n", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG NIEUN # c.f. Note 3.3
|
391
|
+
sub "ᄃ", "d", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG TIEUT # c.f. Note 3.3
|
392
|
+
sub "ᄅ", "r", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG RIEUL
|
393
|
+
sub "ᄆ", "m", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG MIEUM # c.f. Note 3.3
|
394
|
+
sub "ᄇ", "b", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG PIEUP # c.f. Note 3.3
|
395
|
+
sub "ᄉ", "s", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG SIOS
|
396
|
+
sub "ᄋ", "", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG IEUNG
|
397
|
+
sub "ᄌ", "j", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG CIEUC
|
398
|
+
sub "ᄎ", "ch", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG CHIEUCH
|
399
|
+
sub "ᄏ", "kh", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG KHIEUKH
|
400
|
+
sub "ᄐ", "th", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG THIEUTH
|
401
|
+
sub "ᄑ", "ph", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG PHIEUPH
|
402
|
+
sub "ᄒ", "h", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG HIEUH
|
403
|
+
sub "ᄁ", "kk", before: any([any("-"), any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG SSANGKIYEOK
|
404
|
+
sub "ᄄ", "tt", before: any([any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG SSANGTIEUT
|
405
|
+
sub "ᄈ", "pp", before: any([any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG SSANGPIEUP
|
406
|
+
sub "ᄊ", "ss", before: any([any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG SSANGSIOS
|
407
|
+
sub "ᄍ", "jj", before: any([any("A".."Z"), any("a".."z"), any("0".."9"), any("ᅡᅢᅣᅤᅥᅦᅧᅨᅩᅪᅫᅬᅭᅮᅯᅰᅱᅲᅳᅴᅵ") ]) # VOWEL + CHOSEONG SSANGCIEUC
|
408
|
+
sub "ᆰᄀ", "lg" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG KIYEOK
|
409
|
+
sub "ᆰᄂ", "ngn" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG NIEUN
|
410
|
+
sub "ᆰᄃ", "kt" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG TIEUT
|
411
|
+
sub "ᆰᄅ", "ngn" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG RIEUL
|
412
|
+
sub "ᆰᄆ", "ngm" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG MIEUM
|
413
|
+
sub "ᆰᄇ", "kp" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG PIEUP
|
414
|
+
sub "ᆰᄉ", "ks" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SIOS
|
415
|
+
sub "ᆰᄋ", "lg" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG IEUNG
|
416
|
+
sub "ᆰᄌ", "kj" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG CIEUC
|
417
|
+
sub "ᆰᄎ", "kch" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG CHIEUCH
|
418
|
+
sub "ᆰᄏ", "lkh" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG KHIEUKH
|
419
|
+
sub "ᆰᄐ", "kth" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG THIEUTH
|
420
|
+
sub "ᆰᄑ", "kph" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG PHIEUPH
|
421
|
+
sub "ᆰᄒ", "lkh" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG HIEUH
|
422
|
+
sub "ᆰᄁ", "lkk" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGKIYEOK
|
423
|
+
sub "ᆰᄄ", "ktt" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGTIEUT
|
424
|
+
sub "ᆰᄈ", "kpp" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGPIEUP
|
425
|
+
sub "ᆰᄊ", "kss" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGSIOS
|
426
|
+
sub "ᆰᄍ", "kjj" # HANGUL JONGSEONG RIEUL-KIYEOK + CHOSEONG SSANGCIEUC
|
427
|
+
sub "ᆱᄀ", "mg" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG KIYEOK
|
428
|
+
sub "ᆱᄂ", "mn" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG NIEUN
|
429
|
+
sub "ᆱᄃ", "md" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG TIEUT
|
430
|
+
sub "ᆱᄅ", "mr" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG RIEUL
|
431
|
+
sub "ᆱᄆ", "lm" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG MIEUM
|
432
|
+
sub "ᆱᄇ", "mb" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG PIEUP
|
433
|
+
sub "ᆱᄉ", "ms" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SIOS
|
434
|
+
sub "ᆱᄋ", "lm" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG IEUNG
|
435
|
+
sub "ᆱᄌ", "mj" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG CIEUC
|
436
|
+
sub "ᆱᄎ", "mch" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG CHIEUCH
|
437
|
+
sub "ᆱᄏ", "mkh" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG KHIEUKH
|
438
|
+
sub "ᆱᄐ", "mth" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG THIEUTH
|
439
|
+
sub "ᆱᄑ", "mph" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG PHIEUPH
|
440
|
+
sub "ᆱᄒ", "mh" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG HIEUH
|
441
|
+
sub "ᆱᄁ", "mkk" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGKIYEOK
|
442
|
+
sub "ᆱᄄ", "mtt" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGTIEUT
|
443
|
+
sub "ᆱᄈ", "mpp" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGPIEUP
|
444
|
+
sub "ᆱᄊ", "mss" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGSIOS
|
445
|
+
sub "ᆱᄍ", "mjj" # HANGUL JONGSEONG RIEUL-MIEUM + CHOSEONG SSANGCIEUC
|
446
|
+
sub "ᆲᄀ", "pk" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG KIYEOK
|
447
|
+
sub "ᆲᄂ", "mn" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG NIEUN
|
448
|
+
sub "ᆲᄃ", "pt" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG TIEUT
|
449
|
+
sub "ᆲᄅ", "mr" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG RIEUL
|
450
|
+
sub "ᆲᄆ", "mm" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG MIEUM
|
451
|
+
sub "ᆲᄇ", "lb" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG PIEUP
|
452
|
+
sub "ᆲᄉ", "ps" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SIOS
|
453
|
+
sub "ᆲᄋ", "lb" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG IEUNG
|
454
|
+
sub "ᆲᄌ", "pj" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG CIEUC
|
455
|
+
sub "ᆲᄎ", "pch" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG CHIEUCH
|
456
|
+
sub "ᆲᄏ", "pkh" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG KHIEUKH
|
457
|
+
sub "ᆲᄐ", "pth" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG THIEUTH
|
458
|
+
sub "ᆲᄑ", "lph" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG PHIEUPH
|
459
|
+
sub "ᆲᄒ", "lph" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG HIEUH
|
460
|
+
sub "ᆲᄁ", "pkk" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGKIYEOK
|
461
|
+
sub "ᆲᄄ", "ptt" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGTIEUT
|
462
|
+
sub "ᆲᄈ", "lpp" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGPIEUP
|
463
|
+
sub "ᆲᄊ", "pss" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGSIOS
|
464
|
+
sub "ᆲᄍ", "pjj" # HANGUL JONGSEONG RIEUL-PIEUP + CHOSEONG SSANGCIEUC
|
465
|
+
sub "ᄀ", "k", before: " " # HANGUL CHOSEONG KIYEOK
|
466
|
+
sub "ᄂ", "n", before: " " # HANGUL CHOSEONG NIEUN
|
467
|
+
sub "ᄃ", "t", before: " " # HANGUL CHOSEONG TIEUT
|
468
|
+
|
469
|
+
# DPRK does not follow the R-onset rule
|
470
|
+
# - pattern: "(?<= )ᄅ(?=[ᅣᅤᅧᅨᅭᅲ])"
|
471
|
+
# result: "" # HANGUL CHOSEONG RIEUL # R-onset rule
|
472
|
+
sub "ᄅ", "r", before: " " # HANGUL CHOSEONG RIEUL after a space: "r" is emitted; the alternative result "n" is not used (see the R-onset note above)
|
473
|
+
|
474
|
+
sub "ᄆ", "m", before: " " # HANGUL CHOSEONG MIEUM
|
475
|
+
sub "ᄇ", "p", before: " " # HANGUL CHOSEONG PIEUP
|
476
|
+
sub "ᄉ", "s", before: " " # HANGUL CHOSEONG SIOS
|
477
|
+
sub "ᄋ", "", before: " " # HANGUL CHOSEONG IEUNG
|
478
|
+
sub "ᄌ", "j", before: " " # HANGUL CHOSEONG CIEUC
|
479
|
+
sub "ᄎ", "ch", before: " " # HANGUL CHOSEONG CHIEUCH
|
480
|
+
sub "ᄏ", "kh", before: " " # HANGUL CHOSEONG KHIEUKH
|
481
|
+
sub "ᄐ", "th", before: " " # HANGUL CHOSEONG THIEUTH
|
482
|
+
sub "ᄑ", "ph", before: " " # HANGUL CHOSEONG PHIEUPH
|
483
|
+
sub "ᄒ", "h", before: " " # HANGUL CHOSEONG HIEUH
|
484
|
+
sub "ᄁ", "kk", before: " " # HANGUL CHOSEONG SSANGKIYEOK
|
485
|
+
sub "ᄭ", "kk", before: " " # HANGUL CHOSEONG SIOS-KIYEOK
|
486
|
+
sub "ᄄ", "tt", before: " " # HANGUL CHOSEONG SSANGTIEUT
|
487
|
+
sub "ᄯ", "tt", before: " " # HANGUL CHOSEONG SIOS-TIEUT
|
488
|
+
sub "ᄈ", "pp", before: " " # HANGUL CHOSEONG SSANGPIEUP
|
489
|
+
sub "ᄲ", "pp", before: " " # HANGUL CHOSEONG SIOS-PIEUP
|
490
|
+
sub "ᄊ", "ss", before: " " # HANGUL CHOSEONG SSANGSIOS
|
491
|
+
sub "ᄍ", "jj", before: " " # HANGUL CHOSEONG SSANGCIEUC
|
492
|
+
sub "ᄶ", "jj", before: " " # HANGUL CHOSEONG SIOS-CIEUC
|
493
|
+
sub "ᅡ", "a" # HANGUL JUNGSEONG A
|
494
|
+
sub "ᅣ", "ya" # HANGUL JUNGSEONG YA
|
495
|
+
sub "ᅥ", "ŏ" # HANGUL JUNGSEONG EO
|
496
|
+
sub "ᅧ", "yŏ" # HANGUL JUNGSEONG YEO
|
497
|
+
sub "ᅩ", "o" # HANGUL JUNGSEONG O
|
498
|
+
sub "ᅭ", "yo" # HANGUL JUNGSEONG YO
|
499
|
+
sub "ᅮ", "u" # HANGUL JUNGSEONG U
|
500
|
+
sub "ᅲ", "yu" # HANGUL JUNGSEONG YU
|
501
|
+
sub "ᅳ", "ü" # HANGUL JUNGSEONG EU
|
502
|
+
sub "ᅵ", "i" # HANGUL JUNGSEONG I
|
503
|
+
sub "ᅢ", "ae" # HANGUL JUNGSEONG AE
|
504
|
+
sub "ᅤ", "yae" # HANGUL JUNGSEONG YAE
|
505
|
+
sub "ᅦ", "e" # HANGUL JUNGSEONG E
|
506
|
+
sub "ᅨ", "ye" # HANGUL JUNGSEONG YE
|
507
|
+
sub "ᅬ", "oe" # HANGUL JUNGSEONG OE
|
508
|
+
sub "ᅱ", "wi" # HANGUL JUNGSEONG WI
|
509
|
+
sub "ᅴ", "üi" # HANGUL JUNGSEONG YI
|
510
|
+
sub "ᅪ", "wa" # HANGUL JUNGSEONG WA
|
511
|
+
sub "ᅯ", "wo" # HANGUL JUNGSEONG WEO
|
512
|
+
sub "ᅫ", "wae" # HANGUL JUNGSEONG WAE
|
513
|
+
sub "ᅰ", "we" # HANGUL JUNGSEONG WE
|
514
|
+
sub "ᆨ", "k", not_after: unicode_hangul # HANGUL JONGSEONG KIYEOK
|
515
|
+
sub "ᆫ", "n", not_after: unicode_hangul # HANGUL JONGSEONG NIEUN
|
516
|
+
sub "ᆮ", "t", not_after: unicode_hangul # HANGUL JONGSEONG TIEUT
|
517
|
+
sub "ᆯ", "l", not_after: unicode_hangul # HANGUL JONGSEONG RIEUL
|
518
|
+
sub "ᆷ", "m", not_after: unicode_hangul # HANGUL JONGSEONG MIEUM
|
519
|
+
sub "ᆸ", "p", not_after: unicode_hangul # HANGUL JONGSEONG PIEUP
|
520
|
+
sub "ᆺ", "t", not_after: unicode_hangul # HANGUL JONGSEONG SIOS
|
521
|
+
sub "ᆼ", "ng", not_after: unicode_hangul # HANGUL JONGSEONG IEUNG
|
522
|
+
sub "ᆽ", "t", not_after: unicode_hangul # HANGUL JONGSEONG CIEUC
|
523
|
+
sub "ᆾ", "t", not_after: unicode_hangul # HANGUL JONGSEONG CHIEUCH
|
524
|
+
sub "ᆿ", "k", not_after: unicode_hangul # HANGUL JONGSEONG KHIEUKH
|
525
|
+
sub "ᇀ", "t", not_after: unicode_hangul # HANGUL JONGSEONG THIEUTH
|
526
|
+
sub "ᇁ", "p", not_after: unicode_hangul # HANGUL JONGSEONG PHIEUPH
|
527
|
+
sub "ᆰ", "k", not_after: unicode_hangul # HANGUL JONGSEONG RIEUL-KIYEOK
|
528
|
+
sub "ᆲ", "p", not_after: unicode_hangul # HANGUL JONGSEONG RIEUL-PIEUP
|
529
|
+
}
|
530
|
+
# Remove the added space from the start and the end of each line
|
531
|
+
sub line_start + " ", ""
|
532
|
+
sub " " + line_end, ""
|
533
|
+
|
534
|
+
|
535
|
+
# This is based on Jamo
|
536
|
+
|
537
|
+
|
538
|
+
title_case
|
539
|
+
}
|
540
|
+
|